In [None]:
from pathlib import Path
from docling.document_converter import DocumentConverter

def process_files(crawl_dir, processed_dir):
    """Convert every file directly under ``crawl_dir`` to Markdown.

    Each regular file found at the top level of ``crawl_dir`` is passed to a
    docling ``DocumentConverter`` and the exported Markdown is written to
    ``processed_dir/<stem>.md``. Inputs whose output file already exists are
    skipped, so the function can be re-run to resume an interrupted batch.

    Args:
        crawl_dir: Directory (str or path-like) holding the source documents.
        processed_dir: Directory (str or path-like) that receives the ``.md``
            files; it is created, including parents, if missing.

    Returns:
        None. Progress, per-file failures and a final summary are printed.

    Conversion or write failures are caught per file, counted and printed;
    they never abort the remaining files.
    """
    input_path = Path(crawl_dir)
    processed_path = Path(processed_dir)
    processed_path.mkdir(parents=True, exist_ok=True)

    # glob('*') also yields sub-directories; keep regular files only so the
    # reported count is accurate and directories never reach the converter.
    # Sorting makes the processing order independent of the OS listing order.
    input_files = sorted(p for p in input_path.glob('*') if p.is_file())
    print(f"Found {len(input_files)} files to process in {input_path}")

    # NOTE(review): docling documents format_options as a mapping keyed by
    # InputFormat; a "preserve_links" string key looks like it is ignored —
    # confirm against the installed docling version.
    converter = DocumentConverter(format_options={"preserve_links": True})

    files_processed = 0
    errors = 0

    for input_file in input_files:
        md_file_name = processed_path / f"{input_file.stem}.md"

        if md_file_name.exists():
            print(f"Skipping '{input_file.name}' — already processed.")
            continue

        # Write to a sibling temp file and rename it into place afterwards.
        # Because an existing .md means "done" on later runs, a half-written
        # output must never appear under the final name.
        tmp_file_name = md_file_name.with_name(md_file_name.name + ".tmp")

        try:
            result = converter.convert(input_file)
            markdown_content = result.document.export_to_markdown()

            with open(tmp_file_name, "w", encoding="utf-8") as md_file:
                md_file.write(markdown_content)
            tmp_file_name.replace(md_file_name)

            print(f"Converted '{input_file}' --> '{md_file_name}'")
            files_processed += 1

        except Exception as e:
            errors += 1
            # Drop any partial temp file left behind by a failed write.
            if tmp_file_name.exists():
                tmp_file_name.unlink()
            print(f"Error processing {input_file}: {e}")

    print(f"Processed {files_processed} new files. Errors: {errors}")

In [None]:
# process the edgar documents
import os

crawl_dir = 'data/edgar_documents'
processed_dir = 'data/processed_data'

# os.listdir returns entries in arbitrary order; sort so every run walks the
# folders in the same sequence and the printed list is stable.
entries = sorted(os.listdir(crawl_dir))

# Keep only the immediate sub-directories of crawl_dir; each one is converted
# as its own batch below (the recorded run shows ticker-named folders).
ticker_folders = [
    entry for entry in entries
    if os.path.isdir(os.path.join(crawl_dir, entry))
]
print(ticker_folders)

for folder in ticker_folders:
    # Mirror the input folder name under processed_dir so outputs stay
    # grouped the same way as the inputs.
    full_path = os.path.join(crawl_dir, folder)
    output_dir = os.path.join(processed_dir, folder)
    process_files(crawl_dir=full_path, processed_dir=output_dir)

2025-11-14 15:25:15,781 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:25:15,782 - ERROR - Input document 4_2023-05-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:25:15,786 - INFO - Going to convert document batch...
2025-11-14 15:25:15,794 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:25:15,795 - ERROR - Input document 4_2023-05-09 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

['AAPL', 'ABBV', 'ABT', 'ACN', 'ADBE', 'AIG', 'AMD', 'AMGN', 'AMT', 'AMZN', 'AVGO', 'AXP', 'BA', 'BK', 'BKNG', 'BLK', 'BMY', 'BRK-B', 'CAT', 'CHTR', 'CL', 'CMCSA', 'COF', 'COP', 'COST', 'CRM', 'CSCO', 'CVS', 'CVX', 'DE', 'DHR', 'DIS', 'DUK', 'EMR', 'FDX', 'GD', 'GE', 'GILD', 'GM', 'GOOGL', 'HD', 'HON', 'IBM', 'INTC', 'INTU', 'ISRG', 'JNJ', 'KO', 'LIN', 'LLY', 'LMT', 'LOW', 'MA', 'MCD', 'MDLZ', 'MDT', 'MET', 'META', 'MMM', 'MO', 'MRK', 'MSFT', 'NEE', 'NFLX', 'NKE', 'NOW', 'NVDA', 'ORCL', 'PEP', 'PFE', 'PG', 'PLTR', 'PM', 'PYPL', 'QCOM', 'RTX', 'SBUX', 'SCHW', 'SO', 'SPG', 'T', 'TGT', 'TMO', 'TMUS', 'TSLA', 'TXN', 'UNH', 'UNP', 'UPS', 'USB', 'V', 'VZ', 'WFC', 'WMT', 'XOM']
Found 91 files to process in data\edgar_documents\AAPL
Skipping '10-K_2023-11-03' — already processed.
Skipping '10-K_2024-11-01' — already processed.
Skipping '10-K_2025-10-31' — already processed.
Skipping '10-Q_2023-02-03' — already processed.
Skipping '10-Q_2023-05-05' — already processed.
Skipping '10-Q_2023-08-04

2025-11-14 15:25:15,991 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:17,062 - INFO - Going to convert document batch...
2025-11-14 15:25:17,062 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:25:17,063 - INFO - Processing document 10-K_2023-02-17
2025-11-14 15:25:19,639 - INFO - Finished converting document 10-K_2023-02-17 in 3.77 sec.
2025-11-14 15:25:20,421 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABBV\10-K_2023-02-17' --> 'data\processed_data\ABBV\10-K_2023-02-17.md'


2025-11-14 15:25:21,470 - INFO - Going to convert document batch...
2025-11-14 15:25:21,473 - INFO - Processing document 10-K_2024-02-20
2025-11-14 15:25:23,983 - INFO - Finished converting document 10-K_2024-02-20 in 3.64 sec.
2025-11-14 15:25:24,790 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABBV\10-K_2024-02-20' --> 'data\processed_data\ABBV\10-K_2024-02-20.md'


2025-11-14 15:25:26,098 - INFO - Going to convert document batch...
2025-11-14 15:25:26,099 - INFO - Processing document 10-K_2025-02-14
2025-11-14 15:25:29,061 - INFO - Finished converting document 10-K_2025-02-14 in 4.34 sec.
2025-11-14 15:25:29,830 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABBV\10-K_2025-02-14' --> 'data\processed_data\ABBV\10-K_2025-02-14.md'


2025-11-14 15:25:30,634 - INFO - Going to convert document batch...
2025-11-14 15:25:30,636 - INFO - Processing document 10-Q_2023-05-05
2025-11-14 15:25:31,436 - INFO - Finished converting document 10-Q_2023-05-05 in 1.64 sec.
2025-11-14 15:25:31,857 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABBV\10-Q_2023-05-05' --> 'data\processed_data\ABBV\10-Q_2023-05-05.md'


2025-11-14 15:25:32,343 - INFO - Going to convert document batch...
2025-11-14 15:25:32,344 - INFO - Processing document 10-Q_2023-08-07
2025-11-14 15:25:33,323 - INFO - Finished converting document 10-Q_2023-08-07 in 1.52 sec.
2025-11-14 15:25:33,745 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABBV\10-Q_2023-08-07' --> 'data\processed_data\ABBV\10-Q_2023-08-07.md'


2025-11-14 15:25:34,706 - INFO - Going to convert document batch...
2025-11-14 15:25:34,707 - INFO - Processing document 10-Q_2023-11-06
2025-11-14 15:25:35,689 - INFO - Finished converting document 10-Q_2023-11-06 in 1.98 sec.
2025-11-14 15:25:36,112 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABBV\10-Q_2023-11-06' --> 'data\processed_data\ABBV\10-Q_2023-11-06.md'


2025-11-14 15:25:36,862 - INFO - Going to convert document batch...
2025-11-14 15:25:36,864 - INFO - Processing document 10-Q_2024-05-03
2025-11-14 15:25:37,746 - INFO - Finished converting document 10-Q_2024-05-03 in 1.67 sec.
2025-11-14 15:25:38,156 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABBV\10-Q_2024-05-03' --> 'data\processed_data\ABBV\10-Q_2024-05-03.md'


2025-11-14 15:25:38,617 - INFO - Going to convert document batch...
2025-11-14 15:25:38,617 - INFO - Processing document 10-Q_2024-08-07
2025-11-14 15:25:40,009 - INFO - Finished converting document 10-Q_2024-08-07 in 1.89 sec.
2025-11-14 15:25:40,463 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABBV\10-Q_2024-08-07' --> 'data\processed_data\ABBV\10-Q_2024-08-07.md'


2025-11-14 15:25:40,951 - INFO - Going to convert document batch...
2025-11-14 15:25:40,951 - INFO - Processing document 10-Q_2024-11-04
2025-11-14 15:25:42,025 - INFO - Finished converting document 10-Q_2024-11-04 in 1.59 sec.
2025-11-14 15:25:42,486 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABBV\10-Q_2024-11-04' --> 'data\processed_data\ABBV\10-Q_2024-11-04.md'


2025-11-14 15:25:43,210 - INFO - Going to convert document batch...
2025-11-14 15:25:43,211 - INFO - Processing document 10-Q_2025-05-09
2025-11-14 15:25:44,026 - INFO - Finished converting document 10-Q_2025-05-09 in 1.58 sec.
2025-11-14 15:25:44,425 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABBV\10-Q_2025-05-09' --> 'data\processed_data\ABBV\10-Q_2025-05-09.md'


2025-11-14 15:25:45,221 - INFO - Going to convert document batch...
2025-11-14 15:25:45,222 - INFO - Processing document 10-Q_2025-08-04
2025-11-14 15:25:46,207 - INFO - Finished converting document 10-Q_2025-08-04 in 1.81 sec.
2025-11-14 15:25:46,715 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABBV\10-Q_2025-08-04' --> 'data\processed_data\ABBV\10-Q_2025-08-04.md'


2025-11-14 15:25:47,215 - INFO - Going to convert document batch...
2025-11-14 15:25:47,216 - INFO - Processing document 10-Q_2025-11-04
2025-11-14 15:25:48,605 - INFO - Finished converting document 10-Q_2025-11-04 in 2.00 sec.
2025-11-14 15:25:49,042 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:49,051 - INFO - Going to convert document batch...
2025-11-14 15:25:49,051 - INFO - Processing document 4_2023-01-03
2025-11-14 15:25:49,070 - INFO - Finished converting document 4_2023-01-03 in 0.03 sec.
2025-11-14 15:25:49,109 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:49,119 - INFO - Going to convert document batch...
2025-11-14 15:25:49,119 - INFO - Processing document 4_2023-02-21
2025-11-14 15:25:49,136 - INFO - Finished converting document 4_2023-02-21 in 0.05 sec.
2025-11-14 15:25:49,183 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:49,194 - INFO - Going to convert document batch...
2025-11-14 15:25:49,

Converted 'data\edgar_documents\ABBV\10-Q_2025-11-04' --> 'data\processed_data\ABBV\10-Q_2025-11-04.md'
Converted 'data\edgar_documents\ABBV\4_2023-01-03' --> 'data\processed_data\ABBV\4_2023-01-03.md'
Converted 'data\edgar_documents\ABBV\4_2023-02-21' --> 'data\processed_data\ABBV\4_2023-02-21.md'


2025-11-14 15:25:49,217 - INFO - Finished converting document 4_2023-02-22 in 0.06 sec.
2025-11-14 15:25:49,253 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:49,261 - INFO - Going to convert document batch...
2025-11-14 15:25:49,262 - INFO - Processing document 4_2023-03-02
2025-11-14 15:25:49,280 - INFO - Finished converting document 4_2023-03-02 in 0.05 sec.
2025-11-14 15:25:49,332 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:49,341 - INFO - Going to convert document batch...
2025-11-14 15:25:49,342 - INFO - Processing document 4_2023-03-07
2025-11-14 15:25:49,362 - INFO - Finished converting document 4_2023-03-07 in 0.06 sec.
2025-11-14 15:25:49,412 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:49,424 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ABBV\4_2023-02-22' --> 'data\processed_data\ABBV\4_2023-02-22.md'
Converted 'data\edgar_documents\ABBV\4_2023-03-02' --> 'data\processed_data\ABBV\4_2023-03-02.md'
Converted 'data\edgar_documents\ABBV\4_2023-03-07' --> 'data\processed_data\ABBV\4_2023-03-07.md'


2025-11-14 15:25:49,425 - INFO - Processing document 4_2023-03-15
2025-11-14 15:25:49,449 - INFO - Finished converting document 4_2023-03-15 in 0.08 sec.
2025-11-14 15:25:49,486 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:49,492 - INFO - Going to convert document batch...
2025-11-14 15:25:49,495 - INFO - Processing document 4_2023-04-04
2025-11-14 15:25:49,519 - INFO - Finished converting document 4_2023-04-04 in 0.05 sec.
2025-11-14 15:25:49,574 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:49,584 - INFO - Going to convert document batch...
2025-11-14 15:25:49,584 - INFO - Processing document 4_2023-04-05
2025-11-14 15:25:49,605 - INFO - Finished converting document 4_2023-04-05 in 0.06 sec.
2025-11-14 15:25:49,646 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:49,656 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ABBV\4_2023-03-15' --> 'data\processed_data\ABBV\4_2023-03-15.md'
Converted 'data\edgar_documents\ABBV\4_2023-04-04' --> 'data\processed_data\ABBV\4_2023-04-04.md'
Converted 'data\edgar_documents\ABBV\4_2023-04-05' --> 'data\processed_data\ABBV\4_2023-04-05.md'


2025-11-14 15:25:49,656 - INFO - Processing document 4_2023-04-19
2025-11-14 15:25:49,677 - INFO - Finished converting document 4_2023-04-19 in 0.05 sec.
2025-11-14 15:25:49,714 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:49,724 - INFO - Going to convert document batch...
2025-11-14 15:25:49,725 - INFO - Processing document 4_2023-04-27
2025-11-14 15:25:49,746 - INFO - Finished converting document 4_2023-04-27 in 0.05 sec.
2025-11-14 15:25:49,799 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:49,810 - INFO - Going to convert document batch...
2025-11-14 15:25:49,812 - INFO - Processing document 4_2023-05-02
2025-11-14 15:25:49,833 - INFO - Finished converting document 4_2023-05-02 in 0.06 sec.
2025-11-14 15:25:49,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:49,879 - INFO - Going to convert document batch...
2025-11-14 15:25:49,880 - INFO - Processing document 4_2023-05-09
2025-11-14 15:25:49,899 - IN

Converted 'data\edgar_documents\ABBV\4_2023-04-19' --> 'data\processed_data\ABBV\4_2023-04-19.md'
Converted 'data\edgar_documents\ABBV\4_2023-04-27' --> 'data\processed_data\ABBV\4_2023-04-27.md'
Converted 'data\edgar_documents\ABBV\4_2023-05-02' --> 'data\processed_data\ABBV\4_2023-05-02.md'


2025-11-14 15:25:49,938 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:49,947 - INFO - Going to convert document batch...
2025-11-14 15:25:49,948 - INFO - Processing document 4_2023-05-12
2025-11-14 15:25:49,966 - INFO - Finished converting document 4_2023-05-12 in 0.05 sec.
2025-11-14 15:25:50,003 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:50,012 - INFO - Going to convert document batch...
2025-11-14 15:25:50,013 - INFO - Processing document 4_2023-07-05
2025-11-14 15:25:50,035 - INFO - Finished converting document 4_2023-07-05 in 0.05 sec.
2025-11-14 15:25:50,091 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:50,105 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ABBV\4_2023-05-09' --> 'data\processed_data\ABBV\4_2023-05-09.md'
Converted 'data\edgar_documents\ABBV\4_2023-05-12' --> 'data\processed_data\ABBV\4_2023-05-12.md'
Converted 'data\edgar_documents\ABBV\4_2023-07-05' --> 'data\processed_data\ABBV\4_2023-07-05.md'


2025-11-14 15:25:50,106 - INFO - Processing document 4_2023-08-02
2025-11-14 15:25:50,155 - INFO - Finished converting document 4_2023-08-02 in 0.09 sec.
2025-11-14 15:25:50,196 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:50,202 - INFO - Going to convert document batch...
2025-11-14 15:25:50,203 - INFO - Processing document 4_2023-09-11
2025-11-14 15:25:50,220 - INFO - Finished converting document 4_2023-09-11 in 0.03 sec.
2025-11-14 15:25:50,265 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:50,279 - INFO - Going to convert document batch...
2025-11-14 15:25:50,280 - INFO - Processing document 4_2023-09-27
2025-11-14 15:25:50,302 - INFO - Finished converting document 4_2023-09-27 in 0.06 sec.
2025-11-14 15:25:50,335 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:50,342 - INFO - Going to convert document batch...
2025-11-14 15:25:50,343 - INFO - Processing document 4_2023-10-03
2025-11-14 15:25:50,363 - IN

Converted 'data\edgar_documents\ABBV\4_2023-08-02' --> 'data\processed_data\ABBV\4_2023-08-02.md'
Converted 'data\edgar_documents\ABBV\4_2023-09-11' --> 'data\processed_data\ABBV\4_2023-09-11.md'
Converted 'data\edgar_documents\ABBV\4_2023-09-27' --> 'data\processed_data\ABBV\4_2023-09-27.md'
Converted 'data\edgar_documents\ABBV\4_2023-10-03' --> 'data\processed_data\ABBV\4_2023-10-03.md'


2025-11-14 15:25:50,418 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:50,428 - INFO - Going to convert document batch...
2025-11-14 15:25:50,429 - INFO - Processing document 4_2023-12-28
2025-11-14 15:25:50,450 - INFO - Finished converting document 4_2023-12-28 in 0.06 sec.
2025-11-14 15:25:50,483 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:50,491 - INFO - Going to convert document batch...
2025-11-14 15:25:50,491 - INFO - Processing document 4_2024-01-03
2025-11-14 15:25:50,513 - INFO - Finished converting document 4_2024-01-03 in 0.05 sec.
2025-11-14 15:25:50,547 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:50,555 - INFO - Going to convert document batch...
2025-11-14 15:25:50,556 - INFO - Processing document 4_2024-02-06
2025-11-14 15:25:50,578 - INFO - Finished converting document 4_2024-02-06 in 0.05 sec.
2025-11-14 15:25:50,624 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\ABBV\4_2023-12-28' --> 'data\processed_data\ABBV\4_2023-12-28.md'
Converted 'data\edgar_documents\ABBV\4_2024-01-03' --> 'data\processed_data\ABBV\4_2024-01-03.md'
Converted 'data\edgar_documents\ABBV\4_2024-02-06' --> 'data\processed_data\ABBV\4_2024-02-06.md'


2025-11-14 15:25:50,719 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:25:50,720 - ERROR - Input document 4_2024-02-21 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:25:50,721 - INFO - Going to convert document batch...
2025-11-14 15:25:50,734 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:50,744 - INFO - Going to convert document batch...
2025-11-14 15:25:50,745 - INFO - Processing document 4_2024-02-23
2025-11-14 15:25:50,768 - INFO - Fin

Converted 'data\edgar_documents\ABBV\4_2024-02-20' --> 'data\processed_data\ABBV\4_2024-02-20.md'
Error processing data\edgar_documents\ABBV\4_2024-02-21: File format not allowed: data\edgar_documents\ABBV\4_2024-02-21
Converted 'data\edgar_documents\ABBV\4_2024-02-23' --> 'data\processed_data\ABBV\4_2024-02-23.md'
Error processing data\edgar_documents\ABBV\4_2024-02-26: File format not allowed: data\edgar_documents\ABBV\4_2024-02-26


2025-11-14 15:25:50,908 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:50,917 - INFO - Going to convert document batch...
2025-11-14 15:25:50,918 - INFO - Processing document 4_2024-02-29
2025-11-14 15:25:50,937 - INFO - Finished converting document 4_2024-02-29 in 0.05 sec.
2025-11-14 15:25:50,986 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:51,002 - INFO - Going to convert document batch...
2025-11-14 15:25:51,003 - INFO - Processing document 4_2024-03-01
2025-11-14 15:25:51,026 - INFO - Finished converting document 4_2024-03-01 in 0.08 sec.
2025-11-14 15:25:51,063 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:51,074 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ABBV\4_2024-02-27' --> 'data\processed_data\ABBV\4_2024-02-27.md'
Converted 'data\edgar_documents\ABBV\4_2024-02-29' --> 'data\processed_data\ABBV\4_2024-02-29.md'
Converted 'data\edgar_documents\ABBV\4_2024-03-01' --> 'data\processed_data\ABBV\4_2024-03-01.md'


2025-11-14 15:25:51,075 - INFO - Processing document 4_2024-03-05
2025-11-14 15:25:51,102 - INFO - Finished converting document 4_2024-03-05 in 0.05 sec.
2025-11-14 15:25:51,138 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:51,149 - INFO - Going to convert document batch...
2025-11-14 15:25:51,149 - INFO - Processing document 4_2024-03-20
2025-11-14 15:25:51,175 - INFO - Finished converting document 4_2024-03-20 in 0.05 sec.
2025-11-14 15:25:51,214 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:51,221 - INFO - Going to convert document batch...
2025-11-14 15:25:51,221 - INFO - Processing document 4_2024-03-22
2025-11-14 15:25:51,237 - INFO - Finished converting document 4_2024-03-22 in 0.03 sec.
2025-11-14 15:25:51,289 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:51,299 - INFO - Going to convert document batch...
2025-11-14 15:25:51,300 - INFO - Processing document 4_2024-04-02
2025-11-14 15:25:51,317 - IN

Converted 'data\edgar_documents\ABBV\4_2024-03-05' --> 'data\processed_data\ABBV\4_2024-03-05.md'
Converted 'data\edgar_documents\ABBV\4_2024-03-20' --> 'data\processed_data\ABBV\4_2024-03-20.md'
Converted 'data\edgar_documents\ABBV\4_2024-03-22' --> 'data\processed_data\ABBV\4_2024-03-22.md'


2025-11-14 15:25:51,351 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:51,358 - INFO - Going to convert document batch...
2025-11-14 15:25:51,359 - INFO - Processing document 4_2024-05-07
2025-11-14 15:25:51,381 - INFO - Finished converting document 4_2024-05-07 in 0.05 sec.
2025-11-14 15:25:51,412 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:51,421 - INFO - Going to convert document batch...
2025-11-14 15:25:51,421 - INFO - Processing document 4_2024-07-02
2025-11-14 15:25:51,439 - INFO - Finished converting document 4_2024-07-02 in 0.05 sec.
2025-11-14 15:25:51,472 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:51,484 - INFO - Going to convert document batch...
2025-11-14 15:25:51,485 - INFO - Processing document 4_2024-07-19
2025-11-14 15:25:51,517 - INFO - Finished converting document 4_2024-07-19 in 0.06 sec.


Converted 'data\edgar_documents\ABBV\4_2024-04-02' --> 'data\processed_data\ABBV\4_2024-04-02.md'
Converted 'data\edgar_documents\ABBV\4_2024-05-07' --> 'data\processed_data\ABBV\4_2024-05-07.md'
Converted 'data\edgar_documents\ABBV\4_2024-07-02' --> 'data\processed_data\ABBV\4_2024-07-02.md'


2025-11-14 15:25:51,564 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:51,579 - INFO - Going to convert document batch...
2025-11-14 15:25:51,580 - INFO - Processing document 4_2024-08-07
2025-11-14 15:25:51,602 - INFO - Finished converting document 4_2024-08-07 in 0.05 sec.
2025-11-14 15:25:51,634 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:51,642 - INFO - Going to convert document batch...
2025-11-14 15:25:51,642 - INFO - Processing document 4_2024-09-30
2025-11-14 15:25:51,661 - INFO - Finished converting document 4_2024-09-30 in 0.03 sec.
2025-11-14 15:25:51,692 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:51,700 - INFO - Going to convert document batch...
2025-11-14 15:25:51,701 - INFO - Processing document 4_2024-10-02
2025-11-14 15:25:51,719 - INFO - Finished converting document 4_2024-10-02 in 0.05 sec.


Converted 'data\edgar_documents\ABBV\4_2024-07-19' --> 'data\processed_data\ABBV\4_2024-07-19.md'
Converted 'data\edgar_documents\ABBV\4_2024-08-07' --> 'data\processed_data\ABBV\4_2024-08-07.md'
Converted 'data\edgar_documents\ABBV\4_2024-09-30' --> 'data\processed_data\ABBV\4_2024-09-30.md'
Converted 'data\edgar_documents\ABBV\4_2024-10-02' --> 'data\processed_data\ABBV\4_2024-10-02.md'


2025-11-14 15:25:51,768 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:51,782 - INFO - Going to convert document batch...
2025-11-14 15:25:51,783 - INFO - Processing document 4_2024-12-18
2025-11-14 15:25:51,802 - INFO - Finished converting document 4_2024-12-18 in 0.06 sec.
2025-11-14 15:25:51,834 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:51,841 - INFO - Going to convert document batch...
2025-11-14 15:25:51,842 - INFO - Processing document 4_2025-01-03
2025-11-14 15:25:51,862 - INFO - Finished converting document 4_2025-01-03 in 0.05 sec.
2025-11-14 15:25:51,892 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:51,902 - INFO - Going to convert document batch...
2025-11-14 15:25:51,903 - INFO - Processing document 4_2025-02-07
2025-11-14 15:25:51,928 - INFO - Finished converting document 4_2025-02-07 in 0.05 sec.
2025-11-14 15:25:51,965 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\ABBV\4_2024-12-18' --> 'data\processed_data\ABBV\4_2024-12-18.md'
Converted 'data\edgar_documents\ABBV\4_2025-01-03' --> 'data\processed_data\ABBV\4_2025-01-03.md'
Converted 'data\edgar_documents\ABBV\4_2025-02-07' --> 'data\processed_data\ABBV\4_2025-02-07.md'


2025-11-14 15:25:52,047 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:25:52,048 - ERROR - Input document 4_2025-02-20 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:25:52,050 - INFO - Going to convert document batch...
2025-11-14 15:25:52,062 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:52,071 - INFO - Going to convert document batch...
2025-11-14 15:25:52,072 - INFO - Processing document 4_2025-02-24
2025-11-14 15:25:52,090 - INFO - Fin

Converted 'data\edgar_documents\ABBV\4_2025-02-18' --> 'data\processed_data\ABBV\4_2025-02-18.md'
Error processing data\edgar_documents\ABBV\4_2025-02-20: File format not allowed: data\edgar_documents\ABBV\4_2025-02-20
Converted 'data\edgar_documents\ABBV\4_2025-02-24' --> 'data\processed_data\ABBV\4_2025-02-24.md'
Converted 'data\edgar_documents\ABBV\4_2025-02-28' --> 'data\processed_data\ABBV\4_2025-02-28.md'


2025-11-14 15:25:52,204 - INFO - Processing document 4_2025-03-04
2025-11-14 15:25:52,222 - INFO - Finished converting document 4_2025-03-04 in 0.03 sec.
2025-11-14 15:25:52,252 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:52,259 - INFO - Going to convert document batch...
2025-11-14 15:25:52,260 - INFO - Processing document 4_2025-03-18
2025-11-14 15:25:52,277 - INFO - Finished converting document 4_2025-03-18 in 0.05 sec.
2025-11-14 15:25:52,338 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:52,349 - INFO - Going to convert document batch...
2025-11-14 15:25:52,349 - INFO - Processing document 4_2025-04-02
2025-11-14 15:25:52,368 - INFO - Finished converting document 4_2025-04-02 in 0.05 sec.
2025-11-14 15:25:52,400 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:52,409 - INFO - Going to convert document batch...
2025-11-14 15:25:52,410 - INFO - Processing document 4_2025-05-13
2025-11-14 15:25:52,429 - IN

Converted 'data\edgar_documents\ABBV\4_2025-03-04' --> 'data\processed_data\ABBV\4_2025-03-04.md'
Converted 'data\edgar_documents\ABBV\4_2025-03-18' --> 'data\processed_data\ABBV\4_2025-03-18.md'
Converted 'data\edgar_documents\ABBV\4_2025-04-02' --> 'data\processed_data\ABBV\4_2025-04-02.md'


2025-11-14 15:25:52,462 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:52,469 - INFO - Going to convert document batch...
2025-11-14 15:25:52,471 - INFO - Processing document 4_2025-07-02
2025-11-14 15:25:52,491 - INFO - Finished converting document 4_2025-07-02 in 0.03 sec.
2025-11-14 15:25:52,542 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:52,555 - INFO - Going to convert document batch...
2025-11-14 15:25:52,556 - INFO - Processing document 4_2025-08-07
2025-11-14 15:25:52,577 - INFO - Finished converting document 4_2025-08-07 in 0.06 sec.
2025-11-14 15:25:52,610 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:52,620 - INFO - Going to convert document batch...
2025-11-14 15:25:52,620 - INFO - Processing document 4_2025-08-14
2025-11-14 15:25:52,642 - INFO - Finished converting document 4_2025-08-14 in 0.05 sec.


Converted 'data\edgar_documents\ABBV\4_2025-05-13' --> 'data\processed_data\ABBV\4_2025-05-13.md'
Converted 'data\edgar_documents\ABBV\4_2025-07-02' --> 'data\processed_data\ABBV\4_2025-07-02.md'
Converted 'data\edgar_documents\ABBV\4_2025-08-07' --> 'data\processed_data\ABBV\4_2025-08-07.md'


2025-11-14 15:25:52,676 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:52,684 - INFO - Going to convert document batch...
2025-11-14 15:25:52,685 - INFO - Processing document 4_2025-10-02
2025-11-14 15:25:52,704 - INFO - Finished converting document 4_2025-10-02 in 0.05 sec.
2025-11-14 15:25:52,736 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:52,753 - INFO - Going to convert document batch...
2025-11-14 15:25:52,754 - INFO - Processing document 8-K_2023-01-06
2025-11-14 15:25:52,774 - INFO - Finished converting document 8-K_2023-01-06 in 0.05 sec.
2025-11-14 15:25:52,801 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:52,816 - INFO - Going to convert document batch...
2025-11-14 15:25:52,816 - INFO - Processing document 8-K_2023-01-10
2025-11-14 15:25:52,838 - INFO - Finished converting document 8-K_2023-01-10 in 0.05 sec.


Converted 'data\edgar_documents\ABBV\4_2025-08-14' --> 'data\processed_data\ABBV\4_2025-08-14.md'
Converted 'data\edgar_documents\ABBV\4_2025-10-02' --> 'data\processed_data\ABBV\4_2025-10-02.md'
Converted 'data\edgar_documents\ABBV\8-K_2023-01-06' --> 'data\processed_data\ABBV\8-K_2023-01-06.md'


2025-11-14 15:25:52,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:52,887 - INFO - Going to convert document batch...
2025-11-14 15:25:52,889 - INFO - Processing document 8-K_2023-02-09
2025-11-14 15:25:52,912 - INFO - Finished converting document 8-K_2023-02-09 in 0.05 sec.
2025-11-14 15:25:52,935 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:52,950 - INFO - Going to convert document batch...
2025-11-14 15:25:52,951 - INFO - Processing document 8-K_2023-03-28
2025-11-14 15:25:52,976 - INFO - Finished converting document 8-K_2023-03-28 in 0.05 sec.
2025-11-14 15:25:53,025 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:53,044 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ABBV\8-K_2023-01-10' --> 'data\processed_data\ABBV\8-K_2023-01-10.md'
Converted 'data\edgar_documents\ABBV\8-K_2023-02-09' --> 'data\processed_data\ABBV\8-K_2023-02-09.md'
Converted 'data\edgar_documents\ABBV\8-K_2023-03-28' --> 'data\processed_data\ABBV\8-K_2023-03-28.md'


2025-11-14 15:25:53,045 - INFO - Processing document 8-K_2023-04-05
2025-11-14 15:25:53,068 - INFO - Finished converting document 8-K_2023-04-05 in 0.08 sec.
2025-11-14 15:25:53,090 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:53,108 - INFO - Going to convert document batch...
2025-11-14 15:25:53,110 - INFO - Processing document 8-K_2023-04-27
2025-11-14 15:25:53,132 - INFO - Finished converting document 8-K_2023-04-27 in 0.05 sec.
2025-11-14 15:25:53,154 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:53,179 - INFO - Going to convert document batch...
2025-11-14 15:25:53,179 - INFO - Processing document 8-K_2023-05-10
2025-11-14 15:25:53,221 - INFO - Finished converting document 8-K_2023-05-10 in 0.08 sec.
2025-11-14 15:25:53,254 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:53,266 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ABBV\8-K_2023-04-05' --> 'data\processed_data\ABBV\8-K_2023-04-05.md'
Converted 'data\edgar_documents\ABBV\8-K_2023-04-27' --> 'data\processed_data\ABBV\8-K_2023-04-27.md'
Converted 'data\edgar_documents\ABBV\8-K_2023-05-10' --> 'data\processed_data\ABBV\8-K_2023-05-10.md'


2025-11-14 15:25:53,267 - INFO - Processing document 8-K_2023-06-29
2025-11-14 15:25:53,288 - INFO - Finished converting document 8-K_2023-06-29 in 0.05 sec.
2025-11-14 15:25:53,316 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:53,333 - INFO - Going to convert document batch...
2025-11-14 15:25:53,334 - INFO - Processing document 8-K_2023-07-06
2025-11-14 15:25:53,355 - INFO - Finished converting document 8-K_2023-07-06 in 0.06 sec.
2025-11-14 15:25:53,381 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:53,396 - INFO - Going to convert document batch...
2025-11-14 15:25:53,398 - INFO - Processing document 8-K_2023-07-27
2025-11-14 15:25:53,416 - INFO - Finished converting document 8-K_2023-07-27 in 0.05 sec.
2025-11-14 15:25:53,440 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:53,456 - INFO - Going to convert document batch...
2025-11-14 15:25:53,457 - INFO - Processing document 8-K_2023-10-04
2025-11-14 15:

Converted 'data\edgar_documents\ABBV\8-K_2023-06-29' --> 'data\processed_data\ABBV\8-K_2023-06-29.md'
Converted 'data\edgar_documents\ABBV\8-K_2023-07-06' --> 'data\processed_data\ABBV\8-K_2023-07-06.md'
Converted 'data\edgar_documents\ABBV\8-K_2023-07-27' --> 'data\processed_data\ABBV\8-K_2023-07-27.md'


2025-11-14 15:25:53,503 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:53,521 - INFO - Going to convert document batch...
2025-11-14 15:25:53,521 - INFO - Processing document 8-K_2023-10-12
2025-11-14 15:25:53,550 - INFO - Finished converting document 8-K_2023-10-12 in 0.06 sec.
2025-11-14 15:25:53,581 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:53,596 - INFO - Going to convert document batch...
2025-11-14 15:25:53,597 - INFO - Processing document 8-K_2023-10-27
2025-11-14 15:25:53,619 - INFO - Finished converting document 8-K_2023-10-27 in 0.06 sec.
2025-11-14 15:25:53,646 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:53,662 - INFO - Going to convert document batch...
2025-11-14 15:25:53,663 - INFO - Processing document 8-K_2023-11-30
2025-11-14 15:25:53,688 - INFO - Finished converting document 8-K_2023-11-30 in 0.06 sec.


Converted 'data\edgar_documents\ABBV\8-K_2023-10-04' --> 'data\processed_data\ABBV\8-K_2023-10-04.md'
Converted 'data\edgar_documents\ABBV\8-K_2023-10-12' --> 'data\processed_data\ABBV\8-K_2023-10-12.md'
Converted 'data\edgar_documents\ABBV\8-K_2023-10-27' --> 'data\processed_data\ABBV\8-K_2023-10-27.md'


2025-11-14 15:25:53,720 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:53,736 - INFO - Going to convert document batch...
2025-11-14 15:25:53,737 - INFO - Processing document 8-K_2023-12-06


Converted 'data\edgar_documents\ABBV\8-K_2023-11-30' --> 'data\processed_data\ABBV\8-K_2023-11-30.md'


2025-11-14 15:25:54,243 - INFO - Finished converting document 8-K_2023-12-06 in 0.53 sec.
2025-11-14 15:25:54,308 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:54,328 - INFO - Going to convert document batch...
2025-11-14 15:25:54,329 - INFO - Processing document 8-K_2024-01-05
2025-11-14 15:25:54,349 - INFO - Finished converting document 8-K_2024-01-05 in 0.08 sec.
2025-11-14 15:25:54,372 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:54,384 - INFO - Going to convert document batch...
2025-11-14 15:25:54,385 - INFO - Processing document 8-K_2024-02-02
2025-11-14 15:25:54,405 - INFO - Finished converting document 8-K_2024-02-02 in 0.05 sec.
2025-11-14 15:25:54,427 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:54,440 - INFO - Going to convert document batch...
2025-11-14 15:25:54,441 - INFO - Processing document 8-K_2024-02-12
2025-11-14 15:25:54,473 - INFO - Finished converting document 8-K_2024-02-12 in 0.

Converted 'data\edgar_documents\ABBV\8-K_2023-12-06' --> 'data\processed_data\ABBV\8-K_2023-12-06.md'
Converted 'data\edgar_documents\ABBV\8-K_2024-01-05' --> 'data\processed_data\ABBV\8-K_2024-01-05.md'
Converted 'data\edgar_documents\ABBV\8-K_2024-02-02' --> 'data\processed_data\ABBV\8-K_2024-02-02.md'


2025-11-14 15:25:54,504 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:54,520 - INFO - Going to convert document batch...
2025-11-14 15:25:54,521 - INFO - Processing document 8-K_2024-02-20
2025-11-14 15:25:54,550 - INFO - Finished converting document 8-K_2024-02-20 in 0.06 sec.
2025-11-14 15:25:54,607 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:54,627 - INFO - Going to convert document batch...
2025-11-14 15:25:54,628 - INFO - Processing document 8-K_2024-02-26
2025-11-14 15:25:54,667 - INFO - Finished converting document 8-K_2024-02-26 in 0.09 sec.


Converted 'data\edgar_documents\ABBV\8-K_2024-02-12' --> 'data\processed_data\ABBV\8-K_2024-02-12.md'
Converted 'data\edgar_documents\ABBV\8-K_2024-02-20' --> 'data\processed_data\ABBV\8-K_2024-02-20.md'


2025-11-14 15:25:54,704 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:54,717 - INFO - Going to convert document batch...
2025-11-14 15:25:54,718 - INFO - Processing document 8-K_2024-04-03
2025-11-14 15:25:54,744 - INFO - Finished converting document 8-K_2024-04-03 in 0.05 sec.
2025-11-14 15:25:54,768 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:54,782 - INFO - Going to convert document batch...
2025-11-14 15:25:54,783 - INFO - Processing document 8-K_2024-04-26
2025-11-14 15:25:54,803 - INFO - Finished converting document 8-K_2024-04-26 in 0.05 sec.
2025-11-14 15:25:54,829 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:54,852 - INFO - Going to convert document batch...
2025-11-14 15:25:54,853 - INFO - Processing document 8-K_2024-05-08
2025-11-14 15:25:54,891 - INFO - Finished converting document 8-K_2024-05-08 in 0.08 sec.


Converted 'data\edgar_documents\ABBV\8-K_2024-02-26' --> 'data\processed_data\ABBV\8-K_2024-02-26.md'
Converted 'data\edgar_documents\ABBV\8-K_2024-04-03' --> 'data\processed_data\ABBV\8-K_2024-04-03.md'
Converted 'data\edgar_documents\ABBV\8-K_2024-04-26' --> 'data\processed_data\ABBV\8-K_2024-04-26.md'


2025-11-14 15:25:54,931 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:54,973 - INFO - Going to convert document batch...
2025-11-14 15:25:54,974 - INFO - Processing document 8-K_2024-07-03
2025-11-14 15:25:54,999 - INFO - Finished converting document 8-K_2024-07-03 in 0.09 sec.
2025-11-14 15:25:55,021 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:55,034 - INFO - Going to convert document batch...
2025-11-14 15:25:55,034 - INFO - Processing document 8-K_2024-07-25
2025-11-14 15:25:55,056 - INFO - Finished converting document 8-K_2024-07-25 in 0.05 sec.
2025-11-14 15:25:55,080 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:55,093 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ABBV\8-K_2024-05-08' --> 'data\processed_data\ABBV\8-K_2024-05-08.md'
Converted 'data\edgar_documents\ABBV\8-K_2024-07-03' --> 'data\processed_data\ABBV\8-K_2024-07-03.md'
Converted 'data\edgar_documents\ABBV\8-K_2024-07-25' --> 'data\processed_data\ABBV\8-K_2024-07-25.md'


2025-11-14 15:25:55,094 - INFO - Processing document 8-K_2024-09-10
2025-11-14 15:25:55,119 - INFO - Finished converting document 8-K_2024-09-10 in 0.05 sec.
2025-11-14 15:25:55,149 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:55,162 - INFO - Going to convert document batch...
2025-11-14 15:25:55,163 - INFO - Processing document 8-K_2024-10-03
2025-11-14 15:25:55,182 - INFO - Finished converting document 8-K_2024-10-03 in 0.05 sec.
2025-11-14 15:25:55,204 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:55,218 - INFO - Going to convert document batch...
2025-11-14 15:25:55,219 - INFO - Processing document 8-K_2024-10-30
2025-11-14 15:25:55,239 - INFO - Finished converting document 8-K_2024-10-30 in 0.05 sec.
2025-11-14 15:25:55,263 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:55,274 - INFO - Going to convert document batch...
2025-11-14 15:25:55,275 - INFO - Processing document 8-K_2024-12-13
2025-11-14 15:

Converted 'data\edgar_documents\ABBV\8-K_2024-09-10' --> 'data\processed_data\ABBV\8-K_2024-09-10.md'
Converted 'data\edgar_documents\ABBV\8-K_2024-10-03' --> 'data\processed_data\ABBV\8-K_2024-10-03.md'
Converted 'data\edgar_documents\ABBV\8-K_2024-10-30' --> 'data\processed_data\ABBV\8-K_2024-10-30.md'
Converted 'data\edgar_documents\ABBV\8-K_2024-12-13' --> 'data\processed_data\ABBV\8-K_2024-12-13.md'


2025-11-14 15:25:55,331 - INFO - Processing document 8-K_2025-01-06
2025-11-14 15:25:55,359 - INFO - Finished converting document 8-K_2025-01-06 in 0.06 sec.
2025-11-14 15:25:55,381 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:55,393 - INFO - Going to convert document batch...
2025-11-14 15:25:55,393 - INFO - Processing document 8-K_2025-01-10
2025-11-14 15:25:55,411 - INFO - Finished converting document 8-K_2025-01-10 in 0.05 sec.
2025-11-14 15:25:55,431 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:55,441 - INFO - Going to convert document batch...
2025-11-14 15:25:55,443 - INFO - Processing document 8-K_2025-01-31
2025-11-14 15:25:55,462 - INFO - Finished converting document 8-K_2025-01-31 in 0.03 sec.
2025-11-14 15:25:55,507 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:55,522 - INFO - Going to convert document batch...
2025-11-14 15:25:55,524 - INFO - Processing document 8-K_2025-02-05
2025-11-14 15:

Converted 'data\edgar_documents\ABBV\8-K_2025-01-06' --> 'data\processed_data\ABBV\8-K_2025-01-06.md'
Converted 'data\edgar_documents\ABBV\8-K_2025-01-10' --> 'data\processed_data\ABBV\8-K_2025-01-10.md'
Converted 'data\edgar_documents\ABBV\8-K_2025-01-31' --> 'data\processed_data\ABBV\8-K_2025-01-31.md'


2025-11-14 15:25:55,579 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:55,592 - INFO - Going to convert document batch...
2025-11-14 15:25:55,593 - INFO - Processing document 8-K_2025-02-14
2025-11-14 15:25:55,623 - INFO - Finished converting document 8-K_2025-02-14 in 0.06 sec.
2025-11-14 15:25:55,654 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:55,668 - INFO - Going to convert document batch...
2025-11-14 15:25:55,669 - INFO - Processing document 8-K_2025-02-19
2025-11-14 15:25:55,699 - INFO - Finished converting document 8-K_2025-02-19 in 0.06 sec.


Converted 'data\edgar_documents\ABBV\8-K_2025-02-05' --> 'data\processed_data\ABBV\8-K_2025-02-05.md'
Converted 'data\edgar_documents\ABBV\8-K_2025-02-14' --> 'data\processed_data\ABBV\8-K_2025-02-14.md'
Converted 'data\edgar_documents\ABBV\8-K_2025-02-19' --> 'data\processed_data\ABBV\8-K_2025-02-19.md'


2025-11-14 15:25:55,756 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:55,783 - INFO - Going to convert document batch...
2025-11-14 15:25:55,784 - INFO - Processing document 8-K_2025-02-26
2025-11-14 15:25:55,819 - INFO - Finished converting document 8-K_2025-02-26 in 0.09 sec.
2025-11-14 15:25:55,854 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:55,867 - INFO - Going to convert document batch...
2025-11-14 15:25:55,867 - INFO - Processing document 8-K_2025-04-03
2025-11-14 15:25:55,887 - INFO - Finished converting document 8-K_2025-04-03 in 0.05 sec.
2025-11-14 15:25:55,910 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:55,921 - INFO - Going to convert document batch...
2025-11-14 15:25:55,922 - INFO - Processing document 8-K_2025-04-25
2025-11-14 15:25:55,942 - INFO - Finished converting document 8-K_2025-04-25 in 0.05 sec.
2025-11-14 15:25:55,965 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\ABBV\8-K_2025-02-26' --> 'data\processed_data\ABBV\8-K_2025-02-26.md'
Converted 'data\edgar_documents\ABBV\8-K_2025-04-03' --> 'data\processed_data\ABBV\8-K_2025-04-03.md'
Converted 'data\edgar_documents\ABBV\8-K_2025-04-25' --> 'data\processed_data\ABBV\8-K_2025-04-25.md'


2025-11-14 15:25:56,044 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:56,059 - INFO - Going to convert document batch...
2025-11-14 15:25:56,059 - INFO - Processing document 8-K_2025-07-03
2025-11-14 15:25:56,081 - INFO - Finished converting document 8-K_2025-07-03 in 0.05 sec.
2025-11-14 15:25:56,122 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:56,143 - INFO - Going to convert document batch...
2025-11-14 15:25:56,144 - INFO - Processing document 8-K_2025-07-31
2025-11-14 15:25:56,166 - INFO - Finished converting document 8-K_2025-07-31 in 0.06 sec.
2025-11-14 15:25:56,186 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:56,197 - INFO - Going to convert document batch...
2025-11-14 15:25:56,198 - INFO - Processing document 8-K_2025-09-11


Converted 'data\edgar_documents\ABBV\8-K_2025-05-13' --> 'data\processed_data\ABBV\8-K_2025-05-13.md'
Converted 'data\edgar_documents\ABBV\8-K_2025-07-03' --> 'data\processed_data\ABBV\8-K_2025-07-03.md'
Converted 'data\edgar_documents\ABBV\8-K_2025-07-31' --> 'data\processed_data\ABBV\8-K_2025-07-31.md'


2025-11-14 15:25:56,217 - INFO - Finished converting document 8-K_2025-09-11 in 0.05 sec.
2025-11-14 15:25:56,250 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:56,263 - INFO - Going to convert document batch...
2025-11-14 15:25:56,264 - INFO - Processing document 8-K_2025-10-03
2025-11-14 15:25:56,284 - INFO - Finished converting document 8-K_2025-10-03 in 0.05 sec.
2025-11-14 15:25:56,310 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:25:56,321 - INFO - Going to convert document batch...
2025-11-14 15:25:56,321 - INFO - Processing document 8-K_2025-10-31
2025-11-14 15:25:56,339 - INFO - Finished converting document 8-K_2025-10-31 in 0.05 sec.
2025-11-14 15:25:56,408 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABBV\8-K_2025-09-11' --> 'data\processed_data\ABBV\8-K_2025-09-11.md'
Converted 'data\edgar_documents\ABBV\8-K_2025-10-03' --> 'data\processed_data\ABBV\8-K_2025-10-03.md'
Converted 'data\edgar_documents\ABBV\8-K_2025-10-31' --> 'data\processed_data\ABBV\8-K_2025-10-31.md'


2025-11-14 15:25:57,301 - INFO - Going to convert document batch...
2025-11-14 15:25:57,302 - INFO - Processing document DEF-14A_2023-03-20
2025-11-14 15:26:01,382 - INFO - Finished converting document DEF-14A_2023-03-20 in 5.03 sec.
2025-11-14 15:26:02,132 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABBV\DEF-14A_2023-03-20' --> 'data\processed_data\ABBV\DEF-14A_2023-03-20.md'


2025-11-14 15:26:02,778 - INFO - Going to convert document batch...
2025-11-14 15:26:02,779 - INFO - Processing document DEF-14A_2024-03-18
2025-11-14 15:26:06,912 - INFO - Finished converting document DEF-14A_2024-03-18 in 4.83 sec.
2025-11-14 15:26:07,675 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABBV\DEF-14A_2024-03-18' --> 'data\processed_data\ABBV\DEF-14A_2024-03-18.md'


2025-11-14 15:26:08,382 - INFO - Going to convert document batch...
2025-11-14 15:26:08,383 - INFO - Processing document DEF-14A_2025-03-24
2025-11-14 15:26:12,953 - INFO - Finished converting document DEF-14A_2025-03-24 in 5.34 sec.
2025-11-14 15:26:13,740 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABBV\DEF-14A_2025-03-24' --> 'data\processed_data\ABBV\DEF-14A_2025-03-24.md'
Processed 109 new files. Errors: 3
Found 82 files to process in data\edgar_documents\ABT


2025-11-14 15:26:14,283 - INFO - Going to convert document batch...
2025-11-14 15:26:14,284 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:26:14,285 - INFO - Processing document 10-K_2023-02-17
2025-11-14 15:26:15,370 - INFO - Finished converting document 10-K_2023-02-17 in 1.69 sec.
2025-11-14 15:26:15,908 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABT\10-K_2023-02-17' --> 'data\processed_data\ABT\10-K_2023-02-17.md'


2025-11-14 15:26:16,907 - INFO - Going to convert document batch...
2025-11-14 15:26:16,908 - INFO - Processing document 10-K_2024-02-16
2025-11-14 15:26:17,975 - INFO - Finished converting document 10-K_2024-02-16 in 2.11 sec.
2025-11-14 15:26:18,515 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABT\10-K_2024-02-16' --> 'data\processed_data\ABT\10-K_2024-02-16.md'


2025-11-14 15:26:19,426 - INFO - Going to convert document batch...
2025-11-14 15:26:19,428 - INFO - Processing document 10-K_2025-02-21
2025-11-14 15:26:20,555 - INFO - Finished converting document 10-K_2025-02-21 in 2.09 sec.
2025-11-14 15:26:21,085 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABT\10-K_2025-02-21' --> 'data\processed_data\ABT\10-K_2025-02-21.md'


2025-11-14 15:26:21,308 - INFO - Going to convert document batch...
2025-11-14 15:26:21,309 - INFO - Processing document 10-Q_2023-05-04
2025-11-14 15:26:21,727 - INFO - Finished converting document 10-Q_2023-05-04 in 0.67 sec.
2025-11-14 15:26:21,982 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABT\10-Q_2023-05-04' --> 'data\processed_data\ABT\10-Q_2023-05-04.md'


2025-11-14 15:26:22,690 - INFO - Going to convert document batch...
2025-11-14 15:26:22,690 - INFO - Processing document 10-Q_2023-08-03
2025-11-14 15:26:23,302 - INFO - Finished converting document 10-Q_2023-08-03 in 1.34 sec.
2025-11-14 15:26:23,624 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABT\10-Q_2023-08-03' --> 'data\processed_data\ABT\10-Q_2023-08-03.md'


2025-11-14 15:26:23,950 - INFO - Going to convert document batch...
2025-11-14 15:26:23,951 - INFO - Processing document 10-Q_2023-11-01
2025-11-14 15:26:24,550 - INFO - Finished converting document 10-Q_2023-11-01 in 0.95 sec.
2025-11-14 15:26:25,180 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABT\10-Q_2023-11-01' --> 'data\processed_data\ABT\10-Q_2023-11-01.md'


2025-11-14 15:26:25,399 - INFO - Going to convert document batch...
2025-11-14 15:26:25,400 - INFO - Processing document 10-Q_2024-05-02
2025-11-14 15:26:25,829 - INFO - Finished converting document 10-Q_2024-05-02 in 0.67 sec.
2025-11-14 15:26:26,098 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABT\10-Q_2024-05-02' --> 'data\processed_data\ABT\10-Q_2024-05-02.md'


2025-11-14 15:26:26,406 - INFO - Going to convert document batch...
2025-11-14 15:26:26,407 - INFO - Processing document 10-Q_2024-07-31
2025-11-14 15:26:27,024 - INFO - Finished converting document 10-Q_2024-07-31 in 0.95 sec.
2025-11-14 15:26:27,349 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABT\10-Q_2024-07-31' --> 'data\processed_data\ABT\10-Q_2024-07-31.md'


2025-11-14 15:26:27,953 - INFO - Going to convert document batch...
2025-11-14 15:26:27,954 - INFO - Processing document 10-Q_2024-10-31
2025-11-14 15:26:28,543 - INFO - Finished converting document 10-Q_2024-10-31 in 1.23 sec.
2025-11-14 15:26:28,864 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABT\10-Q_2024-10-31' --> 'data\processed_data\ABT\10-Q_2024-10-31.md'


2025-11-14 15:26:29,104 - INFO - Going to convert document batch...
2025-11-14 15:26:29,105 - INFO - Processing document 10-Q_2025-04-30
2025-11-14 15:26:29,568 - INFO - Finished converting document 10-Q_2025-04-30 in 0.73 sec.
2025-11-14 15:26:29,839 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABT\10-Q_2025-04-30' --> 'data\processed_data\ABT\10-Q_2025-04-30.md'


2025-11-14 15:26:30,449 - INFO - Going to convert document batch...
2025-11-14 15:26:30,450 - INFO - Processing document 10-Q_2025-07-30
2025-11-14 15:26:31,120 - INFO - Finished converting document 10-Q_2025-07-30 in 1.33 sec.
2025-11-14 15:26:31,474 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABT\10-Q_2025-07-30' --> 'data\processed_data\ABT\10-Q_2025-07-30.md'


2025-11-14 15:26:32,093 - INFO - Going to convert document batch...
2025-11-14 15:26:32,094 - INFO - Processing document 10-Q_2025-10-29
2025-11-14 15:26:32,732 - INFO - Finished converting document 10-Q_2025-10-29 in 1.30 sec.
2025-11-14 15:26:33,077 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:33,086 - INFO - Going to convert document batch...
2025-11-14 15:26:33,087 - INFO - Processing document 4_2023-01-03
2025-11-14 15:26:33,108 - INFO - Finished converting document 4_2023-01-03 in 0.05 sec.
2025-11-14 15:26:33,142 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:33,152 - INFO - Going to convert document batch...
2025-11-14 15:26:33,152 - INFO - Processing document 4_2023-01-04
2025-11-14 15:26:33,172 - INFO - Finished converting document 4_2023-01-04 in 0.05 sec.
2025-11-14 15:26:33,221 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:33,230 - INFO - Going to convert document batch...
2025-11-14 15:26:33,

Converted 'data\edgar_documents\ABT\10-Q_2025-10-29' --> 'data\processed_data\ABT\10-Q_2025-10-29.md'
Converted 'data\edgar_documents\ABT\4_2023-01-03' --> 'data\processed_data\ABT\4_2023-01-03.md'
Converted 'data\edgar_documents\ABT\4_2023-01-04' --> 'data\processed_data\ABT\4_2023-01-04.md'


2025-11-14 15:26:33,287 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:33,298 - INFO - Going to convert document batch...
2025-11-14 15:26:33,299 - INFO - Processing document 4_2023-03-02
2025-11-14 15:26:33,321 - INFO - Finished converting document 4_2023-03-02 in 0.05 sec.
2025-11-14 15:26:33,375 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:33,385 - INFO - Going to convert document batch...
2025-11-14 15:26:33,386 - INFO - Processing document 4_2023-04-04
2025-11-14 15:26:33,407 - INFO - Finished converting document 4_2023-04-04 in 0.06 sec.
2025-11-14 15:26:33,464 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABT\4_2023-02-22' --> 'data\processed_data\ABT\4_2023-02-22.md'
Converted 'data\edgar_documents\ABT\4_2023-03-02' --> 'data\processed_data\ABT\4_2023-03-02.md'
Converted 'data\edgar_documents\ABT\4_2023-04-04' --> 'data\processed_data\ABT\4_2023-04-04.md'


2025-11-14 15:26:33,473 - INFO - Going to convert document batch...
2025-11-14 15:26:33,474 - INFO - Processing document 4_2023-05-02
2025-11-14 15:26:33,492 - INFO - Finished converting document 4_2023-05-02 in 0.05 sec.
2025-11-14 15:26:33,531 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:33,540 - INFO - Going to convert document batch...
2025-11-14 15:26:33,541 - INFO - Processing document 4_2023-05-03
2025-11-14 15:26:33,561 - INFO - Finished converting document 4_2023-05-03 in 0.05 sec.
2025-11-14 15:26:33,603 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:33,610 - INFO - Going to convert document batch...
2025-11-14 15:26:33,610 - INFO - Processing document 4_2023-06-20
2025-11-14 15:26:33,633 - INFO - Finished converting document 4_2023-06-20 in 0.03 sec.
2025-11-14 15:26:33,669 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:33,678 - INFO - Going to convert document batch...
2025-11-14 15:26:33,679 - 

Converted 'data\edgar_documents\ABT\4_2023-05-02' --> 'data\processed_data\ABT\4_2023-05-02.md'
Converted 'data\edgar_documents\ABT\4_2023-05-03' --> 'data\processed_data\ABT\4_2023-05-03.md'
Converted 'data\edgar_documents\ABT\4_2023-06-20' --> 'data\processed_data\ABT\4_2023-06-20.md'


2025-11-14 15:26:33,739 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:33,756 - INFO - Going to convert document batch...
2025-11-14 15:26:33,757 - INFO - Processing document 4_2023-07-28
2025-11-14 15:26:33,805 - INFO - Finished converting document 4_2023-07-28 in 0.08 sec.
2025-11-14 15:26:33,877 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:33,890 - INFO - Going to convert document batch...
2025-11-14 15:26:33,891 - INFO - Processing document 4_2023-08-10
2025-11-14 15:26:33,916 - INFO - Finished converting document 4_2023-08-10 in 0.06 sec.


Converted 'data\edgar_documents\ABT\4_2023-07-05' --> 'data\processed_data\ABT\4_2023-07-05.md'
Converted 'data\edgar_documents\ABT\4_2023-07-28' --> 'data\processed_data\ABT\4_2023-07-28.md'


2025-11-14 15:26:33,951 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:33,963 - INFO - Going to convert document batch...
2025-11-14 15:26:33,964 - INFO - Processing document 4_2023-09-06
2025-11-14 15:26:33,985 - INFO - Finished converting document 4_2023-09-06 in 0.05 sec.
2025-11-14 15:26:34,020 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:34,030 - INFO - Going to convert document batch...
2025-11-14 15:26:34,031 - INFO - Processing document 4_2023-09-15
2025-11-14 15:26:34,052 - INFO - Finished converting document 4_2023-09-15 in 0.05 sec.
2025-11-14 15:26:34,104 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:34,114 - INFO - Going to convert document batch...
2025-11-14 15:26:34,115 - INFO - Processing document 4_2023-10-03
2025-11-14 15:26:34,134 - INFO - Finished converting document 4_2023-10-03 in 0.05 sec.


Converted 'data\edgar_documents\ABT\4_2023-08-10' --> 'data\processed_data\ABT\4_2023-08-10.md'
Converted 'data\edgar_documents\ABT\4_2023-09-06' --> 'data\processed_data\ABT\4_2023-09-06.md'
Converted 'data\edgar_documents\ABT\4_2023-09-15' --> 'data\processed_data\ABT\4_2023-09-15.md'


2025-11-14 15:26:34,171 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:34,180 - INFO - Going to convert document batch...
2025-11-14 15:26:34,181 - INFO - Processing document 4_2023-10-30
2025-11-14 15:26:34,256 - INFO - Finished converting document 4_2023-10-30 in 0.09 sec.
2025-11-14 15:26:34,321 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:34,337 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ABT\4_2023-10-03' --> 'data\processed_data\ABT\4_2023-10-03.md'
Converted 'data\edgar_documents\ABT\4_2023-10-30' --> 'data\processed_data\ABT\4_2023-10-30.md'


2025-11-14 15:26:34,338 - INFO - Processing document 4_2023-12-18
2025-11-14 15:26:34,374 - INFO - Finished converting document 4_2023-12-18 in 0.09 sec.
2025-11-14 15:26:34,407 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:34,415 - INFO - Going to convert document batch...
2025-11-14 15:26:34,416 - INFO - Processing document 4_2024-01-03
2025-11-14 15:26:34,435 - INFO - Finished converting document 4_2024-01-03 in 0.05 sec.
2025-11-14 15:26:34,468 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:34,479 - INFO - Going to convert document batch...
2025-11-14 15:26:34,481 - INFO - Processing document 4_2024-01-31
2025-11-14 15:26:34,503 - INFO - Finished converting document 4_2024-01-31 in 0.05 sec.
2025-11-14 15:26:34,537 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:34,546 - INFO - Going to convert document batch...
2025-11-14 15:26:34,547 - INFO - Processing document 4_2024-02-23
2025-11-14 15:26:34,566 - IN

Converted 'data\edgar_documents\ABT\4_2023-12-18' --> 'data\processed_data\ABT\4_2023-12-18.md'
Converted 'data\edgar_documents\ABT\4_2024-01-03' --> 'data\processed_data\ABT\4_2024-01-03.md'
Converted 'data\edgar_documents\ABT\4_2024-01-31' --> 'data\processed_data\ABT\4_2024-01-31.md'


2025-11-14 15:26:34,598 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:34,608 - INFO - Going to convert document batch...
2025-11-14 15:26:34,609 - INFO - Processing document 4_2024-02-27
2025-11-14 15:26:34,631 - INFO - Finished converting document 4_2024-02-27 in 0.05 sec.
2025-11-14 15:26:34,664 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:34,671 - INFO - Going to convert document batch...
2025-11-14 15:26:34,671 - INFO - Processing document 4_2024-03-04
2025-11-14 15:26:34,687 - INFO - Finished converting document 4_2024-03-04 in 0.03 sec.
2025-11-14 15:26:34,720 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:34,728 - INFO - Going to convert document batch...
2025-11-14 15:26:34,729 - INFO - Processing document 4_2024-04-02
2025-11-14 15:26:34,752 - INFO - Finished converting document 4_2024-04-02 in 0.05 sec.


Converted 'data\edgar_documents\ABT\4_2024-02-23' --> 'data\processed_data\ABT\4_2024-02-23.md'
Converted 'data\edgar_documents\ABT\4_2024-02-27' --> 'data\processed_data\ABT\4_2024-02-27.md'
Converted 'data\edgar_documents\ABT\4_2024-03-04' --> 'data\processed_data\ABT\4_2024-03-04.md'
Converted 'data\edgar_documents\ABT\4_2024-04-02' --> 'data\processed_data\ABT\4_2024-04-02.md'


2025-11-14 15:26:34,800 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:34,809 - INFO - Going to convert document batch...
2025-11-14 15:26:34,810 - INFO - Processing document 4_2024-04-30
2025-11-14 15:26:34,828 - INFO - Finished converting document 4_2024-04-30 in 0.06 sec.
2025-11-14 15:26:34,862 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:34,870 - INFO - Going to convert document batch...
2025-11-14 15:26:34,871 - INFO - Processing document 4_2024-05-08
2025-11-14 15:26:34,889 - INFO - Finished converting document 4_2024-05-08 in 0.05 sec.
2025-11-14 15:26:34,920 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:34,930 - INFO - Going to convert document batch...
2025-11-14 15:26:34,932 - INFO - Processing document 4_2024-05-14
2025-11-14 15:26:34,956 - INFO - Finished converting document 4_2024-05-14 in 0.05 sec.
2025-11-14 15:26:34,992 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\ABT\4_2024-04-30' --> 'data\processed_data\ABT\4_2024-04-30.md'
Converted 'data\edgar_documents\ABT\4_2024-05-08' --> 'data\processed_data\ABT\4_2024-05-08.md'
Converted 'data\edgar_documents\ABT\4_2024-05-14' --> 'data\processed_data\ABT\4_2024-05-14.md'
Converted 'data\edgar_documents\ABT\4_2024-07-02' --> 'data\processed_data\ABT\4_2024-07-02.md'


2025-11-14 15:26:35,064 - INFO - Going to convert document batch...
2025-11-14 15:26:35,065 - INFO - Processing document 4_2024-09-04
2025-11-14 15:26:35,087 - INFO - Finished converting document 4_2024-09-04 in 0.03 sec.
2025-11-14 15:26:35,122 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:35,133 - INFO - Going to convert document batch...
2025-11-14 15:26:35,134 - INFO - Processing document 4_2024-09-13
2025-11-14 15:26:35,160 - INFO - Finished converting document 4_2024-09-13 in 0.05 sec.
2025-11-14 15:26:35,218 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:35,231 - INFO - Going to convert document batch...
2025-11-14 15:26:35,232 - INFO - Processing document 4_2024-10-01
2025-11-14 15:26:35,256 - INFO - Finished converting document 4_2024-10-01 in 0.06 sec.
2025-11-14 15:26:35,288 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:35,298 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ABT\4_2024-09-04' --> 'data\processed_data\ABT\4_2024-09-04.md'
Converted 'data\edgar_documents\ABT\4_2024-09-13' --> 'data\processed_data\ABT\4_2024-09-13.md'
Converted 'data\edgar_documents\ABT\4_2024-10-01' --> 'data\processed_data\ABT\4_2024-10-01.md'


2025-11-14 15:26:35,299 - INFO - Processing document 4_2024-10-23
2025-11-14 15:26:35,323 - INFO - Finished converting document 4_2024-10-23 in 0.06 sec.
2025-11-14 15:26:35,380 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:35,389 - INFO - Going to convert document batch...
2025-11-14 15:26:35,390 - INFO - Processing document 4_2025-01-03
2025-11-14 15:26:35,408 - INFO - Finished converting document 4_2025-01-03 in 0.06 sec.
2025-11-14 15:26:35,440 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:35,449 - INFO - Going to convert document batch...
2025-11-14 15:26:35,450 - INFO - Processing document 4_2025-01-30
2025-11-14 15:26:35,468 - INFO - Finished converting document 4_2025-01-30 in 0.05 sec.
2025-11-14 15:26:35,502 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:35,512 - INFO - Going to convert document batch...
2025-11-14 15:26:35,514 - INFO - Processing document 4_2025-01-31
2025-11-14 15:26:35,540 - IN

Converted 'data\edgar_documents\ABT\4_2024-10-23' --> 'data\processed_data\ABT\4_2024-10-23.md'
Converted 'data\edgar_documents\ABT\4_2025-01-03' --> 'data\processed_data\ABT\4_2025-01-03.md'
Converted 'data\edgar_documents\ABT\4_2025-01-30' --> 'data\processed_data\ABT\4_2025-01-30.md'


2025-11-14 15:26:35,599 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:35,611 - INFO - Going to convert document batch...
2025-11-14 15:26:35,613 - INFO - Processing document 4_2025-02-07
2025-11-14 15:26:35,640 - INFO - Finished converting document 4_2025-02-07 in 0.08 sec.
2025-11-14 15:26:35,678 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:35,689 - INFO - Going to convert document batch...
2025-11-14 15:26:35,690 - INFO - Processing document 4_2025-02-27
2025-11-14 15:26:35,709 - INFO - Finished converting document 4_2025-02-27 in 0.05 sec.
2025-11-14 15:26:35,744 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABT\4_2025-01-31' --> 'data\processed_data\ABT\4_2025-01-31.md'
Converted 'data\edgar_documents\ABT\4_2025-02-07' --> 'data\processed_data\ABT\4_2025-02-07.md'
Converted 'data\edgar_documents\ABT\4_2025-02-27' --> 'data\processed_data\ABT\4_2025-02-27.md'


2025-11-14 15:26:35,753 - INFO - Going to convert document batch...
2025-11-14 15:26:35,754 - INFO - Processing document 4_2025-03-04
2025-11-14 15:26:35,772 - INFO - Finished converting document 4_2025-03-04 in 0.03 sec.
2025-11-14 15:26:35,803 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:35,816 - INFO - Going to convert document batch...
2025-11-14 15:26:35,817 - INFO - Processing document 4_2025-03-07
2025-11-14 15:26:35,840 - INFO - Finished converting document 4_2025-03-07 in 0.05 sec.
2025-11-14 15:26:35,876 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:35,885 - INFO - Going to convert document batch...
2025-11-14 15:26:35,885 - INFO - Processing document 4_2025-04-02
2025-11-14 15:26:35,904 - INFO - Finished converting document 4_2025-04-02 in 0.05 sec.
2025-11-14 15:26:35,935 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:35,944 - INFO - Going to convert document batch...
2025-11-14 15:26:35,945 - 

Converted 'data\edgar_documents\ABT\4_2025-03-04' --> 'data\processed_data\ABT\4_2025-03-04.md'
Converted 'data\edgar_documents\ABT\4_2025-03-07' --> 'data\processed_data\ABT\4_2025-03-07.md'
Converted 'data\edgar_documents\ABT\4_2025-04-02' --> 'data\processed_data\ABT\4_2025-04-02.md'


2025-11-14 15:26:35,999 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:36,007 - INFO - Going to convert document batch...
2025-11-14 15:26:36,008 - INFO - Processing document 4_2025-05-02
2025-11-14 15:26:36,027 - INFO - Finished converting document 4_2025-05-02 in 0.05 sec.
2025-11-14 15:26:36,078 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:36,089 - INFO - Going to convert document batch...
2025-11-14 15:26:36,090 - INFO - Processing document 4_2025-07-01
2025-11-14 15:26:36,108 - INFO - Finished converting document 4_2025-07-01 in 0.06 sec.
2025-11-14 15:26:36,142 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:36,150 - INFO - Going to convert document batch...
2025-11-14 15:26:36,151 - INFO - Processing document 4_2025-08-11
2025-11-14 15:26:36,168 - INFO - Finished converting document 4_2025-08-11 in 0.05 sec.


Converted 'data\edgar_documents\ABT\4_2025-04-29' --> 'data\processed_data\ABT\4_2025-04-29.md'
Converted 'data\edgar_documents\ABT\4_2025-05-02' --> 'data\processed_data\ABT\4_2025-05-02.md'
Converted 'data\edgar_documents\ABT\4_2025-07-01' --> 'data\processed_data\ABT\4_2025-07-01.md'


2025-11-14 15:26:36,202 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:36,212 - INFO - Going to convert document batch...
2025-11-14 15:26:36,213 - INFO - Processing document 4_2025-09-03
2025-11-14 15:26:36,234 - INFO - Finished converting document 4_2025-09-03 in 0.05 sec.
2025-11-14 15:26:36,286 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:36,302 - INFO - Going to convert document batch...
2025-11-14 15:26:36,303 - INFO - Processing document 4_2025-10-02
2025-11-14 15:26:36,323 - INFO - Finished converting document 4_2025-10-02 in 0.08 sec.


Converted 'data\edgar_documents\ABT\4_2025-08-11' --> 'data\processed_data\ABT\4_2025-08-11.md'
Converted 'data\edgar_documents\ABT\4_2025-09-03' --> 'data\processed_data\ABT\4_2025-09-03.md'
Converted 'data\edgar_documents\ABT\4_2025-10-02' --> 'data\processed_data\ABT\4_2025-10-02.md'


2025-11-14 15:26:36,399 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:36,432 - INFO - Going to convert document batch...
2025-11-14 15:26:36,434 - INFO - Processing document 8-K_2023-01-25
2025-11-14 15:26:36,466 - INFO - Finished converting document 8-K_2023-01-25 in 0.11 sec.
2025-11-14 15:26:36,501 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:36,510 - INFO - Going to convert document batch...
2025-11-14 15:26:36,511 - INFO - Processing document 8-K_2023-02-17
2025-11-14 15:26:36,529 - INFO - Finished converting document 8-K_2023-02-17 in 0.05 sec.
2025-11-14 15:26:36,554 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:36,566 - INFO - Going to convert document batch...
2025-11-14 15:26:36,567 - INFO - Processing document 8-K_2023-04-19
2025-11-14 15:26:36,582 - INFO - Finished converting document 8-K_2023-04-19 in 0.03 sec.
2025-11-14 15:26:36,606 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\ABT\8-K_2023-01-25' --> 'data\processed_data\ABT\8-K_2023-01-25.md'
Converted 'data\edgar_documents\ABT\8-K_2023-02-17' --> 'data\processed_data\ABT\8-K_2023-02-17.md'
Converted 'data\edgar_documents\ABT\8-K_2023-04-19' --> 'data\processed_data\ABT\8-K_2023-04-19.md'


2025-11-14 15:26:36,740 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:36,784 - INFO - Going to convert document batch...
2025-11-14 15:26:36,786 - INFO - Processing document 8-K_2023-06-09
2025-11-14 15:26:36,811 - INFO - Finished converting document 8-K_2023-06-09 in 0.12 sec.
2025-11-14 15:26:36,855 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:36,872 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ABT\8-K_2023-05-02' --> 'data\processed_data\ABT\8-K_2023-05-02.md'
Converted 'data\edgar_documents\ABT\8-K_2023-06-09' --> 'data\processed_data\ABT\8-K_2023-06-09.md'


2025-11-14 15:26:36,873 - INFO - Processing document 8-K_2023-06-12
2025-11-14 15:26:36,895 - INFO - Finished converting document 8-K_2023-06-12 in 0.06 sec.
2025-11-14 15:26:36,927 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:36,939 - INFO - Going to convert document batch...
2025-11-14 15:26:36,940 - INFO - Processing document 8-K_2023-07-20
2025-11-14 15:26:36,956 - INFO - Finished converting document 8-K_2023-07-20 in 0.05 sec.
2025-11-14 15:26:36,978 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:36,988 - INFO - Going to convert document batch...
2025-11-14 15:26:36,989 - INFO - Processing document 8-K_2023-09-01
2025-11-14 15:26:37,005 - INFO - Finished converting document 8-K_2023-09-01 in 0.03 sec.
2025-11-14 15:26:37,032 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:37,042 - INFO - Going to convert document batch...
2025-11-14 15:26:37,043 - INFO - Processing document 8-K_2023-10-18
2025-11-14 15:

Converted 'data\edgar_documents\ABT\8-K_2023-06-12' --> 'data\processed_data\ABT\8-K_2023-06-12.md'
Converted 'data\edgar_documents\ABT\8-K_2023-07-20' --> 'data\processed_data\ABT\8-K_2023-07-20.md'
Converted 'data\edgar_documents\ABT\8-K_2023-09-01' --> 'data\processed_data\ABT\8-K_2023-09-01.md'
Converted 'data\edgar_documents\ABT\8-K_2023-10-18' --> 'data\processed_data\ABT\8-K_2023-10-18.md'


2025-11-14 15:26:37,094 - INFO - Processing document 8-K_2024-01-24
2025-11-14 15:26:37,109 - INFO - Finished converting document 8-K_2024-01-24 in 0.05 sec.
2025-11-14 15:26:37,138 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:37,149 - INFO - Going to convert document batch...
2025-11-14 15:26:37,150 - INFO - Processing document 8-K_2024-01-29


Converted 'data\edgar_documents\ABT\8-K_2024-01-24' --> 'data\processed_data\ABT\8-K_2024-01-24.md'


2025-11-14 15:26:37,550 - INFO - Finished converting document 8-K_2024-01-29 in 0.42 sec.
2025-11-14 15:26:37,583 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:37,590 - INFO - Going to convert document batch...
2025-11-14 15:26:37,590 - INFO - Processing document 8-K_2024-04-17
2025-11-14 15:26:37,604 - INFO - Finished converting document 8-K_2024-04-17 in 0.05 sec.
2025-11-14 15:26:37,631 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:37,649 - INFO - Going to convert document batch...
2025-11-14 15:26:37,649 - INFO - Processing document 8-K_2024-04-29
2025-11-14 15:26:37,676 - INFO - Finished converting document 8-K_2024-04-29 in 0.06 sec.
2025-11-14 15:26:37,707 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:37,717 - INFO - Going to convert document batch...
2025-11-14 15:26:37,717 - INFO - Processing document 8-K_2024-05-01
2025-11-14 15:26:37,736 - INFO - Finished converting document 8-K_2024-05-01 in 0.

Converted 'data\edgar_documents\ABT\8-K_2024-01-29' --> 'data\processed_data\ABT\8-K_2024-01-29.md'
Converted 'data\edgar_documents\ABT\8-K_2024-04-17' --> 'data\processed_data\ABT\8-K_2024-04-17.md'
Converted 'data\edgar_documents\ABT\8-K_2024-04-29' --> 'data\processed_data\ABT\8-K_2024-04-29.md'


2025-11-14 15:26:37,762 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:37,771 - INFO - Going to convert document batch...
2025-11-14 15:26:37,772 - INFO - Processing document 8-K_2024-07-18
2025-11-14 15:26:37,788 - INFO - Finished converting document 8-K_2024-07-18 in 0.03 sec.
2025-11-14 15:26:37,810 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:37,819 - INFO - Going to convert document batch...
2025-11-14 15:26:37,821 - INFO - Processing document 8-K_2024-10-16
2025-11-14 15:26:37,837 - INFO - Finished converting document 8-K_2024-10-16 in 0.03 sec.
2025-11-14 15:26:37,858 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:37,869 - INFO - Going to convert document batch...
2025-11-14 15:26:37,870 - INFO - Processing document 8-K_2024-11-15
2025-11-14 15:26:37,887 - INFO - Finished converting document 8-K_2024-11-15 in 0.05 sec.
2025-11-14 15:26:37,913 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\ABT\8-K_2024-05-01' --> 'data\processed_data\ABT\8-K_2024-05-01.md'
Converted 'data\edgar_documents\ABT\8-K_2024-07-18' --> 'data\processed_data\ABT\8-K_2024-07-18.md'
Converted 'data\edgar_documents\ABT\8-K_2024-10-16' --> 'data\processed_data\ABT\8-K_2024-10-16.md'
Converted 'data\edgar_documents\ABT\8-K_2024-11-15' --> 'data\processed_data\ABT\8-K_2024-11-15.md'


2025-11-14 15:26:37,961 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:37,969 - INFO - Going to convert document batch...
2025-11-14 15:26:37,970 - INFO - Processing document 8-K_2025-04-16
2025-11-14 15:26:37,987 - INFO - Finished converting document 8-K_2025-04-16 in 0.03 sec.
2025-11-14 15:26:38,009 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:38,030 - INFO - Going to convert document batch...
2025-11-14 15:26:38,031 - INFO - Processing document 8-K_2025-04-28
2025-11-14 15:26:38,062 - INFO - Finished converting document 8-K_2025-04-28 in 0.06 sec.
2025-11-14 15:26:38,094 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:38,103 - INFO - Going to convert document batch...
2025-11-14 15:26:38,104 - INFO - Processing document 8-K_2025-05-01
2025-11-14 15:26:38,120 - INFO - Finished converting document 8-K_2025-05-01 in 0.05 sec.
2025-11-14 15:26:38,144 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABT\8-K_2025-01-22' --> 'data\processed_data\ABT\8-K_2025-01-22.md'
Converted 'data\edgar_documents\ABT\8-K_2025-04-16' --> 'data\processed_data\ABT\8-K_2025-04-16.md'
Converted 'data\edgar_documents\ABT\8-K_2025-04-28' --> 'data\processed_data\ABT\8-K_2025-04-28.md'
Converted 'data\edgar_documents\ABT\8-K_2025-05-01' --> 'data\processed_data\ABT\8-K_2025-05-01.md'


2025-11-14 15:26:38,153 - INFO - Going to convert document batch...
2025-11-14 15:26:38,154 - INFO - Processing document 8-K_2025-07-17
2025-11-14 15:26:38,170 - INFO - Finished converting document 8-K_2025-07-17 in 0.05 sec.
2025-11-14 15:26:38,193 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:38,203 - INFO - Going to convert document batch...
2025-11-14 15:26:38,204 - INFO - Processing document 8-K_2025-10-15
2025-11-14 15:26:38,220 - INFO - Finished converting document 8-K_2025-10-15 in 0.05 sec.
2025-11-14 15:26:38,266 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:26:38,267 - ERROR - Input document DEF-14A_2023-03-17 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputForm

Converted 'data\edgar_documents\ABT\8-K_2025-07-17' --> 'data\processed_data\ABT\8-K_2025-07-17.md'
Converted 'data\edgar_documents\ABT\8-K_2025-10-15' --> 'data\processed_data\ABT\8-K_2025-10-15.md'
Error processing data\edgar_documents\ABT\DEF-14A_2023-03-17: File format not allowed: data\edgar_documents\ABT\DEF-14A_2023-03-17


2025-11-14 15:26:38,708 - INFO - Going to convert document batch...
2025-11-14 15:26:38,709 - INFO - Processing document DEF-14A_2024-03-15
2025-11-14 15:26:44,422 - INFO - Finished converting document DEF-14A_2024-03-15 in 6.16 sec.


Converted 'data\edgar_documents\ABT\DEF-14A_2024-03-15' --> 'data\processed_data\ABT\DEF-14A_2024-03-15.md'


2025-11-14 15:26:45,394 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:26:46,202 - INFO - Going to convert document batch...
2025-11-14 15:26:46,203 - INFO - Processing document DEF-14A_2025-03-14
2025-11-14 15:26:57,389 - INFO - Finished converting document DEF-14A_2025-03-14 in 12.28 sec.
2025-11-14 15:26:58,344 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ABT\DEF-14A_2025-03-14' --> 'data\processed_data\ABT\DEF-14A_2025-03-14.md'
Processed 81 new files. Errors: 1
Found 153 files to process in data\edgar_documents\ACN


2025-11-14 15:26:59,272 - INFO - Going to convert document batch...
2025-11-14 15:26:59,273 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:26:59,274 - INFO - Processing document 10-K_2023-10-12
2025-11-14 15:27:01,081 - INFO - Finished converting document 10-K_2023-10-12 in 2.80 sec.
2025-11-14 15:27:01,788 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\10-K_2023-10-12' --> 'data\processed_data\ACN\10-K_2023-10-12.md'


2025-11-14 15:27:02,663 - INFO - Going to convert document batch...
2025-11-14 15:27:02,664 - INFO - Processing document 10-K_2024-10-10
2025-11-14 15:27:04,496 - INFO - Finished converting document 10-K_2024-10-10 in 2.78 sec.
2025-11-14 15:27:05,229 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\10-K_2024-10-10' --> 'data\processed_data\ACN\10-K_2024-10-10.md'


2025-11-14 15:27:06,273 - INFO - Going to convert document batch...
2025-11-14 15:27:06,274 - INFO - Processing document 10-K_2025-10-10
2025-11-14 15:27:08,122 - INFO - Finished converting document 10-K_2025-10-10 in 2.95 sec.
2025-11-14 15:27:08,858 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\10-K_2025-10-10' --> 'data\processed_data\ACN\10-K_2025-10-10.md'


2025-11-14 15:27:09,221 - INFO - Going to convert document batch...
2025-11-14 15:27:09,221 - INFO - Processing document 10-Q_2023-03-23
2025-11-14 15:27:10,027 - INFO - Finished converting document 10-Q_2023-03-23 in 1.20 sec.
2025-11-14 15:27:10,539 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\10-Q_2023-03-23' --> 'data\processed_data\ACN\10-Q_2023-03-23.md'


2025-11-14 15:27:11,371 - INFO - Going to convert document batch...
2025-11-14 15:27:11,372 - INFO - Processing document 10-Q_2023-06-22
2025-11-14 15:27:12,192 - INFO - Finished converting document 10-Q_2023-06-22 in 1.69 sec.
2025-11-14 15:27:12,649 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\10-Q_2023-06-22' --> 'data\processed_data\ACN\10-Q_2023-06-22.md'


2025-11-14 15:27:12,921 - INFO - Going to convert document batch...
2025-11-14 15:27:12,922 - INFO - Processing document 10-Q_2023-12-19
2025-11-14 15:27:13,498 - INFO - Finished converting document 10-Q_2023-12-19 in 0.89 sec.
2025-11-14 15:27:13,842 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\10-Q_2023-12-19' --> 'data\processed_data\ACN\10-Q_2023-12-19.md'


2025-11-14 15:27:14,541 - INFO - Going to convert document batch...
2025-11-14 15:27:14,542 - INFO - Processing document 10-Q_2024-03-21
2025-11-14 15:27:15,318 - INFO - Finished converting document 10-Q_2024-03-21 in 1.50 sec.
2025-11-14 15:27:15,763 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\10-Q_2024-03-21' --> 'data\processed_data\ACN\10-Q_2024-03-21.md'


2025-11-14 15:27:16,104 - INFO - Going to convert document batch...
2025-11-14 15:27:16,105 - INFO - Processing document 10-Q_2024-06-20
2025-11-14 15:27:17,180 - INFO - Finished converting document 10-Q_2024-06-20 in 1.44 sec.
2025-11-14 15:27:17,612 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\10-Q_2024-06-20' --> 'data\processed_data\ACN\10-Q_2024-06-20.md'


2025-11-14 15:27:17,877 - INFO - Going to convert document batch...
2025-11-14 15:27:17,878 - INFO - Processing document 10-Q_2024-12-19
2025-11-14 15:27:18,477 - INFO - Finished converting document 10-Q_2024-12-19 in 0.89 sec.
2025-11-14 15:27:18,831 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\10-Q_2024-12-19' --> 'data\processed_data\ACN\10-Q_2024-12-19.md'


2025-11-14 15:27:19,183 - INFO - Going to convert document batch...
2025-11-14 15:27:19,183 - INFO - Processing document 10-Q_2025-03-20
2025-11-14 15:27:20,359 - INFO - Finished converting document 10-Q_2025-03-20 in 1.56 sec.
2025-11-14 15:27:20,816 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\10-Q_2025-03-20' --> 'data\processed_data\ACN\10-Q_2025-03-20.md'


2025-11-14 15:27:21,162 - INFO - Going to convert document batch...
2025-11-14 15:27:21,163 - INFO - Processing document 10-Q_2025-06-20
2025-11-14 15:27:21,934 - INFO - Finished converting document 10-Q_2025-06-20 in 1.16 sec.
2025-11-14 15:27:22,369 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:22,376 - INFO - Going to convert document batch...
2025-11-14 15:27:22,377 - INFO - Processing document 4_2023-01-04
2025-11-14 15:27:22,397 - INFO - Finished converting document 4_2023-01-04 in 0.05 sec.
2025-11-14 15:27:22,436 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:22,445 - INFO - Going to convert document batch...
2025-11-14 15:27:22,448 - INFO - Processing document 4_2023-01-09
2025-11-14 15:27:22,472 - INFO - Finished converting document 4_2023-01-09 in 0.05 sec.
2025-11-14 15:27:22,507 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:22,516 - INFO - Going to convert document batch...
2025-11-14 15:27:22,

Converted 'data\edgar_documents\ACN\10-Q_2025-06-20' --> 'data\processed_data\ACN\10-Q_2025-06-20.md'
Converted 'data\edgar_documents\ACN\4_2023-01-04' --> 'data\processed_data\ACN\4_2023-01-04.md'
Converted 'data\edgar_documents\ACN\4_2023-01-09' --> 'data\processed_data\ACN\4_2023-01-09.md'


2025-11-14 15:27:22,539 - INFO - Finished converting document 4_2023-01-17 in 0.05 sec.
2025-11-14 15:27:22,576 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:22,585 - INFO - Going to convert document batch...
2025-11-14 15:27:22,586 - INFO - Processing document 4_2023-01-18
2025-11-14 15:27:22,612 - INFO - Finished converting document 4_2023-01-18 in 0.05 sec.
2025-11-14 15:27:22,650 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:22,662 - INFO - Going to convert document batch...
2025-11-14 15:27:22,663 - INFO - Processing document 4_2023-01-23
2025-11-14 15:27:22,691 - INFO - Finished converting document 4_2023-01-23 in 0.05 sec.
2025-11-14 15:27:22,731 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:22,741 - INFO - Going to convert document batch...
2025-11-14 15:27:22,742 - INFO - Processing document 4_2023-01-24


Converted 'data\edgar_documents\ACN\4_2023-01-17' --> 'data\processed_data\ACN\4_2023-01-17.md'
Converted 'data\edgar_documents\ACN\4_2023-01-18' --> 'data\processed_data\ACN\4_2023-01-18.md'
Converted 'data\edgar_documents\ACN\4_2023-01-23' --> 'data\processed_data\ACN\4_2023-01-23.md'


2025-11-14 15:27:22,766 - INFO - Finished converting document 4_2023-01-24 in 0.05 sec.
2025-11-14 15:27:22,809 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:22,817 - INFO - Going to convert document batch...
2025-11-14 15:27:22,818 - INFO - Processing document 4_2023-01-30
2025-11-14 15:27:22,835 - INFO - Finished converting document 4_2023-01-30 in 0.03 sec.
2025-11-14 15:27:22,865 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:22,873 - INFO - Going to convert document batch...
2025-11-14 15:27:22,873 - INFO - Processing document 4_2023-02-02
2025-11-14 15:27:22,928 - INFO - Finished converting document 4_2023-02-02 in 0.08 sec.
2025-11-14 15:27:22,964 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:22,971 - INFO - Going to convert document batch...
2025-11-14 15:27:22,972 - INFO - Processing document 4_2023-02-03


Converted 'data\edgar_documents\ACN\4_2023-01-24' --> 'data\processed_data\ACN\4_2023-01-24.md'
Converted 'data\edgar_documents\ACN\4_2023-01-30' --> 'data\processed_data\ACN\4_2023-01-30.md'
Converted 'data\edgar_documents\ACN\4_2023-02-02' --> 'data\processed_data\ACN\4_2023-02-02.md'


2025-11-14 15:27:22,992 - INFO - Finished converting document 4_2023-02-03 in 0.03 sec.
2025-11-14 15:27:23,024 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:23,033 - INFO - Going to convert document batch...
2025-11-14 15:27:23,034 - INFO - Processing document 4_2023-02-06
2025-11-14 15:27:23,055 - INFO - Finished converting document 4_2023-02-06 in 0.03 sec.
2025-11-14 15:27:23,089 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:23,097 - INFO - Going to convert document batch...
2025-11-14 15:27:23,098 - INFO - Processing document 4_2023-02-17
2025-11-14 15:27:23,118 - INFO - Finished converting document 4_2023-02-17 in 0.03 sec.
2025-11-14 15:27:23,152 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:23,159 - INFO - Going to convert document batch...
2025-11-14 15:27:23,159 - INFO - Processing document 4_2023-03-07
2025-11-14 15:27:23,178 - INFO - Finished converting document 4_2023-03-07 in 0.03 sec.


Converted 'data\edgar_documents\ACN\4_2023-02-03' --> 'data\processed_data\ACN\4_2023-02-03.md'
Converted 'data\edgar_documents\ACN\4_2023-02-06' --> 'data\processed_data\ACN\4_2023-02-06.md'
Converted 'data\edgar_documents\ACN\4_2023-02-17' --> 'data\processed_data\ACN\4_2023-02-17.md'


2025-11-14 15:27:23,214 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:23,223 - INFO - Going to convert document batch...
2025-11-14 15:27:23,224 - INFO - Processing document 4_2023-03-30
2025-11-14 15:27:23,246 - INFO - Finished converting document 4_2023-03-30 in 0.05 sec.
2025-11-14 15:27:23,287 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:23,295 - INFO - Going to convert document batch...
2025-11-14 15:27:23,296 - INFO - Processing document 4_2023-04-06
2025-11-14 15:27:23,319 - INFO - Finished converting document 4_2023-04-06 in 0.05 sec.
2025-11-14 15:27:23,357 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:23,368 - INFO - Going to convert document batch...
2025-11-14 15:27:23,370 - INFO - Processing document 4_2023-04-18
2025-11-14 15:27:23,396 - INFO - Finished converting document 4_2023-04-18 in 0.05 sec.


Converted 'data\edgar_documents\ACN\4_2023-03-07' --> 'data\processed_data\ACN\4_2023-03-07.md'
Converted 'data\edgar_documents\ACN\4_2023-03-30' --> 'data\processed_data\ACN\4_2023-03-30.md'
Converted 'data\edgar_documents\ACN\4_2023-04-06' --> 'data\processed_data\ACN\4_2023-04-06.md'


2025-11-14 15:27:23,439 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:23,448 - INFO - Going to convert document batch...
2025-11-14 15:27:23,450 - INFO - Processing document 4_2023-04-24
2025-11-14 15:27:23,473 - INFO - Finished converting document 4_2023-04-24 in 0.05 sec.
2025-11-14 15:27:23,512 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:23,521 - INFO - Going to convert document batch...
2025-11-14 15:27:23,522 - INFO - Processing document 4_2023-04-25
2025-11-14 15:27:23,543 - INFO - Finished converting document 4_2023-04-25 in 0.05 sec.
2025-11-14 15:27:23,586 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:23,593 - INFO - Going to convert document batch...
2025-11-14 15:27:23,594 - INFO - Processing document 4_2023-05-02


Converted 'data\edgar_documents\ACN\4_2023-04-18' --> 'data\processed_data\ACN\4_2023-04-18.md'
Converted 'data\edgar_documents\ACN\4_2023-04-24' --> 'data\processed_data\ACN\4_2023-04-24.md'
Converted 'data\edgar_documents\ACN\4_2023-04-25' --> 'data\processed_data\ACN\4_2023-04-25.md'


2025-11-14 15:27:23,612 - INFO - Finished converting document 4_2023-05-02 in 0.03 sec.
2025-11-14 15:27:23,652 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:23,660 - INFO - Going to convert document batch...
2025-11-14 15:27:23,661 - INFO - Processing document 4_2023-05-08
2025-11-14 15:27:23,683 - INFO - Finished converting document 4_2023-05-08 in 0.05 sec.
2025-11-14 15:27:23,736 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:23,746 - INFO - Going to convert document batch...
2025-11-14 15:27:23,747 - INFO - Processing document 4_2023-05-16
2025-11-14 15:27:23,765 - INFO - Finished converting document 4_2023-05-16 in 0.06 sec.
2025-11-14 15:27:23,805 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:23,814 - INFO - Going to convert document batch...
2025-11-14 15:27:23,815 - INFO - Processing document 4_2023-06-06
2025-11-14 15:27:23,836 - INFO - Finished converting document 4_2023-06-06 in 0.03 sec.


Converted 'data\edgar_documents\ACN\4_2023-05-02' --> 'data\processed_data\ACN\4_2023-05-02.md'
Converted 'data\edgar_documents\ACN\4_2023-05-08' --> 'data\processed_data\ACN\4_2023-05-08.md'
Converted 'data\edgar_documents\ACN\4_2023-05-16' --> 'data\processed_data\ACN\4_2023-05-16.md'


2025-11-14 15:27:23,874 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:23,882 - INFO - Going to convert document batch...
2025-11-14 15:27:23,883 - INFO - Processing document 4_2023-06-27
2025-11-14 15:27:23,904 - INFO - Finished converting document 4_2023-06-27 in 0.05 sec.
2025-11-14 15:27:23,942 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:23,950 - INFO - Going to convert document batch...
2025-11-14 15:27:23,951 - INFO - Processing document 4_2023-07-06
2025-11-14 15:27:23,971 - INFO - Finished converting document 4_2023-07-06 in 0.05 sec.
2025-11-14 15:27:24,014 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:24,023 - INFO - Going to convert document batch...
2025-11-14 15:27:24,024 - INFO - Processing document 4_2023-07-17
2025-11-14 15:27:24,050 - INFO - Finished converting document 4_2023-07-17 in 0.05 sec.


Converted 'data\edgar_documents\ACN\4_2023-06-06' --> 'data\processed_data\ACN\4_2023-06-06.md'
Converted 'data\edgar_documents\ACN\4_2023-06-27' --> 'data\processed_data\ACN\4_2023-06-27.md'
Converted 'data\edgar_documents\ACN\4_2023-07-06' --> 'data\processed_data\ACN\4_2023-07-06.md'


2025-11-14 15:27:24,089 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:24,100 - INFO - Going to convert document batch...
2025-11-14 15:27:24,100 - INFO - Processing document 4_2023-07-24
2025-11-14 15:27:24,126 - INFO - Finished converting document 4_2023-07-24 in 0.05 sec.
2025-11-14 15:27:24,165 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:24,174 - INFO - Going to convert document batch...
2025-11-14 15:27:24,175 - INFO - Processing document 4_2023-07-28
2025-11-14 15:27:24,201 - INFO - Finished converting document 4_2023-07-28 in 0.05 sec.
2025-11-14 15:27:24,239 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:24,250 - INFO - Going to convert document batch...
2025-11-14 15:27:24,251 - INFO - Processing document 4_2023-08-08


Converted 'data\edgar_documents\ACN\4_2023-07-17' --> 'data\processed_data\ACN\4_2023-07-17.md'
Converted 'data\edgar_documents\ACN\4_2023-07-24' --> 'data\processed_data\ACN\4_2023-07-24.md'
Converted 'data\edgar_documents\ACN\4_2023-07-28' --> 'data\processed_data\ACN\4_2023-07-28.md'


2025-11-14 15:27:24,624 - INFO - Finished converting document 4_2023-08-08 in 0.41 sec.
2025-11-14 15:27:24,686 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:24,696 - INFO - Going to convert document batch...
2025-11-14 15:27:24,697 - INFO - Processing document 4_2023-08-16
2025-11-14 15:27:24,715 - INFO - Finished converting document 4_2023-08-16 in 0.06 sec.
2025-11-14 15:27:24,748 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:24,756 - INFO - Going to convert document batch...
2025-11-14 15:27:24,756 - INFO - Processing document 4_2023-09-07
2025-11-14 15:27:24,775 - INFO - Finished converting document 4_2023-09-07 in 0.03 sec.
2025-11-14 15:27:24,813 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:24,822 - INFO - Going to convert document batch...
2025-11-14 15:27:24,822 - INFO - Processing document 4_2023-09-14


Converted 'data\edgar_documents\ACN\4_2023-08-08' --> 'data\processed_data\ACN\4_2023-08-08.md'
Converted 'data\edgar_documents\ACN\4_2023-08-16' --> 'data\processed_data\ACN\4_2023-08-16.md'
Converted 'data\edgar_documents\ACN\4_2023-09-07' --> 'data\processed_data\ACN\4_2023-09-07.md'


2025-11-14 15:27:24,845 - INFO - Finished converting document 4_2023-09-14 in 0.05 sec.
2025-11-14 15:27:24,883 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:24,898 - INFO - Going to convert document batch...
2025-11-14 15:27:24,899 - INFO - Processing document 4_2023-10-10
2025-11-14 15:27:24,918 - INFO - Finished converting document 4_2023-10-10 in 0.06 sec.
2025-11-14 15:27:24,951 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:24,963 - INFO - Going to convert document batch...
2025-11-14 15:27:24,964 - INFO - Processing document 4_2023-10-16
2025-11-14 15:27:24,991 - INFO - Finished converting document 4_2023-10-16 in 0.05 sec.
2025-11-14 15:27:25,034 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:25,042 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ACN\4_2023-09-14' --> 'data\processed_data\ACN\4_2023-09-14.md'
Converted 'data\edgar_documents\ACN\4_2023-10-10' --> 'data\processed_data\ACN\4_2023-10-10.md'
Converted 'data\edgar_documents\ACN\4_2023-10-16' --> 'data\processed_data\ACN\4_2023-10-16.md'


2025-11-14 15:27:25,043 - INFO - Processing document 4_2023-10-20
2025-11-14 15:27:25,065 - INFO - Finished converting document 4_2023-10-20 in 0.05 sec.
2025-11-14 15:27:25,109 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:25,122 - INFO - Going to convert document batch...
2025-11-14 15:27:25,122 - INFO - Processing document 4_2023-10-23
2025-11-14 15:27:25,151 - INFO - Finished converting document 4_2023-10-23 in 0.06 sec.
2025-11-14 15:27:25,190 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:25,200 - INFO - Going to convert document batch...
2025-11-14 15:27:25,200 - INFO - Processing document 4_2023-10-24
2025-11-14 15:27:25,225 - INFO - Finished converting document 4_2023-10-24 in 0.05 sec.
2025-11-14 15:27:25,279 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\4_2023-10-20' --> 'data\processed_data\ACN\4_2023-10-20.md'
Converted 'data\edgar_documents\ACN\4_2023-10-23' --> 'data\processed_data\ACN\4_2023-10-23.md'
Converted 'data\edgar_documents\ACN\4_2023-10-24' --> 'data\processed_data\ACN\4_2023-10-24.md'


2025-11-14 15:27:25,300 - INFO - Going to convert document batch...
2025-11-14 15:27:25,302 - INFO - Processing document 4_2023-10-25
2025-11-14 15:27:25,326 - INFO - Finished converting document 4_2023-10-25 in 0.08 sec.
2025-11-14 15:27:25,366 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:25,377 - INFO - Going to convert document batch...
2025-11-14 15:27:25,377 - INFO - Processing document 4_2023-10-31
2025-11-14 15:27:25,400 - INFO - Finished converting document 4_2023-10-31 in 0.05 sec.
2025-11-14 15:27:25,434 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:25,442 - INFO - Going to convert document batch...
2025-11-14 15:27:25,443 - INFO - Processing document 4_2023-11-02
2025-11-14 15:27:25,485 - INFO - Finished converting document 4_2023-11-02 in 0.06 sec.
2025-11-14 15:27:25,525 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:25,532 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ACN\4_2023-10-25' --> 'data\processed_data\ACN\4_2023-10-25.md'
Converted 'data\edgar_documents\ACN\4_2023-10-31' --> 'data\processed_data\ACN\4_2023-10-31.md'
Converted 'data\edgar_documents\ACN\4_2023-11-02' --> 'data\processed_data\ACN\4_2023-11-02.md'


2025-11-14 15:27:25,533 - INFO - Processing document 4_2023-11-06
2025-11-14 15:27:25,553 - INFO - Finished converting document 4_2023-11-06 in 0.03 sec.
2025-11-14 15:27:25,589 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:25,600 - INFO - Going to convert document batch...
2025-11-14 15:27:25,601 - INFO - Processing document 4_2023-11-13
2025-11-14 15:27:25,627 - INFO - Finished converting document 4_2023-11-13 in 0.05 sec.
2025-11-14 15:27:25,667 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:25,675 - INFO - Going to convert document batch...
2025-11-14 15:27:25,675 - INFO - Processing document 4_2023-11-16
2025-11-14 15:27:25,697 - INFO - Finished converting document 4_2023-11-16 in 0.03 sec.
2025-11-14 15:27:25,731 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:25,738 - INFO - Going to convert document batch...
2025-11-14 15:27:25,739 - INFO - Processing document 4_2023-12-06
2025-11-14 15:27:25,757 - IN

Converted 'data\edgar_documents\ACN\4_2023-11-06' --> 'data\processed_data\ACN\4_2023-11-06.md'
Converted 'data\edgar_documents\ACN\4_2023-11-13' --> 'data\processed_data\ACN\4_2023-11-13.md'
Converted 'data\edgar_documents\ACN\4_2023-11-16' --> 'data\processed_data\ACN\4_2023-11-16.md'


2025-11-14 15:27:25,802 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:25,814 - INFO - Going to convert document batch...
2025-11-14 15:27:25,816 - INFO - Processing document 4_2023-12-26
2025-11-14 15:27:25,842 - INFO - Finished converting document 4_2023-12-26 in 0.06 sec.
2025-11-14 15:27:25,879 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:25,887 - INFO - Going to convert document batch...
2025-11-14 15:27:25,888 - INFO - Processing document 4_2023-12-28
2025-11-14 15:27:25,908 - INFO - Finished converting document 4_2023-12-28 in 0.05 sec.
2025-11-14 15:27:25,945 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:25,955 - INFO - Going to convert document batch...
2025-11-14 15:27:25,955 - INFO - Processing document 4_2024-01-03


Converted 'data\edgar_documents\ACN\4_2023-12-06' --> 'data\processed_data\ACN\4_2023-12-06.md'
Converted 'data\edgar_documents\ACN\4_2023-12-26' --> 'data\processed_data\ACN\4_2023-12-26.md'
Converted 'data\edgar_documents\ACN\4_2023-12-28' --> 'data\processed_data\ACN\4_2023-12-28.md'


2025-11-14 15:27:25,975 - INFO - Finished converting document 4_2024-01-03 in 0.03 sec.
2025-11-14 15:27:26,009 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:26,020 - INFO - Going to convert document batch...
2025-11-14 15:27:26,021 - INFO - Processing document 4_2024-01-08
2025-11-14 15:27:26,041 - INFO - Finished converting document 4_2024-01-08 in 0.03 sec.
2025-11-14 15:27:26,074 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:26,084 - INFO - Going to convert document batch...
2025-11-14 15:27:26,086 - INFO - Processing document 4_2024-01-22
2025-11-14 15:27:26,115 - INFO - Finished converting document 4_2024-01-22 in 0.05 sec.
2025-11-14 15:27:26,151 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:26,160 - INFO - Going to convert document batch...
2025-11-14 15:27:26,161 - INFO - Processing document 4_2024-01-29
2025-11-14 15:27:26,185 - INFO - Finished converting document 4_2024-01-29 in 0.05 sec.


Converted 'data\edgar_documents\ACN\4_2024-01-03' --> 'data\processed_data\ACN\4_2024-01-03.md'
Converted 'data\edgar_documents\ACN\4_2024-01-08' --> 'data\processed_data\ACN\4_2024-01-08.md'
Converted 'data\edgar_documents\ACN\4_2024-01-22' --> 'data\processed_data\ACN\4_2024-01-22.md'


2025-11-14 15:27:26,220 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:26,235 - INFO - Going to convert document batch...
2025-11-14 15:27:26,236 - INFO - Processing document 4_2024-01-30
2025-11-14 15:27:26,257 - INFO - Finished converting document 4_2024-01-30 in 0.05 sec.
2025-11-14 15:27:26,302 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:26,309 - INFO - Going to convert document batch...
2025-11-14 15:27:26,310 - INFO - Processing document 4_2024-02-01
2025-11-14 15:27:26,330 - INFO - Finished converting document 4_2024-02-01 in 0.05 sec.
2025-11-14 15:27:26,364 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:26,373 - INFO - Going to convert document batch...
2025-11-14 15:27:26,374 - INFO - Processing document 4_2024-02-05


Converted 'data\edgar_documents\ACN\4_2024-01-29' --> 'data\processed_data\ACN\4_2024-01-29.md'
Converted 'data\edgar_documents\ACN\4_2024-01-30' --> 'data\processed_data\ACN\4_2024-01-30.md'
Converted 'data\edgar_documents\ACN\4_2024-02-01' --> 'data\processed_data\ACN\4_2024-02-01.md'


2025-11-14 15:27:26,395 - INFO - Finished converting document 4_2024-02-05 in 0.05 sec.
2025-11-14 15:27:26,433 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:26,441 - INFO - Going to convert document batch...
2025-11-14 15:27:26,442 - INFO - Processing document 4_2024-02-06
2025-11-14 15:27:26,464 - INFO - Finished converting document 4_2024-02-06 in 0.05 sec.
2025-11-14 15:27:26,515 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:26,524 - INFO - Going to convert document batch...
2025-11-14 15:27:26,525 - INFO - Processing document 4_2024-02-12
2025-11-14 15:27:26,544 - INFO - Finished converting document 4_2024-02-12 in 0.06 sec.
2025-11-14 15:27:26,594 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:26,608 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ACN\4_2024-02-05' --> 'data\processed_data\ACN\4_2024-02-05.md'
Converted 'data\edgar_documents\ACN\4_2024-02-06' --> 'data\processed_data\ACN\4_2024-02-06.md'
Converted 'data\edgar_documents\ACN\4_2024-02-12' --> 'data\processed_data\ACN\4_2024-02-12.md'


2025-11-14 15:27:26,608 - INFO - Processing document 4_2024-02-20
2025-11-14 15:27:26,630 - INFO - Finished converting document 4_2024-02-20 in 0.06 sec.
2025-11-14 15:27:26,663 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:26,672 - INFO - Going to convert document batch...
2025-11-14 15:27:26,673 - INFO - Processing document 4_2024-03-07
2025-11-14 15:27:26,692 - INFO - Finished converting document 4_2024-03-07 in 0.03 sec.
2025-11-14 15:27:26,742 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:26,754 - INFO - Going to convert document batch...
2025-11-14 15:27:26,755 - INFO - Processing document 4_2024-03-26
2025-11-14 15:27:26,783 - INFO - Finished converting document 4_2024-03-26 in 0.08 sec.
2025-11-14 15:27:26,838 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\4_2024-02-20' --> 'data\processed_data\ACN\4_2024-02-20.md'
Converted 'data\edgar_documents\ACN\4_2024-03-07' --> 'data\processed_data\ACN\4_2024-03-07.md'
Converted 'data\edgar_documents\ACN\4_2024-03-26' --> 'data\processed_data\ACN\4_2024-03-26.md'


2025-11-14 15:27:26,851 - INFO - Going to convert document batch...
2025-11-14 15:27:26,851 - INFO - Processing document 4_2024-04-08
2025-11-14 15:27:26,872 - INFO - Finished converting document 4_2024-04-08 in 0.06 sec.
2025-11-14 15:27:26,907 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:26,918 - INFO - Going to convert document batch...
2025-11-14 15:27:26,918 - INFO - Processing document 4_2024-04-16
2025-11-14 15:27:26,945 - INFO - Finished converting document 4_2024-04-16 in 0.05 sec.
2025-11-14 15:27:26,984 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:26,994 - INFO - Going to convert document batch...
2025-11-14 15:27:26,996 - INFO - Processing document 4_2024-04-22
2025-11-14 15:27:27,022 - INFO - Finished converting document 4_2024-04-22 in 0.05 sec.
2025-11-14 15:27:27,058 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:27,068 - INFO - Going to convert document batch...
2025-11-14 15:27:27,069 - 

Converted 'data\edgar_documents\ACN\4_2024-04-08' --> 'data\processed_data\ACN\4_2024-04-08.md'
Converted 'data\edgar_documents\ACN\4_2024-04-16' --> 'data\processed_data\ACN\4_2024-04-16.md'
Converted 'data\edgar_documents\ACN\4_2024-04-22' --> 'data\processed_data\ACN\4_2024-04-22.md'


2025-11-14 15:27:27,093 - INFO - Finished converting document 4_2024-04-26 in 0.05 sec.
2025-11-14 15:27:27,136 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:27,144 - INFO - Going to convert document batch...
2025-11-14 15:27:27,145 - INFO - Processing document 4_2024-05-03
2025-11-14 15:27:27,165 - INFO - Finished converting document 4_2024-05-03 in 0.03 sec.
2025-11-14 15:27:27,199 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:27,206 - INFO - Going to convert document batch...
2025-11-14 15:27:27,207 - INFO - Processing document 4_2024-05-06
2025-11-14 15:27:27,225 - INFO - Finished converting document 4_2024-05-06 in 0.03 sec.
2025-11-14 15:27:27,277 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:27,293 - INFO - Going to convert document batch...
2025-11-14 15:27:27,295 - INFO - Processing document 4_2024-05-14
2025-11-14 15:27:27,321 - INFO - Finished converting document 4_2024-05-14 in 0.06 sec.


Converted 'data\edgar_documents\ACN\4_2024-04-26' --> 'data\processed_data\ACN\4_2024-04-26.md'
Converted 'data\edgar_documents\ACN\4_2024-05-03' --> 'data\processed_data\ACN\4_2024-05-03.md'
Converted 'data\edgar_documents\ACN\4_2024-05-06' --> 'data\processed_data\ACN\4_2024-05-06.md'


2025-11-14 15:27:27,357 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:27,366 - INFO - Going to convert document batch...
2025-11-14 15:27:27,367 - INFO - Processing document 4_2024-05-17
2025-11-14 15:27:27,386 - INFO - Finished converting document 4_2024-05-17 in 0.05 sec.
2025-11-14 15:27:27,433 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:27,442 - INFO - Going to convert document batch...
2025-11-14 15:27:27,443 - INFO - Processing document 4_2024-06-06
2025-11-14 15:27:27,463 - INFO - Finished converting document 4_2024-06-06 in 0.06 sec.
2025-11-14 15:27:27,498 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:27,507 - INFO - Going to convert document batch...
2025-11-14 15:27:27,508 - INFO - Processing document 4_2024-07-08
2025-11-14 15:27:27,533 - INFO - Finished converting document 4_2024-07-08 in 0.05 sec.


Converted 'data\edgar_documents\ACN\4_2024-05-14' --> 'data\processed_data\ACN\4_2024-05-14.md'
Converted 'data\edgar_documents\ACN\4_2024-05-17' --> 'data\processed_data\ACN\4_2024-05-17.md'
Converted 'data\edgar_documents\ACN\4_2024-06-06' --> 'data\processed_data\ACN\4_2024-06-06.md'


2025-11-14 15:27:27,566 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:27,574 - INFO - Going to convert document batch...
2025-11-14 15:27:27,576 - INFO - Processing document 4_2024-07-15
2025-11-14 15:27:27,606 - INFO - Finished converting document 4_2024-07-15 in 0.06 sec.
2025-11-14 15:27:27,639 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:27,648 - INFO - Going to convert document batch...
2025-11-14 15:27:27,649 - INFO - Processing document 4_2024-07-23
2025-11-14 15:27:27,672 - INFO - Finished converting document 4_2024-07-23 in 0.05 sec.
2025-11-14 15:27:27,706 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:27,717 - INFO - Going to convert document batch...
2025-11-14 15:27:27,718 - INFO - Processing document 4_2024-07-24


Converted 'data\edgar_documents\ACN\4_2024-07-08' --> 'data\processed_data\ACN\4_2024-07-08.md'
Converted 'data\edgar_documents\ACN\4_2024-07-15' --> 'data\processed_data\ACN\4_2024-07-15.md'
Converted 'data\edgar_documents\ACN\4_2024-07-23' --> 'data\processed_data\ACN\4_2024-07-23.md'


2025-11-14 15:27:27,742 - INFO - Finished converting document 4_2024-07-24 in 0.05 sec.
2025-11-14 15:27:27,807 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:27,818 - INFO - Going to convert document batch...
2025-11-14 15:27:27,820 - INFO - Processing document 4_2024-08-06
2025-11-14 15:27:27,847 - INFO - Finished converting document 4_2024-08-06 in 0.06 sec.
2025-11-14 15:27:27,883 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:27,889 - INFO - Going to convert document batch...
2025-11-14 15:27:27,890 - INFO - Processing document 4_2024-08-16
2025-11-14 15:27:27,910 - INFO - Finished converting document 4_2024-08-16 in 0.03 sec.
2025-11-14 15:27:27,962 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:27,970 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ACN\4_2024-07-24' --> 'data\processed_data\ACN\4_2024-07-24.md'
Converted 'data\edgar_documents\ACN\4_2024-08-06' --> 'data\processed_data\ACN\4_2024-08-06.md'
Converted 'data\edgar_documents\ACN\4_2024-08-16' --> 'data\processed_data\ACN\4_2024-08-16.md'


2025-11-14 15:27:27,971 - INFO - Processing document 4_2024-09-06
2025-11-14 15:27:27,990 - INFO - Finished converting document 4_2024-09-06 in 0.05 sec.
2025-11-14 15:27:28,040 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:27:28,040 - ERROR - Input document 4_2024-10-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:27:28,042 - INFO - Going to convert document batch...
2025-11-14 15:27:28,102 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-1

Converted 'data\edgar_documents\ACN\4_2024-09-06' --> 'data\processed_data\ACN\4_2024-09-06.md'
Error processing data\edgar_documents\ACN\4_2024-10-01: File format not allowed: data\edgar_documents\ACN\4_2024-10-01
Error processing data\edgar_documents\ACN\4_2024-10-03: File format not allowed: data\edgar_documents\ACN\4_2024-10-03
Converted 'data\edgar_documents\ACN\4_2024-10-07' --> 'data\processed_data\ACN\4_2024-10-07.md'


2025-11-14 15:27:28,251 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:28,261 - INFO - Going to convert document batch...
2025-11-14 15:27:28,262 - INFO - Processing document 4_2024-10-18
2025-11-14 15:27:28,286 - INFO - Finished converting document 4_2024-10-18 in 0.05 sec.
2025-11-14 15:27:28,326 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:28,336 - INFO - Going to convert document batch...
2025-11-14 15:27:28,337 - INFO - Processing document 4_2024-10-22
2025-11-14 15:27:28,360 - INFO - Finished converting document 4_2024-10-22 in 0.05 sec.
2025-11-14 15:27:28,402 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:28,420 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ACN\4_2024-10-16' --> 'data\processed_data\ACN\4_2024-10-16.md'
Converted 'data\edgar_documents\ACN\4_2024-10-18' --> 'data\processed_data\ACN\4_2024-10-18.md'
Converted 'data\edgar_documents\ACN\4_2024-10-22' --> 'data\processed_data\ACN\4_2024-10-22.md'


2025-11-14 15:27:28,421 - INFO - Processing document 4_2024-10-23
2025-11-14 15:27:28,455 - INFO - Finished converting document 4_2024-10-23 in 0.08 sec.
2025-11-14 15:27:28,491 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:28,503 - INFO - Going to convert document batch...
2025-11-14 15:27:28,503 - INFO - Processing document 4_2024-10-24
2025-11-14 15:27:28,526 - INFO - Finished converting document 4_2024-10-24 in 0.05 sec.
2025-11-14 15:27:28,565 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:28,575 - INFO - Going to convert document batch...
2025-11-14 15:27:28,576 - INFO - Processing document 4_2024-10-29
2025-11-14 15:27:28,604 - INFO - Finished converting document 4_2024-10-29 in 0.06 sec.
2025-11-14 15:27:28,646 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:28,658 - INFO - Going to convert document batch...
2025-11-14 15:27:28,658 - INFO - Processing document 4_2024-11-05
2025-11-14 15:27:28,686 - IN

Converted 'data\edgar_documents\ACN\4_2024-10-23' --> 'data\processed_data\ACN\4_2024-10-23.md'
Converted 'data\edgar_documents\ACN\4_2024-10-24' --> 'data\processed_data\ACN\4_2024-10-24.md'
Converted 'data\edgar_documents\ACN\4_2024-10-29' --> 'data\processed_data\ACN\4_2024-10-29.md'


2025-11-14 15:27:28,724 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:28,733 - INFO - Going to convert document batch...
2025-11-14 15:27:28,734 - INFO - Processing document 4_2024-11-06
2025-11-14 15:27:28,753 - INFO - Finished converting document 4_2024-11-06 in 0.03 sec.
2025-11-14 15:27:28,788 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:28,797 - INFO - Going to convert document batch...
2025-11-14 15:27:28,798 - INFO - Processing document 4_2024-11-19
2025-11-14 15:27:28,819 - INFO - Finished converting document 4_2024-11-19 in 0.05 sec.
2025-11-14 15:27:28,852 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:28,860 - INFO - Going to convert document batch...
2025-11-14 15:27:28,862 - INFO - Processing document 4_2024-12-03
2025-11-14 15:27:28,882 - INFO - Finished converting document 4_2024-12-03 in 0.03 sec.
2025-11-14 15:27:28,931 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\4_2024-11-05' --> 'data\processed_data\ACN\4_2024-11-05.md'
Converted 'data\edgar_documents\ACN\4_2024-11-06' --> 'data\processed_data\ACN\4_2024-11-06.md'
Converted 'data\edgar_documents\ACN\4_2024-11-19' --> 'data\processed_data\ACN\4_2024-11-19.md'
Converted 'data\edgar_documents\ACN\4_2024-12-03' --> 'data\processed_data\ACN\4_2024-12-03.md'


2025-11-14 15:27:28,940 - INFO - Going to convert document batch...
2025-11-14 15:27:28,941 - INFO - Processing document 4_2024-12-06
2025-11-14 15:27:28,963 - INFO - Finished converting document 4_2024-12-06 in 0.06 sec.
2025-11-14 15:27:29,000 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\4_2024-12-06' --> 'data\processed_data\ACN\4_2024-12-06.md'


2025-11-14 15:27:29,251 - INFO - Going to convert document batch...
2025-11-14 15:27:29,251 - INFO - Processing document 4_2024-12-23
2025-11-14 15:27:29,273 - INFO - Finished converting document 4_2024-12-23 in 0.28 sec.
2025-11-14 15:27:29,318 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:29,326 - INFO - Going to convert document batch...
2025-11-14 15:27:29,328 - INFO - Processing document 4_2025-01-03
2025-11-14 15:27:29,348 - INFO - Finished converting document 4_2025-01-03 in 0.05 sec.
2025-11-14 15:27:29,381 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:29,389 - INFO - Going to convert document batch...
2025-11-14 15:27:29,390 - INFO - Processing document 4_2025-01-06
2025-11-14 15:27:29,413 - INFO - Finished converting document 4_2025-01-06 in 0.05 sec.
2025-11-14 15:27:29,466 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:29,475 - INFO - Going to convert document batch...
2025-11-14 15:27:29,476 - 

Converted 'data\edgar_documents\ACN\4_2024-12-23' --> 'data\processed_data\ACN\4_2024-12-23.md'
Converted 'data\edgar_documents\ACN\4_2025-01-03' --> 'data\processed_data\ACN\4_2025-01-03.md'
Converted 'data\edgar_documents\ACN\4_2025-01-06' --> 'data\processed_data\ACN\4_2025-01-06.md'


2025-11-14 15:27:29,501 - INFO - Finished converting document 4_2025-01-21 in 0.06 sec.
2025-11-14 15:27:29,542 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:29,555 - INFO - Going to convert document batch...
2025-11-14 15:27:29,555 - INFO - Processing document 4_2025-01-22
2025-11-14 15:27:29,585 - INFO - Finished converting document 4_2025-01-22 in 0.05 sec.
2025-11-14 15:27:29,624 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:29,635 - INFO - Going to convert document batch...
2025-11-14 15:27:29,636 - INFO - Processing document 4_2025-01-27
2025-11-14 15:27:29,662 - INFO - Finished converting document 4_2025-01-27 in 0.05 sec.
2025-11-14 15:27:29,702 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:29,709 - INFO - Going to convert document batch...
2025-11-14 15:27:29,711 - INFO - Processing document 4_2025-02-04


Converted 'data\edgar_documents\ACN\4_2025-01-21' --> 'data\processed_data\ACN\4_2025-01-21.md'
Converted 'data\edgar_documents\ACN\4_2025-01-22' --> 'data\processed_data\ACN\4_2025-01-22.md'
Converted 'data\edgar_documents\ACN\4_2025-01-27' --> 'data\processed_data\ACN\4_2025-01-27.md'


2025-11-14 15:27:29,731 - INFO - Finished converting document 4_2025-02-04 in 0.05 sec.
2025-11-14 15:27:29,768 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:29,781 - INFO - Going to convert document batch...
2025-11-14 15:27:29,782 - INFO - Processing document 4_2025-02-06
2025-11-14 15:27:29,816 - INFO - Finished converting document 4_2025-02-06 in 0.06 sec.
2025-11-14 15:27:29,856 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:29,864 - INFO - Going to convert document batch...
2025-11-14 15:27:29,865 - INFO - Processing document 4_2025-02-07
2025-11-14 15:27:29,885 - INFO - Finished converting document 4_2025-02-07 in 0.05 sec.
2025-11-14 15:27:29,920 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:29,928 - INFO - Going to convert document batch...
2025-11-14 15:27:29,928 - INFO - Processing document 4_2025-02-18


Converted 'data\edgar_documents\ACN\4_2025-02-04' --> 'data\processed_data\ACN\4_2025-02-04.md'
Converted 'data\edgar_documents\ACN\4_2025-02-06' --> 'data\processed_data\ACN\4_2025-02-06.md'
Converted 'data\edgar_documents\ACN\4_2025-02-07' --> 'data\processed_data\ACN\4_2025-02-07.md'


2025-11-14 15:27:29,951 - INFO - Finished converting document 4_2025-02-18 in 0.05 sec.
2025-11-14 15:27:29,999 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:30,018 - INFO - Going to convert document batch...
2025-11-14 15:27:30,019 - INFO - Processing document 4_2025-03-06
2025-11-14 15:27:30,045 - INFO - Finished converting document 4_2025-03-06 in 0.06 sec.
2025-11-14 15:27:30,096 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:30,105 - INFO - Going to convert document batch...
2025-11-14 15:27:30,106 - INFO - Processing document 4_2025-04-07
2025-11-14 15:27:30,124 - INFO - Finished converting document 4_2025-04-07 in 0.06 sec.
2025-11-14 15:27:30,157 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:30,169 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ACN\4_2025-02-18' --> 'data\processed_data\ACN\4_2025-02-18.md'
Converted 'data\edgar_documents\ACN\4_2025-03-06' --> 'data\processed_data\ACN\4_2025-03-06.md'
Converted 'data\edgar_documents\ACN\4_2025-04-07' --> 'data\processed_data\ACN\4_2025-04-07.md'


2025-11-14 15:27:30,170 - INFO - Processing document 4_2025-04-14
2025-11-14 15:27:30,207 - INFO - Finished converting document 4_2025-04-14 in 0.06 sec.
2025-11-14 15:27:30,248 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:30,254 - INFO - Going to convert document batch...
2025-11-14 15:27:30,255 - INFO - Processing document 4_2025-05-05
2025-11-14 15:27:30,273 - INFO - Finished converting document 4_2025-05-05 in 0.03 sec.
2025-11-14 15:27:30,313 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:30,321 - INFO - Going to convert document batch...
2025-11-14 15:27:30,322 - INFO - Processing document 4_2025-05-06
2025-11-14 15:27:30,339 - INFO - Finished converting document 4_2025-05-06 in 0.05 sec.
2025-11-14 15:27:30,375 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:30,384 - INFO - Going to convert document batch...
2025-11-14 15:27:30,384 - INFO - Processing document 4_2025-05-14
2025-11-14 15:27:30,404 - IN

Converted 'data\edgar_documents\ACN\4_2025-04-14' --> 'data\processed_data\ACN\4_2025-04-14.md'
Converted 'data\edgar_documents\ACN\4_2025-05-05' --> 'data\processed_data\ACN\4_2025-05-05.md'
Converted 'data\edgar_documents\ACN\4_2025-05-06' --> 'data\processed_data\ACN\4_2025-05-06.md'


2025-11-14 15:27:30,455 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:30,470 - INFO - Going to convert document batch...
2025-11-14 15:27:30,472 - INFO - Processing document 4_2025-05-16
2025-11-14 15:27:30,495 - INFO - Finished converting document 4_2025-05-16 in 0.08 sec.
2025-11-14 15:27:30,532 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:30,538 - INFO - Going to convert document batch...
2025-11-14 15:27:30,539 - INFO - Processing document 4_2025-06-09
2025-11-14 15:27:30,556 - INFO - Finished converting document 4_2025-06-09 in 0.03 sec.


Converted 'data\edgar_documents\ACN\4_2025-05-14' --> 'data\processed_data\ACN\4_2025-05-14.md'
Converted 'data\edgar_documents\ACN\4_2025-05-16' --> 'data\processed_data\ACN\4_2025-05-16.md'
Converted 'data\edgar_documents\ACN\4_2025-06-09' --> 'data\processed_data\ACN\4_2025-06-09.md'


2025-11-14 15:27:30,607 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:30,620 - INFO - Going to convert document batch...
2025-11-14 15:27:30,621 - INFO - Processing document 4_2025-07-07
2025-11-14 15:27:30,644 - INFO - Finished converting document 4_2025-07-07 in 0.06 sec.
2025-11-14 15:27:30,677 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:30,686 - INFO - Going to convert document batch...
2025-11-14 15:27:30,687 - INFO - Processing document 4_2025-07-14
2025-11-14 15:27:30,711 - INFO - Finished converting document 4_2025-07-14 in 0.05 sec.
2025-11-14 15:27:30,764 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:30,772 - INFO - Going to convert document batch...
2025-11-14 15:27:30,773 - INFO - Processing document 4_2025-08-06
2025-11-14 15:27:30,794 - INFO - Finished converting document 4_2025-08-06 in 0.06 sec.
2025-11-14 15:27:30,830 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\ACN\4_2025-07-07' --> 'data\processed_data\ACN\4_2025-07-07.md'
Converted 'data\edgar_documents\ACN\4_2025-07-14' --> 'data\processed_data\ACN\4_2025-07-14.md'
Converted 'data\edgar_documents\ACN\4_2025-08-06' --> 'data\processed_data\ACN\4_2025-08-06.md'


2025-11-14 15:27:30,857 - INFO - Finished converting document 4_2025-08-18 in 0.05 sec.
2025-11-14 15:27:30,909 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:30,919 - INFO - Going to convert document batch...
2025-11-14 15:27:30,920 - INFO - Processing document 4_2025-09-08
2025-11-14 15:27:30,939 - INFO - Finished converting document 4_2025-09-08 in 0.06 sec.
2025-11-14 15:27:30,985 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:30,994 - INFO - Going to convert document batch...
2025-11-14 15:27:30,995 - INFO - Processing document 4_2025-10-06
2025-11-14 15:27:31,016 - INFO - Finished converting document 4_2025-10-06 in 0.05 sec.
2025-11-14 15:27:31,056 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:31,072 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ACN\4_2025-08-18' --> 'data\processed_data\ACN\4_2025-08-18.md'
Converted 'data\edgar_documents\ACN\4_2025-09-08' --> 'data\processed_data\ACN\4_2025-09-08.md'
Converted 'data\edgar_documents\ACN\4_2025-10-06' --> 'data\processed_data\ACN\4_2025-10-06.md'


2025-11-14 15:27:31,073 - INFO - Processing document 4_2025-10-22
2025-11-14 15:27:31,112 - INFO - Finished converting document 4_2025-10-22 in 0.08 sec.
2025-11-14 15:27:31,150 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:31,161 - INFO - Going to convert document batch...
2025-11-14 15:27:31,163 - INFO - Processing document 4_2025-10-23
2025-11-14 15:27:31,186 - INFO - Finished converting document 4_2025-10-23 in 0.05 sec.
2025-11-14 15:27:31,227 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:31,238 - INFO - Going to convert document batch...
2025-11-14 15:27:31,239 - INFO - Processing document 4_2025-10-30
2025-11-14 15:27:31,265 - INFO - Finished converting document 4_2025-10-30 in 0.05 sec.
2025-11-14 15:27:31,323 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\4_2025-10-22' --> 'data\processed_data\ACN\4_2025-10-22.md'
Converted 'data\edgar_documents\ACN\4_2025-10-23' --> 'data\processed_data\ACN\4_2025-10-23.md'
Converted 'data\edgar_documents\ACN\4_2025-10-30' --> 'data\processed_data\ACN\4_2025-10-30.md'


2025-11-14 15:27:31,335 - INFO - Going to convert document batch...
2025-11-14 15:27:31,335 - INFO - Processing document 4_2025-11-04
2025-11-14 15:27:31,371 - INFO - Finished converting document 4_2025-11-04 in 0.08 sec.
2025-11-14 15:27:31,406 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:31,415 - INFO - Going to convert document batch...
2025-11-14 15:27:31,415 - INFO - Processing document 4_2025-11-06
2025-11-14 15:27:31,434 - INFO - Finished converting document 4_2025-11-06 in 0.05 sec.
2025-11-14 15:27:31,469 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:31,495 - INFO - Going to convert document batch...
2025-11-14 15:27:31,496 - INFO - Processing document 8-K_2023-02-01
2025-11-14 15:27:31,536 - INFO - Finished converting document 8-K_2023-02-01 in 0.08 sec.
2025-11-14 15:27:31,570 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:31,591 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ACN\4_2025-11-04' --> 'data\processed_data\ACN\4_2025-11-04.md'
Converted 'data\edgar_documents\ACN\4_2025-11-06' --> 'data\processed_data\ACN\4_2025-11-06.md'
Converted 'data\edgar_documents\ACN\8-K_2023-02-01' --> 'data\processed_data\ACN\8-K_2023-02-01.md'


2025-11-14 15:27:31,592 - INFO - Processing document 8-K_2023-03-23
2025-11-14 15:27:31,612 - INFO - Finished converting document 8-K_2023-03-23 in 0.06 sec.
2025-11-14 15:27:31,651 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:31,672 - INFO - Going to convert document batch...
2025-11-14 15:27:31,673 - INFO - Processing document 8-K_2023-04-14
2025-11-14 15:27:31,699 - INFO - Finished converting document 8-K_2023-04-14 in 0.08 sec.
2025-11-14 15:27:31,725 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:31,738 - INFO - Going to convert document batch...
2025-11-14 15:27:31,739 - INFO - Processing document 8-K_2023-06-22
2025-11-14 15:27:31,758 - INFO - Finished converting document 8-K_2023-06-22 in 0.05 sec.
2025-11-14 15:27:31,784 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:31,802 - INFO - Going to convert document batch...
2025-11-14 15:27:31,803 - INFO - Processing document 8-K_2023-07-27


Converted 'data\edgar_documents\ACN\8-K_2023-03-23' --> 'data\processed_data\ACN\8-K_2023-03-23.md'
Converted 'data\edgar_documents\ACN\8-K_2023-04-14' --> 'data\processed_data\ACN\8-K_2023-04-14.md'
Converted 'data\edgar_documents\ACN\8-K_2023-06-22' --> 'data\processed_data\ACN\8-K_2023-06-22.md'


2025-11-14 15:27:31,822 - INFO - Finished converting document 8-K_2023-07-27 in 0.05 sec.
2025-11-14 15:27:31,850 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:31,865 - INFO - Going to convert document batch...
2025-11-14 15:27:31,866 - INFO - Processing document 8-K_2023-09-28
2025-11-14 15:27:31,888 - INFO - Finished converting document 8-K_2023-09-28 in 0.06 sec.
2025-11-14 15:27:31,918 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:31,932 - INFO - Going to convert document batch...
2025-11-14 15:27:31,933 - INFO - Processing document 8-K_2023-12-06
2025-11-14 15:27:31,955 - INFO - Finished converting document 8-K_2023-12-06 in 0.05 sec.
2025-11-14 15:27:31,986 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:32,003 - INFO - Going to convert document batch...
2025-11-14 15:27:32,004 - INFO - Processing document 8-K_2023-12-19


Converted 'data\edgar_documents\ACN\8-K_2023-07-27' --> 'data\processed_data\ACN\8-K_2023-07-27.md'
Converted 'data\edgar_documents\ACN\8-K_2023-09-28' --> 'data\processed_data\ACN\8-K_2023-09-28.md'
Converted 'data\edgar_documents\ACN\8-K_2023-12-06' --> 'data\processed_data\ACN\8-K_2023-12-06.md'


2025-11-14 15:27:32,023 - INFO - Finished converting document 8-K_2023-12-19 in 0.05 sec.
2025-11-14 15:27:32,051 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:32,073 - INFO - Going to convert document batch...
2025-11-14 15:27:32,074 - INFO - Processing document 8-K_2024-01-31
2025-11-14 15:27:32,125 - INFO - Finished converting document 8-K_2024-01-31 in 0.09 sec.
2025-11-14 15:27:32,174 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:32,184 - INFO - Going to convert document batch...
2025-11-14 15:27:32,185 - INFO - Processing document 8-K_2024-03-21
2025-11-14 15:27:32,202 - INFO - Finished converting document 8-K_2024-03-21 in 0.05 sec.
2025-11-14 15:27:32,227 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\8-K_2023-12-19' --> 'data\processed_data\ACN\8-K_2023-12-19.md'
Converted 'data\edgar_documents\ACN\8-K_2024-01-31' --> 'data\processed_data\ACN\8-K_2024-01-31.md'
Converted 'data\edgar_documents\ACN\8-K_2024-03-21' --> 'data\processed_data\ACN\8-K_2024-03-21.md'


2025-11-14 15:27:32,236 - INFO - Going to convert document batch...
2025-11-14 15:27:32,237 - INFO - Processing document 8-K_2024-05-17
2025-11-14 15:27:32,255 - INFO - Finished converting document 8-K_2024-05-17 in 0.03 sec.
2025-11-14 15:27:32,280 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:32,288 - INFO - Going to convert document batch...
2025-11-14 15:27:32,289 - INFO - Processing document 8-K_2024-06-11
2025-11-14 15:27:32,309 - INFO - Finished converting document 8-K_2024-06-11 in 0.05 sec.
2025-11-14 15:27:32,333 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:32,340 - INFO - Going to convert document batch...
2025-11-14 15:27:32,340 - INFO - Processing document 8-K_2024-06-20
2025-11-14 15:27:32,358 - INFO - Finished converting document 8-K_2024-06-20 in 0.05 sec.
2025-11-14 15:27:32,382 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:32,390 - INFO - Going to convert document batch...
2025-11-14 15:

Converted 'data\edgar_documents\ACN\8-K_2024-05-17' --> 'data\processed_data\ACN\8-K_2024-05-17.md'
Converted 'data\edgar_documents\ACN\8-K_2024-06-11' --> 'data\processed_data\ACN\8-K_2024-06-11.md'
Converted 'data\edgar_documents\ACN\8-K_2024-06-20' --> 'data\processed_data\ACN\8-K_2024-06-20.md'
Converted 'data\edgar_documents\ACN\8-K_2024-07-19' --> 'data\processed_data\ACN\8-K_2024-07-19.md'


2025-11-14 15:27:32,459 - INFO - Finished converting document 8-K_2024-09-26 in 0.03 sec.
2025-11-14 15:27:32,486 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:32,551 - INFO - Going to convert document batch...
2025-11-14 15:27:32,552 - INFO - Processing document 8-K_2024-09-30
2025-11-14 15:27:32,617 - INFO - Finished converting document 8-K_2024-09-30 in 0.14 sec.
2025-11-14 15:27:32,640 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:32,653 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ACN\8-K_2024-09-26' --> 'data\processed_data\ACN\8-K_2024-09-26.md'
Converted 'data\edgar_documents\ACN\8-K_2024-09-30' --> 'data\processed_data\ACN\8-K_2024-09-30.md'


2025-11-14 15:27:32,654 - INFO - Processing document 8-K_2024-10-04
2025-11-14 15:27:32,679 - INFO - Finished converting document 8-K_2024-10-04 in 0.05 sec.
2025-11-14 15:27:32,706 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:32,715 - INFO - Going to convert document batch...
2025-11-14 15:27:32,716 - INFO - Processing document 8-K_2024-12-02
2025-11-14 15:27:32,731 - INFO - Finished converting document 8-K_2024-12-02 in 0.05 sec.
2025-11-14 15:27:32,754 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:32,762 - INFO - Going to convert document batch...
2025-11-14 15:27:32,763 - INFO - Processing document 8-K_2024-12-19
2025-11-14 15:27:32,782 - INFO - Finished converting document 8-K_2024-12-19 in 0.05 sec.
2025-11-14 15:27:32,808 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:32,830 - INFO - Going to convert document batch...
2025-11-14 15:27:32,830 - INFO - Processing document 8-K_2025-02-06
2025-11-14 15:

Converted 'data\edgar_documents\ACN\8-K_2024-10-04' --> 'data\processed_data\ACN\8-K_2024-10-04.md'
Converted 'data\edgar_documents\ACN\8-K_2024-12-02' --> 'data\processed_data\ACN\8-K_2024-12-02.md'
Converted 'data\edgar_documents\ACN\8-K_2024-12-19' --> 'data\processed_data\ACN\8-K_2024-12-19.md'


2025-11-14 15:27:32,902 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:32,912 - INFO - Going to convert document batch...
2025-11-14 15:27:32,913 - INFO - Processing document 8-K_2025-02-13
2025-11-14 15:27:32,930 - INFO - Finished converting document 8-K_2025-02-13 in 0.03 sec.
2025-11-14 15:27:32,952 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:32,961 - INFO - Going to convert document batch...
2025-11-14 15:27:32,962 - INFO - Processing document 8-K_2025-03-20
2025-11-14 15:27:32,978 - INFO - Finished converting document 8-K_2025-03-20 in 0.03 sec.
2025-11-14 15:27:33,000 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:33,009 - INFO - Going to convert document batch...
2025-11-14 15:27:33,010 - INFO - Processing document 8-K_2025-06-20
2025-11-14 15:27:33,030 - INFO - Finished converting document 8-K_2025-06-20 in 0.05 sec.
2025-11-14 15:27:33,053 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\ACN\8-K_2025-02-06' --> 'data\processed_data\ACN\8-K_2025-02-06.md'
Converted 'data\edgar_documents\ACN\8-K_2025-02-13' --> 'data\processed_data\ACN\8-K_2025-02-13.md'
Converted 'data\edgar_documents\ACN\8-K_2025-03-20' --> 'data\processed_data\ACN\8-K_2025-03-20.md'
Converted 'data\edgar_documents\ACN\8-K_2025-06-20' --> 'data\processed_data\ACN\8-K_2025-06-20.md'


2025-11-14 15:27:33,105 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:27:33,118 - INFO - Going to convert document batch...
2025-11-14 15:27:33,118 - INFO - Processing document 8-K_2025-09-25
2025-11-14 15:27:33,139 - INFO - Finished converting document 8-K_2025-09-25 in 0.05 sec.
2025-11-14 15:27:33,188 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\8-K_2025-07-17' --> 'data\processed_data\ACN\8-K_2025-07-17.md'
Converted 'data\edgar_documents\ACN\8-K_2025-09-25' --> 'data\processed_data\ACN\8-K_2025-09-25.md'


2025-11-14 15:27:33,884 - INFO - Going to convert document batch...
2025-11-14 15:27:33,884 - INFO - Processing document DEF-14A_2023-12-13
2025-11-14 15:27:36,725 - INFO - Finished converting document DEF-14A_2023-12-13 in 3.58 sec.
2025-11-14 15:27:37,672 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\DEF-14A_2023-12-13' --> 'data\processed_data\ACN\DEF-14A_2023-12-13.md'


2025-11-14 15:27:38,307 - INFO - Going to convert document batch...
2025-11-14 15:27:38,308 - INFO - Processing document DEF-14A_2024-12-16
2025-11-14 15:27:41,128 - INFO - Finished converting document DEF-14A_2024-12-16 in 3.48 sec.
2025-11-14 15:27:42,092 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ACN\DEF-14A_2024-12-16' --> 'data\processed_data\ACN\DEF-14A_2024-12-16.md'
Processed 151 new files. Errors: 2
Found 127 files to process in data\edgar_documents\ADBE


2025-11-14 15:27:42,910 - INFO - Going to convert document batch...
2025-11-14 15:27:42,911 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:27:42,911 - INFO - Processing document 10-K_2023-01-17
2025-11-14 15:27:44,086 - INFO - Finished converting document 10-K_2023-01-17 in 2.05 sec.
2025-11-14 15:27:44,644 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\10-K_2023-01-17' --> 'data\processed_data\ADBE\10-K_2023-01-17.md'


2025-11-14 15:27:45,446 - INFO - Going to convert document batch...
2025-11-14 15:27:45,447 - INFO - Processing document 10-K_2024-01-17
2025-11-14 15:27:46,594 - INFO - Finished converting document 10-K_2024-01-17 in 2.00 sec.
2025-11-14 15:27:47,128 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\10-K_2024-01-17' --> 'data\processed_data\ADBE\10-K_2024-01-17.md'


2025-11-14 15:27:47,973 - INFO - Going to convert document batch...
2025-11-14 15:27:47,974 - INFO - Processing document 10-K_2025-01-13
2025-11-14 15:27:49,075 - INFO - Finished converting document 10-K_2025-01-13 in 1.98 sec.
2025-11-14 15:27:49,609 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\10-K_2025-01-13' --> 'data\processed_data\ADBE\10-K_2025-01-13.md'


2025-11-14 15:27:49,974 - INFO - Going to convert document batch...
2025-11-14 15:27:49,975 - INFO - Processing document 10-Q_2023-03-29
2025-11-14 15:27:50,695 - INFO - Finished converting document 10-Q_2023-03-29 in 1.11 sec.
2025-11-14 15:27:51,116 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\10-Q_2023-03-29' --> 'data\processed_data\ADBE\10-Q_2023-03-29.md'


2025-11-14 15:27:51,960 - INFO - Going to convert document batch...
2025-11-14 15:27:51,961 - INFO - Processing document 10-Q_2023-06-28
2025-11-14 15:27:52,762 - INFO - Finished converting document 10-Q_2023-06-28 in 1.69 sec.
2025-11-14 15:27:53,213 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\10-Q_2023-06-28' --> 'data\processed_data\ADBE\10-Q_2023-06-28.md'


2025-11-14 15:27:53,741 - INFO - Going to convert document batch...
2025-11-14 15:27:53,742 - INFO - Processing document 10-Q_2023-09-27
2025-11-14 15:27:54,634 - INFO - Finished converting document 10-Q_2023-09-27 in 1.45 sec.
2025-11-14 15:27:55,505 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\10-Q_2023-09-27' --> 'data\processed_data\ADBE\10-Q_2023-09-27.md'


2025-11-14 15:27:55,960 - INFO - Going to convert document batch...
2025-11-14 15:27:55,960 - INFO - Processing document 10-Q_2024-03-27
2025-11-14 15:27:57,026 - INFO - Finished converting document 10-Q_2024-03-27 in 1.56 sec.
2025-11-14 15:27:57,418 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\10-Q_2024-03-27' --> 'data\processed_data\ADBE\10-Q_2024-03-27.md'


2025-11-14 15:27:58,099 - INFO - Going to convert document batch...
2025-11-14 15:27:58,100 - INFO - Processing document 10-Q_2024-06-26
2025-11-14 15:27:58,928 - INFO - Finished converting document 10-Q_2024-06-26 in 1.53 sec.
2025-11-14 15:27:59,362 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\10-Q_2024-06-26' --> 'data\processed_data\ADBE\10-Q_2024-06-26.md'


2025-11-14 15:27:59,769 - INFO - Going to convert document batch...
2025-11-14 15:27:59,770 - INFO - Processing document 10-Q_2024-09-25
2025-11-14 15:28:00,548 - INFO - Finished converting document 10-Q_2024-09-25 in 1.22 sec.
2025-11-14 15:28:00,986 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\10-Q_2024-09-25' --> 'data\processed_data\ADBE\10-Q_2024-09-25.md'


2025-11-14 15:28:01,679 - INFO - Going to convert document batch...
2025-11-14 15:28:01,680 - INFO - Processing document 10-Q_2025-03-26
2025-11-14 15:28:02,371 - INFO - Finished converting document 10-Q_2025-03-26 in 1.42 sec.
2025-11-14 15:28:02,743 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\10-Q_2025-03-26' --> 'data\processed_data\ADBE\10-Q_2025-03-26.md'


2025-11-14 15:28:03,105 - INFO - Going to convert document batch...
2025-11-14 15:28:03,106 - INFO - Processing document 10-Q_2025-06-25
2025-11-14 15:28:03,815 - INFO - Finished converting document 10-Q_2025-06-25 in 1.11 sec.
2025-11-14 15:28:04,203 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\10-Q_2025-06-25' --> 'data\processed_data\ADBE\10-Q_2025-06-25.md'


2025-11-14 15:28:04,872 - INFO - Going to convert document batch...
2025-11-14 15:28:04,872 - INFO - Processing document 10-Q_2025-09-24
2025-11-14 15:28:05,603 - INFO - Finished converting document 10-Q_2025-09-24 in 1.42 sec.
2025-11-14 15:28:05,998 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:06,008 - INFO - Going to convert document batch...
2025-11-14 15:28:06,008 - INFO - Processing document 4_2023-01-10
2025-11-14 15:28:06,029 - INFO - Finished converting document 4_2023-01-10 in 0.05 sec.
2025-11-14 15:28:06,078 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:28:06,079 - ERROR - Input document 4_2023-01-11 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, 

Converted 'data\edgar_documents\ADBE\10-Q_2025-09-24' --> 'data\processed_data\ADBE\10-Q_2025-09-24.md'
Converted 'data\edgar_documents\ADBE\4_2023-01-10' --> 'data\processed_data\ADBE\4_2023-01-10.md'
Error processing data\edgar_documents\ADBE\4_2023-01-11: File format not allowed: data\edgar_documents\ADBE\4_2023-01-11
Converted 'data\edgar_documents\ADBE\4_2023-01-12' --> 'data\processed_data\ADBE\4_2023-01-12.md'


2025-11-14 15:28:06,170 - INFO - Processing document 4_2023-01-23
2025-11-14 15:28:06,199 - INFO - Finished converting document 4_2023-01-23 in 0.06 sec.
2025-11-14 15:28:06,254 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:06,278 - INFO - Going to convert document batch...
2025-11-14 15:28:06,279 - INFO - Processing document 4_2023-01-26
2025-11-14 15:28:06,321 - INFO - Finished converting document 4_2023-01-26 in 0.09 sec.
2025-11-14 15:28:06,367 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:06,377 - INFO - Going to convert document batch...
2025-11-14 15:28:06,377 - INFO - Processing document 4_2023-02-03
2025-11-14 15:28:06,395 - INFO - Finished converting document 4_2023-02-03 in 0.03 sec.
2025-11-14 15:28:06,427 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\4_2023-01-23' --> 'data\processed_data\ADBE\4_2023-01-23.md'
Converted 'data\edgar_documents\ADBE\4_2023-01-26' --> 'data\processed_data\ADBE\4_2023-01-26.md'
Converted 'data\edgar_documents\ADBE\4_2023-02-03' --> 'data\processed_data\ADBE\4_2023-02-03.md'


2025-11-14 15:28:06,437 - INFO - Going to convert document batch...
2025-11-14 15:28:06,438 - INFO - Processing document 4_2023-02-16
2025-11-14 15:28:06,462 - INFO - Finished converting document 4_2023-02-16 in 0.05 sec.
2025-11-14 15:28:06,493 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:06,504 - INFO - Going to convert document batch...
2025-11-14 15:28:06,504 - INFO - Processing document 4_2023-03-01
2025-11-14 15:28:06,526 - INFO - Finished converting document 4_2023-03-01 in 0.05 sec.
2025-11-14 15:28:06,557 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:06,566 - INFO - Going to convert document batch...
2025-11-14 15:28:06,567 - INFO - Processing document 4_2023-03-16
2025-11-14 15:28:06,590 - INFO - Finished converting document 4_2023-03-16 in 0.05 sec.
2025-11-14 15:28:06,625 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:06,633 - INFO - Going to convert document batch...
2025-11-14 15:28:06,634 - 

Converted 'data\edgar_documents\ADBE\4_2023-02-16' --> 'data\processed_data\ADBE\4_2023-02-16.md'
Converted 'data\edgar_documents\ADBE\4_2023-03-01' --> 'data\processed_data\ADBE\4_2023-03-01.md'
Converted 'data\edgar_documents\ADBE\4_2023-03-16' --> 'data\processed_data\ADBE\4_2023-03-16.md'
Converted 'data\edgar_documents\ADBE\4_2023-03-21' --> 'data\processed_data\ADBE\4_2023-03-21.md'


2025-11-14 15:28:06,690 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:06,699 - INFO - Going to convert document batch...
2025-11-14 15:28:06,700 - INFO - Processing document 4_2023-04-18
2025-11-14 15:28:06,726 - INFO - Finished converting document 4_2023-04-18 in 0.05 sec.
2025-11-14 15:28:06,765 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:06,775 - INFO - Going to convert document batch...
2025-11-14 15:28:06,776 - INFO - Processing document 4_2023-04-24
2025-11-14 15:28:06,803 - INFO - Finished converting document 4_2023-04-24 in 0.05 sec.
2025-11-14 15:28:06,843 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:06,851 - INFO - Going to convert document batch...
2025-11-14 15:28:06,852 - INFO - Processing document 4_2023-04-26
2025-11-14 15:28:06,872 - INFO - Finished converting document 4_2023-04-26 in 0.05 sec.
2025-11-14 15:28:06,910 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\ADBE\4_2023-04-18' --> 'data\processed_data\ADBE\4_2023-04-18.md'
Converted 'data\edgar_documents\ADBE\4_2023-04-24' --> 'data\processed_data\ADBE\4_2023-04-24.md'
Converted 'data\edgar_documents\ADBE\4_2023-04-26' --> 'data\processed_data\ADBE\4_2023-04-26.md'


2025-11-14 15:28:06,971 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:06,986 - INFO - Going to convert document batch...
2025-11-14 15:28:06,988 - INFO - Processing document 4_2023-05-17
2025-11-14 15:28:07,009 - INFO - Finished converting document 4_2023-05-17 in 0.05 sec.
2025-11-14 15:28:07,051 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:07,072 - INFO - Going to convert document batch...
2025-11-14 15:28:07,073 - INFO - Processing document 4_2023-05-31
2025-11-14 15:28:07,108 - INFO - Finished converting document 4_2023-05-31 in 0.08 sec.


Converted 'data\edgar_documents\ADBE\4_2023-05-03' --> 'data\processed_data\ADBE\4_2023-05-03.md'
Converted 'data\edgar_documents\ADBE\4_2023-05-17' --> 'data\processed_data\ADBE\4_2023-05-17.md'


2025-11-14 15:28:07,156 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:07,171 - INFO - Going to convert document batch...
2025-11-14 15:28:07,171 - INFO - Processing document 4_2023-06-15
2025-11-14 15:28:07,197 - INFO - Finished converting document 4_2023-06-15 in 0.05 sec.
2025-11-14 15:28:07,254 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:07,265 - INFO - Going to convert document batch...
2025-11-14 15:28:07,266 - INFO - Processing document 4_2023-06-20
2025-11-14 15:28:07,292 - INFO - Finished converting document 4_2023-06-20 in 0.06 sec.
2025-11-14 15:28:07,333 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\4_2023-05-31' --> 'data\processed_data\ADBE\4_2023-05-31.md'
Converted 'data\edgar_documents\ADBE\4_2023-06-15' --> 'data\processed_data\ADBE\4_2023-06-15.md'
Converted 'data\edgar_documents\ADBE\4_2023-06-20' --> 'data\processed_data\ADBE\4_2023-06-20.md'


2025-11-14 15:28:07,344 - INFO - Going to convert document batch...
2025-11-14 15:28:07,345 - INFO - Processing document 4_2023-06-22
2025-11-14 15:28:07,373 - INFO - Finished converting document 4_2023-06-22 in 0.06 sec.
2025-11-14 15:28:07,415 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:07,423 - INFO - Going to convert document batch...
2025-11-14 15:28:07,424 - INFO - Processing document 4_2023-06-23
2025-11-14 15:28:07,444 - INFO - Finished converting document 4_2023-06-23 in 0.03 sec.
2025-11-14 15:28:07,482 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:07,492 - INFO - Going to convert document batch...
2025-11-14 15:28:07,493 - INFO - Processing document 4_2023-07-18
2025-11-14 15:28:07,519 - INFO - Finished converting document 4_2023-07-18 in 0.05 sec.
2025-11-14 15:28:07,553 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:07,563 - INFO - Going to convert document batch...
2025-11-14 15:28:07,564 - 

Converted 'data\edgar_documents\ADBE\4_2023-06-22' --> 'data\processed_data\ADBE\4_2023-06-22.md'
Converted 'data\edgar_documents\ADBE\4_2023-06-23' --> 'data\processed_data\ADBE\4_2023-06-23.md'
Converted 'data\edgar_documents\ADBE\4_2023-07-18' --> 'data\processed_data\ADBE\4_2023-07-18.md'
Converted 'data\edgar_documents\ADBE\4_2023-07-26' --> 'data\processed_data\ADBE\4_2023-07-26.md'


2025-11-14 15:28:07,627 - INFO - Going to convert document batch...
2025-11-14 15:28:07,628 - INFO - Processing document 4_2023-08-07
2025-11-14 15:28:07,647 - INFO - Finished converting document 4_2023-08-07 in 0.03 sec.
2025-11-14 15:28:07,695 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:07,712 - INFO - Going to convert document batch...
2025-11-14 15:28:07,713 - INFO - Processing document 4_2023-08-17
2025-11-14 15:28:07,734 - INFO - Finished converting document 4_2023-08-17 in 0.06 sec.
2025-11-14 15:28:07,766 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:07,777 - INFO - Going to convert document batch...
2025-11-14 15:28:07,777 - INFO - Processing document 4_2023-09-01
2025-11-14 15:28:07,799 - INFO - Finished converting document 4_2023-09-01 in 0.05 sec.
2025-11-14 15:28:07,831 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:07,840 - INFO - Going to convert document batch...
2025-11-14 15:28:07,840 - 

Converted 'data\edgar_documents\ADBE\4_2023-08-07' --> 'data\processed_data\ADBE\4_2023-08-07.md'
Converted 'data\edgar_documents\ADBE\4_2023-08-17' --> 'data\processed_data\ADBE\4_2023-08-17.md'
Converted 'data\edgar_documents\ADBE\4_2023-09-01' --> 'data\processed_data\ADBE\4_2023-09-01.md'


2025-11-14 15:28:07,902 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:07,913 - INFO - Going to convert document batch...
2025-11-14 15:28:07,914 - INFO - Processing document 4_2023-09-19
2025-11-14 15:28:07,941 - INFO - Finished converting document 4_2023-09-19 in 0.05 sec.
2025-11-14 15:28:07,976 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:07,985 - INFO - Going to convert document batch...
2025-11-14 15:28:07,986 - INFO - Processing document 4_2023-10-17
2025-11-14 15:28:08,006 - INFO - Finished converting document 4_2023-10-17 in 0.03 sec.
2025-11-14 15:28:08,038 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:08,048 - INFO - Going to convert document batch...
2025-11-14 15:28:08,049 - INFO - Processing document 4_2023-10-26
2025-11-14 15:28:08,075 - INFO - Finished converting document 4_2023-10-26 in 0.05 sec.


Converted 'data\edgar_documents\ADBE\4_2023-09-18' --> 'data\processed_data\ADBE\4_2023-09-18.md'
Converted 'data\edgar_documents\ADBE\4_2023-09-19' --> 'data\processed_data\ADBE\4_2023-09-19.md'
Converted 'data\edgar_documents\ADBE\4_2023-10-17' --> 'data\processed_data\ADBE\4_2023-10-17.md'


2025-11-14 15:28:08,110 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\4_2023-10-26' --> 'data\processed_data\ADBE\4_2023-10-26.md'


2025-11-14 15:28:08,474 - INFO - Going to convert document batch...
2025-11-14 15:28:08,475 - INFO - Processing document 4_2023-11-16
2025-11-14 15:28:08,503 - INFO - Finished converting document 4_2023-11-16 in 0.41 sec.
2025-11-14 15:28:08,551 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:08,565 - INFO - Going to convert document batch...
2025-11-14 15:28:08,566 - INFO - Processing document 4_2023-12-01
2025-11-14 15:28:08,586 - INFO - Finished converting document 4_2023-12-01 in 0.06 sec.
2025-11-14 15:28:08,619 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:08,628 - INFO - Going to convert document batch...
2025-11-14 15:28:08,629 - INFO - Processing document 4_2023-12-18
2025-11-14 15:28:08,651 - INFO - Finished converting document 4_2023-12-18 in 0.05 sec.
2025-11-14 15:28:08,701 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\4_2023-11-16' --> 'data\processed_data\ADBE\4_2023-11-16.md'
Converted 'data\edgar_documents\ADBE\4_2023-12-01' --> 'data\processed_data\ADBE\4_2023-12-01.md'
Converted 'data\edgar_documents\ADBE\4_2023-12-18' --> 'data\processed_data\ADBE\4_2023-12-18.md'


2025-11-14 15:28:08,717 - INFO - Going to convert document batch...
2025-11-14 15:28:08,718 - INFO - Processing document 4_2023-12-19
2025-11-14 15:28:08,746 - INFO - Finished converting document 4_2023-12-19 in 0.08 sec.
2025-11-14 15:28:08,799 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:08,814 - INFO - Going to convert document batch...
2025-11-14 15:28:08,815 - INFO - Processing document 4_2023-12-26
2025-11-14 15:28:08,833 - INFO - Finished converting document 4_2023-12-26 in 0.06 sec.
2025-11-14 15:28:08,864 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:08,871 - INFO - Going to convert document batch...
2025-11-14 15:28:08,872 - INFO - Processing document 4_2024-01-04
2025-11-14 15:28:08,890 - INFO - Finished converting document 4_2024-01-04 in 0.05 sec.
2025-11-14 15:28:08,921 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:08,927 - INFO - Going to convert document batch...
2025-11-14 15:28:08,928 - 

Converted 'data\edgar_documents\ADBE\4_2023-12-19' --> 'data\processed_data\ADBE\4_2023-12-19.md'
Converted 'data\edgar_documents\ADBE\4_2023-12-26' --> 'data\processed_data\ADBE\4_2023-12-26.md'
Converted 'data\edgar_documents\ADBE\4_2024-01-04' --> 'data\processed_data\ADBE\4_2024-01-04.md'
Converted 'data\edgar_documents\ADBE\4_2024-01-08' --> 'data\processed_data\ADBE\4_2024-01-08.md'


2025-11-14 15:28:08,992 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:09,008 - INFO - Going to convert document batch...
2025-11-14 15:28:09,010 - INFO - Processing document 4_2024-01-17
2025-11-14 15:28:09,034 - INFO - Finished converting document 4_2024-01-17 in 0.06 sec.
2025-11-14 15:28:09,068 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:09,084 - INFO - Going to convert document batch...
2025-11-14 15:28:09,085 - INFO - Processing document 4_2024-01-26
2025-11-14 15:28:09,126 - INFO - Finished converting document 4_2024-01-26 in 0.08 sec.
2025-11-14 15:28:09,182 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:09,200 - INFO - Going to convert document batch...
2025-11-14 15:28:09,201 - INFO - Processing document 4_2024-02-15
2025-11-14 15:28:09,226 - INFO - Finished converting document 4_2024-02-15 in 0.06 sec.


Converted 'data\edgar_documents\ADBE\4_2024-01-17' --> 'data\processed_data\ADBE\4_2024-01-17.md'
Converted 'data\edgar_documents\ADBE\4_2024-01-26' --> 'data\processed_data\ADBE\4_2024-01-26.md'


2025-11-14 15:28:09,258 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:09,268 - INFO - Going to convert document batch...
2025-11-14 15:28:09,268 - INFO - Processing document 4_2024-03-18
2025-11-14 15:28:09,290 - INFO - Finished converting document 4_2024-03-18 in 0.03 sec.
2025-11-14 15:28:09,321 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:09,332 - INFO - Going to convert document batch...
2025-11-14 15:28:09,333 - INFO - Processing document 4_2024-03-19
2025-11-14 15:28:09,360 - INFO - Finished converting document 4_2024-03-19 in 0.05 sec.
2025-11-14 15:28:09,409 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:09,416 - INFO - Going to convert document batch...
2025-11-14 15:28:09,417 - INFO - Processing document 4_2024-03-28
2025-11-14 15:28:09,435 - INFO - Finished converting document 4_2024-03-28 in 0.06 sec.


Converted 'data\edgar_documents\ADBE\4_2024-02-15' --> 'data\processed_data\ADBE\4_2024-02-15.md'
Converted 'data\edgar_documents\ADBE\4_2024-03-18' --> 'data\processed_data\ADBE\4_2024-03-18.md'
Converted 'data\edgar_documents\ADBE\4_2024-03-19' --> 'data\processed_data\ADBE\4_2024-03-19.md'


2025-11-14 15:28:09,474 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:28:09,474 - ERROR - Input document 4_2024-04-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:28:09,476 - INFO - Going to convert document batch...
2025-11-14 15:28:09,495 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:28:09,496 - ERROR - Input document 4_2024-04-02 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\ADBE\4_2024-03-28' --> 'data\processed_data\ADBE\4_2024-03-28.md'
Error processing data\edgar_documents\ADBE\4_2024-04-01: File format not allowed: data\edgar_documents\ADBE\4_2024-04-01
Error processing data\edgar_documents\ADBE\4_2024-04-02: File format not allowed: data\edgar_documents\ADBE\4_2024-04-02
Converted 'data\edgar_documents\ADBE\4_2024-04-17' --> 'data\processed_data\ADBE\4_2024-04-17.md'
Converted 'data\edgar_documents\ADBE\4_2024-04-19' --> 'data\processed_data\ADBE\4_2024-04-19.md'


2025-11-14 15:28:09,654 - INFO - Going to convert document batch...
2025-11-14 15:28:09,655 - INFO - Processing document 4_2024-04-23
2025-11-14 15:28:09,672 - INFO - Finished converting document 4_2024-04-23 in 0.05 sec.
2025-11-14 15:28:09,730 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:09,745 - INFO - Going to convert document batch...
2025-11-14 15:28:09,747 - INFO - Processing document 4_2024-04-25
2025-11-14 15:28:09,772 - INFO - Finished converting document 4_2024-04-25 in 0.08 sec.
2025-11-14 15:28:09,827 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:09,837 - INFO - Going to convert document batch...
2025-11-14 15:28:09,838 - INFO - Processing document 4_2024-05-03
2025-11-14 15:28:09,859 - INFO - Finished converting document 4_2024-05-03 in 0.06 sec.


Converted 'data\edgar_documents\ADBE\4_2024-04-23' --> 'data\processed_data\ADBE\4_2024-04-23.md'
Converted 'data\edgar_documents\ADBE\4_2024-04-25' --> 'data\processed_data\ADBE\4_2024-04-25.md'
Converted 'data\edgar_documents\ADBE\4_2024-05-03' --> 'data\processed_data\ADBE\4_2024-05-03.md'


2025-11-14 15:28:09,908 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:09,917 - INFO - Going to convert document batch...
2025-11-14 15:28:09,917 - INFO - Processing document 4_2024-05-08
2025-11-14 15:28:09,935 - INFO - Finished converting document 4_2024-05-08 in 0.06 sec.
2025-11-14 15:28:09,965 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:09,973 - INFO - Going to convert document batch...
2025-11-14 15:28:09,974 - INFO - Processing document 4_2024-05-16
2025-11-14 15:28:09,996 - INFO - Finished converting document 4_2024-05-16 in 0.05 sec.
2025-11-14 15:28:10,026 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:10,036 - INFO - Going to convert document batch...
2025-11-14 15:28:10,037 - INFO - Processing document 4_2024-06-04
2025-11-14 15:28:10,055 - INFO - Finished converting document 4_2024-06-04 in 0.03 sec.
2025-11-14 15:28:10,107 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\ADBE\4_2024-05-08' --> 'data\processed_data\ADBE\4_2024-05-08.md'
Converted 'data\edgar_documents\ADBE\4_2024-05-16' --> 'data\processed_data\ADBE\4_2024-05-16.md'
Converted 'data\edgar_documents\ADBE\4_2024-06-04' --> 'data\processed_data\ADBE\4_2024-06-04.md'


2025-11-14 15:28:10,173 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:10,181 - INFO - Going to convert document batch...
2025-11-14 15:28:10,182 - INFO - Processing document 4_2024-06-20
2025-11-14 15:28:10,200 - INFO - Finished converting document 4_2024-06-20 in 0.05 sec.
2025-11-14 15:28:10,232 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:10,241 - INFO - Going to convert document batch...
2025-11-14 15:28:10,242 - INFO - Processing document 4_2024-06-28
2025-11-14 15:28:10,264 - INFO - Finished converting document 4_2024-06-28 in 0.05 sec.
2025-11-14 15:28:10,299 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:10,310 - INFO - Going to convert document batch...
2025-11-14 15:28:10,311 - INFO - Processing document 4_2024-07-17
2025-11-14 15:28:10,338 - INFO - Finished converting document 4_2024-07-17 in 0.05 sec.


Converted 'data\edgar_documents\ADBE\4_2024-06-18' --> 'data\processed_data\ADBE\4_2024-06-18.md'
Converted 'data\edgar_documents\ADBE\4_2024-06-20' --> 'data\processed_data\ADBE\4_2024-06-20.md'
Converted 'data\edgar_documents\ADBE\4_2024-06-28' --> 'data\processed_data\ADBE\4_2024-06-28.md'
Converted 'data\edgar_documents\ADBE\4_2024-07-17' --> 'data\processed_data\ADBE\4_2024-07-17.md'


2025-11-14 15:28:10,393 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:10,406 - INFO - Going to convert document batch...
2025-11-14 15:28:10,407 - INFO - Processing document 4_2024-07-26
2025-11-14 15:28:10,429 - INFO - Finished converting document 4_2024-07-26 in 0.06 sec.
2025-11-14 15:28:10,461 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:10,469 - INFO - Going to convert document batch...
2025-11-14 15:28:10,470 - INFO - Processing document 4_2024-08-12
2025-11-14 15:28:10,488 - INFO - Finished converting document 4_2024-08-12 in 0.03 sec.
2025-11-14 15:28:10,537 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:10,553 - INFO - Going to convert document batch...
2025-11-14 15:28:10,554 - INFO - Processing document 4_2024-08-19
2025-11-14 15:28:10,581 - INFO - Finished converting document 4_2024-08-19 in 0.08 sec.
2025-11-14 15:28:10,613 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\ADBE\4_2024-07-26' --> 'data\processed_data\ADBE\4_2024-07-26.md'
Converted 'data\edgar_documents\ADBE\4_2024-08-12' --> 'data\processed_data\ADBE\4_2024-08-12.md'
Converted 'data\edgar_documents\ADBE\4_2024-08-19' --> 'data\processed_data\ADBE\4_2024-08-19.md'


2025-11-14 15:28:10,678 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:10,687 - INFO - Going to convert document batch...
2025-11-14 15:28:10,688 - INFO - Processing document 4_2024-09-19
2025-11-14 15:28:10,709 - INFO - Finished converting document 4_2024-09-19 in 0.03 sec.
2025-11-14 15:28:10,752 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:10,773 - INFO - Going to convert document batch...
2025-11-14 15:28:10,774 - INFO - Processing document 4_2024-09-26
2025-11-14 15:28:10,801 - INFO - Finished converting document 4_2024-09-26 in 0.06 sec.
2025-11-14 15:28:10,839 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:10,850 - INFO - Going to convert document batch...
2025-11-14 15:28:10,851 - INFO - Processing document 4_2024-10-17


Converted 'data\edgar_documents\ADBE\4_2024-09-17' --> 'data\processed_data\ADBE\4_2024-09-17.md'
Converted 'data\edgar_documents\ADBE\4_2024-09-19' --> 'data\processed_data\ADBE\4_2024-09-19.md'
Converted 'data\edgar_documents\ADBE\4_2024-09-26' --> 'data\processed_data\ADBE\4_2024-09-26.md'


2025-11-14 15:28:10,877 - INFO - Finished converting document 4_2024-10-17 in 0.05 sec.
2025-11-14 15:28:10,913 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:10,925 - INFO - Going to convert document batch...
2025-11-14 15:28:10,926 - INFO - Processing document 4_2024-10-28
2025-11-14 15:28:10,952 - INFO - Finished converting document 4_2024-10-28 in 0.05 sec.
2025-11-14 15:28:11,001 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:11,014 - INFO - Going to convert document batch...
2025-11-14 15:28:11,015 - INFO - Processing document 4_2024-10-31
2025-11-14 15:28:11,035 - INFO - Finished converting document 4_2024-10-31 in 0.06 sec.
2025-11-14 15:28:11,080 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:11,095 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ADBE\4_2024-10-17' --> 'data\processed_data\ADBE\4_2024-10-17.md'
Converted 'data\edgar_documents\ADBE\4_2024-10-28' --> 'data\processed_data\ADBE\4_2024-10-28.md'
Converted 'data\edgar_documents\ADBE\4_2024-10-31' --> 'data\processed_data\ADBE\4_2024-10-31.md'


2025-11-14 15:28:11,095 - INFO - Processing document 4_2024-11-19
2025-11-14 15:28:11,117 - INFO - Finished converting document 4_2024-11-19 in 0.06 sec.
2025-11-14 15:28:11,147 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:11,155 - INFO - Going to convert document batch...
2025-11-14 15:28:11,156 - INFO - Processing document 4_2024-12-02
2025-11-14 15:28:11,174 - INFO - Finished converting document 4_2024-12-02 in 0.03 sec.
2025-11-14 15:28:11,232 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:11,251 - INFO - Going to convert document batch...
2025-11-14 15:28:11,252 - INFO - Processing document 4_2024-12-10
2025-11-14 15:28:11,273 - INFO - Finished converting document 4_2024-12-10 in 0.08 sec.
2025-11-14 15:28:11,302 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:11,316 - INFO - Going to convert document batch...
2025-11-14 15:28:11,317 - INFO - Processing document 4_2024-12-17


Converted 'data\edgar_documents\ADBE\4_2024-11-19' --> 'data\processed_data\ADBE\4_2024-11-19.md'
Converted 'data\edgar_documents\ADBE\4_2024-12-02' --> 'data\processed_data\ADBE\4_2024-12-02.md'
Converted 'data\edgar_documents\ADBE\4_2024-12-10' --> 'data\processed_data\ADBE\4_2024-12-10.md'


2025-11-14 15:28:11,350 - INFO - Finished converting document 4_2024-12-17 in 0.05 sec.
2025-11-14 15:28:11,387 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:11,397 - INFO - Going to convert document batch...
2025-11-14 15:28:11,398 - INFO - Processing document 4_2025-01-02
2025-11-14 15:28:11,415 - INFO - Finished converting document 4_2025-01-02 in 0.03 sec.
2025-11-14 15:28:11,452 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:28:11,453 - ERROR - Input document 4_2025-01-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'js

Converted 'data\edgar_documents\ADBE\4_2024-12-17' --> 'data\processed_data\ADBE\4_2024-12-17.md'
Converted 'data\edgar_documents\ADBE\4_2025-01-02' --> 'data\processed_data\ADBE\4_2025-01-02.md'
Error processing data\edgar_documents\ADBE\4_2025-01-14: File format not allowed: data\edgar_documents\ADBE\4_2025-01-14
Error processing data\edgar_documents\ADBE\4_2025-01-15: File format not allowed: data\edgar_documents\ADBE\4_2025-01-15
Converted 'data\edgar_documents\ADBE\4_2025-01-17' --> 'data\processed_data\ADBE\4_2025-01-17.md'


2025-11-14 15:28:11,593 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:11,620 - INFO - Going to convert document batch...
2025-11-14 15:28:11,621 - INFO - Processing document 4_2025-01-28
2025-11-14 15:28:11,659 - INFO - Finished converting document 4_2025-01-28 in 0.11 sec.
2025-11-14 15:28:11,700 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:11,708 - INFO - Going to convert document batch...
2025-11-14 15:28:11,709 - INFO - Processing document 4_2025-01-30
2025-11-14 15:28:11,726 - INFO - Finished converting document 4_2025-01-30 in 0.03 sec.
2025-11-14 15:28:11,775 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:11,794 - INFO - Going to convert document batch...
2025-11-14 15:28:11,795 - INFO - Processing document 4_2025-03-17
2025-11-14 15:28:11,823 - INFO - Finished converting document 4_2025-03-17 in 0.08 sec.
2025-11-14 15:28:11,873 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\4_2025-01-28' --> 'data\processed_data\ADBE\4_2025-01-28.md'
Converted 'data\edgar_documents\ADBE\4_2025-01-30' --> 'data\processed_data\ADBE\4_2025-01-30.md'
Converted 'data\edgar_documents\ADBE\4_2025-03-17' --> 'data\processed_data\ADBE\4_2025-03-17.md'


2025-11-14 15:28:11,886 - INFO - Going to convert document batch...
2025-11-14 15:28:11,886 - INFO - Processing document 4_2025-03-21
2025-11-14 15:28:11,906 - INFO - Finished converting document 4_2025-03-21 in 0.06 sec.
2025-11-14 15:28:11,938 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\4_2025-03-21' --> 'data\processed_data\ADBE\4_2025-03-21.md'


2025-11-14 15:28:12,171 - INFO - Going to convert document batch...
2025-11-14 15:28:12,172 - INFO - Processing document 4_2025-04-17
2025-11-14 15:28:12,203 - INFO - Finished converting document 4_2025-04-17 in 0.28 sec.
2025-11-14 15:28:12,247 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:12,256 - INFO - Going to convert document batch...
2025-11-14 15:28:12,257 - INFO - Processing document 4_2025-04-23
2025-11-14 15:28:12,278 - INFO - Finished converting document 4_2025-04-23 in 0.05 sec.
2025-11-14 15:28:12,308 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:12,318 - INFO - Going to convert document batch...
2025-11-14 15:28:12,318 - INFO - Processing document 4_2025-04-28
2025-11-14 15:28:12,337 - INFO - Finished converting document 4_2025-04-28 in 0.03 sec.
2025-11-14 15:28:12,384 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:12,394 - INFO - Going to convert document batch...
2025-11-14 15:28:12,395 - 

Converted 'data\edgar_documents\ADBE\4_2025-04-17' --> 'data\processed_data\ADBE\4_2025-04-17.md'
Converted 'data\edgar_documents\ADBE\4_2025-04-23' --> 'data\processed_data\ADBE\4_2025-04-23.md'
Converted 'data\edgar_documents\ADBE\4_2025-04-28' --> 'data\processed_data\ADBE\4_2025-04-28.md'


2025-11-14 15:28:12,445 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:12,454 - INFO - Going to convert document batch...
2025-11-14 15:28:12,455 - INFO - Processing document 4_2025-06-16
2025-11-14 15:28:12,475 - INFO - Finished converting document 4_2025-06-16 in 0.03 sec.
2025-11-14 15:28:12,508 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:12,520 - INFO - Going to convert document batch...
2025-11-14 15:28:12,521 - INFO - Processing document 4_2025-07-17
2025-11-14 15:28:12,551 - INFO - Finished converting document 4_2025-07-17 in 0.05 sec.
2025-11-14 15:28:12,588 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:12,598 - INFO - Going to convert document batch...
2025-11-14 15:28:12,599 - INFO - Processing document 4_2025-07-28
2025-11-14 15:28:12,622 - INFO - Finished converting document 4_2025-07-28 in 0.05 sec.


Converted 'data\edgar_documents\ADBE\4_2025-05-06' --> 'data\processed_data\ADBE\4_2025-05-06.md'
Converted 'data\edgar_documents\ADBE\4_2025-06-16' --> 'data\processed_data\ADBE\4_2025-06-16.md'
Converted 'data\edgar_documents\ADBE\4_2025-07-17' --> 'data\processed_data\ADBE\4_2025-07-17.md'


2025-11-14 15:28:12,658 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:12,669 - INFO - Going to convert document batch...
2025-11-14 15:28:12,670 - INFO - Processing document 4_2025-09-17
2025-11-14 15:28:12,700 - INFO - Finished converting document 4_2025-09-17 in 0.06 sec.
2025-11-14 15:28:12,754 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:12,768 - INFO - Going to convert document batch...
2025-11-14 15:28:12,769 - INFO - Processing document 4_2025-10-16
2025-11-14 15:28:12,798 - INFO - Finished converting document 4_2025-10-16 in 0.08 sec.


Converted 'data\edgar_documents\ADBE\4_2025-07-28' --> 'data\processed_data\ADBE\4_2025-07-28.md'
Converted 'data\edgar_documents\ADBE\4_2025-09-17' --> 'data\processed_data\ADBE\4_2025-09-17.md'
Converted 'data\edgar_documents\ADBE\4_2025-10-16' --> 'data\processed_data\ADBE\4_2025-10-16.md'


2025-11-14 15:28:12,851 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:12,863 - INFO - Going to convert document batch...
2025-11-14 15:28:12,864 - INFO - Processing document 4_2025-10-27
2025-11-14 15:28:12,885 - INFO - Finished converting document 4_2025-10-27 in 0.06 sec.
2025-11-14 15:28:12,923 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:12,931 - INFO - Going to convert document batch...
2025-11-14 15:28:12,931 - INFO - Processing document 4_2025-11-04
2025-11-14 15:28:12,948 - INFO - Finished converting document 4_2025-11-04 in 0.05 sec.
2025-11-14 15:28:12,979 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:12,988 - INFO - Going to convert document batch...
2025-11-14 15:28:12,989 - INFO - Processing document 8-K_2023-01-19
2025-11-14 15:28:13,005 - INFO - Finished converting document 8-K_2023-01-19 in 0.03 sec.
2025-11-14 15:28:13,046 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14

Converted 'data\edgar_documents\ADBE\4_2025-10-27' --> 'data\processed_data\ADBE\4_2025-10-27.md'
Converted 'data\edgar_documents\ADBE\4_2025-11-04' --> 'data\processed_data\ADBE\4_2025-11-04.md'
Converted 'data\edgar_documents\ADBE\8-K_2023-01-19' --> 'data\processed_data\ADBE\8-K_2023-01-19.md'


2025-11-14 15:28:13,165 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:13,181 - INFO - Going to convert document batch...
2025-11-14 15:28:13,182 - INFO - Processing document 8-K_2023-03-15
2025-11-14 15:28:13,200 - INFO - Finished converting document 8-K_2023-03-15 in 0.06 sec.
2025-11-14 15:28:13,247 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:13,279 - INFO - Going to convert document batch...
2025-11-14 15:28:13,279 - INFO - Processing document 8-K_2023-04-24
2025-11-14 15:28:13,322 - INFO - Finished converting document 8-K_2023-04-24 in 0.11 sec.
2025-11-14 15:28:13,356 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\8-K_2023-01-26' --> 'data\processed_data\ADBE\8-K_2023-01-26.md'
Converted 'data\edgar_documents\ADBE\8-K_2023-03-15' --> 'data\processed_data\ADBE\8-K_2023-03-15.md'
Converted 'data\edgar_documents\ADBE\8-K_2023-04-24' --> 'data\processed_data\ADBE\8-K_2023-04-24.md'


2025-11-14 15:28:13,369 - INFO - Going to convert document batch...
2025-11-14 15:28:13,370 - INFO - Processing document 8-K_2023-06-15
2025-11-14 15:28:13,387 - INFO - Finished converting document 8-K_2023-06-15 in 0.05 sec.
2025-11-14 15:28:13,406 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:13,420 - INFO - Going to convert document batch...
2025-11-14 15:28:13,421 - INFO - Processing document 8-K_2023-09-14
2025-11-14 15:28:13,440 - INFO - Finished converting document 8-K_2023-09-14 in 0.05 sec.
2025-11-14 15:28:13,477 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:13,491 - INFO - Going to convert document batch...
2025-11-14 15:28:13,492 - INFO - Processing document 8-K_2023-10-26
2025-11-14 15:28:13,514 - INFO - Finished converting document 8-K_2023-10-26 in 0.06 sec.
2025-11-14 15:28:13,538 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:13,551 - INFO - Going to convert document batch...
2025-11-14 15:

Converted 'data\edgar_documents\ADBE\8-K_2023-06-15' --> 'data\processed_data\ADBE\8-K_2023-06-15.md'
Converted 'data\edgar_documents\ADBE\8-K_2023-09-14' --> 'data\processed_data\ADBE\8-K_2023-09-14.md'
Converted 'data\edgar_documents\ADBE\8-K_2023-10-26' --> 'data\processed_data\ADBE\8-K_2023-10-26.md'
Converted 'data\edgar_documents\ADBE\8-K_2023-12-13' --> 'data\processed_data\ADBE\8-K_2023-12-13.md'


2025-11-14 15:28:13,603 - INFO - Going to convert document batch...
2025-11-14 15:28:13,603 - INFO - Processing document 8-K_2023-12-18
2025-11-14 15:28:13,624 - INFO - Finished converting document 8-K_2023-12-18 in 0.05 sec.
2025-11-14 15:28:13,670 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:13,699 - INFO - Going to convert document batch...
2025-11-14 15:28:13,700 - INFO - Processing document 8-K_2024-01-26
2025-11-14 15:28:13,739 - INFO - Finished converting document 8-K_2024-01-26 in 0.09 sec.
2025-11-14 15:28:13,773 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:13,782 - INFO - Going to convert document batch...
2025-11-14 15:28:13,783 - INFO - Processing document 8-K_2024-03-14
2025-11-14 15:28:13,801 - INFO - Finished converting document 8-K_2024-03-14 in 0.03 sec.
2025-11-14 15:28:13,821 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:13,833 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\ADBE\8-K_2023-12-18' --> 'data\processed_data\ADBE\8-K_2023-12-18.md'
Converted 'data\edgar_documents\ADBE\8-K_2024-01-26' --> 'data\processed_data\ADBE\8-K_2024-01-26.md'
Converted 'data\edgar_documents\ADBE\8-K_2024-03-14' --> 'data\processed_data\ADBE\8-K_2024-03-14.md'


2025-11-14 15:28:13,834 - INFO - Processing document 8-K_2024-04-04
2025-11-14 15:28:13,857 - INFO - Finished converting document 8-K_2024-04-04 in 0.05 sec.
2025-11-14 15:28:13,883 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:13,904 - INFO - Going to convert document batch...
2025-11-14 15:28:13,905 - INFO - Processing document 8-K_2024-04-19
2025-11-14 15:28:13,947 - INFO - Finished converting document 8-K_2024-04-19 in 0.06 sec.
2025-11-14 15:28:13,982 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:13,993 - INFO - Going to convert document batch...
2025-11-14 15:28:13,994 - INFO - Processing document 8-K_2024-06-13
2025-11-14 15:28:14,011 - INFO - Finished converting document 8-K_2024-06-13 in 0.05 sec.
2025-11-14 15:28:14,030 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:14,038 - INFO - Going to convert document batch...
2025-11-14 15:28:14,039 - INFO - Processing document 8-K_2024-07-18
2025-11-14 15:

Converted 'data\edgar_documents\ADBE\8-K_2024-04-04' --> 'data\processed_data\ADBE\8-K_2024-04-04.md'
Converted 'data\edgar_documents\ADBE\8-K_2024-04-19' --> 'data\processed_data\ADBE\8-K_2024-04-19.md'
Converted 'data\edgar_documents\ADBE\8-K_2024-06-13' --> 'data\processed_data\ADBE\8-K_2024-06-13.md'
Converted 'data\edgar_documents\ADBE\8-K_2024-07-18' --> 'data\processed_data\ADBE\8-K_2024-07-18.md'


2025-11-14 15:28:14,073 - INFO - Going to convert document batch...
2025-11-14 15:28:14,074 - INFO - Processing document 8-K_2024-08-08
2025-11-14 15:28:14,087 - INFO - Finished converting document 8-K_2024-08-08 in 0.02 sec.
2025-11-14 15:28:14,110 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:14,125 - INFO - Going to convert document batch...
2025-11-14 15:28:14,126 - INFO - Processing document 8-K_2024-09-12
2025-11-14 15:28:14,141 - INFO - Finished converting document 8-K_2024-09-12 in 0.05 sec.
2025-11-14 15:28:14,163 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:14,172 - INFO - Going to convert document batch...
2025-11-14 15:28:14,173 - INFO - Processing document 8-K_2024-12-11
2025-11-14 15:28:14,189 - INFO - Finished converting document 8-K_2024-12-11 in 0.05 sec.
2025-11-14 15:28:14,212 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:14,224 - INFO - Going to convert document batch...
2025-11-14 15:

Converted 'data\edgar_documents\ADBE\8-K_2024-08-08' --> 'data\processed_data\ADBE\8-K_2024-08-08.md'
Converted 'data\edgar_documents\ADBE\8-K_2024-09-12' --> 'data\processed_data\ADBE\8-K_2024-09-12.md'
Converted 'data\edgar_documents\ADBE\8-K_2024-12-11' --> 'data\processed_data\ADBE\8-K_2024-12-11.md'
Converted 'data\edgar_documents\ADBE\8-K_2025-01-17' --> 'data\processed_data\ADBE\8-K_2025-01-17.md'


2025-11-14 15:28:14,295 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:14,317 - INFO - Going to convert document batch...
2025-11-14 15:28:14,318 - INFO - Processing document 8-K_2025-01-30
2025-11-14 15:28:14,353 - INFO - Finished converting document 8-K_2025-01-30 in 0.08 sec.
2025-11-14 15:28:14,407 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:14,423 - INFO - Going to convert document batch...
2025-11-14 15:28:14,424 - INFO - Processing document 8-K_2025-03-12
2025-11-14 15:28:14,439 - INFO - Finished converting document 8-K_2025-03-12 in 0.06 sec.
2025-11-14 15:28:14,478 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:14,504 - INFO - Going to convert document batch...
2025-11-14 15:28:14,506 - INFO - Processing document 8-K_2025-04-24
2025-11-14 15:28:14,548 - INFO - Finished converting document 8-K_2025-04-24 in 0.09 sec.


Converted 'data\edgar_documents\ADBE\8-K_2025-01-30' --> 'data\processed_data\ADBE\8-K_2025-01-30.md'
Converted 'data\edgar_documents\ADBE\8-K_2025-03-12' --> 'data\processed_data\ADBE\8-K_2025-03-12.md'


2025-11-14 15:28:14,602 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:14,622 - INFO - Going to convert document batch...
2025-11-14 15:28:14,622 - INFO - Processing document 8-K_2025-06-12
2025-11-14 15:28:14,642 - INFO - Finished converting document 8-K_2025-06-12 in 0.08 sec.
2025-11-14 15:28:14,661 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:14,671 - INFO - Going to convert document batch...
2025-11-14 15:28:14,672 - INFO - Processing document 8-K_2025-09-11
2025-11-14 15:28:14,688 - INFO - Finished converting document 8-K_2025-09-11 in 0.05 sec.
2025-11-14 15:28:14,728 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:28:14,730 - ERROR - Input document DEF-14A_2023-03-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF

Converted 'data\edgar_documents\ADBE\8-K_2025-04-24' --> 'data\processed_data\ADBE\8-K_2025-04-24.md'
Converted 'data\edgar_documents\ADBE\8-K_2025-06-12' --> 'data\processed_data\ADBE\8-K_2025-06-12.md'
Converted 'data\edgar_documents\ADBE\8-K_2025-09-11' --> 'data\processed_data\ADBE\8-K_2025-09-11.md'
Error processing data\edgar_documents\ADBE\DEF-14A_2023-03-03: File format not allowed: data\edgar_documents\ADBE\DEF-14A_2023-03-03


2025-11-14 15:28:15,359 - INFO - Going to convert document batch...
2025-11-14 15:28:15,360 - INFO - Processing document DEF-14A_2024-03-01
2025-11-14 15:28:16,656 - INFO - Finished converting document DEF-14A_2024-03-01 in 1.92 sec.
2025-11-14 15:28:17,506 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\ADBE\DEF-14A_2024-03-01' --> 'data\processed_data\ADBE\DEF-14A_2024-03-01.md'


2025-11-14 15:28:18,158 - INFO - Going to convert document batch...
2025-11-14 15:28:18,158 - INFO - Processing document DEF-14A_2025-02-28
2025-11-14 15:28:19,622 - INFO - Finished converting document DEF-14A_2025-02-28 in 2.16 sec.


Converted 'data\edgar_documents\ADBE\DEF-14A_2025-02-28' --> 'data\processed_data\ADBE\DEF-14A_2025-02-28.md'
Processed 121 new files. Errors: 6
Found 164 files to process in data\edgar_documents\AIG


2025-11-14 15:28:20,911 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:25,018 - INFO - Going to convert document batch...
2025-11-14 15:28:25,019 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:28:25,020 - INFO - Processing document 10-K_2023-02-17
2025-11-14 15:28:43,429 - INFO - Finished converting document 10-K_2023-02-17 in 22.84 sec.


Converted 'data\edgar_documents\AIG\10-K_2023-02-17' --> 'data\processed_data\AIG\10-K_2023-02-17.md'


2025-11-14 15:28:47,103 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:28:52,206 - INFO - Going to convert document batch...
2025-11-14 15:28:52,207 - INFO - Processing document 10-K_2024-02-14
2025-11-14 15:29:15,849 - INFO - Finished converting document 10-K_2024-02-14 in 29.14 sec.


Converted 'data\edgar_documents\AIG\10-K_2024-02-14' --> 'data\processed_data\AIG\10-K_2024-02-14.md'


2025-11-14 15:29:20,075 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:29:24,547 - INFO - Going to convert document batch...
2025-11-14 15:29:24,548 - INFO - Processing document 10-K_2025-02-13
2025-11-14 15:29:38,823 - INFO - Finished converting document 10-K_2025-02-13 in 19.08 sec.


Converted 'data\edgar_documents\AIG\10-K_2025-02-13' --> 'data\processed_data\AIG\10-K_2025-02-13.md'


2025-11-14 15:29:42,184 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:29:45,910 - INFO - Going to convert document batch...
2025-11-14 15:29:45,911 - INFO - Processing document 10-Q_2023-05-05
2025-11-14 15:29:53,882 - INFO - Finished converting document 10-Q_2023-05-05 in 11.97 sec.


Converted 'data\edgar_documents\AIG\10-Q_2023-05-05' --> 'data\processed_data\AIG\10-Q_2023-05-05.md'


2025-11-14 15:29:57,947 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:30:09,326 - INFO - Going to convert document batch...
2025-11-14 15:30:09,327 - INFO - Processing document 10-Q_2023-08-02
2025-11-14 15:30:31,894 - INFO - Finished converting document 10-Q_2023-08-02 in 34.20 sec.


Converted 'data\edgar_documents\AIG\10-Q_2023-08-02' --> 'data\processed_data\AIG\10-Q_2023-08-02.md'


2025-11-14 15:30:36,202 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:30:39,624 - INFO - Going to convert document batch...
2025-11-14 15:30:39,625 - INFO - Processing document 10-Q_2023-11-02
2025-11-14 15:30:49,531 - INFO - Finished converting document 10-Q_2023-11-02 in 13.62 sec.
2025-11-14 15:30:52,449 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\10-Q_2023-11-02' --> 'data\processed_data\AIG\10-Q_2023-11-02.md'


2025-11-14 15:30:55,901 - INFO - Going to convert document batch...
2025-11-14 15:30:55,902 - INFO - Processing document 10-Q_2024-05-02
2025-11-14 15:31:01,337 - INFO - Finished converting document 10-Q_2024-05-02 in 9.05 sec.
2025-11-14 15:31:03,541 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\10-Q_2024-05-02' --> 'data\processed_data\AIG\10-Q_2024-05-02.md'


2025-11-14 15:31:06,700 - INFO - Going to convert document batch...
2025-11-14 15:31:06,700 - INFO - Processing document 10-Q_2024-08-01
2025-11-14 15:31:12,993 - INFO - Finished converting document 10-Q_2024-08-01 in 9.61 sec.
2025-11-14 15:31:15,200 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\10-Q_2024-08-01' --> 'data\processed_data\AIG\10-Q_2024-08-01.md'


2025-11-14 15:31:18,053 - INFO - Going to convert document batch...
2025-11-14 15:31:18,054 - INFO - Processing document 10-Q_2024-11-07
2025-11-14 15:31:23,308 - INFO - Finished converting document 10-Q_2024-11-07 in 8.27 sec.
2025-11-14 15:31:25,403 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\10-Q_2024-11-07' --> 'data\processed_data\AIG\10-Q_2024-11-07.md'


2025-11-14 15:31:27,665 - INFO - Going to convert document batch...
2025-11-14 15:31:27,666 - INFO - Processing document 10-Q_2025-05-02
2025-11-14 15:31:31,646 - INFO - Finished converting document 10-Q_2025-05-02 in 6.44 sec.
2025-11-14 15:31:33,264 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\10-Q_2025-05-02' --> 'data\processed_data\AIG\10-Q_2025-05-02.md'


2025-11-14 15:31:36,023 - INFO - Going to convert document batch...
2025-11-14 15:31:36,025 - INFO - Processing document 10-Q_2025-08-07
2025-11-14 15:31:41,229 - INFO - Finished converting document 10-Q_2025-08-07 in 8.12 sec.
2025-11-14 15:31:43,478 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:31:43,479 - ERROR - Input document 10-Q_2025-11-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:31:43,484 - INFO - Going to convert d

Converted 'data\edgar_documents\AIG\10-Q_2025-08-07' --> 'data\processed_data\AIG\10-Q_2025-08-07.md'
Error processing data\edgar_documents\AIG\10-Q_2025-11-05: File format not allowed: data\edgar_documents\AIG\10-Q_2025-11-05


2025-11-14 15:31:43,534 - INFO - Finished converting document 4_2023-01-03 in 0.05 sec.
2025-11-14 15:31:43,603 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:43,613 - INFO - Going to convert document batch...
2025-11-14 15:31:43,614 - INFO - Processing document 4_2023-01-05
2025-11-14 15:31:43,641 - INFO - Finished converting document 4_2023-01-05 in 0.06 sec.
2025-11-14 15:31:43,684 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:43,693 - INFO - Going to convert document batch...
2025-11-14 15:31:43,694 - INFO - Processing document 4_2023-01-18
2025-11-14 15:31:43,717 - INFO - Finished converting document 4_2023-01-18 in 0.05 sec.
2025-11-14 15:31:43,782 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\4_2023-01-03' --> 'data\processed_data\AIG\4_2023-01-03.md'
Converted 'data\edgar_documents\AIG\4_2023-01-05' --> 'data\processed_data\AIG\4_2023-01-05.md'
Converted 'data\edgar_documents\AIG\4_2023-01-18' --> 'data\processed_data\AIG\4_2023-01-18.md'


2025-11-14 15:31:43,797 - INFO - Going to convert document batch...
2025-11-14 15:31:43,797 - INFO - Processing document 4_2023-02-14
2025-11-14 15:31:43,830 - INFO - Finished converting document 4_2023-02-14 in 0.09 sec.
2025-11-14 15:31:43,872 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:43,884 - INFO - Going to convert document batch...
2025-11-14 15:31:43,886 - INFO - Processing document 4_2023-02-16
2025-11-14 15:31:43,911 - INFO - Finished converting document 4_2023-02-16 in 0.05 sec.
2025-11-14 15:31:43,953 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:43,967 - INFO - Going to convert document batch...
2025-11-14 15:31:43,967 - INFO - Processing document 4_2023-02-23
2025-11-14 15:31:43,990 - INFO - Finished converting document 4_2023-02-23 in 0.05 sec.
2025-11-14 15:31:44,024 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:44,032 - INFO - Going to convert document batch...
2025-11-14 15:31:44,033 - 

Converted 'data\edgar_documents\AIG\4_2023-02-14' --> 'data\processed_data\AIG\4_2023-02-14.md'
Converted 'data\edgar_documents\AIG\4_2023-02-16' --> 'data\processed_data\AIG\4_2023-02-16.md'
Converted 'data\edgar_documents\AIG\4_2023-02-23' --> 'data\processed_data\AIG\4_2023-02-23.md'


2025-11-14 15:31:44,054 - INFO - Finished converting document 4_2023-03-02 in 0.03 sec.
2025-11-14 15:31:44,098 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:44,109 - INFO - Going to convert document batch...
2025-11-14 15:31:44,110 - INFO - Processing document 4_2023-03-17
2025-11-14 15:31:44,133 - INFO - Finished converting document 4_2023-03-17 in 0.05 sec.
2025-11-14 15:31:44,209 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:31:44,209 - ERROR - Input document 4_2023-03-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'js

Converted 'data\edgar_documents\AIG\4_2023-03-02' --> 'data\processed_data\AIG\4_2023-03-02.md'
Converted 'data\edgar_documents\AIG\4_2023-03-17' --> 'data\processed_data\AIG\4_2023-03-17.md'
Error processing data\edgar_documents\AIG\4_2023-03-23: File format not allowed: data\edgar_documents\AIG\4_2023-03-23
Error processing data\edgar_documents\AIG\4_2023-03-24: File format not allowed: data\edgar_documents\AIG\4_2023-03-24


2025-11-14 15:31:44,267 - INFO - Processing document 4_2023-04-04
2025-11-14 15:31:44,295 - INFO - Finished converting document 4_2023-04-04 in 0.06 sec.
2025-11-14 15:31:44,354 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:44,364 - INFO - Going to convert document batch...
2025-11-14 15:31:44,365 - INFO - Processing document 4_2023-04-05
2025-11-14 15:31:44,390 - INFO - Finished converting document 4_2023-04-05 in 0.06 sec.
2025-11-14 15:31:44,442 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:44,451 - INFO - Going to convert document batch...
2025-11-14 15:31:44,452 - INFO - Processing document 4_2023-04-18
2025-11-14 15:31:44,474 - INFO - Finished converting document 4_2023-04-18 in 0.05 sec.


Converted 'data\edgar_documents\AIG\4_2023-04-04' --> 'data\processed_data\AIG\4_2023-04-04.md'
Converted 'data\edgar_documents\AIG\4_2023-04-05' --> 'data\processed_data\AIG\4_2023-04-05.md'
Converted 'data\edgar_documents\AIG\4_2023-04-18' --> 'data\processed_data\AIG\4_2023-04-18.md'


2025-11-14 15:31:44,549 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:44,560 - INFO - Going to convert document batch...
2025-11-14 15:31:44,561 - INFO - Processing document 4_2023-05-12
2025-11-14 15:31:44,587 - INFO - Finished converting document 4_2023-05-12 in 0.08 sec.
2025-11-14 15:31:44,644 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:44,653 - INFO - Going to convert document batch...
2025-11-14 15:31:44,654 - INFO - Processing document 4_2023-06-12
2025-11-14 15:31:44,674 - INFO - Finished converting document 4_2023-06-12 in 0.06 sec.
2025-11-14 15:31:44,724 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:44,739 - INFO - Going to convert document batch...
2025-11-14 15:31:44,740 - INFO - Processing document 4_2023-06-16
2025-11-14 15:31:44,775 - INFO - Finished converting document 4_2023-06-16 in 0.06 sec.


Converted 'data\edgar_documents\AIG\4_2023-05-12' --> 'data\processed_data\AIG\4_2023-05-12.md'
Converted 'data\edgar_documents\AIG\4_2023-06-12' --> 'data\processed_data\AIG\4_2023-06-12.md'


2025-11-14 15:31:44,835 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:44,845 - INFO - Going to convert document batch...
2025-11-14 15:31:44,846 - INFO - Processing document 4_2023-06-21
2025-11-14 15:31:44,869 - INFO - Finished converting document 4_2023-06-21 in 0.05 sec.
2025-11-14 15:31:44,936 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:44,945 - INFO - Going to convert document batch...
2025-11-14 15:31:44,945 - INFO - Processing document 4_2023-06-23
2025-11-14 15:31:44,965 - INFO - Finished converting document 4_2023-06-23 in 0.08 sec.
2025-11-14 15:31:45,017 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\4_2023-06-16' --> 'data\processed_data\AIG\4_2023-06-16.md'
Converted 'data\edgar_documents\AIG\4_2023-06-21' --> 'data\processed_data\AIG\4_2023-06-21.md'
Converted 'data\edgar_documents\AIG\4_2023-06-23' --> 'data\processed_data\AIG\4_2023-06-23.md'


2025-11-14 15:31:45,025 - INFO - Going to convert document batch...
2025-11-14 15:31:45,026 - INFO - Processing document 4_2023-07-05
2025-11-14 15:31:45,051 - INFO - Finished converting document 4_2023-07-05 in 0.06 sec.
2025-11-14 15:31:45,102 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:45,112 - INFO - Going to convert document batch...
2025-11-14 15:31:45,112 - INFO - Processing document 4_2023-07-06
2025-11-14 15:31:45,136 - INFO - Finished converting document 4_2023-07-06 in 0.06 sec.
2025-11-14 15:31:45,186 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:45,216 - INFO - Going to convert document batch...
2025-11-14 15:31:45,217 - INFO - Processing document 4_2023-07-26


Converted 'data\edgar_documents\AIG\4_2023-07-05' --> 'data\processed_data\AIG\4_2023-07-05.md'
Converted 'data\edgar_documents\AIG\4_2023-07-06' --> 'data\processed_data\AIG\4_2023-07-06.md'


2025-11-14 15:31:45,296 - INFO - Finished converting document 4_2023-07-26 in 0.12 sec.
2025-11-14 15:31:45,386 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:45,400 - INFO - Going to convert document batch...
2025-11-14 15:31:45,401 - INFO - Processing document 4_2023-08-07
2025-11-14 15:31:45,440 - INFO - Finished converting document 4_2023-08-07 in 0.08 sec.
2025-11-14 15:31:45,495 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:45,504 - INFO - Going to convert document batch...
2025-11-14 15:31:45,505 - INFO - Processing document 4_2023-08-11
2025-11-14 15:31:45,524 - INFO - Finished converting document 4_2023-08-11 in 0.05 sec.
2025-11-14 15:31:45,571 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\4_2023-07-26' --> 'data\processed_data\AIG\4_2023-07-26.md'
Converted 'data\edgar_documents\AIG\4_2023-08-07' --> 'data\processed_data\AIG\4_2023-08-07.md'
Converted 'data\edgar_documents\AIG\4_2023-08-11' --> 'data\processed_data\AIG\4_2023-08-11.md'


2025-11-14 15:31:45,580 - INFO - Going to convert document batch...
2025-11-14 15:31:45,581 - INFO - Processing document 4_2023-10-03
2025-11-14 15:31:45,605 - INFO - Finished converting document 4_2023-10-03 in 0.06 sec.
2025-11-14 15:31:45,655 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:45,670 - INFO - Going to convert document batch...
2025-11-14 15:31:45,670 - INFO - Processing document 4_2023-10-17
2025-11-14 15:31:45,706 - INFO - Finished converting document 4_2023-10-17 in 0.08 sec.
2025-11-14 15:31:45,763 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:45,776 - INFO - Going to convert document batch...
2025-11-14 15:31:45,776 - INFO - Processing document 4_2023-10-18
2025-11-14 15:31:45,807 - INFO - Finished converting document 4_2023-10-18 in 0.06 sec.


Converted 'data\edgar_documents\AIG\4_2023-10-03' --> 'data\processed_data\AIG\4_2023-10-03.md'
Converted 'data\edgar_documents\AIG\4_2023-10-17' --> 'data\processed_data\AIG\4_2023-10-17.md'


2025-11-14 15:31:45,847 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:45,859 - INFO - Going to convert document batch...
2025-11-14 15:31:45,860 - INFO - Processing document 4_2023-11-13
2025-11-14 15:31:45,883 - INFO - Finished converting document 4_2023-11-13 in 0.05 sec.
2025-11-14 15:31:45,922 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:45,933 - INFO - Going to convert document batch...
2025-11-14 15:31:45,934 - INFO - Processing document 4_2023-12-05
2025-11-14 15:31:45,961 - INFO - Finished converting document 4_2023-12-05 in 0.05 sec.
2025-11-14 15:31:46,005 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:46,018 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AIG\4_2023-10-18' --> 'data\processed_data\AIG\4_2023-10-18.md'
Converted 'data\edgar_documents\AIG\4_2023-11-13' --> 'data\processed_data\AIG\4_2023-11-13.md'
Converted 'data\edgar_documents\AIG\4_2023-12-05' --> 'data\processed_data\AIG\4_2023-12-05.md'


2025-11-14 15:31:46,019 - INFO - Processing document 4_2023-12-12
2025-11-14 15:31:46,048 - INFO - Finished converting document 4_2023-12-12 in 0.06 sec.
2025-11-14 15:31:46,091 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:46,101 - INFO - Going to convert document batch...
2025-11-14 15:31:46,101 - INFO - Processing document 4_2023-12-18
2025-11-14 15:31:46,131 - INFO - Finished converting document 4_2023-12-18 in 0.05 sec.
2025-11-14 15:31:46,169 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\4_2023-12-12' --> 'data\processed_data\AIG\4_2023-12-12.md'
Converted 'data\edgar_documents\AIG\4_2023-12-18' --> 'data\processed_data\AIG\4_2023-12-18.md'


2025-11-14 15:31:46,902 - INFO - Going to convert document batch...
2025-11-14 15:31:46,904 - INFO - Processing document 4_2023-12-19
2025-11-14 15:31:46,927 - INFO - Finished converting document 4_2023-12-19 in 0.77 sec.
2025-11-14 15:31:46,963 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:46,980 - INFO - Going to convert document batch...
2025-11-14 15:31:46,981 - INFO - Processing document 4_2023-12-21
2025-11-14 15:31:47,022 - INFO - Finished converting document 4_2023-12-21 in 0.06 sec.
2025-11-14 15:31:47,069 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:47,081 - INFO - Going to convert document batch...
2025-11-14 15:31:47,082 - INFO - Processing document 4_2024-01-02
2025-11-14 15:31:47,111 - INFO - Finished converting document 4_2024-01-02 in 0.05 sec.


Converted 'data\edgar_documents\AIG\4_2023-12-19' --> 'data\processed_data\AIG\4_2023-12-19.md'
Converted 'data\edgar_documents\AIG\4_2023-12-21' --> 'data\processed_data\AIG\4_2023-12-21.md'
Converted 'data\edgar_documents\AIG\4_2024-01-02' --> 'data\processed_data\AIG\4_2024-01-02.md'


2025-11-14 15:31:47,151 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:47,163 - INFO - Going to convert document batch...
2025-11-14 15:31:47,164 - INFO - Processing document 4_2024-01-03
2025-11-14 15:31:47,190 - INFO - Finished converting document 4_2024-01-03 in 0.05 sec.
2025-11-14 15:31:47,228 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:47,238 - INFO - Going to convert document batch...
2025-11-14 15:31:47,239 - INFO - Processing document 4_2024-01-04
2025-11-14 15:31:47,263 - INFO - Finished converting document 4_2024-01-04 in 0.05 sec.
2025-11-14 15:31:47,316 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:47,326 - INFO - Going to convert document batch...
2025-11-14 15:31:47,327 - INFO - Processing document 4_2024-01-17
2025-11-14 15:31:47,348 - INFO - Finished converting document 4_2024-01-17 in 0.06 sec.
2025-11-14 15:31:47,399 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\AIG\4_2024-01-03' --> 'data\processed_data\AIG\4_2024-01-03.md'
Converted 'data\edgar_documents\AIG\4_2024-01-04' --> 'data\processed_data\AIG\4_2024-01-04.md'
Converted 'data\edgar_documents\AIG\4_2024-01-17' --> 'data\processed_data\AIG\4_2024-01-17.md'


2025-11-14 15:31:47,419 - INFO - Processing document 4_2024-02-08
2025-11-14 15:31:47,469 - INFO - Finished converting document 4_2024-02-08 in 0.09 sec.
2025-11-14 15:31:47,523 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:47,534 - INFO - Going to convert document batch...
2025-11-14 15:31:47,535 - INFO - Processing document 4_2024-02-22
2025-11-14 15:31:47,562 - INFO - Finished converting document 4_2024-02-22 in 0.06 sec.
2025-11-14 15:31:47,597 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:47,607 - INFO - Going to convert document batch...
2025-11-14 15:31:47,607 - INFO - Processing document 4_2024-02-27
2025-11-14 15:31:47,626 - INFO - Finished converting document 4_2024-02-27 in 0.05 sec.
2025-11-14 15:31:47,659 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:47,666 - INFO - Going to convert document batch...
2025-11-14 15:31:47,667 - INFO - Processing document 4_2024-02-29
2025-11-14 15:31:47,686 - IN

Converted 'data\edgar_documents\AIG\4_2024-02-08' --> 'data\processed_data\AIG\4_2024-02-08.md'
Converted 'data\edgar_documents\AIG\4_2024-02-22' --> 'data\processed_data\AIG\4_2024-02-22.md'
Converted 'data\edgar_documents\AIG\4_2024-02-27' --> 'data\processed_data\AIG\4_2024-02-27.md'


2025-11-14 15:31:47,725 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:47,741 - INFO - Going to convert document batch...
2025-11-14 15:31:47,742 - INFO - Processing document 4_2024-03-05
2025-11-14 15:31:47,773 - INFO - Finished converting document 4_2024-03-05 in 0.06 sec.
2025-11-14 15:31:47,810 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:47,818 - INFO - Going to convert document batch...
2025-11-14 15:31:47,819 - INFO - Processing document 4_2024-03-18
2025-11-14 15:31:47,840 - INFO - Finished converting document 4_2024-03-18 in 0.05 sec.


Converted 'data\edgar_documents\AIG\4_2024-02-29' --> 'data\processed_data\AIG\4_2024-02-29.md'
Converted 'data\edgar_documents\AIG\4_2024-03-05' --> 'data\processed_data\AIG\4_2024-03-05.md'
Converted 'data\edgar_documents\AIG\4_2024-03-18' --> 'data\processed_data\AIG\4_2024-03-18.md'


2025-11-14 15:31:47,914 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:47,923 - INFO - Going to convert document batch...
2025-11-14 15:31:47,924 - INFO - Processing document 4_2024-03-29
2025-11-14 15:31:47,945 - INFO - Finished converting document 4_2024-03-29 in 0.08 sec.
2025-11-14 15:31:47,994 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:48,009 - INFO - Going to convert document batch...
2025-11-14 15:31:48,010 - INFO - Processing document 4_2024-04-03
2025-11-14 15:31:48,030 - INFO - Finished converting document 4_2024-04-03 in 0.06 sec.
2025-11-14 15:31:48,065 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:48,072 - INFO - Going to convert document batch...
2025-11-14 15:31:48,073 - INFO - Processing document 4_2024-05-17
2025-11-14 15:31:48,092 - INFO - Finished converting document 4_2024-05-17 in 0.05 sec.
2025-11-14 15:31:48,130 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\AIG\4_2024-03-29' --> 'data\processed_data\AIG\4_2024-03-29.md'
Converted 'data\edgar_documents\AIG\4_2024-04-03' --> 'data\processed_data\AIG\4_2024-04-03.md'
Converted 'data\edgar_documents\AIG\4_2024-05-17' --> 'data\processed_data\AIG\4_2024-05-17.md'


2025-11-14 15:31:48,215 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:48,226 - INFO - Going to convert document batch...
2025-11-14 15:31:48,227 - INFO - Processing document 4_2024-06-11
2025-11-14 15:31:48,255 - INFO - Finished converting document 4_2024-06-11 in 0.08 sec.
2025-11-14 15:31:48,288 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:48,299 - INFO - Going to convert document batch...
2025-11-14 15:31:48,300 - INFO - Processing document 4_2024-06-14
2025-11-14 15:31:48,322 - INFO - Finished converting document 4_2024-06-14 in 0.03 sec.
2025-11-14 15:31:48,355 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\4_2024-06-03' --> 'data\processed_data\AIG\4_2024-06-03.md'
Converted 'data\edgar_documents\AIG\4_2024-06-11' --> 'data\processed_data\AIG\4_2024-06-11.md'
Converted 'data\edgar_documents\AIG\4_2024-06-14' --> 'data\processed_data\AIG\4_2024-06-14.md'


2025-11-14 15:31:48,363 - INFO - Going to convert document batch...
2025-11-14 15:31:48,364 - INFO - Processing document 4_2024-06-18
2025-11-14 15:31:48,385 - INFO - Finished converting document 4_2024-06-18 in 0.03 sec.
2025-11-14 15:31:48,423 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:48,432 - INFO - Going to convert document batch...
2025-11-14 15:31:48,433 - INFO - Processing document 4_2024-06-21
2025-11-14 15:31:48,455 - INFO - Finished converting document 4_2024-06-21 in 0.05 sec.
2025-11-14 15:31:48,497 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:48,506 - INFO - Going to convert document batch...
2025-11-14 15:31:48,507 - INFO - Processing document 4_2024-07-01
2025-11-14 15:31:48,528 - INFO - Finished converting document 4_2024-07-01 in 0.06 sec.
2025-11-14 15:31:48,573 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:48,583 - INFO - Going to convert document batch...
2025-11-14 15:31:48,584 - 

Converted 'data\edgar_documents\AIG\4_2024-06-18' --> 'data\processed_data\AIG\4_2024-06-18.md'
Converted 'data\edgar_documents\AIG\4_2024-06-21' --> 'data\processed_data\AIG\4_2024-06-21.md'
Converted 'data\edgar_documents\AIG\4_2024-07-01' --> 'data\processed_data\AIG\4_2024-07-01.md'


2025-11-14 15:31:48,606 - INFO - Finished converting document 4_2024-07-02 in 0.06 sec.
2025-11-14 15:31:48,646 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:48,656 - INFO - Going to convert document batch...
2025-11-14 15:31:48,657 - INFO - Processing document 4_2024-07-30
2025-11-14 15:31:48,681 - INFO - Finished converting document 4_2024-07-30 in 0.05 sec.
2025-11-14 15:31:48,717 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:48,726 - INFO - Going to convert document batch...
2025-11-14 15:31:48,727 - INFO - Processing document 4_2024-08-07
2025-11-14 15:31:48,748 - INFO - Finished converting document 4_2024-08-07 in 0.05 sec.
2025-11-14 15:31:48,791 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:48,802 - INFO - Going to convert document batch...
2025-11-14 15:31:48,802 - INFO - Processing document 4_2024-08-19


Converted 'data\edgar_documents\AIG\4_2024-07-02' --> 'data\processed_data\AIG\4_2024-07-02.md'
Converted 'data\edgar_documents\AIG\4_2024-07-30' --> 'data\processed_data\AIG\4_2024-07-30.md'
Converted 'data\edgar_documents\AIG\4_2024-08-07' --> 'data\processed_data\AIG\4_2024-08-07.md'


2025-11-14 15:31:48,824 - INFO - Finished converting document 4_2024-08-19 in 0.06 sec.
2025-11-14 15:31:48,866 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:48,874 - INFO - Going to convert document batch...
2025-11-14 15:31:48,874 - INFO - Processing document 4_2024-09-18
2025-11-14 15:31:48,894 - INFO - Finished converting document 4_2024-09-18 in 0.03 sec.
2025-11-14 15:31:48,926 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:48,934 - INFO - Going to convert document batch...
2025-11-14 15:31:48,936 - INFO - Processing document 4_2024-10-02
2025-11-14 15:31:48,957 - INFO - Finished converting document 4_2024-10-02 in 0.05 sec.
2025-11-14 15:31:48,990 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:49,000 - INFO - Going to convert document batch...
2025-11-14 15:31:49,001 - INFO - Processing document 4_2024-10-18
2025-11-14 15:31:49,023 - INFO - Finished converting document 4_2024-10-18 in 0.03 sec.


Converted 'data\edgar_documents\AIG\4_2024-08-19' --> 'data\processed_data\AIG\4_2024-08-19.md'
Converted 'data\edgar_documents\AIG\4_2024-09-18' --> 'data\processed_data\AIG\4_2024-09-18.md'
Converted 'data\edgar_documents\AIG\4_2024-10-02' --> 'data\processed_data\AIG\4_2024-10-02.md'


2025-11-14 15:31:49,058 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:49,067 - INFO - Going to convert document batch...
2025-11-14 15:31:49,067 - INFO - Processing document 4_2024-11-07
2025-11-14 15:31:49,086 - INFO - Finished converting document 4_2024-11-07 in 0.03 sec.
2025-11-14 15:31:49,120 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:49,128 - INFO - Going to convert document batch...
2025-11-14 15:31:49,128 - INFO - Processing document 4_2024-11-12
2025-11-14 15:31:49,146 - INFO - Finished converting document 4_2024-11-12 in 0.03 sec.
2025-11-14 15:31:49,187 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:31:49,187 - ERROR - Input document 4_2024-11-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <Inp

Converted 'data\edgar_documents\AIG\4_2024-10-18' --> 'data\processed_data\AIG\4_2024-10-18.md'
Converted 'data\edgar_documents\AIG\4_2024-11-07' --> 'data\processed_data\AIG\4_2024-11-07.md'
Converted 'data\edgar_documents\AIG\4_2024-11-12' --> 'data\processed_data\AIG\4_2024-11-12.md'
Error processing data\edgar_documents\AIG\4_2024-11-14: File format not allowed: data\edgar_documents\AIG\4_2024-11-14
Error processing data\edgar_documents\AIG\4_2024-11-20: File format not allowed: data\edgar_documents\AIG\4_2024-11-20


2025-11-14 15:31:49,233 - INFO - Processing document 4_2024-11-26
2025-11-14 15:31:49,250 - INFO - Finished converting document 4_2024-11-26 in 0.03 sec.
2025-11-14 15:31:49,299 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:49,308 - INFO - Going to convert document batch...
2025-11-14 15:31:49,308 - INFO - Processing document 4_2024-12-03
2025-11-14 15:31:49,328 - INFO - Finished converting document 4_2024-12-03 in 0.06 sec.
2025-11-14 15:31:49,376 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:49,386 - INFO - Going to convert document batch...
2025-11-14 15:31:49,386 - INFO - Processing document 4_2024-12-10
2025-11-14 15:31:49,405 - INFO - Finished converting document 4_2024-12-10 in 0.06 sec.
2025-11-14 15:31:49,448 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\4_2024-11-26' --> 'data\processed_data\AIG\4_2024-11-26.md'
Converted 'data\edgar_documents\AIG\4_2024-12-03' --> 'data\processed_data\AIG\4_2024-12-03.md'
Converted 'data\edgar_documents\AIG\4_2024-12-10' --> 'data\processed_data\AIG\4_2024-12-10.md'


2025-11-14 15:31:49,456 - INFO - Going to convert document batch...
2025-11-14 15:31:49,457 - INFO - Processing document 4_2024-12-11
2025-11-14 15:31:49,478 - INFO - Finished converting document 4_2024-12-11 in 0.03 sec.
2025-11-14 15:31:49,522 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:49,532 - INFO - Going to convert document batch...
2025-11-14 15:31:49,533 - INFO - Processing document 4_2024-12-17
2025-11-14 15:31:49,563 - INFO - Finished converting document 4_2024-12-17 in 0.06 sec.
2025-11-14 15:31:49,602 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:49,610 - INFO - Going to convert document batch...
2025-11-14 15:31:49,610 - INFO - Processing document 4_2025-01-02
2025-11-14 15:31:49,630 - INFO - Finished converting document 4_2025-01-02 in 0.05 sec.
2025-11-14 15:31:49,673 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:49,680 - INFO - Going to convert document batch...
2025-11-14 15:31:49,681 - 

Converted 'data\edgar_documents\AIG\4_2024-12-11' --> 'data\processed_data\AIG\4_2024-12-11.md'
Converted 'data\edgar_documents\AIG\4_2024-12-17' --> 'data\processed_data\AIG\4_2024-12-17.md'
Converted 'data\edgar_documents\AIG\4_2025-01-02' --> 'data\processed_data\AIG\4_2025-01-02.md'


2025-11-14 15:31:49,703 - INFO - Finished converting document 4_2025-01-03 in 0.05 sec.
2025-11-14 15:31:49,748 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:49,756 - INFO - Going to convert document batch...
2025-11-14 15:31:49,756 - INFO - Processing document 4_2025-02-18
2025-11-14 15:31:49,773 - INFO - Finished converting document 4_2025-02-18 in 0.05 sec.
2025-11-14 15:31:49,822 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:49,830 - INFO - Going to convert document batch...
2025-11-14 15:31:49,830 - INFO - Processing document 4_2025-02-20
2025-11-14 15:31:49,851 - INFO - Finished converting document 4_2025-02-20 in 0.05 sec.
2025-11-14 15:31:49,895 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:49,906 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AIG\4_2025-01-03' --> 'data\processed_data\AIG\4_2025-01-03.md'
Converted 'data\edgar_documents\AIG\4_2025-02-18' --> 'data\processed_data\AIG\4_2025-02-18.md'
Converted 'data\edgar_documents\AIG\4_2025-02-20' --> 'data\processed_data\AIG\4_2025-02-20.md'


2025-11-14 15:31:49,906 - INFO - Processing document 4_2025-02-21
2025-11-14 15:31:49,926 - INFO - Finished converting document 4_2025-02-21 in 0.05 sec.
2025-11-14 15:31:49,972 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:49,982 - INFO - Going to convert document batch...
2025-11-14 15:31:49,982 - INFO - Processing document 4_2025-02-25
2025-11-14 15:31:50,008 - INFO - Finished converting document 4_2025-02-25 in 0.06 sec.
2025-11-14 15:31:50,057 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:50,066 - INFO - Going to convert document batch...
2025-11-14 15:31:50,067 - INFO - Processing document 4_2025-03-05
2025-11-14 15:31:50,091 - INFO - Finished converting document 4_2025-03-05 in 0.06 sec.
2025-11-14 15:31:50,140 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\4_2025-02-21' --> 'data\processed_data\AIG\4_2025-02-21.md'
Converted 'data\edgar_documents\AIG\4_2025-02-25' --> 'data\processed_data\AIG\4_2025-02-25.md'
Converted 'data\edgar_documents\AIG\4_2025-03-05' --> 'data\processed_data\AIG\4_2025-03-05.md'


2025-11-14 15:31:50,149 - INFO - Going to convert document batch...
2025-11-14 15:31:50,150 - INFO - Processing document 4_2025-04-02
2025-11-14 15:31:50,175 - INFO - Finished converting document 4_2025-04-02 in 0.06 sec.
2025-11-14 15:31:50,225 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:31:50,226 - ERROR - Input document 4_2025-05-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:31:50,227 - INFO - Going to convert document batch...
2025-11-14 15:31:50,240 - IN

Converted 'data\edgar_documents\AIG\4_2025-04-02' --> 'data\processed_data\AIG\4_2025-04-02.md'
Error processing data\edgar_documents\AIG\4_2025-05-05: File format not allowed: data\edgar_documents\AIG\4_2025-05-05
Converted 'data\edgar_documents\AIG\4_2025-05-06' --> 'data\processed_data\AIG\4_2025-05-06.md'
Converted 'data\edgar_documents\AIG\4_2025-05-14' --> 'data\processed_data\AIG\4_2025-05-14.md'


2025-11-14 15:31:50,389 - INFO - Processing document 4_2025-05-15
2025-11-14 15:31:50,408 - INFO - Finished converting document 4_2025-05-15 in 0.05 sec.
2025-11-14 15:31:50,451 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:50,463 - INFO - Going to convert document batch...
2025-11-14 15:31:50,464 - INFO - Processing document 4_2025-05-20
2025-11-14 15:31:50,489 - INFO - Finished converting document 4_2025-05-20 in 0.06 sec.
2025-11-14 15:31:50,536 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:50,550 - INFO - Going to convert document batch...
2025-11-14 15:31:50,551 - INFO - Processing document 4_2025-05-22
2025-11-14 15:31:50,577 - INFO - Finished converting document 4_2025-05-22 in 0.06 sec.


Converted 'data\edgar_documents\AIG\4_2025-05-15' --> 'data\processed_data\AIG\4_2025-05-15.md'
Converted 'data\edgar_documents\AIG\4_2025-05-20' --> 'data\processed_data\AIG\4_2025-05-20.md'
Converted 'data\edgar_documents\AIG\4_2025-05-22' --> 'data\processed_data\AIG\4_2025-05-22.md'


2025-11-14 15:31:50,628 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:50,639 - INFO - Going to convert document batch...
2025-11-14 15:31:50,641 - INFO - Processing document 4_2025-06-04
2025-11-14 15:31:50,659 - INFO - Finished converting document 4_2025-06-04 in 0.06 sec.
2025-11-14 15:31:50,694 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:50,702 - INFO - Going to convert document batch...
2025-11-14 15:31:50,703 - INFO - Processing document 4_2025-06-17
2025-11-14 15:31:50,725 - INFO - Finished converting document 4_2025-06-17 in 0.05 sec.
2025-11-14 15:31:50,768 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:50,778 - INFO - Going to convert document batch...
2025-11-14 15:31:50,779 - INFO - Processing document 4_2025-06-30
2025-11-14 15:31:50,798 - INFO - Finished converting document 4_2025-06-30 in 0.05 sec.
2025-11-14 15:31:50,847 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\AIG\4_2025-06-04' --> 'data\processed_data\AIG\4_2025-06-04.md'
Converted 'data\edgar_documents\AIG\4_2025-06-17' --> 'data\processed_data\AIG\4_2025-06-17.md'
Converted 'data\edgar_documents\AIG\4_2025-06-30' --> 'data\processed_data\AIG\4_2025-06-30.md'


2025-11-14 15:31:50,858 - INFO - Processing document 4_2025-07-03
2025-11-14 15:31:50,882 - INFO - Finished converting document 4_2025-07-03 in 0.05 sec.
2025-11-14 15:31:50,929 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:50,937 - INFO - Going to convert document batch...
2025-11-14 15:31:50,937 - INFO - Processing document 4_2025-08-07
2025-11-14 15:31:50,956 - INFO - Finished converting document 4_2025-08-07 in 0.05 sec.
2025-11-14 15:31:50,998 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:51,005 - INFO - Going to convert document batch...
2025-11-14 15:31:51,005 - INFO - Processing document 4_2025-08-08
2025-11-14 15:31:51,021 - INFO - Finished converting document 4_2025-08-08 in 0.05 sec.
2025-11-14 15:31:51,051 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:51,059 - INFO - Going to convert document batch...
2025-11-14 15:31:51,060 - INFO - Processing document 4_2025-08-19
2025-11-14 15:31:51,079 - IN

Converted 'data\edgar_documents\AIG\4_2025-07-03' --> 'data\processed_data\AIG\4_2025-07-03.md'
Converted 'data\edgar_documents\AIG\4_2025-08-07' --> 'data\processed_data\AIG\4_2025-08-07.md'
Converted 'data\edgar_documents\AIG\4_2025-08-08' --> 'data\processed_data\AIG\4_2025-08-08.md'


2025-11-14 15:31:51,122 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:51,130 - INFO - Going to convert document batch...
2025-11-14 15:31:51,131 - INFO - Processing document 4_2025-09-08
2025-11-14 15:31:51,148 - INFO - Finished converting document 4_2025-09-08 in 0.05 sec.
2025-11-14 15:31:51,209 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:51,224 - INFO - Going to convert document batch...
2025-11-14 15:31:51,224 - INFO - Processing document 4_2025-10-01
2025-11-14 15:31:51,248 - INFO - Finished converting document 4_2025-10-01 in 0.08 sec.
2025-11-14 15:31:51,280 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\4_2025-08-19' --> 'data\processed_data\AIG\4_2025-08-19.md'
Converted 'data\edgar_documents\AIG\4_2025-09-08' --> 'data\processed_data\AIG\4_2025-09-08.md'
Converted 'data\edgar_documents\AIG\4_2025-10-01' --> 'data\processed_data\AIG\4_2025-10-01.md'


2025-11-14 15:31:51,493 - INFO - Going to convert document batch...
2025-11-14 15:31:51,493 - INFO - Processing document 4_2025-10-03
2025-11-14 15:31:51,512 - INFO - Finished converting document 4_2025-10-03 in 0.25 sec.
2025-11-14 15:31:51,547 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:51,556 - INFO - Going to convert document batch...
2025-11-14 15:31:51,557 - INFO - Processing document 4_2025-10-17
2025-11-14 15:31:51,579 - INFO - Finished converting document 4_2025-10-17 in 0.05 sec.
2025-11-14 15:31:51,621 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:51,628 - INFO - Going to convert document batch...
2025-11-14 15:31:51,629 - INFO - Processing document 4_2025-10-22
2025-11-14 15:31:51,648 - INFO - Finished converting document 4_2025-10-22 in 0.05 sec.
2025-11-14 15:31:51,689 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:51,697 - INFO - Going to convert document batch...
2025-11-14 15:31:51,698 - 

Converted 'data\edgar_documents\AIG\4_2025-10-03' --> 'data\processed_data\AIG\4_2025-10-03.md'
Converted 'data\edgar_documents\AIG\4_2025-10-17' --> 'data\processed_data\AIG\4_2025-10-17.md'
Converted 'data\edgar_documents\AIG\4_2025-10-22' --> 'data\processed_data\AIG\4_2025-10-22.md'


2025-11-14 15:31:51,715 - INFO - Finished converting document 4_2025-11-05 in 0.05 sec.
2025-11-14 15:31:51,751 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:51,766 - INFO - Going to convert document batch...
2025-11-14 15:31:51,767 - INFO - Processing document 8-K_2023-01-10
2025-11-14 15:31:51,786 - INFO - Finished converting document 8-K_2023-01-10 in 0.05 sec.
2025-11-14 15:31:51,820 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:51,831 - INFO - Going to convert document batch...
2025-11-14 15:31:51,832 - INFO - Processing document 8-K_2023-01-23
2025-11-14 15:31:51,852 - INFO - Finished converting document 8-K_2023-01-23 in 0.05 sec.
2025-11-14 15:31:51,889 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:51,903 - INFO - Going to convert document batch...
2025-11-14 15:31:51,904 - INFO - Processing document 8-K_2023-01-30
2025-11-14 15:31:51,927 - INFO - Finished converting document 8-K_2023-01-30 in 0.06

Converted 'data\edgar_documents\AIG\4_2025-11-05' --> 'data\processed_data\AIG\4_2025-11-05.md'
Converted 'data\edgar_documents\AIG\8-K_2023-01-10' --> 'data\processed_data\AIG\8-K_2023-01-10.md'
Converted 'data\edgar_documents\AIG\8-K_2023-01-23' --> 'data\processed_data\AIG\8-K_2023-01-23.md'


2025-11-14 15:31:51,962 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:51,974 - INFO - Going to convert document batch...
2025-11-14 15:31:51,975 - INFO - Processing document 8-K_2023-02-15
2025-11-14 15:31:51,996 - INFO - Finished converting document 8-K_2023-02-15 in 0.06 sec.
2025-11-14 15:31:52,033 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:52,044 - INFO - Going to convert document batch...
2025-11-14 15:31:52,045 - INFO - Processing document 8-K_2023-02-27
2025-11-14 15:31:52,071 - INFO - Finished converting document 8-K_2023-02-27 in 0.05 sec.
2025-11-14 15:31:52,114 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:52,127 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AIG\8-K_2023-01-30' --> 'data\processed_data\AIG\8-K_2023-01-30.md'
Converted 'data\edgar_documents\AIG\8-K_2023-02-15' --> 'data\processed_data\AIG\8-K_2023-02-15.md'
Converted 'data\edgar_documents\AIG\8-K_2023-02-27' --> 'data\processed_data\AIG\8-K_2023-02-27.md'


2025-11-14 15:31:52,127 - INFO - Processing document 8-K_2023-03-13
2025-11-14 15:31:52,149 - INFO - Finished converting document 8-K_2023-03-13 in 0.06 sec.
2025-11-14 15:31:52,185 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:52,194 - INFO - Going to convert document batch...
2025-11-14 15:31:52,195 - INFO - Processing document 8-K_2023-03-23
2025-11-14 15:31:52,210 - INFO - Finished converting document 8-K_2023-03-23 in 0.05 sec.
2025-11-14 15:31:52,235 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:52,251 - INFO - Going to convert document batch...
2025-11-14 15:31:52,251 - INFO - Processing document 8-K_2023-03-27
2025-11-14 15:31:52,290 - INFO - Finished converting document 8-K_2023-03-27 in 0.06 sec.
2025-11-14 15:31:52,337 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\8-K_2023-03-13' --> 'data\processed_data\AIG\8-K_2023-03-13.md'
Converted 'data\edgar_documents\AIG\8-K_2023-03-23' --> 'data\processed_data\AIG\8-K_2023-03-23.md'
Converted 'data\edgar_documents\AIG\8-K_2023-03-27' --> 'data\processed_data\AIG\8-K_2023-03-27.md'


2025-11-14 15:31:52,351 - INFO - Going to convert document batch...
2025-11-14 15:31:52,353 - INFO - Processing document 8-K_2023-05-04
2025-11-14 15:31:52,377 - INFO - Finished converting document 8-K_2023-05-04 in 0.06 sec.
2025-11-14 15:31:52,417 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:52,433 - INFO - Going to convert document batch...
2025-11-14 15:31:52,434 - INFO - Processing document 8-K_2023-05-15
2025-11-14 15:31:52,461 - INFO - Finished converting document 8-K_2023-05-15 in 0.06 sec.
2025-11-14 15:31:52,501 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:52,513 - INFO - Going to convert document batch...
2025-11-14 15:31:52,514 - INFO - Processing document 8-K_2023-05-22
2025-11-14 15:31:52,539 - INFO - Finished converting document 8-K_2023-05-22 in 0.06 sec.
2025-11-14 15:31:52,579 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\8-K_2023-05-04' --> 'data\processed_data\AIG\8-K_2023-05-04.md'
Converted 'data\edgar_documents\AIG\8-K_2023-05-15' --> 'data\processed_data\AIG\8-K_2023-05-15.md'
Converted 'data\edgar_documents\AIG\8-K_2023-05-22' --> 'data\processed_data\AIG\8-K_2023-05-22.md'


2025-11-14 15:31:52,598 - INFO - Going to convert document batch...
2025-11-14 15:31:52,598 - INFO - Processing document 8-K_2023-06-23
2025-11-14 15:31:52,623 - INFO - Finished converting document 8-K_2023-06-23 in 0.08 sec.
2025-11-14 15:31:52,669 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:52,685 - INFO - Going to convert document batch...
2025-11-14 15:31:52,687 - INFO - Processing document 8-K_2023-08-01
2025-11-14 15:31:52,707 - INFO - Finished converting document 8-K_2023-08-01 in 0.06 sec.
2025-11-14 15:31:52,738 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:52,759 - INFO - Going to convert document batch...
2025-11-14 15:31:52,760 - INFO - Processing document 8-K_2023-08-17
2025-11-14 15:31:52,782 - INFO - Finished converting document 8-K_2023-08-17 in 0.06 sec.
2025-11-14 15:31:52,823 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\8-K_2023-06-23' --> 'data\processed_data\AIG\8-K_2023-06-23.md'
Converted 'data\edgar_documents\AIG\8-K_2023-08-01' --> 'data\processed_data\AIG\8-K_2023-08-01.md'
Converted 'data\edgar_documents\AIG\8-K_2023-08-17' --> 'data\processed_data\AIG\8-K_2023-08-17.md'


2025-11-14 15:31:52,840 - INFO - Going to convert document batch...
2025-11-14 15:31:52,841 - INFO - Processing document 8-K_2023-09-08
2025-11-14 15:31:52,868 - INFO - Finished converting document 8-K_2023-09-08 in 0.06 sec.
2025-11-14 15:31:52,896 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:52,909 - INFO - Going to convert document batch...
2025-11-14 15:31:52,910 - INFO - Processing document 8-K_2023-11-01
2025-11-14 15:31:52,932 - INFO - Finished converting document 8-K_2023-11-01 in 0.03 sec.
2025-11-14 15:31:52,974 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:52,999 - INFO - Going to convert document batch...
2025-11-14 15:31:52,999 - INFO - Processing document 8-K_2023-11-06
2025-11-14 15:31:53,020 - INFO - Finished converting document 8-K_2023-11-06 in 0.08 sec.
2025-11-14 15:31:53,057 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:53,081 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AIG\8-K_2023-09-08' --> 'data\processed_data\AIG\8-K_2023-09-08.md'
Converted 'data\edgar_documents\AIG\8-K_2023-11-01' --> 'data\processed_data\AIG\8-K_2023-11-01.md'
Converted 'data\edgar_documents\AIG\8-K_2023-11-06' --> 'data\processed_data\AIG\8-K_2023-11-06.md'


2025-11-14 15:31:53,082 - INFO - Processing document 8-K_2023-11-21
2025-11-14 15:31:53,109 - INFO - Finished converting document 8-K_2023-11-21 in 0.08 sec.
2025-11-14 15:31:53,135 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:53,150 - INFO - Going to convert document batch...
2025-11-14 15:31:53,151 - INFO - Processing document 8-K_2023-12-04
2025-11-14 15:31:53,173 - INFO - Finished converting document 8-K_2023-12-04 in 0.05 sec.
2025-11-14 15:31:53,204 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:53,214 - INFO - Going to convert document batch...
2025-11-14 15:31:53,215 - INFO - Processing document 8-K_2024-01-31
2025-11-14 15:31:53,244 - INFO - Finished converting document 8-K_2024-01-31 in 0.05 sec.
2025-11-14 15:31:53,285 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:53,294 - INFO - Going to convert document batch...
2025-11-14 15:31:53,294 - INFO - Processing document 8-K_2024-02-01


Converted 'data\edgar_documents\AIG\8-K_2023-11-21' --> 'data\processed_data\AIG\8-K_2023-11-21.md'
Converted 'data\edgar_documents\AIG\8-K_2023-12-04' --> 'data\processed_data\AIG\8-K_2023-12-04.md'
Converted 'data\edgar_documents\AIG\8-K_2024-01-31' --> 'data\processed_data\AIG\8-K_2024-01-31.md'


2025-11-14 15:31:53,309 - INFO - Finished converting document 8-K_2024-02-01 in 0.06 sec.
2025-11-14 15:31:53,338 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:53,352 - INFO - Going to convert document batch...
2025-11-14 15:31:53,353 - INFO - Processing document 8-K_2024-02-07
2025-11-14 15:31:53,376 - INFO - Finished converting document 8-K_2024-02-07 in 0.06 sec.
2025-11-14 15:31:53,409 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:53,422 - INFO - Going to convert document batch...
2025-11-14 15:31:53,423 - INFO - Processing document 8-K_2024-02-13
2025-11-14 15:31:53,445 - INFO - Finished converting document 8-K_2024-02-13 in 0.05 sec.
2025-11-14 15:31:53,487 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:53,496 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AIG\8-K_2024-02-01' --> 'data\processed_data\AIG\8-K_2024-02-01.md'
Converted 'data\edgar_documents\AIG\8-K_2024-02-07' --> 'data\processed_data\AIG\8-K_2024-02-07.md'
Converted 'data\edgar_documents\AIG\8-K_2024-02-13' --> 'data\processed_data\AIG\8-K_2024-02-13.md'


2025-11-14 15:31:53,496 - INFO - Processing document 8-K_2024-04-22
2025-11-14 15:31:53,512 - INFO - Finished converting document 8-K_2024-04-22 in 0.06 sec.
2025-11-14 15:31:53,531 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:53,542 - INFO - Going to convert document batch...
2025-11-14 15:31:53,543 - INFO - Processing document 8-K_2024-05-01
2025-11-14 15:31:53,565 - INFO - Finished converting document 8-K_2024-05-01 in 0.05 sec.
2025-11-14 15:31:53,598 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:53,611 - INFO - Going to convert document batch...
2025-11-14 15:31:53,612 - INFO - Processing document 8-K_2024-05-16
2025-11-14 15:31:53,636 - INFO - Finished converting document 8-K_2024-05-16 in 0.06 sec.
2025-11-14 15:31:53,675 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:53,694 - INFO - Going to convert document batch...
2025-11-14 15:31:53,695 - INFO - Processing document 8-K_2024-05-17


Converted 'data\edgar_documents\AIG\8-K_2024-04-22' --> 'data\processed_data\AIG\8-K_2024-04-22.md'
Converted 'data\edgar_documents\AIG\8-K_2024-05-01' --> 'data\processed_data\AIG\8-K_2024-05-01.md'
Converted 'data\edgar_documents\AIG\8-K_2024-05-16' --> 'data\processed_data\AIG\8-K_2024-05-16.md'


2025-11-14 15:31:53,736 - INFO - Finished converting document 8-K_2024-05-17 in 0.08 sec.
2025-11-14 15:31:53,792 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:53,815 - INFO - Going to convert document batch...
2025-11-14 15:31:53,816 - INFO - Processing document 8-K_2024-06-10
2025-11-14 15:31:53,839 - INFO - Finished converting document 8-K_2024-06-10 in 0.08 sec.
2025-11-14 15:31:53,880 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:53,894 - INFO - Going to convert document batch...
2025-11-14 15:31:53,894 - INFO - Processing document 8-K_2024-06-13
2025-11-14 15:31:53,919 - INFO - Finished converting document 8-K_2024-06-13 in 0.08 sec.
2025-11-14 15:31:53,942 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:53,954 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AIG\8-K_2024-05-17' --> 'data\processed_data\AIG\8-K_2024-05-17.md'
Converted 'data\edgar_documents\AIG\8-K_2024-06-10' --> 'data\processed_data\AIG\8-K_2024-06-10.md'
Converted 'data\edgar_documents\AIG\8-K_2024-06-13' --> 'data\processed_data\AIG\8-K_2024-06-13.md'


2025-11-14 15:31:53,955 - INFO - Processing document 8-K_2024-06-25
2025-11-14 15:31:53,975 - INFO - Finished converting document 8-K_2024-06-25 in 0.05 sec.
2025-11-14 15:31:54,020 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:54,031 - INFO - Going to convert document batch...
2025-11-14 15:31:54,031 - INFO - Processing document 8-K_2024-07-31
2025-11-14 15:31:54,053 - INFO - Finished converting document 8-K_2024-07-31 in 0.06 sec.
2025-11-14 15:31:54,093 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:54,104 - INFO - Going to convert document batch...
2025-11-14 15:31:54,105 - INFO - Processing document 8-K_2024-09-03
2025-11-14 15:31:54,125 - INFO - Finished converting document 8-K_2024-09-03 in 0.06 sec.
2025-11-14 15:31:54,171 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\8-K_2024-06-25' --> 'data\processed_data\AIG\8-K_2024-06-25.md'
Converted 'data\edgar_documents\AIG\8-K_2024-07-31' --> 'data\processed_data\AIG\8-K_2024-07-31.md'
Converted 'data\edgar_documents\AIG\8-K_2024-09-03' --> 'data\processed_data\AIG\8-K_2024-09-03.md'


2025-11-14 15:31:54,182 - INFO - Going to convert document batch...
2025-11-14 15:31:54,183 - INFO - Processing document 8-K_2024-09-18
2025-11-14 15:31:54,205 - INFO - Finished converting document 8-K_2024-09-18 in 0.06 sec.
2025-11-14 15:31:54,244 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:54,256 - INFO - Going to convert document batch...
2025-11-14 15:31:54,257 - INFO - Processing document 8-K_2024-09-27
2025-11-14 15:31:54,275 - INFO - Finished converting document 8-K_2024-09-27 in 0.05 sec.
2025-11-14 15:31:54,310 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:54,324 - INFO - Going to convert document batch...
2025-11-14 15:31:54,325 - INFO - Processing document 8-K_2024-10-11
2025-11-14 15:31:54,339 - INFO - Finished converting document 8-K_2024-10-11 in 0.06 sec.
2025-11-14 15:31:54,382 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:54,401 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AIG\8-K_2024-09-18' --> 'data\processed_data\AIG\8-K_2024-09-18.md'
Converted 'data\edgar_documents\AIG\8-K_2024-09-27' --> 'data\processed_data\AIG\8-K_2024-09-27.md'
Converted 'data\edgar_documents\AIG\8-K_2024-10-11' --> 'data\processed_data\AIG\8-K_2024-10-11.md'


2025-11-14 15:31:54,401 - INFO - Processing document 8-K_2024-10-21
2025-11-14 15:31:54,423 - INFO - Finished converting document 8-K_2024-10-21 in 0.08 sec.
2025-11-14 15:31:54,458 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:54,471 - INFO - Going to convert document batch...
2025-11-14 15:31:54,472 - INFO - Processing document 8-K_2024-11-04
2025-11-14 15:31:54,491 - INFO - Finished converting document 8-K_2024-11-04 in 0.05 sec.
2025-11-14 15:31:54,517 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:54,529 - INFO - Going to convert document batch...
2025-11-14 15:31:54,529 - INFO - Processing document 8-K_2024-11-08
2025-11-14 15:31:54,549 - INFO - Finished converting document 8-K_2024-11-08 in 0.05 sec.
2025-11-14 15:31:54,581 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:54,600 - INFO - Going to convert document batch...
2025-11-14 15:31:54,602 - INFO - Processing document 8-K_2024-11-27


Converted 'data\edgar_documents\AIG\8-K_2024-10-21' --> 'data\processed_data\AIG\8-K_2024-10-21.md'
Converted 'data\edgar_documents\AIG\8-K_2024-11-04' --> 'data\processed_data\AIG\8-K_2024-11-04.md'
Converted 'data\edgar_documents\AIG\8-K_2024-11-08' --> 'data\processed_data\AIG\8-K_2024-11-08.md'


2025-11-14 15:31:54,668 - INFO - Finished converting document 8-K_2024-11-27 in 0.11 sec.
2025-11-14 15:31:54,712 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:54,721 - INFO - Going to convert document batch...
2025-11-14 15:31:54,722 - INFO - Processing document 8-K_2024-12-06
2025-11-14 15:31:54,741 - INFO - Finished converting document 8-K_2024-12-06 in 0.05 sec.
2025-11-14 15:31:54,781 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:54,794 - INFO - Going to convert document batch...
2025-11-14 15:31:54,795 - INFO - Processing document 8-K_2024-12-13
2025-11-14 15:31:54,815 - INFO - Finished converting document 8-K_2024-12-13 in 0.06 sec.
2025-11-14 15:31:54,851 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:54,861 - INFO - Going to convert document batch...
2025-11-14 15:31:54,861 - INFO - Processing document 8-K_2025-02-11
2025-11-14 15:31:54,882 - INFO - Finished converting document 8-K_2025-02-11 in 0.

Converted 'data\edgar_documents\AIG\8-K_2024-11-27' --> 'data\processed_data\AIG\8-K_2024-11-27.md'
Converted 'data\edgar_documents\AIG\8-K_2024-12-06' --> 'data\processed_data\AIG\8-K_2024-12-06.md'
Converted 'data\edgar_documents\AIG\8-K_2024-12-13' --> 'data\processed_data\AIG\8-K_2024-12-13.md'


2025-11-14 15:31:54,915 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:54,927 - INFO - Going to convert document batch...
2025-11-14 15:31:54,927 - INFO - Processing document 8-K_2025-02-20
2025-11-14 15:31:54,948 - INFO - Finished converting document 8-K_2025-02-20 in 0.05 sec.
2025-11-14 15:31:54,976 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:54,986 - INFO - Going to convert document batch...
2025-11-14 15:31:54,987 - INFO - Processing document 8-K_2025-03-31
2025-11-14 15:31:55,007 - INFO - Finished converting document 8-K_2025-03-31 in 0.05 sec.
2025-11-14 15:31:55,066 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:55,081 - INFO - Going to convert document batch...
2025-11-14 15:31:55,081 - INFO - Processing document 8-K_2025-05-01
2025-11-14 15:31:55,099 - INFO - Finished converting document 8-K_2025-05-01 in 0.08 sec.


Converted 'data\edgar_documents\AIG\8-K_2025-02-11' --> 'data\processed_data\AIG\8-K_2025-02-11.md'
Converted 'data\edgar_documents\AIG\8-K_2025-02-20' --> 'data\processed_data\AIG\8-K_2025-02-20.md'
Converted 'data\edgar_documents\AIG\8-K_2025-03-31' --> 'data\processed_data\AIG\8-K_2025-03-31.md'


2025-11-14 15:31:55,141 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:55,180 - INFO - Going to convert document batch...
2025-11-14 15:31:55,181 - INFO - Processing document 8-K_2025-05-07
2025-11-14 15:31:55,213 - INFO - Finished converting document 8-K_2025-05-07 in 0.11 sec.
2025-11-14 15:31:55,257 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:55,268 - INFO - Going to convert document batch...
2025-11-14 15:31:55,269 - INFO - Processing document 8-K_2025-05-15


Converted 'data\edgar_documents\AIG\8-K_2025-05-01' --> 'data\processed_data\AIG\8-K_2025-05-01.md'
Converted 'data\edgar_documents\AIG\8-K_2025-05-07' --> 'data\processed_data\AIG\8-K_2025-05-07.md'


2025-11-14 15:31:55,522 - INFO - Finished converting document 8-K_2025-05-15 in 0.28 sec.
2025-11-14 15:31:55,554 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:55,568 - INFO - Going to convert document batch...
2025-11-14 15:31:55,569 - INFO - Processing document 8-K_2025-05-16
2025-11-14 15:31:55,597 - INFO - Finished converting document 8-K_2025-05-16 in 0.06 sec.
2025-11-14 15:31:55,630 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:55,640 - INFO - Going to convert document batch...
2025-11-14 15:31:55,641 - INFO - Processing document 8-K_2025-06-02
2025-11-14 15:31:55,660 - INFO - Finished converting document 8-K_2025-06-02 in 0.05 sec.
2025-11-14 15:31:55,692 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:55,703 - INFO - Going to convert document batch...
2025-11-14 15:31:55,703 - INFO - Processing document 8-K_2025-06-09
2025-11-14 15:31:55,725 - INFO - Finished converting document 8-K_2025-06-09 in 0.

Converted 'data\edgar_documents\AIG\8-K_2025-05-15' --> 'data\processed_data\AIG\8-K_2025-05-15.md'
Converted 'data\edgar_documents\AIG\8-K_2025-05-16' --> 'data\processed_data\AIG\8-K_2025-05-16.md'
Converted 'data\edgar_documents\AIG\8-K_2025-06-02' --> 'data\processed_data\AIG\8-K_2025-06-02.md'


2025-11-14 15:31:55,766 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:55,777 - INFO - Going to convert document batch...
2025-11-14 15:31:55,778 - INFO - Processing document 8-K_2025-07-21
2025-11-14 15:31:55,798 - INFO - Finished converting document 8-K_2025-07-21 in 0.06 sec.
2025-11-14 15:31:55,820 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:55,828 - INFO - Going to convert document batch...
2025-11-14 15:31:55,829 - INFO - Processing document 8-K_2025-08-06
2025-11-14 15:31:55,846 - INFO - Finished converting document 8-K_2025-08-06 in 0.03 sec.
2025-11-14 15:31:55,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:55,899 - INFO - Going to convert document batch...
2025-11-14 15:31:55,901 - INFO - Processing document 8-K_2025-08-18
2025-11-14 15:31:55,925 - INFO - Finished converting document 8-K_2025-08-18 in 0.06 sec.


Converted 'data\edgar_documents\AIG\8-K_2025-06-09' --> 'data\processed_data\AIG\8-K_2025-06-09.md'
Converted 'data\edgar_documents\AIG\8-K_2025-07-21' --> 'data\processed_data\AIG\8-K_2025-07-21.md'
Converted 'data\edgar_documents\AIG\8-K_2025-08-06' --> 'data\processed_data\AIG\8-K_2025-08-06.md'


2025-11-14 15:31:55,949 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:55,957 - INFO - Going to convert document batch...
2025-11-14 15:31:55,957 - INFO - Processing document 8-K_2025-10-03
2025-11-14 15:31:55,971 - INFO - Finished converting document 8-K_2025-10-03 in 0.03 sec.
2025-11-14 15:31:55,990 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:31:55,999 - INFO - Going to convert document batch...
2025-11-14 15:31:56,000 - INFO - Processing document 8-K_2025-11-04
2025-11-14 15:31:56,017 - INFO - Finished converting document 8-K_2025-11-04 in 0.05 sec.
2025-11-14 15:31:56,062 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\8-K_2025-08-18' --> 'data\processed_data\AIG\8-K_2025-08-18.md'
Converted 'data\edgar_documents\AIG\8-K_2025-10-03' --> 'data\processed_data\AIG\8-K_2025-10-03.md'
Converted 'data\edgar_documents\AIG\8-K_2025-11-04' --> 'data\processed_data\AIG\8-K_2025-11-04.md'


2025-11-14 15:31:56,474 - INFO - Going to convert document batch...
2025-11-14 15:31:56,475 - INFO - Processing document DEF-14A_2023-03-29
2025-11-14 15:31:58,133 - INFO - Finished converting document DEF-14A_2023-03-29 in 2.09 sec.
2025-11-14 15:31:59,007 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\DEF-14A_2023-03-29' --> 'data\processed_data\AIG\DEF-14A_2023-03-29.md'


2025-11-14 15:31:59,533 - INFO - Going to convert document batch...
2025-11-14 15:31:59,535 - INFO - Processing document DEF-14A_2024-04-02
2025-11-14 15:32:01,596 - INFO - Finished converting document DEF-14A_2024-04-02 in 2.64 sec.
2025-11-14 15:32:02,396 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\DEF-14A_2024-04-02' --> 'data\processed_data\AIG\DEF-14A_2024-04-02.md'


2025-11-14 15:32:03,108 - INFO - Going to convert document batch...
2025-11-14 15:32:03,109 - INFO - Processing document DEF-14A_2025-04-02
2025-11-14 15:32:04,846 - INFO - Finished converting document DEF-14A_2025-04-02 in 2.50 sec.
2025-11-14 15:32:05,581 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AIG\DEF-14A_2025-04-02' --> 'data\processed_data\AIG\DEF-14A_2025-04-02.md'
Processed 158 new files. Errors: 6
Found 147 files to process in data\edgar_documents\AMD


2025-11-14 15:32:06,318 - INFO - Going to convert document batch...
2025-11-14 15:32:06,319 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:32:06,319 - INFO - Processing document 10-K_2023-02-27
2025-11-14 15:32:07,495 - INFO - Finished converting document 10-K_2023-02-27 in 1.98 sec.
2025-11-14 15:32:08,074 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\10-K_2023-02-27' --> 'data\processed_data\AMD\10-K_2023-02-27.md'


2025-11-14 15:32:08,494 - INFO - Going to convert document batch...
2025-11-14 15:32:08,494 - INFO - Processing document 10-K_2024-01-31
2025-11-14 15:32:09,664 - INFO - Finished converting document 10-K_2024-01-31 in 1.66 sec.
2025-11-14 15:32:10,154 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\10-K_2024-01-31' --> 'data\processed_data\AMD\10-K_2024-01-31.md'


2025-11-14 15:32:10,560 - INFO - Going to convert document batch...
2025-11-14 15:32:10,561 - INFO - Processing document 10-K_2025-02-05
2025-11-14 15:32:11,470 - INFO - Finished converting document 10-K_2025-02-05 in 1.36 sec.
2025-11-14 15:32:12,029 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\10-K_2025-02-05' --> 'data\processed_data\AMD\10-K_2025-02-05.md'


2025-11-14 15:32:12,602 - INFO - Going to convert document batch...
2025-11-14 15:32:12,603 - INFO - Processing document 10-Q_2023-05-03
2025-11-14 15:32:13,184 - INFO - Finished converting document 10-Q_2023-05-03 in 1.19 sec.
2025-11-14 15:32:13,497 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\10-Q_2023-05-03' --> 'data\processed_data\AMD\10-Q_2023-05-03.md'


2025-11-14 15:32:13,784 - INFO - Going to convert document batch...
2025-11-14 15:32:13,785 - INFO - Processing document 10-Q_2023-08-02
2025-11-14 15:32:14,295 - INFO - Finished converting document 10-Q_2023-08-02 in 0.84 sec.
2025-11-14 15:32:14,572 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\10-Q_2023-08-02' --> 'data\processed_data\AMD\10-Q_2023-08-02.md'


2025-11-14 15:32:14,839 - INFO - Going to convert document batch...
2025-11-14 15:32:14,840 - INFO - Processing document 10-Q_2023-11-01
2025-11-14 15:32:15,481 - INFO - Finished converting document 10-Q_2023-11-01 in 0.95 sec.
2025-11-14 15:32:15,760 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\10-Q_2023-11-01' --> 'data\processed_data\AMD\10-Q_2023-11-01.md'


2025-11-14 15:32:16,291 - INFO - Going to convert document batch...
2025-11-14 15:32:16,292 - INFO - Processing document 10-Q_2024-05-01
2025-11-14 15:32:16,751 - INFO - Finished converting document 10-Q_2024-05-01 in 1.02 sec.
2025-11-14 15:32:16,998 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\10-Q_2024-05-01' --> 'data\processed_data\AMD\10-Q_2024-05-01.md'


2025-11-14 15:32:17,253 - INFO - Going to convert document batch...
2025-11-14 15:32:17,254 - INFO - Processing document 10-Q_2024-07-31
2025-11-14 15:32:17,783 - INFO - Finished converting document 10-Q_2024-07-31 in 0.81 sec.
2025-11-14 15:32:18,088 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\10-Q_2024-07-31' --> 'data\processed_data\AMD\10-Q_2024-07-31.md'


2025-11-14 15:32:18,425 - INFO - Going to convert document batch...
2025-11-14 15:32:18,426 - INFO - Processing document 10-Q_2024-10-30
2025-11-14 15:32:19,188 - INFO - Finished converting document 10-Q_2024-10-30 in 1.14 sec.
2025-11-14 15:32:19,463 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\10-Q_2024-10-30' --> 'data\processed_data\AMD\10-Q_2024-10-30.md'


2025-11-14 15:32:19,692 - INFO - Going to convert document batch...
2025-11-14 15:32:19,694 - INFO - Processing document 10-Q_2025-05-07
2025-11-14 15:32:20,135 - INFO - Finished converting document 10-Q_2025-05-07 in 0.69 sec.
2025-11-14 15:32:20,402 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\10-Q_2025-05-07' --> 'data\processed_data\AMD\10-Q_2025-05-07.md'


2025-11-14 15:32:20,689 - INFO - Going to convert document batch...
2025-11-14 15:32:20,689 - INFO - Processing document 10-Q_2025-08-06
2025-11-14 15:32:21,233 - INFO - Finished converting document 10-Q_2025-08-06 in 0.86 sec.
2025-11-14 15:32:21,554 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\10-Q_2025-08-06' --> 'data\processed_data\AMD\10-Q_2025-08-06.md'


2025-11-14 15:32:22,154 - INFO - Going to convert document batch...
2025-11-14 15:32:22,155 - INFO - Processing document 10-Q_2025-11-05
2025-11-14 15:32:22,702 - INFO - Finished converting document 10-Q_2025-11-05 in 1.19 sec.
2025-11-14 15:32:22,978 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:22,986 - INFO - Going to convert document batch...
2025-11-14 15:32:22,987 - INFO - Processing document 4_2023-01-18
2025-11-14 15:32:23,008 - INFO - Finished converting document 4_2023-01-18 in 0.05 sec.
2025-11-14 15:32:23,057 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:23,068 - INFO - Going to convert document batch...
2025-11-14 15:32:23,069 - INFO - Processing document 4_2023-02-08
2025-11-14 15:32:23,092 - INFO - Finished converting document 4_2023-02-08 in 0.06 sec.
2025-11-14 15:32:23,143 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\10-Q_2025-11-05' --> 'data\processed_data\AMD\10-Q_2025-11-05.md'
Converted 'data\edgar_documents\AMD\4_2023-01-18' --> 'data\processed_data\AMD\4_2023-01-18.md'
Converted 'data\edgar_documents\AMD\4_2023-02-08' --> 'data\processed_data\AMD\4_2023-02-08.md'


2025-11-14 15:32:23,152 - INFO - Going to convert document batch...
2025-11-14 15:32:23,153 - INFO - Processing document 4_2023-02-13
2025-11-14 15:32:23,171 - INFO - Finished converting document 4_2023-02-13 in 0.06 sec.
2025-11-14 15:32:23,214 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:23,228 - INFO - Going to convert document batch...
2025-11-14 15:32:23,229 - INFO - Processing document 4_2023-02-16
2025-11-14 15:32:23,252 - INFO - Finished converting document 4_2023-02-16 in 0.06 sec.
2025-11-14 15:32:23,290 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:23,301 - INFO - Going to convert document batch...
2025-11-14 15:32:23,302 - INFO - Processing document 4_2023-02-17
2025-11-14 15:32:23,322 - INFO - Finished converting document 4_2023-02-17 in 0.05 sec.
2025-11-14 15:32:23,372 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2023-02-13' --> 'data\processed_data\AMD\4_2023-02-13.md'
Converted 'data\edgar_documents\AMD\4_2023-02-16' --> 'data\processed_data\AMD\4_2023-02-16.md'
Converted 'data\edgar_documents\AMD\4_2023-02-17' --> 'data\processed_data\AMD\4_2023-02-17.md'


2025-11-14 15:32:23,382 - INFO - Going to convert document batch...
2025-11-14 15:32:23,383 - INFO - Processing document 4_2023-03-08
2025-11-14 15:32:23,419 - INFO - Finished converting document 4_2023-03-08 in 0.08 sec.
2025-11-14 15:32:23,506 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:23,541 - INFO - Going to convert document batch...
2025-11-14 15:32:23,542 - INFO - Processing document 4_2023-03-09
2025-11-14 15:32:23,635 - INFO - Finished converting document 4_2023-03-09 in 0.16 sec.


Converted 'data\edgar_documents\AMD\4_2023-03-08' --> 'data\processed_data\AMD\4_2023-03-08.md'


2025-11-14 15:32:23,757 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:23,781 - INFO - Going to convert document batch...
2025-11-14 15:32:23,782 - INFO - Processing document 4_2023-03-17
2025-11-14 15:32:23,858 - INFO - Finished converting document 4_2023-03-17 in 0.14 sec.


Converted 'data\edgar_documents\AMD\4_2023-03-09' --> 'data\processed_data\AMD\4_2023-03-09.md'


2025-11-14 15:32:23,935 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:23,958 - INFO - Going to convert document batch...
2025-11-14 15:32:23,959 - INFO - Processing document 4_2023-03-20
2025-11-14 15:32:24,024 - INFO - Finished converting document 4_2023-03-20 in 0.11 sec.


Converted 'data\edgar_documents\AMD\4_2023-03-17' --> 'data\processed_data\AMD\4_2023-03-17.md'
Converted 'data\edgar_documents\AMD\4_2023-03-20' --> 'data\processed_data\AMD\4_2023-03-20.md'


2025-11-14 15:32:24,118 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:24,146 - INFO - Going to convert document batch...
2025-11-14 15:32:24,147 - INFO - Processing document 4_2023-04-10
2025-11-14 15:32:24,201 - INFO - Finished converting document 4_2023-04-10 in 0.11 sec.
2025-11-14 15:32:24,271 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:24,293 - INFO - Going to convert document batch...
2025-11-14 15:32:24,294 - INFO - Processing document 4_2023-04-14
2025-11-14 15:32:24,339 - INFO - Finished converting document 4_2023-04-14 in 0.08 sec.
2025-11-14 15:32:24,418 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:24,439 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMD\4_2023-04-10' --> 'data\processed_data\AMD\4_2023-04-10.md'
Converted 'data\edgar_documents\AMD\4_2023-04-14' --> 'data\processed_data\AMD\4_2023-04-14.md'


2025-11-14 15:32:24,440 - INFO - Processing document 4_2023-04-18
2025-11-14 15:32:24,489 - INFO - Finished converting document 4_2023-04-18 in 0.09 sec.
2025-11-14 15:32:24,553 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:24,574 - INFO - Going to convert document batch...
2025-11-14 15:32:24,576 - INFO - Processing document 4_2023-05-09
2025-11-14 15:32:24,644 - INFO - Finished converting document 4_2023-05-09 in 0.11 sec.
2025-11-14 15:32:24,728 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2023-04-18' --> 'data\processed_data\AMD\4_2023-04-18.md'
Converted 'data\edgar_documents\AMD\4_2023-05-09' --> 'data\processed_data\AMD\4_2023-05-09.md'


2025-11-14 15:32:24,745 - INFO - Going to convert document batch...
2025-11-14 15:32:24,747 - INFO - Processing document 4_2023-05-17
2025-11-14 15:32:24,792 - INFO - Finished converting document 4_2023-05-17 in 0.09 sec.
2025-11-14 15:32:24,865 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:24,882 - INFO - Going to convert document batch...
2025-11-14 15:32:24,883 - INFO - Processing document 4_2023-05-22
2025-11-14 15:32:24,927 - INFO - Finished converting document 4_2023-05-22 in 0.08 sec.
2025-11-14 15:32:24,988 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:25,012 - INFO - Going to convert document batch...
2025-11-14 15:32:25,013 - INFO - Processing document 4_2023-05-25


Converted 'data\edgar_documents\AMD\4_2023-05-17' --> 'data\processed_data\AMD\4_2023-05-17.md'
Converted 'data\edgar_documents\AMD\4_2023-05-22' --> 'data\processed_data\AMD\4_2023-05-22.md'


2025-11-14 15:32:25,068 - INFO - Finished converting document 4_2023-05-25 in 0.09 sec.
2025-11-14 15:32:25,145 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:25,161 - INFO - Going to convert document batch...
2025-11-14 15:32:25,162 - INFO - Processing document 4_2023-05-30
2025-11-14 15:32:25,198 - INFO - Finished converting document 4_2023-05-30 in 0.08 sec.
2025-11-14 15:32:25,266 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:25,286 - INFO - Going to convert document batch...
2025-11-14 15:32:25,288 - INFO - Processing document 4_2023-06-07


Converted 'data\edgar_documents\AMD\4_2023-05-25' --> 'data\processed_data\AMD\4_2023-05-25.md'
Converted 'data\edgar_documents\AMD\4_2023-05-30' --> 'data\processed_data\AMD\4_2023-05-30.md'


2025-11-14 15:32:25,350 - INFO - Finished converting document 4_2023-06-07 in 0.09 sec.
2025-11-14 15:32:25,448 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:25,497 - INFO - Going to convert document batch...
2025-11-14 15:32:25,498 - INFO - Processing document 4_2023-06-08
2025-11-14 15:32:25,610 - INFO - Finished converting document 4_2023-06-08 in 0.19 sec.


Converted 'data\edgar_documents\AMD\4_2023-06-07' --> 'data\processed_data\AMD\4_2023-06-07.md'


2025-11-14 15:32:25,709 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:25,732 - INFO - Going to convert document batch...
2025-11-14 15:32:25,733 - INFO - Processing document 4_2023-06-12
2025-11-14 15:32:25,777 - INFO - Finished converting document 4_2023-06-12 in 0.09 sec.
2025-11-14 15:32:25,863 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2023-06-08' --> 'data\processed_data\AMD\4_2023-06-08.md'
Converted 'data\edgar_documents\AMD\4_2023-06-12' --> 'data\processed_data\AMD\4_2023-06-12.md'


2025-11-14 15:32:25,886 - INFO - Going to convert document batch...
2025-11-14 15:32:25,888 - INFO - Processing document 4_2023-06-13
2025-11-14 15:32:25,984 - INFO - Finished converting document 4_2023-06-13 in 0.16 sec.
2025-11-14 15:32:26,102 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:26,158 - INFO - Going to convert document batch...
2025-11-14 15:32:26,160 - INFO - Processing document 4_2023-07-10
2025-11-14 15:32:26,242 - INFO - Finished converting document 4_2023-07-10 in 0.16 sec.


Converted 'data\edgar_documents\AMD\4_2023-06-13' --> 'data\processed_data\AMD\4_2023-06-13.md'


2025-11-14 15:32:26,358 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:26,411 - INFO - Going to convert document batch...
2025-11-14 15:32:26,413 - INFO - Processing document 4_2023-07-14
2025-11-14 15:32:26,493 - INFO - Finished converting document 4_2023-07-14 in 0.14 sec.


Converted 'data\edgar_documents\AMD\4_2023-07-10' --> 'data\processed_data\AMD\4_2023-07-10.md'


2025-11-14 15:32:26,633 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:26,661 - INFO - Going to convert document batch...
2025-11-14 15:32:26,662 - INFO - Processing document 4_2023-08-10
2025-11-14 15:32:26,731 - INFO - Finished converting document 4_2023-08-10 in 0.14 sec.


Converted 'data\edgar_documents\AMD\4_2023-07-14' --> 'data\processed_data\AMD\4_2023-07-14.md'


2025-11-14 15:32:26,810 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:26,857 - INFO - Going to convert document batch...
2025-11-14 15:32:26,858 - INFO - Processing document 4_2023-08-11
2025-11-14 15:32:26,930 - INFO - Finished converting document 4_2023-08-11 in 0.12 sec.


Converted 'data\edgar_documents\AMD\4_2023-08-10' --> 'data\processed_data\AMD\4_2023-08-10.md'


2025-11-14 15:32:27,007 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:27,048 - INFO - Going to convert document batch...
2025-11-14 15:32:27,049 - INFO - Processing document 4_2023-08-17
2025-11-14 15:32:27,117 - INFO - Finished converting document 4_2023-08-17 in 0.11 sec.
2025-11-14 15:32:27,192 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2023-08-11' --> 'data\processed_data\AMD\4_2023-08-11.md'
Converted 'data\edgar_documents\AMD\4_2023-08-17' --> 'data\processed_data\AMD\4_2023-08-17.md'


2025-11-14 15:32:27,214 - INFO - Going to convert document batch...
2025-11-14 15:32:27,216 - INFO - Processing document 4_2023-08-18
2025-11-14 15:32:27,260 - INFO - Finished converting document 4_2023-08-18 in 0.09 sec.
2025-11-14 15:32:27,306 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:27,327 - INFO - Going to convert document batch...
2025-11-14 15:32:27,328 - INFO - Processing document 4_2023-08-29
2025-11-14 15:32:27,371 - INFO - Finished converting document 4_2023-08-29 in 0.08 sec.
2025-11-14 15:32:27,431 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:27,446 - INFO - Going to convert document batch...
2025-11-14 15:32:27,447 - INFO - Processing document 4_2023-08-30
2025-11-14 15:32:27,507 - INFO - Finished converting document 4_2023-08-30 in 0.09 sec.


Converted 'data\edgar_documents\AMD\4_2023-08-18' --> 'data\processed_data\AMD\4_2023-08-18.md'
Converted 'data\edgar_documents\AMD\4_2023-08-29' --> 'data\processed_data\AMD\4_2023-08-29.md'


2025-11-14 15:32:27,600 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:27,630 - INFO - Going to convert document batch...
2025-11-14 15:32:27,631 - INFO - Processing document 4_2023-09-01
2025-11-14 15:32:27,670 - INFO - Finished converting document 4_2023-09-01 in 0.11 sec.
2025-11-14 15:32:27,734 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2023-08-30' --> 'data\processed_data\AMD\4_2023-08-30.md'
Converted 'data\edgar_documents\AMD\4_2023-09-01' --> 'data\processed_data\AMD\4_2023-09-01.md'


2025-11-14 15:32:27,784 - INFO - Going to convert document batch...
2025-11-14 15:32:27,786 - INFO - Processing document 4_2023-09-14
2025-11-14 15:32:27,872 - INFO - Finished converting document 4_2023-09-14 in 0.17 sec.
2025-11-14 15:32:27,927 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:27,950 - INFO - Going to convert document batch...
2025-11-14 15:32:27,951 - INFO - Processing document 4_2023-11-07
2025-11-14 15:32:27,992 - INFO - Finished converting document 4_2023-11-07 in 0.08 sec.
2025-11-14 15:32:28,074 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:28,111 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMD\4_2023-09-14' --> 'data\processed_data\AMD\4_2023-09-14.md'
Converted 'data\edgar_documents\AMD\4_2023-11-07' --> 'data\processed_data\AMD\4_2023-11-07.md'


2025-11-14 15:32:28,112 - INFO - Processing document 4_2023-11-09
2025-11-14 15:32:28,183 - INFO - Finished converting document 4_2023-11-09 in 0.14 sec.
2025-11-14 15:32:28,249 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:28,275 - INFO - Going to convert document batch...
2025-11-14 15:32:28,276 - INFO - Processing document 4_2023-11-29
2025-11-14 15:32:28,349 - INFO - Finished converting document 4_2023-11-29 in 0.11 sec.


Converted 'data\edgar_documents\AMD\4_2023-11-09' --> 'data\processed_data\AMD\4_2023-11-09.md'


2025-11-14 15:32:28,431 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:28,479 - INFO - Going to convert document batch...
2025-11-14 15:32:28,482 - INFO - Processing document 4_2023-12-07
2025-11-14 15:32:28,546 - INFO - Finished converting document 4_2023-12-07 in 0.12 sec.


Converted 'data\edgar_documents\AMD\4_2023-11-29' --> 'data\processed_data\AMD\4_2023-11-29.md'
Converted 'data\edgar_documents\AMD\4_2023-12-07' --> 'data\processed_data\AMD\4_2023-12-07.md'


2025-11-14 15:32:28,652 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:28,669 - INFO - Going to convert document batch...
2025-11-14 15:32:28,670 - INFO - Processing document 4_2023-12-11
2025-11-14 15:32:28,708 - INFO - Finished converting document 4_2023-12-11 in 0.08 sec.
2025-11-14 15:32:28,773 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:28,792 - INFO - Going to convert document batch...
2025-11-14 15:32:28,793 - INFO - Processing document 4_2024-01-17


Converted 'data\edgar_documents\AMD\4_2023-12-11' --> 'data\processed_data\AMD\4_2023-12-11.md'


2025-11-14 15:32:29,552 - INFO - Finished converting document 4_2024-01-17 in 0.80 sec.
2025-11-14 15:32:29,642 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:29,664 - INFO - Going to convert document batch...
2025-11-14 15:32:29,667 - INFO - Processing document 4_2024-02-06
2025-11-14 15:32:29,710 - INFO - Finished converting document 4_2024-02-06 in 0.08 sec.
2025-11-14 15:32:29,774 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2024-01-17' --> 'data\processed_data\AMD\4_2024-01-17.md'
Converted 'data\edgar_documents\AMD\4_2024-02-06' --> 'data\processed_data\AMD\4_2024-02-06.md'


2025-11-14 15:32:29,809 - INFO - Going to convert document batch...
2025-11-14 15:32:29,810 - INFO - Processing document 4_2024-02-07
2025-11-14 15:32:29,876 - INFO - Finished converting document 4_2024-02-07 in 0.12 sec.
2025-11-14 15:32:29,985 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:30,020 - INFO - Going to convert document batch...
2025-11-14 15:32:30,021 - INFO - Processing document 4_2024-02-16
2025-11-14 15:32:30,110 - INFO - Finished converting document 4_2024-02-16 in 0.16 sec.


Converted 'data\edgar_documents\AMD\4_2024-02-07' --> 'data\processed_data\AMD\4_2024-02-07.md'
Converted 'data\edgar_documents\AMD\4_2024-02-16' --> 'data\processed_data\AMD\4_2024-02-16.md'


2025-11-14 15:32:30,170 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:30,195 - INFO - Going to convert document batch...
2025-11-14 15:32:30,197 - INFO - Processing document 4_2024-02-20
2025-11-14 15:32:30,232 - INFO - Finished converting document 4_2024-02-20 in 0.09 sec.
2025-11-14 15:32:30,289 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:30,310 - INFO - Going to convert document batch...
2025-11-14 15:32:30,312 - INFO - Processing document 4_2024-02-23
2025-11-14 15:32:30,386 - INFO - Finished converting document 4_2024-02-23 in 0.11 sec.


Converted 'data\edgar_documents\AMD\4_2024-02-20' --> 'data\processed_data\AMD\4_2024-02-20.md'


2025-11-14 15:32:30,536 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:30,562 - INFO - Going to convert document batch...
2025-11-14 15:32:30,563 - INFO - Processing document 4_2024-03-04
2025-11-14 15:32:30,615 - INFO - Finished converting document 4_2024-03-04 in 0.09 sec.
2025-11-14 15:32:30,699 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2024-02-23' --> 'data\processed_data\AMD\4_2024-02-23.md'
Converted 'data\edgar_documents\AMD\4_2024-03-04' --> 'data\processed_data\AMD\4_2024-03-04.md'


2025-11-14 15:32:30,724 - INFO - Going to convert document batch...
2025-11-14 15:32:30,727 - INFO - Processing document 4_2024-03-06
2025-11-14 15:32:30,789 - INFO - Finished converting document 4_2024-03-06 in 0.11 sec.
2025-11-14 15:32:30,858 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:30,892 - INFO - Going to convert document batch...
2025-11-14 15:32:30,893 - INFO - Processing document 4_2024-03-07
2025-11-14 15:32:30,972 - INFO - Finished converting document 4_2024-03-07 in 0.12 sec.


Converted 'data\edgar_documents\AMD\4_2024-03-06' --> 'data\processed_data\AMD\4_2024-03-06.md'


2025-11-14 15:32:31,073 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:31,118 - INFO - Going to convert document batch...
2025-11-14 15:32:31,120 - INFO - Processing document 4_2024-03-11
2025-11-14 15:32:31,191 - INFO - Finished converting document 4_2024-03-11 in 0.14 sec.


Converted 'data\edgar_documents\AMD\4_2024-03-07' --> 'data\processed_data\AMD\4_2024-03-07.md'


2025-11-14 15:32:31,251 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:31,281 - INFO - Going to convert document batch...
2025-11-14 15:32:31,282 - INFO - Processing document 4_2024-03-15
2025-11-14 15:32:31,352 - INFO - Finished converting document 4_2024-03-15 in 0.11 sec.


Converted 'data\edgar_documents\AMD\4_2024-03-11' --> 'data\processed_data\AMD\4_2024-03-11.md'


2025-11-14 15:32:31,444 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:31,466 - INFO - Going to convert document batch...
2025-11-14 15:32:31,468 - INFO - Processing document 4_2024-03-19
2025-11-14 15:32:31,532 - INFO - Finished converting document 4_2024-03-19 in 0.11 sec.
2025-11-14 15:32:31,608 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2024-03-15' --> 'data\processed_data\AMD\4_2024-03-15.md'
Converted 'data\edgar_documents\AMD\4_2024-03-19' --> 'data\processed_data\AMD\4_2024-03-19.md'


2025-11-14 15:32:31,635 - INFO - Going to convert document batch...
2025-11-14 15:32:31,636 - INFO - Processing document 4_2024-04-17
2025-11-14 15:32:31,713 - INFO - Finished converting document 4_2024-04-17 in 0.14 sec.
2025-11-14 15:32:31,799 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:31,820 - INFO - Going to convert document batch...
2025-11-14 15:32:31,821 - INFO - Processing document 4_2024-05-10
2025-11-14 15:32:31,877 - INFO - Finished converting document 4_2024-05-10 in 0.09 sec.
2025-11-14 15:32:31,939 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:31,965 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMD\4_2024-04-17' --> 'data\processed_data\AMD\4_2024-04-17.md'
Converted 'data\edgar_documents\AMD\4_2024-05-10' --> 'data\processed_data\AMD\4_2024-05-10.md'


2025-11-14 15:32:31,967 - INFO - Processing document 4_2024-05-17
2025-11-14 15:32:32,017 - INFO - Finished converting document 4_2024-05-17 in 0.09 sec.
2025-11-14 15:32:32,092 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:32,127 - INFO - Going to convert document batch...
2025-11-14 15:32:32,128 - INFO - Processing document 4_2024-05-21
2025-11-14 15:32:32,182 - INFO - Finished converting document 4_2024-05-21 in 0.12 sec.
2025-11-14 15:32:32,244 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2024-05-17' --> 'data\processed_data\AMD\4_2024-05-17.md'
Converted 'data\edgar_documents\AMD\4_2024-05-21' --> 'data\processed_data\AMD\4_2024-05-21.md'


2025-11-14 15:32:32,265 - INFO - Going to convert document batch...
2025-11-14 15:32:32,266 - INFO - Processing document 4_2024-06-06
2025-11-14 15:32:32,311 - INFO - Finished converting document 4_2024-06-06 in 0.09 sec.
2025-11-14 15:32:32,362 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:32,394 - INFO - Going to convert document batch...
2025-11-14 15:32:32,395 - INFO - Processing document 4_2024-06-07
2025-11-14 15:32:32,462 - INFO - Finished converting document 4_2024-06-07 in 0.11 sec.
2025-11-14 15:32:32,526 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2024-06-06' --> 'data\processed_data\AMD\4_2024-06-06.md'
Converted 'data\edgar_documents\AMD\4_2024-06-07' --> 'data\processed_data\AMD\4_2024-06-07.md'


2025-11-14 15:32:32,552 - INFO - Going to convert document batch...
2025-11-14 15:32:32,553 - INFO - Processing document 4_2024-06-10
2025-11-14 15:32:32,603 - INFO - Finished converting document 4_2024-06-10 in 0.08 sec.
2025-11-14 15:32:32,683 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:32,706 - INFO - Going to convert document batch...
2025-11-14 15:32:32,708 - INFO - Processing document 4_2024-06-11
2025-11-14 15:32:32,771 - INFO - Finished converting document 4_2024-06-11 in 0.11 sec.
2025-11-14 15:32:32,857 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2024-06-10' --> 'data\processed_data\AMD\4_2024-06-10.md'
Converted 'data\edgar_documents\AMD\4_2024-06-11' --> 'data\processed_data\AMD\4_2024-06-11.md'


2025-11-14 15:32:32,882 - INFO - Going to convert document batch...
2025-11-14 15:32:32,884 - INFO - Processing document 4_2024-06-12
2025-11-14 15:32:32,935 - INFO - Finished converting document 4_2024-06-12 in 0.11 sec.
2025-11-14 15:32:32,994 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:33,020 - INFO - Going to convert document batch...
2025-11-14 15:32:33,021 - INFO - Processing document 4_2024-06-13
2025-11-14 15:32:33,083 - INFO - Finished converting document 4_2024-06-13 in 0.09 sec.
2025-11-14 15:32:33,164 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:33,195 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMD\4_2024-06-12' --> 'data\processed_data\AMD\4_2024-06-12.md'
Converted 'data\edgar_documents\AMD\4_2024-06-13' --> 'data\processed_data\AMD\4_2024-06-13.md'


2025-11-14 15:32:33,197 - INFO - Processing document 4_2024-06-18
2025-11-14 15:32:33,283 - INFO - Finished converting document 4_2024-06-18 in 0.12 sec.
2025-11-14 15:32:33,361 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:33,389 - INFO - Going to convert document batch...
2025-11-14 15:32:33,390 - INFO - Processing document 4_2024-07-16
2025-11-14 15:32:33,452 - INFO - Finished converting document 4_2024-07-16 in 0.11 sec.
2025-11-14 15:32:33,547 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2024-06-18' --> 'data\processed_data\AMD\4_2024-06-18.md'
Converted 'data\edgar_documents\AMD\4_2024-07-16' --> 'data\processed_data\AMD\4_2024-07-16.md'


2025-11-14 15:32:33,584 - INFO - Going to convert document batch...
2025-11-14 15:32:33,587 - INFO - Processing document 4_2024-07-17
2025-11-14 15:32:33,696 - INFO - Finished converting document 4_2024-07-17 in 0.17 sec.
2025-11-14 15:32:33,760 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:33,774 - INFO - Going to convert document batch...
2025-11-14 15:32:33,775 - INFO - Processing document 4_2024-08-07
2025-11-14 15:32:33,810 - INFO - Finished converting document 4_2024-08-07 in 0.08 sec.
2025-11-14 15:32:33,890 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2024-07-17' --> 'data\processed_data\AMD\4_2024-07-17.md'
Converted 'data\edgar_documents\AMD\4_2024-08-07' --> 'data\processed_data\AMD\4_2024-08-07.md'


2025-11-14 15:32:33,926 - INFO - Going to convert document batch...
2025-11-14 15:32:33,929 - INFO - Processing document 4_2024-08-13
2025-11-14 15:32:34,028 - INFO - Finished converting document 4_2024-08-13 in 0.16 sec.
2025-11-14 15:32:34,143 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:34,182 - INFO - Going to convert document batch...
2025-11-14 15:32:34,184 - INFO - Processing document 4_2024-08-19
2025-11-14 15:32:34,246 - INFO - Finished converting document 4_2024-08-19 in 0.16 sec.


Converted 'data\edgar_documents\AMD\4_2024-08-13' --> 'data\processed_data\AMD\4_2024-08-13.md'


2025-11-14 15:32:34,316 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:34,345 - INFO - Going to convert document batch...
2025-11-14 15:32:34,347 - INFO - Processing document 4_2024-08-22
2025-11-14 15:32:34,423 - INFO - Finished converting document 4_2024-08-22 in 0.12 sec.


Converted 'data\edgar_documents\AMD\4_2024-08-19' --> 'data\processed_data\AMD\4_2024-08-19.md'


2025-11-14 15:32:34,495 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:34,530 - INFO - Going to convert document batch...
2025-11-14 15:32:34,531 - INFO - Processing document 4_2024-09-13
2025-11-14 15:32:34,602 - INFO - Finished converting document 4_2024-09-13 in 0.11 sec.


Converted 'data\edgar_documents\AMD\4_2024-08-22' --> 'data\processed_data\AMD\4_2024-08-22.md'


2025-11-14 15:32:34,714 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:34,746 - INFO - Going to convert document batch...
2025-11-14 15:32:34,747 - INFO - Processing document 4_2024-09-17
2025-11-14 15:32:34,817 - INFO - Finished converting document 4_2024-09-17 in 0.12 sec.


Converted 'data\edgar_documents\AMD\4_2024-09-13' --> 'data\processed_data\AMD\4_2024-09-13.md'
Converted 'data\edgar_documents\AMD\4_2024-09-17' --> 'data\processed_data\AMD\4_2024-09-17.md'


2025-11-14 15:32:34,895 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:34,921 - INFO - Going to convert document batch...
2025-11-14 15:32:34,923 - INFO - Processing document 4_2024-11-05
2025-11-14 15:32:34,989 - INFO - Finished converting document 4_2024-11-05 in 0.12 sec.
2025-11-14 15:32:35,058 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:35,088 - INFO - Going to convert document batch...
2025-11-14 15:32:35,090 - INFO - Processing document 4_2024-11-07
2025-11-14 15:32:35,150 - INFO - Finished converting document 4_2024-11-07 in 0.09 sec.
2025-11-14 15:32:35,216 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:35,243 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMD\4_2024-11-05' --> 'data\processed_data\AMD\4_2024-11-05.md'
Converted 'data\edgar_documents\AMD\4_2024-11-07' --> 'data\processed_data\AMD\4_2024-11-07.md'


2025-11-14 15:32:35,245 - INFO - Processing document 4_2024-11-08
2025-11-14 15:32:35,308 - INFO - Finished converting document 4_2024-11-08 in 0.12 sec.
2025-11-14 15:32:35,387 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:35,410 - INFO - Going to convert document batch...
2025-11-14 15:32:35,412 - INFO - Processing document 4_2024-12-06
2025-11-14 15:32:35,478 - INFO - Finished converting document 4_2024-12-06 in 0.09 sec.
2025-11-14 15:32:35,559 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2024-11-08' --> 'data\processed_data\AMD\4_2024-11-08.md'
Converted 'data\edgar_documents\AMD\4_2024-12-06' --> 'data\processed_data\AMD\4_2024-12-06.md'


2025-11-14 15:32:35,593 - INFO - Going to convert document batch...
2025-11-14 15:32:35,598 - INFO - Processing document 4_2024-12-17
2025-11-14 15:32:35,706 - INFO - Finished converting document 4_2024-12-17 in 0.16 sec.
2025-11-14 15:32:35,778 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:35,804 - INFO - Going to convert document batch...
2025-11-14 15:32:35,805 - INFO - Processing document 4_2025-01-17
2025-11-14 15:32:35,874 - INFO - Finished converting document 4_2025-01-17 in 0.11 sec.
2025-11-14 15:32:35,971 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2024-12-17' --> 'data\processed_data\AMD\4_2024-12-17.md'
Converted 'data\edgar_documents\AMD\4_2025-01-17' --> 'data\processed_data\AMD\4_2025-01-17.md'


2025-11-14 15:32:35,998 - INFO - Going to convert document batch...
2025-11-14 15:32:35,999 - INFO - Processing document 4_2025-02-12
2025-11-14 15:32:36,066 - INFO - Finished converting document 4_2025-02-12 in 0.12 sec.
2025-11-14 15:32:36,153 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:36,176 - INFO - Going to convert document batch...
2025-11-14 15:32:36,178 - INFO - Processing document 4_2025-02-19
2025-11-14 15:32:36,237 - INFO - Finished converting document 4_2025-02-19 in 0.09 sec.
2025-11-14 15:32:36,295 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:36,326 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMD\4_2025-02-12' --> 'data\processed_data\AMD\4_2025-02-12.md'
Converted 'data\edgar_documents\AMD\4_2025-02-19' --> 'data\processed_data\AMD\4_2025-02-19.md'


2025-11-14 15:32:36,328 - INFO - Processing document 4_2025-03-03
2025-11-14 15:32:36,393 - INFO - Finished converting document 4_2025-03-03 in 0.11 sec.
2025-11-14 15:32:36,488 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:32:36,489 - ERROR - Input document 4_2025-03-10 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:32:36,494 - INFO - Going to convert document batch...
2025-11-14 15:32:36,528 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-1

Converted 'data\edgar_documents\AMD\4_2025-03-03' --> 'data\processed_data\AMD\4_2025-03-03.md'
Error processing data\edgar_documents\AMD\4_2025-03-10: File format not allowed: data\edgar_documents\AMD\4_2025-03-10
Error processing data\edgar_documents\AMD\4_2025-03-12: File format not allowed: data\edgar_documents\AMD\4_2025-03-12


2025-11-14 15:32:36,737 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:36,772 - INFO - Going to convert document batch...
2025-11-14 15:32:36,773 - INFO - Processing document 4_2025-03-18
2025-11-14 15:32:36,838 - INFO - Finished converting document 4_2025-03-18 in 0.11 sec.


Converted 'data\edgar_documents\AMD\4_2025-03-14' --> 'data\processed_data\AMD\4_2025-03-14.md'


2025-11-14 15:32:36,944 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:36,971 - INFO - Going to convert document batch...
2025-11-14 15:32:36,973 - INFO - Processing document 4_2025-04-17
2025-11-14 15:32:37,050 - INFO - Finished converting document 4_2025-04-17 in 0.14 sec.


Converted 'data\edgar_documents\AMD\4_2025-03-18' --> 'data\processed_data\AMD\4_2025-03-18.md'


2025-11-14 15:32:37,133 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:37,164 - INFO - Going to convert document batch...
2025-11-14 15:32:37,165 - INFO - Processing document 4_2025-05-12
2025-11-14 15:32:37,249 - INFO - Finished converting document 4_2025-05-12 in 0.14 sec.


Converted 'data\edgar_documents\AMD\4_2025-04-17' --> 'data\processed_data\AMD\4_2025-04-17.md'
Converted 'data\edgar_documents\AMD\4_2025-05-12' --> 'data\processed_data\AMD\4_2025-05-12.md'


2025-11-14 15:32:37,345 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:37,378 - INFO - Going to convert document batch...
2025-11-14 15:32:37,380 - INFO - Processing document 4_2025-05-16
2025-11-14 15:32:37,451 - INFO - Finished converting document 4_2025-05-16 in 0.14 sec.
2025-11-14 15:32:37,531 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:37,563 - INFO - Going to convert document batch...
2025-11-14 15:32:37,565 - INFO - Processing document 4_2025-05-19
2025-11-14 15:32:37,635 - INFO - Finished converting document 4_2025-05-19 in 0.11 sec.
2025-11-14 15:32:37,708 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2025-05-16' --> 'data\processed_data\AMD\4_2025-05-16.md'
Converted 'data\edgar_documents\AMD\4_2025-05-19' --> 'data\processed_data\AMD\4_2025-05-19.md'


2025-11-14 15:32:37,731 - INFO - Going to convert document batch...
2025-11-14 15:32:37,732 - INFO - Processing document 4_2025-05-22
2025-11-14 15:32:37,786 - INFO - Finished converting document 4_2025-05-22 in 0.09 sec.
2025-11-14 15:32:37,854 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:37,880 - INFO - Going to convert document batch...
2025-11-14 15:32:37,882 - INFO - Processing document 4_2025-06-13
2025-11-14 15:32:37,952 - INFO - Finished converting document 4_2025-06-13 in 0.11 sec.


Converted 'data\edgar_documents\AMD\4_2025-05-22' --> 'data\processed_data\AMD\4_2025-05-22.md'
Converted 'data\edgar_documents\AMD\4_2025-06-13' --> 'data\processed_data\AMD\4_2025-06-13.md'


2025-11-14 15:32:38,064 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:38,125 - INFO - Going to convert document batch...
2025-11-14 15:32:38,128 - INFO - Processing document 4_2025-06-17
2025-11-14 15:32:38,202 - INFO - Finished converting document 4_2025-06-17 in 0.19 sec.
2025-11-14 15:32:38,269 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2025-06-17' --> 'data\processed_data\AMD\4_2025-06-17.md'


2025-11-14 15:32:38,756 - INFO - Going to convert document batch...
2025-11-14 15:32:38,757 - INFO - Processing document 4_2025-07-17
2025-11-14 15:32:38,837 - INFO - Finished converting document 4_2025-07-17 in 0.58 sec.
2025-11-14 15:32:38,925 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:38,958 - INFO - Going to convert document batch...
2025-11-14 15:32:38,960 - INFO - Processing document 4_2025-08-12
2025-11-14 15:32:39,039 - INFO - Finished converting document 4_2025-08-12 in 0.12 sec.


Converted 'data\edgar_documents\AMD\4_2025-07-17' --> 'data\processed_data\AMD\4_2025-07-17.md'
Converted 'data\edgar_documents\AMD\4_2025-08-12' --> 'data\processed_data\AMD\4_2025-08-12.md'


2025-11-14 15:32:39,149 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:39,182 - INFO - Going to convert document batch...
2025-11-14 15:32:39,184 - INFO - Processing document 4_2025-08-15
2025-11-14 15:32:39,263 - INFO - Finished converting document 4_2025-08-15 in 0.16 sec.
2025-11-14 15:32:39,349 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:39,376 - INFO - Going to convert document batch...
2025-11-14 15:32:39,377 - INFO - Processing document 4_2025-08-19
2025-11-14 15:32:39,438 - INFO - Finished converting document 4_2025-08-19 in 0.11 sec.
2025-11-14 15:32:39,525 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2025-08-15' --> 'data\processed_data\AMD\4_2025-08-15.md'
Converted 'data\edgar_documents\AMD\4_2025-08-19' --> 'data\processed_data\AMD\4_2025-08-19.md'


2025-11-14 15:32:39,562 - INFO - Going to convert document batch...
2025-11-14 15:32:39,564 - INFO - Processing document 4_2025-08-25
2025-11-14 15:32:39,644 - INFO - Finished converting document 4_2025-08-25 in 0.14 sec.
2025-11-14 15:32:39,719 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:39,729 - INFO - Going to convert document batch...
2025-11-14 15:32:39,730 - INFO - Processing document 4_2025-09-04
2025-11-14 15:32:39,771 - INFO - Finished converting document 4_2025-09-04 in 0.06 sec.
2025-11-14 15:32:39,836 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:39,878 - INFO - Going to convert document batch...
2025-11-14 15:32:39,880 - INFO - Processing document 4_2025-09-12


Converted 'data\edgar_documents\AMD\4_2025-08-25' --> 'data\processed_data\AMD\4_2025-08-25.md'
Converted 'data\edgar_documents\AMD\4_2025-09-04' --> 'data\processed_data\AMD\4_2025-09-04.md'


2025-11-14 15:32:39,960 - INFO - Finished converting document 4_2025-09-12 in 0.14 sec.
2025-11-14 15:32:40,041 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:40,076 - INFO - Going to convert document batch...
2025-11-14 15:32:40,079 - INFO - Processing document 4_2025-09-17
2025-11-14 15:32:40,175 - INFO - Finished converting document 4_2025-09-17 in 0.16 sec.


Converted 'data\edgar_documents\AMD\4_2025-09-12' --> 'data\processed_data\AMD\4_2025-09-12.md'


2025-11-14 15:32:40,266 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:40,293 - INFO - Going to convert document batch...
2025-11-14 15:32:40,294 - INFO - Processing document 4_2025-09-26
2025-11-14 15:32:40,348 - INFO - Finished converting document 4_2025-09-26 in 0.11 sec.
2025-11-14 15:32:40,428 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2025-09-17' --> 'data\processed_data\AMD\4_2025-09-17.md'
Converted 'data\edgar_documents\AMD\4_2025-09-26' --> 'data\processed_data\AMD\4_2025-09-26.md'


2025-11-14 15:32:40,442 - INFO - Going to convert document batch...
2025-11-14 15:32:40,444 - INFO - Processing document 4_2025-10-08
2025-11-14 15:32:40,515 - INFO - Finished converting document 4_2025-10-08 in 0.11 sec.
2025-11-14 15:32:40,598 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:40,631 - INFO - Going to convert document batch...
2025-11-14 15:32:40,633 - INFO - Processing document 4_2025-10-17
2025-11-14 15:32:40,691 - INFO - Finished converting document 4_2025-10-17 in 0.11 sec.
2025-11-14 15:32:40,785 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\4_2025-10-08' --> 'data\processed_data\AMD\4_2025-10-08.md'
Converted 'data\edgar_documents\AMD\4_2025-10-17' --> 'data\processed_data\AMD\4_2025-10-17.md'


2025-11-14 15:32:40,828 - INFO - Going to convert document batch...
2025-11-14 15:32:40,831 - INFO - Processing document 8-K_2023-01-11
2025-11-14 15:32:40,906 - INFO - Finished converting document 8-K_2023-01-11 in 0.16 sec.
2025-11-14 15:32:40,981 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:41,027 - INFO - Going to convert document batch...
2025-11-14 15:32:41,030 - INFO - Processing document 8-K_2023-01-31
2025-11-14 15:32:41,086 - INFO - Finished converting document 8-K_2023-01-31 in 0.12 sec.


Converted 'data\edgar_documents\AMD\8-K_2023-01-11' --> 'data\processed_data\AMD\8-K_2023-01-11.md'
Converted 'data\edgar_documents\AMD\8-K_2023-01-31' --> 'data\processed_data\AMD\8-K_2023-01-31.md'


2025-11-14 15:32:41,172 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:41,220 - INFO - Going to convert document batch...
2025-11-14 15:32:41,222 - INFO - Processing document 8-K_2023-02-21
2025-11-14 15:32:41,272 - INFO - Finished converting document 8-K_2023-02-21 in 0.12 sec.
2025-11-14 15:32:41,320 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:41,348 - INFO - Going to convert document batch...
2025-11-14 15:32:41,349 - INFO - Processing document 8-K_2023-05-02
2025-11-14 15:32:41,377 - INFO - Finished converting document 8-K_2023-05-02 in 0.08 sec.
2025-11-14 15:32:41,421 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:41,453 - INFO - Going to convert document batch...
2025-11-14 15:32:41,455 - INFO - Processing document 8-K_2023-05-23


Converted 'data\edgar_documents\AMD\8-K_2023-02-21' --> 'data\processed_data\AMD\8-K_2023-02-21.md'
Converted 'data\edgar_documents\AMD\8-K_2023-05-02' --> 'data\processed_data\AMD\8-K_2023-05-02.md'


2025-11-14 15:32:41,536 - INFO - Finished converting document 8-K_2023-05-23 in 0.14 sec.
2025-11-14 15:32:41,596 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:41,650 - INFO - Going to convert document batch...
2025-11-14 15:32:41,651 - INFO - Processing document 8-K_2023-07-10
2025-11-14 15:32:41,699 - INFO - Finished converting document 8-K_2023-07-10 in 0.12 sec.


Converted 'data\edgar_documents\AMD\8-K_2023-05-23' --> 'data\processed_data\AMD\8-K_2023-05-23.md'
Converted 'data\edgar_documents\AMD\8-K_2023-07-10' --> 'data\processed_data\AMD\8-K_2023-07-10.md'


2025-11-14 15:32:41,778 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:41,826 - INFO - Going to convert document batch...
2025-11-14 15:32:41,828 - INFO - Processing document 8-K_2023-08-01
2025-11-14 15:32:41,879 - INFO - Finished converting document 8-K_2023-08-01 in 0.12 sec.
2025-11-14 15:32:41,934 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:41,976 - INFO - Going to convert document batch...
2025-11-14 15:32:41,980 - INFO - Processing document 8-K_2023-10-31
2025-11-14 15:32:42,034 - INFO - Finished converting document 8-K_2023-10-31 in 0.12 sec.
2025-11-14 15:32:42,091 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\8-K_2023-08-01' --> 'data\processed_data\AMD\8-K_2023-08-01.md'
Converted 'data\edgar_documents\AMD\8-K_2023-10-31' --> 'data\processed_data\AMD\8-K_2023-10-31.md'


2025-11-14 15:32:42,124 - INFO - Going to convert document batch...
2025-11-14 15:32:42,130 - INFO - Processing document 8-K_2024-01-30
2025-11-14 15:32:42,207 - INFO - Finished converting document 8-K_2024-01-30 in 0.14 sec.
2025-11-14 15:32:42,263 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:42,294 - INFO - Going to convert document batch...
2025-11-14 15:32:42,296 - INFO - Processing document 8-K_2024-02-20
2025-11-14 15:32:42,379 - INFO - Finished converting document 8-K_2024-02-20 in 0.14 sec.
2025-11-14 15:32:42,440 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\8-K_2024-01-30' --> 'data\processed_data\AMD\8-K_2024-01-30.md'
Converted 'data\edgar_documents\AMD\8-K_2024-02-20' --> 'data\processed_data\AMD\8-K_2024-02-20.md'


2025-11-14 15:32:42,484 - INFO - Going to convert document batch...
2025-11-14 15:32:42,490 - INFO - Processing document 8-K_2024-04-30
2025-11-14 15:32:42,546 - INFO - Finished converting document 8-K_2024-04-30 in 0.14 sec.
2025-11-14 15:32:42,591 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:42,659 - INFO - Going to convert document batch...
2025-11-14 15:32:42,661 - INFO - Processing document 8-K_2024-05-13
2025-11-14 15:32:42,737 - INFO - Finished converting document 8-K_2024-05-13 in 0.16 sec.


Converted 'data\edgar_documents\AMD\8-K_2024-04-30' --> 'data\processed_data\AMD\8-K_2024-04-30.md'
Converted 'data\edgar_documents\AMD\8-K_2024-05-13' --> 'data\processed_data\AMD\8-K_2024-05-13.md'


2025-11-14 15:32:42,814 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:42,866 - INFO - Going to convert document batch...
2025-11-14 15:32:42,867 - INFO - Processing document 8-K_2024-07-02
2025-11-14 15:32:42,929 - INFO - Finished converting document 8-K_2024-07-02 in 0.14 sec.
2025-11-14 15:32:42,976 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:43,010 - INFO - Going to convert document batch...
2025-11-14 15:32:43,012 - INFO - Processing document 8-K_2024-07-22
2025-11-14 15:32:43,059 - INFO - Finished converting document 8-K_2024-07-22 in 0.11 sec.


Converted 'data\edgar_documents\AMD\8-K_2024-07-02' --> 'data\processed_data\AMD\8-K_2024-07-02.md'
Converted 'data\edgar_documents\AMD\8-K_2024-07-22' --> 'data\processed_data\AMD\8-K_2024-07-22.md'


2025-11-14 15:32:43,135 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:43,172 - INFO - Going to convert document batch...
2025-11-14 15:32:43,175 - INFO - Processing document 8-K_2024-07-30
2025-11-14 15:32:43,234 - INFO - Finished converting document 8-K_2024-07-30 in 0.14 sec.
2025-11-14 15:32:43,288 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:43,330 - INFO - Going to convert document batch...
2025-11-14 15:32:43,332 - INFO - Processing document 8-K_2024-08-19
2025-11-14 15:32:43,396 - INFO - Finished converting document 8-K_2024-08-19 in 0.12 sec.
2025-11-14 15:32:43,457 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\8-K_2024-07-30' --> 'data\processed_data\AMD\8-K_2024-07-30.md'
Converted 'data\edgar_documents\AMD\8-K_2024-08-19' --> 'data\processed_data\AMD\8-K_2024-08-19.md'


2025-11-14 15:32:43,474 - INFO - Going to convert document batch...
2025-11-14 15:32:43,475 - INFO - Processing document 8-K_2024-10-29
2025-11-14 15:32:43,547 - INFO - Finished converting document 8-K_2024-10-29 in 0.11 sec.
2025-11-14 15:32:43,589 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:43,630 - INFO - Going to convert document batch...
2025-11-14 15:32:43,633 - INFO - Processing document 8-K_2024-11-18
2025-11-14 15:32:43,685 - INFO - Finished converting document 8-K_2024-11-18 in 0.11 sec.


Converted 'data\edgar_documents\AMD\8-K_2024-10-29' --> 'data\processed_data\AMD\8-K_2024-10-29.md'
Converted 'data\edgar_documents\AMD\8-K_2024-11-18' --> 'data\processed_data\AMD\8-K_2024-11-18.md'


2025-11-14 15:32:43,770 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:43,808 - INFO - Going to convert document batch...
2025-11-14 15:32:43,810 - INFO - Processing document 8-K_2025-02-04
2025-11-14 15:32:43,866 - INFO - Finished converting document 8-K_2025-02-04 in 0.12 sec.
2025-11-14 15:32:43,931 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:43,971 - INFO - Going to convert document batch...
2025-11-14 15:32:43,973 - INFO - Processing document 8-K_2025-02-24
2025-11-14 15:32:44,031 - INFO - Finished converting document 8-K_2025-02-24 in 0.14 sec.


Converted 'data\edgar_documents\AMD\8-K_2025-02-04' --> 'data\processed_data\AMD\8-K_2025-02-04.md'
Converted 'data\edgar_documents\AMD\8-K_2025-02-24' --> 'data\processed_data\AMD\8-K_2025-02-24.md'


2025-11-14 15:32:44,085 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:44,129 - INFO - Going to convert document batch...
2025-11-14 15:32:44,130 - INFO - Processing document 8-K_2025-03-12
2025-11-14 15:32:44,177 - INFO - Finished converting document 8-K_2025-03-12 in 0.12 sec.
2025-11-14 15:32:44,228 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:44,263 - INFO - Going to convert document batch...
2025-11-14 15:32:44,265 - INFO - Processing document 8-K_2025-03-24
2025-11-14 15:32:44,322 - INFO - Finished converting document 8-K_2025-03-24 in 0.11 sec.
2025-11-14 15:32:44,380 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\8-K_2025-03-12' --> 'data\processed_data\AMD\8-K_2025-03-12.md'
Converted 'data\edgar_documents\AMD\8-K_2025-03-24' --> 'data\processed_data\AMD\8-K_2025-03-24.md'


2025-11-14 15:32:44,412 - INFO - Going to convert document batch...
2025-11-14 15:32:44,416 - INFO - Processing document 8-K_2025-03-31
2025-11-14 15:32:44,503 - INFO - Finished converting document 8-K_2025-03-31 in 0.14 sec.
2025-11-14 15:32:44,594 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:44,640 - INFO - Going to convert document batch...
2025-11-14 15:32:44,643 - INFO - Processing document 8-K_2025-04-16
2025-11-14 15:32:44,686 - INFO - Finished converting document 8-K_2025-04-16 in 0.12 sec.
2025-11-14 15:32:44,748 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\8-K_2025-03-31' --> 'data\processed_data\AMD\8-K_2025-03-31.md'
Converted 'data\edgar_documents\AMD\8-K_2025-04-16' --> 'data\processed_data\AMD\8-K_2025-04-16.md'


2025-11-14 15:32:44,781 - INFO - Going to convert document batch...
2025-11-14 15:32:44,782 - INFO - Processing document 8-K_2025-05-06
2025-11-14 15:32:44,854 - INFO - Finished converting document 8-K_2025-05-06 in 0.14 sec.
2025-11-14 15:32:44,917 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:44,965 - INFO - Going to convert document batch...
2025-11-14 15:32:44,968 - INFO - Processing document 8-K_2025-05-16
2025-11-14 15:32:45,080 - INFO - Finished converting document 8-K_2025-05-16 in 0.19 sec.


Converted 'data\edgar_documents\AMD\8-K_2025-05-06' --> 'data\processed_data\AMD\8-K_2025-05-06.md'


2025-11-14 15:32:45,160 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:45,185 - INFO - Going to convert document batch...
2025-11-14 15:32:45,187 - INFO - Processing document 8-K_2025-05-19
2025-11-14 15:32:45,227 - INFO - Finished converting document 8-K_2025-05-19 in 0.08 sec.
2025-11-14 15:32:45,292 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:45,330 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMD\8-K_2025-05-16' --> 'data\processed_data\AMD\8-K_2025-05-16.md'
Converted 'data\edgar_documents\AMD\8-K_2025-05-19' --> 'data\processed_data\AMD\8-K_2025-05-19.md'


2025-11-14 15:32:45,332 - INFO - Processing document 8-K_2025-06-03
2025-11-14 15:32:45,369 - INFO - Finished converting document 8-K_2025-06-03 in 0.09 sec.
2025-11-14 15:32:45,398 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:45,412 - INFO - Going to convert document batch...
2025-11-14 15:32:45,412 - INFO - Processing document 8-K_2025-07-02
2025-11-14 15:32:45,482 - INFO - Finished converting document 8-K_2025-07-02 in 0.11 sec.
2025-11-14 15:32:45,559 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\8-K_2025-06-03' --> 'data\processed_data\AMD\8-K_2025-06-03.md'
Converted 'data\edgar_documents\AMD\8-K_2025-07-02' --> 'data\processed_data\AMD\8-K_2025-07-02.md'


2025-11-14 15:32:45,599 - INFO - Going to convert document batch...
2025-11-14 15:32:45,602 - INFO - Processing document 8-K_2025-08-05
2025-11-14 15:32:45,690 - INFO - Finished converting document 8-K_2025-08-05 in 0.16 sec.
2025-11-14 15:32:45,740 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:45,756 - INFO - Going to convert document batch...
2025-11-14 15:32:45,758 - INFO - Processing document 8-K_2025-08-25
2025-11-14 15:32:45,784 - INFO - Finished converting document 8-K_2025-08-25 in 0.08 sec.
2025-11-14 15:32:45,836 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:45,869 - INFO - Going to convert document batch...
2025-11-14 15:32:45,870 - INFO - Processing document 8-K_2025-10-06
2025-11-14 15:32:45,911 - INFO - Finished converting document 8-K_2025-10-06 in 0.11 sec.


Converted 'data\edgar_documents\AMD\8-K_2025-08-05' --> 'data\processed_data\AMD\8-K_2025-08-05.md'
Converted 'data\edgar_documents\AMD\8-K_2025-08-25' --> 'data\processed_data\AMD\8-K_2025-08-25.md'


2025-11-14 15:32:45,983 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:46,009 - INFO - Going to convert document batch...
2025-11-14 15:32:46,011 - INFO - Processing document 8-K_2025-10-27
2025-11-14 15:32:46,086 - INFO - Finished converting document 8-K_2025-10-27 in 0.12 sec.
2025-11-14 15:32:46,146 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\8-K_2025-10-06' --> 'data\processed_data\AMD\8-K_2025-10-06.md'
Converted 'data\edgar_documents\AMD\8-K_2025-10-27' --> 'data\processed_data\AMD\8-K_2025-10-27.md'


2025-11-14 15:32:46,160 - INFO - Going to convert document batch...
2025-11-14 15:32:46,162 - INFO - Processing document 8-K_2025-11-04
2025-11-14 15:32:46,227 - INFO - Finished converting document 8-K_2025-11-04 in 0.09 sec.
2025-11-14 15:32:46,374 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:32:46,375 - ERROR - Input document DEF-14A_2023-03-31 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:32:46,382 - INFO - Going to convert 

Converted 'data\edgar_documents\AMD\8-K_2025-11-04' --> 'data\processed_data\AMD\8-K_2025-11-04.md'
Error processing data\edgar_documents\AMD\DEF-14A_2023-03-31: File format not allowed: data\edgar_documents\AMD\DEF-14A_2023-03-31


2025-11-14 15:32:46,453 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:32:49,093 - INFO - Going to convert document batch...
2025-11-14 15:32:49,095 - INFO - Processing document DEF-14A_2024-03-25
2025-11-14 15:32:52,718 - INFO - Finished converting document DEF-14A_2024-03-25 in 6.34 sec.
2025-11-14 15:32:54,695 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMD\DEF-14A_2024-03-25' --> 'data\processed_data\AMD\DEF-14A_2024-03-25.md'


2025-11-14 15:32:56,681 - INFO - Going to convert document batch...
2025-11-14 15:32:56,683 - INFO - Processing document DEF-14A_2025-03-28
2025-11-14 15:33:00,552 - INFO - Finished converting document DEF-14A_2025-03-28 in 5.91 sec.


Converted 'data\edgar_documents\AMD\DEF-14A_2025-03-28' --> 'data\processed_data\AMD\DEF-14A_2025-03-28.md'
Processed 144 new files. Errors: 3
Found 92 files to process in data\edgar_documents\AMGN


2025-11-14 15:33:02,328 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:33:04,657 - INFO - Going to convert document batch...
2025-11-14 15:33:04,658 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:33:04,661 - INFO - Processing document 10-K_2023-02-09
2025-11-14 15:33:10,874 - INFO - Finished converting document 10-K_2023-02-09 in 8.72 sec.
2025-11-14 15:33:12,356 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\10-K_2023-02-09' --> 'data\processed_data\AMGN\10-K_2023-02-09.md'


2025-11-14 15:33:14,290 - INFO - Going to convert document batch...
2025-11-14 15:33:14,291 - INFO - Processing document 10-K_2024-02-14
2025-11-14 15:33:19,188 - INFO - Finished converting document 10-K_2024-02-14 in 6.91 sec.
2025-11-14 15:33:21,251 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:33:21,252 - ERROR - Input document 10-K_2025-02-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:33:21,256 - INFO - Going to convert d

Converted 'data\edgar_documents\AMGN\10-K_2024-02-14' --> 'data\processed_data\AMGN\10-K_2024-02-14.md'
Error processing data\edgar_documents\AMGN\10-K_2025-02-14: File format not allowed: data\edgar_documents\AMGN\10-K_2025-02-14


2025-11-14 15:33:22,319 - INFO - Going to convert document batch...
2025-11-14 15:33:22,321 - INFO - Processing document 10-Q_2023-04-28
2025-11-14 15:33:24,730 - INFO - Finished converting document 10-Q_2023-04-28 in 3.48 sec.
2025-11-14 15:33:25,934 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\10-Q_2023-04-28' --> 'data\processed_data\AMGN\10-Q_2023-04-28.md'


2025-11-14 15:33:28,443 - INFO - Going to convert document batch...
2025-11-14 15:33:28,445 - INFO - Processing document 10-Q_2023-08-04
2025-11-14 15:33:31,476 - INFO - Finished converting document 10-Q_2023-08-04 in 5.58 sec.
2025-11-14 15:33:32,726 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\10-Q_2023-08-04' --> 'data\processed_data\AMGN\10-Q_2023-08-04.md'


2025-11-14 15:33:33,516 - INFO - Going to convert document batch...
2025-11-14 15:33:33,517 - INFO - Processing document 10-Q_2023-10-31
2025-11-14 15:33:35,118 - INFO - Finished converting document 10-Q_2023-10-31 in 2.42 sec.
2025-11-14 15:33:36,378 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\10-Q_2023-10-31' --> 'data\processed_data\AMGN\10-Q_2023-10-31.md'


2025-11-14 15:33:37,536 - INFO - Going to convert document batch...
2025-11-14 15:33:37,537 - INFO - Processing document 10-Q_2024-05-03
2025-11-14 15:33:40,362 - INFO - Finished converting document 10-Q_2024-05-03 in 4.01 sec.
2025-11-14 15:33:41,701 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\10-Q_2024-05-03' --> 'data\processed_data\AMGN\10-Q_2024-05-03.md'


2025-11-14 15:33:43,684 - INFO - Going to convert document batch...
2025-11-14 15:33:43,686 - INFO - Processing document 10-Q_2024-08-07
2025-11-14 15:33:47,023 - INFO - Finished converting document 10-Q_2024-08-07 in 5.38 sec.
2025-11-14 15:33:48,483 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\10-Q_2024-08-07' --> 'data\processed_data\AMGN\10-Q_2024-08-07.md'


2025-11-14 15:33:50,929 - INFO - Going to convert document batch...
2025-11-14 15:33:50,931 - INFO - Processing document 10-Q_2024-10-31
2025-11-14 15:33:53,728 - INFO - Finished converting document 10-Q_2024-10-31 in 5.31 sec.
2025-11-14 15:33:55,230 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\10-Q_2024-10-31' --> 'data\processed_data\AMGN\10-Q_2024-10-31.md'


2025-11-14 15:33:57,224 - INFO - Going to convert document batch...
2025-11-14 15:33:57,226 - INFO - Processing document 10-Q_2025-05-02
2025-11-14 15:33:59,879 - INFO - Finished converting document 10-Q_2025-05-02 in 4.70 sec.
2025-11-14 15:34:01,325 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\10-Q_2025-05-02' --> 'data\processed_data\AMGN\10-Q_2025-05-02.md'


2025-11-14 15:34:03,034 - INFO - Going to convert document batch...
2025-11-14 15:34:03,035 - INFO - Processing document 10-Q_2025-08-06
2025-11-14 15:34:06,037 - INFO - Finished converting document 10-Q_2025-08-06 in 4.77 sec.
2025-11-14 15:34:08,850 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\10-Q_2025-08-06' --> 'data\processed_data\AMGN\10-Q_2025-08-06.md'


2025-11-14 15:34:10,487 - INFO - Going to convert document batch...
2025-11-14 15:34:10,489 - INFO - Processing document 10-Q_2025-11-05
2025-11-14 15:34:13,921 - INFO - Finished converting document 10-Q_2025-11-05 in 5.16 sec.
2025-11-14 15:34:15,572 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:34:15,573 - ERROR - Input document 4_2023-02-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:34:15,574 - INFO - Going to convert document batch...
2025-11-14 15:34:15,59

Converted 'data\edgar_documents\AMGN\10-Q_2025-11-05' --> 'data\processed_data\AMGN\10-Q_2025-11-05.md'
Error processing data\edgar_documents\AMGN\4_2023-02-14: File format not allowed: data\edgar_documents\AMGN\4_2023-02-14
Error processing data\edgar_documents\AMGN\4_2023-02-17: File format not allowed: data\edgar_documents\AMGN\4_2023-02-17
Converted 'data\edgar_documents\AMGN\4_2023-03-08' --> 'data\processed_data\AMGN\4_2023-03-08.md'


2025-11-14 15:34:15,770 - INFO - Going to convert document batch...
2025-11-14 15:34:15,772 - INFO - Processing document 4_2023-03-20
2025-11-14 15:34:15,867 - INFO - Finished converting document 4_2023-03-20 in 0.12 sec.
2025-11-14 15:34:15,956 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:15,985 - INFO - Going to convert document batch...
2025-11-14 15:34:15,987 - INFO - Processing document 4_2023-05-02
2025-11-14 15:34:16,048 - INFO - Finished converting document 4_2023-05-02 in 0.11 sec.


Converted 'data\edgar_documents\AMGN\4_2023-03-20' --> 'data\processed_data\AMGN\4_2023-03-20.md'
Converted 'data\edgar_documents\AMGN\4_2023-05-02' --> 'data\processed_data\AMGN\4_2023-05-02.md'


2025-11-14 15:34:16,145 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:16,174 - INFO - Going to convert document batch...
2025-11-14 15:34:16,176 - INFO - Processing document 4_2023-05-03
2025-11-14 15:34:16,214 - INFO - Finished converting document 4_2023-05-03 in 0.11 sec.
2025-11-14 15:34:16,272 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:16,306 - INFO - Going to convert document batch...
2025-11-14 15:34:16,313 - INFO - Processing document 4_2023-05-04
2025-11-14 15:34:16,397 - INFO - Finished converting document 4_2023-05-04 in 0.14 sec.


Converted 'data\edgar_documents\AMGN\4_2023-05-03' --> 'data\processed_data\AMGN\4_2023-05-03.md'


2025-11-14 15:34:16,465 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\4_2023-05-04' --> 'data\processed_data\AMGN\4_2023-05-04.md'


2025-11-14 15:34:17,285 - INFO - Going to convert document batch...
2025-11-14 15:34:17,287 - INFO - Processing document 4_2023-05-09
2025-11-14 15:34:17,332 - INFO - Finished converting document 4_2023-05-09 in 0.89 sec.
2025-11-14 15:34:17,394 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:17,410 - INFO - Going to convert document batch...
2025-11-14 15:34:17,410 - INFO - Processing document 4_2023-05-23
2025-11-14 15:34:17,441 - INFO - Finished converting document 4_2023-05-23 in 0.06 sec.
2025-11-14 15:34:17,515 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:17,545 - INFO - Going to convert document batch...
2025-11-14 15:34:17,547 - INFO - Processing document 4_2023-07-31


Converted 'data\edgar_documents\AMGN\4_2023-05-09' --> 'data\processed_data\AMGN\4_2023-05-09.md'
Converted 'data\edgar_documents\AMGN\4_2023-05-23' --> 'data\processed_data\AMGN\4_2023-05-23.md'


2025-11-14 15:34:17,604 - INFO - Finished converting document 4_2023-07-31 in 0.12 sec.
2025-11-14 15:34:17,684 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:17,713 - INFO - Going to convert document batch...
2025-11-14 15:34:17,714 - INFO - Processing document 4_2023-08-10
2025-11-14 15:34:17,749 - INFO - Finished converting document 4_2023-08-10 in 0.08 sec.
2025-11-14 15:34:17,809 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:17,823 - INFO - Going to convert document batch...
2025-11-14 15:34:17,824 - INFO - Processing document 4_2023-08-11


Converted 'data\edgar_documents\AMGN\4_2023-07-31' --> 'data\processed_data\AMGN\4_2023-07-31.md'
Converted 'data\edgar_documents\AMGN\4_2023-08-10' --> 'data\processed_data\AMGN\4_2023-08-10.md'


2025-11-14 15:34:17,862 - INFO - Finished converting document 4_2023-08-11 in 0.08 sec.
2025-11-14 15:34:17,915 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:17,931 - INFO - Going to convert document batch...
2025-11-14 15:34:17,931 - INFO - Processing document 4_2023-09-19
2025-11-14 15:34:18,003 - INFO - Finished converting document 4_2023-09-19 in 0.11 sec.
2025-11-14 15:34:18,061 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\4_2023-08-11' --> 'data\processed_data\AMGN\4_2023-08-11.md'
Converted 'data\edgar_documents\AMGN\4_2023-09-19' --> 'data\processed_data\AMGN\4_2023-09-19.md'


2025-11-14 15:34:18,085 - INFO - Going to convert document batch...
2025-11-14 15:34:18,087 - INFO - Processing document 4_2023-11-03
2025-11-14 15:34:18,168 - INFO - Finished converting document 4_2023-11-03 in 0.12 sec.
2025-11-14 15:34:18,213 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:18,227 - INFO - Going to convert document batch...
2025-11-14 15:34:18,228 - INFO - Processing document 4_2023-11-07
2025-11-14 15:34:18,281 - INFO - Finished converting document 4_2023-11-07 in 0.08 sec.
2025-11-14 15:34:18,379 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\4_2023-11-03' --> 'data\processed_data\AMGN\4_2023-11-03.md'
Converted 'data\edgar_documents\AMGN\4_2023-11-07' --> 'data\processed_data\AMGN\4_2023-11-07.md'


2025-11-14 15:34:18,395 - INFO - Going to convert document batch...
2025-11-14 15:34:18,396 - INFO - Processing document 4_2023-11-13
2025-11-14 15:34:18,432 - INFO - Finished converting document 4_2023-11-13 in 0.09 sec.
2025-11-14 15:34:18,489 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:18,514 - INFO - Going to convert document batch...
2025-11-14 15:34:18,516 - INFO - Processing document 4_2023-11-29
2025-11-14 15:34:18,581 - INFO - Finished converting document 4_2023-11-29 in 0.11 sec.


Converted 'data\edgar_documents\AMGN\4_2023-11-13' --> 'data\processed_data\AMGN\4_2023-11-13.md'


2025-11-14 15:34:18,693 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:18,709 - INFO - Going to convert document batch...
2025-11-14 15:34:18,710 - INFO - Processing document 4_2023-12-04
2025-11-14 15:34:18,746 - INFO - Finished converting document 4_2023-12-04 in 0.08 sec.
2025-11-14 15:34:18,794 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:18,811 - INFO - Going to convert document batch...
2025-11-14 15:34:18,815 - INFO - Processing document 4_2024-02-12


Converted 'data\edgar_documents\AMGN\4_2023-11-29' --> 'data\processed_data\AMGN\4_2023-11-29.md'
Converted 'data\edgar_documents\AMGN\4_2023-12-04' --> 'data\processed_data\AMGN\4_2023-12-04.md'


2025-11-14 15:34:18,856 - INFO - Finished converting document 4_2024-02-12 in 0.08 sec.
2025-11-14 15:34:18,947 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:18,975 - INFO - Going to convert document batch...
2025-11-14 15:34:18,977 - INFO - Processing document 4_2024-03-08
2025-11-14 15:34:19,030 - INFO - Finished converting document 4_2024-03-08 in 0.11 sec.
2025-11-14 15:34:19,104 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\4_2024-02-12' --> 'data\processed_data\AMGN\4_2024-02-12.md'
Converted 'data\edgar_documents\AMGN\4_2024-03-08' --> 'data\processed_data\AMGN\4_2024-03-08.md'


2025-11-14 15:34:19,123 - INFO - Going to convert document batch...
2025-11-14 15:34:19,125 - INFO - Processing document 4_2024-03-20
2025-11-14 15:34:19,161 - INFO - Finished converting document 4_2024-03-20 in 0.08 sec.
2025-11-14 15:34:19,220 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:19,241 - INFO - Going to convert document batch...
2025-11-14 15:34:19,242 - INFO - Processing document 4_2024-05-01
2025-11-14 15:34:19,280 - INFO - Finished converting document 4_2024-05-01 in 0.08 sec.
2025-11-14 15:34:19,365 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\4_2024-03-20' --> 'data\processed_data\AMGN\4_2024-03-20.md'
Converted 'data\edgar_documents\AMGN\4_2024-05-01' --> 'data\processed_data\AMGN\4_2024-05-01.md'


2025-11-14 15:34:19,392 - INFO - Going to convert document batch...
2025-11-14 15:34:19,395 - INFO - Processing document 4_2024-05-02
2025-11-14 15:34:19,461 - INFO - Finished converting document 4_2024-05-02 in 0.12 sec.
2025-11-14 15:34:19,557 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:19,589 - INFO - Going to convert document batch...
2025-11-14 15:34:19,590 - INFO - Processing document 4_2024-05-03
2025-11-14 15:34:19,626 - INFO - Finished converting document 4_2024-05-03 in 0.09 sec.
2025-11-14 15:34:19,691 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:19,705 - INFO - Going to convert document batch...
2025-11-14 15:34:19,706 - INFO - Processing document 4_2024-05-06
2025-11-14 15:34:19,736 - INFO - Finished converting document 4_2024-05-06 in 0.08 sec.


Converted 'data\edgar_documents\AMGN\4_2024-05-02' --> 'data\processed_data\AMGN\4_2024-05-02.md'
Converted 'data\edgar_documents\AMGN\4_2024-05-03' --> 'data\processed_data\AMGN\4_2024-05-03.md'


2025-11-14 15:34:19,780 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:19,789 - INFO - Going to convert document batch...
2025-11-14 15:34:19,790 - INFO - Processing document 4_2024-05-07
2025-11-14 15:34:19,819 - INFO - Finished converting document 4_2024-05-07 in 0.05 sec.
2025-11-14 15:34:19,897 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:19,924 - INFO - Going to convert document batch...
2025-11-14 15:34:19,926 - INFO - Processing document 4_2024-05-08


Converted 'data\edgar_documents\AMGN\4_2024-05-06' --> 'data\processed_data\AMGN\4_2024-05-06.md'
Converted 'data\edgar_documents\AMGN\4_2024-05-07' --> 'data\processed_data\AMGN\4_2024-05-07.md'


2025-11-14 15:34:20,006 - INFO - Finished converting document 4_2024-05-08 in 0.14 sec.
2025-11-14 15:34:20,082 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:20,112 - INFO - Going to convert document batch...
2025-11-14 15:34:20,115 - INFO - Processing document 4_2024-05-09
2025-11-14 15:34:20,165 - INFO - Finished converting document 4_2024-05-09 in 0.09 sec.
2025-11-14 15:34:20,234 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\4_2024-05-08' --> 'data\processed_data\AMGN\4_2024-05-08.md'
Converted 'data\edgar_documents\AMGN\4_2024-05-09' --> 'data\processed_data\AMGN\4_2024-05-09.md'


2025-11-14 15:34:20,250 - INFO - Going to convert document batch...
2025-11-14 15:34:20,251 - INFO - Processing document 4_2024-06-04
2025-11-14 15:34:20,287 - INFO - Finished converting document 4_2024-06-04 in 0.08 sec.
2025-11-14 15:34:20,340 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:20,371 - INFO - Going to convert document batch...
2025-11-14 15:34:20,373 - INFO - Processing document 4_2024-07-31
2025-11-14 15:34:20,453 - INFO - Finished converting document 4_2024-07-31 in 0.14 sec.


Converted 'data\edgar_documents\AMGN\4_2024-06-04' --> 'data\processed_data\AMGN\4_2024-06-04.md'
Converted 'data\edgar_documents\AMGN\4_2024-07-31' --> 'data\processed_data\AMGN\4_2024-07-31.md'


2025-11-14 15:34:20,518 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:20,537 - INFO - Going to convert document batch...
2025-11-14 15:34:20,540 - INFO - Processing document 4_2024-08-13
2025-11-14 15:34:20,604 - INFO - Finished converting document 4_2024-08-13 in 0.12 sec.
2025-11-14 15:34:20,682 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:20,708 - INFO - Going to convert document batch...
2025-11-14 15:34:20,711 - INFO - Processing document 4_2024-11-06
2025-11-14 15:34:20,756 - INFO - Finished converting document 4_2024-11-06 in 0.09 sec.
2025-11-14 15:34:20,836 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\4_2024-08-13' --> 'data\processed_data\AMGN\4_2024-08-13.md'
Converted 'data\edgar_documents\AMGN\4_2024-11-06' --> 'data\processed_data\AMGN\4_2024-11-06.md'


2025-11-14 15:34:20,882 - INFO - Going to convert document batch...
2025-11-14 15:34:20,884 - INFO - Processing document 4_2024-12-03
2025-11-14 15:34:20,935 - INFO - Finished converting document 4_2024-12-03 in 0.14 sec.
2025-11-14 15:34:20,983 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:20,991 - INFO - Going to convert document batch...
2025-11-14 15:34:20,993 - INFO - Processing document 4_2024-12-06
2025-11-14 15:34:21,023 - INFO - Finished converting document 4_2024-12-06 in 0.05 sec.
2025-11-14 15:34:21,120 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:21,139 - INFO - Going to convert document batch...
2025-11-14 15:34:21,140 - INFO - Processing document 4_2025-02-06


Converted 'data\edgar_documents\AMGN\4_2024-12-03' --> 'data\processed_data\AMGN\4_2024-12-03.md'
Converted 'data\edgar_documents\AMGN\4_2024-12-06' --> 'data\processed_data\AMGN\4_2024-12-06.md'


2025-11-14 15:34:21,195 - INFO - Finished converting document 4_2025-02-06 in 0.09 sec.
2025-11-14 15:34:21,273 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:21,290 - INFO - Going to convert document batch...
2025-11-14 15:34:21,291 - INFO - Processing document 4_2025-02-10
2025-11-14 15:34:21,332 - INFO - Finished converting document 4_2025-02-10 in 0.08 sec.
2025-11-14 15:34:21,417 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:21,442 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMGN\4_2025-02-06' --> 'data\processed_data\AMGN\4_2025-02-06.md'
Converted 'data\edgar_documents\AMGN\4_2025-02-10' --> 'data\processed_data\AMGN\4_2025-02-10.md'


2025-11-14 15:34:21,444 - INFO - Processing document 4_2025-02-13
2025-11-14 15:34:21,516 - INFO - Finished converting document 4_2025-02-13 in 0.12 sec.
2025-11-14 15:34:21,598 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:21,632 - INFO - Going to convert document batch...
2025-11-14 15:34:21,634 - INFO - Processing document 4_2025-02-20
2025-11-14 15:34:21,701 - INFO - Finished converting document 4_2025-02-20 in 0.14 sec.


Converted 'data\edgar_documents\AMGN\4_2025-02-13' --> 'data\processed_data\AMGN\4_2025-02-13.md'
Converted 'data\edgar_documents\AMGN\4_2025-02-20' --> 'data\processed_data\AMGN\4_2025-02-20.md'


2025-11-14 15:34:21,778 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:21,831 - INFO - Going to convert document batch...
2025-11-14 15:34:21,834 - INFO - Processing document 4_2025-02-21
2025-11-14 15:34:21,906 - INFO - Finished converting document 4_2025-02-21 in 0.16 sec.
2025-11-14 15:34:21,986 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:22,005 - INFO - Going to convert document batch...
2025-11-14 15:34:22,005 - INFO - Processing document 4_2025-03-05
2025-11-14 15:34:22,065 - INFO - Finished converting document 4_2025-03-05 in 0.11 sec.


Converted 'data\edgar_documents\AMGN\4_2025-02-21' --> 'data\processed_data\AMGN\4_2025-02-21.md'
Converted 'data\edgar_documents\AMGN\4_2025-03-05' --> 'data\processed_data\AMGN\4_2025-03-05.md'


2025-11-14 15:34:22,155 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:22,186 - INFO - Going to convert document batch...
2025-11-14 15:34:22,188 - INFO - Processing document 4_2025-03-19
2025-11-14 15:34:22,257 - INFO - Finished converting document 4_2025-03-19 in 0.12 sec.
2025-11-14 15:34:22,325 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:22,347 - INFO - Going to convert document batch...
2025-11-14 15:34:22,349 - INFO - Processing document 4_2025-05-02
2025-11-14 15:34:22,395 - INFO - Finished converting document 4_2025-05-02 in 0.08 sec.
2025-11-14 15:34:22,484 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:22,507 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMGN\4_2025-03-19' --> 'data\processed_data\AMGN\4_2025-03-19.md'
Converted 'data\edgar_documents\AMGN\4_2025-05-02' --> 'data\processed_data\AMGN\4_2025-05-02.md'


2025-11-14 15:34:22,508 - INFO - Processing document 4_2025-05-06
2025-11-14 15:34:22,572 - INFO - Finished converting document 4_2025-05-06 in 0.11 sec.
2025-11-14 15:34:22,632 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:22,652 - INFO - Going to convert document batch...
2025-11-14 15:34:22,654 - INFO - Processing document 4_2025-05-08
2025-11-14 15:34:22,700 - INFO - Finished converting document 4_2025-05-08 in 0.08 sec.
2025-11-14 15:34:22,762 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:22,772 - INFO - Going to convert document batch...
2025-11-14 15:34:22,774 - INFO - Processing document 4_2025-05-28


Converted 'data\edgar_documents\AMGN\4_2025-05-06' --> 'data\processed_data\AMGN\4_2025-05-06.md'
Converted 'data\edgar_documents\AMGN\4_2025-05-08' --> 'data\processed_data\AMGN\4_2025-05-08.md'


2025-11-14 15:34:22,824 - INFO - Finished converting document 4_2025-05-28 in 0.09 sec.
2025-11-14 15:34:22,879 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:22,897 - INFO - Going to convert document batch...
2025-11-14 15:34:22,899 - INFO - Processing document 4_2025-06-06
2025-11-14 15:34:22,964 - INFO - Finished converting document 4_2025-06-06 in 0.11 sec.
2025-11-14 15:34:23,044 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\4_2025-05-28' --> 'data\processed_data\AMGN\4_2025-05-28.md'
Converted 'data\edgar_documents\AMGN\4_2025-06-06' --> 'data\processed_data\AMGN\4_2025-06-06.md'


2025-11-14 15:34:23,065 - INFO - Going to convert document batch...
2025-11-14 15:34:23,067 - INFO - Processing document 4_2025-08-12
2025-11-14 15:34:23,124 - INFO - Finished converting document 4_2025-08-12 in 0.11 sec.
2025-11-14 15:34:23,204 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:23,223 - INFO - Going to convert document batch...
2025-11-14 15:34:23,224 - INFO - Processing document 4_2025-08-22
2025-11-14 15:34:23,261 - INFO - Finished converting document 4_2025-08-22 in 0.08 sec.
2025-11-14 15:34:23,322 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:23,353 - INFO - Going to convert document batch...
2025-11-14 15:34:23,355 - INFO - Processing document 4_2025-11-07


Converted 'data\edgar_documents\AMGN\4_2025-08-12' --> 'data\processed_data\AMGN\4_2025-08-12.md'
Converted 'data\edgar_documents\AMGN\4_2025-08-22' --> 'data\processed_data\AMGN\4_2025-08-22.md'


2025-11-14 15:34:23,409 - INFO - Finished converting document 4_2025-11-07 in 0.11 sec.
2025-11-14 15:34:23,487 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:23,523 - INFO - Going to convert document batch...
2025-11-14 15:34:23,524 - INFO - Processing document 8-K_2023-01-31
2025-11-14 15:34:23,582 - INFO - Finished converting document 8-K_2023-01-31 in 0.11 sec.
2025-11-14 15:34:23,643 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\4_2025-11-07' --> 'data\processed_data\AMGN\4_2025-11-07.md'
Converted 'data\edgar_documents\AMGN\8-K_2023-01-31' --> 'data\processed_data\AMGN\8-K_2023-01-31.md'


2025-11-14 15:34:23,688 - INFO - Going to convert document batch...
2025-11-14 15:34:23,690 - INFO - Processing document 8-K_2023-02-16
2025-11-14 15:34:23,735 - INFO - Finished converting document 8-K_2023-02-16 in 0.14 sec.
2025-11-14 15:34:23,776 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:23,805 - INFO - Going to convert document batch...
2025-11-14 15:34:23,807 - INFO - Processing document 8-K_2023-03-02
2025-11-14 15:34:23,864 - INFO - Finished converting document 8-K_2023-03-02 in 0.09 sec.
2025-11-14 15:34:23,929 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:23,950 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMGN\8-K_2023-02-16' --> 'data\processed_data\AMGN\8-K_2023-02-16.md'
Converted 'data\edgar_documents\AMGN\8-K_2023-03-02' --> 'data\processed_data\AMGN\8-K_2023-03-02.md'


2025-11-14 15:34:23,950 - INFO - Processing document 8-K_2023-03-09
2025-11-14 15:34:24,002 - INFO - Finished converting document 8-K_2023-03-09 in 0.11 sec.
2025-11-14 15:34:24,041 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:24,074 - INFO - Going to convert document batch...
2025-11-14 15:34:24,075 - INFO - Processing document 8-K_2023-04-27
2025-11-14 15:34:24,119 - INFO - Finished converting document 8-K_2023-04-27 in 0.09 sec.
2025-11-14 15:34:24,172 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:24,209 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMGN\8-K_2023-03-09' --> 'data\processed_data\AMGN\8-K_2023-03-09.md'
Converted 'data\edgar_documents\AMGN\8-K_2023-04-27' --> 'data\processed_data\AMGN\8-K_2023-04-27.md'


2025-11-14 15:34:24,212 - INFO - Processing document 8-K_2023-05-16
2025-11-14 15:34:24,264 - INFO - Finished converting document 8-K_2023-05-16 in 0.12 sec.
2025-11-14 15:34:24,330 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:24,362 - INFO - Going to convert document batch...
2025-11-14 15:34:24,364 - INFO - Processing document 8-K_2023-05-18
2025-11-14 15:34:24,412 - INFO - Finished converting document 8-K_2023-05-18 in 0.11 sec.
2025-11-14 15:34:24,468 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\8-K_2023-05-16' --> 'data\processed_data\AMGN\8-K_2023-05-16.md'
Converted 'data\edgar_documents\AMGN\8-K_2023-05-18' --> 'data\processed_data\AMGN\8-K_2023-05-18.md'


2025-11-14 15:34:24,526 - INFO - Going to convert document batch...
2025-11-14 15:34:24,528 - INFO - Processing document 8-K_2023-05-22
2025-11-14 15:34:24,631 - INFO - Finished converting document 8-K_2023-05-22 in 0.19 sec.
2025-11-14 15:34:24,691 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:24,716 - INFO - Going to convert document batch...
2025-11-14 15:34:24,720 - INFO - Processing document 8-K_2023-06-05
2025-11-14 15:34:24,769 - INFO - Finished converting document 8-K_2023-06-05 in 0.09 sec.
2025-11-14 15:34:24,825 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:24,871 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMGN\8-K_2023-05-22' --> 'data\processed_data\AMGN\8-K_2023-05-22.md'
Converted 'data\edgar_documents\AMGN\8-K_2023-06-05' --> 'data\processed_data\AMGN\8-K_2023-06-05.md'


2025-11-14 15:34:24,873 - INFO - Processing document 8-K_2023-08-03
2025-11-14 15:34:24,952 - INFO - Finished converting document 8-K_2023-08-03 in 0.16 sec.
2025-11-14 15:34:25,000 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:25,039 - INFO - Going to convert document batch...
2025-11-14 15:34:25,041 - INFO - Processing document 8-K_2023-08-04
2025-11-14 15:34:25,093 - INFO - Finished converting document 8-K_2023-08-04 in 0.11 sec.
2025-11-14 15:34:25,159 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\8-K_2023-08-03' --> 'data\processed_data\AMGN\8-K_2023-08-03.md'
Converted 'data\edgar_documents\AMGN\8-K_2023-08-04' --> 'data\processed_data\AMGN\8-K_2023-08-04.md'


2025-11-14 15:34:25,189 - INFO - Going to convert document batch...
2025-11-14 15:34:25,193 - INFO - Processing document 8-K_2023-09-01
2025-11-14 15:34:25,227 - INFO - Finished converting document 8-K_2023-09-01 in 0.09 sec.
2025-11-14 15:34:25,260 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:25,280 - INFO - Going to convert document batch...
2025-11-14 15:34:25,281 - INFO - Processing document 8-K_2023-09-05
2025-11-14 15:34:25,317 - INFO - Finished converting document 8-K_2023-09-05 in 0.08 sec.
2025-11-14 15:34:25,358 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:25,380 - INFO - Going to convert document batch...
2025-11-14 15:34:25,381 - INFO - Processing document 8-K_2023-09-12
2025-11-14 15:34:25,413 - INFO - Finished converting document 8-K_2023-09-12 in 0.08 sec.


Converted 'data\edgar_documents\AMGN\8-K_2023-09-01' --> 'data\processed_data\AMGN\8-K_2023-09-01.md'
Converted 'data\edgar_documents\AMGN\8-K_2023-09-05' --> 'data\processed_data\AMGN\8-K_2023-09-05.md'


2025-11-14 15:34:25,449 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:25,467 - INFO - Going to convert document batch...
2025-11-14 15:34:25,470 - INFO - Processing document 8-K_2023-10-05
2025-11-14 15:34:25,510 - INFO - Finished converting document 8-K_2023-10-05 in 0.08 sec.
2025-11-14 15:34:25,546 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:25,580 - INFO - Going to convert document batch...
2025-11-14 15:34:25,581 - INFO - Processing document 8-K_2023-10-06
2025-11-14 15:34:25,625 - INFO - Finished converting document 8-K_2023-10-06 in 0.09 sec.


Converted 'data\edgar_documents\AMGN\8-K_2023-09-12' --> 'data\processed_data\AMGN\8-K_2023-09-12.md'
Converted 'data\edgar_documents\AMGN\8-K_2023-10-05' --> 'data\processed_data\AMGN\8-K_2023-10-05.md'


2025-11-14 15:34:25,670 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:25,698 - INFO - Going to convert document batch...
2025-11-14 15:34:25,699 - INFO - Processing document 8-K_2023-10-31
2025-11-14 15:34:25,736 - INFO - Finished converting document 8-K_2023-10-31 in 0.08 sec.
2025-11-14 15:34:25,791 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:25,824 - INFO - Going to convert document batch...
2025-11-14 15:34:25,824 - INFO - Processing document 8-K_2023-12-14


Converted 'data\edgar_documents\AMGN\8-K_2023-10-06' --> 'data\processed_data\AMGN\8-K_2023-10-06.md'
Converted 'data\edgar_documents\AMGN\8-K_2023-10-31' --> 'data\processed_data\AMGN\8-K_2023-10-31.md'


2025-11-14 15:34:25,882 - INFO - Finished converting document 8-K_2023-12-14 in 0.12 sec.
2025-11-14 15:34:25,948 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:34:25,951 - ERROR - Input document 8-K_2024-02-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:34:25,953 - INFO - Going to convert document batch...
2025-11-14 15:34:25,972 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:26,015 - INFO - Going to convert document batch...
2025-11-14

Converted 'data\edgar_documents\AMGN\8-K_2023-12-14' --> 'data\processed_data\AMGN\8-K_2023-12-14.md'
Error processing data\edgar_documents\AMGN\8-K_2024-02-06: File format not allowed: data\edgar_documents\AMGN\8-K_2024-02-06


2025-11-14 15:34:26,125 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\8-K_2024-05-02' --> 'data\processed_data\AMGN\8-K_2024-05-02.md'


2025-11-14 15:34:26,793 - INFO - Going to convert document batch...
2025-11-14 15:34:26,796 - INFO - Processing document 8-K_2024-06-03
2025-11-14 15:34:26,887 - INFO - Finished converting document 8-K_2024-06-03 in 0.78 sec.
2025-11-14 15:34:26,959 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:26,995 - INFO - Going to convert document batch...
2025-11-14 15:34:26,997 - INFO - Processing document 8-K_2024-08-06
2025-11-14 15:34:27,062 - INFO - Finished converting document 8-K_2024-08-06 in 0.12 sec.


Converted 'data\edgar_documents\AMGN\8-K_2024-06-03' --> 'data\processed_data\AMGN\8-K_2024-06-03.md'
Converted 'data\edgar_documents\AMGN\8-K_2024-08-06' --> 'data\processed_data\AMGN\8-K_2024-08-06.md'


2025-11-14 15:34:27,128 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:27,159 - INFO - Going to convert document batch...
2025-11-14 15:34:27,161 - INFO - Processing document 8-K_2024-10-30
2025-11-14 15:34:27,233 - INFO - Finished converting document 8-K_2024-10-30 in 0.14 sec.
2025-11-14 15:34:27,283 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:27,300 - INFO - Going to convert document batch...
2025-11-14 15:34:27,301 - INFO - Processing document 8-K_2025-02-04
2025-11-14 15:34:27,363 - INFO - Finished converting document 8-K_2025-02-04 in 0.09 sec.
2025-11-14 15:34:27,439 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:27,473 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMGN\8-K_2024-10-30' --> 'data\processed_data\AMGN\8-K_2024-10-30.md'
Converted 'data\edgar_documents\AMGN\8-K_2025-02-04' --> 'data\processed_data\AMGN\8-K_2025-02-04.md'


2025-11-14 15:34:27,475 - INFO - Processing document 8-K_2025-05-01
2025-11-14 15:34:27,551 - INFO - Finished converting document 8-K_2025-05-01 in 0.14 sec.
2025-11-14 15:34:27,620 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:27,659 - INFO - Going to convert document batch...
2025-11-14 15:34:27,661 - INFO - Processing document 8-K_2025-05-27
2025-11-14 15:34:27,726 - INFO - Finished converting document 8-K_2025-05-27 in 0.14 sec.


Converted 'data\edgar_documents\AMGN\8-K_2025-05-01' --> 'data\processed_data\AMGN\8-K_2025-05-01.md'
Converted 'data\edgar_documents\AMGN\8-K_2025-05-27' --> 'data\processed_data\AMGN\8-K_2025-05-27.md'


2025-11-14 15:34:27,779 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:27,820 - INFO - Going to convert document batch...
2025-11-14 15:34:27,822 - INFO - Processing document 8-K_2025-08-05
2025-11-14 15:34:27,893 - INFO - Finished converting document 8-K_2025-08-05 in 0.14 sec.
2025-11-14 15:34:27,972 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:34:28,012 - INFO - Going to convert document batch...
2025-11-14 15:34:28,014 - INFO - Processing document 8-K_2025-11-04
2025-11-14 15:34:28,074 - INFO - Finished converting document 8-K_2025-11-04 in 0.14 sec.


Converted 'data\edgar_documents\AMGN\8-K_2025-08-05' --> 'data\processed_data\AMGN\8-K_2025-08-05.md'
Converted 'data\edgar_documents\AMGN\8-K_2025-11-04' --> 'data\processed_data\AMGN\8-K_2025-11-04.md'


2025-11-14 15:34:28,222 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:34:28,224 - ERROR - Input document DEF-14A_2023-04-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:34:28,229 - INFO - Going to convert document batch...
2025-11-14 15:34:28,319 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Error processing data\edgar_documents\AMGN\DEF-14A_2023-04-06: File format not allowed: data\edgar_documents\AMGN\DEF-14A_2023-04-06


2025-11-14 15:34:32,285 - INFO - Going to convert document batch...
2025-11-14 15:34:32,286 - INFO - Processing document DEF-14A_2024-04-17
2025-11-14 15:34:53,622 - INFO - Finished converting document DEF-14A_2024-04-17 in 25.39 sec.
2025-11-14 15:34:57,019 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\DEF-14A_2024-04-17' --> 'data\processed_data\AMGN\DEF-14A_2024-04-17.md'


2025-11-14 15:35:00,992 - INFO - Going to convert document batch...
2025-11-14 15:35:00,993 - INFO - Processing document DEF-14A_2025-04-09
2025-11-14 15:35:08,486 - INFO - Finished converting document DEF-14A_2025-04-09 in 11.62 sec.
2025-11-14 15:35:10,107 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMGN\DEF-14A_2025-04-09' --> 'data\processed_data\AMGN\DEF-14A_2025-04-09.md'
Processed 87 new files. Errors: 5
Found 146 files to process in data\edgar_documents\AMT


2025-11-14 15:35:13,585 - INFO - Going to convert document batch...
2025-11-14 15:35:13,587 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:35:13,589 - INFO - Processing document 10-K_2023-02-23
2025-11-14 15:35:19,428 - INFO - Finished converting document 10-K_2023-02-23 in 9.47 sec.
2025-11-14 15:35:22,453 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\10-K_2023-02-23' --> 'data\processed_data\AMT\10-K_2023-02-23.md'


2025-11-14 15:35:24,761 - INFO - Going to convert document batch...
2025-11-14 15:35:24,762 - INFO - Processing document 10-K_2024-02-27
2025-11-14 15:35:30,733 - INFO - Finished converting document 10-K_2024-02-27 in 8.45 sec.
2025-11-14 15:35:33,067 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\10-K_2024-02-27' --> 'data\processed_data\AMT\10-K_2024-02-27.md'


2025-11-14 15:35:37,183 - INFO - Going to convert document batch...
2025-11-14 15:35:37,185 - INFO - Processing document 10-K_2025-02-25
2025-11-14 15:35:44,650 - INFO - Finished converting document 10-K_2025-02-25 in 11.69 sec.
2025-11-14 15:35:47,180 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\10-K_2025-02-25' --> 'data\processed_data\AMT\10-K_2025-02-25.md'


2025-11-14 15:35:48,702 - INFO - Going to convert document batch...
2025-11-14 15:35:48,703 - INFO - Processing document 10-Q_2023-04-26
2025-11-14 15:35:50,954 - INFO - Finished converting document 10-Q_2023-04-26 in 3.81 sec.
2025-11-14 15:35:53,414 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\10-Q_2023-04-26' --> 'data\processed_data\AMT\10-Q_2023-04-26.md'


2025-11-14 15:35:55,303 - INFO - Going to convert document batch...
2025-11-14 15:35:55,305 - INFO - Processing document 10-Q_2023-07-27
2025-11-14 15:35:59,173 - INFO - Finished converting document 10-Q_2023-07-27 in 5.81 sec.
2025-11-14 15:36:00,728 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\10-Q_2023-07-27' --> 'data\processed_data\AMT\10-Q_2023-07-27.md'


2025-11-14 15:36:02,747 - INFO - Going to convert document batch...
2025-11-14 15:36:02,748 - INFO - Processing document 10-Q_2023-10-26
2025-11-14 15:36:06,894 - INFO - Finished converting document 10-Q_2023-10-26 in 6.25 sec.
2025-11-14 15:36:08,169 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\10-Q_2023-10-26' --> 'data\processed_data\AMT\10-Q_2023-10-26.md'


2025-11-14 15:36:09,483 - INFO - Going to convert document batch...
2025-11-14 15:36:09,485 - INFO - Processing document 10-Q_2024-04-30
2025-11-14 15:36:11,888 - INFO - Finished converting document 10-Q_2024-04-30 in 3.78 sec.
2025-11-14 15:36:13,205 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\10-Q_2024-04-30' --> 'data\processed_data\AMT\10-Q_2024-04-30.md'


2025-11-14 15:36:15,892 - INFO - Going to convert document batch...
2025-11-14 15:36:15,894 - INFO - Processing document 10-Q_2024-07-30
2025-11-14 15:36:18,786 - INFO - Finished converting document 10-Q_2024-07-30 in 5.62 sec.
2025-11-14 15:36:20,163 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\10-Q_2024-07-30' --> 'data\processed_data\AMT\10-Q_2024-07-30.md'


2025-11-14 15:36:22,810 - INFO - Going to convert document batch...
2025-11-14 15:36:22,811 - INFO - Processing document 10-Q_2024-10-29
2025-11-14 15:36:26,070 - INFO - Finished converting document 10-Q_2024-10-29 in 5.98 sec.
2025-11-14 15:36:27,545 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\10-Q_2024-10-29' --> 'data\processed_data\AMT\10-Q_2024-10-29.md'


2025-11-14 15:36:29,378 - INFO - Going to convert document batch...
2025-11-14 15:36:29,379 - INFO - Processing document 10-Q_2025-04-29
2025-11-14 15:36:31,678 - INFO - Finished converting document 10-Q_2025-04-29 in 4.20 sec.
2025-11-14 15:36:32,233 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\10-Q_2025-04-29' --> 'data\processed_data\AMT\10-Q_2025-04-29.md'


2025-11-14 15:36:33,185 - INFO - Going to convert document batch...
2025-11-14 15:36:33,186 - INFO - Processing document 10-Q_2025-07-29
2025-11-14 15:36:34,404 - INFO - Finished converting document 10-Q_2025-07-29 in 2.22 sec.
2025-11-14 15:36:34,999 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\10-Q_2025-07-29' --> 'data\processed_data\AMT\10-Q_2025-07-29.md'


2025-11-14 15:36:35,570 - INFO - Going to convert document batch...
2025-11-14 15:36:35,571 - INFO - Processing document 10-Q_2025-10-28
2025-11-14 15:36:37,060 - INFO - Finished converting document 10-Q_2025-10-28 in 2.11 sec.
2025-11-14 15:36:37,607 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:37,614 - INFO - Going to convert document batch...
2025-11-14 15:36:37,615 - INFO - Processing document 4_2023-01-04
2025-11-14 15:36:37,632 - INFO - Finished converting document 4_2023-01-04 in 0.03 sec.
2025-11-14 15:36:37,665 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:37,679 - INFO - Going to convert document batch...
2025-11-14 15:36:37,680 - INFO - Processing document 4_2023-01-05
2025-11-14 15:36:37,699 - INFO - Finished converting document 4_2023-01-05 in 0.05 sec.
2025-11-14 15:36:37,728 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:37,736 - INFO - Going to convert document batch...
2025-11-14 15:36:37,

Converted 'data\edgar_documents\AMT\10-Q_2025-10-28' --> 'data\processed_data\AMT\10-Q_2025-10-28.md'
Converted 'data\edgar_documents\AMT\4_2023-01-04' --> 'data\processed_data\AMT\4_2023-01-04.md'
Converted 'data\edgar_documents\AMT\4_2023-01-05' --> 'data\processed_data\AMT\4_2023-01-05.md'
Converted 'data\edgar_documents\AMT\4_2023-01-11' --> 'data\processed_data\AMT\4_2023-01-11.md'


2025-11-14 15:36:37,792 - INFO - Going to convert document batch...
2025-11-14 15:36:37,793 - INFO - Processing document 4_2023-01-18
2025-11-14 15:36:37,815 - INFO - Finished converting document 4_2023-01-18 in 0.05 sec.
2025-11-14 15:36:37,845 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:37,853 - INFO - Going to convert document batch...
2025-11-14 15:36:37,853 - INFO - Processing document 4_2023-01-19
2025-11-14 15:36:37,868 - INFO - Finished converting document 4_2023-01-19 in 0.03 sec.
2025-11-14 15:36:37,896 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:37,904 - INFO - Going to convert document batch...
2025-11-14 15:36:37,905 - INFO - Processing document 4_2023-02-06
2025-11-14 15:36:37,924 - INFO - Finished converting document 4_2023-02-06 in 0.03 sec.
2025-11-14 15:36:37,963 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:37,975 - INFO - Going to convert document batch...
2025-11-14 15:36:37,975 - 

Converted 'data\edgar_documents\AMT\4_2023-01-18' --> 'data\processed_data\AMT\4_2023-01-18.md'
Converted 'data\edgar_documents\AMT\4_2023-01-19' --> 'data\processed_data\AMT\4_2023-01-19.md'
Converted 'data\edgar_documents\AMT\4_2023-02-06' --> 'data\processed_data\AMT\4_2023-02-06.md'
Converted 'data\edgar_documents\AMT\4_2023-02-08' --> 'data\processed_data\AMT\4_2023-02-08.md'


2025-11-14 15:36:38,035 - INFO - Going to convert document batch...
2025-11-14 15:36:38,036 - INFO - Processing document 4_2023-02-28
2025-11-14 15:36:38,052 - INFO - Finished converting document 4_2023-02-28 in 0.03 sec.
2025-11-14 15:36:38,080 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:38,091 - INFO - Going to convert document batch...
2025-11-14 15:36:38,091 - INFO - Processing document 4_2023-03-01
2025-11-14 15:36:38,115 - INFO - Finished converting document 4_2023-03-01 in 0.05 sec.
2025-11-14 15:36:38,147 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:38,154 - INFO - Going to convert document batch...
2025-11-14 15:36:38,156 - INFO - Processing document 4_2023-03-14
2025-11-14 15:36:38,172 - INFO - Finished converting document 4_2023-03-14 in 0.03 sec.
2025-11-14 15:36:38,201 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:38,210 - INFO - Going to convert document batch...
2025-11-14 15:36:38,210 - 

Converted 'data\edgar_documents\AMT\4_2023-02-28' --> 'data\processed_data\AMT\4_2023-02-28.md'
Converted 'data\edgar_documents\AMT\4_2023-03-01' --> 'data\processed_data\AMT\4_2023-03-01.md'
Converted 'data\edgar_documents\AMT\4_2023-03-14' --> 'data\processed_data\AMT\4_2023-03-14.md'
Converted 'data\edgar_documents\AMT\4_2023-05-03' --> 'data\processed_data\AMT\4_2023-05-03.md'


2025-11-14 15:36:38,322 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:36:38,323 - ERROR - Input document 4_2023-05-09 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:36:38,325 - INFO - Going to convert document batch...
2025-11-14 15:36:38,352 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:36:38,352 - ERROR - Input document 4_2023-05-10 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\AMT\4_2023-05-09: File format not allowed: data\edgar_documents\AMT\4_2023-05-09
Error processing data\edgar_documents\AMT\4_2023-05-10: File format not allowed: data\edgar_documents\AMT\4_2023-05-10
Error processing data\edgar_documents\AMT\4_2023-05-22: File format not allowed: data\edgar_documents\AMT\4_2023-05-22
Error processing data\edgar_documents\AMT\4_2023-05-23: File format not allowed: data\edgar_documents\AMT\4_2023-05-23
Converted 'data\edgar_documents\AMT\4_2023-05-24' --> 'data\processed_data\AMT\4_2023-05-24.md'


2025-11-14 15:36:38,522 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:38,532 - INFO - Going to convert document batch...
2025-11-14 15:36:38,532 - INFO - Processing document 4_2023-06-05
2025-11-14 15:36:38,549 - INFO - Finished converting document 4_2023-06-05 in 0.05 sec.
2025-11-14 15:36:38,581 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:38,588 - INFO - Going to convert document batch...
2025-11-14 15:36:38,589 - INFO - Processing document 4_2023-07-03
2025-11-14 15:36:38,606 - INFO - Finished converting document 4_2023-07-03 in 0.05 sec.
2025-11-14 15:36:38,638 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:38,646 - INFO - Going to convert document batch...
2025-11-14 15:36:38,646 - INFO - Processing document 4_2023-08-03
2025-11-14 15:36:38,663 - INFO - Finished converting document 4_2023-08-03 in 0.03 sec.
2025-11-14 15:36:38,709 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\AMT\4_2023-06-05' --> 'data\processed_data\AMT\4_2023-06-05.md'
Converted 'data\edgar_documents\AMT\4_2023-07-03' --> 'data\processed_data\AMT\4_2023-07-03.md'
Converted 'data\edgar_documents\AMT\4_2023-08-03' --> 'data\processed_data\AMT\4_2023-08-03.md'


2025-11-14 15:36:38,781 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:38,788 - INFO - Going to convert document batch...
2025-11-14 15:36:38,789 - INFO - Processing document 4_2023-08-14
2025-11-14 15:36:38,806 - INFO - Finished converting document 4_2023-08-14 in 0.03 sec.
2025-11-14 15:36:38,834 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:38,843 - INFO - Going to convert document batch...
2025-11-14 15:36:38,843 - INFO - Processing document 4_2023-08-17
2025-11-14 15:36:38,861 - INFO - Finished converting document 4_2023-08-17 in 0.03 sec.
2025-11-14 15:36:38,891 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:38,902 - INFO - Going to convert document batch...
2025-11-14 15:36:38,902 - INFO - Processing document 4_2023-08-21
2025-11-14 15:36:38,924 - INFO - Finished converting document 4_2023-08-21 in 0.05 sec.
2025-11-14 15:36:38,967 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\AMT\4_2023-08-07' --> 'data\processed_data\AMT\4_2023-08-07.md'
Converted 'data\edgar_documents\AMT\4_2023-08-14' --> 'data\processed_data\AMT\4_2023-08-14.md'
Converted 'data\edgar_documents\AMT\4_2023-08-17' --> 'data\processed_data\AMT\4_2023-08-17.md'
Converted 'data\edgar_documents\AMT\4_2023-08-21' --> 'data\processed_data\AMT\4_2023-08-21.md'


2025-11-14 15:36:38,968 - ERROR - Input document 4_2023-09-12 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:36:38,969 - INFO - Going to convert document batch...
2025-11-14 15:36:38,993 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:36:38,994 - ERROR - Input document 4_2023-09-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\AMT\4_2023-09-12: File format not allowed: data\edgar_documents\AMT\4_2023-09-12
Error processing data\edgar_documents\AMT\4_2023-09-13: File format not allowed: data\edgar_documents\AMT\4_2023-09-13
Converted 'data\edgar_documents\AMT\4_2023-10-04' --> 'data\processed_data\AMT\4_2023-10-04.md'
Converted 'data\edgar_documents\AMT\4_2023-10-18' --> 'data\processed_data\AMT\4_2023-10-18.md'
Error processing data\edgar_documents\AMT\4_2023-10-27: File format not allowed: data\edgar_documents\AMT\4_2023-10-27


2025-11-14 15:36:39,168 - INFO - Finished converting document 4_2023-11-13 in 0.05 sec.
2025-11-14 15:36:39,199 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:39,208 - INFO - Going to convert document batch...
2025-11-14 15:36:39,209 - INFO - Processing document 4_2024-02-28
2025-11-14 15:36:39,228 - INFO - Finished converting document 4_2024-02-28 in 0.03 sec.
2025-11-14 15:36:39,258 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:39,266 - INFO - Going to convert document batch...
2025-11-14 15:36:39,267 - INFO - Processing document 4_2024-03-01
2025-11-14 15:36:39,286 - INFO - Finished converting document 4_2024-03-01 in 0.03 sec.
2025-11-14 15:36:39,329 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:36:39,330 - ERROR - Input document 4_2024-03-04 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFo

Converted 'data\edgar_documents\AMT\4_2023-11-13' --> 'data\processed_data\AMT\4_2023-11-13.md'
Converted 'data\edgar_documents\AMT\4_2024-02-28' --> 'data\processed_data\AMT\4_2024-02-28.md'
Converted 'data\edgar_documents\AMT\4_2024-03-01' --> 'data\processed_data\AMT\4_2024-03-01.md'
Error processing data\edgar_documents\AMT\4_2024-03-04: File format not allowed: data\edgar_documents\AMT\4_2024-03-04


2025-11-14 15:36:39,403 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:39,414 - INFO - Going to convert document batch...
2025-11-14 15:36:39,415 - INFO - Processing document 4_2024-03-06
2025-11-14 15:36:39,439 - INFO - Finished converting document 4_2024-03-06 in 0.05 sec.
2025-11-14 15:36:39,472 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:39,481 - INFO - Going to convert document batch...
2025-11-14 15:36:39,482 - INFO - Processing document 4_2024-03-08
2025-11-14 15:36:39,505 - INFO - Finished converting document 4_2024-03-08 in 0.05 sec.
2025-11-14 15:36:39,537 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:39,545 - INFO - Going to convert document batch...
2025-11-14 15:36:39,545 - INFO - Processing document 4_2024-03-12
2025-11-14 15:36:39,562 - INFO - Finished converting document 4_2024-03-12 in 0.03 sec.


Converted 'data\edgar_documents\AMT\4_2024-03-05' --> 'data\processed_data\AMT\4_2024-03-05.md'
Converted 'data\edgar_documents\AMT\4_2024-03-06' --> 'data\processed_data\AMT\4_2024-03-06.md'
Converted 'data\edgar_documents\AMT\4_2024-03-08' --> 'data\processed_data\AMT\4_2024-03-08.md'
Converted 'data\edgar_documents\AMT\4_2024-03-12' --> 'data\processed_data\AMT\4_2024-03-12.md'


2025-11-14 15:36:39,604 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:39,619 - INFO - Going to convert document batch...
2025-11-14 15:36:39,619 - INFO - Processing document 4_2024-03-19
2025-11-14 15:36:39,640 - INFO - Finished converting document 4_2024-03-19 in 0.06 sec.
2025-11-14 15:36:39,670 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:39,679 - INFO - Going to convert document batch...
2025-11-14 15:36:39,680 - INFO - Processing document 4_2024-05-03
2025-11-14 15:36:39,696 - INFO - Finished converting document 4_2024-05-03 in 0.03 sec.
2025-11-14 15:36:39,727 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:39,734 - INFO - Going to convert document batch...
2025-11-14 15:36:39,735 - INFO - Processing document 4_2024-05-07
2025-11-14 15:36:39,751 - INFO - Finished converting document 4_2024-05-07 in 0.03 sec.
2025-11-14 15:36:39,793 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\AMT\4_2024-03-19' --> 'data\processed_data\AMT\4_2024-03-19.md'
Converted 'data\edgar_documents\AMT\4_2024-05-03' --> 'data\processed_data\AMT\4_2024-05-03.md'
Converted 'data\edgar_documents\AMT\4_2024-05-07' --> 'data\processed_data\AMT\4_2024-05-07.md'
Converted 'data\edgar_documents\AMT\4_2024-05-22' --> 'data\processed_data\AMT\4_2024-05-22.md'


2025-11-14 15:36:39,862 - ERROR - Input document 4_2024-05-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:36:39,863 - INFO - Going to convert document batch...
2025-11-14 15:36:39,874 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:39,883 - INFO - Going to convert document batch...
2025-11-14 15:36:39,884 - INFO - Processing document 4_2024-06-04
2025-11-14 15:36:39,901 - INFO - Finished converting document 4_2024-06-04 in 0.05 sec.
2025-11-14 15:36:39,934 - INFO - detec

Error processing data\edgar_documents\AMT\4_2024-05-23: File format not allowed: data\edgar_documents\AMT\4_2024-05-23
Converted 'data\edgar_documents\AMT\4_2024-06-04' --> 'data\processed_data\AMT\4_2024-06-04.md'
Converted 'data\edgar_documents\AMT\4_2024-06-06' --> 'data\processed_data\AMT\4_2024-06-06.md'
Converted 'data\edgar_documents\AMT\4_2024-08-06' --> 'data\processed_data\AMT\4_2024-08-06.md'


2025-11-14 15:36:40,072 - INFO - Going to convert document batch...
2025-11-14 15:36:40,073 - INFO - Processing document 4_2024-08-28
2025-11-14 15:36:40,094 - INFO - Finished converting document 4_2024-08-28 in 0.05 sec.
2025-11-14 15:36:40,150 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:40,174 - INFO - Going to convert document batch...
2025-11-14 15:36:40,175 - INFO - Processing document 4_2024-09-05
2025-11-14 15:36:40,216 - INFO - Finished converting document 4_2024-09-05 in 0.09 sec.
2025-11-14 15:36:40,264 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:40,273 - INFO - Going to convert document batch...
2025-11-14 15:36:40,274 - INFO - Processing document 4_2024-09-12
2025-11-14 15:36:40,295 - INFO - Finished converting document 4_2024-09-12 in 0.06 sec.


Converted 'data\edgar_documents\AMT\4_2024-08-28' --> 'data\processed_data\AMT\4_2024-08-28.md'
Converted 'data\edgar_documents\AMT\4_2024-09-05' --> 'data\processed_data\AMT\4_2024-09-05.md'


2025-11-14 15:36:40,328 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:40,335 - INFO - Going to convert document batch...
2025-11-14 15:36:40,336 - INFO - Processing document 4_2024-09-17
2025-11-14 15:36:40,353 - INFO - Finished converting document 4_2024-09-17 in 0.03 sec.
2025-11-14 15:36:40,383 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:40,392 - INFO - Going to convert document batch...
2025-11-14 15:36:40,393 - INFO - Processing document 4_2024-10-03
2025-11-14 15:36:40,410 - INFO - Finished converting document 4_2024-10-03 in 0.03 sec.
2025-11-14 15:36:40,451 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:36:40,452 - ERROR - Input document 4_2024-11-18 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <Inp

Converted 'data\edgar_documents\AMT\4_2024-09-12' --> 'data\processed_data\AMT\4_2024-09-12.md'
Converted 'data\edgar_documents\AMT\4_2024-09-17' --> 'data\processed_data\AMT\4_2024-09-17.md'
Converted 'data\edgar_documents\AMT\4_2024-10-03' --> 'data\processed_data\AMT\4_2024-10-03.md'
Error processing data\edgar_documents\AMT\4_2024-11-18: File format not allowed: data\edgar_documents\AMT\4_2024-11-18
Error processing data\edgar_documents\AMT\4_2024-11-19: File format not allowed: data\edgar_documents\AMT\4_2024-11-19


2025-11-14 15:36:40,503 - INFO - Going to convert document batch...
2025-11-14 15:36:40,504 - INFO - Processing document 4_2025-01-07
2025-11-14 15:36:40,524 - INFO - Finished converting document 4_2025-01-07 in 0.03 sec.
2025-11-14 15:36:40,555 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:40,565 - INFO - Going to convert document batch...
2025-11-14 15:36:40,566 - INFO - Processing document 4_2025-01-17
2025-11-14 15:36:40,591 - INFO - Finished converting document 4_2025-01-17 in 0.05 sec.
2025-11-14 15:36:40,628 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:40,638 - INFO - Going to convert document batch...
2025-11-14 15:36:40,639 - INFO - Processing document 4_2025-02-18
2025-11-14 15:36:40,661 - INFO - Finished converting document 4_2025-02-18 in 0.05 sec.
2025-11-14 15:36:40,694 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:40,701 - INFO - Going to convert document batch...
2025-11-14 15:36:40,702 - 

Converted 'data\edgar_documents\AMT\4_2025-01-07' --> 'data\processed_data\AMT\4_2025-01-07.md'
Converted 'data\edgar_documents\AMT\4_2025-01-17' --> 'data\processed_data\AMT\4_2025-01-17.md'
Converted 'data\edgar_documents\AMT\4_2025-02-18' --> 'data\processed_data\AMT\4_2025-02-18.md'


2025-11-14 15:36:40,751 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:40,758 - INFO - Going to convert document batch...
2025-11-14 15:36:40,759 - INFO - Processing document 4_2025-03-03
2025-11-14 15:36:40,776 - INFO - Finished converting document 4_2025-03-03 in 0.05 sec.
2025-11-14 15:36:40,821 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:36:40,822 - ERROR - Input document 4_2025-03-11 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:36

Converted 'data\edgar_documents\AMT\4_2025-02-28' --> 'data\processed_data\AMT\4_2025-02-28.md'
Converted 'data\edgar_documents\AMT\4_2025-03-03' --> 'data\processed_data\AMT\4_2025-03-03.md'
Error processing data\edgar_documents\AMT\4_2025-03-11: File format not allowed: data\edgar_documents\AMT\4_2025-03-11
Converted 'data\edgar_documents\AMT\4_2025-03-12' --> 'data\processed_data\AMT\4_2025-03-12.md'


2025-11-14 15:36:40,927 - INFO - Finished converting document 4_2025-03-19 in 0.03 sec.
2025-11-14 15:36:40,957 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:40,978 - INFO - Going to convert document batch...
2025-11-14 15:36:40,980 - INFO - Processing document 4_2025-04-02
2025-11-14 15:36:41,008 - INFO - Finished converting document 4_2025-04-02 in 0.06 sec.
2025-11-14 15:36:41,042 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:41,056 - INFO - Going to convert document batch...
2025-11-14 15:36:41,057 - INFO - Processing document 4_2025-05-16
2025-11-14 15:36:41,075 - INFO - Finished converting document 4_2025-05-16 in 0.05 sec.


Converted 'data\edgar_documents\AMT\4_2025-03-19' --> 'data\processed_data\AMT\4_2025-03-19.md'
Converted 'data\edgar_documents\AMT\4_2025-04-02' --> 'data\processed_data\AMT\4_2025-04-02.md'
Converted 'data\edgar_documents\AMT\4_2025-05-16' --> 'data\processed_data\AMT\4_2025-05-16.md'


2025-11-14 15:36:41,132 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:36:41,132 - ERROR - Input document 4_2025-05-21 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:36:41,134 - INFO - Going to convert document batch...
2025-11-14 15:36:41,160 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:36:41,161 - ERROR - Input document 4_2025-05-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\AMT\4_2025-05-21: File format not allowed: data\edgar_documents\AMT\4_2025-05-21
Error processing data\edgar_documents\AMT\4_2025-05-22: File format not allowed: data\edgar_documents\AMT\4_2025-05-22
Converted 'data\edgar_documents\AMT\4_2025-06-03' --> 'data\processed_data\AMT\4_2025-06-03.md'
Converted 'data\edgar_documents\AMT\4_2025-08-01' --> 'data\processed_data\AMT\4_2025-08-01.md'
Error processing data\edgar_documents\AMT\4_2025-09-11: File format not allowed: data\edgar_documents\AMT\4_2025-09-11


2025-11-14 15:36:41,334 - ERROR - Input document 4_2025-09-12 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:36:41,336 - INFO - Going to convert document batch...
2025-11-14 15:36:41,349 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:41,357 - INFO - Going to convert document batch...
2025-11-14 15:36:41,358 - INFO - Processing document 4_2025-09-23
2025-11-14 15:36:41,377 - INFO - Finished converting document 4_2025-09-23 in 0.05 sec.
2025-11-14 15:36:41,408 - INFO - detec

Error processing data\edgar_documents\AMT\4_2025-09-12: File format not allowed: data\edgar_documents\AMT\4_2025-09-12
Converted 'data\edgar_documents\AMT\4_2025-09-23' --> 'data\processed_data\AMT\4_2025-09-23.md'
Converted 'data\edgar_documents\AMT\4_2025-10-03' --> 'data\processed_data\AMT\4_2025-10-03.md'


2025-11-14 15:36:41,536 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:41,551 - INFO - Going to convert document batch...
2025-11-14 15:36:41,552 - INFO - Processing document 8-K_2023-02-23
2025-11-14 15:36:41,572 - INFO - Finished converting document 8-K_2023-02-23 in 0.05 sec.
2025-11-14 15:36:41,596 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:41,612 - INFO - Going to convert document batch...
2025-11-14 15:36:41,613 - INFO - Processing document 8-K_2023-03-01
2025-11-14 15:36:41,634 - INFO - Finished converting document 8-K_2023-03-01 in 0.05 sec.
2025-11-14 15:36:41,660 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:41,676 - INFO - Going to convert document batch...
2025-11-14 15:36:41,677 - INFO - Processing document 8-K_2023-03-02
2025-11-14 15:36:41,699 - INFO - Finished converting document 8-K_2023-03-02 in 0.06 sec.


Converted 'data\edgar_documents\AMT\4_2025-11-04' --> 'data\processed_data\AMT\4_2025-11-04.md'
Converted 'data\edgar_documents\AMT\8-K_2023-02-23' --> 'data\processed_data\AMT\8-K_2023-02-23.md'
Converted 'data\edgar_documents\AMT\8-K_2023-03-01' --> 'data\processed_data\AMT\8-K_2023-03-01.md'


2025-11-14 15:36:41,728 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:41,744 - INFO - Going to convert document batch...
2025-11-14 15:36:41,745 - INFO - Processing document 8-K_2023-03-03
2025-11-14 15:36:41,769 - INFO - Finished converting document 8-K_2023-03-03 in 0.05 sec.
2025-11-14 15:36:41,795 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:41,811 - INFO - Going to convert document batch...
2025-11-14 15:36:41,812 - INFO - Processing document 8-K_2023-03-08
2025-11-14 15:36:41,832 - INFO - Finished converting document 8-K_2023-03-08 in 0.05 sec.
2025-11-14 15:36:41,857 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:41,873 - INFO - Going to convert document batch...
2025-11-14 15:36:41,874 - INFO - Processing document 8-K_2023-03-09
2025-11-14 15:36:41,896 - INFO - Finished converting document 8-K_2023-03-09 in 0.05 sec.


Converted 'data\edgar_documents\AMT\8-K_2023-03-02' --> 'data\processed_data\AMT\8-K_2023-03-02.md'
Converted 'data\edgar_documents\AMT\8-K_2023-03-03' --> 'data\processed_data\AMT\8-K_2023-03-03.md'
Converted 'data\edgar_documents\AMT\8-K_2023-03-08' --> 'data\processed_data\AMT\8-K_2023-03-08.md'


2025-11-14 15:36:41,920 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:41,938 - INFO - Going to convert document batch...
2025-11-14 15:36:41,939 - INFO - Processing document 8-K_2023-03-13
2025-11-14 15:36:41,960 - INFO - Finished converting document 8-K_2023-03-13 in 0.05 sec.
2025-11-14 15:36:41,984 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:41,998 - INFO - Going to convert document batch...
2025-11-14 15:36:41,999 - INFO - Processing document 8-K_2023-03-31
2025-11-14 15:36:42,017 - INFO - Finished converting document 8-K_2023-03-31 in 0.05 sec.
2025-11-14 15:36:42,041 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:42,056 - INFO - Going to convert document batch...
2025-11-14 15:36:42,057 - INFO - Processing document 8-K_2023-04-26
2025-11-14 15:36:42,078 - INFO - Finished converting document 8-K_2023-04-26 in 0.05 sec.


Converted 'data\edgar_documents\AMT\8-K_2023-03-09' --> 'data\processed_data\AMT\8-K_2023-03-09.md'
Converted 'data\edgar_documents\AMT\8-K_2023-03-13' --> 'data\processed_data\AMT\8-K_2023-03-13.md'
Converted 'data\edgar_documents\AMT\8-K_2023-03-31' --> 'data\processed_data\AMT\8-K_2023-03-31.md'
Converted 'data\edgar_documents\AMT\8-K_2023-04-26' --> 'data\processed_data\AMT\8-K_2023-04-26.md'


2025-11-14 15:36:42,120 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:42,143 - INFO - Going to convert document batch...
2025-11-14 15:36:42,144 - INFO - Processing document 8-K_2023-05-09
2025-11-14 15:36:42,164 - INFO - Finished converting document 8-K_2023-05-09 in 0.06 sec.
2025-11-14 15:36:42,189 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:42,203 - INFO - Going to convert document batch...
2025-11-14 15:36:42,205 - INFO - Processing document 8-K_2023-05-16
2025-11-14 15:36:42,226 - INFO - Finished converting document 8-K_2023-05-16 in 0.05 sec.
2025-11-14 15:36:42,250 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:42,266 - INFO - Going to convert document batch...
2025-11-14 15:36:42,267 - INFO - Processing document 8-K_2023-05-22
2025-11-14 15:36:42,288 - INFO - Finished converting document 8-K_2023-05-22 in 0.05 sec.
2025-11-14 15:36:42,312 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\AMT\8-K_2023-05-09' --> 'data\processed_data\AMT\8-K_2023-05-09.md'
Converted 'data\edgar_documents\AMT\8-K_2023-05-16' --> 'data\processed_data\AMT\8-K_2023-05-16.md'
Converted 'data\edgar_documents\AMT\8-K_2023-05-22' --> 'data\processed_data\AMT\8-K_2023-05-22.md'


2025-11-14 15:36:42,958 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:42,980 - INFO - Going to convert document batch...
2025-11-14 15:36:42,981 - INFO - Processing document 8-K_2023-06-29
2025-11-14 15:36:43,003 - INFO - Finished converting document 8-K_2023-06-29 in 0.17 sec.


Converted 'data\edgar_documents\AMT\8-K_2023-05-25' --> 'data\processed_data\AMT\8-K_2023-05-25.md'


2025-11-14 15:36:43,027 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:43,044 - INFO - Going to convert document batch...
2025-11-14 15:36:43,045 - INFO - Processing document 8-K_2023-07-20
2025-11-14 15:36:43,067 - INFO - Finished converting document 8-K_2023-07-20 in 0.05 sec.
2025-11-14 15:36:43,164 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:43,180 - INFO - Going to convert document batch...
2025-11-14 15:36:43,181 - INFO - Processing document 8-K_2023-07-27
2025-11-14 15:36:43,201 - INFO - Finished converting document 8-K_2023-07-27 in 0.12 sec.


Converted 'data\edgar_documents\AMT\8-K_2023-06-29' --> 'data\processed_data\AMT\8-K_2023-06-29.md'
Converted 'data\edgar_documents\AMT\8-K_2023-07-20' --> 'data\processed_data\AMT\8-K_2023-07-20.md'


2025-11-14 15:36:43,226 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:43,243 - INFO - Going to convert document batch...
2025-11-14 15:36:43,243 - INFO - Processing document 8-K_2023-09-12
2025-11-14 15:36:43,266 - INFO - Finished converting document 8-K_2023-09-12 in 0.05 sec.
2025-11-14 15:36:43,291 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:43,306 - INFO - Going to convert document batch...
2025-11-14 15:36:43,306 - INFO - Processing document 8-K_2023-09-15
2025-11-14 15:36:43,330 - INFO - Finished converting document 8-K_2023-09-15 in 0.05 sec.
2025-11-14 15:36:43,355 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:43,370 - INFO - Going to convert document batch...
2025-11-14 15:36:43,371 - INFO - Processing document 8-K_2023-09-20
2025-11-14 15:36:43,392 - INFO - Finished converting document 8-K_2023-09-20 in 0.05 sec.


Converted 'data\edgar_documents\AMT\8-K_2023-07-27' --> 'data\processed_data\AMT\8-K_2023-07-27.md'
Converted 'data\edgar_documents\AMT\8-K_2023-09-12' --> 'data\processed_data\AMT\8-K_2023-09-12.md'
Converted 'data\edgar_documents\AMT\8-K_2023-09-15' --> 'data\processed_data\AMT\8-K_2023-09-15.md'
Converted 'data\edgar_documents\AMT\8-K_2023-09-20' --> 'data\processed_data\AMT\8-K_2023-09-20.md'


2025-11-14 15:36:43,437 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:43,454 - INFO - Going to convert document batch...
2025-11-14 15:36:43,455 - INFO - Processing document 8-K_2023-10-26
2025-11-14 15:36:43,487 - INFO - Finished converting document 8-K_2023-10-26 in 0.08 sec.
2025-11-14 15:36:43,523 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:43,539 - INFO - Going to convert document batch...
2025-11-14 15:36:43,540 - INFO - Processing document 8-K_2023-12-14
2025-11-14 15:36:43,564 - INFO - Finished converting document 8-K_2023-12-14 in 0.06 sec.
2025-11-14 15:36:43,590 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:43,606 - INFO - Going to convert document batch...
2025-11-14 15:36:43,607 - INFO - Processing document 8-K_2024-01-05
2025-11-14 15:36:43,630 - INFO - Finished converting document 8-K_2024-01-05 in 0.05 sec.
2025-11-14 15:36:43,659 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\AMT\8-K_2023-10-26' --> 'data\processed_data\AMT\8-K_2023-10-26.md'
Converted 'data\edgar_documents\AMT\8-K_2023-12-14' --> 'data\processed_data\AMT\8-K_2023-12-14.md'
Converted 'data\edgar_documents\AMT\8-K_2024-01-05' --> 'data\processed_data\AMT\8-K_2024-01-05.md'


2025-11-14 15:36:43,720 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:43,733 - INFO - Going to convert document batch...
2025-11-14 15:36:43,734 - INFO - Processing document 8-K_2024-02-27
2025-11-14 15:36:43,757 - INFO - Finished converting document 8-K_2024-02-27 in 0.05 sec.
2025-11-14 15:36:43,780 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:43,794 - INFO - Going to convert document batch...
2025-11-14 15:36:43,795 - INFO - Processing document 8-K_2024-03-01
2025-11-14 15:36:43,819 - INFO - Finished converting document 8-K_2024-03-01 in 0.05 sec.
2025-11-14 15:36:43,845 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:43,858 - INFO - Going to convert document batch...
2025-11-14 15:36:43,859 - INFO - Processing document 8-K_2024-03-04
2025-11-14 15:36:43,882 - INFO - Finished converting document 8-K_2024-03-04 in 0.05 sec.


Converted 'data\edgar_documents\AMT\8-K_2024-02-07' --> 'data\processed_data\AMT\8-K_2024-02-07.md'
Converted 'data\edgar_documents\AMT\8-K_2024-02-27' --> 'data\processed_data\AMT\8-K_2024-02-27.md'
Converted 'data\edgar_documents\AMT\8-K_2024-03-01' --> 'data\processed_data\AMT\8-K_2024-03-01.md'


2025-11-14 15:36:43,907 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:43,923 - INFO - Going to convert document batch...
2025-11-14 15:36:43,923 - INFO - Processing document 8-K_2024-03-07
2025-11-14 15:36:43,949 - INFO - Finished converting document 8-K_2024-03-07 in 0.06 sec.
2025-11-14 15:36:43,974 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:43,988 - INFO - Going to convert document batch...
2025-11-14 15:36:43,989 - INFO - Processing document 8-K_2024-03-14
2025-11-14 15:36:44,014 - INFO - Finished converting document 8-K_2024-03-14 in 0.06 sec.
2025-11-14 15:36:44,042 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:44,055 - INFO - Going to convert document batch...
2025-11-14 15:36:44,056 - INFO - Processing document 8-K_2024-04-30
2025-11-14 15:36:44,079 - INFO - Finished converting document 8-K_2024-04-30 in 0.05 sec.


Converted 'data\edgar_documents\AMT\8-K_2024-03-04' --> 'data\processed_data\AMT\8-K_2024-03-04.md'
Converted 'data\edgar_documents\AMT\8-K_2024-03-07' --> 'data\processed_data\AMT\8-K_2024-03-07.md'
Converted 'data\edgar_documents\AMT\8-K_2024-03-14' --> 'data\processed_data\AMT\8-K_2024-03-14.md'


2025-11-14 15:36:44,102 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:44,115 - INFO - Going to convert document batch...
2025-11-14 15:36:44,116 - INFO - Processing document 8-K_2024-05-22
2025-11-14 15:36:44,140 - INFO - Finished converting document 8-K_2024-05-22 in 0.05 sec.
2025-11-14 15:36:44,165 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:44,184 - INFO - Going to convert document batch...
2025-11-14 15:36:44,185 - INFO - Processing document 8-K_2024-05-24
2025-11-14 15:36:44,220 - INFO - Finished converting document 8-K_2024-05-24 in 0.06 sec.
2025-11-14 15:36:44,252 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:44,268 - INFO - Going to convert document batch...
2025-11-14 15:36:44,268 - INFO - Processing document 8-K_2024-05-29
2025-11-14 15:36:44,291 - INFO - Finished converting document 8-K_2024-05-29 in 0.05 sec.


Converted 'data\edgar_documents\AMT\8-K_2024-04-30' --> 'data\processed_data\AMT\8-K_2024-04-30.md'
Converted 'data\edgar_documents\AMT\8-K_2024-05-22' --> 'data\processed_data\AMT\8-K_2024-05-22.md'
Converted 'data\edgar_documents\AMT\8-K_2024-05-24' --> 'data\processed_data\AMT\8-K_2024-05-24.md'


2025-11-14 15:36:44,317 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:44,331 - INFO - Going to convert document batch...
2025-11-14 15:36:44,332 - INFO - Processing document 8-K_2024-07-30
2025-11-14 15:36:44,358 - INFO - Finished converting document 8-K_2024-07-30 in 0.06 sec.
2025-11-14 15:36:44,383 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:44,397 - INFO - Going to convert document batch...
2025-11-14 15:36:44,397 - INFO - Processing document 8-K_2024-09-12
2025-11-14 15:36:44,418 - INFO - Finished converting document 8-K_2024-09-12 in 0.06 sec.
2025-11-14 15:36:44,444 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:44,459 - INFO - Going to convert document batch...
2025-11-14 15:36:44,460 - INFO - Processing document 8-K_2024-10-29
2025-11-14 15:36:44,482 - INFO - Finished converting document 8-K_2024-10-29 in 0.06 sec.


Converted 'data\edgar_documents\AMT\8-K_2024-05-29' --> 'data\processed_data\AMT\8-K_2024-05-29.md'
Converted 'data\edgar_documents\AMT\8-K_2024-07-30' --> 'data\processed_data\AMT\8-K_2024-07-30.md'
Converted 'data\edgar_documents\AMT\8-K_2024-09-12' --> 'data\processed_data\AMT\8-K_2024-09-12.md'


2025-11-14 15:36:44,510 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:44,522 - INFO - Going to convert document batch...
2025-11-14 15:36:44,523 - INFO - Processing document 8-K_2024-10-31
2025-11-14 15:36:44,543 - INFO - Finished converting document 8-K_2024-10-31 in 0.05 sec.
2025-11-14 15:36:44,566 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:44,580 - INFO - Going to convert document batch...
2025-11-14 15:36:44,580 - INFO - Processing document 8-K_2024-11-19
2025-11-14 15:36:44,604 - INFO - Finished converting document 8-K_2024-11-19 in 0.05 sec.
2025-11-14 15:36:44,629 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:44,646 - INFO - Going to convert document batch...
2025-11-14 15:36:44,647 - INFO - Processing document 8-K_2024-11-21
2025-11-14 15:36:44,673 - INFO - Finished converting document 8-K_2024-11-21 in 0.06 sec.


Converted 'data\edgar_documents\AMT\8-K_2024-10-29' --> 'data\processed_data\AMT\8-K_2024-10-29.md'
Converted 'data\edgar_documents\AMT\8-K_2024-10-31' --> 'data\processed_data\AMT\8-K_2024-10-31.md'
Converted 'data\edgar_documents\AMT\8-K_2024-11-19' --> 'data\processed_data\AMT\8-K_2024-11-19.md'


2025-11-14 15:36:44,697 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:44,712 - INFO - Going to convert document batch...
2025-11-14 15:36:44,712 - INFO - Processing document 8-K_2024-12-05
2025-11-14 15:36:44,740 - INFO - Finished converting document 8-K_2024-12-05 in 0.05 sec.
2025-11-14 15:36:44,763 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:44,801 - INFO - Going to convert document batch...
2025-11-14 15:36:44,804 - INFO - Processing document 8-K_2025-01-07
2025-11-14 15:36:44,855 - INFO - Finished converting document 8-K_2025-01-07 in 0.11 sec.
2025-11-14 15:36:44,882 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\8-K_2024-11-21' --> 'data\processed_data\AMT\8-K_2024-11-21.md'
Converted 'data\edgar_documents\AMT\8-K_2024-12-05' --> 'data\processed_data\AMT\8-K_2024-12-05.md'
Converted 'data\edgar_documents\AMT\8-K_2025-01-07' --> 'data\processed_data\AMT\8-K_2025-01-07.md'


2025-11-14 15:36:44,902 - INFO - Going to convert document batch...
2025-11-14 15:36:44,904 - INFO - Processing document 8-K_2025-01-28
2025-11-14 15:36:44,925 - INFO - Finished converting document 8-K_2025-01-28 in 0.06 sec.
2025-11-14 15:36:44,947 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:44,960 - INFO - Going to convert document batch...
2025-11-14 15:36:44,960 - INFO - Processing document 8-K_2025-02-05
2025-11-14 15:36:44,993 - INFO - Finished converting document 8-K_2025-02-05 in 0.05 sec.
2025-11-14 15:36:45,018 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:45,033 - INFO - Going to convert document batch...
2025-11-14 15:36:45,033 - INFO - Processing document 8-K_2025-02-25
2025-11-14 15:36:45,056 - INFO - Finished converting document 8-K_2025-02-25 in 0.05 sec.
2025-11-14 15:36:45,078 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:45,094 - INFO - Going to convert document batch...
2025-11-14 15:

Converted 'data\edgar_documents\AMT\8-K_2025-01-28' --> 'data\processed_data\AMT\8-K_2025-01-28.md'
Converted 'data\edgar_documents\AMT\8-K_2025-02-05' --> 'data\processed_data\AMT\8-K_2025-02-05.md'
Converted 'data\edgar_documents\AMT\8-K_2025-02-25' --> 'data\processed_data\AMT\8-K_2025-02-25.md'


2025-11-14 15:36:45,149 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:45,162 - INFO - Going to convert document batch...
2025-11-14 15:36:45,163 - INFO - Processing document 8-K_2025-03-06
2025-11-14 15:36:45,189 - INFO - Finished converting document 8-K_2025-03-06 in 0.06 sec.
2025-11-14 15:36:45,213 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:45,226 - INFO - Going to convert document batch...
2025-11-14 15:36:45,227 - INFO - Processing document 8-K_2025-03-11
2025-11-14 15:36:45,248 - INFO - Finished converting document 8-K_2025-03-11 in 0.05 sec.
2025-11-14 15:36:45,272 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:45,288 - INFO - Going to convert document batch...
2025-11-14 15:36:45,288 - INFO - Processing document 8-K_2025-03-14


Converted 'data\edgar_documents\AMT\8-K_2025-03-05' --> 'data\processed_data\AMT\8-K_2025-03-05.md'
Converted 'data\edgar_documents\AMT\8-K_2025-03-06' --> 'data\processed_data\AMT\8-K_2025-03-06.md'
Converted 'data\edgar_documents\AMT\8-K_2025-03-11' --> 'data\processed_data\AMT\8-K_2025-03-11.md'


2025-11-14 15:36:45,314 - INFO - Finished converting document 8-K_2025-03-14 in 0.06 sec.
2025-11-14 15:36:45,341 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:45,355 - INFO - Going to convert document batch...
2025-11-14 15:36:45,355 - INFO - Processing document 8-K_2025-03-20
2025-11-14 15:36:45,374 - INFO - Finished converting document 8-K_2025-03-20 in 0.05 sec.
2025-11-14 15:36:45,397 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:45,410 - INFO - Going to convert document batch...
2025-11-14 15:36:45,411 - INFO - Processing document 8-K_2025-04-29
2025-11-14 15:36:45,433 - INFO - Finished converting document 8-K_2025-04-29 in 0.05 sec.
2025-11-14 15:36:45,460 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:45,479 - INFO - Going to convert document batch...
2025-11-14 15:36:45,481 - INFO - Processing document 8-K_2025-05-15


Converted 'data\edgar_documents\AMT\8-K_2025-03-14' --> 'data\processed_data\AMT\8-K_2025-03-14.md'
Converted 'data\edgar_documents\AMT\8-K_2025-03-20' --> 'data\processed_data\AMT\8-K_2025-03-20.md'
Converted 'data\edgar_documents\AMT\8-K_2025-04-29' --> 'data\processed_data\AMT\8-K_2025-04-29.md'


2025-11-14 15:36:45,524 - INFO - Finished converting document 8-K_2025-05-15 in 0.08 sec.
2025-11-14 15:36:45,575 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:45,601 - INFO - Going to convert document batch...
2025-11-14 15:36:45,603 - INFO - Processing document 8-K_2025-05-21
2025-11-14 15:36:45,633 - INFO - Finished converting document 8-K_2025-05-21 in 0.08 sec.
2025-11-14 15:36:45,663 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:45,679 - INFO - Going to convert document batch...
2025-11-14 15:36:45,679 - INFO - Processing document 8-K_2025-05-30
2025-11-14 15:36:45,701 - INFO - Finished converting document 8-K_2025-05-30 in 0.06 sec.
2025-11-14 15:36:45,728 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:45,741 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMT\8-K_2025-05-15' --> 'data\processed_data\AMT\8-K_2025-05-15.md'
Converted 'data\edgar_documents\AMT\8-K_2025-05-21' --> 'data\processed_data\AMT\8-K_2025-05-21.md'
Converted 'data\edgar_documents\AMT\8-K_2025-05-30' --> 'data\processed_data\AMT\8-K_2025-05-30.md'


2025-11-14 15:36:45,742 - INFO - Processing document 8-K_2025-07-29
2025-11-14 15:36:45,764 - INFO - Finished converting document 8-K_2025-07-29 in 0.05 sec.
2025-11-14 15:36:45,789 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\8-K_2025-07-29' --> 'data\processed_data\AMT\8-K_2025-07-29.md'


2025-11-14 15:36:46,041 - INFO - Going to convert document batch...
2025-11-14 15:36:46,042 - INFO - Processing document 8-K_2025-08-25
2025-11-14 15:36:46,066 - INFO - Finished converting document 8-K_2025-08-25 in 0.28 sec.
2025-11-14 15:36:46,091 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:46,105 - INFO - Going to convert document batch...
2025-11-14 15:36:46,106 - INFO - Processing document 8-K_2025-09-05
2025-11-14 15:36:46,125 - INFO - Finished converting document 8-K_2025-09-05 in 0.05 sec.
2025-11-14 15:36:46,170 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:46,185 - INFO - Going to convert document batch...
2025-11-14 15:36:46,186 - INFO - Processing document 8-K_2025-09-11
2025-11-14 15:36:46,207 - INFO - Finished converting document 8-K_2025-09-11 in 0.06 sec.
2025-11-14 15:36:46,231 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:46,248 - INFO - Going to convert document batch...
2025-11-14 15:

Converted 'data\edgar_documents\AMT\8-K_2025-08-25' --> 'data\processed_data\AMT\8-K_2025-08-25.md'
Converted 'data\edgar_documents\AMT\8-K_2025-09-05' --> 'data\processed_data\AMT\8-K_2025-09-05.md'
Converted 'data\edgar_documents\AMT\8-K_2025-09-11' --> 'data\processed_data\AMT\8-K_2025-09-11.md'


2025-11-14 15:36:46,297 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:46,311 - INFO - Going to convert document batch...
2025-11-14 15:36:46,312 - INFO - Processing document 8-K_2025-09-18
2025-11-14 15:36:46,349 - INFO - Finished converting document 8-K_2025-09-18 in 0.06 sec.
2025-11-14 15:36:46,383 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:46,395 - INFO - Going to convert document batch...
2025-11-14 15:36:46,396 - INFO - Processing document 8-K_2025-09-24
2025-11-14 15:36:46,414 - INFO - Finished converting document 8-K_2025-09-24 in 0.05 sec.
2025-11-14 15:36:46,436 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:46,450 - INFO - Going to convert document batch...
2025-11-14 15:36:46,450 - INFO - Processing document 8-K_2025-10-28
2025-11-14 15:36:46,471 - INFO - Finished converting document 8-K_2025-10-28 in 0.05 sec.


Converted 'data\edgar_documents\AMT\8-K_2025-09-16' --> 'data\processed_data\AMT\8-K_2025-09-16.md'
Converted 'data\edgar_documents\AMT\8-K_2025-09-18' --> 'data\processed_data\AMT\8-K_2025-09-18.md'
Converted 'data\edgar_documents\AMT\8-K_2025-09-24' --> 'data\processed_data\AMT\8-K_2025-09-24.md'


2025-11-14 15:36:46,495 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:36:46,508 - INFO - Going to convert document batch...
2025-11-14 15:36:46,509 - INFO - Processing document 8-K_2025-11-07
2025-11-14 15:36:46,527 - INFO - Finished converting document 8-K_2025-11-07 in 0.05 sec.
2025-11-14 15:36:46,569 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\8-K_2025-10-28' --> 'data\processed_data\AMT\8-K_2025-10-28.md'
Converted 'data\edgar_documents\AMT\8-K_2025-11-07' --> 'data\processed_data\AMT\8-K_2025-11-07.md'


2025-11-14 15:36:46,982 - INFO - Going to convert document batch...
2025-11-14 15:36:46,983 - INFO - Processing document DEF-14A_2023-04-12
2025-11-14 15:36:48,897 - INFO - Finished converting document DEF-14A_2023-04-12 in 2.36 sec.
2025-11-14 15:36:49,729 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\DEF-14A_2023-04-12' --> 'data\processed_data\AMT\DEF-14A_2023-04-12.md'


2025-11-14 15:36:50,145 - INFO - Going to convert document batch...
2025-11-14 15:36:50,146 - INFO - Processing document DEF-14A_2024-04-10
2025-11-14 15:36:52,019 - INFO - Finished converting document DEF-14A_2024-04-10 in 2.33 sec.
2025-11-14 15:36:52,922 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\DEF-14A_2024-04-10' --> 'data\processed_data\AMT\DEF-14A_2024-04-10.md'


2025-11-14 15:36:53,655 - INFO - Going to convert document batch...
2025-11-14 15:36:53,656 - INFO - Processing document DEF-14A_2025-04-02
2025-11-14 15:36:56,890 - INFO - Finished converting document DEF-14A_2025-04-02 in 4.08 sec.
2025-11-14 15:36:58,504 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMT\DEF-14A_2025-04-02' --> 'data\processed_data\AMT\DEF-14A_2025-04-02.md'
Processed 130 new files. Errors: 16
Found 169 files to process in data\edgar_documents\AMZN


2025-11-14 15:36:59,170 - INFO - Going to convert document batch...
2025-11-14 15:36:59,170 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:36:59,170 - INFO - Processing document 10-K_2023-02-03
2025-11-14 15:37:00,025 - INFO - Finished converting document 10-K_2023-02-03 in 1.56 sec.
2025-11-14 15:37:00,412 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\10-K_2023-02-03' --> 'data\processed_data\AMZN\10-K_2023-02-03.md'


2025-11-14 15:37:01,007 - INFO - Going to convert document batch...
2025-11-14 15:37:01,007 - INFO - Processing document 10-K_2024-02-02
2025-11-14 15:37:01,888 - INFO - Finished converting document 10-K_2024-02-02 in 1.52 sec.
2025-11-14 15:37:02,280 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\10-K_2024-02-02' --> 'data\processed_data\AMZN\10-K_2024-02-02.md'


2025-11-14 15:37:02,670 - INFO - Going to convert document batch...
2025-11-14 15:37:02,670 - INFO - Processing document 10-K_2025-02-07
2025-11-14 15:37:03,548 - INFO - Finished converting document 10-K_2025-02-07 in 1.30 sec.
2025-11-14 15:37:03,930 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\10-K_2025-02-07' --> 'data\processed_data\AMZN\10-K_2025-02-07.md'


2025-11-14 15:37:04,506 - INFO - Going to convert document batch...
2025-11-14 15:37:04,507 - INFO - Processing document 10-Q_2023-04-28
2025-11-14 15:37:04,953 - INFO - Finished converting document 10-Q_2023-04-28 in 1.05 sec.
2025-11-14 15:37:05,217 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\10-Q_2023-04-28' --> 'data\processed_data\AMZN\10-Q_2023-04-28.md'


2025-11-14 15:37:05,491 - INFO - Going to convert document batch...
2025-11-14 15:37:05,492 - INFO - Processing document 10-Q_2023-08-04
2025-11-14 15:37:06,023 - INFO - Finished converting document 10-Q_2023-08-04 in 0.83 sec.
2025-11-14 15:37:06,321 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\10-Q_2023-08-04' --> 'data\processed_data\AMZN\10-Q_2023-08-04.md'


2025-11-14 15:37:06,605 - INFO - Going to convert document batch...
2025-11-14 15:37:06,606 - INFO - Processing document 10-Q_2023-10-27
2025-11-14 15:37:07,424 - INFO - Finished converting document 10-Q_2023-10-27 in 1.12 sec.
2025-11-14 15:37:07,731 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\10-Q_2023-10-27' --> 'data\processed_data\AMZN\10-Q_2023-10-27.md'


2025-11-14 15:37:07,999 - INFO - Going to convert document batch...
2025-11-14 15:37:07,999 - INFO - Processing document 10-Q_2024-05-01
2025-11-14 15:37:08,508 - INFO - Finished converting document 10-Q_2024-05-01 in 0.80 sec.
2025-11-14 15:37:08,799 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\10-Q_2024-05-01' --> 'data\processed_data\AMZN\10-Q_2024-05-01.md'


2025-11-14 15:37:09,080 - INFO - Going to convert document batch...
2025-11-14 15:37:09,081 - INFO - Processing document 10-Q_2024-08-02
2025-11-14 15:37:09,628 - INFO - Finished converting document 10-Q_2024-08-02 in 0.86 sec.
2025-11-14 15:37:09,953 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\10-Q_2024-08-02' --> 'data\processed_data\AMZN\10-Q_2024-08-02.md'


2025-11-14 15:37:10,587 - INFO - Going to convert document batch...
2025-11-14 15:37:10,588 - INFO - Processing document 10-Q_2024-11-01
2025-11-14 15:37:11,147 - INFO - Finished converting document 10-Q_2024-11-01 in 1.22 sec.
2025-11-14 15:37:11,452 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\10-Q_2024-11-01' --> 'data\processed_data\AMZN\10-Q_2024-11-01.md'


2025-11-14 15:37:11,692 - INFO - Going to convert document batch...
2025-11-14 15:37:11,692 - INFO - Processing document 10-Q_2025-05-02
2025-11-14 15:37:12,152 - INFO - Finished converting document 10-Q_2025-05-02 in 0.73 sec.
2025-11-14 15:37:12,427 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\10-Q_2025-05-02' --> 'data\processed_data\AMZN\10-Q_2025-05-02.md'


2025-11-14 15:37:12,999 - INFO - Going to convert document batch...
2025-11-14 15:37:12,999 - INFO - Processing document 10-Q_2025-08-01
2025-11-14 15:37:13,583 - INFO - Finished converting document 10-Q_2025-08-01 in 1.19 sec.
2025-11-14 15:37:13,929 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\10-Q_2025-08-01' --> 'data\processed_data\AMZN\10-Q_2025-08-01.md'


2025-11-14 15:37:14,220 - INFO - Going to convert document batch...
2025-11-14 15:37:14,221 - INFO - Processing document 10-Q_2025-10-31
2025-11-14 15:37:14,786 - INFO - Finished converting document 10-Q_2025-10-31 in 0.89 sec.
2025-11-14 15:37:15,075 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:15,088 - INFO - Going to convert document batch...
2025-11-14 15:37:15,089 - INFO - Processing document 4_2023-02-06
2025-11-14 15:37:15,124 - INFO - Finished converting document 4_2023-02-06 in 0.06 sec.
2025-11-14 15:37:15,222 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:15,232 - INFO - Going to convert document batch...
2025-11-14 15:37:15,233 - INFO - Processing document 4_2023-02-08
2025-11-14 15:37:15,251 - INFO - Finished converting document 4_2023-02-08 in 0.06 sec.


Converted 'data\edgar_documents\AMZN\10-Q_2025-10-31' --> 'data\processed_data\AMZN\10-Q_2025-10-31.md'
Converted 'data\edgar_documents\AMZN\4_2023-02-06' --> 'data\processed_data\AMZN\4_2023-02-06.md'


2025-11-14 15:37:15,283 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:15,292 - INFO - Going to convert document batch...
2025-11-14 15:37:15,293 - INFO - Processing document 4_2023-02-17
2025-11-14 15:37:15,317 - INFO - Finished converting document 4_2023-02-17 in 0.05 sec.
2025-11-14 15:37:15,376 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:15,390 - INFO - Going to convert document batch...
2025-11-14 15:37:15,391 - INFO - Processing document 4_2023-02-23
2025-11-14 15:37:15,416 - INFO - Finished converting document 4_2023-02-23 in 0.06 sec.
2025-11-14 15:37:15,457 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\4_2023-02-08' --> 'data\processed_data\AMZN\4_2023-02-08.md'
Converted 'data\edgar_documents\AMZN\4_2023-02-17' --> 'data\processed_data\AMZN\4_2023-02-17.md'
Converted 'data\edgar_documents\AMZN\4_2023-02-23' --> 'data\processed_data\AMZN\4_2023-02-23.md'


2025-11-14 15:37:15,465 - INFO - Going to convert document batch...
2025-11-14 15:37:15,466 - INFO - Processing document 4_2023-02-24
2025-11-14 15:37:15,486 - INFO - Finished converting document 4_2023-02-24 in 0.05 sec.
2025-11-14 15:37:15,517 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:15,525 - INFO - Going to convert document batch...
2025-11-14 15:37:15,526 - INFO - Processing document 4_2023-03-03
2025-11-14 15:37:15,546 - INFO - Finished converting document 4_2023-03-03 in 0.05 sec.
2025-11-14 15:37:15,578 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:15,585 - INFO - Going to convert document batch...
2025-11-14 15:37:15,586 - INFO - Processing document 4_2023-03-23
2025-11-14 15:37:15,607 - INFO - Finished converting document 4_2023-03-23 in 0.05 sec.
2025-11-14 15:37:15,644 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:15,654 - INFO - Going to convert document batch...
2025-11-14 15:37:15,655 - 

Converted 'data\edgar_documents\AMZN\4_2023-02-24' --> 'data\processed_data\AMZN\4_2023-02-24.md'
Converted 'data\edgar_documents\AMZN\4_2023-03-03' --> 'data\processed_data\AMZN\4_2023-03-03.md'
Converted 'data\edgar_documents\AMZN\4_2023-03-23' --> 'data\processed_data\AMZN\4_2023-03-23.md'
Converted 'data\edgar_documents\AMZN\4_2023-04-05' --> 'data\processed_data\AMZN\4_2023-04-05.md'


2025-11-14 15:37:15,716 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:15,726 - INFO - Going to convert document batch...
2025-11-14 15:37:15,727 - INFO - Processing document 4_2023-04-06
2025-11-14 15:37:15,753 - INFO - Finished converting document 4_2023-04-06 in 0.05 sec.
2025-11-14 15:37:15,795 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:15,806 - INFO - Going to convert document batch...
2025-11-14 15:37:15,807 - INFO - Processing document 4_2023-04-21
2025-11-14 15:37:15,835 - INFO - Finished converting document 4_2023-04-21 in 0.05 sec.
2025-11-14 15:37:15,880 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:15,888 - INFO - Going to convert document batch...
2025-11-14 15:37:15,889 - INFO - Processing document 4_2023-05-03
2025-11-14 15:37:15,909 - INFO - Finished converting document 4_2023-05-03 in 0.03 sec.
2025-11-14 15:37:15,947 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\AMZN\4_2023-04-06' --> 'data\processed_data\AMZN\4_2023-04-06.md'
Converted 'data\edgar_documents\AMZN\4_2023-04-21' --> 'data\processed_data\AMZN\4_2023-04-21.md'
Converted 'data\edgar_documents\AMZN\4_2023-05-03' --> 'data\processed_data\AMZN\4_2023-05-03.md'


2025-11-14 15:37:15,983 - INFO - Finished converting document 4_2023-05-08 in 0.05 sec.
2025-11-14 15:37:16,023 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:16,037 - INFO - Going to convert document batch...
2025-11-14 15:37:16,037 - INFO - Processing document 4_2023-05-17
2025-11-14 15:37:16,069 - INFO - Finished converting document 4_2023-05-17 in 0.05 sec.
2025-11-14 15:37:16,133 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:16,148 - INFO - Going to convert document batch...
2025-11-14 15:37:16,149 - INFO - Processing document 4_2023-05-18
2025-11-14 15:37:16,172 - INFO - Finished converting document 4_2023-05-18 in 0.06 sec.
2025-11-14 15:37:16,208 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\4_2023-05-08' --> 'data\processed_data\AMZN\4_2023-05-08.md'
Converted 'data\edgar_documents\AMZN\4_2023-05-17' --> 'data\processed_data\AMZN\4_2023-05-17.md'
Converted 'data\edgar_documents\AMZN\4_2023-05-18' --> 'data\processed_data\AMZN\4_2023-05-18.md'


2025-11-14 15:37:16,222 - INFO - Going to convert document batch...
2025-11-14 15:37:16,223 - INFO - Processing document 4_2023-05-23
2025-11-14 15:37:16,258 - INFO - Finished converting document 4_2023-05-23 in 0.05 sec.
2025-11-14 15:37:16,303 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\4_2023-05-23' --> 'data\processed_data\AMZN\4_2023-05-23.md'


2025-11-14 15:37:16,652 - INFO - Going to convert document batch...
2025-11-14 15:37:16,653 - INFO - Processing document 4_2023-05-26
2025-11-14 15:37:16,673 - INFO - Finished converting document 4_2023-05-26 in 0.38 sec.
2025-11-14 15:37:16,713 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:16,720 - INFO - Going to convert document batch...
2025-11-14 15:37:16,721 - INFO - Processing document 4_2023-06-05
2025-11-14 15:37:16,740 - INFO - Finished converting document 4_2023-06-05 in 0.03 sec.
2025-11-14 15:37:16,787 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:16,806 - INFO - Going to convert document batch...
2025-11-14 15:37:16,807 - INFO - Processing document 4_2023-06-08
2025-11-14 15:37:16,837 - INFO - Finished converting document 4_2023-06-08 in 0.06 sec.
2025-11-14 15:37:16,895 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\4_2023-05-26' --> 'data\processed_data\AMZN\4_2023-05-26.md'
Converted 'data\edgar_documents\AMZN\4_2023-06-05' --> 'data\processed_data\AMZN\4_2023-06-05.md'
Converted 'data\edgar_documents\AMZN\4_2023-06-08' --> 'data\processed_data\AMZN\4_2023-06-08.md'


2025-11-14 15:37:16,909 - INFO - Going to convert document batch...
2025-11-14 15:37:16,911 - INFO - Processing document 4_2023-06-23
2025-11-14 15:37:16,944 - INFO - Finished converting document 4_2023-06-23 in 0.08 sec.
2025-11-14 15:37:16,986 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:16,994 - INFO - Going to convert document batch...
2025-11-14 15:37:16,994 - INFO - Processing document 4_2023-07-06
2025-11-14 15:37:17,013 - INFO - Finished converting document 4_2023-07-06 in 0.05 sec.
2025-11-14 15:37:17,047 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:17,057 - INFO - Going to convert document batch...
2025-11-14 15:37:17,058 - INFO - Processing document 4_2023-07-10
2025-11-14 15:37:17,084 - INFO - Finished converting document 4_2023-07-10 in 0.05 sec.
2025-11-14 15:37:17,141 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:17,158 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMZN\4_2023-06-23' --> 'data\processed_data\AMZN\4_2023-06-23.md'
Converted 'data\edgar_documents\AMZN\4_2023-07-06' --> 'data\processed_data\AMZN\4_2023-07-06.md'
Converted 'data\edgar_documents\AMZN\4_2023-07-10' --> 'data\processed_data\AMZN\4_2023-07-10.md'


2025-11-14 15:37:17,161 - INFO - Processing document 4_2023-07-26
2025-11-14 15:37:17,182 - INFO - Finished converting document 4_2023-07-26 in 0.08 sec.
2025-11-14 15:37:17,216 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:17,223 - INFO - Going to convert document batch...
2025-11-14 15:37:17,224 - INFO - Processing document 4_2023-08-03
2025-11-14 15:37:17,242 - INFO - Finished converting document 4_2023-08-03 in 0.03 sec.
2025-11-14 15:37:17,287 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:17,303 - INFO - Going to convert document batch...
2025-11-14 15:37:17,305 - INFO - Processing document 4_2023-08-08
2025-11-14 15:37:17,353 - INFO - Finished converting document 4_2023-08-08 in 0.08 sec.
2025-11-14 15:37:17,384 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\4_2023-07-26' --> 'data\processed_data\AMZN\4_2023-07-26.md'
Converted 'data\edgar_documents\AMZN\4_2023-08-03' --> 'data\processed_data\AMZN\4_2023-08-03.md'
Converted 'data\edgar_documents\AMZN\4_2023-08-08' --> 'data\processed_data\AMZN\4_2023-08-08.md'


2025-11-14 15:37:17,393 - INFO - Going to convert document batch...
2025-11-14 15:37:17,393 - INFO - Processing document 4_2023-08-11
2025-11-14 15:37:17,411 - INFO - Finished converting document 4_2023-08-11 in 0.03 sec.
2025-11-14 15:37:17,445 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:17,457 - INFO - Going to convert document batch...
2025-11-14 15:37:17,457 - INFO - Processing document 4_2023-08-17
2025-11-14 15:37:17,486 - INFO - Finished converting document 4_2023-08-17 in 0.05 sec.
2025-11-14 15:37:17,523 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:17,537 - INFO - Going to convert document batch...
2025-11-14 15:37:17,539 - INFO - Processing document 4_2023-08-23
2025-11-14 15:37:17,572 - INFO - Finished converting document 4_2023-08-23 in 0.05 sec.
2025-11-14 15:37:17,613 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:17,623 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMZN\4_2023-08-11' --> 'data\processed_data\AMZN\4_2023-08-11.md'
Converted 'data\edgar_documents\AMZN\4_2023-08-17' --> 'data\processed_data\AMZN\4_2023-08-17.md'
Converted 'data\edgar_documents\AMZN\4_2023-08-23' --> 'data\processed_data\AMZN\4_2023-08-23.md'


2025-11-14 15:37:17,624 - INFO - Processing document 4_2023-09-06
2025-11-14 15:37:17,645 - INFO - Finished converting document 4_2023-09-06 in 0.05 sec.
2025-11-14 15:37:17,678 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:17,688 - INFO - Going to convert document batch...
2025-11-14 15:37:17,689 - INFO - Processing document 4_2023-09-07
2025-11-14 15:37:17,710 - INFO - Finished converting document 4_2023-09-07 in 0.05 sec.
2025-11-14 15:37:17,743 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:17,752 - INFO - Going to convert document batch...
2025-11-14 15:37:17,753 - INFO - Processing document 4_2023-09-13
2025-11-14 15:37:17,773 - INFO - Finished converting document 4_2023-09-13 in 0.03 sec.
2025-11-14 15:37:17,819 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:17,829 - INFO - Going to convert document batch...
2025-11-14 15:37:17,829 - INFO - Processing document 4_2023-09-18


Converted 'data\edgar_documents\AMZN\4_2023-09-06' --> 'data\processed_data\AMZN\4_2023-09-06.md'
Converted 'data\edgar_documents\AMZN\4_2023-09-07' --> 'data\processed_data\AMZN\4_2023-09-07.md'
Converted 'data\edgar_documents\AMZN\4_2023-09-13' --> 'data\processed_data\AMZN\4_2023-09-13.md'


2025-11-14 15:37:17,847 - INFO - Finished converting document 4_2023-09-18 in 0.05 sec.
2025-11-14 15:37:17,879 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:17,888 - INFO - Going to convert document batch...
2025-11-14 15:37:17,889 - INFO - Processing document 4_2023-09-22
2025-11-14 15:37:17,911 - INFO - Finished converting document 4_2023-09-22 in 0.05 sec.
2025-11-14 15:37:17,944 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:17,952 - INFO - Going to convert document batch...
2025-11-14 15:37:17,952 - INFO - Processing document 4_2023-10-04
2025-11-14 15:37:17,971 - INFO - Finished converting document 4_2023-10-04 in 0.03 sec.
2025-11-14 15:37:18,002 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:18,013 - INFO - Going to convert document batch...
2025-11-14 15:37:18,014 - INFO - Processing document 4_2023-10-10
2025-11-14 15:37:18,035 - INFO - Finished converting document 4_2023-10-10 in 0.05 sec.


Converted 'data\edgar_documents\AMZN\4_2023-09-18' --> 'data\processed_data\AMZN\4_2023-09-18.md'
Converted 'data\edgar_documents\AMZN\4_2023-09-22' --> 'data\processed_data\AMZN\4_2023-09-22.md'
Converted 'data\edgar_documents\AMZN\4_2023-10-04' --> 'data\processed_data\AMZN\4_2023-10-04.md'


2025-11-14 15:37:18,072 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:18,081 - INFO - Going to convert document batch...
2025-11-14 15:37:18,082 - INFO - Processing document 4_2023-10-23
2025-11-14 15:37:18,102 - INFO - Finished converting document 4_2023-10-23 in 0.03 sec.
2025-11-14 15:37:18,152 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:18,164 - INFO - Going to convert document batch...
2025-11-14 15:37:18,164 - INFO - Processing document 4_2023-11-01
2025-11-14 15:37:18,185 - INFO - Finished converting document 4_2023-11-01 in 0.06 sec.
2025-11-14 15:37:18,217 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:18,225 - INFO - Going to convert document batch...
2025-11-14 15:37:18,225 - INFO - Processing document 4_2023-11-03
2025-11-14 15:37:18,242 - INFO - Finished converting document 4_2023-11-03 in 0.03 sec.
2025-11-14 15:37:18,273 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\4_2023-10-10' --> 'data\processed_data\AMZN\4_2023-10-10.md'
Converted 'data\edgar_documents\AMZN\4_2023-10-23' --> 'data\processed_data\AMZN\4_2023-10-23.md'
Converted 'data\edgar_documents\AMZN\4_2023-11-01' --> 'data\processed_data\AMZN\4_2023-11-01.md'
Converted 'data\edgar_documents\AMZN\4_2023-11-03' --> 'data\processed_data\AMZN\4_2023-11-03.md'


2025-11-14 15:37:18,282 - INFO - Going to convert document batch...
2025-11-14 15:37:18,282 - INFO - Processing document 4_2023-11-06
2025-11-14 15:37:18,303 - INFO - Finished converting document 4_2023-11-06 in 0.03 sec.
2025-11-14 15:37:18,336 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:18,343 - INFO - Going to convert document batch...
2025-11-14 15:37:18,344 - INFO - Processing document 4_2023-11-15
2025-11-14 15:37:18,363 - INFO - Finished converting document 4_2023-11-15 in 0.03 sec.
2025-11-14 15:37:18,394 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:18,414 - INFO - Going to convert document batch...
2025-11-14 15:37:18,415 - INFO - Processing document 4_2023-11-17
2025-11-14 15:37:18,444 - INFO - Finished converting document 4_2023-11-17 in 0.06 sec.
2025-11-14 15:37:18,487 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:18,501 - INFO - Going to convert document batch...
2025-11-14 15:37:18,502 - 

Converted 'data\edgar_documents\AMZN\4_2023-11-06' --> 'data\processed_data\AMZN\4_2023-11-06.md'
Converted 'data\edgar_documents\AMZN\4_2023-11-15' --> 'data\processed_data\AMZN\4_2023-11-15.md'
Converted 'data\edgar_documents\AMZN\4_2023-11-17' --> 'data\processed_data\AMZN\4_2023-11-17.md'


2025-11-14 15:37:18,536 - INFO - Finished converting document 4_2023-11-24 in 0.06 sec.
2025-11-14 15:37:18,577 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:18,586 - INFO - Going to convert document batch...
2025-11-14 15:37:18,587 - INFO - Processing document 4_2023-11-27
2025-11-14 15:37:18,607 - INFO - Finished converting document 4_2023-11-27 in 0.05 sec.
2025-11-14 15:37:18,636 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:18,644 - INFO - Going to convert document batch...
2025-11-14 15:37:18,645 - INFO - Processing document 4_2023-12-05
2025-11-14 15:37:18,664 - INFO - Finished converting document 4_2023-12-05 in 0.03 sec.
2025-11-14 15:37:18,709 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:18,721 - INFO - Going to convert document batch...
2025-11-14 15:37:18,721 - INFO - Processing document 4_2023-12-08
2025-11-14 15:37:18,740 - INFO - Finished converting document 4_2023-12-08 in 0.05 sec.


Converted 'data\edgar_documents\AMZN\4_2023-11-24' --> 'data\processed_data\AMZN\4_2023-11-24.md'
Converted 'data\edgar_documents\AMZN\4_2023-11-27' --> 'data\processed_data\AMZN\4_2023-11-27.md'
Converted 'data\edgar_documents\AMZN\4_2023-12-05' --> 'data\processed_data\AMZN\4_2023-12-05.md'


2025-11-14 15:37:18,777 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:18,786 - INFO - Going to convert document batch...
2025-11-14 15:37:18,787 - INFO - Processing document 4_2023-12-26
2025-11-14 15:37:18,815 - INFO - Finished converting document 4_2023-12-26 in 0.05 sec.
2025-11-14 15:37:18,870 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:18,891 - INFO - Going to convert document batch...
2025-11-14 15:37:18,893 - INFO - Processing document 4_2024-01-08
2025-11-14 15:37:18,926 - INFO - Finished converting document 4_2024-01-08 in 0.08 sec.


Converted 'data\edgar_documents\AMZN\4_2023-12-08' --> 'data\processed_data\AMZN\4_2023-12-08.md'
Converted 'data\edgar_documents\AMZN\4_2023-12-26' --> 'data\processed_data\AMZN\4_2023-12-26.md'


2025-11-14 15:37:18,963 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:18,974 - INFO - Going to convert document batch...
2025-11-14 15:37:18,975 - INFO - Processing document 4_2024-01-22
2025-11-14 15:37:19,003 - INFO - Finished converting document 4_2024-01-22 in 0.05 sec.
2025-11-14 15:37:19,039 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:19,050 - INFO - Going to convert document batch...
2025-11-14 15:37:19,051 - INFO - Processing document 4_2024-02-05
2025-11-14 15:37:19,072 - INFO - Finished converting document 4_2024-02-05 in 0.03 sec.
2025-11-14 15:37:19,104 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:19,113 - INFO - Going to convert document batch...
2025-11-14 15:37:19,114 - INFO - Processing document 4_2024-02-09
2025-11-14 15:37:19,135 - INFO - Finished converting document 4_2024-02-09 in 0.05 sec.


Converted 'data\edgar_documents\AMZN\4_2024-01-08' --> 'data\processed_data\AMZN\4_2024-01-08.md'
Converted 'data\edgar_documents\AMZN\4_2024-01-22' --> 'data\processed_data\AMZN\4_2024-01-22.md'
Converted 'data\edgar_documents\AMZN\4_2024-02-05' --> 'data\processed_data\AMZN\4_2024-02-05.md'


2025-11-14 15:37:19,170 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:19,178 - INFO - Going to convert document batch...
2025-11-14 15:37:19,179 - INFO - Processing document 4_2024-02-13
2025-11-14 15:37:19,197 - INFO - Finished converting document 4_2024-02-13 in 0.03 sec.
2025-11-14 15:37:19,227 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:19,235 - INFO - Going to convert document batch...
2025-11-14 15:37:19,236 - INFO - Processing document 4_2024-02-14
2025-11-14 15:37:19,253 - INFO - Finished converting document 4_2024-02-14 in 0.03 sec.
2025-11-14 15:37:19,284 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:19,298 - INFO - Going to convert document batch...
2025-11-14 15:37:19,299 - INFO - Processing document 4_2024-02-15
2025-11-14 15:37:19,328 - INFO - Finished converting document 4_2024-02-15 in 0.06 sec.


Converted 'data\edgar_documents\AMZN\4_2024-02-09' --> 'data\processed_data\AMZN\4_2024-02-09.md'
Converted 'data\edgar_documents\AMZN\4_2024-02-13' --> 'data\processed_data\AMZN\4_2024-02-13.md'
Converted 'data\edgar_documents\AMZN\4_2024-02-14' --> 'data\processed_data\AMZN\4_2024-02-14.md'
Converted 'data\edgar_documents\AMZN\4_2024-02-15' --> 'data\processed_data\AMZN\4_2024-02-15.md'


2025-11-14 15:37:19,386 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:19,394 - INFO - Going to convert document batch...
2025-11-14 15:37:19,395 - INFO - Processing document 4_2024-02-20
2025-11-14 15:37:19,416 - INFO - Finished converting document 4_2024-02-20 in 0.05 sec.
2025-11-14 15:37:19,446 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:19,460 - INFO - Going to convert document batch...
2025-11-14 15:37:19,461 - INFO - Processing document 4_2024-02-23
2025-11-14 15:37:19,492 - INFO - Finished converting document 4_2024-02-23 in 0.05 sec.
2025-11-14 15:37:19,532 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:19,540 - INFO - Going to convert document batch...
2025-11-14 15:37:19,541 - INFO - Processing document 4_2024-03-04
2025-11-14 15:37:19,560 - INFO - Finished converting document 4_2024-03-04 in 0.05 sec.
2025-11-14 15:37:19,592 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\AMZN\4_2024-02-20' --> 'data\processed_data\AMZN\4_2024-02-20.md'
Converted 'data\edgar_documents\AMZN\4_2024-02-23' --> 'data\processed_data\AMZN\4_2024-02-23.md'
Converted 'data\edgar_documents\AMZN\4_2024-03-04' --> 'data\processed_data\AMZN\4_2024-03-04.md'


2025-11-14 15:37:19,621 - INFO - Finished converting document 4_2024-03-05 in 0.05 sec.
2025-11-14 15:37:19,652 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:19,660 - INFO - Going to convert document batch...
2025-11-14 15:37:19,661 - INFO - Processing document 4_2024-03-06
2025-11-14 15:37:19,679 - INFO - Finished converting document 4_2024-03-06 in 0.03 sec.
2025-11-14 15:37:19,709 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:19,717 - INFO - Going to convert document batch...
2025-11-14 15:37:19,718 - INFO - Processing document 4_2024-03-11
2025-11-14 15:37:19,738 - INFO - Finished converting document 4_2024-03-11 in 0.03 sec.
2025-11-14 15:37:19,771 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:19,782 - INFO - Going to convert document batch...
2025-11-14 15:37:19,783 - INFO - Processing document 4_2024-03-25
2025-11-14 15:37:19,803 - INFO - Finished converting document 4_2024-03-25 in 0.05 sec.
2025-1

Converted 'data\edgar_documents\AMZN\4_2024-03-05' --> 'data\processed_data\AMZN\4_2024-03-05.md'
Converted 'data\edgar_documents\AMZN\4_2024-03-06' --> 'data\processed_data\AMZN\4_2024-03-06.md'
Converted 'data\edgar_documents\AMZN\4_2024-03-11' --> 'data\processed_data\AMZN\4_2024-03-11.md'
Converted 'data\edgar_documents\AMZN\4_2024-03-25' --> 'data\processed_data\AMZN\4_2024-03-25.md'


2025-11-14 15:37:19,845 - INFO - Going to convert document batch...
2025-11-14 15:37:19,846 - INFO - Processing document 4_2024-04-03
2025-11-14 15:37:19,887 - INFO - Finished converting document 4_2024-04-03 in 0.06 sec.
2025-11-14 15:37:19,930 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:19,939 - INFO - Going to convert document batch...
2025-11-14 15:37:19,940 - INFO - Processing document 4_2024-04-08
2025-11-14 15:37:19,962 - INFO - Finished converting document 4_2024-04-08 in 0.03 sec.
2025-11-14 15:37:20,006 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:20,020 - INFO - Going to convert document batch...
2025-11-14 15:37:20,021 - INFO - Processing document 4_2024-04-12
2025-11-14 15:37:20,040 - INFO - Finished converting document 4_2024-04-12 in 0.05 sec.
2025-11-14 15:37:20,073 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:20,082 - INFO - Going to convert document batch...
2025-11-14 15:37:20,083 - 

Converted 'data\edgar_documents\AMZN\4_2024-04-03' --> 'data\processed_data\AMZN\4_2024-04-03.md'
Converted 'data\edgar_documents\AMZN\4_2024-04-08' --> 'data\processed_data\AMZN\4_2024-04-08.md'
Converted 'data\edgar_documents\AMZN\4_2024-04-12' --> 'data\processed_data\AMZN\4_2024-04-12.md'


2025-11-14 15:37:20,138 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:20,150 - INFO - Going to convert document batch...
2025-11-14 15:37:20,151 - INFO - Processing document 4_2024-05-03
2025-11-14 15:37:20,188 - INFO - Finished converting document 4_2024-05-03 in 0.06 sec.
2025-11-14 15:37:20,242 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:20,252 - INFO - Going to convert document batch...
2025-11-14 15:37:20,253 - INFO - Processing document 4_2024-05-08
2025-11-14 15:37:20,269 - INFO - Finished converting document 4_2024-05-08 in 0.05 sec.
2025-11-14 15:37:20,302 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:20,309 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMZN\4_2024-04-22' --> 'data\processed_data\AMZN\4_2024-04-22.md'
Converted 'data\edgar_documents\AMZN\4_2024-05-03' --> 'data\processed_data\AMZN\4_2024-05-03.md'
Converted 'data\edgar_documents\AMZN\4_2024-05-08' --> 'data\processed_data\AMZN\4_2024-05-08.md'


2025-11-14 15:37:20,310 - INFO - Processing document 4_2024-05-13
2025-11-14 15:37:20,327 - INFO - Finished converting document 4_2024-05-13 in 0.03 sec.
2025-11-14 15:37:20,358 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\4_2024-05-13' --> 'data\processed_data\AMZN\4_2024-05-13.md'


2025-11-14 15:37:20,611 - INFO - Going to convert document batch...
2025-11-14 15:37:20,612 - INFO - Processing document 4_2024-05-17
2025-11-14 15:37:20,645 - INFO - Finished converting document 4_2024-05-17 in 0.30 sec.
2025-11-14 15:37:20,687 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:20,698 - INFO - Going to convert document batch...
2025-11-14 15:37:20,699 - INFO - Processing document 4_2024-05-23
2025-11-14 15:37:20,727 - INFO - Finished converting document 4_2024-05-23 in 0.05 sec.
2025-11-14 15:37:20,767 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:20,778 - INFO - Going to convert document batch...
2025-11-14 15:37:20,779 - INFO - Processing document 4_2024-05-31
2025-11-14 15:37:20,797 - INFO - Finished converting document 4_2024-05-31 in 0.05 sec.
2025-11-14 15:37:20,828 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:20,837 - INFO - Going to convert document batch...
2025-11-14 15:37:20,838 - 

Converted 'data\edgar_documents\AMZN\4_2024-05-17' --> 'data\processed_data\AMZN\4_2024-05-17.md'
Converted 'data\edgar_documents\AMZN\4_2024-05-23' --> 'data\processed_data\AMZN\4_2024-05-23.md'
Converted 'data\edgar_documents\AMZN\4_2024-05-31' --> 'data\processed_data\AMZN\4_2024-05-31.md'


2025-11-14 15:37:20,888 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:20,897 - INFO - Going to convert document batch...
2025-11-14 15:37:20,899 - INFO - Processing document 4_2024-07-01
2025-11-14 15:37:20,922 - INFO - Finished converting document 4_2024-07-01 in 0.05 sec.
2025-11-14 15:37:20,969 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:20,987 - INFO - Going to convert document batch...
2025-11-14 15:37:20,988 - INFO - Processing document 4_2024-07-03
2025-11-14 15:37:21,012 - INFO - Finished converting document 4_2024-07-03 in 0.06 sec.
2025-11-14 15:37:21,049 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:21,057 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMZN\4_2024-06-05' --> 'data\processed_data\AMZN\4_2024-06-05.md'
Converted 'data\edgar_documents\AMZN\4_2024-07-01' --> 'data\processed_data\AMZN\4_2024-07-01.md'
Converted 'data\edgar_documents\AMZN\4_2024-07-03' --> 'data\processed_data\AMZN\4_2024-07-03.md'


2025-11-14 15:37:21,058 - INFO - Processing document 4_2024-07-05
2025-11-14 15:37:21,078 - INFO - Finished converting document 4_2024-07-05 in 0.05 sec.
2025-11-14 15:37:21,112 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:21,121 - INFO - Going to convert document batch...
2025-11-14 15:37:21,122 - INFO - Processing document 4_2024-07-09
2025-11-14 15:37:21,143 - INFO - Finished converting document 4_2024-07-09 in 0.05 sec.
2025-11-14 15:37:21,197 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:21,212 - INFO - Going to convert document batch...
2025-11-14 15:37:21,213 - INFO - Processing document 4_2024-07-11
2025-11-14 15:37:21,241 - INFO - Finished converting document 4_2024-07-11 in 0.08 sec.
2025-11-14 15:37:21,272 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:21,281 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMZN\4_2024-07-05' --> 'data\processed_data\AMZN\4_2024-07-05.md'
Converted 'data\edgar_documents\AMZN\4_2024-07-09' --> 'data\processed_data\AMZN\4_2024-07-09.md'
Converted 'data\edgar_documents\AMZN\4_2024-07-11' --> 'data\processed_data\AMZN\4_2024-07-11.md'


2025-11-14 15:37:21,282 - INFO - Processing document 4_2024-07-15
2025-11-14 15:37:21,306 - INFO - Finished converting document 4_2024-07-15 in 0.03 sec.
2025-11-14 15:37:21,341 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:21,349 - INFO - Going to convert document batch...
2025-11-14 15:37:21,350 - INFO - Processing document 4_2024-08-05
2025-11-14 15:37:21,368 - INFO - Finished converting document 4_2024-08-05 in 0.03 sec.
2025-11-14 15:37:21,416 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:21,429 - INFO - Going to convert document batch...
2025-11-14 15:37:21,429 - INFO - Processing document 4_2024-08-19
2025-11-14 15:37:21,453 - INFO - Finished converting document 4_2024-08-19 in 0.06 sec.
2025-11-14 15:37:21,490 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:21,502 - INFO - Going to convert document batch...
2025-11-14 15:37:21,503 - INFO - Processing document 4_2024-08-23
2025-11-14 15:37:21,534 - IN

Converted 'data\edgar_documents\AMZN\4_2024-07-15' --> 'data\processed_data\AMZN\4_2024-07-15.md'
Converted 'data\edgar_documents\AMZN\4_2024-08-05' --> 'data\processed_data\AMZN\4_2024-08-05.md'
Converted 'data\edgar_documents\AMZN\4_2024-08-19' --> 'data\processed_data\AMZN\4_2024-08-19.md'


2025-11-14 15:37:21,596 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:21,606 - INFO - Going to convert document batch...
2025-11-14 15:37:21,607 - INFO - Processing document 4_2024-08-30
2025-11-14 15:37:21,626 - INFO - Finished converting document 4_2024-08-30 in 0.06 sec.
2025-11-14 15:37:21,657 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:21,666 - INFO - Going to convert document batch...
2025-11-14 15:37:21,667 - INFO - Processing document 4_2024-09-05
2025-11-14 15:37:21,685 - INFO - Finished converting document 4_2024-09-05 in 0.05 sec.
2025-11-14 15:37:21,720 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:21,729 - INFO - Going to convert document batch...
2025-11-14 15:37:21,730 - INFO - Processing document 4_2024-09-11
2025-11-14 15:37:21,748 - INFO - Finished converting document 4_2024-09-11 in 0.05 sec.


Converted 'data\edgar_documents\AMZN\4_2024-08-23' --> 'data\processed_data\AMZN\4_2024-08-23.md'
Converted 'data\edgar_documents\AMZN\4_2024-08-30' --> 'data\processed_data\AMZN\4_2024-08-30.md'
Converted 'data\edgar_documents\AMZN\4_2024-09-05' --> 'data\processed_data\AMZN\4_2024-09-05.md'


2025-11-14 15:37:21,781 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:21,789 - INFO - Going to convert document batch...
2025-11-14 15:37:21,790 - INFO - Processing document 4_2024-09-26
2025-11-14 15:37:21,808 - INFO - Finished converting document 4_2024-09-26 in 0.05 sec.
2025-11-14 15:37:21,837 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:21,847 - INFO - Going to convert document batch...
2025-11-14 15:37:21,848 - INFO - Processing document 4_2024-10-03
2025-11-14 15:37:21,864 - INFO - Finished converting document 4_2024-10-03 in 0.03 sec.
2025-11-14 15:37:21,894 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:21,902 - INFO - Going to convert document batch...
2025-11-14 15:37:21,903 - INFO - Processing document 4_2024-11-05
2025-11-14 15:37:21,919 - INFO - Finished converting document 4_2024-11-05 in 0.05 sec.
2025-11-14 15:37:21,953 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\4_2024-09-11' --> 'data\processed_data\AMZN\4_2024-09-11.md'
Converted 'data\edgar_documents\AMZN\4_2024-09-26' --> 'data\processed_data\AMZN\4_2024-09-26.md'
Converted 'data\edgar_documents\AMZN\4_2024-10-03' --> 'data\processed_data\AMZN\4_2024-10-03.md'
Converted 'data\edgar_documents\AMZN\4_2024-11-05' --> 'data\processed_data\AMZN\4_2024-11-05.md'


2025-11-14 15:37:21,962 - INFO - Going to convert document batch...
2025-11-14 15:37:21,963 - INFO - Processing document 4_2024-11-06
2025-11-14 15:37:21,979 - INFO - Finished converting document 4_2024-11-06 in 0.05 sec.
2025-11-14 15:37:22,009 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:22,022 - INFO - Going to convert document batch...
2025-11-14 15:37:22,023 - INFO - Processing document 4_2024-11-08
2025-11-14 15:37:22,054 - INFO - Finished converting document 4_2024-11-08 in 0.05 sec.
2025-11-14 15:37:22,094 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:22,101 - INFO - Going to convert document batch...
2025-11-14 15:37:22,102 - INFO - Processing document 4_2024-11-12
2025-11-14 15:37:22,120 - INFO - Finished converting document 4_2024-11-12 in 0.05 sec.
2025-11-14 15:37:22,152 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:22,165 - INFO - Going to convert document batch...
2025-11-14 15:37:22,166 - 

Converted 'data\edgar_documents\AMZN\4_2024-11-06' --> 'data\processed_data\AMZN\4_2024-11-06.md'
Converted 'data\edgar_documents\AMZN\4_2024-11-08' --> 'data\processed_data\AMZN\4_2024-11-08.md'
Converted 'data\edgar_documents\AMZN\4_2024-11-12' --> 'data\processed_data\AMZN\4_2024-11-12.md'


2025-11-14 15:37:22,233 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:22,245 - INFO - Going to convert document batch...
2025-11-14 15:37:22,246 - INFO - Processing document 4_2024-11-19
2025-11-14 15:37:22,270 - INFO - Finished converting document 4_2024-11-19 in 0.05 sec.
2025-11-14 15:37:22,303 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:22,312 - INFO - Going to convert document batch...
2025-11-14 15:37:22,313 - INFO - Processing document 4_2024-11-20
2025-11-14 15:37:22,334 - INFO - Finished converting document 4_2024-11-20 in 0.03 sec.
2025-11-14 15:37:22,381 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:22,391 - INFO - Going to convert document batch...
2025-11-14 15:37:22,392 - INFO - Processing document 4_2024-11-21
2025-11-14 15:37:22,413 - INFO - Finished converting document 4_2024-11-21 in 0.05 sec.


Converted 'data\edgar_documents\AMZN\4_2024-11-14' --> 'data\processed_data\AMZN\4_2024-11-14.md'
Converted 'data\edgar_documents\AMZN\4_2024-11-19' --> 'data\processed_data\AMZN\4_2024-11-19.md'
Converted 'data\edgar_documents\AMZN\4_2024-11-20' --> 'data\processed_data\AMZN\4_2024-11-20.md'


2025-11-14 15:37:22,443 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:22,467 - INFO - Going to convert document batch...
2025-11-14 15:37:22,468 - INFO - Processing document 4_2024-11-25
2025-11-14 15:37:22,527 - INFO - Finished converting document 4_2024-11-25 in 0.09 sec.
2025-11-14 15:37:22,585 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:22,600 - INFO - Going to convert document batch...
2025-11-14 15:37:22,600 - INFO - Processing document 4_2024-12-04
2025-11-14 15:37:22,618 - INFO - Finished converting document 4_2024-12-04 in 0.05 sec.


Converted 'data\edgar_documents\AMZN\4_2024-11-21' --> 'data\processed_data\AMZN\4_2024-11-21.md'
Converted 'data\edgar_documents\AMZN\4_2024-11-25' --> 'data\processed_data\AMZN\4_2024-11-25.md'


2025-11-14 15:37:22,651 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:22,659 - INFO - Going to convert document batch...
2025-11-14 15:37:22,660 - INFO - Processing document 4_2024-12-06
2025-11-14 15:37:22,679 - INFO - Finished converting document 4_2024-12-06 in 0.03 sec.
2025-11-14 15:37:22,709 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:22,718 - INFO - Going to convert document batch...
2025-11-14 15:37:22,719 - INFO - Processing document 4_2024-12-11
2025-11-14 15:37:22,737 - INFO - Finished converting document 4_2024-12-11 in 0.03 sec.
2025-11-14 15:37:22,768 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:22,780 - INFO - Going to convert document batch...
2025-11-14 15:37:22,782 - INFO - Processing document 4_2025-02-14
2025-11-14 15:37:22,805 - INFO - Finished converting document 4_2025-02-14 in 0.05 sec.


Converted 'data\edgar_documents\AMZN\4_2024-12-04' --> 'data\processed_data\AMZN\4_2024-12-04.md'
Converted 'data\edgar_documents\AMZN\4_2024-12-06' --> 'data\processed_data\AMZN\4_2024-12-06.md'
Converted 'data\edgar_documents\AMZN\4_2024-12-11' --> 'data\processed_data\AMZN\4_2024-12-11.md'
Converted 'data\edgar_documents\AMZN\4_2025-02-14' --> 'data\processed_data\AMZN\4_2025-02-14.md'


2025-11-14 15:37:22,860 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:22,872 - INFO - Going to convert document batch...
2025-11-14 15:37:22,873 - INFO - Processing document 4_2025-02-19
2025-11-14 15:37:22,903 - INFO - Finished converting document 4_2025-02-19 in 0.08 sec.
2025-11-14 15:37:22,938 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:22,952 - INFO - Going to convert document batch...
2025-11-14 15:37:22,953 - INFO - Processing document 4_2025-02-25
2025-11-14 15:37:22,983 - INFO - Finished converting document 4_2025-02-25 in 0.06 sec.
2025-11-14 15:37:23,021 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:23,030 - INFO - Going to convert document batch...
2025-11-14 15:37:23,031 - INFO - Processing document 4_2025-03-05
2025-11-14 15:37:23,048 - INFO - Finished converting document 4_2025-03-05 in 0.03 sec.
2025-11-14 15:37:23,081 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\AMZN\4_2025-02-19' --> 'data\processed_data\AMZN\4_2025-02-19.md'
Converted 'data\edgar_documents\AMZN\4_2025-02-25' --> 'data\processed_data\AMZN\4_2025-02-25.md'
Converted 'data\edgar_documents\AMZN\4_2025-03-05' --> 'data\processed_data\AMZN\4_2025-03-05.md'


2025-11-14 15:37:23,139 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:23,148 - INFO - Going to convert document batch...
2025-11-14 15:37:23,149 - INFO - Processing document 4_2025-04-03
2025-11-14 15:37:23,173 - INFO - Finished converting document 4_2025-04-03 in 0.05 sec.
2025-11-14 15:37:23,205 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:23,215 - INFO - Going to convert document batch...
2025-11-14 15:37:23,215 - INFO - Processing document 4_2025-04-14
2025-11-14 15:37:23,242 - INFO - Finished converting document 4_2025-04-14 in 0.05 sec.
2025-11-14 15:37:23,292 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:23,305 - INFO - Going to convert document batch...
2025-11-14 15:37:23,306 - INFO - Processing document 4_2025-05-05
2025-11-14 15:37:23,328 - INFO - Finished converting document 4_2025-05-05 in 0.06 sec.


Converted 'data\edgar_documents\AMZN\4_2025-03-12' --> 'data\processed_data\AMZN\4_2025-03-12.md'
Converted 'data\edgar_documents\AMZN\4_2025-04-03' --> 'data\processed_data\AMZN\4_2025-04-03.md'
Converted 'data\edgar_documents\AMZN\4_2025-04-14' --> 'data\processed_data\AMZN\4_2025-04-14.md'


2025-11-14 15:37:23,358 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:23,366 - INFO - Going to convert document batch...
2025-11-14 15:37:23,367 - INFO - Processing document 4_2025-05-14
2025-11-14 15:37:23,384 - INFO - Finished converting document 4_2025-05-14 in 0.03 sec.
2025-11-14 15:37:23,445 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:23,456 - INFO - Going to convert document batch...
2025-11-14 15:37:23,458 - INFO - Processing document 4_2025-05-15
2025-11-14 15:37:23,480 - INFO - Finished converting document 4_2025-05-15 in 0.06 sec.
2025-11-14 15:37:23,514 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:23,525 - INFO - Going to convert document batch...
2025-11-14 15:37:23,526 - INFO - Processing document 4_2025-05-19


Converted 'data\edgar_documents\AMZN\4_2025-05-05' --> 'data\processed_data\AMZN\4_2025-05-05.md'
Converted 'data\edgar_documents\AMZN\4_2025-05-14' --> 'data\processed_data\AMZN\4_2025-05-14.md'
Converted 'data\edgar_documents\AMZN\4_2025-05-15' --> 'data\processed_data\AMZN\4_2025-05-15.md'


2025-11-14 15:37:23,551 - INFO - Finished converting document 4_2025-05-19 in 0.05 sec.
2025-11-14 15:37:23,587 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:23,595 - INFO - Going to convert document batch...
2025-11-14 15:37:23,596 - INFO - Processing document 4_2025-05-22
2025-11-14 15:37:23,615 - INFO - Finished converting document 4_2025-05-22 in 0.03 sec.
2025-11-14 15:37:23,668 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:23,694 - INFO - Going to convert document batch...
2025-11-14 15:37:23,695 - INFO - Processing document 4_2025-05-23
2025-11-14 15:37:23,722 - INFO - Finished converting document 4_2025-05-23 in 0.08 sec.
2025-11-14 15:37:23,761 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\4_2025-05-19' --> 'data\processed_data\AMZN\4_2025-05-19.md'
Converted 'data\edgar_documents\AMZN\4_2025-05-22' --> 'data\processed_data\AMZN\4_2025-05-22.md'
Converted 'data\edgar_documents\AMZN\4_2025-05-23' --> 'data\processed_data\AMZN\4_2025-05-23.md'


2025-11-14 15:37:23,769 - INFO - Going to convert document batch...
2025-11-14 15:37:23,770 - INFO - Processing document 4_2025-06-04
2025-11-14 15:37:23,791 - INFO - Finished converting document 4_2025-06-04 in 0.05 sec.
2025-11-14 15:37:23,821 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:23,829 - INFO - Going to convert document batch...
2025-11-14 15:37:23,830 - INFO - Processing document 4_2025-06-05
2025-11-14 15:37:23,846 - INFO - Finished converting document 4_2025-06-05 in 0.03 sec.
2025-11-14 15:37:23,894 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:23,909 - INFO - Going to convert document batch...
2025-11-14 15:37:23,910 - INFO - Processing document 4_2025-07-01
2025-11-14 15:37:23,931 - INFO - Finished converting document 4_2025-07-01 in 0.06 sec.
2025-11-14 15:37:23,970 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:23,979 - INFO - Going to convert document batch...
2025-11-14 15:37:23,980 - 

Converted 'data\edgar_documents\AMZN\4_2025-06-04' --> 'data\processed_data\AMZN\4_2025-06-04.md'
Converted 'data\edgar_documents\AMZN\4_2025-06-05' --> 'data\processed_data\AMZN\4_2025-06-05.md'
Converted 'data\edgar_documents\AMZN\4_2025-07-01' --> 'data\processed_data\AMZN\4_2025-07-01.md'


2025-11-14 15:37:24,036 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:24,045 - INFO - Going to convert document batch...
2025-11-14 15:37:24,046 - INFO - Processing document 4_2025-07-08
2025-11-14 15:37:24,064 - INFO - Finished converting document 4_2025-07-08 in 0.05 sec.
2025-11-14 15:37:24,101 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:24,110 - INFO - Going to convert document batch...
2025-11-14 15:37:24,111 - INFO - Processing document 4_2025-07-10
2025-11-14 15:37:24,129 - INFO - Finished converting document 4_2025-07-10 in 0.03 sec.
2025-11-14 15:37:24,187 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:24,202 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMZN\4_2025-07-03' --> 'data\processed_data\AMZN\4_2025-07-03.md'
Converted 'data\edgar_documents\AMZN\4_2025-07-08' --> 'data\processed_data\AMZN\4_2025-07-08.md'
Converted 'data\edgar_documents\AMZN\4_2025-07-10' --> 'data\processed_data\AMZN\4_2025-07-10.md'


2025-11-14 15:37:24,202 - INFO - Processing document 4_2025-07-15
2025-11-14 15:37:24,226 - INFO - Finished converting document 4_2025-07-15 in 0.08 sec.
2025-11-14 15:37:24,260 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:24,267 - INFO - Going to convert document batch...
2025-11-14 15:37:24,268 - INFO - Processing document 4_2025-07-17
2025-11-14 15:37:24,286 - INFO - Finished converting document 4_2025-07-17 in 0.03 sec.
2025-11-14 15:37:24,317 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AMZN\4_2025-07-15' --> 'data\processed_data\AMZN\4_2025-07-15.md'
Converted 'data\edgar_documents\AMZN\4_2025-07-17' --> 'data\processed_data\AMZN\4_2025-07-17.md'


2025-11-14 15:37:24,541 - INFO - Going to convert document batch...
2025-11-14 15:37:24,543 - INFO - Processing document 4_2025-07-23
2025-11-14 15:37:24,568 - INFO - Finished converting document 4_2025-07-23 in 0.27 sec.
2025-11-14 15:37:24,600 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:24,616 - INFO - Going to convert document batch...
2025-11-14 15:37:24,617 - INFO - Processing document 4_2025-07-25
2025-11-14 15:37:24,645 - INFO - Finished converting document 4_2025-07-25 in 0.05 sec.
2025-11-14 15:37:24,681 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:24,688 - INFO - Going to convert document batch...
2025-11-14 15:37:24,689 - INFO - Processing document 4_2025-08-05
2025-11-14 15:37:24,708 - INFO - Finished converting document 4_2025-08-05 in 0.03 sec.
2025-11-14 15:37:24,736 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:24,744 - INFO - Going to convert document batch...
2025-11-14 15:37:24,745 - 

Converted 'data\edgar_documents\AMZN\4_2025-07-23' --> 'data\processed_data\AMZN\4_2025-07-23.md'
Converted 'data\edgar_documents\AMZN\4_2025-07-25' --> 'data\processed_data\AMZN\4_2025-07-25.md'
Converted 'data\edgar_documents\AMZN\4_2025-08-05' --> 'data\processed_data\AMZN\4_2025-08-05.md'


2025-11-14 15:37:24,799 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:24,807 - INFO - Going to convert document batch...
2025-11-14 15:37:24,808 - INFO - Processing document 4_2025-08-18
2025-11-14 15:37:24,827 - INFO - Finished converting document 4_2025-08-18 in 0.05 sec.
2025-11-14 15:37:24,859 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:24,869 - INFO - Going to convert document batch...
2025-11-14 15:37:24,870 - INFO - Processing document 4_2025-08-19
2025-11-14 15:37:24,895 - INFO - Finished converting document 4_2025-08-19 in 0.05 sec.
2025-11-14 15:37:24,943 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:24,983 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMZN\4_2025-08-12' --> 'data\processed_data\AMZN\4_2025-08-12.md'
Converted 'data\edgar_documents\AMZN\4_2025-08-18' --> 'data\processed_data\AMZN\4_2025-08-18.md'
Converted 'data\edgar_documents\AMZN\4_2025-08-19' --> 'data\processed_data\AMZN\4_2025-08-19.md'


2025-11-14 15:37:24,985 - INFO - Processing document 4_2025-08-25
2025-11-14 15:37:25,022 - INFO - Finished converting document 4_2025-08-25 in 0.09 sec.
2025-11-14 15:37:25,060 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:25,067 - INFO - Going to convert document batch...
2025-11-14 15:37:25,069 - INFO - Processing document 4_2025-09-02
2025-11-14 15:37:25,088 - INFO - Finished converting document 4_2025-09-02 in 0.03 sec.
2025-11-14 15:37:25,136 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:25,148 - INFO - Going to convert document batch...
2025-11-14 15:37:25,149 - INFO - Processing document 4_2025-09-04
2025-11-14 15:37:25,169 - INFO - Finished converting document 4_2025-09-04 in 0.06 sec.
2025-11-14 15:37:25,201 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:25,209 - INFO - Going to convert document batch...
2025-11-14 15:37:25,210 - INFO - Processing document 4_2025-09-10
2025-11-14 15:37:25,228 - IN

Converted 'data\edgar_documents\AMZN\4_2025-08-25' --> 'data\processed_data\AMZN\4_2025-08-25.md'
Converted 'data\edgar_documents\AMZN\4_2025-09-02' --> 'data\processed_data\AMZN\4_2025-09-02.md'
Converted 'data\edgar_documents\AMZN\4_2025-09-04' --> 'data\processed_data\AMZN\4_2025-09-04.md'


2025-11-14 15:37:25,258 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:25,266 - INFO - Going to convert document batch...
2025-11-14 15:37:25,267 - INFO - Processing document 4_2025-10-03
2025-11-14 15:37:25,285 - INFO - Finished converting document 4_2025-10-03 in 0.03 sec.
2025-11-14 15:37:25,325 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:25,333 - INFO - Going to convert document batch...
2025-11-14 15:37:25,334 - INFO - Processing document 4_2025-11-04
2025-11-14 15:37:25,354 - INFO - Finished converting document 4_2025-11-04 in 0.03 sec.
2025-11-14 15:37:25,399 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:25,410 - INFO - Going to convert document batch...
2025-11-14 15:37:25,411 - INFO - Processing document 4_2025-11-10
2025-11-14 15:37:25,432 - INFO - Finished converting document 4_2025-11-10 in 0.06 sec.


Converted 'data\edgar_documents\AMZN\4_2025-09-10' --> 'data\processed_data\AMZN\4_2025-09-10.md'
Converted 'data\edgar_documents\AMZN\4_2025-10-03' --> 'data\processed_data\AMZN\4_2025-10-03.md'
Converted 'data\edgar_documents\AMZN\4_2025-11-04' --> 'data\processed_data\AMZN\4_2025-11-04.md'


2025-11-14 15:37:25,466 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:25,477 - INFO - Going to convert document batch...
2025-11-14 15:37:25,477 - INFO - Processing document 8-K_2023-01-03
2025-11-14 15:37:25,500 - INFO - Finished converting document 8-K_2023-01-03 in 0.05 sec.
2025-11-14 15:37:25,525 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:25,536 - INFO - Going to convert document batch...
2025-11-14 15:37:25,536 - INFO - Processing document 8-K_2023-01-06
2025-11-14 15:37:25,561 - INFO - Finished converting document 8-K_2023-01-06 in 0.05 sec.
2025-11-14 15:37:25,586 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:25,599 - INFO - Going to convert document batch...
2025-11-14 15:37:25,599 - INFO - Processing document 8-K_2023-02-02
2025-11-14 15:37:25,622 - INFO - Finished converting document 8-K_2023-02-02 in 0.05 sec.


Converted 'data\edgar_documents\AMZN\4_2025-11-10' --> 'data\processed_data\AMZN\4_2025-11-10.md'
Converted 'data\edgar_documents\AMZN\8-K_2023-01-03' --> 'data\processed_data\AMZN\8-K_2023-01-03.md'
Converted 'data\edgar_documents\AMZN\8-K_2023-01-06' --> 'data\processed_data\AMZN\8-K_2023-01-06.md'


2025-11-14 15:37:25,650 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:25,665 - INFO - Going to convert document batch...
2025-11-14 15:37:25,666 - INFO - Processing document 8-K_2023-04-13
2025-11-14 15:37:25,689 - INFO - Finished converting document 8-K_2023-04-13 in 0.05 sec.
2025-11-14 15:37:25,715 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:25,729 - INFO - Going to convert document batch...
2025-11-14 15:37:25,729 - INFO - Processing document 8-K_2023-04-27
2025-11-14 15:37:25,751 - INFO - Finished converting document 8-K_2023-04-27 in 0.05 sec.
2025-11-14 15:37:25,781 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:25,819 - INFO - Going to convert document batch...
2025-11-14 15:37:25,820 - INFO - Processing document 8-K_2023-05-26


Converted 'data\edgar_documents\AMZN\8-K_2023-02-02' --> 'data\processed_data\AMZN\8-K_2023-02-02.md'
Converted 'data\edgar_documents\AMZN\8-K_2023-04-13' --> 'data\processed_data\AMZN\8-K_2023-04-13.md'
Converted 'data\edgar_documents\AMZN\8-K_2023-04-27' --> 'data\processed_data\AMZN\8-K_2023-04-27.md'


2025-11-14 15:37:25,928 - INFO - Finished converting document 8-K_2023-05-26 in 0.16 sec.
2025-11-14 15:37:26,010 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:26,027 - INFO - Going to convert document batch...
2025-11-14 15:37:26,028 - INFO - Processing document 8-K_2023-08-03
2025-11-14 15:37:26,052 - INFO - Finished converting document 8-K_2023-08-03 in 0.08 sec.
2025-11-14 15:37:26,080 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:26,093 - INFO - Going to convert document batch...
2025-11-14 15:37:26,094 - INFO - Processing document 8-K_2023-09-13
2025-11-14 15:37:26,110 - INFO - Finished converting document 8-K_2023-09-13 in 0.05 sec.
2025-11-14 15:37:26,133 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:26,146 - INFO - Going to convert document batch...
2025-11-14 15:37:26,146 - INFO - Processing document 8-K_2023-10-26
2025-11-14 15:37:26,167 - INFO - Finished converting document 8-K_2023-10-26 in 0.

Converted 'data\edgar_documents\AMZN\8-K_2023-05-26' --> 'data\processed_data\AMZN\8-K_2023-05-26.md'
Converted 'data\edgar_documents\AMZN\8-K_2023-08-03' --> 'data\processed_data\AMZN\8-K_2023-08-03.md'
Converted 'data\edgar_documents\AMZN\8-K_2023-09-13' --> 'data\processed_data\AMZN\8-K_2023-09-13.md'


2025-11-14 15:37:26,203 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:26,217 - INFO - Going to convert document batch...
2025-11-14 15:37:26,217 - INFO - Processing document 8-K_2023-11-01
2025-11-14 15:37:26,251 - INFO - Finished converting document 8-K_2023-11-01 in 0.06 sec.
2025-11-14 15:37:26,305 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:26,318 - INFO - Going to convert document batch...
2025-11-14 15:37:26,319 - INFO - Processing document 8-K_2024-02-01


Converted 'data\edgar_documents\AMZN\8-K_2023-10-26' --> 'data\processed_data\AMZN\8-K_2023-10-26.md'
Converted 'data\edgar_documents\AMZN\8-K_2023-11-01' --> 'data\processed_data\AMZN\8-K_2023-11-01.md'


2025-11-14 15:37:26,373 - INFO - Finished converting document 8-K_2024-02-01 in 0.09 sec.
2025-11-14 15:37:26,409 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:26,421 - INFO - Going to convert document batch...
2025-11-14 15:37:26,422 - INFO - Processing document 8-K_2024-04-11
2025-11-14 15:37:26,446 - INFO - Finished converting document 8-K_2024-04-11 in 0.05 sec.
2025-11-14 15:37:26,473 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:26,483 - INFO - Going to convert document batch...
2025-11-14 15:37:26,484 - INFO - Processing document 8-K_2024-04-30
2025-11-14 15:37:26,504 - INFO - Finished converting document 8-K_2024-04-30 in 0.05 sec.
2025-11-14 15:37:26,559 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:26,570 - INFO - Going to convert document batch...
2025-11-14 15:37:26,571 - INFO - Processing document 8-K_2024-05-03
2025-11-14 15:37:26,594 - INFO - Finished converting document 8-K_2024-05-03 in 0.

Converted 'data\edgar_documents\AMZN\8-K_2024-02-01' --> 'data\processed_data\AMZN\8-K_2024-02-01.md'
Converted 'data\edgar_documents\AMZN\8-K_2024-04-11' --> 'data\processed_data\AMZN\8-K_2024-04-11.md'
Converted 'data\edgar_documents\AMZN\8-K_2024-04-30' --> 'data\processed_data\AMZN\8-K_2024-04-30.md'


2025-11-14 15:37:26,621 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:26,632 - INFO - Going to convert document batch...
2025-11-14 15:37:26,633 - INFO - Processing document 8-K_2024-05-14
2025-11-14 15:37:26,654 - INFO - Finished converting document 8-K_2024-05-14 in 0.05 sec.
2025-11-14 15:37:26,681 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:26,710 - INFO - Going to convert document batch...
2025-11-14 15:37:26,712 - INFO - Processing document 8-K_2024-05-24
2025-11-14 15:37:26,767 - INFO - Finished converting document 8-K_2024-05-24 in 0.09 sec.


Converted 'data\edgar_documents\AMZN\8-K_2024-05-03' --> 'data\processed_data\AMZN\8-K_2024-05-03.md'
Converted 'data\edgar_documents\AMZN\8-K_2024-05-14' --> 'data\processed_data\AMZN\8-K_2024-05-14.md'


2025-11-14 15:37:26,809 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:26,820 - INFO - Going to convert document batch...
2025-11-14 15:37:26,820 - INFO - Processing document 8-K_2024-08-01
2025-11-14 15:37:26,845 - INFO - Finished converting document 8-K_2024-08-01 in 0.05 sec.
2025-11-14 15:37:26,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:26,880 - INFO - Going to convert document batch...
2025-11-14 15:37:26,881 - INFO - Processing document 8-K_2024-10-31
2025-11-14 15:37:26,908 - INFO - Finished converting document 8-K_2024-10-31 in 0.05 sec.
2025-11-14 15:37:26,955 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:26,966 - INFO - Going to convert document batch...
2025-11-14 15:37:26,967 - INFO - Processing document 8-K_2025-02-06
2025-11-14 15:37:26,987 - INFO - Finished converting document 8-K_2025-02-06 in 0.06 sec.


Converted 'data\edgar_documents\AMZN\8-K_2024-05-24' --> 'data\processed_data\AMZN\8-K_2024-05-24.md'
Converted 'data\edgar_documents\AMZN\8-K_2024-08-01' --> 'data\processed_data\AMZN\8-K_2024-08-01.md'
Converted 'data\edgar_documents\AMZN\8-K_2024-10-31' --> 'data\processed_data\AMZN\8-K_2024-10-31.md'


2025-11-14 15:37:27,016 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:27,029 - INFO - Going to convert document batch...
2025-11-14 15:37:27,030 - INFO - Processing document 8-K_2025-04-10
2025-11-14 15:37:27,055 - INFO - Finished converting document 8-K_2025-04-10 in 0.05 sec.
2025-11-14 15:37:27,087 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:27,103 - INFO - Going to convert document batch...
2025-11-14 15:37:27,105 - INFO - Processing document 8-K_2025-05-01
2025-11-14 15:37:27,135 - INFO - Finished converting document 8-K_2025-05-01 in 0.06 sec.
2025-11-14 15:37:27,163 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:27,196 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AMZN\8-K_2025-02-06' --> 'data\processed_data\AMZN\8-K_2025-02-06.md'
Converted 'data\edgar_documents\AMZN\8-K_2025-04-10' --> 'data\processed_data\AMZN\8-K_2025-04-10.md'
Converted 'data\edgar_documents\AMZN\8-K_2025-05-01' --> 'data\processed_data\AMZN\8-K_2025-05-01.md'


2025-11-14 15:37:27,197 - INFO - Processing document 8-K_2025-05-22
2025-11-14 15:37:27,260 - INFO - Finished converting document 8-K_2025-05-22 in 0.12 sec.
2025-11-14 15:37:27,302 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:27,314 - INFO - Going to convert document batch...
2025-11-14 15:37:27,314 - INFO - Processing document 8-K_2025-07-31
2025-11-14 15:37:27,335 - INFO - Finished converting document 8-K_2025-07-31 in 0.05 sec.
2025-11-14 15:37:27,363 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:37:27,372 - INFO - Going to convert document batch...
2025-11-14 15:37:27,373 - INFO - Processing document 8-K_2025-10-30
2025-11-14 15:37:27,395 - INFO - Finished converting document 8-K_2025-10-30 in 0.05 sec.
2025-11-14 15:37:27,443 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:37:27,444 - ERROR - Input document DEF-14A_2023-04-13 with format None does not match any 

Converted 'data\edgar_documents\AMZN\8-K_2025-05-22' --> 'data\processed_data\AMZN\8-K_2025-05-22.md'
Converted 'data\edgar_documents\AMZN\8-K_2025-07-31' --> 'data\processed_data\AMZN\8-K_2025-07-31.md'
Converted 'data\edgar_documents\AMZN\8-K_2025-10-30' --> 'data\processed_data\AMZN\8-K_2025-10-30.md'
Error processing data\edgar_documents\AMZN\DEF-14A_2023-04-13: File format not allowed: data\edgar_documents\AMZN\DEF-14A_2023-04-13


2025-11-14 15:37:27,480 - ERROR - Input document DEF-14A_2024-04-11 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:37:27,481 - INFO - Going to convert document batch...
2025-11-14 15:37:27,512 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:37:27,512 - ERROR - Input document DEF-14A_2025-04-10 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: '

Error processing data\edgar_documents\AMZN\DEF-14A_2024-04-11: File format not allowed: data\edgar_documents\AMZN\DEF-14A_2024-04-11
Error processing data\edgar_documents\AMZN\DEF-14A_2025-04-10: File format not allowed: data\edgar_documents\AMZN\DEF-14A_2025-04-10
Processed 166 new files. Errors: 3
Found 156 files to process in data\edgar_documents\AVGO


2025-11-14 15:37:28,330 - INFO - Going to convert document batch...
2025-11-14 15:37:28,330 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:37:28,331 - INFO - Processing document 10-K_2023-12-14
2025-11-14 15:37:29,611 - INFO - Finished converting document 10-K_2023-12-14 in 2.09 sec.
2025-11-14 15:37:30,236 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\10-K_2023-12-14' --> 'data\processed_data\AVGO\10-K_2023-12-14.md'


2025-11-14 15:37:31,075 - INFO - Going to convert document batch...
2025-11-14 15:37:31,076 - INFO - Processing document 10-K_2024-12-20
2025-11-14 15:37:32,508 - INFO - Finished converting document 10-K_2024-12-20 in 2.31 sec.
2025-11-14 15:37:33,194 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\10-K_2024-12-20' --> 'data\processed_data\AVGO\10-K_2024-12-20.md'


2025-11-14 15:37:33,851 - INFO - Going to convert document batch...
2025-11-14 15:37:33,852 - INFO - Processing document 10-Q_2023-03-08
2025-11-14 15:37:34,572 - INFO - Finished converting document 10-Q_2023-03-08 in 1.41 sec.
2025-11-14 15:37:35,316 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\10-Q_2023-03-08' --> 'data\processed_data\AVGO\10-Q_2023-03-08.md'


2025-11-14 15:37:36,235 - INFO - Going to convert document batch...
2025-11-14 15:37:36,237 - INFO - Processing document 10-Q_2023-06-07
2025-11-14 15:37:38,225 - INFO - Finished converting document 10-Q_2023-06-07 in 2.94 sec.
2025-11-14 15:37:39,238 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\10-Q_2023-06-07' --> 'data\processed_data\AVGO\10-Q_2023-06-07.md'


2025-11-14 15:37:41,148 - INFO - Going to convert document batch...
2025-11-14 15:37:41,149 - INFO - Processing document 10-Q_2023-09-06
2025-11-14 15:37:43,051 - INFO - Finished converting document 10-Q_2023-09-06 in 3.84 sec.
2025-11-14 15:37:44,393 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\10-Q_2023-09-06' --> 'data\processed_data\AVGO\10-Q_2023-09-06.md'


2025-11-14 15:37:45,242 - INFO - Going to convert document batch...
2025-11-14 15:37:45,243 - INFO - Processing document 10-Q_2024-03-14
2025-11-14 15:37:47,461 - INFO - Finished converting document 10-Q_2024-03-14 in 3.09 sec.
2025-11-14 15:37:48,567 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\10-Q_2024-03-14' --> 'data\processed_data\AVGO\10-Q_2024-03-14.md'


2025-11-14 15:37:50,647 - INFO - Going to convert document batch...
2025-11-14 15:37:50,648 - INFO - Processing document 10-Q_2024-06-13
2025-11-14 15:37:53,258 - INFO - Finished converting document 10-Q_2024-06-13 in 4.73 sec.
2025-11-14 15:37:54,486 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\10-Q_2024-06-13' --> 'data\processed_data\AVGO\10-Q_2024-06-13.md'


2025-11-14 15:37:56,283 - INFO - Going to convert document batch...
2025-11-14 15:37:56,286 - INFO - Processing document 10-Q_2024-09-11
2025-11-14 15:37:58,768 - INFO - Finished converting document 10-Q_2024-09-11 in 4.31 sec.
2025-11-14 15:38:00,066 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\10-Q_2024-09-11' --> 'data\processed_data\AVGO\10-Q_2024-09-11.md'


2025-11-14 15:38:01,074 - INFO - Going to convert document batch...
2025-11-14 15:38:01,075 - INFO - Processing document 10-Q_2025-03-12
2025-11-14 15:38:02,646 - INFO - Finished converting document 10-Q_2025-03-12 in 2.66 sec.
2025-11-14 15:38:03,705 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\10-Q_2025-03-12' --> 'data\processed_data\AVGO\10-Q_2025-03-12.md'


2025-11-14 15:38:05,755 - INFO - Going to convert document batch...
2025-11-14 15:38:05,756 - INFO - Processing document 10-Q_2025-06-11
2025-11-14 15:38:07,675 - INFO - Finished converting document 10-Q_2025-06-11 in 4.05 sec.
2025-11-14 15:38:08,763 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\10-Q_2025-06-11' --> 'data\processed_data\AVGO\10-Q_2025-06-11.md'


2025-11-14 15:38:10,591 - INFO - Going to convert document batch...
2025-11-14 15:38:10,592 - INFO - Processing document 10-Q_2025-09-10
2025-11-14 15:38:13,028 - INFO - Finished converting document 10-Q_2025-09-10 in 4.33 sec.
2025-11-14 15:38:14,468 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:14,486 - INFO - Going to convert document batch...
2025-11-14 15:38:14,487 - INFO - Processing document 4_2023-01-06
2025-11-14 15:38:14,555 - INFO - Finished converting document 4_2023-01-06 in 0.09 sec.
2025-11-14 15:38:14,653 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\AVGO\10-Q_2025-09-10' --> 'data\processed_data\AVGO\10-Q_2025-09-10.md'
Converted 'data\edgar_documents\AVGO\4_2023-01-06' --> 'data\processed_data\AVGO\4_2023-01-06.md'


2025-11-14 15:38:14,654 - ERROR - Input document 4_2023-01-09 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38:14,655 - INFO - Going to convert document batch...
2025-11-14 15:38:14,692 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:14,693 - ERROR - Input document 4_2023-01-12 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\AVGO\4_2023-01-09: File format not allowed: data\edgar_documents\AVGO\4_2023-01-09
Error processing data\edgar_documents\AVGO\4_2023-01-12: File format not allowed: data\edgar_documents\AVGO\4_2023-01-12
Error processing data\edgar_documents\AVGO\4_2023-01-23: File format not allowed: data\edgar_documents\AVGO\4_2023-01-23
Error processing data\edgar_documents\AVGO\4_2023-01-31: File format not allowed: data\edgar_documents\AVGO\4_2023-01-31
Error processing data\edgar_documents\AVGO\4_2023-02-09: File format not allowed: data\edgar_documents\AVGO\4_2023-02-09


2025-11-14 15:38:14,847 - ERROR - Input document 4_2023-02-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38:14,849 - INFO - Going to convert document batch...
2025-11-14 15:38:14,874 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:14,876 - ERROR - Input document 4_2023-03-09 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\AVGO\4_2023-02-15: File format not allowed: data\edgar_documents\AVGO\4_2023-02-15
Error processing data\edgar_documents\AVGO\4_2023-03-09: File format not allowed: data\edgar_documents\AVGO\4_2023-03-09
Converted 'data\edgar_documents\AVGO\4_2023-03-10' --> 'data\processed_data\AVGO\4_2023-03-10.md'


2025-11-14 15:38:15,059 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:15,061 - ERROR - Input document 4_2023-03-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38:15,063 - INFO - Going to convert document batch...
2025-11-14 15:38:15,087 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:15,116 - INFO - Going to convert document batch...
2025-11-14 15:38:15,118 - INFO - Processing document 4_2023-03-16
2025-11-14 15:38:15,187 - INFO - Fin

Error processing data\edgar_documents\AVGO\4_2023-03-15: File format not allowed: data\edgar_documents\AVGO\4_2023-03-15
Converted 'data\edgar_documents\AVGO\4_2023-03-16' --> 'data\processed_data\AVGO\4_2023-03-16.md'


2025-11-14 15:38:15,300 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:15,339 - INFO - Going to convert document batch...
2025-11-14 15:38:15,343 - INFO - Processing document 4_2023-03-17
2025-11-14 15:38:15,411 - INFO - Finished converting document 4_2023-03-17 in 0.14 sec.
2025-11-14 15:38:15,465 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:15,487 - INFO - Going to convert document batch...
2025-11-14 15:38:15,490 - INFO - Processing document 4_2023-03-20
2025-11-14 15:38:15,540 - INFO - Finished converting document 4_2023-03-20 in 0.08 sec.
2025-11-14 15:38:15,621 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\4_2023-03-17' --> 'data\processed_data\AVGO\4_2023-03-17.md'
Converted 'data\edgar_documents\AVGO\4_2023-03-20' --> 'data\processed_data\AVGO\4_2023-03-20.md'


2025-11-14 15:38:15,649 - INFO - Going to convert document batch...
2025-11-14 15:38:15,652 - INFO - Processing document 4_2023-03-29
2025-11-14 15:38:15,737 - INFO - Finished converting document 4_2023-03-29 in 0.14 sec.
2025-11-14 15:38:15,833 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:15,834 - ERROR - Input document 4_2023-03-30 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38:15,836 - INFO - Going to convert document batch...
2025-11-14 15:38:15,851 - IN

Converted 'data\edgar_documents\AVGO\4_2023-03-29' --> 'data\processed_data\AVGO\4_2023-03-29.md'
Error processing data\edgar_documents\AVGO\4_2023-03-30: File format not allowed: data\edgar_documents\AVGO\4_2023-03-30
Converted 'data\edgar_documents\AVGO\4_2023-04-05' --> 'data\processed_data\AVGO\4_2023-04-05.md'


2025-11-14 15:38:16,025 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:16,027 - ERROR - Input document 4_2023-04-25 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38:16,029 - INFO - Going to convert document batch...
2025-11-14 15:38:16,051 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:16,052 - ERROR - Input document 4_2023-05-04 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\AVGO\4_2023-04-25: File format not allowed: data\edgar_documents\AVGO\4_2023-04-25
Error processing data\edgar_documents\AVGO\4_2023-05-04: File format not allowed: data\edgar_documents\AVGO\4_2023-05-04
Error processing data\edgar_documents\AVGO\4_2023-06-07: File format not allowed: data\edgar_documents\AVGO\4_2023-06-07


2025-11-14 15:38:16,259 - INFO - Finished converting document 4_2023-06-12 in 0.14 sec.
2025-11-14 15:38:16,373 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:16,374 - ERROR - Input document 4_2023-06-26 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38:16,376 - INFO - Going to convert document batch...
2025-11-14 15:38:16,393 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:16,395 - ERROR - Input document 4_2023-06-27 with forma

Converted 'data\edgar_documents\AVGO\4_2023-06-12' --> 'data\processed_data\AVGO\4_2023-06-12.md'
Error processing data\edgar_documents\AVGO\4_2023-06-26: File format not allowed: data\edgar_documents\AVGO\4_2023-06-26
Error processing data\edgar_documents\AVGO\4_2023-06-27: File format not allowed: data\edgar_documents\AVGO\4_2023-06-27


2025-11-14 15:38:16,607 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:16,609 - ERROR - Input document 4_2023-06-30 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38:16,611 - INFO - Going to convert document batch...
2025-11-14 15:38:16,653 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:16,655 - ERROR - Input document 4_2023-07-12 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\AVGO\4_2023-06-29' --> 'data\processed_data\AVGO\4_2023-06-29.md'
Error processing data\edgar_documents\AVGO\4_2023-06-30: File format not allowed: data\edgar_documents\AVGO\4_2023-06-30
Error processing data\edgar_documents\AVGO\4_2023-07-12: File format not allowed: data\edgar_documents\AVGO\4_2023-07-12
Error processing data\edgar_documents\AVGO\4_2023-08-21: File format not allowed: data\edgar_documents\AVGO\4_2023-08-21
Error processing data\edgar_documents\AVGO\4_2023-08-28: File format not allowed: data\edgar_documents\AVGO\4_2023-08-28


2025-11-14 15:38:16,782 - INFO - Going to convert document batch...
2025-11-14 15:38:16,785 - INFO - Processing document 4_2023-09-08
2025-11-14 15:38:16,841 - INFO - Finished converting document 4_2023-09-08 in 0.11 sec.
2025-11-14 15:38:16,903 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:16,948 - INFO - Going to convert document batch...
2025-11-14 15:38:16,951 - INFO - Processing document 4_2023-09-14
2025-11-14 15:38:17,009 - INFO - Finished converting document 4_2023-09-14 in 0.11 sec.


Converted 'data\edgar_documents\AVGO\4_2023-09-08' --> 'data\processed_data\AVGO\4_2023-09-08.md'
Converted 'data\edgar_documents\AVGO\4_2023-09-14' --> 'data\processed_data\AVGO\4_2023-09-14.md'


2025-11-14 15:38:17,092 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:17,111 - INFO - Going to convert document batch...
2025-11-14 15:38:17,113 - INFO - Processing document 4_2023-09-19
2025-11-14 15:38:17,175 - INFO - Finished converting document 4_2023-09-19 in 0.11 sec.
2025-11-14 15:38:17,271 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:17,300 - INFO - Going to convert document batch...
2025-11-14 15:38:17,303 - INFO - Processing document 4_2023-09-26
2025-11-14 15:38:17,362 - INFO - Finished converting document 4_2023-09-26 in 0.11 sec.


Converted 'data\edgar_documents\AVGO\4_2023-09-19' --> 'data\processed_data\AVGO\4_2023-09-19.md'
Converted 'data\edgar_documents\AVGO\4_2023-09-26' --> 'data\processed_data\AVGO\4_2023-09-26.md'


2025-11-14 15:38:17,450 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:17,483 - INFO - Going to convert document batch...
2025-11-14 15:38:17,486 - INFO - Processing document 4_2023-10-06
2025-11-14 15:38:17,557 - INFO - Finished converting document 4_2023-10-06 in 0.14 sec.
2025-11-14 15:38:17,647 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:17,649 - ERROR - Input document 4_2023-10-18 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38

Converted 'data\edgar_documents\AVGO\4_2023-10-06' --> 'data\processed_data\AVGO\4_2023-10-06.md'
Error processing data\edgar_documents\AVGO\4_2023-10-18: File format not allowed: data\edgar_documents\AVGO\4_2023-10-18
Error processing data\edgar_documents\AVGO\4_2023-10-30: File format not allowed: data\edgar_documents\AVGO\4_2023-10-30


2025-11-14 15:38:17,885 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:17,923 - INFO - Going to convert document batch...
2025-11-14 15:38:17,925 - INFO - Processing document 4_2023-12-15
2025-11-14 15:38:18,007 - INFO - Finished converting document 4_2023-12-15 in 0.12 sec.


Converted 'data\edgar_documents\AVGO\4_2023-11-07' --> 'data\processed_data\AVGO\4_2023-11-07.md'
Converted 'data\edgar_documents\AVGO\4_2023-12-15' --> 'data\processed_data\AVGO\4_2023-12-15.md'


2025-11-14 15:38:18,110 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:18,144 - INFO - Going to convert document batch...
2025-11-14 15:38:18,147 - INFO - Processing document 4_2023-12-18
2025-11-14 15:38:18,209 - INFO - Finished converting document 4_2023-12-18 in 0.12 sec.
2025-11-14 15:38:18,294 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:18,322 - INFO - Going to convert document batch...
2025-11-14 15:38:18,325 - INFO - Processing document 4_2023-12-19
2025-11-14 15:38:18,380 - INFO - Finished converting document 4_2023-12-19 in 0.09 sec.
2025-11-14 15:38:18,433 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\4_2023-12-18' --> 'data\processed_data\AVGO\4_2023-12-18.md'
Converted 'data\edgar_documents\AVGO\4_2023-12-19' --> 'data\processed_data\AVGO\4_2023-12-19.md'


2025-11-14 15:38:18,519 - INFO - Going to convert document batch...
2025-11-14 15:38:18,522 - INFO - Processing document 4_2023-12-22
2025-11-14 15:38:18,664 - INFO - Finished converting document 4_2023-12-22 in 0.23 sec.
2025-11-14 15:38:18,735 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:18,750 - INFO - Going to convert document batch...
2025-11-14 15:38:18,751 - INFO - Processing document 4_2024-01-08
2025-11-14 15:38:18,797 - INFO - Finished converting document 4_2024-01-08 in 0.08 sec.
2025-11-14 15:38:18,868 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:18,883 - INFO - Going to convert document batch...
2025-11-14 15:38:18,883 - INFO - Processing document 4_2024-01-09


Converted 'data\edgar_documents\AVGO\4_2023-12-22' --> 'data\processed_data\AVGO\4_2023-12-22.md'
Converted 'data\edgar_documents\AVGO\4_2024-01-08' --> 'data\processed_data\AVGO\4_2024-01-08.md'


2025-11-14 15:38:18,937 - INFO - Finished converting document 4_2024-01-09 in 0.09 sec.
2025-11-14 15:38:18,992 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:19,008 - INFO - Going to convert document batch...
2025-11-14 15:38:19,009 - INFO - Processing document 4_2024-02-07
2025-11-14 15:38:19,055 - INFO - Finished converting document 4_2024-02-07 in 0.06 sec.
2025-11-14 15:38:19,122 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:19,152 - INFO - Going to convert document batch...
2025-11-14 15:38:19,155 - INFO - Processing document 4_2024-03-07


Converted 'data\edgar_documents\AVGO\4_2024-01-09' --> 'data\processed_data\AVGO\4_2024-01-09.md'
Converted 'data\edgar_documents\AVGO\4_2024-02-07' --> 'data\processed_data\AVGO\4_2024-02-07.md'


2025-11-14 15:38:19,223 - INFO - Finished converting document 4_2024-03-07 in 0.12 sec.
2025-11-14 15:38:19,312 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:19,347 - INFO - Going to convert document batch...
2025-11-14 15:38:19,351 - INFO - Processing document 4_2024-03-14
2025-11-14 15:38:19,403 - INFO - Finished converting document 4_2024-03-14 in 0.11 sec.
2025-11-14 15:38:19,487 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\4_2024-03-07' --> 'data\processed_data\AVGO\4_2024-03-07.md'
Converted 'data\edgar_documents\AVGO\4_2024-03-14' --> 'data\processed_data\AVGO\4_2024-03-14.md'


2025-11-14 15:38:19,528 - INFO - Going to convert document batch...
2025-11-14 15:38:19,530 - INFO - Processing document 4_2024-03-19
2025-11-14 15:38:19,590 - INFO - Finished converting document 4_2024-03-19 in 0.14 sec.
2025-11-14 15:38:19,672 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:19,712 - INFO - Going to convert document batch...
2025-11-14 15:38:19,714 - INFO - Processing document 4_2024-03-21
2025-11-14 15:38:19,775 - INFO - Finished converting document 4_2024-03-21 in 0.11 sec.


Converted 'data\edgar_documents\AVGO\4_2024-03-19' --> 'data\processed_data\AVGO\4_2024-03-19.md'
Converted 'data\edgar_documents\AVGO\4_2024-03-21' --> 'data\processed_data\AVGO\4_2024-03-21.md'


2025-11-14 15:38:19,867 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:19,894 - INFO - Going to convert document batch...
2025-11-14 15:38:19,896 - INFO - Processing document 4_2024-03-27
2025-11-14 15:38:19,937 - INFO - Finished converting document 4_2024-03-27 in 0.11 sec.
2025-11-14 15:38:19,985 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:20,001 - INFO - Going to convert document batch...
2025-11-14 15:38:20,002 - INFO - Processing document 4_2024-04-01
2025-11-14 15:38:20,049 - INFO - Finished converting document 4_2024-04-01 in 0.08 sec.


Converted 'data\edgar_documents\AVGO\4_2024-03-27' --> 'data\processed_data\AVGO\4_2024-03-27.md'
Converted 'data\edgar_documents\AVGO\4_2024-04-01' --> 'data\processed_data\AVGO\4_2024-04-01.md'


2025-11-14 15:38:20,153 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:20,171 - INFO - Going to convert document batch...
2025-11-14 15:38:20,172 - INFO - Processing document 4_2024-04-04
2025-11-14 15:38:20,217 - INFO - Finished converting document 4_2024-04-04 in 0.09 sec.
2025-11-14 15:38:20,283 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:20,308 - INFO - Going to convert document batch...
2025-11-14 15:38:20,310 - INFO - Processing document 4_2024-04-05
2025-11-14 15:38:20,360 - INFO - Finished converting document 4_2024-04-05 in 0.11 sec.


Converted 'data\edgar_documents\AVGO\4_2024-04-04' --> 'data\processed_data\AVGO\4_2024-04-04.md'
Converted 'data\edgar_documents\AVGO\4_2024-04-05' --> 'data\processed_data\AVGO\4_2024-04-05.md'


2025-11-14 15:38:20,442 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:20,466 - INFO - Going to convert document batch...
2025-11-14 15:38:20,468 - INFO - Processing document 4_2024-04-09
2025-11-14 15:38:20,538 - INFO - Finished converting document 4_2024-04-09 in 0.12 sec.
2025-11-14 15:38:20,623 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:20,653 - INFO - Going to convert document batch...
2025-11-14 15:38:20,656 - INFO - Processing document 4_2024-04-12
2025-11-14 15:38:20,731 - INFO - Finished converting document 4_2024-04-12 in 0.12 sec.


Converted 'data\edgar_documents\AVGO\4_2024-04-09' --> 'data\processed_data\AVGO\4_2024-04-09.md'
Converted 'data\edgar_documents\AVGO\4_2024-04-12' --> 'data\processed_data\AVGO\4_2024-04-12.md'


2025-11-14 15:38:20,791 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:20,815 - INFO - Going to convert document batch...
2025-11-14 15:38:20,816 - INFO - Processing document 4_2024-04-17
2025-11-14 15:38:20,880 - INFO - Finished converting document 4_2024-04-17 in 0.11 sec.
2025-11-14 15:38:20,964 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:20,994 - INFO - Going to convert document batch...
2025-11-14 15:38:20,996 - INFO - Processing document 4_2024-04-24
2025-11-14 15:38:21,052 - INFO - Finished converting document 4_2024-04-24 in 0.11 sec.
2025-11-14 15:38:21,110 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:21,126 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AVGO\4_2024-04-17' --> 'data\processed_data\AVGO\4_2024-04-17.md'
Converted 'data\edgar_documents\AVGO\4_2024-04-24' --> 'data\processed_data\AVGO\4_2024-04-24.md'


2025-11-14 15:38:21,128 - INFO - Processing document 4_2024-06-20
2025-11-14 15:38:21,200 - INFO - Finished converting document 4_2024-06-20 in 0.11 sec.
2025-11-14 15:38:21,289 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:21,324 - INFO - Going to convert document batch...
2025-11-14 15:38:21,327 - INFO - Processing document 4_2024-06-24
2025-11-14 15:38:21,373 - INFO - Finished converting document 4_2024-06-24 in 0.09 sec.
2025-11-14 15:38:21,438 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\4_2024-06-20' --> 'data\processed_data\AVGO\4_2024-06-20.md'
Converted 'data\edgar_documents\AVGO\4_2024-06-24' --> 'data\processed_data\AVGO\4_2024-06-24.md'


2025-11-14 15:38:21,461 - INFO - Going to convert document batch...
2025-11-14 15:38:21,462 - INFO - Processing document 4_2024-06-25
2025-11-14 15:38:21,494 - INFO - Finished converting document 4_2024-06-25 in 0.09 sec.
2025-11-14 15:38:21,555 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:21,589 - INFO - Going to convert document batch...
2025-11-14 15:38:21,591 - INFO - Processing document 4_2024-06-27
2025-11-14 15:38:21,657 - INFO - Finished converting document 4_2024-06-27 in 0.12 sec.


Converted 'data\edgar_documents\AVGO\4_2024-06-25' --> 'data\processed_data\AVGO\4_2024-06-25.md'


2025-11-14 15:38:21,765 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:21,766 - ERROR - Input document 4_2024-07-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38:21,770 - INFO - Going to convert document batch...
2025-11-14 15:38:21,783 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:21,812 - INFO - Going to convert document batch...
2025-11-14 15:38:21,813 - INFO - Processing document 4_2024-07-09
2025-11-14 15:38:21,856 - INFO - Fin

Converted 'data\edgar_documents\AVGO\4_2024-06-27' --> 'data\processed_data\AVGO\4_2024-06-27.md'
Error processing data\edgar_documents\AVGO\4_2024-07-08: File format not allowed: data\edgar_documents\AVGO\4_2024-07-08
Converted 'data\edgar_documents\AVGO\4_2024-07-09' --> 'data\processed_data\AVGO\4_2024-07-09.md'


2025-11-14 15:38:21,979 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:21,982 - ERROR - Input document 4_2024-07-10 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38:21,984 - INFO - Going to convert document batch...
2025-11-14 15:38:22,001 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:22,033 - INFO - Going to convert document batch...
2025-11-14 15:38:22,036 - INFO - Processing document 4_2024-07-15
2025-11-14 15:38:22,079 - INFO - Fin

Error processing data\edgar_documents\AVGO\4_2024-07-10: File format not allowed: data\edgar_documents\AVGO\4_2024-07-10
Converted 'data\edgar_documents\AVGO\4_2024-07-15' --> 'data\processed_data\AVGO\4_2024-07-15.md'


2025-11-14 15:38:22,183 - INFO - Processing document 4_2024-09-19
2025-11-14 15:38:22,253 - INFO - Finished converting document 4_2024-09-19 in 0.12 sec.
2025-11-14 15:38:22,318 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:22,344 - INFO - Going to convert document batch...
2025-11-14 15:38:22,346 - INFO - Processing document 4_2024-09-23
2025-11-14 15:38:22,393 - INFO - Finished converting document 4_2024-09-23 in 0.09 sec.
2025-11-14 15:38:22,486 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\4_2024-09-19' --> 'data\processed_data\AVGO\4_2024-09-19.md'
Converted 'data\edgar_documents\AVGO\4_2024-09-23' --> 'data\processed_data\AVGO\4_2024-09-23.md'


2025-11-14 15:38:22,513 - INFO - Going to convert document batch...
2025-11-14 15:38:22,514 - INFO - Processing document 4_2024-09-26
2025-11-14 15:38:22,575 - INFO - Finished converting document 4_2024-09-26 in 0.12 sec.
2025-11-14 15:38:22,656 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:22,681 - INFO - Going to convert document batch...
2025-11-14 15:38:22,683 - INFO - Processing document 4_2024-09-27
2025-11-14 15:38:22,742 - INFO - Finished converting document 4_2024-09-27 in 0.09 sec.
2025-11-14 15:38:22,821 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:22,823 - ERROR - Input document 4_2024-09-30 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <Input

Converted 'data\edgar_documents\AVGO\4_2024-09-26' --> 'data\processed_data\AVGO\4_2024-09-26.md'
Converted 'data\edgar_documents\AVGO\4_2024-09-27' --> 'data\processed_data\AVGO\4_2024-09-27.md'


2025-11-14 15:38:22,826 - INFO - Going to convert document batch...
2025-11-14 15:38:22,852 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:22,885 - INFO - Going to convert document batch...
2025-11-14 15:38:22,889 - INFO - Processing document 4_2024-10-03
2025-11-14 15:38:22,964 - INFO - Finished converting document 4_2024-10-03 in 0.14 sec.


Error processing data\edgar_documents\AVGO\4_2024-09-30: File format not allowed: data\edgar_documents\AVGO\4_2024-09-30
Converted 'data\edgar_documents\AVGO\4_2024-10-03' --> 'data\processed_data\AVGO\4_2024-10-03.md'


2025-11-14 15:38:23,036 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:23,067 - INFO - Going to convert document batch...
2025-11-14 15:38:23,070 - INFO - Processing document 4_2024-10-07
2025-11-14 15:38:23,120 - INFO - Finished converting document 4_2024-10-07 in 0.12 sec.
2025-11-14 15:38:23,174 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:23,191 - INFO - Going to convert document batch...
2025-11-14 15:38:23,193 - INFO - Processing document 4_2024-10-09
2025-11-14 15:38:23,277 - INFO - Finished converting document 4_2024-10-09 in 0.12 sec.


Converted 'data\edgar_documents\AVGO\4_2024-10-07' --> 'data\processed_data\AVGO\4_2024-10-07.md'
Converted 'data\edgar_documents\AVGO\4_2024-10-09' --> 'data\processed_data\AVGO\4_2024-10-09.md'


2025-11-14 15:38:23,360 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:23,387 - INFO - Going to convert document batch...
2025-11-14 15:38:23,389 - INFO - Processing document 4_2024-10-11
2025-11-14 15:38:23,453 - INFO - Finished converting document 4_2024-10-11 in 0.12 sec.
2025-11-14 15:38:23,533 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:23,567 - INFO - Going to convert document batch...
2025-11-14 15:38:23,568 - INFO - Processing document 4_2024-10-16
2025-11-14 15:38:23,630 - INFO - Finished converting document 4_2024-10-16 in 0.11 sec.


Converted 'data\edgar_documents\AVGO\4_2024-10-11' --> 'data\processed_data\AVGO\4_2024-10-11.md'
Converted 'data\edgar_documents\AVGO\4_2024-10-16' --> 'data\processed_data\AVGO\4_2024-10-16.md'


2025-11-14 15:38:23,722 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:23,774 - INFO - Going to convert document batch...
2025-11-14 15:38:23,776 - INFO - Processing document 4_2024-11-08
2025-11-14 15:38:23,837 - INFO - Finished converting document 4_2024-11-08 in 0.14 sec.
2025-11-14 15:38:23,921 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:23,938 - INFO - Going to convert document batch...
2025-11-14 15:38:23,940 - INFO - Processing document 4_2024-12-18
2025-11-14 15:38:23,997 - INFO - Finished converting document 4_2024-12-18 in 0.11 sec.


Converted 'data\edgar_documents\AVGO\4_2024-11-08' --> 'data\processed_data\AVGO\4_2024-11-08.md'
Converted 'data\edgar_documents\AVGO\4_2024-12-18' --> 'data\processed_data\AVGO\4_2024-12-18.md'


2025-11-14 15:38:24,096 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:24,114 - INFO - Going to convert document batch...
2025-11-14 15:38:24,116 - INFO - Processing document 4_2024-12-19
2025-11-14 15:38:24,183 - INFO - Finished converting document 4_2024-12-19 in 0.12 sec.
2025-11-14 15:38:24,281 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:24,312 - INFO - Going to convert document batch...
2025-11-14 15:38:24,315 - INFO - Processing document 4_2024-12-26
2025-11-14 15:38:24,375 - INFO - Finished converting document 4_2024-12-26 in 0.12 sec.


Converted 'data\edgar_documents\AVGO\4_2024-12-19' --> 'data\processed_data\AVGO\4_2024-12-19.md'
Converted 'data\edgar_documents\AVGO\4_2024-12-26' --> 'data\processed_data\AVGO\4_2024-12-26.md'


2025-11-14 15:38:24,459 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:24,490 - INFO - Going to convert document batch...
2025-11-14 15:38:24,492 - INFO - Processing document 4_2024-12-27
2025-11-14 15:38:24,549 - INFO - Finished converting document 4_2024-12-27 in 0.12 sec.
2025-11-14 15:38:24,662 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\4_2024-12-27' --> 'data\processed_data\AVGO\4_2024-12-27.md'


2025-11-14 15:38:25,601 - INFO - Going to convert document batch...
2025-11-14 15:38:25,602 - INFO - Processing document 4_2025-01-06
2025-11-14 15:38:25,689 - INFO - Finished converting document 4_2025-01-06 in 1.05 sec.
2025-11-14 15:38:25,796 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:25,821 - INFO - Going to convert document batch...
2025-11-14 15:38:25,823 - INFO - Processing document 4_2025-01-08
2025-11-14 15:38:25,880 - INFO - Finished converting document 4_2025-01-08 in 0.11 sec.
2025-11-14 15:38:25,953 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\4_2025-01-06' --> 'data\processed_data\AVGO\4_2025-01-06.md'
Converted 'data\edgar_documents\AVGO\4_2025-01-08' --> 'data\processed_data\AVGO\4_2025-01-08.md'


2025-11-14 15:38:25,986 - INFO - Going to convert document batch...
2025-11-14 15:38:25,988 - INFO - Processing document 4_2025-01-10
2025-11-14 15:38:26,059 - INFO - Finished converting document 4_2025-01-10 in 0.12 sec.
2025-11-14 15:38:26,145 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:26,172 - INFO - Going to convert document batch...
2025-11-14 15:38:26,174 - INFO - Processing document 4_2025-03-06
2025-11-14 15:38:26,256 - INFO - Finished converting document 4_2025-03-06 in 0.14 sec.


Converted 'data\edgar_documents\AVGO\4_2025-01-10' --> 'data\processed_data\AVGO\4_2025-01-10.md'
Converted 'data\edgar_documents\AVGO\4_2025-03-06' --> 'data\processed_data\AVGO\4_2025-03-06.md'


2025-11-14 15:38:26,351 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:26,383 - INFO - Going to convert document batch...
2025-11-14 15:38:26,387 - INFO - Processing document 4_2025-03-18
2025-11-14 15:38:26,455 - INFO - Finished converting document 4_2025-03-18 in 0.14 sec.
2025-11-14 15:38:26,551 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:26,588 - INFO - Going to convert document batch...
2025-11-14 15:38:26,590 - INFO - Processing document 4_2025-03-19
2025-11-14 15:38:26,659 - INFO - Finished converting document 4_2025-03-19 in 0.14 sec.


Converted 'data\edgar_documents\AVGO\4_2025-03-18' --> 'data\processed_data\AVGO\4_2025-03-18.md'
Converted 'data\edgar_documents\AVGO\4_2025-03-19' --> 'data\processed_data\AVGO\4_2025-03-19.md'


2025-11-14 15:38:26,755 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:26,790 - INFO - Going to convert document batch...
2025-11-14 15:38:26,793 - INFO - Processing document 4_2025-03-26
2025-11-14 15:38:26,840 - INFO - Finished converting document 4_2025-03-26 in 0.14 sec.
2025-11-14 15:38:26,914 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:26,976 - INFO - Going to convert document batch...
2025-11-14 15:38:26,979 - INFO - Processing document 4_2025-03-28


Converted 'data\edgar_documents\AVGO\4_2025-03-26' --> 'data\processed_data\AVGO\4_2025-03-26.md'


2025-11-14 15:38:27,101 - INFO - Finished converting document 4_2025-03-28 in 0.20 sec.
2025-11-14 15:38:27,227 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:27,251 - INFO - Going to convert document batch...
2025-11-14 15:38:27,252 - INFO - Processing document 4_2025-04-15
2025-11-14 15:38:27,290 - INFO - Finished converting document 4_2025-04-15 in 0.08 sec.
2025-11-14 15:38:27,343 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:27,360 - INFO - Going to convert document batch...
2025-11-14 15:38:27,361 - INFO - Processing document 4_2025-04-16
2025-11-14 15:38:27,399 - INFO - Finished converting document 4_2025-04-16 in 0.06 sec.


Converted 'data\edgar_documents\AVGO\4_2025-03-28' --> 'data\processed_data\AVGO\4_2025-03-28.md'
Converted 'data\edgar_documents\AVGO\4_2025-04-15' --> 'data\processed_data\AVGO\4_2025-04-15.md'


2025-11-14 15:38:27,480 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:27,509 - INFO - Going to convert document batch...
2025-11-14 15:38:27,513 - INFO - Processing document 4_2025-04-23
2025-11-14 15:38:27,579 - INFO - Finished converting document 4_2025-04-23 in 0.11 sec.


Converted 'data\edgar_documents\AVGO\4_2025-04-16' --> 'data\processed_data\AVGO\4_2025-04-16.md'
Converted 'data\edgar_documents\AVGO\4_2025-04-23' --> 'data\processed_data\AVGO\4_2025-04-23.md'


2025-11-14 15:38:27,676 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:27,694 - INFO - Going to convert document batch...
2025-11-14 15:38:27,696 - INFO - Processing document 4_2025-05-16
2025-11-14 15:38:27,752 - INFO - Finished converting document 4_2025-05-16 in 0.11 sec.
2025-11-14 15:38:27,823 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:27,859 - INFO - Going to convert document batch...
2025-11-14 15:38:27,861 - INFO - Processing document 4_2025-06-13
2025-11-14 15:38:27,917 - INFO - Finished converting document 4_2025-06-13 in 0.11 sec.
2025-11-14 15:38:28,014 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\4_2025-05-16' --> 'data\processed_data\AVGO\4_2025-05-16.md'
Converted 'data\edgar_documents\AVGO\4_2025-06-13' --> 'data\processed_data\AVGO\4_2025-06-13.md'


2025-11-14 15:38:28,031 - INFO - Going to convert document batch...
2025-11-14 15:38:28,032 - INFO - Processing document 4_2025-06-16
2025-11-14 15:38:28,102 - INFO - Finished converting document 4_2025-06-16 in 0.11 sec.
2025-11-14 15:38:28,169 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:28,189 - INFO - Going to convert document batch...
2025-11-14 15:38:28,192 - INFO - Processing document 4_2025-06-18
2025-11-14 15:38:28,263 - INFO - Finished converting document 4_2025-06-18 in 0.11 sec.
2025-11-14 15:38:28,336 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\4_2025-06-16' --> 'data\processed_data\AVGO\4_2025-06-16.md'
Converted 'data\edgar_documents\AVGO\4_2025-06-18' --> 'data\processed_data\AVGO\4_2025-06-18.md'


2025-11-14 15:38:28,362 - INFO - Going to convert document batch...
2025-11-14 15:38:28,364 - INFO - Processing document 4_2025-06-23
2025-11-14 15:38:28,432 - INFO - Finished converting document 4_2025-06-23 in 0.12 sec.
2025-11-14 15:38:28,514 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:28,545 - INFO - Going to convert document batch...
2025-11-14 15:38:28,547 - INFO - Processing document 4_2025-06-25
2025-11-14 15:38:28,612 - INFO - Finished converting document 4_2025-06-25 in 0.11 sec.


Converted 'data\edgar_documents\AVGO\4_2025-06-23' --> 'data\processed_data\AVGO\4_2025-06-23.md'
Converted 'data\edgar_documents\AVGO\4_2025-06-25' --> 'data\processed_data\AVGO\4_2025-06-25.md'


2025-11-14 15:38:28,703 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:28,754 - INFO - Going to convert document batch...
2025-11-14 15:38:28,756 - INFO - Processing document 4_2025-06-26
2025-11-14 15:38:28,794 - INFO - Finished converting document 4_2025-06-26 in 0.12 sec.
2025-11-14 15:38:28,866 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:28,923 - INFO - Going to convert document batch...
2025-11-14 15:38:28,927 - INFO - Processing document 4_2025-06-27
2025-11-14 15:38:29,014 - INFO - Finished converting document 4_2025-06-27 in 0.17 sec.


Converted 'data\edgar_documents\AVGO\4_2025-06-26' --> 'data\processed_data\AVGO\4_2025-06-26.md'


2025-11-14 15:38:29,135 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:29,164 - INFO - Going to convert document batch...
2025-11-14 15:38:29,165 - INFO - Processing document 4_2025-06-30
2025-11-14 15:38:29,235 - INFO - Finished converting document 4_2025-06-30 in 0.12 sec.


Converted 'data\edgar_documents\AVGO\4_2025-06-27' --> 'data\processed_data\AVGO\4_2025-06-27.md'
Converted 'data\edgar_documents\AVGO\4_2025-06-30' --> 'data\processed_data\AVGO\4_2025-06-30.md'


2025-11-14 15:38:29,362 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:29,364 - ERROR - Input document 4_2025-07-07 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38:29,367 - INFO - Going to convert document batch...
2025-11-14 15:38:29,416 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:29,417 - ERROR - Input document 4_2025-07-09 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\AVGO\4_2025-07-07: File format not allowed: data\edgar_documents\AVGO\4_2025-07-07
Error processing data\edgar_documents\AVGO\4_2025-07-09: File format not allowed: data\edgar_documents\AVGO\4_2025-07-09
Converted 'data\edgar_documents\AVGO\4_2025-07-11' --> 'data\processed_data\AVGO\4_2025-07-11.md'


2025-11-14 15:38:29,577 - INFO - Going to convert document batch...
2025-11-14 15:38:29,578 - INFO - Processing document 4_2025-07-16
2025-11-14 15:38:29,616 - INFO - Finished converting document 4_2025-07-16 in 0.08 sec.
2025-11-14 15:38:29,673 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:29,690 - INFO - Going to convert document batch...
2025-11-14 15:38:29,694 - INFO - Processing document 4_2025-08-15
2025-11-14 15:38:29,741 - INFO - Finished converting document 4_2025-08-15 in 0.08 sec.
2025-11-14 15:38:29,829 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\4_2025-07-16' --> 'data\processed_data\AVGO\4_2025-07-16.md'
Converted 'data\edgar_documents\AVGO\4_2025-08-15' --> 'data\processed_data\AVGO\4_2025-08-15.md'


2025-11-14 15:38:29,861 - INFO - Going to convert document batch...
2025-11-14 15:38:29,864 - INFO - Processing document 4_2025-09-10
2025-11-14 15:38:29,951 - INFO - Finished converting document 4_2025-09-10 in 0.16 sec.
2025-11-14 15:38:30,033 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:30,062 - INFO - Going to convert document batch...
2025-11-14 15:38:30,064 - INFO - Processing document 4_2025-09-12
2025-11-14 15:38:30,148 - INFO - Finished converting document 4_2025-09-12 in 0.12 sec.


Converted 'data\edgar_documents\AVGO\4_2025-09-10' --> 'data\processed_data\AVGO\4_2025-09-10.md'
Converted 'data\edgar_documents\AVGO\4_2025-09-12' --> 'data\processed_data\AVGO\4_2025-09-12.md'


2025-11-14 15:38:30,231 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:30,266 - INFO - Going to convert document batch...
2025-11-14 15:38:30,268 - INFO - Processing document 4_2025-09-15
2025-11-14 15:38:30,390 - INFO - Finished converting document 4_2025-09-15 in 0.17 sec.
2025-11-14 15:38:30,484 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:30,507 - INFO - Going to convert document batch...
2025-11-14 15:38:30,508 - INFO - Processing document 4_2025-09-17
2025-11-14 15:38:30,550 - INFO - Finished converting document 4_2025-09-17 in 0.08 sec.
2025-11-14 15:38:30,634 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\4_2025-09-15' --> 'data\processed_data\AVGO\4_2025-09-15.md'
Converted 'data\edgar_documents\AVGO\4_2025-09-17' --> 'data\processed_data\AVGO\4_2025-09-17.md'


2025-11-14 15:38:30,697 - INFO - Going to convert document batch...
2025-11-14 15:38:30,698 - INFO - Processing document 4_2025-09-18
2025-11-14 15:38:30,844 - INFO - Finished converting document 4_2025-09-18 in 0.25 sec.
2025-11-14 15:38:30,988 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:30,989 - ERROR - Input document 4_2025-09-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38:30,991 - INFO - Going to convert document batch...
2025-11-14 15:38:31,016 - IN

Converted 'data\edgar_documents\AVGO\4_2025-09-18' --> 'data\processed_data\AVGO\4_2025-09-18.md'
Error processing data\edgar_documents\AVGO\4_2025-09-22: File format not allowed: data\edgar_documents\AVGO\4_2025-09-22
Error processing data\edgar_documents\AVGO\4_2025-09-24: File format not allowed: data\edgar_documents\AVGO\4_2025-09-24


2025-11-14 15:38:31,193 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:31,238 - INFO - Going to convert document batch...
2025-11-14 15:38:31,240 - INFO - Processing document 4_2025-09-26
2025-11-14 15:38:31,342 - INFO - Finished converting document 4_2025-09-26 in 0.17 sec.


Converted 'data\edgar_documents\AVGO\4_2025-09-25' --> 'data\processed_data\AVGO\4_2025-09-25.md'


2025-11-14 15:38:31,461 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:31,489 - INFO - Going to convert document batch...
2025-11-14 15:38:31,491 - INFO - Processing document 4_2025-10-16


Converted 'data\edgar_documents\AVGO\4_2025-09-26' --> 'data\processed_data\AVGO\4_2025-09-26.md'


2025-11-14 15:38:31,662 - INFO - Finished converting document 4_2025-10-16 in 0.22 sec.
2025-11-14 15:38:31,753 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:31,788 - INFO - Going to convert document batch...
2025-11-14 15:38:31,789 - INFO - Processing document 8-K_2023-03-02
2025-11-14 15:38:31,856 - INFO - Finished converting document 8-K_2023-03-02 in 0.12 sec.


Converted 'data\edgar_documents\AVGO\4_2025-10-16' --> 'data\processed_data\AVGO\4_2025-10-16.md'


2025-11-14 15:38:31,940 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:32,024 - INFO - Going to convert document batch...
2025-11-14 15:38:32,026 - INFO - Processing document 8-K_2023-04-06
2025-11-14 15:38:32,110 - INFO - Finished converting document 8-K_2023-04-06 in 0.19 sec.


Converted 'data\edgar_documents\AVGO\8-K_2023-03-02' --> 'data\processed_data\AVGO\8-K_2023-03-02.md'


2025-11-14 15:38:32,160 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:32,186 - INFO - Going to convert document batch...
2025-11-14 15:38:32,188 - INFO - Processing document 8-K_2023-05-23
2025-11-14 15:38:32,231 - INFO - Finished converting document 8-K_2023-05-23 in 0.09 sec.
2025-11-14 15:38:32,274 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:32,317 - INFO - Going to convert document batch...
2025-11-14 15:38:32,319 - INFO - Processing document 8-K_2023-06-01


Converted 'data\edgar_documents\AVGO\8-K_2023-04-06' --> 'data\processed_data\AVGO\8-K_2023-04-06.md'
Converted 'data\edgar_documents\AVGO\8-K_2023-05-23' --> 'data\processed_data\AVGO\8-K_2023-05-23.md'


2025-11-14 15:38:32,408 - INFO - Finished converting document 8-K_2023-06-01 in 0.14 sec.
2025-11-14 15:38:32,506 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:32,552 - INFO - Going to convert document batch...
2025-11-14 15:38:32,554 - INFO - Processing document 8-K_2023-08-16
2025-11-14 15:38:32,610 - INFO - Finished converting document 8-K_2023-08-16 in 0.14 sec.


Converted 'data\edgar_documents\AVGO\8-K_2023-06-01' --> 'data\processed_data\AVGO\8-K_2023-06-01.md'
Converted 'data\edgar_documents\AVGO\8-K_2023-08-16' --> 'data\processed_data\AVGO\8-K_2023-08-16.md'


2025-11-14 15:38:32,675 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:32,728 - INFO - Going to convert document batch...
2025-11-14 15:38:32,730 - INFO - Processing document 8-K_2023-08-31
2025-11-14 15:38:32,823 - INFO - Finished converting document 8-K_2023-08-31 in 0.19 sec.
2025-11-14 15:38:32,895 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:32,936 - INFO - Going to convert document batch...
2025-11-14 15:38:32,938 - INFO - Processing document 8-K_2023-10-18
2025-11-14 15:38:32,986 - INFO - Finished converting document 8-K_2023-10-18 in 0.11 sec.
2025-11-14 15:38:33,027 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\8-K_2023-08-31' --> 'data\processed_data\AVGO\8-K_2023-08-31.md'
Converted 'data\edgar_documents\AVGO\8-K_2023-10-18' --> 'data\processed_data\AVGO\8-K_2023-10-18.md'


2025-11-14 15:38:33,065 - INFO - Going to convert document batch...
2025-11-14 15:38:33,069 - INFO - Processing document 8-K_2023-10-30
2025-11-14 15:38:33,143 - INFO - Finished converting document 8-K_2023-10-30 in 0.12 sec.
2025-11-14 15:38:33,212 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:33,250 - INFO - Going to convert document batch...
2025-11-14 15:38:33,252 - INFO - Processing document 8-K_2023-11-22
2025-11-14 15:38:33,315 - INFO - Finished converting document 8-K_2023-11-22 in 0.14 sec.


Converted 'data\edgar_documents\AVGO\8-K_2023-10-30' --> 'data\processed_data\AVGO\8-K_2023-10-30.md'


2025-11-14 15:38:33,379 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:33,439 - INFO - Going to convert document batch...
2025-11-14 15:38:33,441 - INFO - Processing document 8-K_2023-12-07
2025-11-14 15:38:33,537 - INFO - Finished converting document 8-K_2023-12-07 in 0.17 sec.


Converted 'data\edgar_documents\AVGO\8-K_2023-11-22' --> 'data\processed_data\AVGO\8-K_2023-11-22.md'


2025-11-14 15:38:33,595 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:33,596 - ERROR - Input document 8-K_2024-02-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38:33,598 - INFO - Going to convert document batch...
2025-11-14 15:38:33,616 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:33,618 - ERROR - Input document 8-K_2024-02-09 with format None does 

Converted 'data\edgar_documents\AVGO\8-K_2023-12-07' --> 'data\processed_data\AVGO\8-K_2023-12-07.md'
Error processing data\edgar_documents\AVGO\8-K_2024-02-08: File format not allowed: data\edgar_documents\AVGO\8-K_2024-02-08
Error processing data\edgar_documents\AVGO\8-K_2024-02-09: File format not allowed: data\edgar_documents\AVGO\8-K_2024-02-09


2025-11-14 15:38:33,815 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:33,890 - INFO - Going to convert document batch...
2025-11-14 15:38:33,892 - INFO - Processing document 8-K_2024-04-24


Converted 'data\edgar_documents\AVGO\8-K_2024-03-07' --> 'data\processed_data\AVGO\8-K_2024-03-07.md'


2025-11-14 15:38:34,010 - INFO - Finished converting document 8-K_2024-04-24 in 0.23 sec.
2025-11-14 15:38:34,086 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:34,120 - INFO - Going to convert document batch...
2025-11-14 15:38:34,122 - INFO - Processing document 8-K_2024-06-12
2025-11-14 15:38:34,195 - INFO - Finished converting document 8-K_2024-06-12 in 0.12 sec.


Converted 'data\edgar_documents\AVGO\8-K_2024-04-24' --> 'data\processed_data\AVGO\8-K_2024-04-24.md'
Converted 'data\edgar_documents\AVGO\8-K_2024-06-12' --> 'data\processed_data\AVGO\8-K_2024-06-12.md'


2025-11-14 15:38:34,280 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:34,281 - ERROR - Input document 8-K_2024-07-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38:34,284 - INFO - Going to convert document batch...
2025-11-14 15:38:34,308 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:34,309 - ERROR - Input document 8-K_2024-07-12 with format None does 

Error processing data\edgar_documents\AVGO\8-K_2024-07-08: File format not allowed: data\edgar_documents\AVGO\8-K_2024-07-08
Error processing data\edgar_documents\AVGO\8-K_2024-07-12: File format not allowed: data\edgar_documents\AVGO\8-K_2024-07-12


2025-11-14 15:38:34,524 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:34,551 - INFO - Going to convert document batch...
2025-11-14 15:38:34,553 - INFO - Processing document 8-K_2024-10-02
2025-11-14 15:38:34,605 - INFO - Finished converting document 8-K_2024-10-02 in 0.11 sec.
2025-11-14 15:38:34,654 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:34,682 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AVGO\8-K_2024-09-05' --> 'data\processed_data\AVGO\8-K_2024-09-05.md'
Converted 'data\edgar_documents\AVGO\8-K_2024-10-02' --> 'data\processed_data\AVGO\8-K_2024-10-02.md'


2025-11-14 15:38:34,683 - INFO - Processing document 8-K_2024-12-12
2025-11-14 15:38:34,746 - INFO - Finished converting document 8-K_2024-12-12 in 0.12 sec.
2025-11-14 15:38:34,802 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:34,825 - INFO - Going to convert document batch...
2025-11-14 15:38:34,826 - INFO - Processing document 8-K_2025-01-10
2025-11-14 15:38:34,864 - INFO - Finished converting document 8-K_2025-01-10 in 0.08 sec.
2025-11-14 15:38:34,902 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:34,928 - INFO - Going to convert document batch...
2025-11-14 15:38:34,929 - INFO - Processing document 8-K_2025-01-13


Converted 'data\edgar_documents\AVGO\8-K_2024-12-12' --> 'data\processed_data\AVGO\8-K_2024-12-12.md'
Converted 'data\edgar_documents\AVGO\8-K_2025-01-10' --> 'data\processed_data\AVGO\8-K_2025-01-10.md'


2025-11-14 15:38:35,480 - INFO - Finished converting document 8-K_2025-01-13 in 0.59 sec.
2025-11-14 15:38:35,515 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:35,547 - INFO - Going to convert document batch...
2025-11-14 15:38:35,549 - INFO - Processing document 8-K_2025-03-06
2025-11-14 15:38:35,630 - INFO - Finished converting document 8-K_2025-03-06 in 0.12 sec.


Converted 'data\edgar_documents\AVGO\8-K_2025-01-13' --> 'data\processed_data\AVGO\8-K_2025-01-13.md'
Converted 'data\edgar_documents\AVGO\8-K_2025-03-06' --> 'data\processed_data\AVGO\8-K_2025-03-06.md'


2025-11-14 15:38:35,708 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:35,767 - INFO - Going to convert document batch...
2025-11-14 15:38:35,768 - INFO - Processing document 8-K_2025-04-22
2025-11-14 15:38:35,849 - INFO - Finished converting document 8-K_2025-04-22 in 0.17 sec.
2025-11-14 15:38:35,928 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:35,971 - INFO - Going to convert document batch...
2025-11-14 15:38:35,973 - INFO - Processing document 8-K_2025-06-05
2025-11-14 15:38:36,034 - INFO - Finished converting document 8-K_2025-06-05 in 0.12 sec.


Converted 'data\edgar_documents\AVGO\8-K_2025-04-22' --> 'data\processed_data\AVGO\8-K_2025-04-22.md'
Converted 'data\edgar_documents\AVGO\8-K_2025-06-05' --> 'data\processed_data\AVGO\8-K_2025-06-05.md'


2025-11-14 15:38:36,133 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:36,173 - INFO - Going to convert document batch...
2025-11-14 15:38:36,176 - INFO - Processing document 8-K_2025-07-11
2025-11-14 15:38:36,234 - INFO - Finished converting document 8-K_2025-07-11 in 0.14 sec.
2025-11-14 15:38:36,276 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:36,299 - INFO - Going to convert document batch...
2025-11-14 15:38:36,300 - INFO - Processing document 8-K_2025-09-04
2025-11-14 15:38:36,350 - INFO - Finished converting document 8-K_2025-09-04 in 0.08 sec.
2025-11-14 15:38:36,417 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:36,462 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AVGO\8-K_2025-07-11' --> 'data\processed_data\AVGO\8-K_2025-07-11.md'
Converted 'data\edgar_documents\AVGO\8-K_2025-09-04' --> 'data\processed_data\AVGO\8-K_2025-09-04.md'


2025-11-14 15:38:36,465 - INFO - Processing document 8-K_2025-09-09
2025-11-14 15:38:36,516 - INFO - Finished converting document 8-K_2025-09-09 in 0.14 sec.
2025-11-14 15:38:36,577 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:36,607 - INFO - Going to convert document batch...
2025-11-14 15:38:36,610 - INFO - Processing document 8-K_2025-09-10
2025-11-14 15:38:36,649 - INFO - Finished converting document 8-K_2025-09-10 in 0.09 sec.
2025-11-14 15:38:36,697 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:36,740 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AVGO\8-K_2025-09-09' --> 'data\processed_data\AVGO\8-K_2025-09-09.md'
Converted 'data\edgar_documents\AVGO\8-K_2025-09-10' --> 'data\processed_data\AVGO\8-K_2025-09-10.md'


2025-11-14 15:38:36,741 - INFO - Processing document 8-K_2025-09-29
2025-11-14 15:38:36,796 - INFO - Finished converting document 8-K_2025-09-29 in 0.14 sec.
2025-11-14 15:38:36,869 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:36,871 - ERROR - Input document DEF-14A_2023-02-17 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38:36,874 - INFO - Going to convert document batch...
2025-11-14 15:38:36,966 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AVGO\8-K_2025-09-29' --> 'data\processed_data\AVGO\8-K_2025-09-29.md'
Error processing data\edgar_documents\AVGO\DEF-14A_2023-02-17: File format not allowed: data\edgar_documents\AVGO\DEF-14A_2023-02-17


2025-11-14 15:38:37,777 - INFO - Going to convert document batch...
2025-11-14 15:38:37,778 - INFO - Processing document DEF-14A_2024-02-26
2025-11-14 15:38:42,627 - INFO - Finished converting document DEF-14A_2024-02-26 in 5.75 sec.
2025-11-14 15:38:44,075 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:38:44,077 - ERROR - Input document DEF-14A_2025-03-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:38:44,082 - INFO - Going to 

Converted 'data\edgar_documents\AVGO\DEF-14A_2024-02-26' --> 'data\processed_data\AVGO\DEF-14A_2024-02-26.md'
Error processing data\edgar_documents\AVGO\DEF-14A_2025-03-03: File format not allowed: data\edgar_documents\AVGO\DEF-14A_2025-03-03
Processed 123 new files. Errors: 33
Found 169 files to process in data\edgar_documents\AXP


2025-11-14 15:38:44,240 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:38:47,369 - INFO - Going to convert document batch...
2025-11-14 15:38:47,371 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:38:47,372 - INFO - Processing document 10-K_2023-02-10
2025-11-14 15:38:55,893 - INFO - Finished converting document 10-K_2023-02-10 in 11.78 sec.
2025-11-14 15:38:58,712 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\10-K_2023-02-10' --> 'data\processed_data\AXP\10-K_2023-02-10.md'


2025-11-14 15:39:02,351 - INFO - Going to convert document batch...
2025-11-14 15:39:02,353 - INFO - Processing document 10-K_2024-02-09
2025-11-14 15:39:10,848 - INFO - Finished converting document 10-K_2024-02-09 in 12.24 sec.
2025-11-14 15:39:14,796 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\10-K_2024-02-09' --> 'data\processed_data\AXP\10-K_2024-02-09.md'


2025-11-14 15:39:18,675 - INFO - Going to convert document batch...
2025-11-14 15:39:18,677 - INFO - Processing document 10-K_2025-02-07
2025-11-14 15:39:25,623 - INFO - Finished converting document 10-K_2025-02-07 in 10.98 sec.
2025-11-14 15:39:28,565 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\10-K_2025-02-07' --> 'data\processed_data\AXP\10-K_2025-02-07.md'


2025-11-14 15:39:30,140 - INFO - Going to convert document batch...
2025-11-14 15:39:30,141 - INFO - Processing document 10-Q_2023-04-21
2025-11-14 15:39:33,239 - INFO - Finished converting document 10-Q_2023-04-21 in 4.75 sec.
2025-11-14 15:39:34,618 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\10-Q_2023-04-21' --> 'data\processed_data\AXP\10-Q_2023-04-21.md'


2025-11-14 15:39:37,886 - INFO - Going to convert document batch...
2025-11-14 15:39:37,888 - INFO - Processing document 10-Q_2023-07-25
2025-11-14 15:39:42,121 - INFO - Finished converting document 10-Q_2023-07-25 in 7.58 sec.
2025-11-14 15:39:44,034 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\10-Q_2023-07-25' --> 'data\processed_data\AXP\10-Q_2023-07-25.md'


2025-11-14 15:39:46,556 - INFO - Going to convert document batch...
2025-11-14 15:39:46,558 - INFO - Processing document 10-Q_2023-10-20
2025-11-14 15:39:50,003 - INFO - Finished converting document 10-Q_2023-10-20 in 6.03 sec.
2025-11-14 15:39:52,681 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\10-Q_2023-10-20' --> 'data\processed_data\AXP\10-Q_2023-10-20.md'


2025-11-14 15:39:54,173 - INFO - Going to convert document batch...
2025-11-14 15:39:54,174 - INFO - Processing document 10-Q_2024-04-19
2025-11-14 15:39:57,332 - INFO - Finished converting document 10-Q_2024-04-19 in 4.69 sec.
2025-11-14 15:39:58,837 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\10-Q_2024-04-19' --> 'data\processed_data\AXP\10-Q_2024-04-19.md'


2025-11-14 15:40:00,586 - INFO - Going to convert document batch...
2025-11-14 15:40:00,587 - INFO - Processing document 10-Q_2024-07-19
2025-11-14 15:40:02,024 - INFO - Finished converting document 10-Q_2024-07-19 in 3.28 sec.
2025-11-14 15:40:02,674 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\10-Q_2024-07-19' --> 'data\processed_data\AXP\10-Q_2024-07-19.md'


2025-11-14 15:40:03,648 - INFO - Going to convert document batch...
2025-11-14 15:40:03,649 - INFO - Processing document 10-Q_2024-10-18
2025-11-14 15:40:05,149 - INFO - Finished converting document 10-Q_2024-10-18 in 2.52 sec.
2025-11-14 15:40:05,857 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\10-Q_2024-10-18' --> 'data\processed_data\AXP\10-Q_2024-10-18.md'


2025-11-14 15:40:06,881 - INFO - Going to convert document batch...
2025-11-14 15:40:06,881 - INFO - Processing document 10-Q_2025-04-18
2025-11-14 15:40:08,114 - INFO - Finished converting document 10-Q_2025-04-18 in 2.30 sec.
2025-11-14 15:40:08,771 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\10-Q_2025-04-18' --> 'data\processed_data\AXP\10-Q_2025-04-18.md'


2025-11-14 15:40:09,964 - INFO - Going to convert document batch...
2025-11-14 15:40:09,965 - INFO - Processing document 10-Q_2025-07-18
2025-11-14 15:40:11,501 - INFO - Finished converting document 10-Q_2025-07-18 in 2.80 sec.
2025-11-14 15:40:12,265 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\10-Q_2025-07-18' --> 'data\processed_data\AXP\10-Q_2025-07-18.md'


2025-11-14 15:40:13,335 - INFO - Going to convert document batch...
2025-11-14 15:40:13,336 - INFO - Processing document 10-Q_2025-10-17
2025-11-14 15:40:16,724 - INFO - Finished converting document 10-Q_2025-10-17 in 4.52 sec.
2025-11-14 15:40:18,478 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:18,508 - INFO - Going to convert document batch...
2025-11-14 15:40:18,509 - INFO - Processing document 4_2023-01-04
2025-11-14 15:40:18,557 - INFO - Finished converting document 4_2023-01-04 in 0.12 sec.
2025-11-14 15:40:18,643 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\10-Q_2025-10-17' --> 'data\processed_data\AXP\10-Q_2025-10-17.md'
Converted 'data\edgar_documents\AXP\4_2023-01-04' --> 'data\processed_data\AXP\4_2023-01-04.md'


2025-11-14 15:40:18,664 - INFO - Going to convert document batch...
2025-11-14 15:40:18,666 - INFO - Processing document 4_2023-01-31
2025-11-14 15:40:18,731 - INFO - Finished converting document 4_2023-01-31 in 0.12 sec.
2025-11-14 15:40:18,822 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:18,848 - INFO - Going to convert document batch...
2025-11-14 15:40:18,849 - INFO - Processing document 4_2023-02-01
2025-11-14 15:40:18,956 - INFO - Finished converting document 4_2023-02-01 in 0.16 sec.


Converted 'data\edgar_documents\AXP\4_2023-01-31' --> 'data\processed_data\AXP\4_2023-01-31.md'


2025-11-14 15:40:19,042 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:19,043 - ERROR - Input document 4_2023-02-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:40:19,046 - INFO - Going to convert document batch...
2025-11-14 15:40:19,069 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:19,070 - ERROR - Input document 4_2023-02-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\AXP\4_2023-02-01' --> 'data\processed_data\AXP\4_2023-02-01.md'
Error processing data\edgar_documents\AXP\4_2023-02-13: File format not allowed: data\edgar_documents\AXP\4_2023-02-13
Error processing data\edgar_documents\AXP\4_2023-02-14: File format not allowed: data\edgar_documents\AXP\4_2023-02-14
Converted 'data\edgar_documents\AXP\4_2023-02-16' --> 'data\processed_data\AXP\4_2023-02-16.md'


2025-11-14 15:40:19,231 - INFO - Going to convert document batch...
2025-11-14 15:40:19,232 - INFO - Processing document 4_2023-02-21
2025-11-14 15:40:19,285 - INFO - Finished converting document 4_2023-02-21 in 0.09 sec.
2025-11-14 15:40:19,341 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:19,355 - INFO - Going to convert document batch...
2025-11-14 15:40:19,356 - INFO - Processing document 4_2023-03-06
2025-11-14 15:40:19,390 - INFO - Finished converting document 4_2023-03-06 in 0.06 sec.
2025-11-14 15:40:19,454 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:19,474 - INFO - Going to convert document batch...
2025-11-14 15:40:19,475 - INFO - Processing document 4_2023-03-10


Converted 'data\edgar_documents\AXP\4_2023-02-21' --> 'data\processed_data\AXP\4_2023-02-21.md'
Converted 'data\edgar_documents\AXP\4_2023-03-06' --> 'data\processed_data\AXP\4_2023-03-06.md'


2025-11-14 15:40:19,521 - INFO - Finished converting document 4_2023-03-10 in 0.09 sec.
2025-11-14 15:40:19,577 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:19,597 - INFO - Going to convert document batch...
2025-11-14 15:40:19,598 - INFO - Processing document 4_2023-04-04
2025-11-14 15:40:19,642 - INFO - Finished converting document 4_2023-04-04 in 0.08 sec.


Converted 'data\edgar_documents\AXP\4_2023-03-10' --> 'data\processed_data\AXP\4_2023-03-10.md'
Converted 'data\edgar_documents\AXP\4_2023-04-04' --> 'data\processed_data\AXP\4_2023-04-04.md'


2025-11-14 15:40:19,762 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:19,764 - ERROR - Input document 4_2023-04-26 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:40:19,766 - INFO - Going to convert document batch...
2025-11-14 15:40:19,807 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:19,808 - ERROR - Input document 4_2023-04-27 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\AXP\4_2023-04-26: File format not allowed: data\edgar_documents\AXP\4_2023-04-26
Error processing data\edgar_documents\AXP\4_2023-04-27: File format not allowed: data\edgar_documents\AXP\4_2023-04-27
Converted 'data\edgar_documents\AXP\4_2023-05-02' --> 'data\processed_data\AXP\4_2023-05-02.md'


2025-11-14 15:40:19,995 - INFO - Going to convert document batch...
2025-11-14 15:40:19,997 - INFO - Processing document 4_2023-05-04
2025-11-14 15:40:20,040 - INFO - Finished converting document 4_2023-05-04 in 0.08 sec.
2025-11-14 15:40:20,119 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:20,138 - INFO - Going to convert document batch...
2025-11-14 15:40:20,139 - INFO - Processing document 4_2023-05-22
2025-11-14 15:40:20,182 - INFO - Finished converting document 4_2023-05-22 in 0.09 sec.
2025-11-14 15:40:20,243 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:20,258 - INFO - Going to convert document batch...
2025-11-14 15:40:20,259 - INFO - Processing document 4_2023-07-05


Converted 'data\edgar_documents\AXP\4_2023-05-04' --> 'data\processed_data\AXP\4_2023-05-04.md'
Converted 'data\edgar_documents\AXP\4_2023-05-22' --> 'data\processed_data\AXP\4_2023-05-22.md'


2025-11-14 15:40:20,303 - INFO - Finished converting document 4_2023-07-05 in 0.06 sec.
2025-11-14 15:40:20,366 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:20,399 - INFO - Going to convert document batch...
2025-11-14 15:40:20,400 - INFO - Processing document 4_2023-07-11
2025-11-14 15:40:20,474 - INFO - Finished converting document 4_2023-07-11 in 0.11 sec.


Converted 'data\edgar_documents\AXP\4_2023-07-05' --> 'data\processed_data\AXP\4_2023-07-05.md'
Converted 'data\edgar_documents\AXP\4_2023-07-11' --> 'data\processed_data\AXP\4_2023-07-11.md'


2025-11-14 15:40:20,597 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:20,598 - ERROR - Input document 4_2023-07-25 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:40:20,600 - INFO - Going to convert document batch...
2025-11-14 15:40:20,627 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:20,628 - ERROR - Input document 4_2023-07-27 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\AXP\4_2023-07-25: File format not allowed: data\edgar_documents\AXP\4_2023-07-25
Error processing data\edgar_documents\AXP\4_2023-07-27: File format not allowed: data\edgar_documents\AXP\4_2023-07-27
Converted 'data\edgar_documents\AXP\4_2023-08-01' --> 'data\processed_data\AXP\4_2023-08-01.md'


2025-11-14 15:40:20,786 - INFO - Processing document 4_2023-10-03
2025-11-14 15:40:20,843 - INFO - Finished converting document 4_2023-10-03 in 0.09 sec.
2025-11-14 15:40:20,934 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:20,935 - ERROR - Input document 4_2023-10-24 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:40:20,937 - INFO - Going to convert document batch...
2025-11-14 15:40:20,959 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-1

Converted 'data\edgar_documents\AXP\4_2023-10-03' --> 'data\processed_data\AXP\4_2023-10-03.md'
Error processing data\edgar_documents\AXP\4_2023-10-24: File format not allowed: data\edgar_documents\AXP\4_2023-10-24
Error processing data\edgar_documents\AXP\4_2023-10-25: File format not allowed: data\edgar_documents\AXP\4_2023-10-25


2025-11-14 15:40:21,109 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:21,129 - INFO - Going to convert document batch...
2025-11-14 15:40:21,130 - INFO - Processing document 4_2023-11-30
2025-11-14 15:40:21,171 - INFO - Finished converting document 4_2023-11-30 in 0.08 sec.
2025-11-14 15:40:21,240 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:21,256 - INFO - Going to convert document batch...
2025-11-14 15:40:21,258 - INFO - Processing document 4_2024-01-03


Converted 'data\edgar_documents\AXP\4_2023-11-17' --> 'data\processed_data\AXP\4_2023-11-17.md'
Converted 'data\edgar_documents\AXP\4_2023-11-30' --> 'data\processed_data\AXP\4_2023-11-30.md'


2025-11-14 15:40:21,303 - INFO - Finished converting document 4_2024-01-03 in 0.08 sec.
2025-11-14 15:40:21,365 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:21,383 - INFO - Going to convert document batch...
2025-11-14 15:40:21,384 - INFO - Processing document 4_2024-01-30
2025-11-14 15:40:21,425 - INFO - Finished converting document 4_2024-01-30 in 0.08 sec.
2025-11-14 15:40:21,498 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:21,542 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AXP\4_2024-01-03' --> 'data\processed_data\AXP\4_2024-01-03.md'
Converted 'data\edgar_documents\AXP\4_2024-01-30' --> 'data\processed_data\AXP\4_2024-01-30.md'


2025-11-14 15:40:21,544 - INFO - Processing document 4_2024-01-31
2025-11-14 15:40:21,630 - INFO - Finished converting document 4_2024-01-31 in 0.16 sec.
2025-11-14 15:40:21,692 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:21,709 - INFO - Going to convert document batch...
2025-11-14 15:40:21,711 - INFO - Processing document 4_2024-02-05
2025-11-14 15:40:21,756 - INFO - Finished converting document 4_2024-02-05 in 0.06 sec.
2025-11-14 15:40:21,815 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:21,836 - INFO - Going to convert document batch...
2025-11-14 15:40:21,838 - INFO - Processing document 4_2024-02-12


Converted 'data\edgar_documents\AXP\4_2024-01-31' --> 'data\processed_data\AXP\4_2024-01-31.md'
Converted 'data\edgar_documents\AXP\4_2024-02-05' --> 'data\processed_data\AXP\4_2024-02-05.md'


2025-11-14 15:40:21,890 - INFO - Finished converting document 4_2024-02-12 in 0.09 sec.
2025-11-14 15:40:21,982 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:21,983 - ERROR - Input document 4_2024-02-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:40:21,988 - INFO - Going to convert document batch...
2025-11-14 15:40:22,017 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:22,043 - INFO - Going to convert document batch...
2025-11-14 15:

Converted 'data\edgar_documents\AXP\4_2024-02-12' --> 'data\processed_data\AXP\4_2024-02-12.md'
Error processing data\edgar_documents\AXP\4_2024-02-13: File format not allowed: data\edgar_documents\AXP\4_2024-02-13
Converted 'data\edgar_documents\AXP\4_2024-02-14' --> 'data\processed_data\AXP\4_2024-02-14.md'


2025-11-14 15:40:22,165 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:22,183 - INFO - Going to convert document batch...
2025-11-14 15:40:22,185 - INFO - Processing document 4_2024-02-22
2025-11-14 15:40:22,231 - INFO - Finished converting document 4_2024-02-22 in 0.09 sec.
2025-11-14 15:40:22,301 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:22,333 - INFO - Going to convert document batch...
2025-11-14 15:40:22,335 - INFO - Processing document 4_2024-03-04
2025-11-14 15:40:22,398 - INFO - Finished converting document 4_2024-03-04 in 0.11 sec.
2025-11-14 15:40:22,457 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:22,483 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AXP\4_2024-02-22' --> 'data\processed_data\AXP\4_2024-02-22.md'
Converted 'data\edgar_documents\AXP\4_2024-03-04' --> 'data\processed_data\AXP\4_2024-03-04.md'


2025-11-14 15:40:22,484 - INFO - Processing document 4_2024-03-11
2025-11-14 15:40:22,542 - INFO - Finished converting document 4_2024-03-11 in 0.11 sec.
2025-11-14 15:40:22,592 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:22,612 - INFO - Going to convert document batch...
2025-11-14 15:40:22,614 - INFO - Processing document 4_2024-04-02
2025-11-14 15:40:22,652 - INFO - Finished converting document 4_2024-04-02 in 0.08 sec.
2025-11-14 15:40:22,723 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:22,724 - ERROR - Input document 4_2024-04-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, 

Converted 'data\edgar_documents\AXP\4_2024-03-11' --> 'data\processed_data\AXP\4_2024-03-11.md'
Converted 'data\edgar_documents\AXP\4_2024-04-02' --> 'data\processed_data\AXP\4_2024-04-02.md'
Error processing data\edgar_documents\AXP\4_2024-04-23: File format not allowed: data\edgar_documents\AXP\4_2024-04-23


2025-11-14 15:40:22,769 - INFO - Going to convert document batch...
2025-11-14 15:40:22,771 - INFO - Processing document 4_2024-04-25
2025-11-14 15:40:22,818 - INFO - Finished converting document 4_2024-04-25 in 0.09 sec.
2025-11-14 15:40:22,874 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:22,893 - INFO - Going to convert document batch...
2025-11-14 15:40:22,894 - INFO - Processing document 4_2024-05-02
2025-11-14 15:40:22,952 - INFO - Finished converting document 4_2024-05-02 in 0.09 sec.
2025-11-14 15:40:23,030 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\4_2024-04-25' --> 'data\processed_data\AXP\4_2024-04-25.md'
Converted 'data\edgar_documents\AXP\4_2024-05-02' --> 'data\processed_data\AXP\4_2024-05-02.md'


2025-11-14 15:40:23,061 - INFO - Going to convert document batch...
2025-11-14 15:40:23,063 - INFO - Processing document 4_2024-05-06
2025-11-14 15:40:23,124 - INFO - Finished converting document 4_2024-05-06 in 0.11 sec.
2025-11-14 15:40:23,183 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:23,200 - INFO - Going to convert document batch...
2025-11-14 15:40:23,202 - INFO - Processing document 4_2024-05-07
2025-11-14 15:40:23,245 - INFO - Finished converting document 4_2024-05-07 in 0.08 sec.
2025-11-14 15:40:23,302 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:23,318 - INFO - Going to convert document batch...
2025-11-14 15:40:23,320 - INFO - Processing document 4_2024-05-08


Converted 'data\edgar_documents\AXP\4_2024-05-06' --> 'data\processed_data\AXP\4_2024-05-06.md'
Converted 'data\edgar_documents\AXP\4_2024-05-07' --> 'data\processed_data\AXP\4_2024-05-07.md'


2025-11-14 15:40:23,369 - INFO - Finished converting document 4_2024-05-08 in 0.08 sec.
2025-11-14 15:40:23,433 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:23,514 - INFO - Going to convert document batch...
2025-11-14 15:40:23,517 - INFO - Processing document 4_2024-05-13
2025-11-14 15:40:23,610 - INFO - Finished converting document 4_2024-05-13 in 0.19 sec.


Converted 'data\edgar_documents\AXP\4_2024-05-08' --> 'data\processed_data\AXP\4_2024-05-08.md'


2025-11-14 15:40:23,780 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:23,805 - INFO - Going to convert document batch...
2025-11-14 15:40:23,807 - INFO - Processing document 4_2024-05-21
2025-11-14 15:40:23,860 - INFO - Finished converting document 4_2024-05-21 in 0.20 sec.


Converted 'data\edgar_documents\AXP\4_2024-05-13' --> 'data\processed_data\AXP\4_2024-05-13.md'


2025-11-14 15:40:23,966 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:23,984 - INFO - Going to convert document batch...
2025-11-14 15:40:23,985 - INFO - Processing document 4_2024-05-23
2025-11-14 15:40:24,032 - INFO - Finished converting document 4_2024-05-23 in 0.12 sec.
2025-11-14 15:40:24,105 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\4_2024-05-21' --> 'data\processed_data\AXP\4_2024-05-21.md'
Converted 'data\edgar_documents\AXP\4_2024-05-23' --> 'data\processed_data\AXP\4_2024-05-23.md'


2025-11-14 15:40:24,122 - INFO - Going to convert document batch...
2025-11-14 15:40:24,123 - INFO - Processing document 4_2024-06-17
2025-11-14 15:40:24,161 - INFO - Finished converting document 4_2024-06-17 in 0.06 sec.
2025-11-14 15:40:24,214 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:24,231 - INFO - Going to convert document batch...
2025-11-14 15:40:24,232 - INFO - Processing document 4_2024-07-02
2025-11-14 15:40:24,272 - INFO - Finished converting document 4_2024-07-02 in 0.06 sec.
2025-11-14 15:40:24,376 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:24,379 - ERROR - Input document 4_2024-07-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <Input

Converted 'data\edgar_documents\AXP\4_2024-06-17' --> 'data\processed_data\AXP\4_2024-06-17.md'
Converted 'data\edgar_documents\AXP\4_2024-07-02' --> 'data\processed_data\AXP\4_2024-07-02.md'


2025-11-14 15:40:24,402 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:24,430 - INFO - Going to convert document batch...
2025-11-14 15:40:24,433 - INFO - Processing document 4_2024-10-02
2025-11-14 15:40:24,487 - INFO - Finished converting document 4_2024-10-02 in 0.09 sec.


Error processing data\edgar_documents\AXP\4_2024-07-23: File format not allowed: data\edgar_documents\AXP\4_2024-07-23
Converted 'data\edgar_documents\AXP\4_2024-10-02' --> 'data\processed_data\AXP\4_2024-10-02.md'


2025-11-14 15:40:24,585 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:24,650 - INFO - Going to convert document batch...
2025-11-14 15:40:24,651 - INFO - Processing document 4_2024-10-24
2025-11-14 15:40:24,725 - INFO - Finished converting document 4_2024-10-24 in 0.17 sec.
2025-11-14 15:40:24,789 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:24,825 - INFO - Going to convert document batch...
2025-11-14 15:40:24,827 - INFO - Processing document 4_2024-10-31
2025-11-14 15:40:24,875 - INFO - Finished converting document 4_2024-10-31 in 0.11 sec.


Converted 'data\edgar_documents\AXP\4_2024-10-24' --> 'data\processed_data\AXP\4_2024-10-24.md'
Converted 'data\edgar_documents\AXP\4_2024-10-31' --> 'data\processed_data\AXP\4_2024-10-31.md'


2025-11-14 15:40:24,970 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:24,991 - INFO - Going to convert document batch...
2025-11-14 15:40:24,993 - INFO - Processing document 4_2024-11-08
2025-11-14 15:40:25,039 - INFO - Finished converting document 4_2024-11-08 in 0.09 sec.
2025-11-14 15:40:25,100 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:25,136 - INFO - Going to convert document batch...
2025-11-14 15:40:25,138 - INFO - Processing document 4_2024-11-12
2025-11-14 15:40:25,210 - INFO - Finished converting document 4_2024-11-12 in 0.12 sec.
2025-11-14 15:40:25,274 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\4_2024-11-08' --> 'data\processed_data\AXP\4_2024-11-08.md'
Converted 'data\edgar_documents\AXP\4_2024-11-12' --> 'data\processed_data\AXP\4_2024-11-12.md'


2025-11-14 15:40:25,295 - INFO - Going to convert document batch...
2025-11-14 15:40:25,298 - INFO - Processing document 4_2024-11-25
2025-11-14 15:40:25,337 - INFO - Finished converting document 4_2024-11-25 in 0.06 sec.
2025-11-14 15:40:25,392 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:25,413 - INFO - Going to convert document batch...
2025-11-14 15:40:25,414 - INFO - Processing document 4_2024-12-02
2025-11-14 15:40:25,458 - INFO - Finished converting document 4_2024-12-02 in 0.08 sec.
2025-11-14 15:40:25,560 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\4_2024-11-25' --> 'data\processed_data\AXP\4_2024-11-25.md'
Converted 'data\edgar_documents\AXP\4_2024-12-02' --> 'data\processed_data\AXP\4_2024-12-02.md'


2025-11-14 15:40:25,603 - INFO - Going to convert document batch...
2025-11-14 15:40:25,609 - INFO - Processing document 4_2025-01-03
2025-11-14 15:40:25,672 - INFO - Finished converting document 4_2025-01-03 in 0.14 sec.
2025-11-14 15:40:25,738 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:25,739 - ERROR - Input document 4_2025-01-29 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:40:25,740 - INFO - Going to convert document batch...
2025-11-14 15:40:25,763 - IN

Converted 'data\edgar_documents\AXP\4_2025-01-03' --> 'data\processed_data\AXP\4_2025-01-03.md'
Error processing data\edgar_documents\AXP\4_2025-01-29: File format not allowed: data\edgar_documents\AXP\4_2025-01-29


2025-11-14 15:40:25,961 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:25,999 - INFO - Going to convert document batch...
2025-11-14 15:40:26,002 - INFO - Processing document 4_2025-02-06
2025-11-14 15:40:26,056 - INFO - Finished converting document 4_2025-02-06 in 0.12 sec.


Converted 'data\edgar_documents\AXP\4_2025-01-30' --> 'data\processed_data\AXP\4_2025-01-30.md'


2025-11-14 15:40:26,143 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:26,186 - INFO - Going to convert document batch...
2025-11-14 15:40:26,187 - INFO - Processing document 4_2025-02-10
2025-11-14 15:40:26,235 - INFO - Finished converting document 4_2025-02-10 in 0.11 sec.
2025-11-14 15:40:26,312 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\4_2025-02-06' --> 'data\processed_data\AXP\4_2025-02-06.md'
Converted 'data\edgar_documents\AXP\4_2025-02-10' --> 'data\processed_data\AXP\4_2025-02-10.md'


2025-11-14 15:40:26,328 - INFO - Going to convert document batch...
2025-11-14 15:40:26,331 - INFO - Processing document 4_2025-02-13
2025-11-14 15:40:26,378 - INFO - Finished converting document 4_2025-02-13 in 0.09 sec.
2025-11-14 15:40:26,451 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:26,485 - INFO - Going to convert document batch...
2025-11-14 15:40:26,487 - INFO - Processing document 4_2025-02-28
2025-11-14 15:40:26,552 - INFO - Finished converting document 4_2025-02-28 in 0.12 sec.
2025-11-14 15:40:26,604 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\4_2025-02-13' --> 'data\processed_data\AXP\4_2025-02-13.md'
Converted 'data\edgar_documents\AXP\4_2025-02-28' --> 'data\processed_data\AXP\4_2025-02-28.md'


2025-11-14 15:40:26,632 - INFO - Going to convert document batch...
2025-11-14 15:40:26,633 - INFO - Processing document 4_2025-03-06
2025-11-14 15:40:26,693 - INFO - Finished converting document 4_2025-03-06 in 0.09 sec.
2025-11-14 15:40:26,788 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:26,813 - INFO - Going to convert document batch...
2025-11-14 15:40:26,814 - INFO - Processing document 4_2025-03-11
2025-11-14 15:40:26,882 - INFO - Finished converting document 4_2025-03-11 in 0.09 sec.
2025-11-14 15:40:26,967 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\4_2025-03-06' --> 'data\processed_data\AXP\4_2025-03-06.md'
Converted 'data\edgar_documents\AXP\4_2025-03-11' --> 'data\processed_data\AXP\4_2025-03-11.md'


2025-11-14 15:40:26,993 - INFO - Going to convert document batch...
2025-11-14 15:40:26,995 - INFO - Processing document 4_2025-04-02
2025-11-14 15:40:27,041 - INFO - Finished converting document 4_2025-04-02 in 0.09 sec.
2025-11-14 15:40:27,109 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:27,111 - ERROR - Input document 4_2025-04-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:40:27,112 - INFO - Going to convert document batch...
2025-11-14 15:40:27,128 - IN

Converted 'data\edgar_documents\AXP\4_2025-04-02' --> 'data\processed_data\AXP\4_2025-04-02.md'
Error processing data\edgar_documents\AXP\4_2025-04-22: File format not allowed: data\edgar_documents\AXP\4_2025-04-22
Converted 'data\edgar_documents\AXP\4_2025-04-30' --> 'data\processed_data\AXP\4_2025-04-30.md'


2025-11-14 15:40:27,265 - INFO - Going to convert document batch...
2025-11-14 15:40:27,268 - INFO - Processing document 4_2025-05-01
2025-11-14 15:40:27,315 - INFO - Finished converting document 4_2025-05-01 in 0.08 sec.
2025-11-14 15:40:27,385 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:27,409 - INFO - Going to convert document batch...
2025-11-14 15:40:27,410 - INFO - Processing document 4_2025-05-07
2025-11-14 15:40:27,457 - INFO - Finished converting document 4_2025-05-07 in 0.09 sec.
2025-11-14 15:40:27,554 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\AXP\4_2025-05-01' --> 'data\processed_data\AXP\4_2025-05-01.md'
Converted 'data\edgar_documents\AXP\4_2025-05-07' --> 'data\processed_data\AXP\4_2025-05-07.md'


2025-11-14 15:40:27,555 - ERROR - Input document 4_2025-05-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:40:27,558 - INFO - Going to convert document batch...
2025-11-14 15:40:27,590 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:27,591 - ERROR - Input document 4_2025-05-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\AXP\4_2025-05-13: File format not allowed: data\edgar_documents\AXP\4_2025-05-13
Error processing data\edgar_documents\AXP\4_2025-05-14: File format not allowed: data\edgar_documents\AXP\4_2025-05-14
Converted 'data\edgar_documents\AXP\4_2025-05-21' --> 'data\processed_data\AXP\4_2025-05-21.md'


2025-11-14 15:40:27,862 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:27,863 - ERROR - Input document 4_2025-07-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:40:27,866 - INFO - Going to convert document batch...
2025-11-14 15:40:27,893 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:27,923 - INFO - Going to convert document batch...
2025-11-14 15:40:27,924 - INFO - Processing document 4_2025-07-31
2025-11-14 15:40:27,985 - INFO - Fin

Converted 'data\edgar_documents\AXP\4_2025-07-02' --> 'data\processed_data\AXP\4_2025-07-02.md'
Error processing data\edgar_documents\AXP\4_2025-07-22: File format not allowed: data\edgar_documents\AXP\4_2025-07-22


2025-11-14 15:40:28,088 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:28,129 - INFO - Going to convert document batch...
2025-11-14 15:40:28,133 - INFO - Processing document 4_2025-08-07
2025-11-14 15:40:28,220 - INFO - Finished converting document 4_2025-08-07 in 0.16 sec.


Converted 'data\edgar_documents\AXP\4_2025-07-31' --> 'data\processed_data\AXP\4_2025-07-31.md'


2025-11-14 15:40:28,312 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:28,346 - INFO - Going to convert document batch...
2025-11-14 15:40:28,347 - INFO - Processing document 4_2025-09-04
2025-11-14 15:40:28,423 - INFO - Finished converting document 4_2025-09-04 in 0.12 sec.


Converted 'data\edgar_documents\AXP\4_2025-08-07' --> 'data\processed_data\AXP\4_2025-08-07.md'
Converted 'data\edgar_documents\AXP\4_2025-09-04' --> 'data\processed_data\AXP\4_2025-09-04.md'


2025-11-14 15:40:28,527 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:28,556 - INFO - Going to convert document batch...
2025-11-14 15:40:28,558 - INFO - Processing document 4_2025-09-05
2025-11-14 15:40:28,714 - INFO - Finished converting document 4_2025-09-05 in 0.22 sec.
2025-11-14 15:40:28,804 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:28,832 - INFO - Going to convert document batch...
2025-11-14 15:40:28,833 - INFO - Processing document 4_2025-09-08
2025-11-14 15:40:28,902 - INFO - Finished converting document 4_2025-09-08 in 0.12 sec.


Converted 'data\edgar_documents\AXP\4_2025-09-05' --> 'data\processed_data\AXP\4_2025-09-05.md'
Converted 'data\edgar_documents\AXP\4_2025-09-08' --> 'data\processed_data\AXP\4_2025-09-08.md'


2025-11-14 15:40:28,989 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:29,009 - INFO - Going to convert document batch...
2025-11-14 15:40:29,011 - INFO - Processing document 4_2025-10-02
2025-11-14 15:40:29,057 - INFO - Finished converting document 4_2025-10-02 in 0.11 sec.
2025-11-14 15:40:29,163 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:29,164 - ERROR - Input document 4_2025-10-21 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:40

Converted 'data\edgar_documents\AXP\4_2025-10-02' --> 'data\processed_data\AXP\4_2025-10-02.md'
Error processing data\edgar_documents\AXP\4_2025-10-21: File format not allowed: data\edgar_documents\AXP\4_2025-10-21


2025-11-14 15:40:29,319 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:29,337 - INFO - Going to convert document batch...
2025-11-14 15:40:29,339 - INFO - Processing document 4_2025-10-24
2025-11-14 15:40:29,393 - INFO - Finished converting document 4_2025-10-24 in 0.09 sec.
2025-11-14 15:40:29,484 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\4_2025-10-23' --> 'data\processed_data\AXP\4_2025-10-23.md'
Converted 'data\edgar_documents\AXP\4_2025-10-24' --> 'data\processed_data\AXP\4_2025-10-24.md'


2025-11-14 15:40:29,505 - INFO - Going to convert document batch...
2025-11-14 15:40:29,507 - INFO - Processing document 4_2025-11-04
2025-11-14 15:40:29,560 - INFO - Finished converting document 4_2025-11-04 in 0.11 sec.
2025-11-14 15:40:29,644 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:29,698 - INFO - Going to convert document batch...
2025-11-14 15:40:29,700 - INFO - Processing document 8-K_2023-01-17
2025-11-14 15:40:29,782 - INFO - Finished converting document 8-K_2023-01-17 in 0.17 sec.


Converted 'data\edgar_documents\AXP\4_2025-11-04' --> 'data\processed_data\AXP\4_2025-11-04.md'
Converted 'data\edgar_documents\AXP\8-K_2023-01-17' --> 'data\processed_data\AXP\8-K_2023-01-17.md'


2025-11-14 15:40:29,854 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:29,882 - INFO - Going to convert document batch...
2025-11-14 15:40:29,883 - INFO - Processing document 8-K_2023-01-27
2025-11-14 15:40:29,924 - INFO - Finished converting document 8-K_2023-01-27 in 0.11 sec.
2025-11-14 15:40:29,956 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:30,006 - INFO - Going to convert document batch...
2025-11-14 15:40:30,009 - INFO - Processing document 8-K_2023-02-15
2025-11-14 15:40:30,088 - INFO - Finished converting document 8-K_2023-02-15 in 0.16 sec.


Converted 'data\edgar_documents\AXP\8-K_2023-01-27' --> 'data\processed_data\AXP\8-K_2023-01-27.md'
Converted 'data\edgar_documents\AXP\8-K_2023-02-15' --> 'data\processed_data\AXP\8-K_2023-02-15.md'


2025-11-14 15:40:30,159 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:30,190 - INFO - Going to convert document batch...
2025-11-14 15:40:30,192 - INFO - Processing document 8-K_2023-02-16
2025-11-14 15:40:30,236 - INFO - Finished converting document 8-K_2023-02-16 in 0.11 sec.
2025-11-14 15:40:30,275 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:30,303 - INFO - Going to convert document batch...
2025-11-14 15:40:30,304 - INFO - Processing document 8-K_2023-03-08
2025-11-14 15:40:30,339 - INFO - Finished converting document 8-K_2023-03-08 in 0.09 sec.
2025-11-14 15:40:30,369 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:30,434 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AXP\8-K_2023-02-16' --> 'data\processed_data\AXP\8-K_2023-02-16.md'
Converted 'data\edgar_documents\AXP\8-K_2023-03-08' --> 'data\processed_data\AXP\8-K_2023-03-08.md'


2025-11-14 15:40:30,436 - INFO - Processing document 8-K_2023-03-15
2025-11-14 15:40:30,527 - INFO - Finished converting document 8-K_2023-03-15 in 0.17 sec.
2025-11-14 15:40:30,576 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:30,639 - INFO - Going to convert document batch...
2025-11-14 15:40:30,640 - INFO - Processing document 8-K_2023-04-17
2025-11-14 15:40:30,716 - INFO - Finished converting document 8-K_2023-04-17 in 0.16 sec.


Converted 'data\edgar_documents\AXP\8-K_2023-03-15' --> 'data\processed_data\AXP\8-K_2023-03-15.md'
Converted 'data\edgar_documents\AXP\8-K_2023-04-17' --> 'data\processed_data\AXP\8-K_2023-04-17.md'


2025-11-14 15:40:30,781 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:30,808 - INFO - Going to convert document batch...
2025-11-14 15:40:30,810 - INFO - Processing document 8-K_2023-04-20
2025-11-14 15:40:30,845 - INFO - Finished converting document 8-K_2023-04-20 in 0.09 sec.
2025-11-14 15:40:30,877 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:30,913 - INFO - Going to convert document batch...
2025-11-14 15:40:30,914 - INFO - Processing document 8-K_2023-05-01
2025-11-14 15:40:30,955 - INFO - Finished converting document 8-K_2023-05-01 in 0.09 sec.
2025-11-14 15:40:30,984 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:31,050 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\AXP\8-K_2023-04-20' --> 'data\processed_data\AXP\8-K_2023-04-20.md'
Converted 'data\edgar_documents\AXP\8-K_2023-05-01' --> 'data\processed_data\AXP\8-K_2023-05-01.md'


2025-11-14 15:40:31,051 - INFO - Processing document 8-K_2023-05-05
2025-11-14 15:40:31,166 - INFO - Finished converting document 8-K_2023-05-05 in 0.20 sec.
2025-11-14 15:40:31,241 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:31,292 - INFO - Going to convert document batch...
2025-11-14 15:40:31,293 - INFO - Processing document 8-K_2023-05-15
2025-11-14 15:40:31,367 - INFO - Finished converting document 8-K_2023-05-15 in 0.14 sec.


Converted 'data\edgar_documents\AXP\8-K_2023-05-05' --> 'data\processed_data\AXP\8-K_2023-05-05.md'


2025-11-14 15:40:31,422 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\8-K_2023-05-15' --> 'data\processed_data\AXP\8-K_2023-05-15.md'


2025-11-14 15:40:32,685 - INFO - Going to convert document batch...
2025-11-14 15:40:32,686 - INFO - Processing document 8-K_2023-06-15
2025-11-14 15:40:32,755 - INFO - Finished converting document 8-K_2023-06-15 in 1.34 sec.
2025-11-14 15:40:32,801 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:32,826 - INFO - Going to convert document batch...
2025-11-14 15:40:32,828 - INFO - Processing document 8-K_2023-06-27
2025-11-14 15:40:32,860 - INFO - Finished converting document 8-K_2023-06-27 in 0.08 sec.
2025-11-14 15:40:32,910 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\8-K_2023-06-15' --> 'data\processed_data\AXP\8-K_2023-06-15.md'
Converted 'data\edgar_documents\AXP\8-K_2023-06-27' --> 'data\processed_data\AXP\8-K_2023-06-27.md'


2025-11-14 15:40:32,982 - INFO - Going to convert document batch...
2025-11-14 15:40:32,983 - INFO - Processing document 8-K_2023-07-17
2025-11-14 15:40:33,067 - INFO - Finished converting document 8-K_2023-07-17 in 0.19 sec.
2025-11-14 15:40:33,122 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:33,147 - INFO - Going to convert document batch...
2025-11-14 15:40:33,148 - INFO - Processing document 8-K_2023-07-21
2025-11-14 15:40:33,177 - INFO - Finished converting document 8-K_2023-07-21 in 0.06 sec.
2025-11-14 15:40:33,219 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:33,258 - INFO - Going to convert document batch...
2025-11-14 15:40:33,260 - INFO - Processing document 8-K_2023-07-28
2025-11-14 15:40:33,320 - INFO - Finished converting document 8-K_2023-07-28 in 0.12 sec.


Converted 'data\edgar_documents\AXP\8-K_2023-07-17' --> 'data\processed_data\AXP\8-K_2023-07-17.md'
Converted 'data\edgar_documents\AXP\8-K_2023-07-21' --> 'data\processed_data\AXP\8-K_2023-07-21.md'


2025-11-14 15:40:33,387 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:33,443 - INFO - Going to convert document batch...
2025-11-14 15:40:33,445 - INFO - Processing document 8-K_2023-08-15
2025-11-14 15:40:33,530 - INFO - Finished converting document 8-K_2023-08-15 in 0.19 sec.


Converted 'data\edgar_documents\AXP\8-K_2023-07-28' --> 'data\processed_data\AXP\8-K_2023-07-28.md'


2025-11-14 15:40:33,585 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:33,633 - INFO - Going to convert document batch...
2025-11-14 15:40:33,633 - INFO - Processing document 8-K_2023-09-15
2025-11-14 15:40:33,699 - INFO - Finished converting document 8-K_2023-09-15 in 0.14 sec.
2025-11-14 15:40:33,749 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\8-K_2023-08-15' --> 'data\processed_data\AXP\8-K_2023-08-15.md'
Converted 'data\edgar_documents\AXP\8-K_2023-09-15' --> 'data\processed_data\AXP\8-K_2023-09-15.md'


2025-11-14 15:40:33,793 - INFO - Going to convert document batch...
2025-11-14 15:40:33,795 - INFO - Processing document 8-K_2023-10-16
2025-11-14 15:40:33,866 - INFO - Finished converting document 8-K_2023-10-16 in 0.14 sec.
2025-11-14 15:40:33,933 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:33,981 - INFO - Going to convert document batch...
2025-11-14 15:40:33,983 - INFO - Processing document 8-K_2023-10-20
2025-11-14 15:40:34,043 - INFO - Finished converting document 8-K_2023-10-20 in 0.14 sec.


Converted 'data\edgar_documents\AXP\8-K_2023-10-16' --> 'data\processed_data\AXP\8-K_2023-10-16.md'
Converted 'data\edgar_documents\AXP\8-K_2023-10-20' --> 'data\processed_data\AXP\8-K_2023-10-20.md'


2025-11-14 15:40:34,107 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:34,149 - INFO - Going to convert document batch...
2025-11-14 15:40:34,150 - INFO - Processing document 8-K_2023-10-30
2025-11-14 15:40:34,206 - INFO - Finished converting document 8-K_2023-10-30 in 0.14 sec.
2025-11-14 15:40:34,255 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:34,327 - INFO - Going to convert document batch...
2025-11-14 15:40:34,331 - INFO - Processing document 8-K_2023-11-15
2025-11-14 15:40:34,420 - INFO - Finished converting document 8-K_2023-11-15 in 0.19 sec.


Converted 'data\edgar_documents\AXP\8-K_2023-10-30' --> 'data\processed_data\AXP\8-K_2023-10-30.md'


2025-11-14 15:40:34,491 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:34,552 - INFO - Going to convert document batch...
2025-11-14 15:40:34,553 - INFO - Processing document 8-K_2023-12-15


Converted 'data\edgar_documents\AXP\8-K_2023-11-15' --> 'data\processed_data\AXP\8-K_2023-11-15.md'


2025-11-14 15:40:34,665 - INFO - Finished converting document 8-K_2023-12-15 in 0.19 sec.
2025-11-14 15:40:34,731 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:34,775 - INFO - Going to convert document batch...
2025-11-14 15:40:34,777 - INFO - Processing document 8-K_2024-01-16
2025-11-14 15:40:34,843 - INFO - Finished converting document 8-K_2024-01-16 in 0.12 sec.


Converted 'data\edgar_documents\AXP\8-K_2023-12-15' --> 'data\processed_data\AXP\8-K_2023-12-15.md'
Converted 'data\edgar_documents\AXP\8-K_2024-01-16' --> 'data\processed_data\AXP\8-K_2024-01-16.md'


2025-11-14 15:40:34,902 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:34,952 - INFO - Going to convert document batch...
2025-11-14 15:40:34,954 - INFO - Processing document 8-K_2024-01-26
2025-11-14 15:40:35,010 - INFO - Finished converting document 8-K_2024-01-26 in 0.16 sec.
2025-11-14 15:40:35,049 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:35,100 - INFO - Going to convert document batch...
2025-11-14 15:40:35,101 - INFO - Processing document 8-K_2024-02-15
2025-11-14 15:40:35,182 - INFO - Finished converting document 8-K_2024-02-15 in 0.16 sec.


Converted 'data\edgar_documents\AXP\8-K_2024-01-26' --> 'data\processed_data\AXP\8-K_2024-01-26.md'


2025-11-14 15:40:35,264 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:35,295 - INFO - Going to convert document batch...
2025-11-14 15:40:35,297 - INFO - Processing document 8-K_2024-02-16
2025-11-14 15:40:35,340 - INFO - Finished converting document 8-K_2024-02-16 in 0.11 sec.
2025-11-14 15:40:35,377 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:35,403 - INFO - Going to convert document batch...
2025-11-14 15:40:35,404 - INFO - Processing document 8-K_2024-03-07
2025-11-14 15:40:35,435 - INFO - Finished converting document 8-K_2024-03-07 in 0.08 sec.


Converted 'data\edgar_documents\AXP\8-K_2024-02-15' --> 'data\processed_data\AXP\8-K_2024-02-15.md'
Converted 'data\edgar_documents\AXP\8-K_2024-02-16' --> 'data\processed_data\AXP\8-K_2024-02-16.md'


2025-11-14 15:40:35,466 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:35,502 - INFO - Going to convert document batch...
2025-11-14 15:40:35,502 - INFO - Processing document 8-K_2024-03-15
2025-11-14 15:40:35,563 - INFO - Finished converting document 8-K_2024-03-15 in 0.11 sec.
2025-11-14 15:40:35,624 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\8-K_2024-03-07' --> 'data\processed_data\AXP\8-K_2024-03-07.md'
Converted 'data\edgar_documents\AXP\8-K_2024-03-15' --> 'data\processed_data\AXP\8-K_2024-03-15.md'


2025-11-14 15:40:35,699 - INFO - Going to convert document batch...
2025-11-14 15:40:35,701 - INFO - Processing document 8-K_2024-04-15
2025-11-14 15:40:35,852 - INFO - Finished converting document 8-K_2024-04-15 in 0.24 sec.
2025-11-14 15:40:35,943 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:35,962 - INFO - Going to convert document batch...
2025-11-14 15:40:35,964 - INFO - Processing document 8-K_2024-04-19
2025-11-14 15:40:36,049 - INFO - Finished converting document 8-K_2024-04-19 in 0.12 sec.


Converted 'data\edgar_documents\AXP\8-K_2024-04-15' --> 'data\processed_data\AXP\8-K_2024-04-15.md'
Converted 'data\edgar_documents\AXP\8-K_2024-04-19' --> 'data\processed_data\AXP\8-K_2024-04-19.md'


2025-11-14 15:40:36,139 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:36,174 - INFO - Going to convert document batch...
2025-11-14 15:40:36,176 - INFO - Processing document 8-K_2024-04-25
2025-11-14 15:40:36,244 - INFO - Finished converting document 8-K_2024-04-25 in 0.12 sec.
2025-11-14 15:40:36,271 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:36,349 - INFO - Going to convert document batch...
2025-11-14 15:40:36,349 - INFO - Processing document 8-K_2024-05-08


Converted 'data\edgar_documents\AXP\8-K_2024-04-25' --> 'data\processed_data\AXP\8-K_2024-04-25.md'


2025-11-14 15:40:36,574 - INFO - Finished converting document 8-K_2024-05-08 in 0.33 sec.
2025-11-14 15:40:36,689 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:36,739 - INFO - Going to convert document batch...
2025-11-14 15:40:36,741 - INFO - Processing document 8-K_2024-05-15
2025-11-14 15:40:36,817 - INFO - Finished converting document 8-K_2024-05-15 in 0.14 sec.


Converted 'data\edgar_documents\AXP\8-K_2024-05-08' --> 'data\processed_data\AXP\8-K_2024-05-08.md'
Converted 'data\edgar_documents\AXP\8-K_2024-05-15' --> 'data\processed_data\AXP\8-K_2024-05-15.md'


2025-11-14 15:40:36,877 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:36,937 - INFO - Going to convert document batch...
2025-11-14 15:40:36,939 - INFO - Processing document 8-K_2024-06-17
2025-11-14 15:40:37,021 - INFO - Finished converting document 8-K_2024-06-17 in 0.17 sec.
2025-11-14 15:40:37,093 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:37,179 - INFO - Going to convert document batch...
2025-11-14 15:40:37,181 - INFO - Processing document 8-K_2024-07-15


Converted 'data\edgar_documents\AXP\8-K_2024-06-17' --> 'data\processed_data\AXP\8-K_2024-06-17.md'


2025-11-14 15:40:37,299 - INFO - Finished converting document 8-K_2024-07-15 in 0.22 sec.
2025-11-14 15:40:37,374 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:37,413 - INFO - Going to convert document batch...
2025-11-14 15:40:37,414 - INFO - Processing document 8-K_2024-07-19
2025-11-14 15:40:37,460 - INFO - Finished converting document 8-K_2024-07-19 in 0.11 sec.
2025-11-14 15:40:37,506 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\8-K_2024-07-15' --> 'data\processed_data\AXP\8-K_2024-07-15.md'
Converted 'data\edgar_documents\AXP\8-K_2024-07-19' --> 'data\processed_data\AXP\8-K_2024-07-19.md'


2025-11-14 15:40:37,545 - INFO - Going to convert document batch...
2025-11-14 15:40:37,549 - INFO - Processing document 8-K_2024-07-26
2025-11-14 15:40:37,627 - INFO - Finished converting document 8-K_2024-07-26 in 0.16 sec.
2025-11-14 15:40:37,674 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:37,729 - INFO - Going to convert document batch...
2025-11-14 15:40:37,731 - INFO - Processing document 8-K_2024-08-15
2025-11-14 15:40:37,839 - INFO - Finished converting document 8-K_2024-08-15 in 0.19 sec.


Converted 'data\edgar_documents\AXP\8-K_2024-07-26' --> 'data\processed_data\AXP\8-K_2024-07-26.md'


2025-11-14 15:40:37,920 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:37,967 - INFO - Going to convert document batch...
2025-11-14 15:40:37,968 - INFO - Processing document 8-K_2024-09-16
2025-11-14 15:40:38,042 - INFO - Finished converting document 8-K_2024-09-16 in 0.14 sec.


Converted 'data\edgar_documents\AXP\8-K_2024-08-15' --> 'data\processed_data\AXP\8-K_2024-08-15.md'
Converted 'data\edgar_documents\AXP\8-K_2024-09-16' --> 'data\processed_data\AXP\8-K_2024-09-16.md'


2025-11-14 15:40:38,113 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:38,133 - INFO - Going to convert document batch...
2025-11-14 15:40:38,134 - INFO - Processing document 8-K_2024-09-27
2025-11-14 15:40:38,171 - INFO - Finished converting document 8-K_2024-09-27 in 0.09 sec.
2025-11-14 15:40:38,200 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:38,241 - INFO - Going to convert document batch...
2025-11-14 15:40:38,244 - INFO - Processing document 8-K_2024-10-15
2025-11-14 15:40:38,319 - INFO - Finished converting document 8-K_2024-10-15 in 0.12 sec.


Converted 'data\edgar_documents\AXP\8-K_2024-09-27' --> 'data\processed_data\AXP\8-K_2024-09-27.md'
Converted 'data\edgar_documents\AXP\8-K_2024-10-15' --> 'data\processed_data\AXP\8-K_2024-10-15.md'


2025-11-14 15:40:38,387 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:38,422 - INFO - Going to convert document batch...
2025-11-14 15:40:38,424 - INFO - Processing document 8-K_2024-10-18
2025-11-14 15:40:38,470 - INFO - Finished converting document 8-K_2024-10-18 in 0.11 sec.
2025-11-14 15:40:38,518 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:38,551 - INFO - Going to convert document batch...
2025-11-14 15:40:38,552 - INFO - Processing document 8-K_2024-11-15


Converted 'data\edgar_documents\AXP\8-K_2024-10-18' --> 'data\processed_data\AXP\8-K_2024-10-18.md'


2025-11-14 15:40:38,697 - INFO - Finished converting document 8-K_2024-11-15 in 0.20 sec.
2025-11-14 15:40:38,767 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:38,806 - INFO - Going to convert document batch...
2025-11-14 15:40:38,808 - INFO - Processing document 8-K_2024-12-16
2025-11-14 15:40:38,893 - INFO - Finished converting document 8-K_2024-12-16 in 0.14 sec.


Converted 'data\edgar_documents\AXP\8-K_2024-11-15' --> 'data\processed_data\AXP\8-K_2024-11-15.md'
Converted 'data\edgar_documents\AXP\8-K_2024-12-16' --> 'data\processed_data\AXP\8-K_2024-12-16.md'


2025-11-14 15:40:38,994 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:39,069 - INFO - Going to convert document batch...
2025-11-14 15:40:39,070 - INFO - Processing document 8-K_2025-01-15
2025-11-14 15:40:39,208 - INFO - Finished converting document 8-K_2025-01-15 in 0.25 sec.
2025-11-14 15:40:39,301 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:39,327 - INFO - Going to convert document batch...
2025-11-14 15:40:39,328 - INFO - Processing document 8-K_2025-01-16
2025-11-14 15:40:39,374 - INFO - Finished converting document 8-K_2025-01-16 in 0.09 sec.
2025-11-14 15:40:39,414 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:39,453 - INFO - Going to convert document batch...
2025-11-14 15:40:39,454 - INFO - Processing document 8-K_2025-01-24


Converted 'data\edgar_documents\AXP\8-K_2025-01-15' --> 'data\processed_data\AXP\8-K_2025-01-15.md'
Converted 'data\edgar_documents\AXP\8-K_2025-01-16' --> 'data\processed_data\AXP\8-K_2025-01-16.md'


2025-11-14 15:40:39,511 - INFO - Finished converting document 8-K_2025-01-24 in 0.12 sec.
2025-11-14 15:40:39,554 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:39,577 - INFO - Going to convert document batch...
2025-11-14 15:40:39,578 - INFO - Processing document 8-K_2025-01-30
2025-11-14 15:40:39,614 - INFO - Finished converting document 8-K_2025-01-30 in 0.08 sec.
2025-11-14 15:40:39,661 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:39,696 - INFO - Going to convert document batch...
2025-11-14 15:40:39,697 - INFO - Processing document 8-K_2025-02-18


Converted 'data\edgar_documents\AXP\8-K_2025-01-24' --> 'data\processed_data\AXP\8-K_2025-01-24.md'
Converted 'data\edgar_documents\AXP\8-K_2025-01-30' --> 'data\processed_data\AXP\8-K_2025-01-30.md'


2025-11-14 15:40:39,837 - INFO - Finished converting document 8-K_2025-02-18 in 0.20 sec.
2025-11-14 15:40:39,931 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:39,967 - INFO - Going to convert document batch...
2025-11-14 15:40:39,968 - INFO - Processing document 8-K_2025-03-03
2025-11-14 15:40:40,025 - INFO - Finished converting document 8-K_2025-03-03 in 0.12 sec.
2025-11-14 15:40:40,081 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\8-K_2025-02-18' --> 'data\processed_data\AXP\8-K_2025-02-18.md'
Converted 'data\edgar_documents\AXP\8-K_2025-03-03' --> 'data\processed_data\AXP\8-K_2025-03-03.md'


2025-11-14 15:40:40,157 - INFO - Going to convert document batch...
2025-11-14 15:40:40,159 - INFO - Processing document 8-K_2025-03-17
2025-11-14 15:40:40,227 - INFO - Finished converting document 8-K_2025-03-17 in 0.17 sec.
2025-11-14 15:40:40,266 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:40,303 - INFO - Going to convert document batch...
2025-11-14 15:40:40,304 - INFO - Processing document 8-K_2025-04-15


Converted 'data\edgar_documents\AXP\8-K_2025-03-17' --> 'data\processed_data\AXP\8-K_2025-03-17.md'


2025-11-14 15:40:40,886 - INFO - Finished converting document 8-K_2025-04-15 in 0.64 sec.
2025-11-14 15:40:40,994 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:41,033 - INFO - Going to convert document batch...
2025-11-14 15:40:41,035 - INFO - Processing document 8-K_2025-04-17
2025-11-14 15:40:41,085 - INFO - Finished converting document 8-K_2025-04-17 in 0.11 sec.


Converted 'data\edgar_documents\AXP\8-K_2025-04-15' --> 'data\processed_data\AXP\8-K_2025-04-15.md'
Converted 'data\edgar_documents\AXP\8-K_2025-04-17' --> 'data\processed_data\AXP\8-K_2025-04-17.md'


2025-11-14 15:40:41,162 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:41,199 - INFO - Going to convert document batch...
2025-11-14 15:40:41,201 - INFO - Processing document 8-K_2025-04-25
2025-11-14 15:40:41,267 - INFO - Finished converting document 8-K_2025-04-25 in 0.14 sec.
2025-11-14 15:40:41,315 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:41,383 - INFO - Going to convert document batch...
2025-11-14 15:40:41,384 - INFO - Processing document 8-K_2025-05-01


Converted 'data\edgar_documents\AXP\8-K_2025-04-25' --> 'data\processed_data\AXP\8-K_2025-04-25.md'


2025-11-14 15:40:41,526 - INFO - Finished converting document 8-K_2025-05-01 in 0.23 sec.
2025-11-14 15:40:41,616 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:41,668 - INFO - Going to convert document batch...
2025-11-14 15:40:41,668 - INFO - Processing document 8-K_2025-05-15
2025-11-14 15:40:41,741 - INFO - Finished converting document 8-K_2025-05-15 in 0.14 sec.
2025-11-14 15:40:41,792 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\8-K_2025-05-01' --> 'data\processed_data\AXP\8-K_2025-05-01.md'
Converted 'data\edgar_documents\AXP\8-K_2025-05-15' --> 'data\processed_data\AXP\8-K_2025-05-15.md'


2025-11-14 15:40:41,811 - INFO - Going to convert document batch...
2025-11-14 15:40:41,812 - INFO - Processing document 8-K_2025-05-20
2025-11-14 15:40:41,844 - INFO - Finished converting document 8-K_2025-05-20 in 0.08 sec.
2025-11-14 15:40:41,873 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:41,905 - INFO - Going to convert document batch...
2025-11-14 15:40:41,906 - INFO - Processing document 8-K_2025-06-16
2025-11-14 15:40:41,951 - INFO - Finished converting document 8-K_2025-06-16 in 0.09 sec.
2025-11-14 15:40:42,037 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\8-K_2025-05-20' --> 'data\processed_data\AXP\8-K_2025-05-20.md'
Converted 'data\edgar_documents\AXP\8-K_2025-06-16' --> 'data\processed_data\AXP\8-K_2025-06-16.md'


2025-11-14 15:40:42,089 - INFO - Going to convert document batch...
2025-11-14 15:40:42,093 - INFO - Processing document 8-K_2025-07-01
2025-11-14 15:40:42,170 - INFO - Finished converting document 8-K_2025-07-01 in 0.17 sec.
2025-11-14 15:40:42,202 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:42,259 - INFO - Going to convert document batch...
2025-11-14 15:40:42,261 - INFO - Processing document 8-K_2025-07-15
2025-11-14 15:40:42,382 - INFO - Finished converting document 8-K_2025-07-15 in 0.19 sec.


Converted 'data\edgar_documents\AXP\8-K_2025-07-01' --> 'data\processed_data\AXP\8-K_2025-07-01.md'


2025-11-14 15:40:42,467 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:42,518 - INFO - Going to convert document batch...
2025-11-14 15:40:42,521 - INFO - Processing document 8-K_2025-07-18
2025-11-14 15:40:42,596 - INFO - Finished converting document 8-K_2025-07-18 in 0.14 sec.


Converted 'data\edgar_documents\AXP\8-K_2025-07-15' --> 'data\processed_data\AXP\8-K_2025-07-15.md'
Converted 'data\edgar_documents\AXP\8-K_2025-07-18' --> 'data\processed_data\AXP\8-K_2025-07-18.md'


2025-11-14 15:40:42,672 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:42,692 - INFO - Going to convert document batch...
2025-11-14 15:40:42,693 - INFO - Processing document 8-K_2025-07-23
2025-11-14 15:40:42,724 - INFO - Finished converting document 8-K_2025-07-23 in 0.08 sec.
2025-11-14 15:40:42,752 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:42,784 - INFO - Going to convert document batch...
2025-11-14 15:40:42,786 - INFO - Processing document 8-K_2025-07-25
2025-11-14 15:40:42,826 - INFO - Finished converting document 8-K_2025-07-25 in 0.09 sec.
2025-11-14 15:40:42,872 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:42,915 - INFO - Going to convert document batch...
2025-11-14 15:40:42,916 - INFO - Processing document 8-K_2025-08-15


Converted 'data\edgar_documents\AXP\8-K_2025-07-23' --> 'data\processed_data\AXP\8-K_2025-07-23.md'
Converted 'data\edgar_documents\AXP\8-K_2025-07-25' --> 'data\processed_data\AXP\8-K_2025-07-25.md'


2025-11-14 15:40:42,978 - INFO - Finished converting document 8-K_2025-08-15 in 0.12 sec.
2025-11-14 15:40:43,022 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:43,059 - INFO - Going to convert document batch...
2025-11-14 15:40:43,060 - INFO - Processing document 8-K_2025-09-15
2025-11-14 15:40:43,133 - INFO - Finished converting document 8-K_2025-09-15 in 0.12 sec.


Converted 'data\edgar_documents\AXP\8-K_2025-08-15' --> 'data\processed_data\AXP\8-K_2025-08-15.md'
Converted 'data\edgar_documents\AXP\8-K_2025-09-15' --> 'data\processed_data\AXP\8-K_2025-09-15.md'


2025-11-14 15:40:43,199 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:43,223 - INFO - Going to convert document batch...
2025-11-14 15:40:43,224 - INFO - Processing document 8-K_2025-09-29
2025-11-14 15:40:43,259 - INFO - Finished converting document 8-K_2025-09-29 in 0.08 sec.
2025-11-14 15:40:43,293 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:43,330 - INFO - Going to convert document batch...
2025-11-14 15:40:43,331 - INFO - Processing document 8-K_2025-10-15
2025-11-14 15:40:43,405 - INFO - Finished converting document 8-K_2025-10-15 in 0.12 sec.
2025-11-14 15:40:43,473 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\AXP\8-K_2025-09-29' --> 'data\processed_data\AXP\8-K_2025-09-29.md'
Converted 'data\edgar_documents\AXP\8-K_2025-10-15' --> 'data\processed_data\AXP\8-K_2025-10-15.md'


2025-11-14 15:40:43,499 - INFO - Going to convert document batch...
2025-11-14 15:40:43,500 - INFO - Processing document 8-K_2025-10-17
2025-11-14 15:40:43,538 - INFO - Finished converting document 8-K_2025-10-17 in 0.09 sec.
2025-11-14 15:40:43,568 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:43,591 - INFO - Going to convert document batch...
2025-11-14 15:40:43,593 - INFO - Processing document 8-K_2025-10-24
2025-11-14 15:40:43,636 - INFO - Finished converting document 8-K_2025-10-24 in 0.08 sec.


Converted 'data\edgar_documents\AXP\8-K_2025-10-17' --> 'data\processed_data\AXP\8-K_2025-10-17.md'
Converted 'data\edgar_documents\AXP\8-K_2025-10-24' --> 'data\processed_data\AXP\8-K_2025-10-24.md'


2025-11-14 15:40:43,743 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:43,743 - ERROR - Input document DEF-14A_2023-03-17 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:40:43,747 - INFO - Going to convert document batch...
2025-11-14 15:40:43,800 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:40:43,800 - ERROR - Input document DEF-14A_2024-03-15 with format No

Error processing data\edgar_documents\AXP\DEF-14A_2023-03-17: File format not allowed: data\edgar_documents\AXP\DEF-14A_2023-03-17
Error processing data\edgar_documents\AXP\DEF-14A_2024-03-15: File format not allowed: data\edgar_documents\AXP\DEF-14A_2024-03-15
Error processing data\edgar_documents\AXP\DEF-14A_2025-03-14: File format not allowed: data\edgar_documents\AXP\DEF-14A_2025-03-14
Processed 149 new files. Errors: 20
Found 106 files to process in data\edgar_documents\BA


2025-11-14 15:40:44,048 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:40:46,485 - INFO - Going to convert document batch...
2025-11-14 15:40:46,486 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:40:46,487 - INFO - Processing document 10-K_2023-01-27
2025-11-14 15:40:52,229 - INFO - Finished converting document 10-K_2023-01-27 in 8.36 sec.
2025-11-14 15:40:54,041 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\10-K_2023-01-27' --> 'data\processed_data\BA\10-K_2023-01-27.md'


2025-11-14 15:40:56,375 - INFO - Going to convert document batch...
2025-11-14 15:40:56,376 - INFO - Processing document 10-K_2024-01-31
2025-11-14 15:41:01,591 - INFO - Finished converting document 10-K_2024-01-31 in 7.66 sec.
2025-11-14 15:41:03,908 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\10-K_2024-01-31' --> 'data\processed_data\BA\10-K_2024-01-31.md'


2025-11-14 15:41:07,284 - INFO - Going to convert document batch...
2025-11-14 15:41:07,285 - INFO - Processing document 10-K_2025-02-03
2025-11-14 15:41:13,152 - INFO - Finished converting document 10-K_2025-02-03 in 9.34 sec.
2025-11-14 15:41:15,504 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\10-K_2025-02-03' --> 'data\processed_data\BA\10-K_2025-02-03.md'


2025-11-14 15:41:16,334 - INFO - Going to convert document batch...
2025-11-14 15:41:16,336 - INFO - Processing document 10-Q_2023-04-26
2025-11-14 15:41:19,607 - INFO - Finished converting document 10-Q_2023-04-26 in 4.20 sec.
2025-11-14 15:41:20,788 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\10-Q_2023-04-26' --> 'data\processed_data\BA\10-Q_2023-04-26.md'


2025-11-14 15:41:22,048 - INFO - Going to convert document batch...
2025-11-14 15:41:22,050 - INFO - Processing document 10-Q_2023-07-26
2025-11-14 15:41:24,595 - INFO - Finished converting document 10-Q_2023-07-26 in 3.84 sec.
2025-11-14 15:41:25,882 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\10-Q_2023-07-26' --> 'data\processed_data\BA\10-Q_2023-07-26.md'


2025-11-14 15:41:28,028 - INFO - Going to convert document batch...
2025-11-14 15:41:28,029 - INFO - Processing document 10-Q_2023-10-25
2025-11-14 15:41:30,736 - INFO - Finished converting document 10-Q_2023-10-25 in 4.89 sec.
2025-11-14 15:41:32,033 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\10-Q_2023-10-25' --> 'data\processed_data\BA\10-Q_2023-10-25.md'


2025-11-14 15:41:32,947 - INFO - Going to convert document batch...
2025-11-14 15:41:32,949 - INFO - Processing document 10-Q_2024-04-24
2025-11-14 15:41:35,284 - INFO - Finished converting document 10-Q_2024-04-24 in 3.30 sec.
2025-11-14 15:41:36,630 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\10-Q_2024-04-24' --> 'data\processed_data\BA\10-Q_2024-04-24.md'


2025-11-14 15:41:38,247 - INFO - Going to convert document batch...
2025-11-14 15:41:38,248 - INFO - Processing document 10-Q_2024-07-31
2025-11-14 15:41:41,291 - INFO - Finished converting document 10-Q_2024-07-31 in 4.72 sec.
2025-11-14 15:41:42,670 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\10-Q_2024-07-31' --> 'data\processed_data\BA\10-Q_2024-07-31.md'


2025-11-14 15:41:44,651 - INFO - Going to convert document batch...
2025-11-14 15:41:44,653 - INFO - Processing document 10-Q_2024-10-23
2025-11-14 15:41:47,398 - INFO - Finished converting document 10-Q_2024-10-23 in 4.77 sec.
2025-11-14 15:41:49,027 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\10-Q_2024-10-23' --> 'data\processed_data\BA\10-Q_2024-10-23.md'


2025-11-14 15:41:50,013 - INFO - Going to convert document batch...
2025-11-14 15:41:50,020 - INFO - Processing document 10-Q_2025-04-23
2025-11-14 15:41:52,518 - INFO - Finished converting document 10-Q_2025-04-23 in 3.56 sec.
2025-11-14 15:41:54,710 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\10-Q_2025-04-23' --> 'data\processed_data\BA\10-Q_2025-04-23.md'


2025-11-14 15:41:56,332 - INFO - Going to convert document batch...
2025-11-14 15:41:56,334 - INFO - Processing document 10-Q_2025-07-29
2025-11-14 15:41:59,271 - INFO - Finished converting document 10-Q_2025-07-29 in 4.61 sec.
2025-11-14 15:42:00,657 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\10-Q_2025-07-29' --> 'data\processed_data\BA\10-Q_2025-07-29.md'


2025-11-14 15:42:02,335 - INFO - Going to convert document batch...
2025-11-14 15:42:02,336 - INFO - Processing document 10-Q_2025-10-29
2025-11-14 15:42:05,391 - INFO - Finished converting document 10-Q_2025-10-29 in 4.80 sec.
2025-11-14 15:42:07,032 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:07,062 - INFO - Going to convert document batch...
2025-11-14 15:42:07,064 - INFO - Processing document 4_2023-01-05
2025-11-14 15:42:07,122 - INFO - Finished converting document 4_2023-01-05 in 0.12 sec.


Converted 'data\edgar_documents\BA\10-Q_2025-10-29' --> 'data\processed_data\BA\10-Q_2025-10-29.md'
Converted 'data\edgar_documents\BA\4_2023-01-05' --> 'data\processed_data\BA\4_2023-01-05.md'


2025-11-14 15:42:07,248 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:07,279 - INFO - Going to convert document batch...
2025-11-14 15:42:07,281 - INFO - Processing document 4_2023-02-21
2025-11-14 15:42:07,341 - INFO - Finished converting document 4_2023-02-21 in 0.14 sec.
2025-11-14 15:42:07,415 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:07,439 - INFO - Going to convert document batch...
2025-11-14 15:42:07,441 - INFO - Processing document 4_2023-02-28
2025-11-14 15:42:07,494 - INFO - Finished converting document 4_2023-02-28 in 0.09 sec.
2025-11-14 15:42:07,579 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\4_2023-02-21' --> 'data\processed_data\BA\4_2023-02-21.md'
Converted 'data\edgar_documents\BA\4_2023-02-28' --> 'data\processed_data\BA\4_2023-02-28.md'


2025-11-14 15:42:07,609 - INFO - Going to convert document batch...
2025-11-14 15:42:07,611 - INFO - Processing document 4_2023-04-05
2025-11-14 15:42:07,674 - INFO - Finished converting document 4_2023-04-05 in 0.12 sec.
2025-11-14 15:42:07,736 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:07,753 - INFO - Going to convert document batch...
2025-11-14 15:42:07,756 - INFO - Processing document 4_2023-04-18
2025-11-14 15:42:07,810 - INFO - Finished converting document 4_2023-04-18 in 0.09 sec.
2025-11-14 15:42:07,926 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\4_2023-04-05' --> 'data\processed_data\BA\4_2023-04-05.md'
Converted 'data\edgar_documents\BA\4_2023-04-18' --> 'data\processed_data\BA\4_2023-04-18.md'


2025-11-14 15:42:07,954 - INFO - Going to convert document batch...
2025-11-14 15:42:07,956 - INFO - Processing document 4_2023-05-03
2025-11-14 15:42:08,046 - INFO - Finished converting document 4_2023-05-03 in 0.16 sec.
2025-11-14 15:42:08,148 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:08,175 - INFO - Going to convert document batch...
2025-11-14 15:42:08,177 - INFO - Processing document 4_2023-05-08
2025-11-14 15:42:08,245 - INFO - Finished converting document 4_2023-05-08 in 0.14 sec.


Converted 'data\edgar_documents\BA\4_2023-05-03' --> 'data\processed_data\BA\4_2023-05-03.md'


2025-11-14 15:42:08,334 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:08,375 - INFO - Going to convert document batch...
2025-11-14 15:42:08,378 - INFO - Processing document 4_2023-07-06
2025-11-14 15:42:08,457 - INFO - Finished converting document 4_2023-07-06 in 0.14 sec.


Converted 'data\edgar_documents\BA\4_2023-05-08' --> 'data\processed_data\BA\4_2023-05-08.md'


2025-11-14 15:42:08,569 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:08,596 - INFO - Going to convert document batch...
2025-11-14 15:42:08,598 - INFO - Processing document 4_2023-07-10
2025-11-14 15:42:08,669 - INFO - Finished converting document 4_2023-07-10 in 0.12 sec.


Converted 'data\edgar_documents\BA\4_2023-07-06' --> 'data\processed_data\BA\4_2023-07-06.md'
Converted 'data\edgar_documents\BA\4_2023-07-10' --> 'data\processed_data\BA\4_2023-07-10.md'


2025-11-14 15:42:08,980 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:09,033 - INFO - Going to convert document batch...
2025-11-14 15:42:09,035 - INFO - Processing document 4_2023-08-02
2025-11-14 15:42:09,097 - INFO - Finished converting document 4_2023-08-02 in 0.34 sec.
2025-11-14 15:42:09,158 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:09,172 - INFO - Going to convert document batch...
2025-11-14 15:42:09,173 - INFO - Processing document 4_2023-08-03
2025-11-14 15:42:09,245 - INFO - Finished converting document 4_2023-08-03 in 0.11 sec.
2025-11-14 15:42:09,321 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\4_2023-08-02' --> 'data\processed_data\BA\4_2023-08-02.md'
Converted 'data\edgar_documents\BA\4_2023-08-03' --> 'data\processed_data\BA\4_2023-08-03.md'


2025-11-14 15:42:09,356 - INFO - Going to convert document batch...
2025-11-14 15:42:09,357 - INFO - Processing document 4_2023-10-04
2025-11-14 15:42:09,396 - INFO - Finished converting document 4_2023-10-04 in 0.09 sec.
2025-11-14 15:42:09,488 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:09,537 - INFO - Going to convert document batch...
2025-11-14 15:42:09,538 - INFO - Processing document 4_2023-12-05
2025-11-14 15:42:09,582 - INFO - Finished converting document 4_2023-12-05 in 0.12 sec.


Converted 'data\edgar_documents\BA\4_2023-10-04' --> 'data\processed_data\BA\4_2023-10-04.md'
Converted 'data\edgar_documents\BA\4_2023-12-05' --> 'data\processed_data\BA\4_2023-12-05.md'


2025-11-14 15:42:09,679 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:09,700 - INFO - Going to convert document batch...
2025-11-14 15:42:09,702 - INFO - Processing document 4_2023-12-18
2025-11-14 15:42:09,760 - INFO - Finished converting document 4_2023-12-18 in 0.12 sec.
2025-11-14 15:42:09,828 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:09,845 - INFO - Going to convert document batch...
2025-11-14 15:42:09,846 - INFO - Processing document 4_2024-01-04
2025-11-14 15:42:09,924 - INFO - Finished converting document 4_2024-01-04 in 0.12 sec.


Converted 'data\edgar_documents\BA\4_2023-12-18' --> 'data\processed_data\BA\4_2023-12-18.md'
Converted 'data\edgar_documents\BA\4_2024-01-04' --> 'data\processed_data\BA\4_2024-01-04.md'


2025-11-14 15:42:10,022 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:10,055 - INFO - Going to convert document batch...
2025-11-14 15:42:10,057 - INFO - Processing document 4_2024-01-22
2025-11-14 15:42:10,178 - INFO - Finished converting document 4_2024-01-22 in 0.20 sec.
2025-11-14 15:42:10,238 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:10,253 - INFO - Going to convert document batch...
2025-11-14 15:42:10,254 - INFO - Processing document 4_2024-02-21
2025-11-14 15:42:10,285 - INFO - Finished converting document 4_2024-02-21 in 0.06 sec.
2025-11-14 15:42:10,368 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\4_2024-01-22' --> 'data\processed_data\BA\4_2024-01-22.md'
Converted 'data\edgar_documents\BA\4_2024-02-21' --> 'data\processed_data\BA\4_2024-02-21.md'


2025-11-14 15:42:10,401 - INFO - Going to convert document batch...
2025-11-14 15:42:10,404 - INFO - Processing document 4_2024-02-22
2025-11-14 15:42:10,472 - INFO - Finished converting document 4_2024-02-22 in 0.14 sec.
2025-11-14 15:42:10,569 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:10,602 - INFO - Going to convert document batch...
2025-11-14 15:42:10,604 - INFO - Processing document 4_2024-03-01
2025-11-14 15:42:10,685 - INFO - Finished converting document 4_2024-03-01 in 0.16 sec.


Converted 'data\edgar_documents\BA\4_2024-02-22' --> 'data\processed_data\BA\4_2024-02-22.md'


2025-11-14 15:42:10,800 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:10,832 - INFO - Going to convert document batch...
2025-11-14 15:42:10,833 - INFO - Processing document 4_2024-03-13
2025-11-14 15:42:10,898 - INFO - Finished converting document 4_2024-03-13 in 0.12 sec.


Converted 'data\edgar_documents\BA\4_2024-03-01' --> 'data\processed_data\BA\4_2024-03-01.md'
Converted 'data\edgar_documents\BA\4_2024-03-13' --> 'data\processed_data\BA\4_2024-03-13.md'


2025-11-14 15:42:11,004 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:11,047 - INFO - Going to convert document batch...
2025-11-14 15:42:11,048 - INFO - Processing document 4_2024-04-03
2025-11-14 15:42:11,120 - INFO - Finished converting document 4_2024-04-03 in 0.17 sec.
2025-11-14 15:42:11,227 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:42:11,228 - ERROR - Input document 4_2024-07-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:42

Converted 'data\edgar_documents\BA\4_2024-04-03' --> 'data\processed_data\BA\4_2024-04-03.md'
Error processing data\edgar_documents\BA\4_2024-07-01: File format not allowed: data\edgar_documents\BA\4_2024-07-01


2025-11-14 15:42:11,463 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:42:11,465 - ERROR - Input document 4_2024-07-31 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:42:11,467 - INFO - Going to convert document batch...
2025-11-14 15:42:11,505 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:11,548 - INFO - Going to convert document batch...
2025-11-14 15:42:11,550 - INFO - Processing document 4_2024-08-09


Converted 'data\edgar_documents\BA\4_2024-07-03' --> 'data\processed_data\BA\4_2024-07-03.md'
Error processing data\edgar_documents\BA\4_2024-07-31: File format not allowed: data\edgar_documents\BA\4_2024-07-31


2025-11-14 15:42:11,613 - INFO - Finished converting document 4_2024-08-09 in 0.14 sec.
2025-11-14 15:42:11,708 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:11,736 - INFO - Going to convert document batch...
2025-11-14 15:42:11,738 - INFO - Processing document 4_2024-08-29
2025-11-14 15:42:11,804 - INFO - Finished converting document 4_2024-08-29 in 0.11 sec.


Converted 'data\edgar_documents\BA\4_2024-08-09' --> 'data\processed_data\BA\4_2024-08-09.md'
Converted 'data\edgar_documents\BA\4_2024-08-29' --> 'data\processed_data\BA\4_2024-08-29.md'


2025-11-14 15:42:11,909 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:11,951 - INFO - Going to convert document batch...
2025-11-14 15:42:11,954 - INFO - Processing document 4_2024-09-05
2025-11-14 15:42:12,039 - INFO - Finished converting document 4_2024-09-05 in 0.16 sec.
2025-11-14 15:42:12,139 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:12,170 - INFO - Going to convert document batch...
2025-11-14 15:42:12,172 - INFO - Processing document 4_2024-10-03
2025-11-14 15:42:12,237 - INFO - Finished converting document 4_2024-10-03 in 0.14 sec.


Converted 'data\edgar_documents\BA\4_2024-09-05' --> 'data\processed_data\BA\4_2024-09-05.md'
Converted 'data\edgar_documents\BA\4_2024-10-03' --> 'data\processed_data\BA\4_2024-10-03.md'


2025-11-14 15:42:12,519 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:42:12,522 - ERROR - Input document 4_2024-10-28 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:42:12,526 - INFO - Going to convert document batch...
2025-11-14 15:42:12,556 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:42:12,559 - ERROR - Input document 4_2024-10-29 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\BA\4_2024-10-28: File format not allowed: data\edgar_documents\BA\4_2024-10-28
Error processing data\edgar_documents\BA\4_2024-10-29: File format not allowed: data\edgar_documents\BA\4_2024-10-29
Error processing data\edgar_documents\BA\4_2024-11-18: File format not allowed: data\edgar_documents\BA\4_2024-11-18


2025-11-14 15:42:12,877 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:42:12,879 - ERROR - Input document 4_2024-12-20 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:42:12,884 - INFO - Going to convert document batch...
2025-11-14 15:42:12,922 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:12,955 - INFO - Going to convert document batch...
2025-11-14 15:42:12,957 - INFO - Processing document 4_2025-01-03


Converted 'data\edgar_documents\BA\4_2024-12-04' --> 'data\processed_data\BA\4_2024-12-04.md'
Error processing data\edgar_documents\BA\4_2024-12-20: File format not allowed: data\edgar_documents\BA\4_2024-12-20


2025-11-14 15:42:13,119 - INFO - Finished converting document 4_2025-01-03 in 0.23 sec.
2025-11-14 15:42:13,181 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:13,198 - INFO - Going to convert document batch...
2025-11-14 15:42:13,199 - INFO - Processing document 4_2025-01-06
2025-11-14 15:42:13,239 - INFO - Finished converting document 4_2025-01-06 in 0.06 sec.
2025-11-14 15:42:13,325 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\4_2025-01-03' --> 'data\processed_data\BA\4_2025-01-03.md'
Converted 'data\edgar_documents\BA\4_2025-01-06' --> 'data\processed_data\BA\4_2025-01-06.md'


2025-11-14 15:42:13,364 - INFO - Going to convert document batch...
2025-11-14 15:42:13,366 - INFO - Processing document 4_2025-01-17
2025-11-14 15:42:13,410 - INFO - Finished converting document 4_2025-01-17 in 0.12 sec.
2025-11-14 15:42:13,502 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:13,525 - INFO - Going to convert document batch...
2025-11-14 15:42:13,526 - INFO - Processing document 4_2025-02-20
2025-11-14 15:42:13,561 - INFO - Finished converting document 4_2025-02-20 in 0.11 sec.


Converted 'data\edgar_documents\BA\4_2025-01-17' --> 'data\processed_data\BA\4_2025-01-17.md'
Converted 'data\edgar_documents\BA\4_2025-02-20' --> 'data\processed_data\BA\4_2025-02-20.md'


2025-11-14 15:42:13,637 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:13,669 - INFO - Going to convert document batch...
2025-11-14 15:42:13,670 - INFO - Processing document 4_2025-02-21
2025-11-14 15:42:13,711 - INFO - Finished converting document 4_2025-02-21 in 0.11 sec.
2025-11-14 15:42:13,772 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:13,789 - INFO - Going to convert document batch...
2025-11-14 15:42:13,792 - INFO - Processing document 4_2025-02-26
2025-11-14 15:42:13,871 - INFO - Finished converting document 4_2025-02-26 in 0.12 sec.


Converted 'data\edgar_documents\BA\4_2025-02-21' --> 'data\processed_data\BA\4_2025-02-21.md'
Converted 'data\edgar_documents\BA\4_2025-02-26' --> 'data\processed_data\BA\4_2025-02-26.md'


2025-11-14 15:42:14,065 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:14,098 - INFO - Going to convert document batch...
2025-11-14 15:42:14,101 - INFO - Processing document 4_2025-02-28
2025-11-14 15:42:14,188 - INFO - Finished converting document 4_2025-02-28 in 0.25 sec.
2025-11-14 15:42:14,284 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:14,317 - INFO - Going to convert document batch...
2025-11-14 15:42:14,319 - INFO - Processing document 4_2025-03-11
2025-11-14 15:42:14,388 - INFO - Finished converting document 4_2025-03-11 in 0.12 sec.


Converted 'data\edgar_documents\BA\4_2025-02-28' --> 'data\processed_data\BA\4_2025-02-28.md'


2025-11-14 15:42:14,515 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\4_2025-03-11' --> 'data\processed_data\BA\4_2025-03-11.md'


2025-11-14 15:42:15,635 - INFO - Going to convert document batch...
2025-11-14 15:42:15,637 - INFO - Processing document 4_2025-04-03
2025-11-14 15:42:15,696 - INFO - Finished converting document 4_2025-04-03 in 1.23 sec.
2025-11-14 15:42:15,776 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:15,793 - INFO - Going to convert document batch...
2025-11-14 15:42:15,794 - INFO - Processing document 4_2025-05-05
2025-11-14 15:42:15,831 - INFO - Finished converting document 4_2025-05-05 in 0.09 sec.


Converted 'data\edgar_documents\BA\4_2025-04-03' --> 'data\processed_data\BA\4_2025-04-03.md'
Converted 'data\edgar_documents\BA\4_2025-05-05' --> 'data\processed_data\BA\4_2025-05-05.md'


2025-11-14 15:42:15,976 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:16,026 - INFO - Going to convert document batch...
2025-11-14 15:42:16,027 - INFO - Processing document 4_2025-05-08
2025-11-14 15:42:16,089 - INFO - Finished converting document 4_2025-05-08 in 0.24 sec.
2025-11-14 15:42:16,172 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:16,202 - INFO - Going to convert document batch...
2025-11-14 15:42:16,204 - INFO - Processing document 4_2025-05-15
2025-11-14 15:42:16,245 - INFO - Finished converting document 4_2025-05-15 in 0.09 sec.
2025-11-14 15:42:16,305 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:16,325 - INFO - Going to convert document batch...
2025-11-14 15:42:16,326 - INFO - Processing document 4_2025-05-19
2025-11-14 15:42:16,361 - INFO - Finished converting document 4_2025-05-19 in 0.08 sec.


Converted 'data\edgar_documents\BA\4_2025-05-08' --> 'data\processed_data\BA\4_2025-05-08.md'
Converted 'data\edgar_documents\BA\4_2025-05-15' --> 'data\processed_data\BA\4_2025-05-15.md'


2025-11-14 15:42:16,412 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:16,427 - INFO - Going to convert document batch...
2025-11-14 15:42:16,429 - INFO - Processing document 4_2025-07-03
2025-11-14 15:42:16,485 - INFO - Finished converting document 4_2025-07-03 in 0.09 sec.


Converted 'data\edgar_documents\BA\4_2025-05-19' --> 'data\processed_data\BA\4_2025-05-19.md'


2025-11-14 15:42:16,677 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:16,714 - INFO - Going to convert document batch...
2025-11-14 15:42:16,716 - INFO - Processing document 4_2025-07-31
2025-11-14 15:42:16,792 - INFO - Finished converting document 4_2025-07-31 in 0.14 sec.


Converted 'data\edgar_documents\BA\4_2025-07-03' --> 'data\processed_data\BA\4_2025-07-03.md'


2025-11-14 15:42:16,911 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:16,956 - INFO - Going to convert document batch...
2025-11-14 15:42:16,959 - INFO - Processing document 4_2025-08-12
2025-11-14 15:42:17,019 - INFO - Finished converting document 4_2025-08-12 in 0.14 sec.


Converted 'data\edgar_documents\BA\4_2025-07-31' --> 'data\processed_data\BA\4_2025-07-31.md'
Converted 'data\edgar_documents\BA\4_2025-08-12' --> 'data\processed_data\BA\4_2025-08-12.md'


2025-11-14 15:42:17,090 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:17,109 - INFO - Going to convert document batch...
2025-11-14 15:42:17,110 - INFO - Processing document 4_2025-08-19
2025-11-14 15:42:17,151 - INFO - Finished converting document 4_2025-08-19 in 0.09 sec.
2025-11-14 15:42:17,233 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:17,266 - INFO - Going to convert document batch...
2025-11-14 15:42:17,268 - INFO - Processing document 4_2025-08-21
2025-11-14 15:42:17,318 - INFO - Finished converting document 4_2025-08-21 in 0.11 sec.
2025-11-14 15:42:17,387 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\4_2025-08-19' --> 'data\processed_data\BA\4_2025-08-19.md'
Converted 'data\edgar_documents\BA\4_2025-08-21' --> 'data\processed_data\BA\4_2025-08-21.md'


2025-11-14 15:42:17,416 - INFO - Going to convert document batch...
2025-11-14 15:42:17,417 - INFO - Processing document 4_2025-09-03
2025-11-14 15:42:17,480 - INFO - Finished converting document 4_2025-09-03 in 0.14 sec.
2025-11-14 15:42:17,596 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:17,629 - INFO - Going to convert document batch...
2025-11-14 15:42:17,631 - INFO - Processing document 4_2025-10-03
2025-11-14 15:42:17,694 - INFO - Finished converting document 4_2025-10-03 in 0.12 sec.


Converted 'data\edgar_documents\BA\4_2025-09-03' --> 'data\processed_data\BA\4_2025-09-03.md'
Converted 'data\edgar_documents\BA\4_2025-10-03' --> 'data\processed_data\BA\4_2025-10-03.md'


2025-11-14 15:42:17,800 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:17,834 - INFO - Going to convert document batch...
2025-11-14 15:42:17,835 - INFO - Processing document 4_2025-11-10
2025-11-14 15:42:17,882 - INFO - Finished converting document 4_2025-11-10 in 0.12 sec.
2025-11-14 15:42:17,978 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:18,014 - INFO - Going to convert document batch...
2025-11-14 15:42:18,016 - INFO - Processing document 8-K_2023-01-25
2025-11-14 15:42:18,049 - INFO - Finished converting document 8-K_2023-01-25 in 0.11 sec.
2025-11-14 15:42:18,098 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\4_2025-11-10' --> 'data\processed_data\BA\4_2025-11-10.md'
Converted 'data\edgar_documents\BA\8-K_2023-01-25' --> 'data\processed_data\BA\8-K_2023-01-25.md'


2025-11-14 15:42:18,120 - INFO - Going to convert document batch...
2025-11-14 15:42:18,122 - INFO - Processing document 8-K_2023-02-17
2025-11-14 15:42:18,164 - INFO - Finished converting document 8-K_2023-02-17 in 0.09 sec.
2025-11-14 15:42:18,228 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:18,268 - INFO - Going to convert document batch...
2025-11-14 15:42:18,269 - INFO - Processing document 8-K_2023-03-15
2025-11-14 15:42:18,328 - INFO - Finished converting document 8-K_2023-03-15 in 0.14 sec.


Converted 'data\edgar_documents\BA\8-K_2023-02-17' --> 'data\processed_data\BA\8-K_2023-02-17.md'
Converted 'data\edgar_documents\BA\8-K_2023-03-15' --> 'data\processed_data\BA\8-K_2023-03-15.md'


2025-11-14 15:42:18,402 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:18,441 - INFO - Going to convert document batch...
2025-11-14 15:42:18,444 - INFO - Processing document 8-K_2023-04-11
2025-11-14 15:42:18,524 - INFO - Finished converting document 8-K_2023-04-11 in 0.16 sec.
2025-11-14 15:42:18,592 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:18,645 - INFO - Going to convert document batch...
2025-11-14 15:42:18,647 - INFO - Processing document 8-K_2023-04-19
2025-11-14 15:42:18,742 - INFO - Finished converting document 8-K_2023-04-19 in 0.19 sec.


Converted 'data\edgar_documents\BA\8-K_2023-04-11' --> 'data\processed_data\BA\8-K_2023-04-11.md'


2025-11-14 15:42:18,863 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:18,911 - INFO - Going to convert document batch...
2025-11-14 15:42:18,914 - INFO - Processing document 8-K_2023-04-26
2025-11-14 15:42:18,989 - INFO - Finished converting document 8-K_2023-04-26 in 0.16 sec.


Converted 'data\edgar_documents\BA\8-K_2023-04-19' --> 'data\processed_data\BA\8-K_2023-04-19.md'


2025-11-14 15:42:19,064 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:19,120 - INFO - Going to convert document batch...
2025-11-14 15:42:19,125 - INFO - Processing document 8-K_2023-07-26
2025-11-14 15:42:19,180 - INFO - Finished converting document 8-K_2023-07-26 in 0.14 sec.


Converted 'data\edgar_documents\BA\8-K_2023-04-26' --> 'data\processed_data\BA\8-K_2023-04-26.md'
Converted 'data\edgar_documents\BA\8-K_2023-07-26' --> 'data\processed_data\BA\8-K_2023-07-26.md'


2025-11-14 15:42:19,248 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:19,299 - INFO - Going to convert document batch...
2025-11-14 15:42:19,302 - INFO - Processing document 8-K_2023-08-24
2025-11-14 15:42:19,365 - INFO - Finished converting document 8-K_2023-08-24 in 0.16 sec.
2025-11-14 15:42:19,421 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:19,470 - INFO - Going to convert document batch...
2025-11-14 15:42:19,471 - INFO - Processing document 8-K_2023-09-05
2025-11-14 15:42:19,559 - INFO - Finished converting document 8-K_2023-09-05 in 0.16 sec.


Converted 'data\edgar_documents\BA\8-K_2023-08-24' --> 'data\processed_data\BA\8-K_2023-08-24.md'


2025-11-14 15:42:19,622 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:19,667 - INFO - Going to convert document batch...
2025-11-14 15:42:19,669 - INFO - Processing document 8-K_2023-09-22
2025-11-14 15:42:19,713 - INFO - Finished converting document 8-K_2023-09-22 in 0.12 sec.
2025-11-14 15:42:19,770 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\8-K_2023-09-05' --> 'data\processed_data\BA\8-K_2023-09-05.md'
Converted 'data\edgar_documents\BA\8-K_2023-09-22' --> 'data\processed_data\BA\8-K_2023-09-22.md'


2025-11-14 15:42:19,811 - INFO - Going to convert document batch...
2025-11-14 15:42:19,812 - INFO - Processing document 8-K_2023-10-25
2025-11-14 15:42:19,847 - INFO - Finished converting document 8-K_2023-10-25 in 0.11 sec.
2025-11-14 15:42:19,891 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:19,929 - INFO - Going to convert document batch...
2025-11-14 15:42:19,935 - INFO - Processing document 8-K_2023-12-11
2025-11-14 15:42:19,999 - INFO - Finished converting document 8-K_2023-12-11 in 0.12 sec.


Converted 'data\edgar_documents\BA\8-K_2023-10-25' --> 'data\processed_data\BA\8-K_2023-10-25.md'
Converted 'data\edgar_documents\BA\8-K_2023-12-11' --> 'data\processed_data\BA\8-K_2023-12-11.md'


2025-11-14 15:42:20,068 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:20,106 - INFO - Going to convert document batch...
2025-11-14 15:42:20,108 - INFO - Processing document 8-K_2024-01-31
2025-11-14 15:42:20,182 - INFO - Finished converting document 8-K_2024-01-31 in 0.16 sec.
2025-11-14 15:42:20,235 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:20,253 - INFO - Going to convert document batch...
2025-11-14 15:42:20,256 - INFO - Processing document 8-K_2024-03-25
2025-11-14 15:42:20,320 - INFO - Finished converting document 8-K_2024-03-25 in 0.09 sec.
2025-11-14 15:42:20,392 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\8-K_2024-01-31' --> 'data\processed_data\BA\8-K_2024-01-31.md'
Converted 'data\edgar_documents\BA\8-K_2024-03-25' --> 'data\processed_data\BA\8-K_2024-03-25.md'


2025-11-14 15:42:20,427 - INFO - Going to convert document batch...
2025-11-14 15:42:20,429 - INFO - Processing document 8-K_2024-04-24
2025-11-14 15:42:20,515 - INFO - Finished converting document 8-K_2024-04-24 in 0.16 sec.
2025-11-14 15:42:20,590 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:20,617 - INFO - Going to convert document batch...
2025-11-14 15:42:20,619 - INFO - Processing document 8-K_2024-05-03
2025-11-14 15:42:20,701 - INFO - Finished converting document 8-K_2024-05-03 in 0.14 sec.


Converted 'data\edgar_documents\BA\8-K_2024-04-24' --> 'data\processed_data\BA\8-K_2024-04-24.md'
Converted 'data\edgar_documents\BA\8-K_2024-05-03' --> 'data\processed_data\BA\8-K_2024-05-03.md'


2025-11-14 15:42:20,785 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:20,828 - INFO - Going to convert document batch...
2025-11-14 15:42:20,830 - INFO - Processing document 8-K_2024-05-17
2025-11-14 15:42:20,877 - INFO - Finished converting document 8-K_2024-05-17 in 0.14 sec.
2025-11-14 15:42:20,937 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:20,963 - INFO - Going to convert document batch...
2025-11-14 15:42:20,964 - INFO - Processing document 8-K_2024-07-01
2025-11-14 15:42:21,059 - INFO - Finished converting document 8-K_2024-07-01 in 0.16 sec.


Converted 'data\edgar_documents\BA\8-K_2024-05-17' --> 'data\processed_data\BA\8-K_2024-05-17.md'
Converted 'data\edgar_documents\BA\8-K_2024-07-01' --> 'data\processed_data\BA\8-K_2024-07-01.md'


2025-11-14 15:42:21,137 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:21,184 - INFO - Going to convert document batch...
2025-11-14 15:42:21,186 - INFO - Processing document 8-K_2024-07-31
2025-11-14 15:42:21,256 - INFO - Finished converting document 8-K_2024-07-31 in 0.16 sec.
2025-11-14 15:42:21,328 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:21,350 - INFO - Going to convert document batch...
2025-11-14 15:42:21,353 - INFO - Processing document 8-K_2024-09-13
2025-11-14 15:42:21,401 - INFO - Finished converting document 8-K_2024-09-13 in 0.11 sec.
2025-11-14 15:42:21,469 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\8-K_2024-07-31' --> 'data\processed_data\BA\8-K_2024-07-31.md'
Converted 'data\edgar_documents\BA\8-K_2024-09-13' --> 'data\processed_data\BA\8-K_2024-09-13.md'


2025-11-14 15:42:21,522 - INFO - Going to convert document batch...
2025-11-14 15:42:21,524 - INFO - Processing document 8-K_2024-09-20
2025-11-14 15:42:21,555 - INFO - Finished converting document 8-K_2024-09-20 in 0.12 sec.
2025-11-14 15:42:21,584 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:21,601 - INFO - Going to convert document batch...
2025-11-14 15:42:21,602 - INFO - Processing document 8-K_2024-10-11
2025-11-14 15:42:21,634 - INFO - Finished converting document 8-K_2024-10-11 in 0.06 sec.
2025-11-14 15:42:21,677 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:21,694 - INFO - Going to convert document batch...
2025-11-14 15:42:21,696 - INFO - Processing document 8-K_2024-10-15
2025-11-14 15:42:21,730 - INFO - Finished converting document 8-K_2024-10-15 in 0.08 sec.


Converted 'data\edgar_documents\BA\8-K_2024-09-20' --> 'data\processed_data\BA\8-K_2024-09-20.md'
Converted 'data\edgar_documents\BA\8-K_2024-10-11' --> 'data\processed_data\BA\8-K_2024-10-11.md'
Converted 'data\edgar_documents\BA\8-K_2024-10-15' --> 'data\processed_data\BA\8-K_2024-10-15.md'


2025-11-14 15:42:21,786 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:21,805 - INFO - Going to convert document batch...
2025-11-14 15:42:21,807 - INFO - Processing document 8-K_2024-10-23
2025-11-14 15:42:21,849 - INFO - Finished converting document 8-K_2024-10-23 in 0.09 sec.
2025-11-14 15:42:21,904 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:21,944 - INFO - Going to convert document batch...
2025-11-14 15:42:21,946 - INFO - Processing document 8-K_2024-10-30
2025-11-14 15:42:22,030 - INFO - Finished converting document 8-K_2024-10-30 in 0.17 sec.


Converted 'data\edgar_documents\BA\8-K_2024-10-23' --> 'data\processed_data\BA\8-K_2024-10-23.md'


2025-11-14 15:42:22,095 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:22,135 - INFO - Going to convert document batch...
2025-11-14 15:42:22,138 - INFO - Processing document 8-K_2024-10-31
2025-11-14 15:42:22,182 - INFO - Finished converting document 8-K_2024-10-31 in 0.12 sec.


Converted 'data\edgar_documents\BA\8-K_2024-10-30' --> 'data\processed_data\BA\8-K_2024-10-30.md'
Converted 'data\edgar_documents\BA\8-K_2024-10-31' --> 'data\processed_data\BA\8-K_2024-10-31.md'


2025-11-14 15:42:22,249 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:22,270 - INFO - Going to convert document batch...
2025-11-14 15:42:22,273 - INFO - Processing document 8-K_2024-11-18
2025-11-14 15:42:22,358 - INFO - Finished converting document 8-K_2024-11-18 in 0.16 sec.
2025-11-14 15:42:22,442 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:22,465 - INFO - Going to convert document batch...
2025-11-14 15:42:22,467 - INFO - Processing document 8-K_2025-01-23
2025-11-14 15:42:22,508 - INFO - Finished converting document 8-K_2025-01-23 in 0.08 sec.
2025-11-14 15:42:22,570 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:22,593 - INFO - Going to convert document batch...
2025-11-14 15:42:22,594 - INFO - Processing document 8-K_2025-01-28


Converted 'data\edgar_documents\BA\8-K_2024-11-18' --> 'data\processed_data\BA\8-K_2024-11-18.md'
Converted 'data\edgar_documents\BA\8-K_2025-01-23' --> 'data\processed_data\BA\8-K_2025-01-23.md'


2025-11-14 15:42:22,639 - INFO - Finished converting document 8-K_2025-01-28 in 0.11 sec.
2025-11-14 15:42:22,702 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:22,733 - INFO - Going to convert document batch...
2025-11-14 15:42:22,735 - INFO - Processing document 8-K_2025-02-25
2025-11-14 15:42:22,787 - INFO - Finished converting document 8-K_2025-02-25 in 0.12 sec.
2025-11-14 15:42:22,856 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BA\8-K_2025-01-28' --> 'data\processed_data\BA\8-K_2025-01-28.md'
Converted 'data\edgar_documents\BA\8-K_2025-02-25' --> 'data\processed_data\BA\8-K_2025-02-25.md'


2025-11-14 15:42:22,900 - INFO - Going to convert document batch...
2025-11-14 15:42:22,903 - INFO - Processing document 8-K_2025-04-23
2025-11-14 15:42:22,970 - INFO - Finished converting document 8-K_2025-04-23 in 0.16 sec.
2025-11-14 15:42:23,033 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:23,082 - INFO - Going to convert document batch...
2025-11-14 15:42:23,084 - INFO - Processing document 8-K_2025-04-24
2025-11-14 15:42:23,165 - INFO - Finished converting document 8-K_2025-04-24 in 0.14 sec.


Converted 'data\edgar_documents\BA\8-K_2025-04-23' --> 'data\processed_data\BA\8-K_2025-04-23.md'
Converted 'data\edgar_documents\BA\8-K_2025-04-24' --> 'data\processed_data\BA\8-K_2025-04-24.md'


2025-11-14 15:42:23,266 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:23,311 - INFO - Going to convert document batch...
2025-11-14 15:42:23,313 - INFO - Processing document 8-K_2025-06-04
2025-11-14 15:42:23,383 - INFO - Finished converting document 8-K_2025-06-04 in 0.16 sec.
2025-11-14 15:42:23,457 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:23,481 - INFO - Going to convert document batch...
2025-11-14 15:42:23,482 - INFO - Processing document 8-K_2025-07-03
2025-11-14 15:42:23,532 - INFO - Finished converting document 8-K_2025-07-03 in 0.12 sec.


Converted 'data\edgar_documents\BA\8-K_2025-06-04' --> 'data\processed_data\BA\8-K_2025-06-04.md'
Converted 'data\edgar_documents\BA\8-K_2025-07-03' --> 'data\processed_data\BA\8-K_2025-07-03.md'


2025-11-14 15:42:23,596 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:23,631 - INFO - Going to convert document batch...
2025-11-14 15:42:23,632 - INFO - Processing document 8-K_2025-07-29
2025-11-14 15:42:23,671 - INFO - Finished converting document 8-K_2025-07-29 in 0.12 sec.
2025-11-14 15:42:23,727 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:23,764 - INFO - Going to convert document batch...
2025-11-14 15:42:23,767 - INFO - Processing document 8-K_2025-08-28
2025-11-14 15:42:23,834 - INFO - Finished converting document 8-K_2025-08-28 in 0.14 sec.


Converted 'data\edgar_documents\BA\8-K_2025-07-29' --> 'data\processed_data\BA\8-K_2025-07-29.md'
Converted 'data\edgar_documents\BA\8-K_2025-08-28' --> 'data\processed_data\BA\8-K_2025-08-28.md'


2025-11-14 15:42:23,903 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:23,926 - INFO - Going to convert document batch...
2025-11-14 15:42:23,927 - INFO - Processing document 8-K_2025-10-29
2025-11-14 15:42:23,966 - INFO - Finished converting document 8-K_2025-10-29 in 0.11 sec.
2025-11-14 15:42:24,042 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:42:24,045 - ERROR - Input document DEF-14A_2023-03-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>

Converted 'data\edgar_documents\BA\8-K_2025-10-29' --> 'data\processed_data\BA\8-K_2025-10-29.md'
Error processing data\edgar_documents\BA\DEF-14A_2023-03-03: File format not allowed: data\edgar_documents\BA\DEF-14A_2023-03-03
Error processing data\edgar_documents\BA\DEF-14A_2024-04-05: File format not allowed: data\edgar_documents\BA\DEF-14A_2024-04-05
Error processing data\edgar_documents\BA\DEF-14A_2025-03-07: File format not allowed: data\edgar_documents\BA\DEF-14A_2025-03-07
Processed 97 new files. Errors: 9
Found 128 files to process in data\edgar_documents\BK


2025-11-14 15:42:24,229 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:26,024 - INFO - Going to convert document batch...
2025-11-14 15:42:26,025 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:42:26,026 - INFO - Processing document 10-K_2023-02-27
2025-11-14 15:42:27,243 - INFO - Finished converting document 10-K_2023-02-27 in 3.06 sec.
2025-11-14 15:42:27,686 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BK\10-K_2023-02-27' --> 'data\processed_data\BK\10-K_2023-02-27.md'


2025-11-14 15:42:29,455 - INFO - Going to convert document batch...
2025-11-14 15:42:29,458 - INFO - Processing document 10-K_2024-02-28
2025-11-14 15:42:30,683 - INFO - Finished converting document 10-K_2024-02-28 in 3.06 sec.
2025-11-14 15:42:31,093 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BK\10-K_2024-02-28' --> 'data\processed_data\BK\10-K_2024-02-28.md'


2025-11-14 15:42:32,229 - INFO - Going to convert document batch...
2025-11-14 15:42:32,231 - INFO - Processing document 10-K_2025-02-27
2025-11-14 15:42:33,382 - INFO - Finished converting document 10-K_2025-02-27 in 2.34 sec.


Converted 'data\edgar_documents\BK\10-K_2025-02-27' --> 'data\processed_data\BK\10-K_2025-02-27.md'


2025-11-14 15:42:33,954 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:42:40,259 - INFO - Going to convert document batch...
2025-11-14 15:42:40,261 - INFO - Processing document 10-Q_2023-05-05
2025-11-14 15:42:48,167 - INFO - Finished converting document 10-Q_2023-05-05 in 14.45 sec.
2025-11-14 15:42:49,353 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BK\10-Q_2023-05-05' --> 'data\processed_data\BK\10-Q_2023-05-05.md'


2025-11-14 15:42:51,900 - INFO - Going to convert document batch...
2025-11-14 15:42:51,900 - INFO - Processing document 10-Q_2023-08-04
2025-11-14 15:42:56,416 - INFO - Finished converting document 10-Q_2023-08-04 in 7.17 sec.
2025-11-14 15:42:57,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BK\10-Q_2023-08-04' --> 'data\processed_data\BK\10-Q_2023-08-04.md'


2025-11-14 15:43:00,216 - INFO - Going to convert document batch...
2025-11-14 15:43:00,217 - INFO - Processing document 10-Q_2023-11-03
2025-11-14 15:43:04,951 - INFO - Finished converting document 10-Q_2023-11-03 in 7.23 sec.
2025-11-14 15:43:07,308 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BK\10-Q_2023-11-03' --> 'data\processed_data\BK\10-Q_2023-11-03.md'


2025-11-14 15:43:09,139 - INFO - Going to convert document batch...
2025-11-14 15:43:09,140 - INFO - Processing document 10-Q_2024-05-03
2025-11-14 15:43:12,916 - INFO - Finished converting document 10-Q_2024-05-03 in 5.77 sec.
2025-11-14 15:43:14,268 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BK\10-Q_2024-05-03' --> 'data\processed_data\BK\10-Q_2024-05-03.md'


2025-11-14 15:43:16,606 - INFO - Going to convert document batch...
2025-11-14 15:43:16,607 - INFO - Processing document 10-Q_2024-08-02
2025-11-14 15:43:21,775 - INFO - Finished converting document 10-Q_2024-08-02 in 7.67 sec.
2025-11-14 15:43:23,278 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BK\10-Q_2024-08-02' --> 'data\processed_data\BK\10-Q_2024-08-02.md'


2025-11-14 15:43:25,725 - INFO - Going to convert document batch...
2025-11-14 15:43:25,726 - INFO - Processing document 10-Q_2024-11-01
2025-11-14 15:43:30,477 - INFO - Finished converting document 10-Q_2024-11-01 in 7.38 sec.


Converted 'data\edgar_documents\BK\10-Q_2024-11-01' --> 'data\processed_data\BK\10-Q_2024-11-01.md'


2025-11-14 15:43:32,017 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:34,189 - INFO - Going to convert document batch...
2025-11-14 15:43:34,190 - INFO - Processing document 10-Q_2025-05-02
2025-11-14 15:43:37,886 - INFO - Finished converting document 10-Q_2025-05-02 in 6.09 sec.
2025-11-14 15:43:39,228 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BK\10-Q_2025-05-02' --> 'data\processed_data\BK\10-Q_2025-05-02.md'


2025-11-14 15:43:41,569 - INFO - Going to convert document batch...
2025-11-14 15:43:41,571 - INFO - Processing document 10-Q_2025-08-01
2025-11-14 15:43:46,608 - INFO - Finished converting document 10-Q_2025-08-01 in 7.53 sec.
2025-11-14 15:43:48,050 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BK\10-Q_2025-08-01' --> 'data\processed_data\BK\10-Q_2025-08-01.md'


2025-11-14 15:43:50,486 - INFO - Going to convert document batch...
2025-11-14 15:43:50,487 - INFO - Processing document 10-Q_2025-10-31
2025-11-14 15:43:55,093 - INFO - Finished converting document 10-Q_2025-10-31 in 7.20 sec.
2025-11-14 15:43:56,434 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:56,450 - INFO - Going to convert document batch...
2025-11-14 15:43:56,451 - INFO - Processing document 4_2023-01-19
2025-11-14 15:43:56,470 - INFO - Finished converting document 4_2023-01-19 in 0.06 sec.
2025-11-14 15:43:56,538 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:56,548 - INFO - Going to convert document batch...
2025-11-14 15:43:56,549 - INFO - Processing document 4_2023-01-24
2025-11-14 15:43:56,569 - INFO - Finished converting document 4_2023-01-24 in 0.05 sec.
2025-11-14 15:43:56,601 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\BK\10-Q_2025-10-31' --> 'data\processed_data\BK\10-Q_2025-10-31.md'
Converted 'data\edgar_documents\BK\4_2023-01-19' --> 'data\processed_data\BK\4_2023-01-19.md'
Converted 'data\edgar_documents\BK\4_2023-01-24' --> 'data\processed_data\BK\4_2023-01-24.md'


2025-11-14 15:43:56,601 - ERROR - Input document 4_2023-01-26 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:43:56,602 - INFO - Going to convert document batch...
2025-11-14 15:43:56,613 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:56,622 - INFO - Going to convert document batch...
2025-11-14 15:43:56,623 - INFO - Processing document 4_2023-02-03
2025-11-14 15:43:56,641 - INFO - Finished converting document 4_2023-02-03 in 0.05 sec.
2025-11-14 15:43:56,670 - INFO - detec

Error processing data\edgar_documents\BK\4_2023-01-26: File format not allowed: data\edgar_documents\BK\4_2023-01-26
Converted 'data\edgar_documents\BK\4_2023-02-03' --> 'data\processed_data\BK\4_2023-02-03.md'
Converted 'data\edgar_documents\BK\4_2023-02-10' --> 'data\processed_data\BK\4_2023-02-10.md'
Converted 'data\edgar_documents\BK\4_2023-02-14' --> 'data\processed_data\BK\4_2023-02-14.md'


2025-11-14 15:43:56,800 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:56,809 - INFO - Going to convert document batch...
2025-11-14 15:43:56,810 - INFO - Processing document 4_2023-02-15
2025-11-14 15:43:56,830 - INFO - Finished converting document 4_2023-02-15 in 0.05 sec.
2025-11-14 15:43:56,879 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:56,890 - INFO - Going to convert document batch...
2025-11-14 15:43:56,891 - INFO - Processing document 4_2023-02-17
2025-11-14 15:43:56,910 - INFO - Finished converting document 4_2023-02-17 in 0.06 sec.
2025-11-14 15:43:56,941 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:56,948 - INFO - Going to convert document batch...
2025-11-14 15:43:56,949 - INFO - Processing document 4_2023-02-21
2025-11-14 15:43:56,964 - INFO - Finished converting document 4_2023-02-21 in 0.05 sec.
2025-11-14 15:43:56,995 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\BK\4_2023-02-15' --> 'data\processed_data\BK\4_2023-02-15.md'
Converted 'data\edgar_documents\BK\4_2023-02-17' --> 'data\processed_data\BK\4_2023-02-17.md'
Converted 'data\edgar_documents\BK\4_2023-02-21' --> 'data\processed_data\BK\4_2023-02-21.md'


2025-11-14 15:43:57,053 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:57,061 - INFO - Going to convert document batch...
2025-11-14 15:43:57,061 - INFO - Processing document 4_2023-03-03
2025-11-14 15:43:57,078 - INFO - Finished converting document 4_2023-03-03 in 0.03 sec.
2025-11-14 15:43:57,109 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:57,116 - INFO - Going to convert document batch...
2025-11-14 15:43:57,116 - INFO - Processing document 4_2023-03-10
2025-11-14 15:43:57,135 - INFO - Finished converting document 4_2023-03-10 in 0.03 sec.
2025-11-14 15:43:57,166 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:57,174 - INFO - Going to convert document batch...
2025-11-14 15:43:57,175 - INFO - Processing document 4_2023-04-05
2025-11-14 15:43:57,193 - INFO - Finished converting document 4_2023-04-05 in 0.03 sec.
2025-11-14 15:43:57,230 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\BK\4_2023-02-28' --> 'data\processed_data\BK\4_2023-02-28.md'
Converted 'data\edgar_documents\BK\4_2023-03-03' --> 'data\processed_data\BK\4_2023-03-03.md'
Converted 'data\edgar_documents\BK\4_2023-03-10' --> 'data\processed_data\BK\4_2023-03-10.md'
Converted 'data\edgar_documents\BK\4_2023-04-05' --> 'data\processed_data\BK\4_2023-04-05.md'


2025-11-14 15:43:57,231 - ERROR - Input document 4_2023-04-19 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:43:57,232 - INFO - Going to convert document batch...
2025-11-14 15:43:57,243 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:57,251 - INFO - Going to convert document batch...
2025-11-14 15:43:57,252 - INFO - Processing document 4_2023-04-21
2025-11-14 15:43:57,275 - INFO - Finished converting document 4_2023-04-21 in 0.03 sec.
2025-11-14 15:43:57,310 - INFO - detec

Error processing data\edgar_documents\BK\4_2023-04-19: File format not allowed: data\edgar_documents\BK\4_2023-04-19
Converted 'data\edgar_documents\BK\4_2023-04-21' --> 'data\processed_data\BK\4_2023-04-21.md'
Converted 'data\edgar_documents\BK\4_2023-07-06' --> 'data\processed_data\BK\4_2023-07-06.md'
Converted 'data\edgar_documents\BK\4_2023-07-21' --> 'data\processed_data\BK\4_2023-07-21.md'


2025-11-14 15:43:57,440 - INFO - Going to convert document batch...
2025-11-14 15:43:57,442 - INFO - Processing document 4_2023-08-01
2025-11-14 15:43:57,468 - INFO - Finished converting document 4_2023-08-01 in 0.05 sec.
2025-11-14 15:43:57,515 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:57,522 - INFO - Going to convert document batch...
2025-11-14 15:43:57,523 - INFO - Processing document 4_2023-08-07
2025-11-14 15:43:57,542 - INFO - Finished converting document 4_2023-08-07 in 0.05 sec.
2025-11-14 15:43:57,573 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:57,583 - INFO - Going to convert document batch...
2025-11-14 15:43:57,583 - INFO - Processing document 4_2023-08-14


Converted 'data\edgar_documents\BK\4_2023-08-01' --> 'data\processed_data\BK\4_2023-08-01.md'
Converted 'data\edgar_documents\BK\4_2023-08-07' --> 'data\processed_data\BK\4_2023-08-07.md'


2025-11-14 15:43:58,511 - INFO - Finished converting document 4_2023-08-14 in 0.95 sec.
2025-11-14 15:43:58,544 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:58,550 - INFO - Going to convert document batch...
2025-11-14 15:43:58,551 - INFO - Processing document 4_2023-10-04
2025-11-14 15:43:58,568 - INFO - Finished converting document 4_2023-10-04 in 0.03 sec.
2025-11-14 15:43:58,598 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:43:58,599 - ERROR - Input document 4_2023-10-18 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'js

Converted 'data\edgar_documents\BK\4_2023-08-14' --> 'data\processed_data\BK\4_2023-08-14.md'
Converted 'data\edgar_documents\BK\4_2023-10-04' --> 'data\processed_data\BK\4_2023-10-04.md'
Error processing data\edgar_documents\BK\4_2023-10-18: File format not allowed: data\edgar_documents\BK\4_2023-10-18
Error processing data\edgar_documents\BK\4_2023-10-19: File format not allowed: data\edgar_documents\BK\4_2023-10-19
Converted 'data\edgar_documents\BK\4_2024-01-17' --> 'data\processed_data\BK\4_2024-01-17.md'


2025-11-14 15:43:58,743 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:58,750 - INFO - Going to convert document batch...
2025-11-14 15:43:58,751 - INFO - Processing document 4_2024-02-05
2025-11-14 15:43:58,768 - INFO - Finished converting document 4_2024-02-05 in 0.03 sec.
2025-11-14 15:43:58,800 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:58,808 - INFO - Going to convert document batch...
2025-11-14 15:43:58,809 - INFO - Processing document 4_2024-02-09
2025-11-14 15:43:58,827 - INFO - Finished converting document 4_2024-02-09 in 0.05 sec.
2025-11-14 15:43:58,858 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:58,865 - INFO - Going to convert document batch...
2025-11-14 15:43:58,866 - INFO - Processing document 4_2024-02-12
2025-11-14 15:43:58,883 - INFO - Finished converting document 4_2024-02-12 in 0.03 sec.
2025-11-14 15:43:58,917 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BK\4_2024-02-02' --> 'data\processed_data\BK\4_2024-02-02.md'
Converted 'data\edgar_documents\BK\4_2024-02-05' --> 'data\processed_data\BK\4_2024-02-05.md'
Converted 'data\edgar_documents\BK\4_2024-02-09' --> 'data\processed_data\BK\4_2024-02-09.md'
Converted 'data\edgar_documents\BK\4_2024-02-12' --> 'data\processed_data\BK\4_2024-02-12.md'


2025-11-14 15:43:58,926 - INFO - Going to convert document batch...
2025-11-14 15:43:58,926 - INFO - Processing document 4_2024-02-13
2025-11-14 15:43:58,943 - INFO - Finished converting document 4_2024-02-13 in 0.03 sec.
2025-11-14 15:43:58,978 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:58,985 - INFO - Going to convert document batch...
2025-11-14 15:43:58,986 - INFO - Processing document 4_2024-02-20
2025-11-14 15:43:59,008 - INFO - Finished converting document 4_2024-02-20 in 0.03 sec.
2025-11-14 15:43:59,045 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:59,052 - INFO - Going to convert document batch...
2025-11-14 15:43:59,053 - INFO - Processing document 4_2024-02-27
2025-11-14 15:43:59,075 - INFO - Finished converting document 4_2024-02-27 in 0.05 sec.
2025-11-14 15:43:59,105 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:59,113 - INFO - Going to convert document batch...
2025-11-14 15:43:59,113 - 

Converted 'data\edgar_documents\BK\4_2024-02-13' --> 'data\processed_data\BK\4_2024-02-13.md'
Converted 'data\edgar_documents\BK\4_2024-02-20' --> 'data\processed_data\BK\4_2024-02-20.md'
Converted 'data\edgar_documents\BK\4_2024-02-27' --> 'data\processed_data\BK\4_2024-02-27.md'
Converted 'data\edgar_documents\BK\4_2024-03-01' --> 'data\processed_data\BK\4_2024-03-01.md'


2025-11-14 15:43:59,165 - ERROR - Input document 4_2024-03-07 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:43:59,166 - INFO - Going to convert document batch...
2025-11-14 15:43:59,179 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:43:59,179 - ERROR - Input document 4_2024-03-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\BK\4_2024-03-07: File format not allowed: data\edgar_documents\BK\4_2024-03-07
Error processing data\edgar_documents\BK\4_2024-03-08: File format not allowed: data\edgar_documents\BK\4_2024-03-08
Converted 'data\edgar_documents\BK\4_2024-04-03' --> 'data\processed_data\BK\4_2024-04-03.md'
Converted 'data\edgar_documents\BK\4_2024-04-19' --> 'data\processed_data\BK\4_2024-04-19.md'


2025-11-14 15:43:59,388 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:59,395 - INFO - Going to convert document batch...
2025-11-14 15:43:59,396 - INFO - Processing document 4_2024-04-23
2025-11-14 15:43:59,414 - INFO - Finished converting document 4_2024-04-23 in 0.03 sec.
2025-11-14 15:43:59,445 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:59,453 - INFO - Going to convert document batch...
2025-11-14 15:43:59,454 - INFO - Processing document 4_2024-05-09
2025-11-14 15:43:59,473 - INFO - Finished converting document 4_2024-05-09 in 0.03 sec.
2025-11-14 15:43:59,505 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:43:59,512 - INFO - Going to convert document batch...
2025-11-14 15:43:59,514 - INFO - Processing document 4_2024-07-03
2025-11-14 15:43:59,530 - INFO - Finished converting document 4_2024-07-03 in 0.03 sec.
2025-11-14 15:43:59,562 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\BK\4_2024-04-22' --> 'data\processed_data\BK\4_2024-04-22.md'
Converted 'data\edgar_documents\BK\4_2024-04-23' --> 'data\processed_data\BK\4_2024-04-23.md'
Converted 'data\edgar_documents\BK\4_2024-05-09' --> 'data\processed_data\BK\4_2024-05-09.md'
Converted 'data\edgar_documents\BK\4_2024-07-03' --> 'data\processed_data\BK\4_2024-07-03.md'


2025-11-14 15:43:59,563 - ERROR - Input document 4_2024-07-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:43:59,564 - INFO - Going to convert document batch...
2025-11-14 15:43:59,580 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:43:59,580 - ERROR - Input document 4_2024-07-17 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\BK\4_2024-07-15: File format not allowed: data\edgar_documents\BK\4_2024-07-15
Error processing data\edgar_documents\BK\4_2024-07-17: File format not allowed: data\edgar_documents\BK\4_2024-07-17
Converted 'data\edgar_documents\BK\4_2024-07-19' --> 'data\processed_data\BK\4_2024-07-19.md'
Converted 'data\edgar_documents\BK\4_2024-10-03' --> 'data\processed_data\BK\4_2024-10-03.md'


2025-11-14 15:43:59,749 - INFO - Processing document 4_2024-10-17
2025-11-14 15:43:59,767 - INFO - Finished converting document 4_2024-10-17 in 0.06 sec.
2025-11-14 15:43:59,801 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:43:59,802 - ERROR - Input document 4_2024-11-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:43:59,803 - INFO - Going to convert document batch...
2025-11-14 15:43:59,815 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-1

Converted 'data\edgar_documents\BK\4_2024-10-17' --> 'data\processed_data\BK\4_2024-10-17.md'
Error processing data\edgar_documents\BK\4_2024-11-13: File format not allowed: data\edgar_documents\BK\4_2024-11-13
Error processing data\edgar_documents\BK\4_2024-11-14: File format not allowed: data\edgar_documents\BK\4_2024-11-14
Error processing data\edgar_documents\BK\4_2024-12-10: File format not allowed: data\edgar_documents\BK\4_2024-12-10
Converted 'data\edgar_documents\BK\4_2025-02-05' --> 'data\processed_data\BK\4_2025-02-05.md'
Converted 'data\edgar_documents\BK\4_2025-02-19' --> 'data\processed_data\BK\4_2025-02-19.md'


2025-11-14 15:43:59,987 - INFO - Going to convert document batch...
2025-11-14 15:43:59,988 - INFO - Processing document 4_2025-02-28
2025-11-14 15:44:00,008 - INFO - Finished converting document 4_2025-02-28 in 0.03 sec.
2025-11-14 15:44:00,053 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:44:00,053 - ERROR - Input document 4_2025-03-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:44:00,055 - INFO - Going to convert document batch...
2025-11-14 15:44:00,067 - IN

Converted 'data\edgar_documents\BK\4_2025-02-28' --> 'data\processed_data\BK\4_2025-02-28.md'
Error processing data\edgar_documents\BK\4_2025-03-03: File format not allowed: data\edgar_documents\BK\4_2025-03-03
Converted 'data\edgar_documents\BK\4_2025-03-04' --> 'data\processed_data\BK\4_2025-03-04.md'
Error processing data\edgar_documents\BK\4_2025-03-05: File format not allowed: data\edgar_documents\BK\4_2025-03-05
Error processing data\edgar_documents\BK\4_2025-03-07: File format not allowed: data\edgar_documents\BK\4_2025-03-07
Error processing data\edgar_documents\BK\4_2025-03-11: File format not allowed: data\edgar_documents\BK\4_2025-03-11


2025-11-14 15:44:00,224 - INFO - Going to convert document batch...
2025-11-14 15:44:00,225 - INFO - Processing document 4_2025-04-02
2025-11-14 15:44:00,283 - INFO - Finished converting document 4_2025-04-02 in 0.08 sec.
2025-11-14 15:44:00,322 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:00,332 - INFO - Going to convert document batch...
2025-11-14 15:44:00,333 - INFO - Processing document 4_2025-04-16
2025-11-14 15:44:00,350 - INFO - Finished converting document 4_2025-04-16 in 0.03 sec.
2025-11-14 15:44:00,380 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:00,389 - INFO - Going to convert document batch...
2025-11-14 15:44:00,390 - INFO - Processing document 4_2025-04-23
2025-11-14 15:44:00,409 - INFO - Finished converting document 4_2025-04-23 in 0.05 sec.
2025-11-14 15:44:00,440 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:00,446 - INFO - Going to convert document batch...
2025-11-14 15:44:00,447 - 

Converted 'data\edgar_documents\BK\4_2025-04-02' --> 'data\processed_data\BK\4_2025-04-02.md'
Converted 'data\edgar_documents\BK\4_2025-04-16' --> 'data\processed_data\BK\4_2025-04-16.md'
Converted 'data\edgar_documents\BK\4_2025-04-23' --> 'data\processed_data\BK\4_2025-04-23.md'
Converted 'data\edgar_documents\BK\4_2025-05-01' --> 'data\processed_data\BK\4_2025-05-01.md'


2025-11-14 15:44:00,509 - ERROR - Input document 4_2025-06-04 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:44:00,511 - INFO - Going to convert document batch...
2025-11-14 15:44:00,526 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:00,535 - INFO - Going to convert document batch...
2025-11-14 15:44:00,537 - INFO - Processing document 4_2025-07-03
2025-11-14 15:44:00,555 - INFO - Finished converting document 4_2025-07-03 in 0.03 sec.
2025-11-14 15:44:00,585 - INFO - detec

Error processing data\edgar_documents\BK\4_2025-06-04: File format not allowed: data\edgar_documents\BK\4_2025-06-04
Converted 'data\edgar_documents\BK\4_2025-07-03' --> 'data\processed_data\BK\4_2025-07-03.md'
Converted 'data\edgar_documents\BK\4_2025-07-24' --> 'data\processed_data\BK\4_2025-07-24.md'
Error processing data\edgar_documents\BK\4_2025-09-03: File format not allowed: data\edgar_documents\BK\4_2025-09-03
Error processing data\edgar_documents\BK\4_2025-09-05: File format not allowed: data\edgar_documents\BK\4_2025-09-05


2025-11-14 15:44:00,708 - INFO - Processing document 4_2025-10-03
2025-11-14 15:44:00,725 - INFO - Finished converting document 4_2025-10-03 in 0.03 sec.
2025-11-14 15:44:00,757 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:00,765 - INFO - Going to convert document batch...
2025-11-14 15:44:00,765 - INFO - Processing document 4_2025-11-03
2025-11-14 15:44:00,783 - INFO - Finished converting document 4_2025-11-03 in 0.03 sec.
2025-11-14 15:44:00,813 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:00,819 - INFO - Going to convert document batch...
2025-11-14 15:44:00,820 - INFO - Processing document 4_2025-11-07
2025-11-14 15:44:00,839 - INFO - Finished converting document 4_2025-11-07 in 0.05 sec.
2025-11-14 15:44:00,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:00,885 - INFO - Going to convert document batch...
2025-11-14 15:44:00,886 - INFO - Processing document 8-K_2023-01-13
2025-11-14 15:44:00,907 - 

Converted 'data\edgar_documents\BK\4_2025-10-03' --> 'data\processed_data\BK\4_2025-10-03.md'
Converted 'data\edgar_documents\BK\4_2025-11-03' --> 'data\processed_data\BK\4_2025-11-03.md'
Converted 'data\edgar_documents\BK\4_2025-11-07' --> 'data\processed_data\BK\4_2025-11-07.md'
Converted 'data\edgar_documents\BK\8-K_2023-01-13' --> 'data\processed_data\BK\8-K_2023-01-13.md'


2025-11-14 15:44:00,946 - INFO - Going to convert document batch...
2025-11-14 15:44:00,947 - INFO - Processing document 8-K_2023-01-31
2025-11-14 15:44:00,966 - INFO - Finished converting document 8-K_2023-01-31 in 0.05 sec.
2025-11-14 15:44:00,990 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:01,011 - INFO - Going to convert document batch...
2025-11-14 15:44:01,011 - INFO - Processing document 8-K_2023-04-12
2025-11-14 15:44:01,038 - INFO - Finished converting document 8-K_2023-04-12 in 0.06 sec.
2025-11-14 15:44:01,064 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:01,078 - INFO - Going to convert document batch...
2025-11-14 15:44:01,080 - INFO - Processing document 8-K_2023-04-18
2025-11-14 15:44:01,098 - INFO - Finished converting document 8-K_2023-04-18 in 0.05 sec.
2025-11-14 15:44:01,148 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:01,164 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BK\8-K_2023-01-31' --> 'data\processed_data\BK\8-K_2023-01-31.md'
Converted 'data\edgar_documents\BK\8-K_2023-04-12' --> 'data\processed_data\BK\8-K_2023-04-12.md'
Converted 'data\edgar_documents\BK\8-K_2023-04-18' --> 'data\processed_data\BK\8-K_2023-04-18.md'


2025-11-14 15:44:01,164 - INFO - Processing document 8-K_2023-04-26
2025-11-14 15:44:01,182 - INFO - Finished converting document 8-K_2023-04-26 in 0.08 sec.
2025-11-14 15:44:01,207 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:01,215 - INFO - Going to convert document batch...
2025-11-14 15:44:01,216 - INFO - Processing document 8-K_2023-05-24
2025-11-14 15:44:01,233 - INFO - Finished converting document 8-K_2023-05-24 in 0.05 sec.
2025-11-14 15:44:01,256 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:01,264 - INFO - Going to convert document batch...
2025-11-14 15:44:01,265 - INFO - Processing document 8-K_2023-06-30
2025-11-14 15:44:01,277 - INFO - Finished converting document 8-K_2023-06-30 in 0.05 sec.
2025-11-14 15:44:01,299 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:01,311 - INFO - Going to convert document batch...
2025-11-14 15:44:01,312 - INFO - Processing document 8-K_2023-07-18
2025-11-14 15:

Converted 'data\edgar_documents\BK\8-K_2023-04-26' --> 'data\processed_data\BK\8-K_2023-04-26.md'
Converted 'data\edgar_documents\BK\8-K_2023-05-24' --> 'data\processed_data\BK\8-K_2023-05-24.md'
Converted 'data\edgar_documents\BK\8-K_2023-06-30' --> 'data\processed_data\BK\8-K_2023-06-30.md'
Converted 'data\edgar_documents\BK\8-K_2023-07-18' --> 'data\processed_data\BK\8-K_2023-07-18.md'


2025-11-14 15:44:01,375 - INFO - Processing document 8-K_2023-08-11
2025-11-14 15:44:01,399 - INFO - Finished converting document 8-K_2023-08-11 in 0.05 sec.
2025-11-14 15:44:01,426 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:01,436 - INFO - Going to convert document batch...
2025-11-14 15:44:01,437 - INFO - Processing document 8-K_2023-09-05
2025-11-14 15:44:01,456 - INFO - Finished converting document 8-K_2023-09-05 in 0.05 sec.
2025-11-14 15:44:01,480 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:01,490 - INFO - Going to convert document batch...
2025-11-14 15:44:01,491 - INFO - Processing document 8-K_2023-09-12
2025-11-14 15:44:01,510 - INFO - Finished converting document 8-K_2023-09-12 in 0.05 sec.
2025-11-14 15:44:01,533 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:01,548 - INFO - Going to convert document batch...
2025-11-14 15:44:01,549 - INFO - Processing document 8-K_2023-10-17
2025-11-14 15:

Converted 'data\edgar_documents\BK\8-K_2023-08-11' --> 'data\processed_data\BK\8-K_2023-08-11.md'
Converted 'data\edgar_documents\BK\8-K_2023-09-05' --> 'data\processed_data\BK\8-K_2023-09-05.md'
Converted 'data\edgar_documents\BK\8-K_2023-09-12' --> 'data\processed_data\BK\8-K_2023-09-12.md'
Converted 'data\edgar_documents\BK\8-K_2023-10-17' --> 'data\processed_data\BK\8-K_2023-10-17.md'


2025-11-14 15:44:01,606 - INFO - Going to convert document batch...
2025-11-14 15:44:01,607 - INFO - Processing document 8-K_2023-10-25
2025-11-14 15:44:01,627 - INFO - Finished converting document 8-K_2023-10-25 in 0.05 sec.
2025-11-14 15:44:01,650 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:01,659 - INFO - Going to convert document batch...
2025-11-14 15:44:01,660 - INFO - Processing document 8-K_2023-11-17
2025-11-14 15:44:01,675 - INFO - Finished converting document 8-K_2023-11-17 in 0.03 sec.
2025-11-14 15:44:01,697 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:01,708 - INFO - Going to convert document batch...
2025-11-14 15:44:01,708 - INFO - Processing document 8-K_2023-12-21
2025-11-14 15:44:01,725 - INFO - Finished converting document 8-K_2023-12-21 in 0.03 sec.
2025-11-14 15:44:01,749 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:01,761 - INFO - Going to convert document batch...
2025-11-14 15:

Converted 'data\edgar_documents\BK\8-K_2023-10-25' --> 'data\processed_data\BK\8-K_2023-10-25.md'
Converted 'data\edgar_documents\BK\8-K_2023-11-17' --> 'data\processed_data\BK\8-K_2023-11-17.md'
Converted 'data\edgar_documents\BK\8-K_2023-12-21' --> 'data\processed_data\BK\8-K_2023-12-21.md'
Converted 'data\edgar_documents\BK\8-K_2024-01-12' --> 'data\processed_data\BK\8-K_2024-01-12.md'


2025-11-14 15:44:01,853 - INFO - Going to convert document batch...
2025-11-14 15:44:01,854 - INFO - Processing document 8-K_2024-03-05
2025-11-14 15:44:01,867 - INFO - Finished converting document 8-K_2024-03-05 in 0.06 sec.
2025-11-14 15:44:01,914 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:01,931 - INFO - Going to convert document batch...
2025-11-14 15:44:01,931 - INFO - Processing document 8-K_2024-03-14
2025-11-14 15:44:01,947 - INFO - Finished converting document 8-K_2024-03-14 in 0.06 sec.
2025-11-14 15:44:01,971 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:01,978 - INFO - Going to convert document batch...
2025-11-14 15:44:01,980 - INFO - Processing document 8-K_2024-03-26
2025-11-14 15:44:01,995 - INFO - Finished converting document 8-K_2024-03-26 in 0.05 sec.
2025-11-14 15:44:02,017 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:02,033 - INFO - Going to convert document batch...
2025-11-14 15:

Converted 'data\edgar_documents\BK\8-K_2024-03-05' --> 'data\processed_data\BK\8-K_2024-03-05.md'
Converted 'data\edgar_documents\BK\8-K_2024-03-14' --> 'data\processed_data\BK\8-K_2024-03-14.md'
Converted 'data\edgar_documents\BK\8-K_2024-03-26' --> 'data\processed_data\BK\8-K_2024-03-26.md'


2025-11-14 15:44:02,085 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:02,096 - INFO - Going to convert document batch...
2025-11-14 15:44:02,097 - INFO - Processing document 8-K_2024-04-16
2025-11-14 15:44:02,116 - INFO - Finished converting document 8-K_2024-04-16 in 0.05 sec.
2025-11-14 15:44:02,164 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:02,176 - INFO - Going to convert document batch...
2025-11-14 15:44:02,177 - INFO - Processing document 8-K_2024-06-18
2025-11-14 15:44:02,191 - INFO - Finished converting document 8-K_2024-06-18 in 0.06 sec.
2025-11-14 15:44:02,234 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:02,250 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BK\8-K_2024-04-10' --> 'data\processed_data\BK\8-K_2024-04-10.md'
Converted 'data\edgar_documents\BK\8-K_2024-04-16' --> 'data\processed_data\BK\8-K_2024-04-16.md'
Converted 'data\edgar_documents\BK\8-K_2024-06-18' --> 'data\processed_data\BK\8-K_2024-06-18.md'


2025-11-14 15:44:02,251 - INFO - Processing document 8-K_2024-06-28
2025-11-14 15:44:02,265 - INFO - Finished converting document 8-K_2024-06-28 in 0.06 sec.
2025-11-14 15:44:02,287 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:02,323 - INFO - Going to convert document batch...
2025-11-14 15:44:02,325 - INFO - Processing document 8-K_2024-07-12
2025-11-14 15:44:02,362 - INFO - Finished converting document 8-K_2024-07-12 in 0.09 sec.
2025-11-14 15:44:02,390 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:02,399 - INFO - Going to convert document batch...
2025-11-14 15:44:02,400 - INFO - Processing document 8-K_2024-07-22
2025-11-14 15:44:02,417 - INFO - Finished converting document 8-K_2024-07-22 in 0.05 sec.
2025-11-14 15:44:02,441 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:02,450 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BK\8-K_2024-06-28' --> 'data\processed_data\BK\8-K_2024-06-28.md'
Converted 'data\edgar_documents\BK\8-K_2024-07-12' --> 'data\processed_data\BK\8-K_2024-07-12.md'
Converted 'data\edgar_documents\BK\8-K_2024-07-22' --> 'data\processed_data\BK\8-K_2024-07-22.md'


2025-11-14 15:44:02,451 - INFO - Processing document 8-K_2024-10-11
2025-11-14 15:44:02,470 - INFO - Finished converting document 8-K_2024-10-11 in 0.05 sec.
2025-11-14 15:44:02,499 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:02,509 - INFO - Going to convert document batch...
2025-11-14 15:44:02,510 - INFO - Processing document 8-K_2024-11-20
2025-11-14 15:44:02,528 - INFO - Finished converting document 8-K_2024-11-20 in 0.05 sec.
2025-11-14 15:44:02,551 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:02,559 - INFO - Going to convert document batch...
2025-11-14 15:44:02,560 - INFO - Processing document 8-K_2024-12-05
2025-11-14 15:44:02,575 - INFO - Finished converting document 8-K_2024-12-05 in 0.05 sec.
2025-11-14 15:44:02,596 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:02,604 - INFO - Going to convert document batch...
2025-11-14 15:44:02,605 - INFO - Processing document 8-K_2025-01-08
2025-11-14 15:

Converted 'data\edgar_documents\BK\8-K_2024-10-11' --> 'data\processed_data\BK\8-K_2024-10-11.md'
Converted 'data\edgar_documents\BK\8-K_2024-11-20' --> 'data\processed_data\BK\8-K_2024-11-20.md'
Converted 'data\edgar_documents\BK\8-K_2024-12-05' --> 'data\processed_data\BK\8-K_2024-12-05.md'
Converted 'data\edgar_documents\BK\8-K_2025-01-08' --> 'data\processed_data\BK\8-K_2025-01-08.md'


2025-11-14 15:44:02,674 - INFO - Finished converting document 8-K_2025-01-15 in 0.05 sec.
2025-11-14 15:44:02,702 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:02,712 - INFO - Going to convert document batch...
2025-11-14 15:44:02,713 - INFO - Processing document 8-K_2025-02-11
2025-11-14 15:44:02,729 - INFO - Finished converting document 8-K_2025-02-11 in 0.05 sec.
2025-11-14 15:44:02,752 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:02,763 - INFO - Going to convert document batch...
2025-11-14 15:44:02,764 - INFO - Processing document 8-K_2025-03-03


Converted 'data\edgar_documents\BK\8-K_2025-01-15' --> 'data\processed_data\BK\8-K_2025-01-15.md'
Converted 'data\edgar_documents\BK\8-K_2025-02-11' --> 'data\processed_data\BK\8-K_2025-02-11.md'


2025-11-14 15:44:03,014 - INFO - Finished converting document 8-K_2025-03-03 in 0.28 sec.
2025-11-14 15:44:03,058 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:03,077 - INFO - Going to convert document batch...
2025-11-14 15:44:03,077 - INFO - Processing document 8-K_2025-03-10
2025-11-14 15:44:03,099 - INFO - Finished converting document 8-K_2025-03-10 in 0.08 sec.
2025-11-14 15:44:03,127 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:03,140 - INFO - Going to convert document batch...
2025-11-14 15:44:03,141 - INFO - Processing document 8-K_2025-03-14
2025-11-14 15:44:03,164 - INFO - Finished converting document 8-K_2025-03-14 in 0.05 sec.
2025-11-14 15:44:03,193 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:03,205 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BK\8-K_2025-03-03' --> 'data\processed_data\BK\8-K_2025-03-03.md'
Converted 'data\edgar_documents\BK\8-K_2025-03-10' --> 'data\processed_data\BK\8-K_2025-03-10.md'
Converted 'data\edgar_documents\BK\8-K_2025-03-14' --> 'data\processed_data\BK\8-K_2025-03-14.md'


2025-11-14 15:44:03,206 - INFO - Processing document 8-K_2025-04-11
2025-11-14 15:44:03,226 - INFO - Finished converting document 8-K_2025-04-11 in 0.05 sec.
2025-11-14 15:44:03,257 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:03,271 - INFO - Going to convert document batch...
2025-11-14 15:44:03,272 - INFO - Processing document 8-K_2025-04-16
2025-11-14 15:44:03,295 - INFO - Finished converting document 8-K_2025-04-16 in 0.06 sec.
2025-11-14 15:44:03,353 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:03,370 - INFO - Going to convert document batch...
2025-11-14 15:44:03,371 - INFO - Processing document 8-K_2025-06-10
2025-11-14 15:44:03,389 - INFO - Finished converting document 8-K_2025-06-10 in 0.08 sec.
2025-11-14 15:44:03,411 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:03,421 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BK\8-K_2025-04-11' --> 'data\processed_data\BK\8-K_2025-04-11.md'
Converted 'data\edgar_documents\BK\8-K_2025-04-16' --> 'data\processed_data\BK\8-K_2025-04-16.md'
Converted 'data\edgar_documents\BK\8-K_2025-06-10' --> 'data\processed_data\BK\8-K_2025-06-10.md'


2025-11-14 15:44:03,422 - INFO - Processing document 8-K_2025-06-12
2025-11-14 15:44:03,439 - INFO - Finished converting document 8-K_2025-06-12 in 0.05 sec.
2025-11-14 15:44:03,462 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:03,472 - INFO - Going to convert document batch...
2025-11-14 15:44:03,473 - INFO - Processing document 8-K_2025-07-01
2025-11-14 15:44:03,489 - INFO - Finished converting document 8-K_2025-07-01 in 0.03 sec.
2025-11-14 15:44:03,510 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:03,520 - INFO - Going to convert document batch...
2025-11-14 15:44:03,521 - INFO - Processing document 8-K_2025-07-15
2025-11-14 15:44:03,541 - INFO - Finished converting document 8-K_2025-07-15 in 0.03 sec.
2025-11-14 15:44:03,571 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:03,579 - INFO - Going to convert document batch...
2025-11-14 15:44:03,580 - INFO - Processing document 8-K_2025-09-03
2025-11-14 15:

Converted 'data\edgar_documents\BK\8-K_2025-06-12' --> 'data\processed_data\BK\8-K_2025-06-12.md'
Converted 'data\edgar_documents\BK\8-K_2025-07-01' --> 'data\processed_data\BK\8-K_2025-07-01.md'
Converted 'data\edgar_documents\BK\8-K_2025-07-15' --> 'data\processed_data\BK\8-K_2025-07-15.md'
Converted 'data\edgar_documents\BK\8-K_2025-09-03' --> 'data\processed_data\BK\8-K_2025-09-03.md'


2025-11-14 15:44:03,665 - INFO - Going to convert document batch...
2025-11-14 15:44:03,665 - INFO - Processing document 8-K_2025-09-10
2025-11-14 15:44:03,689 - INFO - Finished converting document 8-K_2025-09-10 in 0.08 sec.
2025-11-14 15:44:03,718 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:03,727 - INFO - Going to convert document batch...
2025-11-14 15:44:03,728 - INFO - Processing document 8-K_2025-09-11
2025-11-14 15:44:03,745 - INFO - Finished converting document 8-K_2025-09-11 in 0.05 sec.
2025-11-14 15:44:03,768 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:03,778 - INFO - Going to convert document batch...
2025-11-14 15:44:03,779 - INFO - Processing document 8-K_2025-09-23
2025-11-14 15:44:03,796 - INFO - Finished converting document 8-K_2025-09-23 in 0.05 sec.
2025-11-14 15:44:03,847 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:44:03,861 - INFO - Going to convert document batch...
2025-11-14 15:

Converted 'data\edgar_documents\BK\8-K_2025-09-10' --> 'data\processed_data\BK\8-K_2025-09-10.md'
Converted 'data\edgar_documents\BK\8-K_2025-09-11' --> 'data\processed_data\BK\8-K_2025-09-11.md'
Converted 'data\edgar_documents\BK\8-K_2025-09-23' --> 'data\processed_data\BK\8-K_2025-09-23.md'


2025-11-14 15:44:03,935 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:44:03,936 - ERROR - Input document DEF-14A_2023-03-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:44:03,939 - INFO - Going to convert document batch...
2025-11-14 15:44:03,975 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:44:03,976 - ERROR - Input document DEF-14A_2024-02-29 with format No

Converted 'data\edgar_documents\BK\8-K_2025-10-16' --> 'data\processed_data\BK\8-K_2025-10-16.md'
Error processing data\edgar_documents\BK\DEF-14A_2023-03-01: File format not allowed: data\edgar_documents\BK\DEF-14A_2023-03-01
Error processing data\edgar_documents\BK\DEF-14A_2024-02-29: File format not allowed: data\edgar_documents\BK\DEF-14A_2024-02-29
Error processing data\edgar_documents\BK\DEF-14A_2025-03-05: File format not allowed: data\edgar_documents\BK\DEF-14A_2025-03-05
Processed 107 new files. Errors: 21
Found 124 files to process in data\edgar_documents\BKNG


2025-11-14 15:44:04,854 - INFO - Going to convert document batch...
2025-11-14 15:44:04,855 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:44:04,855 - INFO - Processing document 10-K_2023-02-23
2025-11-14 15:44:06,848 - INFO - Finished converting document 10-K_2023-02-23 in 2.83 sec.
2025-11-14 15:44:07,443 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\10-K_2023-02-23' --> 'data\processed_data\BKNG\10-K_2023-02-23.md'


2025-11-14 15:44:08,267 - INFO - Going to convert document batch...
2025-11-14 15:44:08,268 - INFO - Processing document 10-K_2024-02-22
2025-11-14 15:44:13,205 - INFO - Finished converting document 10-K_2024-02-22 in 5.81 sec.
2025-11-14 15:44:15,032 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\10-K_2024-02-22' --> 'data\processed_data\BKNG\10-K_2024-02-22.md'


2025-11-14 15:44:16,945 - INFO - Going to convert document batch...
2025-11-14 15:44:16,947 - INFO - Processing document 10-K_2025-02-20
2025-11-14 15:44:23,699 - INFO - Finished converting document 10-K_2025-02-20 in 8.75 sec.
2025-11-14 15:44:25,581 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\10-K_2025-02-20' --> 'data\processed_data\BKNG\10-K_2025-02-20.md'


2025-11-14 15:44:27,159 - INFO - Going to convert document batch...
2025-11-14 15:44:27,160 - INFO - Processing document 10-Q_2023-05-04
2025-11-14 15:44:29,246 - INFO - Finished converting document 10-Q_2023-05-04 in 3.72 sec.
2025-11-14 15:44:30,712 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\10-Q_2023-05-04' --> 'data\processed_data\BKNG\10-Q_2023-05-04.md'


2025-11-14 15:44:33,177 - INFO - Going to convert document batch...
2025-11-14 15:44:33,181 - INFO - Processing document 10-Q_2023-08-03
2025-11-14 15:44:35,462 - INFO - Finished converting document 10-Q_2023-08-03 in 4.84 sec.
2025-11-14 15:44:36,879 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\10-Q_2023-08-03' --> 'data\processed_data\BKNG\10-Q_2023-08-03.md'


2025-11-14 15:44:38,390 - INFO - Going to convert document batch...
2025-11-14 15:44:38,392 - INFO - Processing document 10-Q_2023-11-02
2025-11-14 15:44:41,114 - INFO - Finished converting document 10-Q_2023-11-02 in 4.26 sec.
2025-11-14 15:44:42,289 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\10-Q_2023-11-02' --> 'data\processed_data\BKNG\10-Q_2023-11-02.md'


2025-11-14 15:44:44,063 - INFO - Going to convert document batch...
2025-11-14 15:44:44,064 - INFO - Processing document 10-Q_2024-05-02
2025-11-14 15:44:46,084 - INFO - Finished converting document 10-Q_2024-05-02 in 3.83 sec.
2025-11-14 15:44:47,313 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\10-Q_2024-05-02' --> 'data\processed_data\BKNG\10-Q_2024-05-02.md'


2025-11-14 15:44:49,403 - INFO - Going to convert document batch...
2025-11-14 15:44:49,406 - INFO - Processing document 10-Q_2024-08-01
2025-11-14 15:44:52,075 - INFO - Finished converting document 10-Q_2024-08-01 in 4.80 sec.
2025-11-14 15:44:53,342 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\10-Q_2024-08-01' --> 'data\processed_data\BKNG\10-Q_2024-08-01.md'


2025-11-14 15:44:54,532 - INFO - Going to convert document batch...
2025-11-14 15:44:54,534 - INFO - Processing document 10-Q_2024-10-30
2025-11-14 15:44:56,794 - INFO - Finished converting document 10-Q_2024-10-30 in 3.50 sec.
2025-11-14 15:44:57,993 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\10-Q_2024-10-30' --> 'data\processed_data\BKNG\10-Q_2024-10-30.md'


2025-11-14 15:44:59,994 - INFO - Going to convert document batch...
2025-11-14 15:44:59,996 - INFO - Processing document 10-Q_2025-04-29
2025-11-14 15:45:02,117 - INFO - Finished converting document 10-Q_2025-04-29 in 4.16 sec.
2025-11-14 15:45:03,240 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\10-Q_2025-04-29' --> 'data\processed_data\BKNG\10-Q_2025-04-29.md'


2025-11-14 15:45:04,655 - INFO - Going to convert document batch...
2025-11-14 15:45:04,657 - INFO - Processing document 10-Q_2025-07-29
2025-11-14 15:45:07,862 - INFO - Finished converting document 10-Q_2025-07-29 in 4.69 sec.
2025-11-14 15:45:09,229 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\10-Q_2025-07-29' --> 'data\processed_data\BKNG\10-Q_2025-07-29.md'


2025-11-14 15:45:10,508 - INFO - Going to convert document batch...
2025-11-14 15:45:10,510 - INFO - Processing document 10-Q_2025-10-28
2025-11-14 15:45:12,970 - INFO - Finished converting document 10-Q_2025-10-28 in 3.78 sec.
2025-11-14 15:45:14,233 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:14,294 - INFO - Going to convert document batch...
2025-11-14 15:45:14,296 - INFO - Processing document 4_2023-01-19
2025-11-14 15:45:14,416 - INFO - Finished converting document 4_2023-01-19 in 0.19 sec.


Converted 'data\edgar_documents\BKNG\10-Q_2025-10-28' --> 'data\processed_data\BKNG\10-Q_2025-10-28.md'


2025-11-14 15:45:14,555 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:14,577 - INFO - Going to convert document batch...
2025-11-14 15:45:14,585 - INFO - Processing document 4_2023-02-17
2025-11-14 15:45:14,637 - INFO - Finished converting document 4_2023-02-17 in 0.11 sec.
2025-11-14 15:45:14,719 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\4_2023-01-19' --> 'data\processed_data\BKNG\4_2023-01-19.md'
Converted 'data\edgar_documents\BKNG\4_2023-02-17' --> 'data\processed_data\BKNG\4_2023-02-17.md'


2025-11-14 15:45:14,749 - INFO - Going to convert document batch...
2025-11-14 15:45:14,750 - INFO - Processing document 4_2023-03-06
2025-11-14 15:45:14,826 - INFO - Finished converting document 4_2023-03-06 in 0.14 sec.
2025-11-14 15:45:14,899 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:14,918 - INFO - Going to convert document batch...
2025-11-14 15:45:14,919 - INFO - Processing document 4_2023-03-08
2025-11-14 15:45:14,953 - INFO - Finished converting document 4_2023-03-08 in 0.08 sec.
2025-11-14 15:45:15,042 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\4_2023-03-06' --> 'data\processed_data\BKNG\4_2023-03-06.md'
Converted 'data\edgar_documents\BKNG\4_2023-03-08' --> 'data\processed_data\BKNG\4_2023-03-08.md'


2025-11-14 15:45:15,067 - INFO - Going to convert document batch...
2025-11-14 15:45:15,070 - INFO - Processing document 4_2023-03-10
2025-11-14 15:45:15,132 - INFO - Finished converting document 4_2023-03-10 in 0.11 sec.
2025-11-14 15:45:15,182 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:15,200 - INFO - Going to convert document batch...
2025-11-14 15:45:15,202 - INFO - Processing document 4_2023-03-17
2025-11-14 15:45:15,259 - INFO - Finished converting document 4_2023-03-17 in 0.08 sec.


Converted 'data\edgar_documents\BKNG\4_2023-03-10' --> 'data\processed_data\BKNG\4_2023-03-10.md'
Converted 'data\edgar_documents\BKNG\4_2023-03-17' --> 'data\processed_data\BKNG\4_2023-03-17.md'


2025-11-14 15:45:15,357 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:15,388 - INFO - Going to convert document batch...
2025-11-14 15:45:15,390 - INFO - Processing document 4_2023-04-18
2025-11-14 15:45:15,428 - INFO - Finished converting document 4_2023-04-18 in 0.09 sec.
2025-11-14 15:45:15,502 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:15,520 - INFO - Going to convert document batch...
2025-11-14 15:45:15,521 - INFO - Processing document 4_2023-04-19
2025-11-14 15:45:15,565 - INFO - Finished converting document 4_2023-04-19 in 0.08 sec.
2025-11-14 15:45:15,628 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:15,647 - INFO - Going to convert document batch...
2025-11-14 15:45:15,648 - INFO - Processing document 4_2023-05-02


Converted 'data\edgar_documents\BKNG\4_2023-04-18' --> 'data\processed_data\BKNG\4_2023-04-18.md'
Converted 'data\edgar_documents\BKNG\4_2023-04-19' --> 'data\processed_data\BKNG\4_2023-04-19.md'


2025-11-14 15:45:15,683 - INFO - Finished converting document 4_2023-05-02 in 0.08 sec.
2025-11-14 15:45:15,773 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:45:15,773 - ERROR - Input document 4_2023-05-09 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:45:15,775 - INFO - Going to convert document batch...
2025-11-14 15:45:15,803 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:45:15,804 - ERROR - Input document 4_2023-05-10 with forma

Converted 'data\edgar_documents\BKNG\4_2023-05-02' --> 'data\processed_data\BKNG\4_2023-05-02.md'
Error processing data\edgar_documents\BKNG\4_2023-05-09: File format not allowed: data\edgar_documents\BKNG\4_2023-05-09
Error processing data\edgar_documents\BKNG\4_2023-05-10: File format not allowed: data\edgar_documents\BKNG\4_2023-05-10


2025-11-14 15:45:15,973 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:15,991 - INFO - Going to convert document batch...
2025-11-14 15:45:15,993 - INFO - Processing document 4_2023-05-31
2025-11-14 15:45:16,032 - INFO - Finished converting document 4_2023-05-31 in 0.08 sec.
2025-11-14 15:45:16,115 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\4_2023-05-16' --> 'data\processed_data\BKNG\4_2023-05-16.md'
Converted 'data\edgar_documents\BKNG\4_2023-05-31' --> 'data\processed_data\BKNG\4_2023-05-31.md'


2025-11-14 15:45:16,144 - INFO - Going to convert document batch...
2025-11-14 15:45:16,145 - INFO - Processing document 4_2023-06-16
2025-11-14 15:45:17,079 - INFO - Finished converting document 4_2023-06-16 in 0.98 sec.
2025-11-14 15:45:17,151 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:17,176 - INFO - Going to convert document batch...
2025-11-14 15:45:17,177 - INFO - Processing document 4_2023-07-18
2025-11-14 15:45:17,230 - INFO - Finished converting document 4_2023-07-18 in 0.11 sec.


Converted 'data\edgar_documents\BKNG\4_2023-06-16' --> 'data\processed_data\BKNG\4_2023-06-16.md'
Converted 'data\edgar_documents\BKNG\4_2023-07-18' --> 'data\processed_data\BKNG\4_2023-07-18.md'


2025-11-14 15:45:17,307 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:17,322 - INFO - Going to convert document batch...
2025-11-14 15:45:17,323 - INFO - Processing document 4_2023-08-09
2025-11-14 15:45:17,357 - INFO - Finished converting document 4_2023-08-09 in 0.08 sec.
2025-11-14 15:45:17,405 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:17,423 - INFO - Going to convert document batch...
2025-11-14 15:45:17,424 - INFO - Processing document 4_2023-08-10
2025-11-14 15:45:17,450 - INFO - Finished converting document 4_2023-08-10 in 0.06 sec.
2025-11-14 15:45:17,560 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\4_2023-08-09' --> 'data\processed_data\BKNG\4_2023-08-09.md'
Converted 'data\edgar_documents\BKNG\4_2023-08-10' --> 'data\processed_data\BKNG\4_2023-08-10.md'


2025-11-14 15:45:17,588 - INFO - Going to convert document batch...
2025-11-14 15:45:17,590 - INFO - Processing document 4_2023-08-14
2025-11-14 15:45:17,653 - INFO - Finished converting document 4_2023-08-14 in 0.12 sec.
2025-11-14 15:45:17,718 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:17,732 - INFO - Going to convert document batch...
2025-11-14 15:45:17,733 - INFO - Processing document 4_2023-08-16
2025-11-14 15:45:17,764 - INFO - Finished converting document 4_2023-08-16 in 0.06 sec.
2025-11-14 15:45:17,819 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:17,835 - INFO - Going to convert document batch...
2025-11-14 15:45:17,837 - INFO - Processing document 4_2023-08-28
2025-11-14 15:45:17,871 - INFO - Finished converting document 4_2023-08-28 in 0.08 sec.


Converted 'data\edgar_documents\BKNG\4_2023-08-14' --> 'data\processed_data\BKNG\4_2023-08-14.md'
Converted 'data\edgar_documents\BKNG\4_2023-08-16' --> 'data\processed_data\BKNG\4_2023-08-16.md'


2025-11-14 15:45:17,920 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:17,950 - INFO - Going to convert document batch...
2025-11-14 15:45:17,952 - INFO - Processing document 4_2023-09-01
2025-11-14 15:45:18,028 - INFO - Finished converting document 4_2023-09-01 in 0.12 sec.


Converted 'data\edgar_documents\BKNG\4_2023-08-28' --> 'data\processed_data\BKNG\4_2023-08-28.md'


2025-11-14 15:45:18,114 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:18,140 - INFO - Going to convert document batch...
2025-11-14 15:45:18,141 - INFO - Processing document 4_2023-09-12
2025-11-14 15:45:18,184 - INFO - Finished converting document 4_2023-09-12 in 0.09 sec.
2025-11-14 15:45:18,237 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:18,272 - INFO - Going to convert document batch...
2025-11-14 15:45:18,273 - INFO - Processing document 4_2023-09-18


Converted 'data\edgar_documents\BKNG\4_2023-09-01' --> 'data\processed_data\BKNG\4_2023-09-01.md'
Converted 'data\edgar_documents\BKNG\4_2023-09-12' --> 'data\processed_data\BKNG\4_2023-09-12.md'


2025-11-14 15:45:18,355 - INFO - Finished converting document 4_2023-09-18 in 0.14 sec.
2025-11-14 15:45:18,432 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:18,463 - INFO - Going to convert document batch...
2025-11-14 15:45:18,464 - INFO - Processing document 4_2023-10-17
2025-11-14 15:45:18,578 - INFO - Finished converting document 4_2023-10-17 in 0.16 sec.


Converted 'data\edgar_documents\BKNG\4_2023-09-18' --> 'data\processed_data\BKNG\4_2023-09-18.md'


2025-11-14 15:45:18,689 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:18,724 - INFO - Going to convert document batch...
2025-11-14 15:45:18,725 - INFO - Processing document 4_2023-11-13
2025-11-14 15:45:18,775 - INFO - Finished converting document 4_2023-11-13 in 0.09 sec.
2025-11-14 15:45:18,850 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:18,884 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BKNG\4_2023-10-17' --> 'data\processed_data\BKNG\4_2023-10-17.md'
Converted 'data\edgar_documents\BKNG\4_2023-11-13' --> 'data\processed_data\BKNG\4_2023-11-13.md'


2025-11-14 15:45:18,885 - INFO - Processing document 4_2023-11-16
2025-11-14 15:45:18,958 - INFO - Finished converting document 4_2023-11-16 in 0.12 sec.
2025-11-14 15:45:19,040 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:19,053 - INFO - Going to convert document batch...
2025-11-14 15:45:19,054 - INFO - Processing document 4_2023-12-12
2025-11-14 15:45:19,102 - INFO - Finished converting document 4_2023-12-12 in 0.08 sec.
2025-11-14 15:45:19,197 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\4_2023-11-16' --> 'data\processed_data\BKNG\4_2023-11-16.md'
Converted 'data\edgar_documents\BKNG\4_2023-12-12' --> 'data\processed_data\BKNG\4_2023-12-12.md'


2025-11-14 15:45:19,233 - INFO - Going to convert document batch...
2025-11-14 15:45:19,234 - INFO - Processing document 4_2023-12-18
2025-11-14 15:45:19,301 - INFO - Finished converting document 4_2023-12-18 in 0.12 sec.
2025-11-14 15:45:19,377 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:19,461 - INFO - Going to convert document batch...
2025-11-14 15:45:19,464 - INFO - Processing document 4_2024-01-17


Converted 'data\edgar_documents\BKNG\4_2023-12-18' --> 'data\processed_data\BKNG\4_2023-12-18.md'


2025-11-14 15:45:19,574 - INFO - Finished converting document 4_2024-01-17 in 0.23 sec.
2025-11-14 15:45:19,660 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:19,677 - INFO - Going to convert document batch...
2025-11-14 15:45:19,680 - INFO - Processing document 4_2024-02-08
2025-11-14 15:45:19,716 - INFO - Finished converting document 4_2024-02-08 in 0.08 sec.
2025-11-14 15:45:19,779 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\4_2024-01-17' --> 'data\processed_data\BKNG\4_2024-01-17.md'
Converted 'data\edgar_documents\BKNG\4_2024-02-08' --> 'data\processed_data\BKNG\4_2024-02-08.md'


2025-11-14 15:45:19,850 - INFO - Going to convert document batch...
2025-11-14 15:45:19,853 - INFO - Processing document 4_2024-02-16
2025-11-14 15:45:19,977 - INFO - Finished converting document 4_2024-02-16 in 0.22 sec.
2025-11-14 15:45:20,155 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:45:20,157 - ERROR - Input document 4_2024-02-27 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:45:20,162 - INFO - Going to convert document batch...
2025-11-14 15:45:20,225 - IN

Converted 'data\edgar_documents\BKNG\4_2024-02-16' --> 'data\processed_data\BKNG\4_2024-02-16.md'
Error processing data\edgar_documents\BKNG\4_2024-02-27: File format not allowed: data\edgar_documents\BKNG\4_2024-02-27
Error processing data\edgar_documents\BKNG\4_2024-02-28: File format not allowed: data\edgar_documents\BKNG\4_2024-02-28


2025-11-14 15:45:20,307 - INFO - Finished converting document 4_2024-03-05 in 0.08 sec.
2025-11-14 15:45:20,369 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:20,386 - INFO - Going to convert document batch...
2025-11-14 15:45:20,387 - INFO - Processing document 4_2024-03-08
2025-11-14 15:45:20,449 - INFO - Finished converting document 4_2024-03-08 in 0.11 sec.


Converted 'data\edgar_documents\BKNG\4_2024-03-05' --> 'data\processed_data\BKNG\4_2024-03-05.md'


2025-11-14 15:45:20,546 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:20,576 - INFO - Going to convert document batch...
2025-11-14 15:45:20,578 - INFO - Processing document 4_2024-03-18
2025-11-14 15:45:20,638 - INFO - Finished converting document 4_2024-03-18 in 0.11 sec.
2025-11-14 15:45:20,692 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\4_2024-03-08' --> 'data\processed_data\BKNG\4_2024-03-08.md'
Converted 'data\edgar_documents\BKNG\4_2024-03-18' --> 'data\processed_data\BKNG\4_2024-03-18.md'


2025-11-14 15:45:20,754 - INFO - Going to convert document batch...
2025-11-14 15:45:20,756 - INFO - Processing document 4_2024-04-16
2025-11-14 15:45:20,859 - INFO - Finished converting document 4_2024-04-16 in 0.19 sec.
2025-11-14 15:45:20,934 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:20,949 - INFO - Going to convert document batch...
2025-11-14 15:45:20,950 - INFO - Processing document 4_2024-05-03
2025-11-14 15:45:21,049 - INFO - Finished converting document 4_2024-05-03 in 0.12 sec.


Converted 'data\edgar_documents\BKNG\4_2024-04-16' --> 'data\processed_data\BKNG\4_2024-04-16.md'
Converted 'data\edgar_documents\BKNG\4_2024-05-03' --> 'data\processed_data\BKNG\4_2024-05-03.md'


2025-11-14 15:45:21,137 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:21,164 - INFO - Going to convert document batch...
2025-11-14 15:45:21,167 - INFO - Processing document 4_2024-05-09
2025-11-14 15:45:21,239 - INFO - Finished converting document 4_2024-05-09 in 0.12 sec.
2025-11-14 15:45:21,328 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:21,360 - INFO - Going to convert document batch...
2025-11-14 15:45:21,363 - INFO - Processing document 4_2024-05-13
2025-11-14 15:45:21,430 - INFO - Finished converting document 4_2024-05-13 in 0.11 sec.


Converted 'data\edgar_documents\BKNG\4_2024-05-09' --> 'data\processed_data\BKNG\4_2024-05-09.md'
Converted 'data\edgar_documents\BKNG\4_2024-05-13' --> 'data\processed_data\BKNG\4_2024-05-13.md'


2025-11-14 15:45:21,541 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:21,601 - INFO - Going to convert document batch...
2025-11-14 15:45:21,603 - INFO - Processing document 4_2024-05-16
2025-11-14 15:45:21,720 - INFO - Finished converting document 4_2024-05-16 in 0.20 sec.
2025-11-14 15:45:21,827 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:21,853 - INFO - Going to convert document batch...
2025-11-14 15:45:21,855 - INFO - Processing document 4_2024-05-31
2025-11-14 15:45:21,917 - INFO - Finished converting document 4_2024-05-31 in 0.11 sec.
2025-11-14 15:45:22,010 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\4_2024-05-16' --> 'data\processed_data\BKNG\4_2024-05-16.md'
Converted 'data\edgar_documents\BKNG\4_2024-05-31' --> 'data\processed_data\BKNG\4_2024-05-31.md'


2025-11-14 15:45:22,086 - INFO - Going to convert document batch...
2025-11-14 15:45:22,088 - INFO - Processing document 4_2024-06-18
2025-11-14 15:45:22,189 - INFO - Finished converting document 4_2024-06-18 in 0.22 sec.
2025-11-14 15:45:22,277 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:22,319 - INFO - Going to convert document batch...
2025-11-14 15:45:22,322 - INFO - Processing document 4_2024-07-16


Converted 'data\edgar_documents\BKNG\4_2024-06-18' --> 'data\processed_data\BKNG\4_2024-06-18.md'


2025-11-14 15:45:22,481 - INFO - Finished converting document 4_2024-07-16 in 0.23 sec.
2025-11-14 15:45:22,618 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:22,636 - INFO - Going to convert document batch...
2025-11-14 15:45:22,638 - INFO - Processing document 4_2024-08-13
2025-11-14 15:45:22,707 - INFO - Finished converting document 4_2024-08-13 in 0.11 sec.


Converted 'data\edgar_documents\BKNG\4_2024-07-16' --> 'data\processed_data\BKNG\4_2024-07-16.md'
Converted 'data\edgar_documents\BKNG\4_2024-08-13' --> 'data\processed_data\BKNG\4_2024-08-13.md'


2025-11-14 15:45:22,788 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:22,828 - INFO - Going to convert document batch...
2025-11-14 15:45:22,830 - INFO - Processing document 4_2024-08-16
2025-11-14 15:45:22,907 - INFO - Finished converting document 4_2024-08-16 in 0.14 sec.
2025-11-14 15:45:23,017 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:23,038 - INFO - Going to convert document batch...
2025-11-14 15:45:23,039 - INFO - Processing document 4_2024-08-28
2025-11-14 15:45:23,099 - INFO - Finished converting document 4_2024-08-28 in 0.11 sec.


Converted 'data\edgar_documents\BKNG\4_2024-08-16' --> 'data\processed_data\BKNG\4_2024-08-16.md'
Converted 'data\edgar_documents\BKNG\4_2024-08-28' --> 'data\processed_data\BKNG\4_2024-08-28.md'


2025-11-14 15:45:23,191 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:23,211 - INFO - Going to convert document batch...
2025-11-14 15:45:23,214 - INFO - Processing document 4_2024-11-13
2025-11-14 15:45:23,270 - INFO - Finished converting document 4_2024-11-13 in 0.11 sec.
2025-11-14 15:45:23,336 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:23,353 - INFO - Going to convert document batch...
2025-11-14 15:45:23,354 - INFO - Processing document 4_2024-11-15
2025-11-14 15:45:23,404 - INFO - Finished converting document 4_2024-11-15 in 0.09 sec.
2025-11-14 15:45:23,492 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:45:23,493 - ERROR - Input document 4_2024-11-18 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <Inp

Converted 'data\edgar_documents\BKNG\4_2024-11-13' --> 'data\processed_data\BKNG\4_2024-11-13.md'
Converted 'data\edgar_documents\BKNG\4_2024-11-15' --> 'data\processed_data\BKNG\4_2024-11-15.md'


2025-11-14 15:45:23,521 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:45:23,522 - ERROR - Input document 4_2024-11-19 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:45:23,524 - INFO - Going to convert document batch...
2025-11-14 15:45:23,538 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:23,566 - INFO - Going to convert document batch...
2025-11-14 15:45:23,568 - INFO - Processing document 4_2024-11-25
2025-11-14 15:45:23,619 - INFO - Fin

Error processing data\edgar_documents\BKNG\4_2024-11-18: File format not allowed: data\edgar_documents\BKNG\4_2024-11-18
Error processing data\edgar_documents\BKNG\4_2024-11-19: File format not allowed: data\edgar_documents\BKNG\4_2024-11-19
Converted 'data\edgar_documents\BKNG\4_2024-11-25' --> 'data\processed_data\BKNG\4_2024-11-25.md'


2025-11-14 15:45:23,688 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:23,714 - INFO - Going to convert document batch...
2025-11-14 15:45:23,716 - INFO - Processing document 4_2025-02-25
2025-11-14 15:45:23,787 - INFO - Finished converting document 4_2025-02-25 in 0.11 sec.
2025-11-14 15:45:23,869 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:23,890 - INFO - Going to convert document batch...
2025-11-14 15:45:23,891 - INFO - Processing document 4_2025-03-04
2025-11-14 15:45:23,984 - INFO - Finished converting document 4_2025-03-04 in 0.14 sec.


Converted 'data\edgar_documents\BKNG\4_2025-02-25' --> 'data\processed_data\BKNG\4_2025-02-25.md'
Converted 'data\edgar_documents\BKNG\4_2025-03-04' --> 'data\processed_data\BKNG\4_2025-03-04.md'


2025-11-14 15:45:24,084 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:24,122 - INFO - Going to convert document batch...
2025-11-14 15:45:24,124 - INFO - Processing document 4_2025-03-06
2025-11-14 15:45:24,180 - INFO - Finished converting document 4_2025-03-06 in 0.12 sec.
2025-11-14 15:45:24,234 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:24,250 - INFO - Going to convert document batch...
2025-11-14 15:45:24,252 - INFO - Processing document 4_2025-05-05
2025-11-14 15:45:24,286 - INFO - Finished converting document 4_2025-05-05 in 0.06 sec.
2025-11-14 15:45:24,380 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:45:24,381 - ERROR - Input document 4_2025-05-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <Inp

Converted 'data\edgar_documents\BKNG\4_2025-03-06' --> 'data\processed_data\BKNG\4_2025-03-06.md'
Converted 'data\edgar_documents\BKNG\4_2025-05-05' --> 'data\processed_data\BKNG\4_2025-05-05.md'
Error processing data\edgar_documents\BKNG\4_2025-05-06: File format not allowed: data\edgar_documents\BKNG\4_2025-05-06


2025-11-14 15:45:24,418 - ERROR - Input document 4_2025-05-07 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:45:24,421 - INFO - Going to convert document batch...
2025-11-14 15:45:24,439 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:24,485 - INFO - Going to convert document batch...
2025-11-14 15:45:24,487 - INFO - Processing document 4_2025-05-13
2025-11-14 15:45:24,550 - INFO - Finished converting document 4_2025-05-13 in 0.12 sec.
2025-11-14 15:45:24,619 - INFO - detec

Error processing data\edgar_documents\BKNG\4_2025-05-07: File format not allowed: data\edgar_documents\BKNG\4_2025-05-07
Converted 'data\edgar_documents\BKNG\4_2025-05-13' --> 'data\processed_data\BKNG\4_2025-05-13.md'


2025-11-14 15:45:24,688 - INFO - Going to convert document batch...
2025-11-14 15:45:24,691 - INFO - Processing document 4_2025-05-16
2025-11-14 15:45:24,893 - INFO - Finished converting document 4_2025-05-16 in 0.30 sec.
2025-11-14 15:45:25,072 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:25,107 - INFO - Going to convert document batch...
2025-11-14 15:45:25,109 - INFO - Processing document 4_2025-06-02
2025-11-14 15:45:25,171 - INFO - Finished converting document 4_2025-06-02 in 0.12 sec.
2025-11-14 15:45:25,246 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\4_2025-05-16' --> 'data\processed_data\BKNG\4_2025-05-16.md'
Converted 'data\edgar_documents\BKNG\4_2025-06-02' --> 'data\processed_data\BKNG\4_2025-06-02.md'


2025-11-14 15:45:25,283 - INFO - Going to convert document batch...
2025-11-14 15:45:25,284 - INFO - Processing document 4_2025-06-17
2025-11-14 15:45:25,385 - INFO - Finished converting document 4_2025-06-17 in 0.17 sec.
2025-11-14 15:45:25,525 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\4_2025-06-17' --> 'data\processed_data\BKNG\4_2025-06-17.md'


2025-11-14 15:45:26,301 - INFO - Going to convert document batch...
2025-11-14 15:45:26,303 - INFO - Processing document 4_2025-07-16
2025-11-14 15:45:26,392 - INFO - Finished converting document 4_2025-07-16 in 0.91 sec.
2025-11-14 15:45:26,507 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:26,534 - INFO - Going to convert document batch...
2025-11-14 15:45:26,536 - INFO - Processing document 4_2025-08-01
2025-11-14 15:45:26,601 - INFO - Finished converting document 4_2025-08-01 in 0.12 sec.
2025-11-14 15:45:26,661 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\4_2025-07-16' --> 'data\processed_data\BKNG\4_2025-07-16.md'
Converted 'data\edgar_documents\BKNG\4_2025-08-01' --> 'data\processed_data\BKNG\4_2025-08-01.md'


2025-11-14 15:45:26,722 - INFO - Going to convert document batch...
2025-11-14 15:45:26,724 - INFO - Processing document 4_2025-08-18
2025-11-14 15:45:26,843 - INFO - Finished converting document 4_2025-08-18 in 0.20 sec.
2025-11-14 15:45:26,923 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:27,021 - INFO - Going to convert document batch...
2025-11-14 15:45:27,022 - INFO - Processing document 4_2025-09-09


Converted 'data\edgar_documents\BKNG\4_2025-08-18' --> 'data\processed_data\BKNG\4_2025-08-18.md'


2025-11-14 15:45:27,180 - INFO - Finished converting document 4_2025-09-09 in 0.27 sec.
2025-11-14 15:45:27,313 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:27,390 - INFO - Going to convert document batch...
2025-11-14 15:45:27,393 - INFO - Processing document 4_2025-09-16


Converted 'data\edgar_documents\BKNG\4_2025-09-09' --> 'data\processed_data\BKNG\4_2025-09-09.md'


2025-11-14 15:45:27,590 - INFO - Finished converting document 4_2025-09-16 in 0.30 sec.
2025-11-14 15:45:27,750 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:27,805 - INFO - Going to convert document batch...
2025-11-14 15:45:27,809 - INFO - Processing document 4_2025-10-16


Converted 'data\edgar_documents\BKNG\4_2025-09-16' --> 'data\processed_data\BKNG\4_2025-09-16.md'


2025-11-14 15:45:27,923 - INFO - Finished converting document 4_2025-10-16 in 0.20 sec.
2025-11-14 15:45:28,065 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:45:28,067 - ERROR - Input document 4_2025-11-04 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:45:28,070 - INFO - Going to convert document batch...
2025-11-14 15:45:28,113 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:45:28,115 - ERROR - Input document 4_2025-11-05 with forma

Converted 'data\edgar_documents\BKNG\4_2025-10-16' --> 'data\processed_data\BKNG\4_2025-10-16.md'
Error processing data\edgar_documents\BKNG\4_2025-11-04: File format not allowed: data\edgar_documents\BKNG\4_2025-11-04
Error processing data\edgar_documents\BKNG\4_2025-11-05: File format not allowed: data\edgar_documents\BKNG\4_2025-11-05


2025-11-14 15:45:28,240 - INFO - Finished converting document 4_2025-11-10 in 0.11 sec.
2025-11-14 15:45:28,299 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:28,346 - INFO - Going to convert document batch...
2025-11-14 15:45:28,348 - INFO - Processing document 8-K_2023-01-13
2025-11-14 15:45:28,392 - INFO - Finished converting document 8-K_2023-01-13 in 0.11 sec.
2025-11-14 15:45:28,457 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\4_2025-11-10' --> 'data\processed_data\BKNG\4_2025-11-10.md'
Converted 'data\edgar_documents\BKNG\8-K_2023-01-13' --> 'data\processed_data\BKNG\8-K_2023-01-13.md'


2025-11-14 15:45:28,545 - INFO - Going to convert document batch...
2025-11-14 15:45:28,547 - INFO - Processing document 8-K_2023-02-23
2025-11-14 15:45:28,598 - INFO - Finished converting document 8-K_2023-02-23 in 0.17 sec.
2025-11-14 15:45:28,653 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:28,716 - INFO - Going to convert document batch...
2025-11-14 15:45:28,719 - INFO - Processing document 8-K_2023-04-11
2025-11-14 15:45:28,803 - INFO - Finished converting document 8-K_2023-04-11 in 0.17 sec.


Converted 'data\edgar_documents\BKNG\8-K_2023-02-23' --> 'data\processed_data\BKNG\8-K_2023-02-23.md'


2025-11-14 15:45:28,885 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:28,945 - INFO - Going to convert document batch...
2025-11-14 15:45:28,946 - INFO - Processing document 8-K_2023-04-24
2025-11-14 15:45:29,005 - INFO - Finished converting document 8-K_2023-04-24 in 0.16 sec.


Converted 'data\edgar_documents\BKNG\8-K_2023-04-11' --> 'data\processed_data\BKNG\8-K_2023-04-11.md'
Converted 'data\edgar_documents\BKNG\8-K_2023-04-24' --> 'data\processed_data\BKNG\8-K_2023-04-24.md'


2025-11-14 15:45:29,063 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:29,103 - INFO - Going to convert document batch...
2025-11-14 15:45:29,104 - INFO - Processing document 8-K_2023-05-04
2025-11-14 15:45:29,146 - INFO - Finished converting document 8-K_2023-05-04 in 0.11 sec.
2025-11-14 15:45:29,201 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:29,260 - INFO - Going to convert document batch...
2025-11-14 15:45:29,263 - INFO - Processing document 8-K_2023-05-12


Converted 'data\edgar_documents\BKNG\8-K_2023-05-04' --> 'data\processed_data\BKNG\8-K_2023-05-04.md'


2025-11-14 15:45:29,402 - INFO - Finished converting document 8-K_2023-05-12 in 0.23 sec.
2025-11-14 15:45:29,507 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:29,578 - INFO - Going to convert document batch...
2025-11-14 15:45:29,579 - INFO - Processing document 8-K_2023-05-19
2025-11-14 15:45:29,643 - INFO - Finished converting document 8-K_2023-05-19 in 0.16 sec.


Converted 'data\edgar_documents\BKNG\8-K_2023-05-12' --> 'data\processed_data\BKNG\8-K_2023-05-12.md'


2025-11-14 15:45:29,715 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:29,783 - INFO - Going to convert document batch...
2025-11-14 15:45:29,785 - INFO - Processing document 8-K_2023-06-07
2025-11-14 15:45:29,853 - INFO - Finished converting document 8-K_2023-06-07 in 0.16 sec.


Converted 'data\edgar_documents\BKNG\8-K_2023-05-19' --> 'data\processed_data\BKNG\8-K_2023-05-19.md'


2025-11-14 15:45:29,938 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:30,014 - INFO - Going to convert document batch...
2025-11-14 15:45:30,016 - INFO - Processing document 8-K_2023-07-05
2025-11-14 15:45:30,061 - INFO - Finished converting document 8-K_2023-07-05 in 0.16 sec.


Converted 'data\edgar_documents\BKNG\8-K_2023-06-07' --> 'data\processed_data\BKNG\8-K_2023-06-07.md'
Converted 'data\edgar_documents\BKNG\8-K_2023-07-05' --> 'data\processed_data\BKNG\8-K_2023-07-05.md'


2025-11-14 15:45:30,117 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:30,187 - INFO - Going to convert document batch...
2025-11-14 15:45:30,188 - INFO - Processing document 8-K_2023-08-03
2025-11-14 15:45:30,246 - INFO - Finished converting document 8-K_2023-08-03 in 0.17 sec.
2025-11-14 15:45:30,286 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:30,371 - INFO - Going to convert document batch...
2025-11-14 15:45:30,381 - INFO - Processing document 8-K_2023-09-25
2025-11-14 15:45:30,467 - INFO - Finished converting document 8-K_2023-09-25 in 0.20 sec.


Converted 'data\edgar_documents\BKNG\8-K_2023-08-03' --> 'data\processed_data\BKNG\8-K_2023-08-03.md'


2025-11-14 15:45:30,602 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:30,646 - INFO - Going to convert document batch...
2025-11-14 15:45:30,648 - INFO - Processing document 8-K_2023-10-24
2025-11-14 15:45:30,719 - INFO - Finished converting document 8-K_2023-10-24 in 0.17 sec.


Converted 'data\edgar_documents\BKNG\8-K_2023-09-25' --> 'data\processed_data\BKNG\8-K_2023-09-25.md'
Converted 'data\edgar_documents\BKNG\8-K_2023-10-24' --> 'data\processed_data\BKNG\8-K_2023-10-24.md'


2025-11-14 15:45:30,810 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:30,877 - INFO - Going to convert document batch...
2025-11-14 15:45:30,879 - INFO - Processing document 8-K_2023-11-02
2025-11-14 15:45:30,948 - INFO - Finished converting document 8-K_2023-11-02 in 0.20 sec.
2025-11-14 15:45:31,034 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:31,110 - INFO - Going to convert document batch...
2025-11-14 15:45:31,112 - INFO - Processing document 8-K_2023-12-13
2025-11-14 15:45:31,195 - INFO - Finished converting document 8-K_2023-12-13 in 0.17 sec.


Converted 'data\edgar_documents\BKNG\8-K_2023-11-02' --> 'data\processed_data\BKNG\8-K_2023-11-02.md'


2025-11-14 15:45:31,269 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:31,326 - INFO - Going to convert document batch...
2025-11-14 15:45:31,328 - INFO - Processing document 8-K_2024-01-19
2025-11-14 15:45:31,402 - INFO - Finished converting document 8-K_2024-01-19 in 0.17 sec.


Converted 'data\edgar_documents\BKNG\8-K_2023-12-13' --> 'data\processed_data\BKNG\8-K_2023-12-13.md'


2025-11-14 15:45:31,470 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:31,533 - INFO - Going to convert document batch...
2025-11-14 15:45:31,534 - INFO - Processing document 8-K_2024-02-22
2025-11-14 15:45:31,605 - INFO - Finished converting document 8-K_2024-02-22 in 0.16 sec.


Converted 'data\edgar_documents\BKNG\8-K_2024-01-19' --> 'data\processed_data\BKNG\8-K_2024-01-19.md'
Converted 'data\edgar_documents\BKNG\8-K_2024-02-22' --> 'data\processed_data\BKNG\8-K_2024-02-22.md'


2025-11-14 15:45:31,666 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:31,710 - INFO - Going to convert document batch...
2025-11-14 15:45:31,712 - INFO - Processing document 8-K_2024-03-01
2025-11-14 15:45:31,884 - INFO - Finished converting document 8-K_2024-03-01 in 0.25 sec.
2025-11-14 15:45:32,033 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:32,097 - INFO - Going to convert document batch...
2025-11-14 15:45:32,099 - INFO - Processing document 8-K_2024-04-05


Converted 'data\edgar_documents\BKNG\8-K_2024-03-01' --> 'data\processed_data\BKNG\8-K_2024-03-01.md'


2025-11-14 15:45:32,201 - INFO - Finished converting document 8-K_2024-04-05 in 0.23 sec.
2025-11-14 15:45:32,273 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:32,322 - INFO - Going to convert document batch...
2025-11-14 15:45:32,324 - INFO - Processing document 8-K_2024-04-22
2025-11-14 15:45:32,406 - INFO - Finished converting document 8-K_2024-04-22 in 0.17 sec.


Converted 'data\edgar_documents\BKNG\8-K_2024-04-05' --> 'data\processed_data\BKNG\8-K_2024-04-05.md'


2025-11-14 15:45:32,520 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:32,586 - INFO - Going to convert document batch...
2025-11-14 15:45:32,588 - INFO - Processing document 8-K_2024-05-02


Converted 'data\edgar_documents\BKNG\8-K_2024-04-22' --> 'data\processed_data\BKNG\8-K_2024-04-22.md'


2025-11-14 15:45:32,667 - INFO - Finished converting document 8-K_2024-05-02 in 0.20 sec.
2025-11-14 15:45:32,725 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:32,752 - INFO - Going to convert document batch...
2025-11-14 15:45:32,753 - INFO - Processing document 8-K_2024-05-10
2025-11-14 15:45:32,807 - INFO - Finished converting document 8-K_2024-05-10 in 0.11 sec.
2025-11-14 15:45:32,868 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\8-K_2024-05-02' --> 'data\processed_data\BKNG\8-K_2024-05-02.md'
Converted 'data\edgar_documents\BKNG\8-K_2024-05-10' --> 'data\processed_data\BKNG\8-K_2024-05-10.md'


2025-11-14 15:45:32,917 - INFO - Going to convert document batch...
2025-11-14 15:45:32,918 - INFO - Processing document 8-K_2024-06-05
2025-11-14 15:45:33,040 - INFO - Finished converting document 8-K_2024-06-05 in 0.20 sec.
2025-11-14 15:45:33,101 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:33,147 - INFO - Going to convert document batch...
2025-11-14 15:45:33,149 - INFO - Processing document 8-K_2024-08-01
2025-11-14 15:45:33,217 - INFO - Finished converting document 8-K_2024-08-01 in 0.14 sec.
2025-11-14 15:45:33,269 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\8-K_2024-06-05' --> 'data\processed_data\BKNG\8-K_2024-06-05.md'
Converted 'data\edgar_documents\BKNG\8-K_2024-08-01' --> 'data\processed_data\BKNG\8-K_2024-08-01.md'


2025-11-14 15:45:33,335 - INFO - Going to convert document batch...
2025-11-14 15:45:33,337 - INFO - Processing document 8-K_2024-10-30
2025-11-14 15:45:33,408 - INFO - Finished converting document 8-K_2024-10-30 in 0.16 sec.
2025-11-14 15:45:33,477 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:45:33,479 - ERROR - Input document 8-K_2024-11-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:45:33,481 - INFO - Going to convert docu

Converted 'data\edgar_documents\BKNG\8-K_2024-10-30' --> 'data\processed_data\BKNG\8-K_2024-10-30.md'
Error processing data\edgar_documents\BKNG\8-K_2024-11-08: File format not allowed: data\edgar_documents\BKNG\8-K_2024-11-08


2025-11-14 15:45:33,693 - INFO - Finished converting document 8-K_2024-11-21 in 0.20 sec.
2025-11-14 15:45:33,792 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:33,850 - INFO - Going to convert document batch...
2025-11-14 15:45:33,851 - INFO - Processing document 8-K_2024-12-10


Converted 'data\edgar_documents\BKNG\8-K_2024-11-21' --> 'data\processed_data\BKNG\8-K_2024-11-21.md'


2025-11-14 15:45:34,652 - INFO - Finished converting document 8-K_2024-12-10 in 0.88 sec.
2025-11-14 15:45:34,720 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:34,785 - INFO - Going to convert document batch...
2025-11-14 15:45:34,787 - INFO - Processing document 8-K_2024-12-18
2025-11-14 15:45:34,882 - INFO - Finished converting document 8-K_2024-12-18 in 0.19 sec.


Converted 'data\edgar_documents\BKNG\8-K_2024-12-10' --> 'data\processed_data\BKNG\8-K_2024-12-10.md'


2025-11-14 15:45:34,960 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:35,014 - INFO - Going to convert document batch...
2025-11-14 15:45:35,016 - INFO - Processing document 8-K_2025-02-20
2025-11-14 15:45:35,068 - INFO - Finished converting document 8-K_2025-02-20 in 0.12 sec.


Converted 'data\edgar_documents\BKNG\8-K_2024-12-18' --> 'data\processed_data\BKNG\8-K_2024-12-18.md'
Converted 'data\edgar_documents\BKNG\8-K_2025-02-20' --> 'data\processed_data\BKNG\8-K_2025-02-20.md'


2025-11-14 15:45:35,135 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:35,204 - INFO - Going to convert document batch...
2025-11-14 15:45:35,207 - INFO - Processing document 8-K_2025-04-22
2025-11-14 15:45:35,261 - INFO - Finished converting document 8-K_2025-04-22 in 0.17 sec.
2025-11-14 15:45:35,318 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:35,419 - INFO - Going to convert document batch...
2025-11-14 15:45:35,423 - INFO - Processing document 8-K_2025-04-29


Converted 'data\edgar_documents\BKNG\8-K_2025-04-22' --> 'data\processed_data\BKNG\8-K_2025-04-22.md'


2025-11-14 15:45:35,520 - INFO - Finished converting document 8-K_2025-04-29 in 0.22 sec.
2025-11-14 15:45:35,590 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:35,660 - INFO - Going to convert document batch...
2025-11-14 15:45:35,662 - INFO - Processing document 8-K_2025-05-09


Converted 'data\edgar_documents\BKNG\8-K_2025-04-29' --> 'data\processed_data\BKNG\8-K_2025-04-29.md'


2025-11-14 15:45:35,838 - INFO - Finished converting document 8-K_2025-05-09 in 0.28 sec.
2025-11-14 15:45:35,969 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:36,064 - INFO - Going to convert document batch...
2025-11-14 15:45:36,065 - INFO - Processing document 8-K_2025-06-04


Converted 'data\edgar_documents\BKNG\8-K_2025-05-09' --> 'data\processed_data\BKNG\8-K_2025-05-09.md'


2025-11-14 15:45:36,161 - INFO - Finished converting document 8-K_2025-06-04 in 0.22 sec.
2025-11-14 15:45:36,236 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:36,287 - INFO - Going to convert document batch...
2025-11-14 15:45:36,290 - INFO - Processing document 8-K_2025-07-29
2025-11-14 15:45:36,377 - INFO - Finished converting document 8-K_2025-07-29 in 0.16 sec.


Converted 'data\edgar_documents\BKNG\8-K_2025-06-04' --> 'data\processed_data\BKNG\8-K_2025-06-04.md'
Converted 'data\edgar_documents\BKNG\8-K_2025-07-29' --> 'data\processed_data\BKNG\8-K_2025-07-29.md'


2025-11-14 15:45:36,459 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:36,577 - INFO - Going to convert document batch...
2025-11-14 15:45:36,581 - INFO - Processing document 8-K_2025-09-19
2025-11-14 15:45:36,687 - INFO - Finished converting document 8-K_2025-09-19 in 0.27 sec.
2025-11-14 15:45:36,719 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:36,753 - INFO - Going to convert document batch...
2025-11-14 15:45:36,754 - INFO - Processing document 8-K_2025-10-17
2025-11-14 15:45:36,802 - INFO - Finished converting document 8-K_2025-10-17 in 0.09 sec.
2025-11-14 15:45:36,890 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\8-K_2025-09-19' --> 'data\processed_data\BKNG\8-K_2025-09-19.md'
Converted 'data\edgar_documents\BKNG\8-K_2025-10-17' --> 'data\processed_data\BKNG\8-K_2025-10-17.md'


2025-11-14 15:45:36,954 - INFO - Going to convert document batch...
2025-11-14 15:45:36,957 - INFO - Processing document 8-K_2025-10-28
2025-11-14 15:45:37,027 - INFO - Finished converting document 8-K_2025-10-28 in 0.19 sec.
2025-11-14 15:45:37,082 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:45:37,145 - INFO - Going to convert document batch...
2025-11-14 15:45:37,146 - INFO - Processing document 8-K_2025-11-07
2025-11-14 15:45:37,243 - INFO - Finished converting document 8-K_2025-11-07 in 0.17 sec.


Converted 'data\edgar_documents\BKNG\8-K_2025-10-28' --> 'data\processed_data\BKNG\8-K_2025-10-28.md'


2025-11-14 15:45:37,339 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:45:37,341 - ERROR - Input document DEF-14A_2023-04-24 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:45:37,343 - INFO - Going to convert document batch...
2025-11-14 15:45:37,369 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\8-K_2025-11-07' --> 'data\processed_data\BKNG\8-K_2025-11-07.md'
Error processing data\edgar_documents\BKNG\DEF-14A_2023-04-24: File format not allowed: data\edgar_documents\BKNG\DEF-14A_2023-04-24


2025-11-14 15:45:38,549 - INFO - Going to convert document batch...
2025-11-14 15:45:38,551 - INFO - Processing document DEF-14A_2024-04-23
2025-11-14 15:45:42,365 - INFO - Finished converting document DEF-14A_2024-04-23 in 5.01 sec.
2025-11-14 15:45:45,119 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BKNG\DEF-14A_2024-04-23' --> 'data\processed_data\BKNG\DEF-14A_2024-04-23.md'


2025-11-14 15:45:47,097 - INFO - Going to convert document batch...
2025-11-14 15:45:47,099 - INFO - Processing document DEF-14A_2025-04-22
2025-11-14 15:45:50,375 - INFO - Finished converting document DEF-14A_2025-04-22 in 5.31 sec.


Converted 'data\edgar_documents\BKNG\DEF-14A_2025-04-22' --> 'data\processed_data\BKNG\DEF-14A_2025-04-22.md'
Processed 112 new files. Errors: 12
Found 62 files to process in data\edgar_documents\BLK


2025-11-14 15:45:53,042 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:46:00,127 - INFO - Going to convert document batch...
2025-11-14 15:46:00,128 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:46:00,129 - INFO - Processing document 10-K_2025-02-25
2025-11-14 15:46:13,892 - INFO - Finished converting document 10-K_2025-02-25 in 21.06 sec.


Converted 'data\edgar_documents\BLK\10-K_2025-02-25' --> 'data\processed_data\BLK\10-K_2025-02-25.md'


2025-11-14 15:46:15,984 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:46:21,651 - INFO - Going to convert document batch...
2025-11-14 15:46:21,652 - INFO - Processing document 10-Q_2024-11-06
2025-11-14 15:46:28,105 - INFO - Finished converting document 10-Q_2024-11-06 in 12.36 sec.
2025-11-14 15:46:29,534 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BLK\10-Q_2024-11-06' --> 'data\processed_data\BLK\10-Q_2024-11-06.md'


2025-11-14 15:46:35,057 - INFO - Going to convert document batch...
2025-11-14 15:46:35,059 - INFO - Processing document 10-Q_2025-05-07
2025-11-14 15:46:41,117 - INFO - Finished converting document 10-Q_2025-05-07 in 11.73 sec.
2025-11-14 15:46:42,143 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BLK\10-Q_2025-05-07' --> 'data\processed_data\BLK\10-Q_2025-05-07.md'


2025-11-14 15:46:48,792 - INFO - Going to convert document batch...
2025-11-14 15:46:48,794 - INFO - Processing document 10-Q_2025-08-06
2025-11-14 15:46:57,183 - INFO - Finished converting document 10-Q_2025-08-06 in 15.25 sec.


Converted 'data\edgar_documents\BLK\10-Q_2025-08-06' --> 'data\processed_data\BLK\10-Q_2025-08-06.md'


2025-11-14 15:46:58,872 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:06,720 - INFO - Going to convert document batch...
2025-11-14 15:47:06,722 - INFO - Processing document 10-Q_2025-11-05
2025-11-14 15:47:15,819 - INFO - Finished converting document 10-Q_2025-11-05 in 17.17 sec.
2025-11-14 15:47:17,399 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:47:17,400 - ERROR - Input document 4_2024-03-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-1

Converted 'data\edgar_documents\BLK\10-Q_2025-11-05' --> 'data\processed_data\BLK\10-Q_2025-11-05.md'
Error processing data\edgar_documents\BLK\4_2024-03-05: File format not allowed: data\edgar_documents\BLK\4_2024-03-05
Error processing data\edgar_documents\BLK\4_2024-03-07: File format not allowed: data\edgar_documents\BLK\4_2024-03-07
Error processing data\edgar_documents\BLK\4_2024-07-17: File format not allowed: data\edgar_documents\BLK\4_2024-07-17
Error processing data\edgar_documents\BLK\4_2024-07-19: File format not allowed: data\edgar_documents\BLK\4_2024-07-19


2025-11-14 15:47:17,574 - INFO - Going to convert document batch...
2025-11-14 15:47:17,580 - INFO - Processing document 4_2024-10-02
2025-11-14 15:47:17,627 - INFO - Finished converting document 4_2024-10-02 in 0.11 sec.
2025-11-14 15:47:17,717 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:17,762 - INFO - Going to convert document batch...
2025-11-14 15:47:17,765 - INFO - Processing document 4_2024-12-06
2025-11-14 15:47:17,879 - INFO - Finished converting document 4_2024-12-06 in 0.17 sec.


Converted 'data\edgar_documents\BLK\4_2024-10-02' --> 'data\processed_data\BLK\4_2024-10-02.md'


2025-11-14 15:47:17,989 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:18,007 - INFO - Going to convert document batch...
2025-11-14 15:47:18,010 - INFO - Processing document 4_2025-01-03
2025-11-14 15:47:18,061 - INFO - Finished converting document 4_2025-01-03 in 0.09 sec.
2025-11-14 15:47:18,147 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BLK\4_2024-12-06' --> 'data\processed_data\BLK\4_2024-12-06.md'
Converted 'data\edgar_documents\BLK\4_2025-01-03' --> 'data\processed_data\BLK\4_2025-01-03.md'


2025-11-14 15:47:18,172 - INFO - Going to convert document batch...
2025-11-14 15:47:18,175 - INFO - Processing document 4_2025-01-17
2025-11-14 15:47:18,235 - INFO - Finished converting document 4_2025-01-17 in 0.11 sec.
2025-11-14 15:47:18,310 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:18,331 - INFO - Going to convert document batch...
2025-11-14 15:47:18,332 - INFO - Processing document 4_2025-01-23
2025-11-14 15:47:18,385 - INFO - Finished converting document 4_2025-01-23 in 0.11 sec.


Converted 'data\edgar_documents\BLK\4_2025-01-17' --> 'data\processed_data\BLK\4_2025-01-17.md'
Converted 'data\edgar_documents\BLK\4_2025-01-23' --> 'data\processed_data\BLK\4_2025-01-23.md'


2025-11-14 15:47:18,494 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:18,536 - INFO - Going to convert document batch...
2025-11-14 15:47:18,537 - INFO - Processing document 4_2025-01-31
2025-11-14 15:47:18,606 - INFO - Finished converting document 4_2025-01-31 in 0.14 sec.
2025-11-14 15:47:18,710 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:18,742 - INFO - Going to convert document batch...
2025-11-14 15:47:18,743 - INFO - Processing document 4_2025-02-04
2025-11-14 15:47:18,812 - INFO - Finished converting document 4_2025-02-04 in 0.14 sec.


Converted 'data\edgar_documents\BLK\4_2025-01-31' --> 'data\processed_data\BLK\4_2025-01-31.md'


2025-11-14 15:47:18,883 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:18,914 - INFO - Going to convert document batch...
2025-11-14 15:47:18,915 - INFO - Processing document 4_2025-02-28
2025-11-14 15:47:18,974 - INFO - Finished converting document 4_2025-02-28 in 0.11 sec.


Converted 'data\edgar_documents\BLK\4_2025-02-04' --> 'data\processed_data\BLK\4_2025-02-04.md'
Converted 'data\edgar_documents\BLK\4_2025-02-28' --> 'data\processed_data\BLK\4_2025-02-28.md'


2025-11-14 15:47:19,061 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:19,088 - INFO - Going to convert document batch...
2025-11-14 15:47:19,090 - INFO - Processing document 4_2025-03-04
2025-11-14 15:47:19,143 - INFO - Finished converting document 4_2025-03-04 in 0.11 sec.
2025-11-14 15:47:19,212 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:19,245 - INFO - Going to convert document batch...
2025-11-14 15:47:19,246 - INFO - Processing document 4_2025-03-06
2025-11-14 15:47:19,298 - INFO - Finished converting document 4_2025-03-06 in 0.09 sec.


Converted 'data\edgar_documents\BLK\4_2025-03-04' --> 'data\processed_data\BLK\4_2025-03-04.md'
Converted 'data\edgar_documents\BLK\4_2025-03-06' --> 'data\processed_data\BLK\4_2025-03-06.md'


2025-11-14 15:47:19,402 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:19,422 - INFO - Going to convert document batch...
2025-11-14 15:47:19,424 - INFO - Processing document 4_2025-03-07
2025-11-14 15:47:19,477 - INFO - Finished converting document 4_2025-03-07 in 0.11 sec.
2025-11-14 15:47:19,564 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:19,586 - INFO - Going to convert document batch...
2025-11-14 15:47:19,587 - INFO - Processing document 4_2025-03-10
2025-11-14 15:47:19,650 - INFO - Finished converting document 4_2025-03-10 in 0.09 sec.


Converted 'data\edgar_documents\BLK\4_2025-03-07' --> 'data\processed_data\BLK\4_2025-03-07.md'
Converted 'data\edgar_documents\BLK\4_2025-03-10' --> 'data\processed_data\BLK\4_2025-03-10.md'


2025-11-14 15:47:19,750 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:19,778 - INFO - Going to convert document batch...
2025-11-14 15:47:19,780 - INFO - Processing document 4_2025-03-11
2025-11-14 15:47:19,844 - INFO - Finished converting document 4_2025-03-11 in 0.12 sec.
2025-11-14 15:47:19,902 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:19,933 - INFO - Going to convert document batch...
2025-11-14 15:47:19,935 - INFO - Processing document 4_2025-03-12
2025-11-14 15:47:19,993 - INFO - Finished converting document 4_2025-03-12 in 0.09 sec.


Converted 'data\edgar_documents\BLK\4_2025-03-11' --> 'data\processed_data\BLK\4_2025-03-11.md'
Converted 'data\edgar_documents\BLK\4_2025-03-12' --> 'data\processed_data\BLK\4_2025-03-12.md'


2025-11-14 15:47:20,086 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:20,116 - INFO - Going to convert document batch...
2025-11-14 15:47:20,118 - INFO - Processing document 4_2025-03-13
2025-11-14 15:47:20,163 - INFO - Finished converting document 4_2025-03-13 in 0.09 sec.
2025-11-14 15:47:20,249 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:20,272 - INFO - Going to convert document batch...
2025-11-14 15:47:20,275 - INFO - Processing document 4_2025-03-14
2025-11-14 15:47:20,354 - INFO - Finished converting document 4_2025-03-14 in 0.12 sec.


Converted 'data\edgar_documents\BLK\4_2025-03-13' --> 'data\processed_data\BLK\4_2025-03-13.md'
Converted 'data\edgar_documents\BLK\4_2025-03-14' --> 'data\processed_data\BLK\4_2025-03-14.md'


2025-11-14 15:47:20,433 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:20,464 - INFO - Going to convert document batch...
2025-11-14 15:47:20,465 - INFO - Processing document 4_2025-03-17
2025-11-14 15:47:20,534 - INFO - Finished converting document 4_2025-03-17 in 0.12 sec.
2025-11-14 15:47:20,591 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:20,616 - INFO - Going to convert document batch...
2025-11-14 15:47:20,618 - INFO - Processing document 4_2025-03-18
2025-11-14 15:47:20,674 - INFO - Finished converting document 4_2025-03-18 in 0.09 sec.


Converted 'data\edgar_documents\BLK\4_2025-03-17' --> 'data\processed_data\BLK\4_2025-03-17.md'
Converted 'data\edgar_documents\BLK\4_2025-03-18' --> 'data\processed_data\BLK\4_2025-03-18.md'


2025-11-14 15:47:20,766 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:20,802 - INFO - Going to convert document batch...
2025-11-14 15:47:20,804 - INFO - Processing document 4_2025-03-19
2025-11-14 15:47:20,840 - INFO - Finished converting document 4_2025-03-19 in 0.11 sec.
2025-11-14 15:47:20,893 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:20,924 - INFO - Going to convert document batch...
2025-11-14 15:47:20,927 - INFO - Processing document 4_2025-03-20
2025-11-14 15:47:20,964 - INFO - Finished converting document 4_2025-03-20 in 0.09 sec.
2025-11-14 15:47:21,039 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BLK\4_2025-03-19' --> 'data\processed_data\BLK\4_2025-03-19.md'
Converted 'data\edgar_documents\BLK\4_2025-03-20' --> 'data\processed_data\BLK\4_2025-03-20.md'


2025-11-14 15:47:21,070 - INFO - Going to convert document batch...
2025-11-14 15:47:21,074 - INFO - Processing document 4_2025-03-21
2025-11-14 15:47:21,189 - INFO - Finished converting document 4_2025-03-21 in 0.19 sec.
2025-11-14 15:47:21,290 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:21,317 - INFO - Going to convert document batch...
2025-11-14 15:47:21,319 - INFO - Processing document 4_2025-03-24
2025-11-14 15:47:21,389 - INFO - Finished converting document 4_2025-03-24 in 0.11 sec.


Converted 'data\edgar_documents\BLK\4_2025-03-21' --> 'data\processed_data\BLK\4_2025-03-21.md'
Converted 'data\edgar_documents\BLK\4_2025-03-24' --> 'data\processed_data\BLK\4_2025-03-24.md'


2025-11-14 15:47:21,478 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:47:21,480 - ERROR - Input document 4_2025-03-27 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:47:21,483 - INFO - Going to convert document batch...
2025-11-14 15:47:21,509 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:21,532 - INFO - Going to convert document batch...
2025-11-14 15:47:21,533 - INFO - Processing document 4_2025-04-02
2025-11-14 15:47:21,576 - INFO - Fin

Error processing data\edgar_documents\BLK\4_2025-03-27: File format not allowed: data\edgar_documents\BLK\4_2025-03-27
Converted 'data\edgar_documents\BLK\4_2025-04-02' --> 'data\processed_data\BLK\4_2025-04-02.md'


2025-11-14 15:47:21,807 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:21,832 - INFO - Going to convert document batch...
2025-11-14 15:47:21,837 - INFO - Processing document 4_2025-04-23
2025-11-14 15:47:21,913 - INFO - Finished converting document 4_2025-04-23 in 0.12 sec.


Converted 'data\edgar_documents\BLK\4_2025-04-17' --> 'data\processed_data\BLK\4_2025-04-17.md'
Converted 'data\edgar_documents\BLK\4_2025-04-23' --> 'data\processed_data\BLK\4_2025-04-23.md'


2025-11-14 15:47:22,006 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:22,049 - INFO - Going to convert document batch...
2025-11-14 15:47:22,050 - INFO - Processing document 4_2025-04-28
2025-11-14 15:47:22,125 - INFO - Finished converting document 4_2025-04-28 in 0.14 sec.
2025-11-14 15:47:22,214 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:22,267 - INFO - Going to convert document batch...
2025-11-14 15:47:22,269 - INFO - Processing document 4_2025-05-01
2025-11-14 15:47:22,362 - INFO - Finished converting document 4_2025-05-01 in 0.17 sec.


Converted 'data\edgar_documents\BLK\4_2025-04-28' --> 'data\processed_data\BLK\4_2025-04-28.md'


2025-11-14 15:47:22,466 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:22,493 - INFO - Going to convert document batch...
2025-11-14 15:47:22,495 - INFO - Processing document 4_2025-05-21
2025-11-14 15:47:22,547 - INFO - Finished converting document 4_2025-05-21 in 0.09 sec.
2025-11-14 15:47:22,632 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BLK\4_2025-05-01' --> 'data\processed_data\BLK\4_2025-05-01.md'
Converted 'data\edgar_documents\BLK\4_2025-05-21' --> 'data\processed_data\BLK\4_2025-05-21.md'


2025-11-14 15:47:22,670 - INFO - Going to convert document batch...
2025-11-14 15:47:22,673 - INFO - Processing document 4_2025-05-28
2025-11-14 15:47:22,780 - INFO - Finished converting document 4_2025-05-28 in 0.19 sec.
2025-11-14 15:47:22,845 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:22,869 - INFO - Going to convert document batch...
2025-11-14 15:47:22,871 - INFO - Processing document 4_2025-07-02
2025-11-14 15:47:22,931 - INFO - Finished converting document 4_2025-07-02 in 0.09 sec.
2025-11-14 15:47:23,016 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BLK\4_2025-05-28' --> 'data\processed_data\BLK\4_2025-05-28.md'
Converted 'data\edgar_documents\BLK\4_2025-07-02' --> 'data\processed_data\BLK\4_2025-07-02.md'


2025-11-14 15:47:23,040 - INFO - Going to convert document batch...
2025-11-14 15:47:23,041 - INFO - Processing document 4_2025-07-18
2025-11-14 15:47:23,085 - INFO - Finished converting document 4_2025-07-18 in 0.09 sec.
2025-11-14 15:47:23,141 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:23,170 - INFO - Going to convert document batch...
2025-11-14 15:47:23,172 - INFO - Processing document 4_2025-07-25
2025-11-14 15:47:23,230 - INFO - Finished converting document 4_2025-07-25 in 0.11 sec.


Converted 'data\edgar_documents\BLK\4_2025-07-18' --> 'data\processed_data\BLK\4_2025-07-18.md'
Converted 'data\edgar_documents\BLK\4_2025-07-25' --> 'data\processed_data\BLK\4_2025-07-25.md'


2025-11-14 15:47:23,317 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:23,348 - INFO - Going to convert document batch...
2025-11-14 15:47:23,349 - INFO - Processing document 4_2025-08-01
2025-11-14 15:47:23,408 - INFO - Finished converting document 4_2025-08-01 in 0.12 sec.
2025-11-14 15:47:23,476 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:23,494 - INFO - Going to convert document batch...
2025-11-14 15:47:23,495 - INFO - Processing document 4_2025-10-02
2025-11-14 15:47:23,552 - INFO - Finished converting document 4_2025-10-02 in 0.09 sec.


Converted 'data\edgar_documents\BLK\4_2025-08-01' --> 'data\processed_data\BLK\4_2025-08-01.md'
Converted 'data\edgar_documents\BLK\4_2025-10-02' --> 'data\processed_data\BLK\4_2025-10-02.md'


2025-11-14 15:47:23,640 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:23,676 - INFO - Going to convert document batch...
2025-11-14 15:47:23,677 - INFO - Processing document 4_2025-10-22
2025-11-14 15:47:23,783 - INFO - Finished converting document 4_2025-10-22 in 0.17 sec.
2025-11-14 15:47:23,918 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:23,974 - INFO - Going to convert document batch...
2025-11-14 15:47:23,976 - INFO - Processing document 8-K_2024-10-01
2025-11-14 15:47:24,035 - INFO - Finished converting document 8-K_2024-10-01 in 0.16 sec.


Converted 'data\edgar_documents\BLK\4_2025-10-22' --> 'data\processed_data\BLK\4_2025-10-22.md'
Converted 'data\edgar_documents\BLK\8-K_2024-10-01' --> 'data\processed_data\BLK\8-K_2024-10-01.md'


2025-11-14 15:47:24,099 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:24,151 - INFO - Going to convert document batch...
2025-11-14 15:47:24,153 - INFO - Processing document 8-K_2024-10-11
2025-11-14 15:47:24,192 - INFO - Finished converting document 8-K_2024-10-11 in 0.12 sec.
2025-11-14 15:47:24,245 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:24,281 - INFO - Going to convert document batch...
2025-11-14 15:47:24,283 - INFO - Processing document 8-K_2024-11-08
2025-11-14 15:47:24,344 - INFO - Finished converting document 8-K_2024-11-08 in 0.11 sec.


Converted 'data\edgar_documents\BLK\8-K_2024-10-11' --> 'data\processed_data\BLK\8-K_2024-10-11.md'
Converted 'data\edgar_documents\BLK\8-K_2024-11-08' --> 'data\processed_data\BLK\8-K_2024-11-08.md'


2025-11-14 15:47:24,417 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:24,461 - INFO - Going to convert document batch...
2025-11-14 15:47:24,462 - INFO - Processing document 8-K_2024-11-19
2025-11-14 15:47:24,513 - INFO - Finished converting document 8-K_2024-11-19 in 0.14 sec.
2025-11-14 15:47:24,559 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:24,594 - INFO - Going to convert document batch...
2025-11-14 15:47:24,596 - INFO - Processing document 8-K_2024-12-03
2025-11-14 15:47:24,637 - INFO - Finished converting document 8-K_2024-12-03 in 0.09 sec.
2025-11-14 15:47:24,675 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:24,698 - INFO - Going to convert document batch...
2025-11-14 15:47:24,699 - INFO - Processing document 8-K_2025-01-15
2025-11-14 15:47:24,744 - INFO - Finished converting document 8-K_2025-01-15 in 0.08 sec.


Converted 'data\edgar_documents\BLK\8-K_2024-11-19' --> 'data\processed_data\BLK\8-K_2024-11-19.md'
Converted 'data\edgar_documents\BLK\8-K_2024-12-03' --> 'data\processed_data\BLK\8-K_2024-12-03.md'


2025-11-14 15:47:24,786 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:24,820 - INFO - Going to convert document batch...
2025-11-14 15:47:24,823 - INFO - Processing document 8-K_2025-02-14
2025-11-14 15:47:24,857 - INFO - Finished converting document 8-K_2025-02-14 in 0.09 sec.
2025-11-14 15:47:24,896 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:24,928 - INFO - Going to convert document batch...
2025-11-14 15:47:24,929 - INFO - Processing document 8-K_2025-03-03
2025-11-14 15:47:24,956 - INFO - Finished converting document 8-K_2025-03-03 in 0.08 sec.


Converted 'data\edgar_documents\BLK\8-K_2025-01-15' --> 'data\processed_data\BLK\8-K_2025-01-15.md'
Converted 'data\edgar_documents\BLK\8-K_2025-02-14' --> 'data\processed_data\BLK\8-K_2025-02-14.md'


2025-11-14 15:47:25,006 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:25,041 - INFO - Going to convert document batch...
2025-11-14 15:47:25,043 - INFO - Processing document 8-K_2025-03-26
2025-11-14 15:47:25,088 - INFO - Finished converting document 8-K_2025-03-26 in 0.11 sec.
2025-11-14 15:47:25,123 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:25,164 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BLK\8-K_2025-03-03' --> 'data\processed_data\BLK\8-K_2025-03-03.md'
Converted 'data\edgar_documents\BLK\8-K_2025-03-26' --> 'data\processed_data\BLK\8-K_2025-03-26.md'


2025-11-14 15:47:25,174 - INFO - Processing document 8-K_2025-04-03
2025-11-14 15:47:25,228 - INFO - Finished converting document 8-K_2025-04-03 in 0.11 sec.
2025-11-14 15:47:25,272 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:25,299 - INFO - Going to convert document batch...
2025-11-14 15:47:25,301 - INFO - Processing document 8-K_2025-04-07
2025-11-14 15:47:25,344 - INFO - Finished converting document 8-K_2025-04-07 in 0.09 sec.
2025-11-14 15:47:25,408 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BLK\8-K_2025-04-03' --> 'data\processed_data\BLK\8-K_2025-04-03.md'
Converted 'data\edgar_documents\BLK\8-K_2025-04-07' --> 'data\processed_data\BLK\8-K_2025-04-07.md'


2025-11-14 15:47:25,436 - INFO - Going to convert document batch...
2025-11-14 15:47:25,438 - INFO - Processing document 8-K_2025-04-11
2025-11-14 15:47:25,492 - INFO - Finished converting document 8-K_2025-04-11 in 0.11 sec.
2025-11-14 15:47:25,526 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:25,595 - INFO - Going to convert document batch...
2025-11-14 15:47:25,597 - INFO - Processing document 8-K_2025-05-16


Converted 'data\edgar_documents\BLK\8-K_2025-04-11' --> 'data\processed_data\BLK\8-K_2025-04-11.md'


2025-11-14 15:47:25,706 - INFO - Finished converting document 8-K_2025-05-16 in 0.20 sec.
2025-11-14 15:47:25,758 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:25,781 - INFO - Going to convert document batch...
2025-11-14 15:47:25,783 - INFO - Processing document 8-K_2025-07-01
2025-11-14 15:47:25,823 - INFO - Finished converting document 8-K_2025-07-01 in 0.09 sec.
2025-11-14 15:47:25,873 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:25,910 - INFO - Going to convert document batch...
2025-11-14 15:47:25,912 - INFO - Processing document 8-K_2025-07-15
2025-11-14 15:47:25,956 - INFO - Finished converting document 8-K_2025-07-15 in 0.11 sec.


Converted 'data\edgar_documents\BLK\8-K_2025-05-16' --> 'data\processed_data\BLK\8-K_2025-05-16.md'
Converted 'data\edgar_documents\BLK\8-K_2025-07-01' --> 'data\processed_data\BLK\8-K_2025-07-01.md'


2025-11-14 15:47:25,996 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:26,036 - INFO - Going to convert document batch...
2025-11-14 15:47:26,037 - INFO - Processing document 8-K_2025-10-14
2025-11-14 15:47:26,075 - INFO - Finished converting document 8-K_2025-10-14 in 0.11 sec.


Converted 'data\edgar_documents\BLK\8-K_2025-07-15' --> 'data\processed_data\BLK\8-K_2025-07-15.md'
Converted 'data\edgar_documents\BLK\8-K_2025-10-14' --> 'data\processed_data\BLK\8-K_2025-10-14.md'


2025-11-14 15:47:26,209 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:30,227 - INFO - Going to convert document batch...
2025-11-14 15:47:30,228 - INFO - Processing document DEF-14A_2025-04-04
2025-11-14 15:47:42,547 - INFO - Finished converting document DEF-14A_2025-04-04 in 16.45 sec.


Converted 'data\edgar_documents\BLK\DEF-14A_2025-04-04' --> 'data\processed_data\BLK\DEF-14A_2025-04-04.md'
Processed 57 new files. Errors: 5
Found 107 files to process in data\edgar_documents\BMY


2025-11-14 15:47:46,195 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:47:48,848 - INFO - Going to convert document batch...
2025-11-14 15:47:48,849 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:47:48,850 - INFO - Processing document 10-K_2023-02-14
2025-11-14 15:47:55,371 - INFO - Finished converting document 10-K_2023-02-14 in 9.31 sec.
2025-11-14 15:47:56,269 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BMY\10-K_2023-02-14' --> 'data\processed_data\BMY\10-K_2023-02-14.md'


2025-11-14 15:47:57,335 - INFO - Going to convert document batch...
2025-11-14 15:47:57,336 - INFO - Processing document 10-K_2024-02-13
2025-11-14 15:48:00,920 - INFO - Finished converting document 10-K_2024-02-13 in 4.75 sec.
2025-11-14 15:48:01,857 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BMY\10-K_2024-02-13' --> 'data\processed_data\BMY\10-K_2024-02-13.md'


2025-11-14 15:48:02,671 - INFO - Going to convert document batch...
2025-11-14 15:48:02,672 - INFO - Processing document 10-K_2025-02-12
2025-11-14 15:48:06,267 - INFO - Finished converting document 10-K_2025-02-12 in 4.48 sec.
2025-11-14 15:48:07,192 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BMY\10-K_2025-02-12' --> 'data\processed_data\BMY\10-K_2025-02-12.md'


2025-11-14 15:48:07,620 - INFO - Going to convert document batch...
2025-11-14 15:48:07,621 - INFO - Processing document 10-Q_2023-04-27
2025-11-14 15:48:08,621 - INFO - Finished converting document 10-Q_2023-04-27 in 1.47 sec.
2025-11-14 15:48:09,089 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BMY\10-Q_2023-04-27' --> 'data\processed_data\BMY\10-Q_2023-04-27.md'


2025-11-14 15:48:10,357 - INFO - Going to convert document batch...
2025-11-14 15:48:10,358 - INFO - Processing document 10-Q_2023-07-27
2025-11-14 15:48:11,465 - INFO - Finished converting document 10-Q_2023-07-27 in 2.42 sec.
2025-11-14 15:48:12,033 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BMY\10-Q_2023-07-27' --> 'data\processed_data\BMY\10-Q_2023-07-27.md'


2025-11-14 15:48:12,898 - INFO - Going to convert document batch...
2025-11-14 15:48:12,900 - INFO - Processing document 10-Q_2023-10-26
2025-11-14 15:48:14,115 - INFO - Finished converting document 10-Q_2023-10-26 in 2.12 sec.
2025-11-14 15:48:14,692 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BMY\10-Q_2023-10-26' --> 'data\processed_data\BMY\10-Q_2023-10-26.md'


2025-11-14 15:48:15,163 - INFO - Going to convert document batch...
2025-11-14 15:48:15,164 - INFO - Processing document 10-Q_2024-04-25
2025-11-14 15:48:16,127 - INFO - Finished converting document 10-Q_2024-04-25 in 1.47 sec.
2025-11-14 15:48:16,645 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BMY\10-Q_2024-04-25' --> 'data\processed_data\BMY\10-Q_2024-04-25.md'


2025-11-14 15:48:17,591 - INFO - Going to convert document batch...
2025-11-14 15:48:17,592 - INFO - Processing document 10-Q_2024-07-26
2025-11-14 15:48:18,796 - INFO - Finished converting document 10-Q_2024-07-26 in 2.20 sec.
2025-11-14 15:48:19,364 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BMY\10-Q_2024-07-26' --> 'data\processed_data\BMY\10-Q_2024-07-26.md'


2025-11-14 15:48:20,286 - INFO - Going to convert document batch...
2025-11-14 15:48:20,287 - INFO - Processing document 10-Q_2024-10-31
2025-11-14 15:48:21,580 - INFO - Finished converting document 10-Q_2024-10-31 in 2.25 sec.
2025-11-14 15:48:22,408 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BMY\10-Q_2024-10-31' --> 'data\processed_data\BMY\10-Q_2024-10-31.md'


2025-11-14 15:48:23,440 - INFO - Going to convert document batch...
2025-11-14 15:48:23,441 - INFO - Processing document 10-Q_2025-04-24
2025-11-14 15:48:24,889 - INFO - Finished converting document 10-Q_2025-04-24 in 2.52 sec.
2025-11-14 15:48:25,557 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BMY\10-Q_2025-04-24' --> 'data\processed_data\BMY\10-Q_2025-04-24.md'


2025-11-14 15:48:26,146 - INFO - Going to convert document batch...
2025-11-14 15:48:26,148 - INFO - Processing document 10-Q_2025-07-31
2025-11-14 15:48:27,981 - INFO - Finished converting document 10-Q_2025-07-31 in 2.48 sec.
2025-11-14 15:48:28,689 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BMY\10-Q_2025-07-31' --> 'data\processed_data\BMY\10-Q_2025-07-31.md'


2025-11-14 15:48:29,320 - INFO - Going to convert document batch...
2025-11-14 15:48:29,321 - INFO - Processing document 10-Q_2025-10-30
2025-11-14 15:48:30,561 - INFO - Finished converting document 10-Q_2025-10-30 in 1.92 sec.
2025-11-14 15:48:31,526 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:31,534 - INFO - Going to convert document batch...
2025-11-14 15:48:31,535 - INFO - Processing document 4_2023-01-04
2025-11-14 15:48:31,554 - INFO - Finished converting document 4_2023-01-04 in 0.05 sec.
2025-11-14 15:48:31,618 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:31,636 - INFO - Going to convert document batch...
2025-11-14 15:48:31,637 - INFO - Processing document 4_2023-02-03
2025-11-14 15:48:31,661 - INFO - Finished converting document 4_2023-02-03 in 0.08 sec.


Converted 'data\edgar_documents\BMY\10-Q_2025-10-30' --> 'data\processed_data\BMY\10-Q_2025-10-30.md'
Converted 'data\edgar_documents\BMY\4_2023-01-04' --> 'data\processed_data\BMY\4_2023-01-04.md'
Converted 'data\edgar_documents\BMY\4_2023-02-03' --> 'data\processed_data\BMY\4_2023-02-03.md'


2025-11-14 15:48:31,713 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:31,721 - INFO - Going to convert document batch...
2025-11-14 15:48:31,725 - INFO - Processing document 4_2023-02-08
2025-11-14 15:48:31,762 - INFO - Finished converting document 4_2023-02-08 in 0.08 sec.
2025-11-14 15:48:31,796 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:31,814 - INFO - Going to convert document batch...
2025-11-14 15:48:31,815 - INFO - Processing document 4_2023-03-14
2025-11-14 15:48:31,855 - INFO - Finished converting document 4_2023-03-14 in 0.08 sec.
2025-11-14 15:48:31,913 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:31,923 - INFO - Going to convert document batch...
2025-11-14 15:48:31,924 - INFO - Processing document 4_2023-04-04
2025-11-14 15:48:31,943 - INFO - Finished converting document 4_2023-04-04 in 0.05 sec.


Converted 'data\edgar_documents\BMY\4_2023-02-08' --> 'data\processed_data\BMY\4_2023-02-08.md'
Converted 'data\edgar_documents\BMY\4_2023-03-14' --> 'data\processed_data\BMY\4_2023-03-14.md'
Converted 'data\edgar_documents\BMY\4_2023-04-04' --> 'data\processed_data\BMY\4_2023-04-04.md'


2025-11-14 15:48:31,993 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:32,009 - INFO - Going to convert document batch...
2025-11-14 15:48:32,010 - INFO - Processing document 4_2023-05-03
2025-11-14 15:48:32,046 - INFO - Finished converting document 4_2023-05-03 in 0.08 sec.
2025-11-14 15:48:32,095 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:32,104 - INFO - Going to convert document batch...
2025-11-14 15:48:32,104 - INFO - Processing document 4_2023-05-04
2025-11-14 15:48:32,124 - INFO - Finished converting document 4_2023-05-04 in 0.05 sec.
2025-11-14 15:48:32,168 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:32,183 - INFO - Going to convert document batch...
2025-11-14 15:48:32,183 - INFO - Processing document 4_2023-06-06
2025-11-14 15:48:32,208 - INFO - Finished converting document 4_2023-06-06 in 0.05 sec.
2025-11-14 15:48:32,263 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BMY\4_2023-05-03' --> 'data\processed_data\BMY\4_2023-05-03.md'
Converted 'data\edgar_documents\BMY\4_2023-05-04' --> 'data\processed_data\BMY\4_2023-05-04.md'
Converted 'data\edgar_documents\BMY\4_2023-06-06' --> 'data\processed_data\BMY\4_2023-06-06.md'


2025-11-14 15:48:32,277 - INFO - Going to convert document batch...
2025-11-14 15:48:32,279 - INFO - Processing document 4_2023-07-05
2025-11-14 15:48:32,305 - INFO - Finished converting document 4_2023-07-05 in 0.06 sec.
2025-11-14 15:48:32,350 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:32,370 - INFO - Going to convert document batch...
2025-11-14 15:48:32,371 - INFO - Processing document 4_2023-08-07
2025-11-14 15:48:32,392 - INFO - Finished converting document 4_2023-08-07 in 0.06 sec.
2025-11-14 15:48:32,424 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:32,433 - INFO - Going to convert document batch...
2025-11-14 15:48:32,434 - INFO - Processing document 4_2023-08-28
2025-11-14 15:48:32,463 - INFO - Finished converting document 4_2023-08-28 in 0.05 sec.
2025-11-14 15:48:32,515 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BMY\4_2023-07-05' --> 'data\processed_data\BMY\4_2023-07-05.md'
Converted 'data\edgar_documents\BMY\4_2023-08-07' --> 'data\processed_data\BMY\4_2023-08-07.md'
Converted 'data\edgar_documents\BMY\4_2023-08-28' --> 'data\processed_data\BMY\4_2023-08-28.md'


2025-11-14 15:48:32,533 - INFO - Going to convert document batch...
2025-11-14 15:48:32,534 - INFO - Processing document 4_2023-10-03
2025-11-14 15:48:32,556 - INFO - Finished converting document 4_2023-10-03 in 0.06 sec.
2025-11-14 15:48:32,591 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:32,600 - INFO - Going to convert document batch...
2025-11-14 15:48:32,601 - INFO - Processing document 4_2023-10-04
2025-11-14 15:48:32,620 - INFO - Finished converting document 4_2023-10-04 in 0.05 sec.
2025-11-14 15:48:32,653 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:32,665 - INFO - Going to convert document batch...
2025-11-14 15:48:32,665 - INFO - Processing document 4_2023-10-12
2025-11-14 15:48:32,684 - INFO - Finished converting document 4_2023-10-12 in 0.05 sec.
2025-11-14 15:48:32,760 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\BMY\4_2023-10-03' --> 'data\processed_data\BMY\4_2023-10-03.md'
Converted 'data\edgar_documents\BMY\4_2023-10-04' --> 'data\processed_data\BMY\4_2023-10-04.md'
Converted 'data\edgar_documents\BMY\4_2023-10-12' --> 'data\processed_data\BMY\4_2023-10-12.md'


2025-11-14 15:48:32,762 - ERROR - Input document 4_2023-10-30 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:48:32,763 - INFO - Going to convert document batch...
2025-11-14 15:48:32,788 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:48:32,789 - ERROR - Input document 4_2023-11-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\BMY\4_2023-10-30: File format not allowed: data\edgar_documents\BMY\4_2023-10-30
Error processing data\edgar_documents\BMY\4_2023-11-01: File format not allowed: data\edgar_documents\BMY\4_2023-11-01
Converted 'data\edgar_documents\BMY\4_2023-11-03' --> 'data\processed_data\BMY\4_2023-11-03.md'
Converted 'data\edgar_documents\BMY\4_2023-11-21' --> 'data\processed_data\BMY\4_2023-11-21.md'


2025-11-14 15:48:32,964 - INFO - Finished converting document 4_2023-11-24 in 0.05 sec.
2025-11-14 15:48:33,000 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:33,007 - INFO - Going to convert document batch...
2025-11-14 15:48:33,008 - INFO - Processing document 4_2023-11-30
2025-11-14 15:48:33,027 - INFO - Finished converting document 4_2023-11-30 in 0.05 sec.
2025-11-14 15:48:33,076 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:33,088 - INFO - Going to convert document batch...
2025-11-14 15:48:33,089 - INFO - Processing document 4_2023-12-05
2025-11-14 15:48:33,120 - INFO - Finished converting document 4_2023-12-05 in 0.08 sec.
2025-11-14 15:48:33,153 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:33,163 - INFO - Going to convert document batch...
2025-11-14 15:48:33,164 - INFO - Processing document 4_2023-12-07


Converted 'data\edgar_documents\BMY\4_2023-11-24' --> 'data\processed_data\BMY\4_2023-11-24.md'
Converted 'data\edgar_documents\BMY\4_2023-11-30' --> 'data\processed_data\BMY\4_2023-11-30.md'
Converted 'data\edgar_documents\BMY\4_2023-12-05' --> 'data\processed_data\BMY\4_2023-12-05.md'


2025-11-14 15:48:33,181 - INFO - Finished converting document 4_2023-12-07 in 0.03 sec.
2025-11-14 15:48:33,217 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:33,224 - INFO - Going to convert document batch...
2025-11-14 15:48:33,226 - INFO - Processing document 4_2024-01-03
2025-11-14 15:48:33,249 - INFO - Finished converting document 4_2024-01-03 in 0.05 sec.
2025-11-14 15:48:33,284 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:33,292 - INFO - Going to convert document batch...
2025-11-14 15:48:33,292 - INFO - Processing document 4_2024-02-05
2025-11-14 15:48:33,319 - INFO - Finished converting document 4_2024-02-05 in 0.05 sec.
2025-11-14 15:48:33,366 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:48:33,367 - ERROR - Input document 4_2024-02-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFo

Converted 'data\edgar_documents\BMY\4_2023-12-07' --> 'data\processed_data\BMY\4_2023-12-07.md'
Converted 'data\edgar_documents\BMY\4_2024-01-03' --> 'data\processed_data\BMY\4_2024-01-03.md'
Converted 'data\edgar_documents\BMY\4_2024-02-05' --> 'data\processed_data\BMY\4_2024-02-05.md'
Error processing data\edgar_documents\BMY\4_2024-02-13: File format not allowed: data\edgar_documents\BMY\4_2024-02-13


2025-11-14 15:48:33,396 - ERROR - Input document 4_2024-02-16 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:48:33,399 - INFO - Going to convert document batch...
2025-11-14 15:48:33,415 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:33,431 - INFO - Going to convert document batch...
2025-11-14 15:48:33,432 - INFO - Processing document 4_2024-03-04
2025-11-14 15:48:33,454 - INFO - Finished converting document 4_2024-03-04 in 0.06 sec.
2025-11-14 15:48:33,488 - INFO - detec

Error processing data\edgar_documents\BMY\4_2024-02-16: File format not allowed: data\edgar_documents\BMY\4_2024-02-16
Converted 'data\edgar_documents\BMY\4_2024-03-04' --> 'data\processed_data\BMY\4_2024-03-04.md'


2025-11-14 15:48:33,658 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:33,670 - INFO - Going to convert document batch...
2025-11-14 15:48:33,671 - INFO - Processing document 4_2024-04-02
2025-11-14 15:48:33,698 - INFO - Finished converting document 4_2024-04-02 in 0.06 sec.
2025-11-14 15:48:33,751 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:33,772 - INFO - Going to convert document batch...
2025-11-14 15:48:33,773 - INFO - Processing document 4_2024-05-03
2025-11-14 15:48:33,801 - INFO - Finished converting document 4_2024-05-03 in 0.08 sec.


Converted 'data\edgar_documents\BMY\4_2024-03-12' --> 'data\processed_data\BMY\4_2024-03-12.md'
Converted 'data\edgar_documents\BMY\4_2024-04-02' --> 'data\processed_data\BMY\4_2024-04-02.md'


2025-11-14 15:48:33,840 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:33,865 - INFO - Going to convert document batch...
2025-11-14 15:48:33,866 - INFO - Processing document 4_2024-07-02
2025-11-14 15:48:33,916 - INFO - Finished converting document 4_2024-07-02 in 0.09 sec.
2025-11-14 15:48:33,967 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:33,981 - INFO - Going to convert document batch...
2025-11-14 15:48:33,981 - INFO - Processing document 4_2024-07-31
2025-11-14 15:48:34,009 - INFO - Finished converting document 4_2024-07-31 in 0.05 sec.


Converted 'data\edgar_documents\BMY\4_2024-05-03' --> 'data\processed_data\BMY\4_2024-05-03.md'
Converted 'data\edgar_documents\BMY\4_2024-07-02' --> 'data\processed_data\BMY\4_2024-07-02.md'


2025-11-14 15:48:34,055 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:34,070 - INFO - Going to convert document batch...
2025-11-14 15:48:34,071 - INFO - Processing document 4_2024-08-05
2025-11-14 15:48:34,095 - INFO - Finished converting document 4_2024-08-05 in 0.05 sec.
2025-11-14 15:48:34,142 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:34,154 - INFO - Going to convert document batch...
2025-11-14 15:48:34,155 - INFO - Processing document 4_2024-10-02
2025-11-14 15:48:34,174 - INFO - Finished converting document 4_2024-10-02 in 0.06 sec.
2025-11-14 15:48:34,223 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:34,234 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BMY\4_2024-07-31' --> 'data\processed_data\BMY\4_2024-07-31.md'
Converted 'data\edgar_documents\BMY\4_2024-08-05' --> 'data\processed_data\BMY\4_2024-08-05.md'
Converted 'data\edgar_documents\BMY\4_2024-10-02' --> 'data\processed_data\BMY\4_2024-10-02.md'


2025-11-14 15:48:34,236 - INFO - Processing document 4_2024-10-03
2025-11-14 15:48:34,258 - INFO - Finished converting document 4_2024-10-03 in 0.06 sec.
2025-11-14 15:48:34,293 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:34,301 - INFO - Going to convert document batch...
2025-11-14 15:48:34,301 - INFO - Processing document 4_2024-11-05
2025-11-14 15:48:34,318 - INFO - Finished converting document 4_2024-11-05 in 0.03 sec.
2025-11-14 15:48:34,369 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:34,380 - INFO - Going to convert document batch...
2025-11-14 15:48:34,381 - INFO - Processing document 4_2025-01-02
2025-11-14 15:48:34,401 - INFO - Finished converting document 4_2025-01-02 in 0.06 sec.
2025-11-14 15:48:34,453 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:34,467 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BMY\4_2024-10-03' --> 'data\processed_data\BMY\4_2024-10-03.md'
Converted 'data\edgar_documents\BMY\4_2024-11-05' --> 'data\processed_data\BMY\4_2024-11-05.md'
Converted 'data\edgar_documents\BMY\4_2025-01-02' --> 'data\processed_data\BMY\4_2025-01-02.md'


2025-11-14 15:48:34,468 - INFO - Processing document 4_2025-02-04
2025-11-14 15:48:34,514 - INFO - Finished converting document 4_2025-02-04 in 0.09 sec.
2025-11-14 15:48:34,556 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:34,570 - INFO - Going to convert document batch...
2025-11-14 15:48:34,571 - INFO - Processing document 4_2025-02-19
2025-11-14 15:48:34,591 - INFO - Finished converting document 4_2025-02-19 in 0.05 sec.
2025-11-14 15:48:34,623 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:34,632 - INFO - Going to convert document batch...
2025-11-14 15:48:34,633 - INFO - Processing document 4_2025-02-21
2025-11-14 15:48:34,652 - INFO - Finished converting document 4_2025-02-21 in 0.05 sec.
2025-11-14 15:48:34,684 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:34,694 - INFO - Going to convert document batch...
2025-11-14 15:48:34,695 - INFO - Processing document 4_2025-03-04
2025-11-14 15:48:34,717 - IN

Converted 'data\edgar_documents\BMY\4_2025-02-04' --> 'data\processed_data\BMY\4_2025-02-04.md'
Converted 'data\edgar_documents\BMY\4_2025-02-19' --> 'data\processed_data\BMY\4_2025-02-19.md'
Converted 'data\edgar_documents\BMY\4_2025-02-21' --> 'data\processed_data\BMY\4_2025-02-21.md'
Converted 'data\edgar_documents\BMY\4_2025-03-04' --> 'data\processed_data\BMY\4_2025-03-04.md'


2025-11-14 15:48:34,756 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:34,775 - INFO - Going to convert document batch...
2025-11-14 15:48:34,777 - INFO - Processing document 4_2025-03-12
2025-11-14 15:48:34,824 - INFO - Finished converting document 4_2025-03-12 in 0.09 sec.
2025-11-14 15:48:34,876 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:34,885 - INFO - Going to convert document batch...
2025-11-14 15:48:34,886 - INFO - Processing document 4_2025-04-01
2025-11-14 15:48:34,906 - INFO - Finished converting document 4_2025-04-01 in 0.05 sec.
2025-11-14 15:48:34,941 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:34,952 - INFO - Going to convert document batch...
2025-11-14 15:48:34,953 - INFO - Processing document 4_2025-04-03
2025-11-14 15:48:34,979 - INFO - Finished converting document 4_2025-04-03 in 0.06 sec.
2025-11-14 15:48:35,012 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\BMY\4_2025-03-12' --> 'data\processed_data\BMY\4_2025-03-12.md'
Converted 'data\edgar_documents\BMY\4_2025-04-01' --> 'data\processed_data\BMY\4_2025-04-01.md'
Converted 'data\edgar_documents\BMY\4_2025-04-03' --> 'data\processed_data\BMY\4_2025-04-03.md'


2025-11-14 15:48:35,072 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:35,106 - INFO - Going to convert document batch...
2025-11-14 15:48:35,109 - INFO - Processing document 4_2025-05-05
2025-11-14 15:48:35,166 - INFO - Finished converting document 4_2025-05-05 in 0.09 sec.
2025-11-14 15:48:35,204 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:35,215 - INFO - Going to convert document batch...
2025-11-14 15:48:35,217 - INFO - Processing document 4_2025-05-13
2025-11-14 15:48:35,242 - INFO - Finished converting document 4_2025-05-13 in 0.05 sec.


Converted 'data\edgar_documents\BMY\4_2025-04-29' --> 'data\processed_data\BMY\4_2025-04-29.md'
Converted 'data\edgar_documents\BMY\4_2025-05-05' --> 'data\processed_data\BMY\4_2025-05-05.md'


2025-11-14 15:48:35,288 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:35,299 - INFO - Going to convert document batch...
2025-11-14 15:48:35,299 - INFO - Processing document 4_2025-06-04
2025-11-14 15:48:35,323 - INFO - Finished converting document 4_2025-06-04 in 0.06 sec.
2025-11-14 15:48:35,382 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:35,392 - INFO - Going to convert document batch...
2025-11-14 15:48:35,392 - INFO - Processing document 4_2025-06-16
2025-11-14 15:48:35,413 - INFO - Finished converting document 4_2025-06-16 in 0.06 sec.


Converted 'data\edgar_documents\BMY\4_2025-05-13' --> 'data\processed_data\BMY\4_2025-05-13.md'
Converted 'data\edgar_documents\BMY\4_2025-06-04' --> 'data\processed_data\BMY\4_2025-06-04.md'
Converted 'data\edgar_documents\BMY\4_2025-06-16' --> 'data\processed_data\BMY\4_2025-06-16.md'


2025-11-14 15:48:35,450 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:35,456 - INFO - Going to convert document batch...
2025-11-14 15:48:35,457 - INFO - Processing document 4_2025-07-01
2025-11-14 15:48:35,477 - INFO - Finished converting document 4_2025-07-01 in 0.03 sec.
2025-11-14 15:48:35,513 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:35,522 - INFO - Going to convert document batch...
2025-11-14 15:48:35,524 - INFO - Processing document 4_2025-07-02
2025-11-14 15:48:35,543 - INFO - Finished converting document 4_2025-07-02 in 0.05 sec.
2025-11-14 15:48:35,591 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:35,601 - INFO - Going to convert document batch...
2025-11-14 15:48:35,602 - INFO - Processing document 4_2025-08-05
2025-11-14 15:48:35,622 - INFO - Finished converting document 4_2025-08-05 in 0.06 sec.
2025-11-14 15:48:35,670 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\BMY\4_2025-07-01' --> 'data\processed_data\BMY\4_2025-07-01.md'
Converted 'data\edgar_documents\BMY\4_2025-07-02' --> 'data\processed_data\BMY\4_2025-07-02.md'
Converted 'data\edgar_documents\BMY\4_2025-08-05' --> 'data\processed_data\BMY\4_2025-08-05.md'


2025-11-14 15:48:35,684 - INFO - Processing document 4_2025-09-03
2025-11-14 15:48:35,705 - INFO - Finished converting document 4_2025-09-03 in 0.06 sec.
2025-11-14 15:48:35,739 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:35,746 - INFO - Going to convert document batch...
2025-11-14 15:48:35,747 - INFO - Processing document 4_2025-10-02
2025-11-14 15:48:35,766 - INFO - Finished converting document 4_2025-10-02 in 0.05 sec.
2025-11-14 15:48:35,814 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:35,829 - INFO - Going to convert document batch...
2025-11-14 15:48:35,830 - INFO - Processing document 4_2025-10-06
2025-11-14 15:48:35,849 - INFO - Finished converting document 4_2025-10-06 in 0.06 sec.
2025-11-14 15:48:35,894 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:48:35,895 - ERROR - Input document 4_2025-11-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>

Converted 'data\edgar_documents\BMY\4_2025-09-03' --> 'data\processed_data\BMY\4_2025-09-03.md'
Converted 'data\edgar_documents\BMY\4_2025-10-02' --> 'data\processed_data\BMY\4_2025-10-02.md'
Converted 'data\edgar_documents\BMY\4_2025-10-06' --> 'data\processed_data\BMY\4_2025-10-06.md'
Error processing data\edgar_documents\BMY\4_2025-11-03: File format not allowed: data\edgar_documents\BMY\4_2025-11-03


2025-11-14 15:48:35,918 - INFO - Going to convert document batch...
2025-11-14 15:48:35,919 - INFO - Processing document 4_2025-11-04
2025-11-14 15:48:35,943 - INFO - Finished converting document 4_2025-11-04 in 0.05 sec.
2025-11-14 15:48:35,991 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:48:35,992 - ERROR - Input document 4_2025-11-07 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:48:35,995 - INFO - Going to convert document batch...
2025-11-14 15:48:36,009 - IN

Converted 'data\edgar_documents\BMY\4_2025-11-04' --> 'data\processed_data\BMY\4_2025-11-04.md'
Error processing data\edgar_documents\BMY\4_2025-11-07: File format not allowed: data\edgar_documents\BMY\4_2025-11-07
Converted 'data\edgar_documents\BMY\8-K_2023-01-09' --> 'data\processed_data\BMY\8-K_2023-01-09.md'
Converted 'data\edgar_documents\BMY\8-K_2023-01-31' --> 'data\processed_data\BMY\8-K_2023-01-31.md'


2025-11-14 15:48:36,163 - INFO - Going to convert document batch...
2025-11-14 15:48:36,165 - INFO - Processing document 8-K_2023-02-02
2025-11-14 15:48:36,198 - INFO - Finished converting document 8-K_2023-02-02 in 0.08 sec.
2025-11-14 15:48:36,234 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:36,248 - INFO - Going to convert document batch...
2025-11-14 15:48:36,249 - INFO - Processing document 8-K_2023-02-28
2025-11-14 15:48:36,267 - INFO - Finished converting document 8-K_2023-02-28 in 0.05 sec.
2025-11-14 15:48:36,290 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:36,307 - INFO - Going to convert document batch...
2025-11-14 15:48:36,309 - INFO - Processing document 8-K_2023-04-26
2025-11-14 15:48:36,341 - INFO - Finished converting document 8-K_2023-04-26 in 0.06 sec.
2025-11-14 15:48:36,385 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:36,406 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BMY\8-K_2023-02-02' --> 'data\processed_data\BMY\8-K_2023-02-02.md'
Converted 'data\edgar_documents\BMY\8-K_2023-02-28' --> 'data\processed_data\BMY\8-K_2023-02-28.md'
Converted 'data\edgar_documents\BMY\8-K_2023-04-26' --> 'data\processed_data\BMY\8-K_2023-04-26.md'


2025-11-14 15:48:36,407 - INFO - Processing document 8-K_2023-04-27
2025-11-14 15:48:36,449 - INFO - Finished converting document 8-K_2023-04-27 in 0.09 sec.
2025-11-14 15:48:36,507 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:36,532 - INFO - Going to convert document batch...
2025-11-14 15:48:36,534 - INFO - Processing document 8-K_2023-05-04
2025-11-14 15:48:36,571 - INFO - Finished converting document 8-K_2023-05-04 in 0.09 sec.
2025-11-14 15:48:36,601 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:36,617 - INFO - Going to convert document batch...
2025-11-14 15:48:36,618 - INFO - Processing document 8-K_2023-07-27
2025-11-14 15:48:36,639 - INFO - Finished converting document 8-K_2023-07-27 in 0.06 sec.


Converted 'data\edgar_documents\BMY\8-K_2023-04-27' --> 'data\processed_data\BMY\8-K_2023-04-27.md'
Converted 'data\edgar_documents\BMY\8-K_2023-05-04' --> 'data\processed_data\BMY\8-K_2023-05-04.md'


2025-11-14 15:48:36,668 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:36,687 - INFO - Going to convert document batch...
2025-11-14 15:48:36,688 - INFO - Processing document 8-K_2023-08-10
2025-11-14 15:48:36,717 - INFO - Finished converting document 8-K_2023-08-10 in 0.06 sec.
2025-11-14 15:48:36,747 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:36,763 - INFO - Going to convert document batch...
2025-11-14 15:48:36,764 - INFO - Processing document 8-K_2023-10-26


Converted 'data\edgar_documents\BMY\8-K_2023-07-27' --> 'data\processed_data\BMY\8-K_2023-07-27.md'
Converted 'data\edgar_documents\BMY\8-K_2023-08-10' --> 'data\processed_data\BMY\8-K_2023-08-10.md'


2025-11-14 15:48:37,289 - INFO - Finished converting document 8-K_2023-10-26 in 0.55 sec.
2025-11-14 15:48:37,337 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:37,351 - INFO - Going to convert document batch...
2025-11-14 15:48:37,352 - INFO - Processing document 8-K_2023-10-31
2025-11-14 15:48:37,375 - INFO - Finished converting document 8-K_2023-10-31 in 0.06 sec.
2025-11-14 15:48:37,428 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:37,454 - INFO - Going to convert document batch...
2025-11-14 15:48:37,456 - INFO - Processing document 8-K_2023-11-13
2025-11-14 15:48:37,497 - INFO - Finished converting document 8-K_2023-11-13 in 0.11 sec.


Converted 'data\edgar_documents\BMY\8-K_2023-10-26' --> 'data\processed_data\BMY\8-K_2023-10-26.md'
Converted 'data\edgar_documents\BMY\8-K_2023-10-31' --> 'data\processed_data\BMY\8-K_2023-10-31.md'


2025-11-14 15:48:37,545 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:37,569 - INFO - Going to convert document batch...
2025-11-14 15:48:37,571 - INFO - Processing document 8-K_2023-12-22
2025-11-14 15:48:37,603 - INFO - Finished converting document 8-K_2023-12-22 in 0.08 sec.
2025-11-14 15:48:37,633 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:37,651 - INFO - Going to convert document batch...
2025-11-14 15:48:37,652 - INFO - Processing document 8-K_2024-01-08
2025-11-14 15:48:37,681 - INFO - Finished converting document 8-K_2024-01-08 in 0.06 sec.


Converted 'data\edgar_documents\BMY\8-K_2023-11-13' --> 'data\processed_data\BMY\8-K_2023-11-13.md'
Converted 'data\edgar_documents\BMY\8-K_2023-12-22' --> 'data\processed_data\BMY\8-K_2023-12-22.md'
Converted 'data\edgar_documents\BMY\8-K_2024-01-08' --> 'data\processed_data\BMY\8-K_2024-01-08.md'


2025-11-14 15:48:37,719 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:37,732 - INFO - Going to convert document batch...
2025-11-14 15:48:37,733 - INFO - Processing document 8-K_2024-02-02
2025-11-14 15:48:37,758 - INFO - Finished converting document 8-K_2024-02-02 in 0.06 sec.
2025-11-14 15:48:37,789 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:48:37,790 - ERROR - Input document 8-K_2024-02-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <I

Converted 'data\edgar_documents\BMY\8-K_2024-02-02' --> 'data\processed_data\BMY\8-K_2024-02-02.md'
Error processing data\edgar_documents\BMY\8-K_2024-02-14: File format not allowed: data\edgar_documents\BMY\8-K_2024-02-14
Error processing data\edgar_documents\BMY\8-K_2024-02-15: File format not allowed: data\edgar_documents\BMY\8-K_2024-02-15
Error processing data\edgar_documents\BMY\8-K_2024-02-22: File format not allowed: data\edgar_documents\BMY\8-K_2024-02-22
Error processing data\edgar_documents\BMY\8-K_2024-03-18: File format not allowed: data\edgar_documents\BMY\8-K_2024-03-18
Converted 'data\edgar_documents\BMY\8-K_2024-04-25' --> 'data\processed_data\BMY\8-K_2024-04-25.md'


2025-11-14 15:48:37,953 - ERROR - Input document 8-K_2024-05-09 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:48:37,954 - INFO - Going to convert document batch...
2025-11-14 15:48:37,970 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:48:37,971 - ERROR - Input document 8-K_2024-06-18 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, 

Error processing data\edgar_documents\BMY\8-K_2024-05-09: File format not allowed: data\edgar_documents\BMY\8-K_2024-05-09
Error processing data\edgar_documents\BMY\8-K_2024-06-18: File format not allowed: data\edgar_documents\BMY\8-K_2024-06-18
Converted 'data\edgar_documents\BMY\8-K_2024-07-26' --> 'data\processed_data\BMY\8-K_2024-07-26.md'
Converted 'data\edgar_documents\BMY\8-K_2024-10-31' --> 'data\processed_data\BMY\8-K_2024-10-31.md'
Error processing data\edgar_documents\BMY\8-K_2025-01-13: File format not allowed: data\edgar_documents\BMY\8-K_2025-01-13


2025-11-14 15:48:38,161 - INFO - Going to convert document batch...
2025-11-14 15:48:38,162 - INFO - Processing document 8-K_2025-02-06
2025-11-14 15:48:38,189 - INFO - Finished converting document 8-K_2025-02-06 in 0.06 sec.
2025-11-14 15:48:38,224 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:48:38,225 - ERROR - Input document 8-K_2025-02-18 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:48:38,227 - INFO - Going to convert docu

Converted 'data\edgar_documents\BMY\8-K_2025-02-06' --> 'data\processed_data\BMY\8-K_2025-02-06.md'
Error processing data\edgar_documents\BMY\8-K_2025-02-18: File format not allowed: data\edgar_documents\BMY\8-K_2025-02-18
Converted 'data\edgar_documents\BMY\8-K_2025-04-24' --> 'data\processed_data\BMY\8-K_2025-04-24.md'
Error processing data\edgar_documents\BMY\8-K_2025-05-07: File format not allowed: data\edgar_documents\BMY\8-K_2025-05-07
Error processing data\edgar_documents\BMY\8-K_2025-07-25: File format not allowed: data\edgar_documents\BMY\8-K_2025-07-25


2025-11-14 15:48:38,422 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:38,433 - INFO - Going to convert document batch...
2025-11-14 15:48:38,434 - INFO - Processing document 8-K_2025-10-30
2025-11-14 15:48:38,453 - INFO - Finished converting document 8-K_2025-10-30 in 0.05 sec.
2025-11-14 15:48:38,502 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:48:38,503 - ERROR - Input document 8-K_2025-11-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <I

Converted 'data\edgar_documents\BMY\8-K_2025-07-31' --> 'data\processed_data\BMY\8-K_2025-07-31.md'
Converted 'data\edgar_documents\BMY\8-K_2025-10-30' --> 'data\processed_data\BMY\8-K_2025-10-30.md'
Error processing data\edgar_documents\BMY\8-K_2025-11-03: File format not allowed: data\edgar_documents\BMY\8-K_2025-11-03
Error processing data\edgar_documents\BMY\8-K_2025-11-10: File format not allowed: data\edgar_documents\BMY\8-K_2025-11-10


2025-11-14 15:48:39,337 - INFO - Going to convert document batch...
2025-11-14 15:48:39,338 - INFO - Processing document DEF-14A_2023-03-23
2025-11-14 15:48:44,016 - INFO - Finished converting document DEF-14A_2023-03-23 in 5.48 sec.
2025-11-14 15:48:44,742 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:48:44,743 - ERROR - Input document DEF-14A_2024-03-28 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:48:44,746 - INFO - Going to 

Converted 'data\edgar_documents\BMY\DEF-14A_2023-03-23' --> 'data\processed_data\BMY\DEF-14A_2023-03-23.md'
Error processing data\edgar_documents\BMY\DEF-14A_2024-03-28: File format not allowed: data\edgar_documents\BMY\DEF-14A_2024-03-28


2025-11-14 15:48:45,510 - INFO - Going to convert document batch...
2025-11-14 15:48:45,511 - INFO - Processing document DEF-14A_2025-03-26
2025-11-14 15:48:47,130 - INFO - Finished converting document DEF-14A_2025-03-26 in 2.38 sec.


Converted 'data\edgar_documents\BMY\DEF-14A_2025-03-26' --> 'data\processed_data\BMY\DEF-14A_2025-03-26.md'
Processed 88 new files. Errors: 19
Found 157 files to process in data\edgar_documents\BRK-B


2025-11-14 15:48:48,225 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:48:51,071 - INFO - Going to convert document batch...
2025-11-14 15:48:51,072 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:48:51,072 - INFO - Processing document 10-K_2023-02-27
2025-11-14 15:48:56,348 - INFO - Finished converting document 10-K_2023-02-27 in 8.42 sec.
2025-11-14 15:48:57,225 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\10-K_2023-02-27' --> 'data\processed_data\BRK-B\10-K_2023-02-27.md'


2025-11-14 15:49:00,635 - INFO - Going to convert document batch...
2025-11-14 15:49:00,636 - INFO - Processing document 10-K_2024-02-26
2025-11-14 15:49:07,623 - INFO - Finished converting document 10-K_2024-02-26 in 10.61 sec.


Converted 'data\edgar_documents\BRK-B\10-K_2024-02-26' --> 'data\processed_data\BRK-B\10-K_2024-02-26.md'


2025-11-14 15:49:09,063 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:49:17,866 - INFO - Going to convert document batch...
2025-11-14 15:49:17,867 - INFO - Processing document 10-K_2025-02-24
2025-11-14 15:49:31,422 - INFO - Finished converting document 10-K_2025-02-24 in 22.55 sec.
2025-11-14 15:49:33,178 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\10-K_2025-02-24' --> 'data\processed_data\BRK-B\10-K_2025-02-24.md'


2025-11-14 15:49:35,225 - INFO - Going to convert document batch...
2025-11-14 15:49:35,226 - INFO - Processing document 10-Q_2023-05-08
2025-11-14 15:49:37,897 - INFO - Finished converting document 10-Q_2023-05-08 in 4.83 sec.
2025-11-14 15:49:38,387 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\10-Q_2023-05-08' --> 'data\processed_data\BRK-B\10-Q_2023-05-08.md'


2025-11-14 15:49:40,006 - INFO - Going to convert document batch...
2025-11-14 15:49:40,007 - INFO - Processing document 10-Q_2023-08-07
2025-11-14 15:49:44,675 - INFO - Finished converting document 10-Q_2023-08-07 in 6.44 sec.
2025-11-14 15:49:45,743 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\10-Q_2023-08-07' --> 'data\processed_data\BRK-B\10-Q_2023-08-07.md'


2025-11-14 15:49:49,138 - INFO - Going to convert document batch...
2025-11-14 15:49:49,139 - INFO - Processing document 10-Q_2023-11-06
2025-11-14 15:49:51,898 - INFO - Finished converting document 10-Q_2023-11-06 in 6.28 sec.
2025-11-14 15:49:52,428 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\10-Q_2023-11-06' --> 'data\processed_data\BRK-B\10-Q_2023-11-06.md'


2025-11-14 15:49:53,603 - INFO - Going to convert document batch...
2025-11-14 15:49:53,604 - INFO - Processing document 10-Q_2024-05-06
2025-11-14 15:49:55,863 - INFO - Finished converting document 10-Q_2024-05-06 in 3.50 sec.
2025-11-14 15:49:56,260 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\10-Q_2024-05-06' --> 'data\processed_data\BRK-B\10-Q_2024-05-06.md'


2025-11-14 15:49:57,552 - INFO - Going to convert document batch...
2025-11-14 15:49:57,553 - INFO - Processing document 10-Q_2024-08-05
2025-11-14 15:50:00,260 - INFO - Finished converting document 10-Q_2024-08-05 in 4.09 sec.
2025-11-14 15:50:00,732 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\10-Q_2024-08-05' --> 'data\processed_data\BRK-B\10-Q_2024-08-05.md'


2025-11-14 15:50:03,475 - INFO - Going to convert document batch...
2025-11-14 15:50:03,476 - INFO - Processing document 10-Q_2024-11-04
2025-11-14 15:50:07,838 - INFO - Finished converting document 10-Q_2024-11-04 in 7.20 sec.
2025-11-14 15:50:08,656 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\10-Q_2024-11-04' --> 'data\processed_data\BRK-B\10-Q_2024-11-04.md'


2025-11-14 15:50:12,523 - INFO - Going to convert document batch...
2025-11-14 15:50:12,524 - INFO - Processing document 10-Q_2025-05-05
2025-11-14 15:50:15,999 - INFO - Finished converting document 10-Q_2025-05-05 in 7.45 sec.
2025-11-14 15:50:16,966 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\10-Q_2025-05-05' --> 'data\processed_data\BRK-B\10-Q_2025-05-05.md'


2025-11-14 15:50:21,553 - INFO - Going to convert document batch...
2025-11-14 15:50:21,554 - INFO - Processing document 10-Q_2025-08-04
2025-11-14 15:50:26,216 - INFO - Finished converting document 10-Q_2025-08-04 in 9.42 sec.
2025-11-14 15:50:27,242 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\10-Q_2025-08-04' --> 'data\processed_data\BRK-B\10-Q_2025-08-04.md'


2025-11-14 15:50:31,791 - INFO - Going to convert document batch...
2025-11-14 15:50:31,793 - INFO - Processing document 10-Q_2025-11-03
2025-11-14 15:50:36,374 - INFO - Finished converting document 10-Q_2025-11-03 in 9.27 sec.
2025-11-14 15:50:37,367 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:37,396 - INFO - Going to convert document batch...
2025-11-14 15:50:37,398 - INFO - Processing document 4_2023-02-24
2025-11-14 15:50:37,466 - INFO - Finished converting document 4_2023-02-24 in 0.14 sec.


Converted 'data\edgar_documents\BRK-B\10-Q_2025-11-03' --> 'data\processed_data\BRK-B\10-Q_2025-11-03.md'


2025-11-14 15:50:37,547 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:37,569 - INFO - Going to convert document batch...
2025-11-14 15:50:37,571 - INFO - Processing document 4_2023-03-03
2025-11-14 15:50:37,634 - INFO - Finished converting document 4_2023-03-03 in 0.09 sec.
2025-11-14 15:50:37,718 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2023-02-24' --> 'data\processed_data\BRK-B\4_2023-02-24.md'
Converted 'data\edgar_documents\BRK-B\4_2023-03-03' --> 'data\processed_data\BRK-B\4_2023-03-03.md'


2025-11-14 15:50:37,762 - INFO - Going to convert document batch...
2025-11-14 15:50:37,765 - INFO - Processing document 4_2023-03-07
2025-11-14 15:50:37,875 - INFO - Finished converting document 4_2023-03-07 in 0.19 sec.
2025-11-14 15:50:37,970 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:38,023 - INFO - Going to convert document batch...
2025-11-14 15:50:38,024 - INFO - Processing document 4_2023-03-15
2025-11-14 15:50:38,158 - INFO - Finished converting document 4_2023-03-15 in 0.20 sec.


Converted 'data\edgar_documents\BRK-B\4_2023-03-07' --> 'data\processed_data\BRK-B\4_2023-03-07.md'


2025-11-14 15:50:38,258 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:38,281 - INFO - Going to convert document batch...
2025-11-14 15:50:38,282 - INFO - Processing document 4_2023-03-21
2025-11-14 15:50:38,338 - INFO - Finished converting document 4_2023-03-21 in 0.09 sec.
2025-11-14 15:50:38,427 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2023-03-15' --> 'data\processed_data\BRK-B\4_2023-03-15.md'
Converted 'data\edgar_documents\BRK-B\4_2023-03-21' --> 'data\processed_data\BRK-B\4_2023-03-21.md'


2025-11-14 15:50:38,463 - INFO - Going to convert document batch...
2025-11-14 15:50:38,466 - INFO - Processing document 4_2023-03-27
2025-11-14 15:50:38,559 - INFO - Finished converting document 4_2023-03-27 in 0.16 sec.
2025-11-14 15:50:38,654 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:50:38,655 - ERROR - Input document 4_2023-04-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:50:38,657 - INFO - Going to convert document batch...
2025-11-14 15:50:38,676 - IN

Converted 'data\edgar_documents\BRK-B\4_2023-03-27' --> 'data\processed_data\BRK-B\4_2023-03-27.md'
Error processing data\edgar_documents\BRK-B\4_2023-04-05: File format not allowed: data\edgar_documents\BRK-B\4_2023-04-05
Error processing data\edgar_documents\BRK-B\4_2023-04-17: File format not allowed: data\edgar_documents\BRK-B\4_2023-04-17


2025-11-14 15:50:38,876 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:38,942 - INFO - Going to convert document batch...
2025-11-14 15:50:38,944 - INFO - Processing document 4_2023-05-15


Converted 'data\edgar_documents\BRK-B\4_2023-05-12' --> 'data\processed_data\BRK-B\4_2023-05-12.md'


2025-11-14 15:50:39,080 - INFO - Finished converting document 4_2023-05-15 in 0.22 sec.
2025-11-14 15:50:39,197 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:39,238 - INFO - Going to convert document batch...
2025-11-14 15:50:39,239 - INFO - Processing document 4_2023-05-18
2025-11-14 15:50:39,317 - INFO - Finished converting document 4_2023-05-18 in 0.12 sec.


Converted 'data\edgar_documents\BRK-B\4_2023-05-15' --> 'data\processed_data\BRK-B\4_2023-05-15.md'
Converted 'data\edgar_documents\BRK-B\4_2023-05-18' --> 'data\processed_data\BRK-B\4_2023-05-18.md'


2025-11-14 15:50:39,417 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:39,448 - INFO - Going to convert document batch...
2025-11-14 15:50:39,449 - INFO - Processing document 4_2023-05-30
2025-11-14 15:50:39,528 - INFO - Finished converting document 4_2023-05-30 in 0.14 sec.
2025-11-14 15:50:39,615 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:39,642 - INFO - Going to convert document batch...
2025-11-14 15:50:39,643 - INFO - Processing document 4_2023-06-09
2025-11-14 15:50:39,703 - INFO - Finished converting document 4_2023-06-09 in 0.11 sec.


Converted 'data\edgar_documents\BRK-B\4_2023-05-30' --> 'data\processed_data\BRK-B\4_2023-05-30.md'


2025-11-14 15:50:39,794 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:39,823 - INFO - Going to convert document batch...
2025-11-14 15:50:39,824 - INFO - Processing document 4_2023-06-22
2025-11-14 15:50:39,885 - INFO - Finished converting document 4_2023-06-22 in 0.11 sec.
2025-11-14 15:50:39,979 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2023-06-09' --> 'data\processed_data\BRK-B\4_2023-06-09.md'
Converted 'data\edgar_documents\BRK-B\4_2023-06-22' --> 'data\processed_data\BRK-B\4_2023-06-22.md'


2025-11-14 15:50:40,028 - INFO - Going to convert document batch...
2025-11-14 15:50:40,029 - INFO - Processing document 4_2023-06-28
2025-11-14 15:50:40,106 - INFO - Finished converting document 4_2023-06-28 in 0.16 sec.
2025-11-14 15:50:40,195 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:40,220 - INFO - Going to convert document batch...
2025-11-14 15:50:40,221 - INFO - Processing document 4_2023-06-30
2025-11-14 15:50:40,273 - INFO - Finished converting document 4_2023-06-30 in 0.08 sec.
2025-11-14 15:50:40,356 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:40,376 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BRK-B\4_2023-06-28' --> 'data\processed_data\BRK-B\4_2023-06-28.md'
Converted 'data\edgar_documents\BRK-B\4_2023-06-30' --> 'data\processed_data\BRK-B\4_2023-06-30.md'


2025-11-14 15:50:40,377 - INFO - Processing document 4_2023-08-10
2025-11-14 15:50:40,424 - INFO - Finished converting document 4_2023-08-10 in 0.09 sec.
2025-11-14 15:50:40,501 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:40,526 - INFO - Going to convert document batch...
2025-11-14 15:50:40,527 - INFO - Processing document 4_2023-08-15
2025-11-14 15:50:40,569 - INFO - Finished converting document 4_2023-08-15 in 0.09 sec.
2025-11-14 15:50:40,639 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2023-08-10' --> 'data\processed_data\BRK-B\4_2023-08-10.md'
Converted 'data\edgar_documents\BRK-B\4_2023-08-15' --> 'data\processed_data\BRK-B\4_2023-08-15.md'


2025-11-14 15:50:40,658 - INFO - Going to convert document batch...
2025-11-14 15:50:40,660 - INFO - Processing document 4_2023-08-16
2025-11-14 15:50:40,712 - INFO - Finished converting document 4_2023-08-16 in 0.09 sec.
2025-11-14 15:50:40,769 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:40,793 - INFO - Going to convert document batch...
2025-11-14 15:50:40,794 - INFO - Processing document 4_2023-08-17
2025-11-14 15:50:40,848 - INFO - Finished converting document 4_2023-08-17 in 0.09 sec.
2025-11-14 15:50:40,910 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:40,931 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BRK-B\4_2023-08-16' --> 'data\processed_data\BRK-B\4_2023-08-16.md'
Converted 'data\edgar_documents\BRK-B\4_2023-08-17' --> 'data\processed_data\BRK-B\4_2023-08-17.md'


2025-11-14 15:50:40,932 - INFO - Processing document 4_2023-09-08
2025-11-14 15:50:41,002 - INFO - Finished converting document 4_2023-09-08 in 0.11 sec.
2025-11-14 15:50:41,082 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:41,111 - INFO - Going to convert document batch...
2025-11-14 15:50:41,112 - INFO - Processing document 4_2023-09-13
2025-11-14 15:50:41,180 - INFO - Finished converting document 4_2023-09-13 in 0.11 sec.


Converted 'data\edgar_documents\BRK-B\4_2023-09-08' --> 'data\processed_data\BRK-B\4_2023-09-08.md'
Converted 'data\edgar_documents\BRK-B\4_2023-09-13' --> 'data\processed_data\BRK-B\4_2023-09-13.md'


2025-11-14 15:50:41,281 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:41,314 - INFO - Going to convert document batch...
2025-11-14 15:50:41,315 - INFO - Processing document 4_2023-09-22
2025-11-14 15:50:41,393 - INFO - Finished converting document 4_2023-09-22 in 0.14 sec.
2025-11-14 15:50:41,465 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:41,494 - INFO - Going to convert document batch...
2025-11-14 15:50:41,495 - INFO - Processing document 4_2023-09-27
2025-11-14 15:50:41,561 - INFO - Finished converting document 4_2023-09-27 in 0.11 sec.
2025-11-14 15:50:41,629 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2023-09-22' --> 'data\processed_data\BRK-B\4_2023-09-22.md'
Converted 'data\edgar_documents\BRK-B\4_2023-09-27' --> 'data\processed_data\BRK-B\4_2023-09-27.md'


2025-11-14 15:50:41,657 - INFO - Going to convert document batch...
2025-11-14 15:50:41,658 - INFO - Processing document 4_2023-10-02
2025-11-14 15:50:41,727 - INFO - Finished converting document 4_2023-10-02 in 0.11 sec.
2025-11-14 15:50:41,810 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:41,832 - INFO - Going to convert document batch...
2025-11-14 15:50:41,833 - INFO - Processing document 4_2023-10-05
2025-11-14 15:50:41,890 - INFO - Finished converting document 4_2023-10-05 in 0.11 sec.
2025-11-14 15:50:41,953 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2023-10-02' --> 'data\processed_data\BRK-B\4_2023-10-02.md'
Converted 'data\edgar_documents\BRK-B\4_2023-10-05' --> 'data\processed_data\BRK-B\4_2023-10-05.md'


2025-11-14 15:50:41,982 - INFO - Going to convert document batch...
2025-11-14 15:50:41,983 - INFO - Processing document 4_2023-10-25
2025-11-14 15:50:42,047 - INFO - Finished converting document 4_2023-10-25 in 0.11 sec.
2025-11-14 15:50:42,135 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:42,168 - INFO - Going to convert document batch...
2025-11-14 15:50:42,171 - INFO - Processing document 4_2023-10-30
2025-11-14 15:50:42,267 - INFO - Finished converting document 4_2023-10-30 in 0.16 sec.


Converted 'data\edgar_documents\BRK-B\4_2023-10-25' --> 'data\processed_data\BRK-B\4_2023-10-25.md'


2025-11-14 15:50:42,359 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:50:42,360 - ERROR - Input document 4_2023-11-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:50:42,362 - INFO - Going to convert document batch...
2025-11-14 15:50:42,375 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:42,400 - INFO - Going to convert document batch...
2025-11-14 15:50:42,402 - INFO - Processing document 4_2023-11-13
2025-11-14 15:50:42,452 - INFO - Fin

Converted 'data\edgar_documents\BRK-B\4_2023-10-30' --> 'data\processed_data\BRK-B\4_2023-10-30.md'
Error processing data\edgar_documents\BRK-B\4_2023-11-08: File format not allowed: data\edgar_documents\BRK-B\4_2023-11-08
Converted 'data\edgar_documents\BRK-B\4_2023-11-13' --> 'data\processed_data\BRK-B\4_2023-11-13.md'
Error processing data\edgar_documents\BRK-B\4_2023-11-20: File format not allowed: data\edgar_documents\BRK-B\4_2023-11-20


2025-11-14 15:50:42,539 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:42,562 - INFO - Going to convert document batch...
2025-11-14 15:50:42,563 - INFO - Processing document 4_2023-11-21
2025-11-14 15:50:42,627 - INFO - Finished converting document 4_2023-11-21 in 0.09 sec.
2025-11-14 15:50:42,691 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:42,716 - INFO - Going to convert document batch...
2025-11-14 15:50:42,717 - INFO - Processing document 4_2023-11-27
2025-11-14 15:50:42,776 - INFO - Finished converting document 4_2023-11-27 in 0.11 sec.
2025-11-14 15:50:42,859 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2023-11-21' --> 'data\processed_data\BRK-B\4_2023-11-21.md'
Converted 'data\edgar_documents\BRK-B\4_2023-11-27' --> 'data\processed_data\BRK-B\4_2023-11-27.md'


2025-11-14 15:50:44,201 - INFO - Going to convert document batch...
2025-11-14 15:50:44,202 - INFO - Processing document 4_2023-12-13
2025-11-14 15:50:44,285 - INFO - Finished converting document 4_2023-12-13 in 1.45 sec.
2025-11-14 15:50:44,361 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:44,386 - INFO - Going to convert document batch...
2025-11-14 15:50:44,388 - INFO - Processing document 4_2023-12-14
2025-11-14 15:50:44,454 - INFO - Finished converting document 4_2023-12-14 in 0.11 sec.
2025-11-14 15:50:44,533 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2023-12-13' --> 'data\processed_data\BRK-B\4_2023-12-13.md'
Converted 'data\edgar_documents\BRK-B\4_2023-12-14' --> 'data\processed_data\BRK-B\4_2023-12-14.md'


2025-11-14 15:50:44,556 - INFO - Going to convert document batch...
2025-11-14 15:50:44,557 - INFO - Processing document 4_2023-12-18
2025-11-14 15:50:44,612 - INFO - Finished converting document 4_2023-12-18 in 0.11 sec.
2025-11-14 15:50:44,671 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:44,704 - INFO - Going to convert document batch...
2025-11-14 15:50:44,705 - INFO - Processing document 4_2023-12-21
2025-11-14 15:50:44,789 - INFO - Finished converting document 4_2023-12-21 in 0.12 sec.


Converted 'data\edgar_documents\BRK-B\4_2023-12-18' --> 'data\processed_data\BRK-B\4_2023-12-18.md'
Converted 'data\edgar_documents\BRK-B\4_2023-12-21' --> 'data\processed_data\BRK-B\4_2023-12-21.md'


2025-11-14 15:50:44,882 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:44,912 - INFO - Going to convert document batch...
2025-11-14 15:50:44,913 - INFO - Processing document 4_2024-01-04
2025-11-14 15:50:44,980 - INFO - Finished converting document 4_2024-01-04 in 0.12 sec.
2025-11-14 15:50:45,050 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:45,077 - INFO - Going to convert document batch...
2025-11-14 15:50:45,079 - INFO - Processing document 4_2024-01-12
2025-11-14 15:50:45,134 - INFO - Finished converting document 4_2024-01-12 in 0.09 sec.
2025-11-14 15:50:45,197 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2024-01-04' --> 'data\processed_data\BRK-B\4_2024-01-04.md'
Converted 'data\edgar_documents\BRK-B\4_2024-01-12' --> 'data\processed_data\BRK-B\4_2024-01-12.md'


2025-11-14 15:50:45,229 - INFO - Going to convert document batch...
2025-11-14 15:50:45,231 - INFO - Processing document 4_2024-01-17
2025-11-14 15:50:45,312 - INFO - Finished converting document 4_2024-01-17 in 0.12 sec.
2025-11-14 15:50:45,401 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:45,429 - INFO - Going to convert document batch...
2025-11-14 15:50:45,431 - INFO - Processing document 4_2024-01-18
2025-11-14 15:50:45,561 - INFO - Finished converting document 4_2024-01-18 in 0.17 sec.


Converted 'data\edgar_documents\BRK-B\4_2024-01-17' --> 'data\processed_data\BRK-B\4_2024-01-17.md'


2025-11-14 15:50:45,660 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:45,690 - INFO - Going to convert document batch...
2025-11-14 15:50:45,691 - INFO - Processing document 4_2024-01-25
2025-11-14 15:50:45,767 - INFO - Finished converting document 4_2024-01-25 in 0.12 sec.


Converted 'data\edgar_documents\BRK-B\4_2024-01-18' --> 'data\processed_data\BRK-B\4_2024-01-18.md'
Converted 'data\edgar_documents\BRK-B\4_2024-01-25' --> 'data\processed_data\BRK-B\4_2024-01-25.md'


2025-11-14 15:50:45,849 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:45,886 - INFO - Going to convert document batch...
2025-11-14 15:50:45,888 - INFO - Processing document 4_2024-02-01
2025-11-14 15:50:45,978 - INFO - Finished converting document 4_2024-02-01 in 0.16 sec.
2025-11-14 15:50:46,045 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:46,081 - INFO - Going to convert document batch...
2025-11-14 15:50:46,083 - INFO - Processing document 4_2024-02-05
2025-11-14 15:50:46,167 - INFO - Finished converting document 4_2024-02-05 in 0.14 sec.


Converted 'data\edgar_documents\BRK-B\4_2024-02-01' --> 'data\processed_data\BRK-B\4_2024-02-01.md'


2025-11-14 15:50:46,255 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:46,280 - INFO - Going to convert document batch...
2025-11-14 15:50:46,282 - INFO - Processing document 4_2024-03-06
2025-11-14 15:50:46,344 - INFO - Finished converting document 4_2024-03-06 in 0.11 sec.
2025-11-14 15:50:46,412 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2024-02-05' --> 'data\processed_data\BRK-B\4_2024-02-05.md'
Converted 'data\edgar_documents\BRK-B\4_2024-03-06' --> 'data\processed_data\BRK-B\4_2024-03-06.md'


2025-11-14 15:50:46,438 - INFO - Going to convert document batch...
2025-11-14 15:50:46,439 - INFO - Processing document 4_2024-03-12
2025-11-14 15:50:46,503 - INFO - Finished converting document 4_2024-03-12 in 0.09 sec.
2025-11-14 15:50:46,568 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:46,593 - INFO - Going to convert document batch...
2025-11-14 15:50:46,594 - INFO - Processing document 4_2024-03-25
2025-11-14 15:50:46,687 - INFO - Finished converting document 4_2024-03-25 in 0.14 sec.


Converted 'data\edgar_documents\BRK-B\4_2024-03-12' --> 'data\processed_data\BRK-B\4_2024-03-12.md'
Converted 'data\edgar_documents\BRK-B\4_2024-03-25' --> 'data\processed_data\BRK-B\4_2024-03-25.md'


2025-11-14 15:50:46,757 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:46,783 - INFO - Going to convert document batch...
2025-11-14 15:50:46,785 - INFO - Processing document 4_2024-03-28
2025-11-14 15:50:46,849 - INFO - Finished converting document 4_2024-03-28 in 0.11 sec.
2025-11-14 15:50:46,914 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:46,940 - INFO - Going to convert document batch...
2025-11-14 15:50:46,942 - INFO - Processing document 4_2024-04-08
2025-11-14 15:50:47,013 - INFO - Finished converting document 4_2024-04-08 in 0.11 sec.
2025-11-14 15:50:47,114 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\BRK-B\4_2024-03-28' --> 'data\processed_data\BRK-B\4_2024-03-28.md'
Converted 'data\edgar_documents\BRK-B\4_2024-04-08' --> 'data\processed_data\BRK-B\4_2024-04-08.md'


2025-11-14 15:50:47,115 - ERROR - Input document 4_2024-04-09 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:50:47,117 - INFO - Going to convert document batch...
2025-11-14 15:50:47,131 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:47,159 - INFO - Going to convert document batch...
2025-11-14 15:50:47,160 - INFO - Processing document 4_2024-04-12
2025-11-14 15:50:47,220 - INFO - Finished converting document 4_2024-04-12 in 0.09 sec.
2025-11-14 15:50:47,297 - INFO - detec

Error processing data\edgar_documents\BRK-B\4_2024-04-09: File format not allowed: data\edgar_documents\BRK-B\4_2024-04-09
Converted 'data\edgar_documents\BRK-B\4_2024-04-12' --> 'data\processed_data\BRK-B\4_2024-04-12.md'
Error processing data\edgar_documents\BRK-B\4_2024-04-22: File format not allowed: data\edgar_documents\BRK-B\4_2024-04-22


2025-11-14 15:50:47,342 - INFO - Going to convert document batch...
2025-11-14 15:50:47,344 - INFO - Processing document 4_2024-04-26
2025-11-14 15:50:47,410 - INFO - Finished converting document 4_2024-04-26 in 0.11 sec.
2025-11-14 15:50:47,476 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:47,500 - INFO - Going to convert document batch...
2025-11-14 15:50:47,501 - INFO - Processing document 4_2024-05-01
2025-11-14 15:50:47,556 - INFO - Finished converting document 4_2024-05-01 in 0.09 sec.
2025-11-14 15:50:47,623 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:47,645 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BRK-B\4_2024-04-26' --> 'data\processed_data\BRK-B\4_2024-04-26.md'
Converted 'data\edgar_documents\BRK-B\4_2024-05-01' --> 'data\processed_data\BRK-B\4_2024-05-01.md'


2025-11-14 15:50:47,646 - INFO - Processing document 4_2024-05-17
2025-11-14 15:50:47,705 - INFO - Finished converting document 4_2024-05-17 in 0.09 sec.
2025-11-14 15:50:47,769 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:47,795 - INFO - Going to convert document batch...
2025-11-14 15:50:47,796 - INFO - Processing document 4_2024-06-07
2025-11-14 15:50:47,880 - INFO - Finished converting document 4_2024-06-07 in 0.12 sec.


Converted 'data\edgar_documents\BRK-B\4_2024-05-17' --> 'data\processed_data\BRK-B\4_2024-05-17.md'
Converted 'data\edgar_documents\BRK-B\4_2024-06-07' --> 'data\processed_data\BRK-B\4_2024-06-07.md'


2025-11-14 15:50:47,975 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:48,008 - INFO - Going to convert document batch...
2025-11-14 15:50:48,009 - INFO - Processing document 4_2024-06-12
2025-11-14 15:50:48,075 - INFO - Finished converting document 4_2024-06-12 in 0.12 sec.
2025-11-14 15:50:48,143 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:48,169 - INFO - Going to convert document batch...
2025-11-14 15:50:48,171 - INFO - Processing document 4_2024-06-17
2025-11-14 15:50:48,236 - INFO - Finished converting document 4_2024-06-17 in 0.11 sec.


Converted 'data\edgar_documents\BRK-B\4_2024-06-12' --> 'data\processed_data\BRK-B\4_2024-06-12.md'
Converted 'data\edgar_documents\BRK-B\4_2024-06-17' --> 'data\processed_data\BRK-B\4_2024-06-17.md'


2025-11-14 15:50:48,327 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:48,356 - INFO - Going to convert document batch...
2025-11-14 15:50:48,357 - INFO - Processing document 4_2024-06-20
2025-11-14 15:50:48,427 - INFO - Finished converting document 4_2024-06-20 in 0.12 sec.
2025-11-14 15:50:48,528 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:48,550 - INFO - Going to convert document batch...
2025-11-14 15:50:48,551 - INFO - Processing document 4_2024-06-28
2025-11-14 15:50:48,605 - INFO - Finished converting document 4_2024-06-28 in 0.09 sec.
2025-11-14 15:50:48,683 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:48,699 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BRK-B\4_2024-06-20' --> 'data\processed_data\BRK-B\4_2024-06-20.md'
Converted 'data\edgar_documents\BRK-B\4_2024-06-28' --> 'data\processed_data\BRK-B\4_2024-06-28.md'


2025-11-14 15:50:48,701 - INFO - Processing document 4_2024-07-02
2025-11-14 15:50:48,745 - INFO - Finished converting document 4_2024-07-02 in 0.09 sec.
2025-11-14 15:50:48,813 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:48,844 - INFO - Going to convert document batch...
2025-11-14 15:50:48,845 - INFO - Processing document 4_2024-07-19
2025-11-14 15:50:48,915 - INFO - Finished converting document 4_2024-07-19 in 0.12 sec.


Converted 'data\edgar_documents\BRK-B\4_2024-07-02' --> 'data\processed_data\BRK-B\4_2024-07-02.md'


2025-11-14 15:50:48,979 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:49,006 - INFO - Going to convert document batch...
2025-11-14 15:50:49,007 - INFO - Processing document 4_2024-07-24
2025-11-14 15:50:49,067 - INFO - Finished converting document 4_2024-07-24 in 0.09 sec.
2025-11-14 15:50:49,143 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:49,177 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BRK-B\4_2024-07-19' --> 'data\processed_data\BRK-B\4_2024-07-19.md'
Converted 'data\edgar_documents\BRK-B\4_2024-07-24' --> 'data\processed_data\BRK-B\4_2024-07-24.md'


2025-11-14 15:50:49,178 - INFO - Processing document 4_2024-07-29
2025-11-14 15:50:49,255 - INFO - Finished converting document 4_2024-07-29 in 0.14 sec.
2025-11-14 15:50:49,333 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:49,365 - INFO - Going to convert document batch...
2025-11-14 15:50:49,366 - INFO - Processing document 4_2024-08-01
2025-11-14 15:50:49,447 - INFO - Finished converting document 4_2024-08-01 in 0.12 sec.


Converted 'data\edgar_documents\BRK-B\4_2024-07-29' --> 'data\processed_data\BRK-B\4_2024-07-29.md'


2025-11-14 15:50:49,525 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:49,550 - INFO - Going to convert document batch...
2025-11-14 15:50:49,551 - INFO - Processing document 4_2024-08-19
2025-11-14 15:50:49,616 - INFO - Finished converting document 4_2024-08-19 in 0.09 sec.
2025-11-14 15:50:49,701 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2024-08-01' --> 'data\processed_data\BRK-B\4_2024-08-01.md'
Converted 'data\edgar_documents\BRK-B\4_2024-08-19' --> 'data\processed_data\BRK-B\4_2024-08-19.md'


2025-11-14 15:50:49,726 - INFO - Going to convert document batch...
2025-11-14 15:50:49,727 - INFO - Processing document 4_2024-08-27
2025-11-14 15:50:49,795 - INFO - Finished converting document 4_2024-08-27 in 0.12 sec.
2025-11-14 15:50:49,859 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2024-08-27' --> 'data\processed_data\BRK-B\4_2024-08-27.md'


2025-11-14 15:50:50,321 - INFO - Going to convert document batch...
2025-11-14 15:50:50,323 - INFO - Processing document 4_2024-08-30
2025-11-14 15:50:50,390 - INFO - Finished converting document 4_2024-08-30 in 0.55 sec.
2025-11-14 15:50:50,464 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:50,495 - INFO - Going to convert document batch...
2025-11-14 15:50:50,496 - INFO - Processing document 4_2024-09-05
2025-11-14 15:50:50,576 - INFO - Finished converting document 4_2024-09-05 in 0.12 sec.


Converted 'data\edgar_documents\BRK-B\4_2024-08-30' --> 'data\processed_data\BRK-B\4_2024-08-30.md'
Converted 'data\edgar_documents\BRK-B\4_2024-09-05' --> 'data\processed_data\BRK-B\4_2024-09-05.md'


2025-11-14 15:50:50,662 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:50,693 - INFO - Going to convert document batch...
2025-11-14 15:50:50,694 - INFO - Processing document 4_2024-09-10
2025-11-14 15:50:50,758 - INFO - Finished converting document 4_2024-09-10 in 0.12 sec.
2025-11-14 15:50:50,834 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:50,861 - INFO - Going to convert document batch...
2025-11-14 15:50:50,862 - INFO - Processing document 4_2024-09-11
2025-11-14 15:50:50,928 - INFO - Finished converting document 4_2024-09-11 in 0.09 sec.
2025-11-14 15:50:50,995 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2024-09-10' --> 'data\processed_data\BRK-B\4_2024-09-10.md'
Converted 'data\edgar_documents\BRK-B\4_2024-09-11' --> 'data\processed_data\BRK-B\4_2024-09-11.md'


2025-11-14 15:50:51,021 - INFO - Going to convert document batch...
2025-11-14 15:50:51,022 - INFO - Processing document 4_2024-09-12
2025-11-14 15:50:51,085 - INFO - Finished converting document 4_2024-09-12 in 0.09 sec.
2025-11-14 15:50:51,171 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:51,200 - INFO - Going to convert document batch...
2025-11-14 15:50:51,201 - INFO - Processing document 4_2024-09-13
2025-11-14 15:50:51,263 - INFO - Finished converting document 4_2024-09-13 in 0.11 sec.


Converted 'data\edgar_documents\BRK-B\4_2024-09-12' --> 'data\processed_data\BRK-B\4_2024-09-12.md'
Converted 'data\edgar_documents\BRK-B\4_2024-09-13' --> 'data\processed_data\BRK-B\4_2024-09-13.md'


2025-11-14 15:50:51,358 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:51,396 - INFO - Going to convert document batch...
2025-11-14 15:50:51,397 - INFO - Processing document 4_2024-09-19
2025-11-14 15:50:51,473 - INFO - Finished converting document 4_2024-09-19 in 0.14 sec.
2025-11-14 15:50:51,545 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:51,569 - INFO - Going to convert document batch...
2025-11-14 15:50:51,570 - INFO - Processing document 4_2024-09-24
2025-11-14 15:50:51,639 - INFO - Finished converting document 4_2024-09-24 in 0.11 sec.
2025-11-14 15:50:51,712 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2024-09-19' --> 'data\processed_data\BRK-B\4_2024-09-19.md'
Converted 'data\edgar_documents\BRK-B\4_2024-09-24' --> 'data\processed_data\BRK-B\4_2024-09-24.md'


2025-11-14 15:50:51,740 - INFO - Going to convert document batch...
2025-11-14 15:50:51,742 - INFO - Processing document 4_2024-09-27
2025-11-14 15:50:51,812 - INFO - Finished converting document 4_2024-09-27 in 0.11 sec.
2025-11-14 15:50:51,886 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:50:51,886 - ERROR - Input document 4_2024-10-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:50:51,889 - INFO - Going to convert document batch...
2025-11-14 15:50:51,901 - IN

Converted 'data\edgar_documents\BRK-B\4_2024-09-27' --> 'data\processed_data\BRK-B\4_2024-09-27.md'
Error processing data\edgar_documents\BRK-B\4_2024-10-01: File format not allowed: data\edgar_documents\BRK-B\4_2024-10-01
Converted 'data\edgar_documents\BRK-B\4_2024-10-02' --> 'data\processed_data\BRK-B\4_2024-10-02.md'


2025-11-14 15:50:52,079 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:52,113 - INFO - Going to convert document batch...
2025-11-14 15:50:52,115 - INFO - Processing document 4_2024-10-07
2025-11-14 15:50:52,188 - INFO - Finished converting document 4_2024-10-07 in 0.14 sec.
2025-11-14 15:50:52,253 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:52,289 - INFO - Going to convert document batch...
2025-11-14 15:50:52,290 - INFO - Processing document 4_2024-10-10
2025-11-14 15:50:52,371 - INFO - Finished converting document 4_2024-10-10 in 0.14 sec.


Converted 'data\edgar_documents\BRK-B\4_2024-10-07' --> 'data\processed_data\BRK-B\4_2024-10-07.md'
Converted 'data\edgar_documents\BRK-B\4_2024-10-10' --> 'data\processed_data\BRK-B\4_2024-10-10.md'


2025-11-14 15:50:52,464 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:52,503 - INFO - Going to convert document batch...
2025-11-14 15:50:52,508 - INFO - Processing document 4_2024-10-11
2025-11-14 15:50:52,584 - INFO - Finished converting document 4_2024-10-11 in 0.14 sec.
2025-11-14 15:50:52,654 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:52,680 - INFO - Going to convert document batch...
2025-11-14 15:50:52,681 - INFO - Processing document 4_2024-10-17
2025-11-14 15:50:52,747 - INFO - Finished converting document 4_2024-10-17 in 0.11 sec.
2025-11-14 15:50:52,816 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:52,844 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BRK-B\4_2024-10-11' --> 'data\processed_data\BRK-B\4_2024-10-11.md'
Converted 'data\edgar_documents\BRK-B\4_2024-10-17' --> 'data\processed_data\BRK-B\4_2024-10-17.md'


2025-11-14 15:50:52,845 - INFO - Processing document 4_2024-10-18
2025-11-14 15:50:52,915 - INFO - Finished converting document 4_2024-10-18 in 0.11 sec.
2025-11-14 15:50:52,989 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:53,017 - INFO - Going to convert document batch...
2025-11-14 15:50:53,018 - INFO - Processing document 4_2024-10-31
2025-11-14 15:50:53,085 - INFO - Finished converting document 4_2024-10-31 in 0.11 sec.
2025-11-14 15:50:53,159 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2024-10-18' --> 'data\processed_data\BRK-B\4_2024-10-18.md'
Converted 'data\edgar_documents\BRK-B\4_2024-10-31' --> 'data\processed_data\BRK-B\4_2024-10-31.md'


2025-11-14 15:50:53,178 - INFO - Going to convert document batch...
2025-11-14 15:50:53,180 - INFO - Processing document 4_2024-11-07
2025-11-14 15:50:53,237 - INFO - Finished converting document 4_2024-11-07 in 0.09 sec.
2025-11-14 15:50:53,297 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:53,323 - INFO - Going to convert document batch...
2025-11-14 15:50:53,324 - INFO - Processing document 4_2024-11-22
2025-11-14 15:50:53,385 - INFO - Finished converting document 4_2024-11-22 in 0.11 sec.
2025-11-14 15:50:53,466 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2024-11-07' --> 'data\processed_data\BRK-B\4_2024-11-07.md'
Converted 'data\edgar_documents\BRK-B\4_2024-11-22' --> 'data\processed_data\BRK-B\4_2024-11-22.md'


2025-11-14 15:50:53,492 - INFO - Going to convert document batch...
2025-11-14 15:50:53,493 - INFO - Processing document 4_2024-11-25
2025-11-14 15:50:53,594 - INFO - Finished converting document 4_2024-11-25 in 0.16 sec.
2025-11-14 15:50:53,671 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:53,693 - INFO - Going to convert document batch...
2025-11-14 15:50:53,694 - INFO - Processing document 4_2024-12-04
2025-11-14 15:50:53,745 - INFO - Finished converting document 4_2024-12-04 in 0.09 sec.
2025-11-14 15:50:53,807 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:53,835 - INFO - Going to convert document batch...
2025-11-14 15:50:53,837 - INFO - Processing document 4_2024-12-11


Converted 'data\edgar_documents\BRK-B\4_2024-11-25' --> 'data\processed_data\BRK-B\4_2024-11-25.md'
Converted 'data\edgar_documents\BRK-B\4_2024-12-04' --> 'data\processed_data\BRK-B\4_2024-12-04.md'


2025-11-14 15:50:53,906 - INFO - Finished converting document 4_2024-12-11 in 0.11 sec.
2025-11-14 15:50:53,966 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:54,009 - INFO - Going to convert document batch...
2025-11-14 15:50:54,010 - INFO - Processing document 4_2024-12-19
2025-11-14 15:50:54,122 - INFO - Finished converting document 4_2024-12-19 in 0.17 sec.


Converted 'data\edgar_documents\BRK-B\4_2024-12-11' --> 'data\processed_data\BRK-B\4_2024-12-11.md'


2025-11-14 15:50:54,228 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:54,277 - INFO - Going to convert document batch...
2025-11-14 15:50:54,278 - INFO - Processing document 4_2024-12-26
2025-11-14 15:50:54,391 - INFO - Finished converting document 4_2024-12-26 in 0.17 sec.


Converted 'data\edgar_documents\BRK-B\4_2024-12-19' --> 'data\processed_data\BRK-B\4_2024-12-19.md'


2025-11-14 15:50:54,496 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:54,525 - INFO - Going to convert document batch...
2025-11-14 15:50:54,526 - INFO - Processing document 4_2024-12-27
2025-11-14 15:50:54,569 - INFO - Finished converting document 4_2024-12-27 in 0.08 sec.
2025-11-14 15:50:54,627 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:54,670 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BRK-B\4_2024-12-26' --> 'data\processed_data\BRK-B\4_2024-12-26.md'
Converted 'data\edgar_documents\BRK-B\4_2024-12-27' --> 'data\processed_data\BRK-B\4_2024-12-27.md'


2025-11-14 15:50:54,672 - INFO - Processing document 4_2024-12-30
2025-11-14 15:50:54,793 - INFO - Finished converting document 4_2024-12-30 in 0.19 sec.
2025-11-14 15:50:54,888 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:54,908 - INFO - Going to convert document batch...
2025-11-14 15:50:54,910 - INFO - Processing document 4_2025-01-03
2025-11-14 15:50:54,954 - INFO - Finished converting document 4_2025-01-03 in 0.08 sec.
2025-11-14 15:50:55,008 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:55,037 - INFO - Going to convert document batch...
2025-11-14 15:50:55,038 - INFO - Processing document 4_2025-01-17


Converted 'data\edgar_documents\BRK-B\4_2024-12-30' --> 'data\processed_data\BRK-B\4_2024-12-30.md'
Converted 'data\edgar_documents\BRK-B\4_2025-01-03' --> 'data\processed_data\BRK-B\4_2025-01-03.md'


2025-11-14 15:50:55,096 - INFO - Finished converting document 4_2025-01-17 in 0.09 sec.
2025-11-14 15:50:55,166 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:55,197 - INFO - Going to convert document batch...
2025-11-14 15:50:55,198 - INFO - Processing document 4_2025-02-03
2025-11-14 15:50:55,272 - INFO - Finished converting document 4_2025-02-03 in 0.11 sec.
2025-11-14 15:50:55,353 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2025-01-17' --> 'data\processed_data\BRK-B\4_2025-01-17.md'
Converted 'data\edgar_documents\BRK-B\4_2025-02-03' --> 'data\processed_data\BRK-B\4_2025-02-03.md'


2025-11-14 15:50:55,381 - INFO - Going to convert document batch...
2025-11-14 15:50:55,383 - INFO - Processing document 4_2025-02-11
2025-11-14 15:50:55,460 - INFO - Finished converting document 4_2025-02-11 in 0.11 sec.
2025-11-14 15:50:55,534 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:55,559 - INFO - Going to convert document batch...
2025-11-14 15:50:55,561 - INFO - Processing document 4_2025-02-13
2025-11-14 15:50:55,617 - INFO - Finished converting document 4_2025-02-13 in 0.09 sec.
2025-11-14 15:50:55,712 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2025-02-11' --> 'data\processed_data\BRK-B\4_2025-02-11.md'
Converted 'data\edgar_documents\BRK-B\4_2025-02-13' --> 'data\processed_data\BRK-B\4_2025-02-13.md'


2025-11-14 15:50:55,772 - INFO - Going to convert document batch...
2025-11-14 15:50:55,773 - INFO - Processing document 4_2025-02-19
2025-11-14 15:50:55,955 - INFO - Finished converting document 4_2025-02-19 in 0.27 sec.
2025-11-14 15:50:56,102 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:56,133 - INFO - Going to convert document batch...
2025-11-14 15:50:56,134 - INFO - Processing document 4_2025-02-25
2025-11-14 15:50:56,200 - INFO - Finished converting document 4_2025-02-25 in 0.14 sec.


Converted 'data\edgar_documents\BRK-B\4_2025-02-19' --> 'data\processed_data\BRK-B\4_2025-02-19.md'
Converted 'data\edgar_documents\BRK-B\4_2025-02-25' --> 'data\processed_data\BRK-B\4_2025-02-25.md'


2025-11-14 15:50:56,285 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:56,319 - INFO - Going to convert document batch...
2025-11-14 15:50:56,320 - INFO - Processing document 4_2025-03-04
2025-11-14 15:50:56,841 - INFO - Finished converting document 4_2025-03-04 in 0.59 sec.
2025-11-14 15:50:56,907 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:56,937 - INFO - Going to convert document batch...
2025-11-14 15:50:56,938 - INFO - Processing document 4_2025-03-14
2025-11-14 15:50:57,007 - INFO - Finished converting document 4_2025-03-14 in 0.11 sec.


Converted 'data\edgar_documents\BRK-B\4_2025-03-04' --> 'data\processed_data\BRK-B\4_2025-03-04.md'
Converted 'data\edgar_documents\BRK-B\4_2025-03-14' --> 'data\processed_data\BRK-B\4_2025-03-14.md'


2025-11-14 15:50:57,084 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:57,112 - INFO - Going to convert document batch...
2025-11-14 15:50:57,114 - INFO - Processing document 4_2025-03-21
2025-11-14 15:50:57,155 - INFO - Finished converting document 4_2025-03-21 in 0.09 sec.
2025-11-14 15:50:57,234 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:50:57,235 - ERROR - Input document 4_2025-04-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:50

Converted 'data\edgar_documents\BRK-B\4_2025-03-21' --> 'data\processed_data\BRK-B\4_2025-03-21.md'
Error processing data\edgar_documents\BRK-B\4_2025-04-01: File format not allowed: data\edgar_documents\BRK-B\4_2025-04-01


2025-11-14 15:50:57,416 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:57,438 - INFO - Going to convert document batch...
2025-11-14 15:50:57,439 - INFO - Processing document 4_2025-04-09
2025-11-14 15:50:57,487 - INFO - Finished converting document 4_2025-04-09 in 0.08 sec.
2025-11-14 15:50:57,569 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:50:57,571 - ERROR - Input document 4_2025-04-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:50

Converted 'data\edgar_documents\BRK-B\4_2025-04-04' --> 'data\processed_data\BRK-B\4_2025-04-04.md'
Converted 'data\edgar_documents\BRK-B\4_2025-04-09' --> 'data\processed_data\BRK-B\4_2025-04-09.md'
Error processing data\edgar_documents\BRK-B\4_2025-04-15: File format not allowed: data\edgar_documents\BRK-B\4_2025-04-15


2025-11-14 15:50:57,615 - INFO - Going to convert document batch...
2025-11-14 15:50:57,617 - INFO - Processing document 4_2025-05-12
2025-11-14 15:50:57,679 - INFO - Finished converting document 4_2025-05-12 in 0.09 sec.
2025-11-14 15:50:57,753 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:57,776 - INFO - Going to convert document batch...
2025-11-14 15:50:57,778 - INFO - Processing document 4_2025-05-15
2025-11-14 15:50:57,829 - INFO - Finished converting document 4_2025-05-15 in 0.09 sec.
2025-11-14 15:50:57,899 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\4_2025-05-12' --> 'data\processed_data\BRK-B\4_2025-05-12.md'
Converted 'data\edgar_documents\BRK-B\4_2025-05-15' --> 'data\processed_data\BRK-B\4_2025-05-15.md'


2025-11-14 15:50:57,938 - INFO - Going to convert document batch...
2025-11-14 15:50:57,939 - INFO - Processing document 4_2025-05-27
2025-11-14 15:50:58,024 - INFO - Finished converting document 4_2025-05-27 in 0.14 sec.
2025-11-14 15:50:58,101 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:58,124 - INFO - Going to convert document batch...
2025-11-14 15:50:58,126 - INFO - Processing document 4_2025-06-30
2025-11-14 15:50:58,186 - INFO - Finished converting document 4_2025-06-30 in 0.09 sec.
2025-11-14 15:50:58,266 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:58,283 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BRK-B\4_2025-05-27' --> 'data\processed_data\BRK-B\4_2025-05-27.md'
Converted 'data\edgar_documents\BRK-B\4_2025-06-30' --> 'data\processed_data\BRK-B\4_2025-06-30.md'


2025-11-14 15:50:58,284 - INFO - Processing document 4_2025-07-16
2025-11-14 15:50:58,341 - INFO - Finished converting document 4_2025-07-16 in 0.11 sec.
2025-11-14 15:50:58,420 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:58,442 - INFO - Going to convert document batch...
2025-11-14 15:50:58,443 - INFO - Processing document 4_2025-08-01
2025-11-14 15:50:58,495 - INFO - Finished converting document 4_2025-08-01 in 0.09 sec.
2025-11-14 15:50:58,570 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:58,592 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BRK-B\4_2025-07-16' --> 'data\processed_data\BRK-B\4_2025-07-16.md'
Converted 'data\edgar_documents\BRK-B\4_2025-08-01' --> 'data\processed_data\BRK-B\4_2025-08-01.md'


2025-11-14 15:50:58,593 - INFO - Processing document 4_2025-08-04
2025-11-14 15:50:58,654 - INFO - Finished converting document 4_2025-08-04 in 0.11 sec.
2025-11-14 15:50:58,721 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:58,746 - INFO - Going to convert document batch...
2025-11-14 15:50:58,748 - INFO - Processing document 4_2025-08-08
2025-11-14 15:50:58,806 - INFO - Finished converting document 4_2025-08-08 in 0.09 sec.
2025-11-14 15:50:58,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:58,901 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BRK-B\4_2025-08-04' --> 'data\processed_data\BRK-B\4_2025-08-04.md'
Converted 'data\edgar_documents\BRK-B\4_2025-08-08' --> 'data\processed_data\BRK-B\4_2025-08-08.md'


2025-11-14 15:50:58,902 - INFO - Processing document 4_2025-09-26
2025-11-14 15:50:58,979 - INFO - Finished converting document 4_2025-09-26 in 0.12 sec.
2025-11-14 15:50:59,057 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:59,081 - INFO - Going to convert document batch...
2025-11-14 15:50:59,082 - INFO - Processing document 4_2025-10-24
2025-11-14 15:50:59,148 - INFO - Finished converting document 4_2025-10-24 in 0.09 sec.


Converted 'data\edgar_documents\BRK-B\4_2025-09-26' --> 'data\processed_data\BRK-B\4_2025-09-26.md'
Converted 'data\edgar_documents\BRK-B\4_2025-10-24' --> 'data\processed_data\BRK-B\4_2025-10-24.md'


2025-11-14 15:50:59,242 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:59,269 - INFO - Going to convert document batch...
2025-11-14 15:50:59,271 - INFO - Processing document 4_2025-10-29
2025-11-14 15:50:59,331 - INFO - Finished converting document 4_2025-10-29 in 0.12 sec.
2025-11-14 15:50:59,405 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:59,436 - INFO - Going to convert document batch...
2025-11-14 15:50:59,438 - INFO - Processing document 4_2025-11-05
2025-11-14 15:50:59,505 - INFO - Finished converting document 4_2025-11-05 in 0.11 sec.
2025-11-14 15:50:59,596 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\BRK-B\4_2025-10-29' --> 'data\processed_data\BRK-B\4_2025-10-29.md'
Converted 'data\edgar_documents\BRK-B\4_2025-11-05' --> 'data\processed_data\BRK-B\4_2025-11-05.md'


2025-11-14 15:50:59,596 - ERROR - Input document 4_2025-11-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:50:59,599 - INFO - Going to convert document batch...
2025-11-14 15:50:59,615 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:59,665 - INFO - Going to convert document batch...
2025-11-14 15:50:59,666 - INFO - Processing document 8-K_2023-03-01
2025-11-14 15:50:59,723 - INFO - Finished converting document 8-K_2023-03-01 in 0.12 sec.
2025-11-14 15:50:59,800 - INFO - d

Error processing data\edgar_documents\BRK-B\4_2025-11-06: File format not allowed: data\edgar_documents\BRK-B\4_2025-11-06
Converted 'data\edgar_documents\BRK-B\8-K_2023-03-01' --> 'data\processed_data\BRK-B\8-K_2023-03-01.md'


2025-11-14 15:50:59,834 - INFO - Going to convert document batch...
2025-11-14 15:50:59,835 - INFO - Processing document 8-K_2023-04-20
2025-11-14 15:50:59,887 - INFO - Finished converting document 8-K_2023-04-20 in 0.14 sec.
2025-11-14 15:50:59,925 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:50:59,972 - INFO - Going to convert document batch...
2025-11-14 15:50:59,973 - INFO - Processing document 8-K_2023-05-02
2025-11-14 15:51:00,023 - INFO - Finished converting document 8-K_2023-05-02 in 0.11 sec.
2025-11-14 15:51:00,057 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\8-K_2023-04-20' --> 'data\processed_data\BRK-B\8-K_2023-04-20.md'
Converted 'data\edgar_documents\BRK-B\8-K_2023-05-02' --> 'data\processed_data\BRK-B\8-K_2023-05-02.md'


2025-11-14 15:51:00,127 - INFO - Going to convert document batch...
2025-11-14 15:51:00,128 - INFO - Processing document 8-K_2023-05-10
2025-11-14 15:51:00,228 - INFO - Finished converting document 8-K_2023-05-10 in 0.17 sec.
2025-11-14 15:51:00,282 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:51:00,315 - INFO - Going to convert document batch...
2025-11-14 15:51:00,316 - INFO - Processing document 8-K_2023-08-07
2025-11-14 15:51:00,369 - INFO - Finished converting document 8-K_2023-08-07 in 0.09 sec.
2025-11-14 15:51:00,435 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:51:00,470 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\BRK-B\8-K_2023-05-10' --> 'data\processed_data\BRK-B\8-K_2023-05-10.md'
Converted 'data\edgar_documents\BRK-B\8-K_2023-08-07' --> 'data\processed_data\BRK-B\8-K_2023-08-07.md'


2025-11-14 15:51:00,471 - INFO - Processing document 8-K_2023-11-07
2025-11-14 15:51:00,517 - INFO - Finished converting document 8-K_2023-11-07 in 0.12 sec.
2025-11-14 15:51:00,551 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:51:00,592 - INFO - Going to convert document batch...
2025-11-14 15:51:00,593 - INFO - Processing document 8-K_2023-11-29
2025-11-14 15:51:00,666 - INFO - Finished converting document 8-K_2023-11-29 in 0.14 sec.


Converted 'data\edgar_documents\BRK-B\8-K_2023-11-07' --> 'data\processed_data\BRK-B\8-K_2023-11-07.md'
Converted 'data\edgar_documents\BRK-B\8-K_2023-11-29' --> 'data\processed_data\BRK-B\8-K_2023-11-29.md'


2025-11-14 15:51:00,755 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:51:00,792 - INFO - Going to convert document batch...
2025-11-14 15:51:00,793 - INFO - Processing document 8-K_2023-12-01
2025-11-14 15:51:00,837 - INFO - Finished converting document 8-K_2023-12-01 in 0.12 sec.
2025-11-14 15:51:00,875 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:51:00,899 - INFO - Going to convert document batch...
2025-11-14 15:51:00,900 - INFO - Processing document 8-K_2024-01-10
2025-11-14 15:51:00,928 - INFO - Finished converting document 8-K_2024-01-10 in 0.06 sec.
2025-11-14 15:51:00,964 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:51:00,983 - INFO - Going to convert document batch...
2025-11-14 15:51:00,984 - INFO - Processing document 8-K_2024-02-26
2025-11-14 15:51:01,015 - INFO - Finished converting document 8-K_2024-02-26 in 0.08 sec.
2025-11-14 15:51:01,043 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\8-K_2023-12-01' --> 'data\processed_data\BRK-B\8-K_2023-12-01.md'
Converted 'data\edgar_documents\BRK-B\8-K_2024-01-10' --> 'data\processed_data\BRK-B\8-K_2024-01-10.md'
Converted 'data\edgar_documents\BRK-B\8-K_2024-02-26' --> 'data\processed_data\BRK-B\8-K_2024-02-26.md'


2025-11-14 15:51:01,066 - INFO - Going to convert document batch...
2025-11-14 15:51:01,068 - INFO - Processing document 8-K_2024-04-26
2025-11-14 15:51:01,110 - INFO - Finished converting document 8-K_2024-04-26 in 0.08 sec.
2025-11-14 15:51:01,143 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:51:01,174 - INFO - Going to convert document batch...
2025-11-14 15:51:01,175 - INFO - Processing document 8-K_2024-05-07
2025-11-14 15:51:01,218 - INFO - Finished converting document 8-K_2024-05-07 in 0.09 sec.
2025-11-14 15:51:01,250 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:51:01,266 - INFO - Going to convert document batch...
2025-11-14 15:51:01,266 - INFO - Processing document 8-K_2024-08-05
2025-11-14 15:51:01,289 - INFO - Finished converting document 8-K_2024-08-05 in 0.05 sec.
2025-11-14 15:51:01,315 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\8-K_2024-04-26' --> 'data\processed_data\BRK-B\8-K_2024-04-26.md'
Converted 'data\edgar_documents\BRK-B\8-K_2024-05-07' --> 'data\processed_data\BRK-B\8-K_2024-05-07.md'
Converted 'data\edgar_documents\BRK-B\8-K_2024-08-05' --> 'data\processed_data\BRK-B\8-K_2024-08-05.md'


2025-11-14 15:51:01,334 - INFO - Going to convert document batch...
2025-11-14 15:51:01,334 - INFO - Processing document 8-K_2024-10-23
2025-11-14 15:51:01,366 - INFO - Finished converting document 8-K_2024-10-23 in 0.06 sec.
2025-11-14 15:51:01,396 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:51:01,412 - INFO - Going to convert document batch...
2025-11-14 15:51:01,413 - INFO - Processing document 8-K_2024-11-04
2025-11-14 15:51:01,436 - INFO - Finished converting document 8-K_2024-11-04 in 0.06 sec.
2025-11-14 15:51:01,462 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:51:01,479 - INFO - Going to convert document batch...
2025-11-14 15:51:01,479 - INFO - Processing document 8-K_2025-02-24
2025-11-14 15:51:01,504 - INFO - Finished converting document 8-K_2025-02-24 in 0.05 sec.
2025-11-14 15:51:01,530 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:51:01,549 - INFO - Going to convert document batch...
2025-11-14 15:

Converted 'data\edgar_documents\BRK-B\8-K_2024-10-23' --> 'data\processed_data\BRK-B\8-K_2024-10-23.md'
Converted 'data\edgar_documents\BRK-B\8-K_2024-11-04' --> 'data\processed_data\BRK-B\8-K_2024-11-04.md'
Converted 'data\edgar_documents\BRK-B\8-K_2025-02-24' --> 'data\processed_data\BRK-B\8-K_2025-02-24.md'


2025-11-14 15:51:01,578 - INFO - Finished converting document 8-K_2025-04-17 in 0.06 sec.
2025-11-14 15:51:01,609 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:51:01,650 - INFO - Going to convert document batch...
2025-11-14 15:51:01,652 - INFO - Processing document 8-K_2025-05-06
2025-11-14 15:51:01,698 - INFO - Finished converting document 8-K_2025-05-06 in 0.11 sec.
2025-11-14 15:51:01,729 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\BRK-B\8-K_2025-04-17' --> 'data\processed_data\BRK-B\8-K_2025-04-17.md'
Converted 'data\edgar_documents\BRK-B\8-K_2025-05-06' --> 'data\processed_data\BRK-B\8-K_2025-05-06.md'


2025-11-14 15:51:01,982 - INFO - Going to convert document batch...
2025-11-14 15:51:01,983 - INFO - Processing document 8-K_2025-05-08
2025-11-14 15:51:02,008 - INFO - Finished converting document 8-K_2025-05-08 in 0.28 sec.
2025-11-14 15:51:02,037 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:51:02,060 - INFO - Going to convert document batch...
2025-11-14 15:51:02,061 - INFO - Processing document 8-K_2025-08-04
2025-11-14 15:51:02,091 - INFO - Finished converting document 8-K_2025-08-04 in 0.08 sec.
2025-11-14 15:51:02,145 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:51:02,188 - INFO - Going to convert document batch...
2025-11-14 15:51:02,189 - INFO - Processing document 8-K_2025-10-03
2025-11-14 15:51:02,256 - INFO - Finished converting document 8-K_2025-10-03 in 0.12 sec.


Converted 'data\edgar_documents\BRK-B\8-K_2025-05-08' --> 'data\processed_data\BRK-B\8-K_2025-05-08.md'
Converted 'data\edgar_documents\BRK-B\8-K_2025-08-04' --> 'data\processed_data\BRK-B\8-K_2025-08-04.md'


2025-11-14 15:51:02,302 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:51:02,343 - INFO - Going to convert document batch...
2025-11-14 15:51:02,344 - INFO - Processing document 8-K_2025-11-03
2025-11-14 15:51:02,400 - INFO - Finished converting document 8-K_2025-11-03 in 0.11 sec.
2025-11-14 15:51:02,455 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:51:02,457 - ERROR - Input document DEF-14A_2023-03-17 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>

Converted 'data\edgar_documents\BRK-B\8-K_2025-10-03' --> 'data\processed_data\BRK-B\8-K_2025-10-03.md'
Converted 'data\edgar_documents\BRK-B\8-K_2025-11-03' --> 'data\processed_data\BRK-B\8-K_2025-11-03.md'
Error processing data\edgar_documents\BRK-B\DEF-14A_2023-03-17: File format not allowed: data\edgar_documents\BRK-B\DEF-14A_2023-03-17


2025-11-14 15:51:02,485 - ERROR - Input document DEF-14A_2024-03-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:51:02,488 - INFO - Going to convert document batch...
2025-11-14 15:51:02,512 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:51:02,513 - ERROR - Input document DEF-14A_2025-03-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: '

Error processing data\edgar_documents\BRK-B\DEF-14A_2024-03-15: File format not allowed: data\edgar_documents\BRK-B\DEF-14A_2024-03-15
Error processing data\edgar_documents\BRK-B\DEF-14A_2025-03-14: File format not allowed: data\edgar_documents\BRK-B\DEF-14A_2025-03-14
Processed 144 new files. Errors: 13
Found 165 files to process in data\edgar_documents\CAT


2025-11-14 15:51:06,792 - INFO - Going to convert document batch...
2025-11-14 15:51:06,795 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:51:06,796 - INFO - Processing document 10-K_2023-02-15
2025-11-14 15:51:17,096 - INFO - Finished converting document 10-K_2023-02-15 in 14.56 sec.
2025-11-14 15:51:19,715 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\10-K_2023-02-15' --> 'data\processed_data\CAT\10-K_2023-02-15.md'


2025-11-14 15:51:23,561 - INFO - Going to convert document batch...
2025-11-14 15:51:23,563 - INFO - Processing document 10-K_2024-02-16
2025-11-14 15:51:33,378 - INFO - Finished converting document 10-K_2024-02-16 in 13.75 sec.
2025-11-14 15:51:38,027 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\10-K_2024-02-16' --> 'data\processed_data\CAT\10-K_2024-02-16.md'


2025-11-14 15:51:42,369 - INFO - Going to convert document batch...
2025-11-14 15:51:42,370 - INFO - Processing document 10-K_2025-02-14
2025-11-14 15:51:52,404 - INFO - Finished converting document 10-K_2025-02-14 in 14.48 sec.
2025-11-14 15:51:55,305 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\10-K_2025-02-14' --> 'data\processed_data\CAT\10-K_2025-02-14.md'


2025-11-14 15:51:58,464 - INFO - Going to convert document batch...
2025-11-14 15:51:58,465 - INFO - Processing document 10-Q_2023-05-03
2025-11-14 15:52:02,550 - INFO - Finished converting document 10-Q_2023-05-03 in 7.31 sec.
2025-11-14 15:52:04,468 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\10-Q_2023-05-03' --> 'data\processed_data\CAT\10-Q_2023-05-03.md'


2025-11-14 15:52:08,211 - INFO - Going to convert document batch...
2025-11-14 15:52:08,212 - INFO - Processing document 10-Q_2023-08-02
2025-11-14 15:52:13,357 - INFO - Finished converting document 10-Q_2023-08-02 in 8.98 sec.
2025-11-14 15:52:15,803 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\10-Q_2023-08-02' --> 'data\processed_data\CAT\10-Q_2023-08-02.md'


2025-11-14 15:52:18,343 - INFO - Going to convert document batch...
2025-11-14 15:52:18,344 - INFO - Processing document 10-Q_2023-11-01
2025-11-14 15:52:22,117 - INFO - Finished converting document 10-Q_2023-11-01 in 6.39 sec.
2025-11-14 15:52:25,545 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\10-Q_2023-11-01' --> 'data\processed_data\CAT\10-Q_2023-11-01.md'


2025-11-14 15:52:28,084 - INFO - Going to convert document batch...
2025-11-14 15:52:28,086 - INFO - Processing document 10-Q_2024-05-01
2025-11-14 15:52:33,577 - INFO - Finished converting document 10-Q_2024-05-01 in 8.09 sec.
2025-11-14 15:52:35,547 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\10-Q_2024-05-01' --> 'data\processed_data\CAT\10-Q_2024-05-01.md'


2025-11-14 15:52:38,258 - INFO - Going to convert document batch...
2025-11-14 15:52:38,259 - INFO - Processing document 10-Q_2024-08-07
2025-11-14 15:52:44,815 - INFO - Finished converting document 10-Q_2024-08-07 in 9.36 sec.
2025-11-14 15:52:47,304 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\10-Q_2024-08-07' --> 'data\processed_data\CAT\10-Q_2024-08-07.md'


2025-11-14 15:52:50,982 - INFO - Going to convert document batch...
2025-11-14 15:52:50,983 - INFO - Processing document 10-Q_2024-11-06
2025-11-14 15:52:56,817 - INFO - Finished converting document 10-Q_2024-11-06 in 9.59 sec.
2025-11-14 15:52:59,525 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\10-Q_2024-11-06' --> 'data\processed_data\CAT\10-Q_2024-11-06.md'


2025-11-14 15:53:02,745 - INFO - Going to convert document batch...
2025-11-14 15:53:02,747 - INFO - Processing document 10-Q_2025-05-07
2025-11-14 15:53:06,971 - INFO - Finished converting document 10-Q_2025-05-07 in 7.50 sec.
2025-11-14 15:53:09,144 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\10-Q_2025-05-07' --> 'data\processed_data\CAT\10-Q_2025-05-07.md'


2025-11-14 15:53:13,206 - INFO - Going to convert document batch...
2025-11-14 15:53:13,208 - INFO - Processing document 10-Q_2025-08-06
2025-11-14 15:53:19,134 - INFO - Finished converting document 10-Q_2025-08-06 in 10.06 sec.
2025-11-14 15:53:21,738 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\10-Q_2025-08-06' --> 'data\processed_data\CAT\10-Q_2025-08-06.md'


2025-11-14 15:53:25,469 - INFO - Going to convert document batch...
2025-11-14 15:53:25,470 - INFO - Processing document 10-Q_2025-11-03
2025-11-14 15:53:31,809 - INFO - Finished converting document 10-Q_2025-11-03 in 10.16 sec.
2025-11-14 15:53:34,378 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:34,403 - INFO - Going to convert document batch...
2025-11-14 15:53:34,404 - INFO - Processing document 4_2023-01-03
2025-11-14 15:53:34,448 - INFO - Finished converting document 4_2023-01-03 in 0.09 sec.
2025-11-14 15:53:34,538 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\10-Q_2025-11-03' --> 'data\processed_data\CAT\10-Q_2025-11-03.md'
Converted 'data\edgar_documents\CAT\4_2023-01-03' --> 'data\processed_data\CAT\4_2023-01-03.md'


2025-11-14 15:53:34,561 - INFO - Going to convert document batch...
2025-11-14 15:53:34,563 - INFO - Processing document 4_2023-01-09
2025-11-14 15:53:34,614 - INFO - Finished converting document 4_2023-01-09 in 0.09 sec.
2025-11-14 15:53:34,671 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:34,697 - INFO - Going to convert document batch...
2025-11-14 15:53:34,700 - INFO - Processing document 4_2023-01-10
2025-11-14 15:53:34,779 - INFO - Finished converting document 4_2023-01-10 in 0.12 sec.


Converted 'data\edgar_documents\CAT\4_2023-01-09' --> 'data\processed_data\CAT\4_2023-01-09.md'
Converted 'data\edgar_documents\CAT\4_2023-01-10' --> 'data\processed_data\CAT\4_2023-01-10.md'


2025-11-14 15:53:34,856 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:34,909 - INFO - Going to convert document batch...
2025-11-14 15:53:34,910 - INFO - Processing document 4_2023-02-06
2025-11-14 15:53:35,013 - INFO - Finished converting document 4_2023-02-06 in 0.17 sec.
2025-11-14 15:53:35,090 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:35,110 - INFO - Going to convert document batch...
2025-11-14 15:53:35,112 - INFO - Processing document 4_2023-02-07
2025-11-14 15:53:35,158 - INFO - Finished converting document 4_2023-02-07 in 0.08 sec.
2025-11-14 15:53:35,233 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:35,253 - INFO - Going to convert document batch...
2025-11-14 15:53:35,255 - INFO - Processing document 4_2023-02-08


Converted 'data\edgar_documents\CAT\4_2023-02-06' --> 'data\processed_data\CAT\4_2023-02-06.md'
Converted 'data\edgar_documents\CAT\4_2023-02-07' --> 'data\processed_data\CAT\4_2023-02-07.md'


2025-11-14 15:53:35,293 - INFO - Finished converting document 4_2023-02-08 in 0.09 sec.
2025-11-14 15:53:35,353 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:35,373 - INFO - Going to convert document batch...
2025-11-14 15:53:35,374 - INFO - Processing document 4_2023-02-10
2025-11-14 15:53:35,415 - INFO - Finished converting document 4_2023-02-10 in 0.06 sec.
2025-11-14 15:53:35,484 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:35,502 - INFO - Going to convert document batch...
2025-11-14 15:53:35,504 - INFO - Processing document 4_2023-02-21


Converted 'data\edgar_documents\CAT\4_2023-02-08' --> 'data\processed_data\CAT\4_2023-02-08.md'
Converted 'data\edgar_documents\CAT\4_2023-02-10' --> 'data\processed_data\CAT\4_2023-02-10.md'


2025-11-14 15:53:35,564 - INFO - Finished converting document 4_2023-02-21 in 0.11 sec.
2025-11-14 15:53:35,629 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:35,648 - INFO - Going to convert document batch...
2025-11-14 15:53:35,649 - INFO - Processing document 4_2023-03-06
2025-11-14 15:53:35,696 - INFO - Finished converting document 4_2023-03-06 in 0.08 sec.
2025-11-14 15:53:35,758 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:35,774 - INFO - Going to convert document batch...
2025-11-14 15:53:35,775 - INFO - Processing document 4_2023-03-08


Converted 'data\edgar_documents\CAT\4_2023-02-21' --> 'data\processed_data\CAT\4_2023-02-21.md'
Converted 'data\edgar_documents\CAT\4_2023-03-06' --> 'data\processed_data\CAT\4_2023-03-06.md'


2025-11-14 15:53:35,815 - INFO - Finished converting document 4_2023-03-08 in 0.08 sec.
2025-11-14 15:53:35,882 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:35,899 - INFO - Going to convert document batch...
2025-11-14 15:53:35,900 - INFO - Processing document 4_2023-03-14
2025-11-14 15:53:35,945 - INFO - Finished converting document 4_2023-03-14 in 0.08 sec.
2025-11-14 15:53:36,026 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\4_2023-03-08' --> 'data\processed_data\CAT\4_2023-03-08.md'
Converted 'data\edgar_documents\CAT\4_2023-03-14' --> 'data\processed_data\CAT\4_2023-03-14.md'


2025-11-14 15:53:36,058 - INFO - Going to convert document batch...
2025-11-14 15:53:36,066 - INFO - Processing document 4_2023-03-16
2025-11-14 15:53:36,115 - INFO - Finished converting document 4_2023-03-16 in 0.11 sec.
2025-11-14 15:53:36,191 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:36,211 - INFO - Going to convert document batch...
2025-11-14 15:53:36,212 - INFO - Processing document 4_2023-04-04
2025-11-14 15:53:36,260 - INFO - Finished converting document 4_2023-04-04 in 0.11 sec.
2025-11-14 15:53:36,334 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\4_2023-03-16' --> 'data\processed_data\CAT\4_2023-03-16.md'
Converted 'data\edgar_documents\CAT\4_2023-04-04' --> 'data\processed_data\CAT\4_2023-04-04.md'


2025-11-14 15:53:36,355 - INFO - Going to convert document batch...
2025-11-14 15:53:36,357 - INFO - Processing document 4_2023-05-31
2025-11-14 15:53:36,414 - INFO - Finished converting document 4_2023-05-31 in 0.08 sec.
2025-11-14 15:53:36,495 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:36,519 - INFO - Going to convert document batch...
2025-11-14 15:53:36,520 - INFO - Processing document 4_2023-06-09
2025-11-14 15:53:36,570 - INFO - Finished converting document 4_2023-06-09 in 0.08 sec.
2025-11-14 15:53:36,645 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:36,664 - INFO - Going to convert document batch...
2025-11-14 15:53:36,666 - INFO - Processing document 4_2023-06-15


Converted 'data\edgar_documents\CAT\4_2023-05-31' --> 'data\processed_data\CAT\4_2023-05-31.md'
Converted 'data\edgar_documents\CAT\4_2023-06-09' --> 'data\processed_data\CAT\4_2023-06-09.md'


2025-11-14 15:53:36,709 - INFO - Finished converting document 4_2023-06-15 in 0.08 sec.
2025-11-14 15:53:36,785 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:36,803 - INFO - Going to convert document batch...
2025-11-14 15:53:36,804 - INFO - Processing document 4_2023-06-27
2025-11-14 15:53:36,850 - INFO - Finished converting document 4_2023-06-27 in 0.08 sec.
2025-11-14 15:53:36,941 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\4_2023-06-15' --> 'data\processed_data\CAT\4_2023-06-15.md'
Converted 'data\edgar_documents\CAT\4_2023-06-27' --> 'data\processed_data\CAT\4_2023-06-27.md'


2025-11-14 15:53:36,963 - INFO - Going to convert document batch...
2025-11-14 15:53:36,965 - INFO - Processing document 4_2023-07-03
2025-11-14 15:53:37,022 - INFO - Finished converting document 4_2023-07-03 in 0.11 sec.
2025-11-14 15:53:37,127 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:37,159 - INFO - Going to convert document batch...
2025-11-14 15:53:37,160 - INFO - Processing document 4_2023-07-19
2025-11-14 15:53:37,215 - INFO - Finished converting document 4_2023-07-19 in 0.11 sec.
2025-11-14 15:53:37,300 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\4_2023-07-03' --> 'data\processed_data\CAT\4_2023-07-03.md'
Converted 'data\edgar_documents\CAT\4_2023-07-19' --> 'data\processed_data\CAT\4_2023-07-19.md'


2025-11-14 15:53:37,322 - INFO - Going to convert document batch...
2025-11-14 15:53:37,325 - INFO - Processing document 4_2023-07-28
2025-11-14 15:53:37,371 - INFO - Finished converting document 4_2023-07-28 in 0.11 sec.
2025-11-14 15:53:37,430 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:37,452 - INFO - Going to convert document batch...
2025-11-14 15:53:37,454 - INFO - Processing document 4_2023-08-02
2025-11-14 15:53:37,506 - INFO - Finished converting document 4_2023-08-02 in 0.09 sec.
2025-11-14 15:53:37,584 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:37,616 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2023-07-28' --> 'data\processed_data\CAT\4_2023-07-28.md'
Converted 'data\edgar_documents\CAT\4_2023-08-02' --> 'data\processed_data\CAT\4_2023-08-02.md'


2025-11-14 15:53:37,618 - INFO - Processing document 4_2023-08-03
2025-11-14 15:53:37,686 - INFO - Finished converting document 4_2023-08-03 in 0.14 sec.
2025-11-14 15:53:37,753 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:37,787 - INFO - Going to convert document batch...
2025-11-14 15:53:37,788 - INFO - Processing document 4_2023-08-04
2025-11-14 15:53:37,856 - INFO - Finished converting document 4_2023-08-04 in 0.12 sec.


Converted 'data\edgar_documents\CAT\4_2023-08-03' --> 'data\processed_data\CAT\4_2023-08-03.md'
Converted 'data\edgar_documents\CAT\4_2023-08-04' --> 'data\processed_data\CAT\4_2023-08-04.md'


2025-11-14 15:53:37,949 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:37,978 - INFO - Going to convert document batch...
2025-11-14 15:53:37,979 - INFO - Processing document 4_2023-08-07
2025-11-14 15:53:38,035 - INFO - Finished converting document 4_2023-08-07 in 0.11 sec.
2025-11-14 15:53:38,097 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:38,119 - INFO - Going to convert document batch...
2025-11-14 15:53:38,120 - INFO - Processing document 4_2023-08-08
2025-11-14 15:53:38,158 - INFO - Finished converting document 4_2023-08-08 in 0.08 sec.
2025-11-14 15:53:38,205 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:38,228 - INFO - Going to convert document batch...
2025-11-14 15:53:38,229 - INFO - Processing document 4_2023-08-10
2025-11-14 15:53:38,285 - INFO - Finished converting document 4_2023-08-10 in 0.09 sec.


Converted 'data\edgar_documents\CAT\4_2023-08-07' --> 'data\processed_data\CAT\4_2023-08-07.md'
Converted 'data\edgar_documents\CAT\4_2023-08-08' --> 'data\processed_data\CAT\4_2023-08-08.md'


2025-11-14 15:53:38,352 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:38,371 - INFO - Going to convert document batch...
2025-11-14 15:53:38,372 - INFO - Processing document 4_2023-08-28
2025-11-14 15:53:38,419 - INFO - Finished converting document 4_2023-08-28 in 0.08 sec.
2025-11-14 15:53:38,498 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:38,537 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2023-08-10' --> 'data\processed_data\CAT\4_2023-08-10.md'
Converted 'data\edgar_documents\CAT\4_2023-08-28' --> 'data\processed_data\CAT\4_2023-08-28.md'


2025-11-14 15:53:38,539 - INFO - Processing document 4_2023-08-31
2025-11-14 15:53:38,612 - INFO - Finished converting document 4_2023-08-31 in 0.14 sec.
2025-11-14 15:53:38,688 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:38,705 - INFO - Going to convert document batch...
2025-11-14 15:53:38,707 - INFO - Processing document 4_2023-09-05
2025-11-14 15:53:38,752 - INFO - Finished converting document 4_2023-09-05 in 0.08 sec.
2025-11-14 15:53:38,840 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:38,863 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2023-08-31' --> 'data\processed_data\CAT\4_2023-08-31.md'
Converted 'data\edgar_documents\CAT\4_2023-09-05' --> 'data\processed_data\CAT\4_2023-09-05.md'


2025-11-14 15:53:38,864 - INFO - Processing document 4_2023-09-27
2025-11-14 15:53:38,916 - INFO - Finished converting document 4_2023-09-27 in 0.11 sec.
2025-11-14 15:53:38,995 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:39,019 - INFO - Going to convert document batch...
2025-11-14 15:53:39,022 - INFO - Processing document 4_2023-10-02
2025-11-14 15:53:39,084 - INFO - Finished converting document 4_2023-10-02 in 0.11 sec.


Converted 'data\edgar_documents\CAT\4_2023-09-27' --> 'data\processed_data\CAT\4_2023-09-27.md'
Converted 'data\edgar_documents\CAT\4_2023-10-02' --> 'data\processed_data\CAT\4_2023-10-02.md'


2025-11-14 15:53:39,174 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:39,203 - INFO - Going to convert document batch...
2025-11-14 15:53:39,205 - INFO - Processing document 4_2023-10-27
2025-11-14 15:53:39,253 - INFO - Finished converting document 4_2023-10-27 in 0.11 sec.
2025-11-14 15:53:39,368 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:39,385 - INFO - Going to convert document batch...
2025-11-14 15:53:39,388 - INFO - Processing document 4_2023-11-27
2025-11-14 15:53:39,434 - INFO - Finished converting document 4_2023-11-27 in 0.11 sec.
2025-11-14 15:53:39,493 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:39,526 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2023-10-27' --> 'data\processed_data\CAT\4_2023-10-27.md'
Converted 'data\edgar_documents\CAT\4_2023-11-27' --> 'data\processed_data\CAT\4_2023-11-27.md'


2025-11-14 15:53:39,527 - INFO - Processing document 4_2023-12-19
2025-11-14 15:53:39,592 - INFO - Finished converting document 4_2023-12-19 in 0.11 sec.
2025-11-14 15:53:39,654 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:39,674 - INFO - Going to convert document batch...
2025-11-14 15:53:39,676 - INFO - Processing document 4_2023-12-27
2025-11-14 15:53:39,717 - INFO - Finished converting document 4_2023-12-27 in 0.08 sec.
2025-11-14 15:53:39,801 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:39,820 - INFO - Going to convert document batch...
2025-11-14 15:53:39,822 - INFO - Processing document 4_2024-01-02


Converted 'data\edgar_documents\CAT\4_2023-12-19' --> 'data\processed_data\CAT\4_2023-12-19.md'
Converted 'data\edgar_documents\CAT\4_2023-12-27' --> 'data\processed_data\CAT\4_2023-12-27.md'


2025-11-14 15:53:39,888 - INFO - Finished converting document 4_2024-01-02 in 0.12 sec.
2025-11-14 15:53:39,972 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:39,990 - INFO - Going to convert document batch...
2025-11-14 15:53:39,992 - INFO - Processing document 4_2024-01-16
2025-11-14 15:53:40,031 - INFO - Finished converting document 4_2024-01-16 in 0.08 sec.
2025-11-14 15:53:40,099 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:40,121 - INFO - Going to convert document batch...
2025-11-14 15:53:40,123 - INFO - Processing document 4_2024-01-26
2025-11-14 15:53:40,162 - INFO - Finished converting document 4_2024-01-26 in 0.09 sec.


Converted 'data\edgar_documents\CAT\4_2024-01-02' --> 'data\processed_data\CAT\4_2024-01-02.md'
Converted 'data\edgar_documents\CAT\4_2024-01-16' --> 'data\processed_data\CAT\4_2024-01-16.md'


2025-11-14 15:53:40,217 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:40,241 - INFO - Going to convert document batch...
2025-11-14 15:53:40,242 - INFO - Processing document 4_2024-02-06
2025-11-14 15:53:40,298 - INFO - Finished converting document 4_2024-02-06 in 0.09 sec.
2025-11-14 15:53:40,367 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:40,403 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2024-01-26' --> 'data\processed_data\CAT\4_2024-01-26.md'
Converted 'data\edgar_documents\CAT\4_2024-02-06' --> 'data\processed_data\CAT\4_2024-02-06.md'


2025-11-14 15:53:40,404 - INFO - Processing document 4_2024-02-08
2025-11-14 15:53:40,462 - INFO - Finished converting document 4_2024-02-08 in 0.11 sec.
2025-11-14 15:53:40,530 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:40,549 - INFO - Going to convert document batch...
2025-11-14 15:53:40,551 - INFO - Processing document 4_2024-02-15
2025-11-14 15:53:40,600 - INFO - Finished converting document 4_2024-02-15 in 0.08 sec.
2025-11-14 15:53:40,665 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:40,694 - INFO - Going to convert document batch...
2025-11-14 15:53:40,696 - INFO - Processing document 4_2024-02-16


Converted 'data\edgar_documents\CAT\4_2024-02-08' --> 'data\processed_data\CAT\4_2024-02-08.md'
Converted 'data\edgar_documents\CAT\4_2024-02-15' --> 'data\processed_data\CAT\4_2024-02-15.md'


2025-11-14 15:53:40,757 - INFO - Finished converting document 4_2024-02-16 in 0.11 sec.
2025-11-14 15:53:40,829 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:40,852 - INFO - Going to convert document batch...
2025-11-14 15:53:40,853 - INFO - Processing document 4_2024-02-23
2025-11-14 15:53:40,901 - INFO - Finished converting document 4_2024-02-23 in 0.09 sec.
2025-11-14 15:53:40,992 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:41,012 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2024-02-16' --> 'data\processed_data\CAT\4_2024-02-16.md'
Converted 'data\edgar_documents\CAT\4_2024-02-23' --> 'data\processed_data\CAT\4_2024-02-23.md'


2025-11-14 15:53:41,013 - INFO - Processing document 4_2024-02-26
2025-11-14 15:53:41,072 - INFO - Finished converting document 4_2024-02-26 in 0.08 sec.
2025-11-14 15:53:41,152 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:41,181 - INFO - Going to convert document batch...
2025-11-14 15:53:41,182 - INFO - Processing document 4_2024-02-27
2025-11-14 15:53:41,235 - INFO - Finished converting document 4_2024-02-27 in 0.09 sec.
2025-11-14 15:53:41,313 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:41,333 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2024-02-26' --> 'data\processed_data\CAT\4_2024-02-26.md'
Converted 'data\edgar_documents\CAT\4_2024-02-27' --> 'data\processed_data\CAT\4_2024-02-27.md'


2025-11-14 15:53:41,335 - INFO - Processing document 4_2024-02-29
2025-11-14 15:53:41,394 - INFO - Finished converting document 4_2024-02-29 in 0.11 sec.
2025-11-14 15:53:41,476 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:41,500 - INFO - Going to convert document batch...
2025-11-14 15:53:41,501 - INFO - Processing document 4_2024-03-05
2025-11-14 15:53:41,552 - INFO - Finished converting document 4_2024-03-05 in 0.11 sec.


Converted 'data\edgar_documents\CAT\4_2024-02-29' --> 'data\processed_data\CAT\4_2024-02-29.md'
Converted 'data\edgar_documents\CAT\4_2024-03-05' --> 'data\processed_data\CAT\4_2024-03-05.md'


2025-11-14 15:53:41,625 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:41,645 - INFO - Going to convert document batch...
2025-11-14 15:53:41,646 - INFO - Processing document 4_2024-03-06
2025-11-14 15:53:41,717 - INFO - Finished converting document 4_2024-03-06 in 0.12 sec.
2025-11-14 15:53:41,785 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:41,821 - INFO - Going to convert document batch...
2025-11-14 15:53:41,823 - INFO - Processing document 4_2024-03-08
2025-11-14 15:53:41,894 - INFO - Finished converting document 4_2024-03-08 in 0.12 sec.


Converted 'data\edgar_documents\CAT\4_2024-03-06' --> 'data\processed_data\CAT\4_2024-03-06.md'
Converted 'data\edgar_documents\CAT\4_2024-03-08' --> 'data\processed_data\CAT\4_2024-03-08.md'


2025-11-14 15:53:41,978 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:42,006 - INFO - Going to convert document batch...
2025-11-14 15:53:42,008 - INFO - Processing document 4_2024-03-12
2025-11-14 15:53:42,082 - INFO - Finished converting document 4_2024-03-12 in 0.12 sec.
2025-11-14 15:53:42,141 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:42,160 - INFO - Going to convert document batch...
2025-11-14 15:53:42,161 - INFO - Processing document 4_2024-03-18
2025-11-14 15:53:42,214 - INFO - Finished converting document 4_2024-03-18 in 0.09 sec.
2025-11-14 15:53:42,286 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:42,305 - INFO - Going to convert document batch...
2025-11-14 15:53:42,306 - INFO - Processing document 4_2024-04-01


Converted 'data\edgar_documents\CAT\4_2024-03-12' --> 'data\processed_data\CAT\4_2024-03-12.md'
Converted 'data\edgar_documents\CAT\4_2024-03-18' --> 'data\processed_data\CAT\4_2024-03-18.md'


2025-11-14 15:53:42,361 - INFO - Finished converting document 4_2024-04-01 in 0.09 sec.
2025-11-14 15:53:42,446 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:42,479 - INFO - Going to convert document batch...
2025-11-14 15:53:42,481 - INFO - Processing document 4_2024-04-02
2025-11-14 15:53:42,532 - INFO - Finished converting document 4_2024-04-02 in 0.11 sec.
2025-11-14 15:53:42,595 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:42,616 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2024-04-01' --> 'data\processed_data\CAT\4_2024-04-01.md'
Converted 'data\edgar_documents\CAT\4_2024-04-02' --> 'data\processed_data\CAT\4_2024-04-02.md'


2025-11-14 15:53:42,617 - INFO - Processing document 4_2024-04-29
2025-11-14 15:53:42,666 - INFO - Finished converting document 4_2024-04-29 in 0.08 sec.
2025-11-14 15:53:42,737 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:42,755 - INFO - Going to convert document batch...
2025-11-14 15:53:42,756 - INFO - Processing document 4_2024-04-30
2025-11-14 15:53:42,800 - INFO - Finished converting document 4_2024-04-30 in 0.08 sec.
2025-11-14 15:53:42,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:42,890 - INFO - Going to convert document batch...
2025-11-14 15:53:42,891 - INFO - Processing document 4_2024-05-02


Converted 'data\edgar_documents\CAT\4_2024-04-29' --> 'data\processed_data\CAT\4_2024-04-29.md'
Converted 'data\edgar_documents\CAT\4_2024-04-30' --> 'data\processed_data\CAT\4_2024-04-30.md'


2025-11-14 15:53:42,936 - INFO - Finished converting document 4_2024-05-02 in 0.09 sec.
2025-11-14 15:53:42,999 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:43,018 - INFO - Going to convert document batch...
2025-11-14 15:53:43,019 - INFO - Processing document 4_2024-05-06
2025-11-14 15:53:43,068 - INFO - Finished converting document 4_2024-05-06 in 0.08 sec.
2025-11-14 15:53:43,136 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:43,157 - INFO - Going to convert document batch...
2025-11-14 15:53:43,160 - INFO - Processing document 4_2024-05-07


Converted 'data\edgar_documents\CAT\4_2024-05-02' --> 'data\processed_data\CAT\4_2024-05-02.md'
Converted 'data\edgar_documents\CAT\4_2024-05-06' --> 'data\processed_data\CAT\4_2024-05-06.md'


2025-11-14 15:53:43,210 - INFO - Finished converting document 4_2024-05-07 in 0.09 sec.
2025-11-14 15:53:43,288 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:43,304 - INFO - Going to convert document batch...
2025-11-14 15:53:43,305 - INFO - Processing document 4_2024-05-08
2025-11-14 15:53:43,362 - INFO - Finished converting document 4_2024-05-08 in 0.09 sec.
2025-11-14 15:53:43,430 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:43,465 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2024-05-07' --> 'data\processed_data\CAT\4_2024-05-07.md'
Converted 'data\edgar_documents\CAT\4_2024-05-08' --> 'data\processed_data\CAT\4_2024-05-08.md'


2025-11-14 15:53:43,466 - INFO - Processing document 4_2024-05-14
2025-11-14 15:53:43,524 - INFO - Finished converting document 4_2024-05-14 in 0.11 sec.
2025-11-14 15:53:43,594 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:43,606 - INFO - Going to convert document batch...
2025-11-14 15:53:43,607 - INFO - Processing document 4_2024-05-22
2025-11-14 15:53:43,675 - INFO - Finished converting document 4_2024-05-22 in 0.09 sec.
2025-11-14 15:53:43,751 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:43,767 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2024-05-14' --> 'data\processed_data\CAT\4_2024-05-14.md'
Converted 'data\edgar_documents\CAT\4_2024-05-22' --> 'data\processed_data\CAT\4_2024-05-22.md'


2025-11-14 15:53:43,769 - INFO - Processing document 4_2024-05-28
2025-11-14 15:53:43,814 - INFO - Finished converting document 4_2024-05-28 in 0.09 sec.
2025-11-14 15:53:43,867 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:43,885 - INFO - Going to convert document batch...
2025-11-14 15:53:43,887 - INFO - Processing document 4_2024-05-31
2025-11-14 15:53:43,925 - INFO - Finished converting document 4_2024-05-31 in 0.06 sec.
2025-11-14 15:53:43,986 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:44,005 - INFO - Going to convert document batch...
2025-11-14 15:53:44,006 - INFO - Processing document 4_2024-06-13
2025-11-14 15:53:44,046 - INFO - Finished converting document 4_2024-06-13 in 0.09 sec.


Converted 'data\edgar_documents\CAT\4_2024-05-28' --> 'data\processed_data\CAT\4_2024-05-28.md'
Converted 'data\edgar_documents\CAT\4_2024-05-31' --> 'data\processed_data\CAT\4_2024-05-31.md'


2025-11-14 15:53:44,116 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:44,138 - INFO - Going to convert document batch...
2025-11-14 15:53:44,140 - INFO - Processing document 4_2024-06-27
2025-11-14 15:53:44,191 - INFO - Finished converting document 4_2024-06-27 in 0.08 sec.
2025-11-14 15:53:44,253 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:44,273 - INFO - Going to convert document batch...
2025-11-14 15:53:44,274 - INFO - Processing document 4_2024-07-01
2025-11-14 15:53:44,318 - INFO - Finished converting document 4_2024-07-01 in 0.08 sec.


Converted 'data\edgar_documents\CAT\4_2024-06-13' --> 'data\processed_data\CAT\4_2024-06-13.md'
Converted 'data\edgar_documents\CAT\4_2024-06-27' --> 'data\processed_data\CAT\4_2024-06-27.md'


2025-11-14 15:53:44,381 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:44,399 - INFO - Going to convert document batch...
2025-11-14 15:53:44,401 - INFO - Processing document 4_2024-07-17
2025-11-14 15:53:44,493 - INFO - Finished converting document 4_2024-07-17 in 0.12 sec.


Converted 'data\edgar_documents\CAT\4_2024-07-01' --> 'data\processed_data\CAT\4_2024-07-01.md'
Converted 'data\edgar_documents\CAT\4_2024-07-17' --> 'data\processed_data\CAT\4_2024-07-17.md'


2025-11-14 15:53:44,583 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:44,601 - INFO - Going to convert document batch...
2025-11-14 15:53:44,603 - INFO - Processing document 4_2024-07-29
2025-11-14 15:53:44,654 - INFO - Finished converting document 4_2024-07-29 in 0.11 sec.
2025-11-14 15:53:44,715 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:44,736 - INFO - Going to convert document batch...
2025-11-14 15:53:44,738 - INFO - Processing document 4_2024-08-23
2025-11-14 15:53:44,783 - INFO - Finished converting document 4_2024-08-23 in 0.08 sec.
2025-11-14 15:53:44,867 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:44,886 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2024-07-29' --> 'data\processed_data\CAT\4_2024-07-29.md'
Converted 'data\edgar_documents\CAT\4_2024-08-23' --> 'data\processed_data\CAT\4_2024-08-23.md'


2025-11-14 15:53:44,887 - INFO - Processing document 4_2024-08-27
2025-11-14 15:53:44,946 - INFO - Finished converting document 4_2024-08-27 in 0.09 sec.
2025-11-14 15:53:45,007 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:45,036 - INFO - Going to convert document batch...
2025-11-14 15:53:45,037 - INFO - Processing document 4_2024-09-03
2025-11-14 15:53:45,102 - INFO - Finished converting document 4_2024-09-03 in 0.09 sec.
2025-11-14 15:53:45,173 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:45,194 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2024-08-27' --> 'data\processed_data\CAT\4_2024-08-27.md'
Converted 'data\edgar_documents\CAT\4_2024-09-03' --> 'data\processed_data\CAT\4_2024-09-03.md'


2025-11-14 15:53:45,196 - INFO - Processing document 4_2024-09-05
2025-11-14 15:53:45,240 - INFO - Finished converting document 4_2024-09-05 in 0.08 sec.
2025-11-14 15:53:45,301 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:45,322 - INFO - Going to convert document batch...
2025-11-14 15:53:45,324 - INFO - Processing document 4_2024-09-27
2025-11-14 15:53:45,373 - INFO - Finished converting document 4_2024-09-27 in 0.09 sec.
2025-11-14 15:53:45,450 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\4_2024-09-05' --> 'data\processed_data\CAT\4_2024-09-05.md'
Converted 'data\edgar_documents\CAT\4_2024-09-27' --> 'data\processed_data\CAT\4_2024-09-27.md'


2025-11-14 15:53:45,470 - INFO - Going to convert document batch...
2025-11-14 15:53:45,472 - INFO - Processing document 4_2024-10-01
2025-11-14 15:53:45,523 - INFO - Finished converting document 4_2024-10-01 in 0.09 sec.
2025-11-14 15:53:45,582 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:45,605 - INFO - Going to convert document batch...
2025-11-14 15:53:45,607 - INFO - Processing document 4_2024-10-28
2025-11-14 15:53:45,660 - INFO - Finished converting document 4_2024-10-28 in 0.09 sec.
2025-11-14 15:53:45,743 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\4_2024-10-01' --> 'data\processed_data\CAT\4_2024-10-01.md'
Converted 'data\edgar_documents\CAT\4_2024-10-28' --> 'data\processed_data\CAT\4_2024-10-28.md'


2025-11-14 15:53:45,768 - INFO - Going to convert document batch...
2025-11-14 15:53:45,771 - INFO - Processing document 4_2024-11-04
2025-11-14 15:53:45,831 - INFO - Finished converting document 4_2024-11-04 in 0.11 sec.
2025-11-14 15:53:45,905 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:45,928 - INFO - Going to convert document batch...
2025-11-14 15:53:45,929 - INFO - Processing document 4_2024-11-05
2025-11-14 15:53:45,973 - INFO - Finished converting document 4_2024-11-05 in 0.08 sec.
2025-11-14 15:53:46,034 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:46,065 - INFO - Going to convert document batch...
2025-11-14 15:53:46,066 - INFO - Processing document 4_2024-11-07
2025-11-14 15:53:46,130 - INFO - Finished converting document 4_2024-11-07 in 0.11 sec.


Converted 'data\edgar_documents\CAT\4_2024-11-04' --> 'data\processed_data\CAT\4_2024-11-04.md'
Converted 'data\edgar_documents\CAT\4_2024-11-05' --> 'data\processed_data\CAT\4_2024-11-05.md'


2025-11-14 15:53:46,204 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:46,229 - INFO - Going to convert document batch...
2025-11-14 15:53:46,230 - INFO - Processing document 4_2024-11-08
2025-11-14 15:53:46,307 - INFO - Finished converting document 4_2024-11-08 in 0.12 sec.
2025-11-14 15:53:46,380 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\4_2024-11-07' --> 'data\processed_data\CAT\4_2024-11-07.md'
Converted 'data\edgar_documents\CAT\4_2024-11-08' --> 'data\processed_data\CAT\4_2024-11-08.md'


2025-11-14 15:53:46,404 - INFO - Going to convert document batch...
2025-11-14 15:53:46,405 - INFO - Processing document 4_2024-11-18
2025-11-14 15:53:46,462 - INFO - Finished converting document 4_2024-11-18 in 0.11 sec.
2025-11-14 15:53:46,540 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:46,561 - INFO - Going to convert document batch...
2025-11-14 15:53:46,562 - INFO - Processing document 4_2024-11-26
2025-11-14 15:53:46,616 - INFO - Finished converting document 4_2024-11-26 in 0.09 sec.
2025-11-14 15:53:46,687 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:46,718 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2024-11-18' --> 'data\processed_data\CAT\4_2024-11-18.md'
Converted 'data\edgar_documents\CAT\4_2024-11-26' --> 'data\processed_data\CAT\4_2024-11-26.md'


2025-11-14 15:53:46,719 - INFO - Processing document 4_2024-11-27
2025-11-14 15:53:46,780 - INFO - Finished converting document 4_2024-11-27 in 0.11 sec.
2025-11-14 15:53:46,872 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:46,901 - INFO - Going to convert document batch...
2025-11-14 15:53:46,903 - INFO - Processing document 4_2024-12-02
2025-11-14 15:53:46,993 - INFO - Finished converting document 4_2024-12-02 in 0.16 sec.


Converted 'data\edgar_documents\CAT\4_2024-11-27' --> 'data\processed_data\CAT\4_2024-11-27.md'


2025-11-14 15:53:47,081 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:47,101 - INFO - Going to convert document batch...
2025-11-14 15:53:47,102 - INFO - Processing document 4_2024-12-03
2025-11-14 15:53:47,142 - INFO - Finished converting document 4_2024-12-03 in 0.08 sec.
2025-11-14 15:53:47,226 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:47,243 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2024-12-02' --> 'data\processed_data\CAT\4_2024-12-02.md'
Converted 'data\edgar_documents\CAT\4_2024-12-03' --> 'data\processed_data\CAT\4_2024-12-03.md'


2025-11-14 15:53:47,245 - INFO - Processing document 4_2024-12-05
2025-11-14 15:53:47,279 - INFO - Finished converting document 4_2024-12-05 in 0.09 sec.
2025-11-14 15:53:47,344 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:47,361 - INFO - Going to convert document batch...
2025-11-14 15:53:47,363 - INFO - Processing document 4_2024-12-06
2025-11-14 15:53:47,414 - INFO - Finished converting document 4_2024-12-06 in 0.09 sec.
2025-11-14 15:53:47,501 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\4_2024-12-05' --> 'data\processed_data\CAT\4_2024-12-05.md'
Converted 'data\edgar_documents\CAT\4_2024-12-06' --> 'data\processed_data\CAT\4_2024-12-06.md'


2025-11-14 15:53:47,526 - INFO - Going to convert document batch...
2025-11-14 15:53:47,527 - INFO - Processing document 4_2024-12-27
2025-11-14 15:53:47,581 - INFO - Finished converting document 4_2024-12-27 in 0.11 sec.
2025-11-14 15:53:47,639 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:47,662 - INFO - Going to convert document batch...
2025-11-14 15:53:47,663 - INFO - Processing document 4_2025-01-02


Converted 'data\edgar_documents\CAT\4_2024-12-27' --> 'data\processed_data\CAT\4_2024-12-27.md'


2025-11-14 15:53:48,972 - INFO - Finished converting document 4_2025-01-02 in 1.34 sec.
2025-11-14 15:53:49,034 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:49,059 - INFO - Going to convert document batch...
2025-11-14 15:53:49,059 - INFO - Processing document 4_2025-01-14
2025-11-14 15:53:49,121 - INFO - Finished converting document 4_2025-01-14 in 0.11 sec.
2025-11-14 15:53:49,208 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\4_2025-01-02' --> 'data\processed_data\CAT\4_2025-01-02.md'
Converted 'data\edgar_documents\CAT\4_2025-01-14' --> 'data\processed_data\CAT\4_2025-01-14.md'


2025-11-14 15:53:49,228 - INFO - Going to convert document batch...
2025-11-14 15:53:49,229 - INFO - Processing document 4_2025-01-17
2025-11-14 15:53:49,275 - INFO - Finished converting document 4_2025-01-17 in 0.09 sec.
2025-11-14 15:53:49,346 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:49,367 - INFO - Going to convert document batch...
2025-11-14 15:53:49,368 - INFO - Processing document 4_2025-02-05
2025-11-14 15:53:49,424 - INFO - Finished converting document 4_2025-02-05 in 0.09 sec.
2025-11-14 15:53:49,510 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\4_2025-01-17' --> 'data\processed_data\CAT\4_2025-01-17.md'
Converted 'data\edgar_documents\CAT\4_2025-02-05' --> 'data\processed_data\CAT\4_2025-02-05.md'


2025-11-14 15:53:49,541 - INFO - Going to convert document batch...
2025-11-14 15:53:49,543 - INFO - Processing document 4_2025-02-13
2025-11-14 15:53:49,606 - INFO - Finished converting document 4_2025-02-13 in 0.12 sec.
2025-11-14 15:53:49,679 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:49,706 - INFO - Going to convert document batch...
2025-11-14 15:53:49,707 - INFO - Processing document 4_2025-02-19
2025-11-14 15:53:49,771 - INFO - Finished converting document 4_2025-02-19 in 0.11 sec.
2025-11-14 15:53:49,857 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\4_2025-02-13' --> 'data\processed_data\CAT\4_2025-02-13.md'
Converted 'data\edgar_documents\CAT\4_2025-02-19' --> 'data\processed_data\CAT\4_2025-02-19.md'


2025-11-14 15:53:49,882 - INFO - Going to convert document batch...
2025-11-14 15:53:49,884 - INFO - Processing document 4_2025-03-05
2025-11-14 15:53:49,948 - INFO - Finished converting document 4_2025-03-05 in 0.11 sec.
2025-11-14 15:53:50,027 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:50,050 - INFO - Going to convert document batch...
2025-11-14 15:53:50,051 - INFO - Processing document 4_2025-03-10
2025-11-14 15:53:50,105 - INFO - Finished converting document 4_2025-03-10 in 0.09 sec.
2025-11-14 15:53:50,185 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:50,211 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2025-03-05' --> 'data\processed_data\CAT\4_2025-03-05.md'
Converted 'data\edgar_documents\CAT\4_2025-03-10' --> 'data\processed_data\CAT\4_2025-03-10.md'


2025-11-14 15:53:50,213 - INFO - Processing document 4_2025-03-17
2025-11-14 15:53:50,286 - INFO - Finished converting document 4_2025-03-17 in 0.11 sec.
2025-11-14 15:53:50,459 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:50,495 - INFO - Going to convert document batch...
2025-11-14 15:53:50,497 - INFO - Processing document 4_2025-04-02
2025-11-14 15:53:50,558 - INFO - Finished converting document 4_2025-04-02 in 0.16 sec.


Converted 'data\edgar_documents\CAT\4_2025-03-17' --> 'data\processed_data\CAT\4_2025-03-17.md'


2025-11-14 15:53:50,641 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:50,666 - INFO - Going to convert document batch...
2025-11-14 15:53:50,667 - INFO - Processing document 4_2025-04-22
2025-11-14 15:53:50,728 - INFO - Finished converting document 4_2025-04-22 in 0.09 sec.
2025-11-14 15:53:50,812 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\4_2025-04-02' --> 'data\processed_data\CAT\4_2025-04-02.md'
Converted 'data\edgar_documents\CAT\4_2025-04-22' --> 'data\processed_data\CAT\4_2025-04-22.md'


2025-11-14 15:53:50,834 - INFO - Going to convert document batch...
2025-11-14 15:53:50,837 - INFO - Processing document 4_2025-04-28
2025-11-14 15:53:50,913 - INFO - Finished converting document 4_2025-04-28 in 0.12 sec.
2025-11-14 15:53:51,012 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:51,040 - INFO - Going to convert document batch...
2025-11-14 15:53:51,041 - INFO - Processing document 4_2025-05-05
2025-11-14 15:53:51,102 - INFO - Finished converting document 4_2025-05-05 in 0.11 sec.
2025-11-14 15:53:51,179 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\4_2025-04-28' --> 'data\processed_data\CAT\4_2025-04-28.md'
Converted 'data\edgar_documents\CAT\4_2025-05-05' --> 'data\processed_data\CAT\4_2025-05-05.md'


2025-11-14 15:53:51,203 - INFO - Going to convert document batch...
2025-11-14 15:53:51,205 - INFO - Processing document 4_2025-05-08
2025-11-14 15:53:51,267 - INFO - Finished converting document 4_2025-05-08 in 0.11 sec.
2025-11-14 15:53:51,354 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:53:51,355 - ERROR - Input document 4_2025-05-12 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:53:51,358 - INFO - Going to convert document batch...
2025-11-14 15:53:51,380 - IN

Converted 'data\edgar_documents\CAT\4_2025-05-08' --> 'data\processed_data\CAT\4_2025-05-08.md'
Error processing data\edgar_documents\CAT\4_2025-05-12: File format not allowed: data\edgar_documents\CAT\4_2025-05-12
Converted 'data\edgar_documents\CAT\4_2025-05-13' --> 'data\processed_data\CAT\4_2025-05-13.md'


2025-11-14 15:53:51,568 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:53:51,568 - ERROR - Input document 4_2025-05-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:53:51,570 - INFO - Going to convert document batch...
2025-11-14 15:53:51,586 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:51,608 - INFO - Going to convert document batch...
2025-11-14 15:53:51,609 - INFO - Processing document 4_2025-05-27
2025-11-14 15:53:51,657 - INFO - Fin

Error processing data\edgar_documents\CAT\4_2025-05-14: File format not allowed: data\edgar_documents\CAT\4_2025-05-14
Converted 'data\edgar_documents\CAT\4_2025-05-27' --> 'data\processed_data\CAT\4_2025-05-27.md'


2025-11-14 15:53:51,796 - INFO - Finished converting document 4_2025-06-13 in 0.09 sec.
2025-11-14 15:53:51,864 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:51,883 - INFO - Going to convert document batch...
2025-11-14 15:53:51,885 - INFO - Processing document 4_2025-06-27
2025-11-14 15:53:51,930 - INFO - Finished converting document 4_2025-06-27 in 0.08 sec.
2025-11-14 15:53:52,001 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:52,020 - INFO - Going to convert document batch...
2025-11-14 15:53:52,021 - INFO - Processing document 4_2025-07-02


Converted 'data\edgar_documents\CAT\4_2025-06-13' --> 'data\processed_data\CAT\4_2025-06-13.md'
Converted 'data\edgar_documents\CAT\4_2025-06-27' --> 'data\processed_data\CAT\4_2025-06-27.md'


2025-11-14 15:53:52,067 - INFO - Finished converting document 4_2025-07-02 in 0.09 sec.
2025-11-14 15:53:52,129 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:52,153 - INFO - Going to convert document batch...
2025-11-14 15:53:52,154 - INFO - Processing document 4_2025-07-21
2025-11-14 15:53:52,213 - INFO - Finished converting document 4_2025-07-21 in 0.11 sec.
2025-11-14 15:53:52,315 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\4_2025-07-02' --> 'data\processed_data\CAT\4_2025-07-02.md'
Converted 'data\edgar_documents\CAT\4_2025-07-21' --> 'data\processed_data\CAT\4_2025-07-21.md'


2025-11-14 15:53:52,342 - INFO - Going to convert document batch...
2025-11-14 15:53:52,344 - INFO - Processing document 4_2025-07-28
2025-11-14 15:53:52,398 - INFO - Finished converting document 4_2025-07-28 in 0.11 sec.
2025-11-14 15:53:52,458 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:52,479 - INFO - Going to convert document batch...
2025-11-14 15:53:52,480 - INFO - Processing document 4_2025-08-08
2025-11-14 15:53:52,538 - INFO - Finished converting document 4_2025-08-08 in 0.09 sec.
2025-11-14 15:53:52,616 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:52,644 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2025-07-28' --> 'data\processed_data\CAT\4_2025-07-28.md'
Converted 'data\edgar_documents\CAT\4_2025-08-08' --> 'data\processed_data\CAT\4_2025-08-08.md'


2025-11-14 15:53:52,647 - INFO - Processing document 4_2025-08-13
2025-11-14 15:53:52,720 - INFO - Finished converting document 4_2025-08-13 in 0.14 sec.
2025-11-14 15:53:52,794 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:52,812 - INFO - Going to convert document batch...
2025-11-14 15:53:52,813 - INFO - Processing document 4_2025-08-19
2025-11-14 15:53:52,861 - INFO - Finished converting document 4_2025-08-19 in 0.08 sec.
2025-11-14 15:53:52,936 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:52,956 - INFO - Going to convert document batch...
2025-11-14 15:53:52,957 - INFO - Processing document 4_2025-08-27


Converted 'data\edgar_documents\CAT\4_2025-08-13' --> 'data\processed_data\CAT\4_2025-08-13.md'
Converted 'data\edgar_documents\CAT\4_2025-08-19' --> 'data\processed_data\CAT\4_2025-08-19.md'


2025-11-14 15:53:53,014 - INFO - Finished converting document 4_2025-08-27 in 0.11 sec.
2025-11-14 15:53:53,087 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:53,108 - INFO - Going to convert document batch...
2025-11-14 15:53:53,109 - INFO - Processing document 4_2025-09-03
2025-11-14 15:53:53,164 - INFO - Finished converting document 4_2025-09-03 in 0.09 sec.
2025-11-14 15:53:53,242 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\4_2025-08-27' --> 'data\processed_data\CAT\4_2025-08-27.md'
Converted 'data\edgar_documents\CAT\4_2025-09-03' --> 'data\processed_data\CAT\4_2025-09-03.md'


2025-11-14 15:53:53,269 - INFO - Going to convert document batch...
2025-11-14 15:53:53,271 - INFO - Processing document 4_2025-09-23
2025-11-14 15:53:53,312 - INFO - Finished converting document 4_2025-09-23 in 0.09 sec.
2025-11-14 15:53:53,370 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:53,387 - INFO - Going to convert document batch...
2025-11-14 15:53:53,388 - INFO - Processing document 4_2025-09-29
2025-11-14 15:53:53,432 - INFO - Finished converting document 4_2025-09-29 in 0.06 sec.
2025-11-14 15:53:53,503 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:53,527 - INFO - Going to convert document batch...
2025-11-14 15:53:53,530 - INFO - Processing document 4_2025-10-01


Converted 'data\edgar_documents\CAT\4_2025-09-23' --> 'data\processed_data\CAT\4_2025-09-23.md'
Converted 'data\edgar_documents\CAT\4_2025-09-29' --> 'data\processed_data\CAT\4_2025-09-29.md'


2025-11-14 15:53:53,585 - INFO - Finished converting document 4_2025-10-01 in 0.11 sec.
2025-11-14 15:53:53,646 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:53,680 - INFO - Going to convert document batch...
2025-11-14 15:53:53,681 - INFO - Processing document 4_2025-10-14
2025-11-14 15:53:53,747 - INFO - Finished converting document 4_2025-10-14 in 0.12 sec.


Converted 'data\edgar_documents\CAT\4_2025-10-01' --> 'data\processed_data\CAT\4_2025-10-01.md'
Converted 'data\edgar_documents\CAT\4_2025-10-14' --> 'data\processed_data\CAT\4_2025-10-14.md'


2025-11-14 15:53:53,846 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:53,874 - INFO - Going to convert document batch...
2025-11-14 15:53:53,876 - INFO - Processing document 4_2025-10-27
2025-11-14 15:53:53,929 - INFO - Finished converting document 4_2025-10-27 in 0.11 sec.
2025-11-14 15:53:53,984 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:54,004 - INFO - Going to convert document batch...
2025-11-14 15:53:54,005 - INFO - Processing document 4_2025-11-06
2025-11-14 15:53:54,060 - INFO - Finished converting document 4_2025-11-06 in 0.09 sec.
2025-11-14 15:53:54,131 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:54,152 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CAT\4_2025-10-27' --> 'data\processed_data\CAT\4_2025-10-27.md'
Converted 'data\edgar_documents\CAT\4_2025-11-06' --> 'data\processed_data\CAT\4_2025-11-06.md'


2025-11-14 15:53:54,153 - INFO - Processing document 4_2025-11-07
2025-11-14 15:53:54,206 - INFO - Finished converting document 4_2025-11-07 in 0.09 sec.
2025-11-14 15:53:54,304 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:54,354 - INFO - Going to convert document batch...
2025-11-14 15:53:54,355 - INFO - Processing document 8-K_2023-01-31
2025-11-14 15:53:54,422 - INFO - Finished converting document 8-K_2023-01-31 in 0.14 sec.


Converted 'data\edgar_documents\CAT\4_2025-11-07' --> 'data\processed_data\CAT\4_2025-11-07.md'


2025-11-14 15:53:54,586 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:54,628 - INFO - Going to convert document batch...
2025-11-14 15:53:54,629 - INFO - Processing document 8-K_2023-02-02
2025-11-14 15:53:54,689 - INFO - Finished converting document 8-K_2023-02-02 in 0.12 sec.


Converted 'data\edgar_documents\CAT\8-K_2023-01-31' --> 'data\processed_data\CAT\8-K_2023-01-31.md'


2025-11-14 15:53:54,825 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:54,862 - INFO - Going to convert document batch...
2025-11-14 15:53:54,863 - INFO - Processing document 8-K_2023-04-27
2025-11-14 15:53:54,919 - INFO - Finished converting document 8-K_2023-04-27 in 0.11 sec.


Converted 'data\edgar_documents\CAT\8-K_2023-02-02' --> 'data\processed_data\CAT\8-K_2023-02-02.md'


2025-11-14 15:53:55,073 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:55,127 - INFO - Going to convert document batch...
2025-11-14 15:53:55,129 - INFO - Processing document 8-K_2023-06-20
2025-11-14 15:53:55,239 - INFO - Finished converting document 8-K_2023-06-20 in 0.17 sec.


Converted 'data\edgar_documents\CAT\8-K_2023-04-27' --> 'data\processed_data\CAT\8-K_2023-04-27.md'


2025-11-14 15:53:55,327 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:55,371 - INFO - Going to convert document batch...
2025-11-14 15:53:55,373 - INFO - Processing document 8-K_2023-08-01
2025-11-14 15:53:55,435 - INFO - Finished converting document 8-K_2023-08-01 in 0.12 sec.


Converted 'data\edgar_documents\CAT\8-K_2023-06-20' --> 'data\processed_data\CAT\8-K_2023-06-20.md'


2025-11-14 15:53:55,607 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:55,643 - INFO - Going to convert document batch...
2025-11-14 15:53:55,645 - INFO - Processing document 8-K_2023-08-09
2025-11-14 15:53:55,707 - INFO - Finished converting document 8-K_2023-08-09 in 0.11 sec.


Converted 'data\edgar_documents\CAT\8-K_2023-08-01' --> 'data\processed_data\CAT\8-K_2023-08-01.md'


2025-11-14 15:53:55,863 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:55,895 - INFO - Going to convert document batch...
2025-11-14 15:53:55,896 - INFO - Processing document 8-K_2023-09-01
2025-11-14 15:53:56,009 - INFO - Finished converting document 8-K_2023-09-01 in 0.16 sec.


Converted 'data\edgar_documents\CAT\8-K_2023-08-09' --> 'data\processed_data\CAT\8-K_2023-08-09.md'


2025-11-14 15:53:56,091 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:56,134 - INFO - Going to convert document batch...
2025-11-14 15:53:56,136 - INFO - Processing document 8-K_2023-10-16
2025-11-14 15:53:56,191 - INFO - Finished converting document 8-K_2023-10-16 in 0.11 sec.


Converted 'data\edgar_documents\CAT\8-K_2023-09-01' --> 'data\processed_data\CAT\8-K_2023-09-01.md'


2025-11-14 15:53:56,342 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:56,385 - INFO - Going to convert document batch...
2025-11-14 15:53:56,387 - INFO - Processing document 8-K_2023-10-31
2025-11-14 15:53:56,454 - INFO - Finished converting document 8-K_2023-10-31 in 0.12 sec.


Converted 'data\edgar_documents\CAT\8-K_2023-10-16' --> 'data\processed_data\CAT\8-K_2023-10-16.md'


2025-11-14 15:53:56,623 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:56,663 - INFO - Going to convert document batch...
2025-11-14 15:53:56,665 - INFO - Processing document 8-K_2023-12-14
2025-11-14 15:53:56,725 - INFO - Finished converting document 8-K_2023-12-14 in 0.12 sec.


Converted 'data\edgar_documents\CAT\8-K_2023-10-31' --> 'data\processed_data\CAT\8-K_2023-10-31.md'


2025-11-14 15:53:56,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:56,919 - INFO - Going to convert document batch...
2025-11-14 15:53:56,921 - INFO - Processing document 8-K_2024-02-05
2025-11-14 15:53:56,978 - INFO - Finished converting document 8-K_2024-02-05 in 0.11 sec.


Converted 'data\edgar_documents\CAT\8-K_2023-12-14' --> 'data\processed_data\CAT\8-K_2023-12-14.md'


2025-11-14 15:53:57,123 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:57,155 - INFO - Going to convert document batch...
2025-11-14 15:53:57,156 - INFO - Processing document 8-K_2024-04-03
2025-11-14 15:53:57,211 - INFO - Finished converting document 8-K_2024-04-03 in 0.09 sec.


Converted 'data\edgar_documents\CAT\8-K_2024-02-05' --> 'data\processed_data\CAT\8-K_2024-02-05.md'


2025-11-14 15:53:57,371 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:57,405 - INFO - Going to convert document batch...
2025-11-14 15:53:57,407 - INFO - Processing document 8-K_2024-04-25
2025-11-14 15:53:57,498 - INFO - Finished converting document 8-K_2024-04-25 in 0.14 sec.


Converted 'data\edgar_documents\CAT\8-K_2024-04-03' --> 'data\processed_data\CAT\8-K_2024-04-03.md'


2025-11-14 15:53:57,667 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:57,705 - INFO - Going to convert document batch...
2025-11-14 15:53:57,706 - INFO - Processing document 8-K_2024-06-14
2025-11-14 15:53:57,785 - INFO - Finished converting document 8-K_2024-06-14 in 0.14 sec.


Converted 'data\edgar_documents\CAT\8-K_2024-04-25' --> 'data\processed_data\CAT\8-K_2024-04-25.md'
Converted 'data\edgar_documents\CAT\8-K_2024-06-14' --> 'data\processed_data\CAT\8-K_2024-06-14.md'


2025-11-14 15:53:57,873 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:57,902 - INFO - Going to convert document batch...
2025-11-14 15:53:57,904 - INFO - Processing document 8-K_2024-08-06
2025-11-14 15:53:57,970 - INFO - Finished converting document 8-K_2024-08-06 in 0.12 sec.
2025-11-14 15:53:58,127 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:58,164 - INFO - Going to convert document batch...
2025-11-14 15:53:58,165 - INFO - Processing document 8-K_2024-09-04


Converted 'data\edgar_documents\CAT\8-K_2024-08-06' --> 'data\processed_data\CAT\8-K_2024-08-06.md'


2025-11-14 15:53:58,768 - INFO - Finished converting document 8-K_2024-09-04 in 0.66 sec.
2025-11-14 15:53:58,837 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:58,877 - INFO - Going to convert document batch...
2025-11-14 15:53:58,878 - INFO - Processing document 8-K_2024-10-11
2025-11-14 15:53:58,925 - INFO - Finished converting document 8-K_2024-10-11 in 0.09 sec.


Converted 'data\edgar_documents\CAT\8-K_2024-09-04' --> 'data\processed_data\CAT\8-K_2024-09-04.md'


2025-11-14 15:53:59,110 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:59,148 - INFO - Going to convert document batch...
2025-11-14 15:53:59,150 - INFO - Processing document 8-K_2024-10-30
2025-11-14 15:53:59,230 - INFO - Finished converting document 8-K_2024-10-30 in 0.14 sec.


Converted 'data\edgar_documents\CAT\8-K_2024-10-11' --> 'data\processed_data\CAT\8-K_2024-10-11.md'


2025-11-14 15:53:59,371 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:59,402 - INFO - Going to convert document batch...
2025-11-14 15:53:59,404 - INFO - Processing document 8-K_2025-01-30
2025-11-14 15:53:59,454 - INFO - Finished converting document 8-K_2025-01-30 in 0.09 sec.


Converted 'data\edgar_documents\CAT\8-K_2024-10-30' --> 'data\processed_data\CAT\8-K_2024-10-30.md'


2025-11-14 15:53:59,582 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:59,609 - INFO - Going to convert document batch...
2025-11-14 15:53:59,610 - INFO - Processing document 8-K_2025-04-09
2025-11-14 15:53:59,683 - INFO - Finished converting document 8-K_2025-04-09 in 0.12 sec.
2025-11-14 15:53:59,753 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\8-K_2025-01-30' --> 'data\processed_data\CAT\8-K_2025-01-30.md'
Converted 'data\edgar_documents\CAT\8-K_2025-04-09' --> 'data\processed_data\CAT\8-K_2025-04-09.md'


2025-11-14 15:53:59,786 - INFO - Going to convert document batch...
2025-11-14 15:53:59,787 - INFO - Processing document 8-K_2025-04-15
2025-11-14 15:53:59,845 - INFO - Finished converting document 8-K_2025-04-15 in 0.12 sec.
2025-11-14 15:53:59,928 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:53:59,971 - INFO - Going to convert document batch...
2025-11-14 15:53:59,973 - INFO - Processing document 8-K_2025-04-30
2025-11-14 15:54:00,046 - INFO - Finished converting document 8-K_2025-04-30 in 0.14 sec.


Converted 'data\edgar_documents\CAT\8-K_2025-04-15' --> 'data\processed_data\CAT\8-K_2025-04-15.md'


2025-11-14 15:54:00,239 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:54:00,276 - INFO - Going to convert document batch...
2025-11-14 15:54:00,278 - INFO - Processing document 8-K_2025-05-15
2025-11-14 15:54:00,349 - INFO - Finished converting document 8-K_2025-05-15 in 0.12 sec.
2025-11-14 15:54:00,412 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\8-K_2025-04-30' --> 'data\processed_data\CAT\8-K_2025-04-30.md'
Converted 'data\edgar_documents\CAT\8-K_2025-05-15' --> 'data\processed_data\CAT\8-K_2025-05-15.md'


2025-11-14 15:54:00,454 - INFO - Going to convert document batch...
2025-11-14 15:54:00,455 - INFO - Processing document 8-K_2025-06-12
2025-11-14 15:54:00,552 - INFO - Finished converting document 8-K_2025-06-12 in 0.16 sec.
2025-11-14 15:54:00,627 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:54:00,671 - INFO - Going to convert document batch...
2025-11-14 15:54:00,672 - INFO - Processing document 8-K_2025-08-05
2025-11-14 15:54:00,731 - INFO - Finished converting document 8-K_2025-08-05 in 0.12 sec.


Converted 'data\edgar_documents\CAT\8-K_2025-06-12' --> 'data\processed_data\CAT\8-K_2025-06-12.md'


2025-11-14 15:54:00,880 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:54:00,908 - INFO - Going to convert document batch...
2025-11-14 15:54:00,909 - INFO - Processing document 8-K_2025-08-28
2025-11-14 15:54:00,966 - INFO - Finished converting document 8-K_2025-08-28 in 0.11 sec.
2025-11-14 15:54:01,033 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\8-K_2025-08-05' --> 'data\processed_data\CAT\8-K_2025-08-05.md'
Converted 'data\edgar_documents\CAT\8-K_2025-08-28' --> 'data\processed_data\CAT\8-K_2025-08-28.md'


2025-11-14 15:54:01,073 - INFO - Going to convert document batch...
2025-11-14 15:54:01,075 - INFO - Processing document 8-K_2025-09-03
2025-11-14 15:54:01,178 - INFO - Finished converting document 8-K_2025-09-03 in 0.16 sec.
2025-11-14 15:54:01,256 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:54:01,286 - INFO - Going to convert document batch...
2025-11-14 15:54:01,287 - INFO - Processing document 8-K_2025-10-29
2025-11-14 15:54:01,341 - INFO - Finished converting document 8-K_2025-10-29 in 0.11 sec.


Converted 'data\edgar_documents\CAT\8-K_2025-09-03' --> 'data\processed_data\CAT\8-K_2025-09-03.md'


2025-11-14 15:54:01,573 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:54:01,574 - ERROR - Input document DEF-14A_2023-05-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:54:01,581 - INFO - Going to convert document batch...
2025-11-14 15:54:01,612 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\8-K_2025-10-29' --> 'data\processed_data\CAT\8-K_2025-10-29.md'
Error processing data\edgar_documents\CAT\DEF-14A_2023-05-01: File format not allowed: data\edgar_documents\CAT\DEF-14A_2023-05-01


2025-11-14 15:54:02,571 - INFO - Going to convert document batch...
2025-11-14 15:54:02,572 - INFO - Processing document DEF-14A_2024-04-29
2025-11-14 15:54:05,655 - INFO - Finished converting document DEF-14A_2024-04-29 in 4.08 sec.
2025-11-14 15:54:07,489 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\DEF-14A_2024-04-29' --> 'data\processed_data\CAT\DEF-14A_2024-04-29.md'


2025-11-14 15:54:08,493 - INFO - Going to convert document batch...
2025-11-14 15:54:08,494 - INFO - Processing document DEF-14A_2025-04-30
2025-11-14 15:54:31,173 - INFO - Finished converting document DEF-14A_2025-04-30 in 23.72 sec.
2025-11-14 15:54:33,595 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CAT\DEF-14A_2025-04-30' --> 'data\processed_data\CAT\DEF-14A_2025-04-30.md'
Processed 162 new files. Errors: 3
Found 168 files to process in data\edgar_documents\CHTR


2025-11-14 15:54:34,830 - INFO - Going to convert document batch...
2025-11-14 15:54:34,831 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:54:34,832 - INFO - Processing document 10-K_2023-01-27
2025-11-14 15:54:40,269 - INFO - Finished converting document 10-K_2023-01-27 in 6.77 sec.
2025-11-14 15:54:41,769 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\10-K_2023-01-27' --> 'data\processed_data\CHTR\10-K_2023-01-27.md'


2025-11-14 15:54:43,158 - INFO - Going to convert document batch...
2025-11-14 15:54:43,159 - INFO - Processing document 10-K_2024-02-02
2025-11-14 15:54:48,257 - INFO - Finished converting document 10-K_2024-02-02 in 6.58 sec.
2025-11-14 15:54:49,788 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\10-K_2024-02-02' --> 'data\processed_data\CHTR\10-K_2024-02-02.md'


2025-11-14 15:54:51,223 - INFO - Going to convert document batch...
2025-11-14 15:54:51,224 - INFO - Processing document 10-K_2025-01-31
2025-11-14 15:54:56,198 - INFO - Finished converting document 10-K_2025-01-31 in 6.52 sec.
2025-11-14 15:54:57,634 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\10-K_2025-01-31' --> 'data\processed_data\CHTR\10-K_2025-01-31.md'


2025-11-14 15:54:59,035 - INFO - Going to convert document batch...
2025-11-14 15:54:59,036 - INFO - Processing document 10-Q_2023-04-28
2025-11-14 15:55:00,171 - INFO - Finished converting document 10-Q_2023-04-28 in 2.56 sec.
2025-11-14 15:55:00,734 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\10-Q_2023-04-28' --> 'data\processed_data\CHTR\10-Q_2023-04-28.md'


2025-11-14 15:55:01,426 - INFO - Going to convert document batch...
2025-11-14 15:55:01,429 - INFO - Processing document 10-Q_2023-07-28
2025-11-14 15:55:02,778 - INFO - Finished converting document 10-Q_2023-07-28 in 2.11 sec.
2025-11-14 15:55:03,519 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\10-Q_2023-07-28' --> 'data\processed_data\CHTR\10-Q_2023-07-28.md'


2025-11-14 15:55:04,228 - INFO - Going to convert document batch...
2025-11-14 15:55:04,229 - INFO - Processing document 10-Q_2023-10-27
2025-11-14 15:55:05,843 - INFO - Finished converting document 10-Q_2023-10-27 in 2.36 sec.
2025-11-14 15:55:06,415 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\10-Q_2023-10-27' --> 'data\processed_data\CHTR\10-Q_2023-10-27.md'


2025-11-14 15:55:07,667 - INFO - Going to convert document batch...
2025-11-14 15:55:07,668 - INFO - Processing document 10-Q_2024-04-26
2025-11-14 15:55:08,654 - INFO - Finished converting document 10-Q_2024-04-26 in 2.30 sec.
2025-11-14 15:55:09,252 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\10-Q_2024-04-26' --> 'data\processed_data\CHTR\10-Q_2024-04-26.md'


2025-11-14 15:55:09,945 - INFO - Going to convert document batch...
2025-11-14 15:55:09,946 - INFO - Processing document 10-Q_2024-07-26
2025-11-14 15:55:11,068 - INFO - Finished converting document 10-Q_2024-07-26 in 1.84 sec.
2025-11-14 15:55:11,611 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\10-Q_2024-07-26' --> 'data\processed_data\CHTR\10-Q_2024-07-26.md'


2025-11-14 15:55:12,738 - INFO - Going to convert document batch...
2025-11-14 15:55:12,739 - INFO - Processing document 10-Q_2024-11-01
2025-11-14 15:55:13,827 - INFO - Finished converting document 10-Q_2024-11-01 in 2.25 sec.
2025-11-14 15:55:14,491 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\10-Q_2024-11-01' --> 'data\processed_data\CHTR\10-Q_2024-11-01.md'


2025-11-14 15:55:14,969 - INFO - Going to convert document batch...
2025-11-14 15:55:14,971 - INFO - Processing document 10-Q_2025-04-25
2025-11-14 15:55:16,202 - INFO - Finished converting document 10-Q_2025-04-25 in 1.75 sec.
2025-11-14 15:55:16,783 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\10-Q_2025-04-25' --> 'data\processed_data\CHTR\10-Q_2025-04-25.md'


2025-11-14 15:55:17,510 - INFO - Going to convert document batch...
2025-11-14 15:55:17,511 - INFO - Processing document 10-Q_2025-07-25
2025-11-14 15:55:18,916 - INFO - Finished converting document 10-Q_2025-07-25 in 2.19 sec.
2025-11-14 15:55:19,480 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\10-Q_2025-07-25' --> 'data\processed_data\CHTR\10-Q_2025-07-25.md'


2025-11-14 15:55:20,750 - INFO - Going to convert document batch...
2025-11-14 15:55:20,751 - INFO - Processing document 10-Q_2025-10-31
2025-11-14 15:55:22,011 - INFO - Finished converting document 10-Q_2025-10-31 in 2.58 sec.
2025-11-14 15:55:22,535 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:22,555 - INFO - Going to convert document batch...
2025-11-14 15:55:22,558 - INFO - Processing document 4_2023-01-06
2025-11-14 15:55:22,597 - INFO - Finished converting document 4_2023-01-06 in 0.08 sec.
2025-11-14 15:55:22,659 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:22,673 - INFO - Going to convert document batch...
2025-11-14 15:55:22,674 - INFO - Processing document 4_2023-01-18
2025-11-14 15:55:22,706 - INFO - Finished converting document 4_2023-01-18 in 0.06 sec.


Converted 'data\edgar_documents\CHTR\10-Q_2025-10-31' --> 'data\processed_data\CHTR\10-Q_2025-10-31.md'
Converted 'data\edgar_documents\CHTR\4_2023-01-06' --> 'data\processed_data\CHTR\4_2023-01-06.md'


2025-11-14 15:55:22,756 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:22,787 - INFO - Going to convert document batch...
2025-11-14 15:55:22,788 - INFO - Processing document 4_2023-01-19
2025-11-14 15:55:22,862 - INFO - Finished converting document 4_2023-01-19 in 0.12 sec.
2025-11-14 15:55:22,943 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\4_2023-01-18' --> 'data\processed_data\CHTR\4_2023-01-18.md'
Converted 'data\edgar_documents\CHTR\4_2023-01-19' --> 'data\processed_data\CHTR\4_2023-01-19.md'


2025-11-14 15:55:22,958 - INFO - Going to convert document batch...
2025-11-14 15:55:22,959 - INFO - Processing document 4_2023-02-01
2025-11-14 15:55:22,992 - INFO - Finished converting document 4_2023-02-01 in 0.06 sec.
2025-11-14 15:55:23,038 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:23,053 - INFO - Going to convert document batch...
2025-11-14 15:55:23,054 - INFO - Processing document 4_2023-02-03
2025-11-14 15:55:23,088 - INFO - Finished converting document 4_2023-02-03 in 0.08 sec.
2025-11-14 15:55:23,138 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:23,155 - INFO - Going to convert document batch...
2025-11-14 15:55:23,156 - INFO - Processing document 4_2023-02-24
2025-11-14 15:55:23,197 - INFO - Finished converting document 4_2023-02-24 in 0.06 sec.


Converted 'data\edgar_documents\CHTR\4_2023-02-01' --> 'data\processed_data\CHTR\4_2023-02-01.md'
Converted 'data\edgar_documents\CHTR\4_2023-02-03' --> 'data\processed_data\CHTR\4_2023-02-03.md'


2025-11-14 15:55:23,249 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:23,272 - INFO - Going to convert document batch...
2025-11-14 15:55:23,273 - INFO - Processing document 4_2023-03-01
2025-11-14 15:55:23,327 - INFO - Finished converting document 4_2023-03-01 in 0.09 sec.
2025-11-14 15:55:23,412 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:23,426 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CHTR\4_2023-02-24' --> 'data\processed_data\CHTR\4_2023-02-24.md'
Converted 'data\edgar_documents\CHTR\4_2023-03-01' --> 'data\processed_data\CHTR\4_2023-03-01.md'


2025-11-14 15:55:23,428 - INFO - Processing document 4_2023-03-06
2025-11-14 15:55:23,464 - INFO - Finished converting document 4_2023-03-06 in 0.08 sec.
2025-11-14 15:55:23,514 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:23,533 - INFO - Going to convert document batch...
2025-11-14 15:55:23,534 - INFO - Processing document 4_2023-03-21
2025-11-14 15:55:23,575 - INFO - Finished converting document 4_2023-03-21 in 0.08 sec.
2025-11-14 15:55:23,640 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:23,659 - INFO - Going to convert document batch...
2025-11-14 15:55:23,659 - INFO - Processing document 4_2023-04-07
2025-11-14 15:55:23,698 - INFO - Finished converting document 4_2023-04-07 in 0.08 sec.


Converted 'data\edgar_documents\CHTR\4_2023-03-06' --> 'data\processed_data\CHTR\4_2023-03-06.md'
Converted 'data\edgar_documents\CHTR\4_2023-03-21' --> 'data\processed_data\CHTR\4_2023-03-21.md'


2025-11-14 15:55:23,767 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:23,788 - INFO - Going to convert document batch...
2025-11-14 15:55:23,789 - INFO - Processing document 4_2023-04-26
2025-11-14 15:55:23,831 - INFO - Finished converting document 4_2023-04-26 in 0.08 sec.
2025-11-14 15:55:23,905 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:23,920 - INFO - Going to convert document batch...
2025-11-14 15:55:23,923 - INFO - Processing document 4_2023-05-08


Converted 'data\edgar_documents\CHTR\4_2023-04-07' --> 'data\processed_data\CHTR\4_2023-04-07.md'
Converted 'data\edgar_documents\CHTR\4_2023-04-26' --> 'data\processed_data\CHTR\4_2023-04-26.md'


2025-11-14 15:55:23,961 - INFO - Finished converting document 4_2023-05-08 in 0.08 sec.
2025-11-14 15:55:24,028 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:24,045 - INFO - Going to convert document batch...
2025-11-14 15:55:24,051 - INFO - Processing document 4_2023-05-16
2025-11-14 15:55:24,104 - INFO - Finished converting document 4_2023-05-16 in 0.09 sec.
2025-11-14 15:55:24,165 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:24,184 - INFO - Going to convert document batch...
2025-11-14 15:55:24,186 - INFO - Processing document 4_2023-06-07


Converted 'data\edgar_documents\CHTR\4_2023-05-08' --> 'data\processed_data\CHTR\4_2023-05-08.md'
Converted 'data\edgar_documents\CHTR\4_2023-05-16' --> 'data\processed_data\CHTR\4_2023-05-16.md'


2025-11-14 15:55:24,228 - INFO - Finished converting document 4_2023-06-07 in 0.06 sec.
2025-11-14 15:55:24,294 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:24,330 - INFO - Going to convert document batch...
2025-11-14 15:55:24,330 - INFO - Processing document 4_2023-06-16
2025-11-14 15:55:24,431 - INFO - Finished converting document 4_2023-06-16 in 0.14 sec.


Converted 'data\edgar_documents\CHTR\4_2023-06-07' --> 'data\processed_data\CHTR\4_2023-06-07.md'


2025-11-14 15:55:24,532 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:24,554 - INFO - Going to convert document batch...
2025-11-14 15:55:24,556 - INFO - Processing document 4_2023-07-05
2025-11-14 15:55:24,604 - INFO - Finished converting document 4_2023-07-05 in 0.09 sec.
2025-11-14 15:55:24,675 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:24,697 - INFO - Going to convert document batch...
2025-11-14 15:55:24,698 - INFO - Processing document 4_2023-07-06


Converted 'data\edgar_documents\CHTR\4_2023-06-16' --> 'data\processed_data\CHTR\4_2023-06-16.md'
Converted 'data\edgar_documents\CHTR\4_2023-07-05' --> 'data\processed_data\CHTR\4_2023-07-05.md'


2025-11-14 15:55:24,744 - INFO - Finished converting document 4_2023-07-06 in 0.08 sec.
2025-11-14 15:55:24,812 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:24,844 - INFO - Going to convert document batch...
2025-11-14 15:55:24,845 - INFO - Processing document 4_2023-07-07
2025-11-14 15:55:24,925 - INFO - Finished converting document 4_2023-07-07 in 0.12 sec.


Converted 'data\edgar_documents\CHTR\4_2023-07-06' --> 'data\processed_data\CHTR\4_2023-07-06.md'


2025-11-14 15:55:25,006 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:25,053 - INFO - Going to convert document batch...
2025-11-14 15:55:25,054 - INFO - Processing document 4_2023-07-25
2025-11-14 15:55:25,148 - INFO - Finished converting document 4_2023-07-25 in 0.14 sec.


Converted 'data\edgar_documents\CHTR\4_2023-07-07' --> 'data\processed_data\CHTR\4_2023-07-07.md'


2025-11-14 15:55:25,226 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:25,244 - INFO - Going to convert document batch...
2025-11-14 15:55:25,245 - INFO - Processing document 4_2023-08-04
2025-11-14 15:55:25,279 - INFO - Finished converting document 4_2023-08-04 in 0.06 sec.
2025-11-14 15:55:25,345 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:25,378 - INFO - Going to convert document batch...
2025-11-14 15:55:25,379 - INFO - Processing document 4_2023-08-07


Converted 'data\edgar_documents\CHTR\4_2023-07-25' --> 'data\processed_data\CHTR\4_2023-07-25.md'
Converted 'data\edgar_documents\CHTR\4_2023-08-04' --> 'data\processed_data\CHTR\4_2023-08-04.md'


2025-11-14 15:55:25,463 - INFO - Finished converting document 4_2023-08-07 in 0.14 sec.
2025-11-14 15:55:25,562 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:25,645 - INFO - Going to convert document batch...
2025-11-14 15:55:25,646 - INFO - Processing document 4_2023-08-17


Converted 'data\edgar_documents\CHTR\4_2023-08-07' --> 'data\processed_data\CHTR\4_2023-08-07.md'


2025-11-14 15:55:25,861 - INFO - Finished converting document 4_2023-08-17 in 0.31 sec.
2025-11-14 15:55:25,991 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:26,006 - INFO - Going to convert document batch...
2025-11-14 15:55:26,007 - INFO - Processing document 4_2023-08-18
2025-11-14 15:55:26,045 - INFO - Finished converting document 4_2023-08-18 in 0.08 sec.
2025-11-14 15:55:26,095 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\4_2023-08-17' --> 'data\processed_data\CHTR\4_2023-08-17.md'
Converted 'data\edgar_documents\CHTR\4_2023-08-18' --> 'data\processed_data\CHTR\4_2023-08-18.md'


2025-11-14 15:55:26,173 - INFO - Going to convert document batch...
2025-11-14 15:55:26,174 - INFO - Processing document 4_2023-08-22
2025-11-14 15:55:26,964 - INFO - Finished converting document 4_2023-08-22 in 0.89 sec.
2025-11-14 15:55:27,139 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:27,212 - INFO - Going to convert document batch...
2025-11-14 15:55:27,214 - INFO - Processing document 4_2023-08-25


Converted 'data\edgar_documents\CHTR\4_2023-08-22' --> 'data\processed_data\CHTR\4_2023-08-22.md'


2025-11-14 15:55:27,399 - INFO - Finished converting document 4_2023-08-25 in 0.27 sec.
2025-11-14 15:55:27,536 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:27,563 - INFO - Going to convert document batch...
2025-11-14 15:55:27,563 - INFO - Processing document 4_2023-08-29
2025-11-14 15:55:27,623 - INFO - Finished converting document 4_2023-08-29 in 0.11 sec.
2025-11-14 15:55:27,701 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\4_2023-08-25' --> 'data\processed_data\CHTR\4_2023-08-25.md'
Converted 'data\edgar_documents\CHTR\4_2023-08-29' --> 'data\processed_data\CHTR\4_2023-08-29.md'


2025-11-14 15:55:27,798 - INFO - Going to convert document batch...
2025-11-14 15:55:27,799 - INFO - Processing document 4_2023-08-30
2025-11-14 15:55:28,010 - INFO - Finished converting document 4_2023-08-30 in 0.34 sec.
2025-11-14 15:55:28,157 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:28,184 - INFO - Going to convert document batch...
2025-11-14 15:55:28,186 - INFO - Processing document 4_2023-09-08
2025-11-14 15:55:28,248 - INFO - Finished converting document 4_2023-09-08 in 0.11 sec.
2025-11-14 15:55:28,305 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:28,323 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CHTR\4_2023-08-30' --> 'data\processed_data\CHTR\4_2023-08-30.md'
Converted 'data\edgar_documents\CHTR\4_2023-09-08' --> 'data\processed_data\CHTR\4_2023-09-08.md'


2025-11-14 15:55:28,325 - INFO - Processing document 4_2023-10-05
2025-11-14 15:55:28,366 - INFO - Finished converting document 4_2023-10-05 in 0.08 sec.
2025-11-14 15:55:28,424 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:28,441 - INFO - Going to convert document batch...
2025-11-14 15:55:28,442 - INFO - Processing document 4_2023-10-10
2025-11-14 15:55:28,478 - INFO - Finished converting document 4_2023-10-10 in 0.06 sec.
2025-11-14 15:55:28,551 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:28,565 - INFO - Going to convert document batch...
2025-11-14 15:55:28,566 - INFO - Processing document 4_2023-10-17
2025-11-14 15:55:28,597 - INFO - Finished converting document 4_2023-10-17 in 0.08 sec.


Converted 'data\edgar_documents\CHTR\4_2023-10-05' --> 'data\processed_data\CHTR\4_2023-10-05.md'
Converted 'data\edgar_documents\CHTR\4_2023-10-10' --> 'data\processed_data\CHTR\4_2023-10-10.md'


2025-11-14 15:55:28,646 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:28,729 - INFO - Going to convert document batch...
2025-11-14 15:55:28,732 - INFO - Processing document 4_2023-11-02


Converted 'data\edgar_documents\CHTR\4_2023-10-17' --> 'data\processed_data\CHTR\4_2023-10-17.md'


2025-11-14 15:55:28,887 - INFO - Finished converting document 4_2023-11-02 in 0.27 sec.
2025-11-14 15:55:28,996 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:29,016 - INFO - Going to convert document batch...
2025-11-14 15:55:29,018 - INFO - Processing document 4_2023-11-06
2025-11-14 15:55:29,060 - INFO - Finished converting document 4_2023-11-06 in 0.08 sec.
2025-11-14 15:55:29,132 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:29,147 - INFO - Going to convert document batch...
2025-11-14 15:55:29,148 - INFO - Processing document 4_2023-11-08
2025-11-14 15:55:29,181 - INFO - Finished converting document 4_2023-11-08 in 0.06 sec.


Converted 'data\edgar_documents\CHTR\4_2023-11-02' --> 'data\processed_data\CHTR\4_2023-11-02.md'
Converted 'data\edgar_documents\CHTR\4_2023-11-06' --> 'data\processed_data\CHTR\4_2023-11-06.md'


2025-11-14 15:55:29,229 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:29,245 - INFO - Going to convert document batch...
2025-11-14 15:55:29,246 - INFO - Processing document 4_2023-11-15
2025-11-14 15:55:29,277 - INFO - Finished converting document 4_2023-11-15 in 0.06 sec.
2025-11-14 15:55:29,321 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:29,354 - INFO - Going to convert document batch...
2025-11-14 15:55:29,355 - INFO - Processing document 4_2023-11-16


Converted 'data\edgar_documents\CHTR\4_2023-11-08' --> 'data\processed_data\CHTR\4_2023-11-08.md'
Converted 'data\edgar_documents\CHTR\4_2023-11-15' --> 'data\processed_data\CHTR\4_2023-11-15.md'


2025-11-14 15:55:29,448 - INFO - Finished converting document 4_2023-11-16 in 0.14 sec.
2025-11-14 15:55:29,528 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:29,573 - INFO - Going to convert document batch...
2025-11-14 15:55:29,574 - INFO - Processing document 4_2023-11-20
2025-11-14 15:55:29,668 - INFO - Finished converting document 4_2023-11-20 in 0.16 sec.


Converted 'data\edgar_documents\CHTR\4_2023-11-16' --> 'data\processed_data\CHTR\4_2023-11-16.md'


2025-11-14 15:55:29,761 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:29,823 - INFO - Going to convert document batch...
2025-11-14 15:55:29,824 - INFO - Processing document 4_2023-11-21
2025-11-14 15:55:29,892 - INFO - Finished converting document 4_2023-11-21 in 0.14 sec.


Converted 'data\edgar_documents\CHTR\4_2023-11-20' --> 'data\processed_data\CHTR\4_2023-11-20.md'
Converted 'data\edgar_documents\CHTR\4_2023-11-21' --> 'data\processed_data\CHTR\4_2023-11-21.md'


2025-11-14 15:55:29,976 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:30,010 - INFO - Going to convert document batch...
2025-11-14 15:55:30,011 - INFO - Processing document 4_2023-12-04
2025-11-14 15:55:30,078 - INFO - Finished converting document 4_2023-12-04 in 0.12 sec.
2025-11-14 15:55:30,155 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:30,182 - INFO - Going to convert document batch...
2025-11-14 15:55:30,183 - INFO - Processing document 4_2023-12-07
2025-11-14 15:55:30,219 - INFO - Finished converting document 4_2023-12-07 in 0.08 sec.
2025-11-14 15:55:30,273 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:30,302 - INFO - Going to convert document batch...
2025-11-14 15:55:30,303 - INFO - Processing document 4_2023-12-15
2025-11-14 15:55:30,340 - INFO - Finished converting document 4_2023-12-15 in 0.09 sec.


Converted 'data\edgar_documents\CHTR\4_2023-12-04' --> 'data\processed_data\CHTR\4_2023-12-04.md'
Converted 'data\edgar_documents\CHTR\4_2023-12-07' --> 'data\processed_data\CHTR\4_2023-12-07.md'


2025-11-14 15:55:30,390 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:30,416 - INFO - Going to convert document batch...
2025-11-14 15:55:30,417 - INFO - Processing document 4_2024-01-05
2025-11-14 15:55:30,464 - INFO - Finished converting document 4_2024-01-05 in 0.09 sec.
2025-11-14 15:55:30,534 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:30,589 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CHTR\4_2023-12-15' --> 'data\processed_data\CHTR\4_2023-12-15.md'
Converted 'data\edgar_documents\CHTR\4_2024-01-05' --> 'data\processed_data\CHTR\4_2024-01-05.md'


2025-11-14 15:55:30,590 - INFO - Processing document 4_2024-01-17
2025-11-14 15:55:30,655 - INFO - Finished converting document 4_2024-01-17 in 0.16 sec.
2025-11-14 15:55:30,759 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:30,774 - INFO - Going to convert document batch...
2025-11-14 15:55:30,775 - INFO - Processing document 4_2024-01-23
2025-11-14 15:55:30,812 - INFO - Finished converting document 4_2024-01-23 in 0.06 sec.
2025-11-14 15:55:30,860 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:30,875 - INFO - Going to convert document batch...
2025-11-14 15:55:30,876 - INFO - Processing document 4_2024-02-06
2025-11-14 15:55:30,911 - INFO - Finished converting document 4_2024-02-06 in 0.06 sec.


Converted 'data\edgar_documents\CHTR\4_2024-01-17' --> 'data\processed_data\CHTR\4_2024-01-17.md'
Converted 'data\edgar_documents\CHTR\4_2024-01-23' --> 'data\processed_data\CHTR\4_2024-01-23.md'
Converted 'data\edgar_documents\CHTR\4_2024-02-06' --> 'data\processed_data\CHTR\4_2024-02-06.md'


2025-11-14 15:55:30,983 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:31,015 - INFO - Going to convert document batch...
2025-11-14 15:55:31,016 - INFO - Processing document 4_2024-02-07
2025-11-14 15:55:31,058 - INFO - Finished converting document 4_2024-02-07 in 0.11 sec.
2025-11-14 15:55:31,108 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:31,129 - INFO - Going to convert document batch...
2025-11-14 15:55:31,131 - INFO - Processing document 4_2024-03-01
2025-11-14 15:55:31,164 - INFO - Finished converting document 4_2024-03-01 in 0.06 sec.
2025-11-14 15:55:31,209 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:31,224 - INFO - Going to convert document batch...
2025-11-14 15:55:31,225 - INFO - Processing document 4_2024-03-06
2025-11-14 15:55:31,259 - INFO - Finished converting document 4_2024-03-06 in 0.06 sec.


Converted 'data\edgar_documents\CHTR\4_2024-02-07' --> 'data\processed_data\CHTR\4_2024-02-07.md'
Converted 'data\edgar_documents\CHTR\4_2024-03-01' --> 'data\processed_data\CHTR\4_2024-03-01.md'
Converted 'data\edgar_documents\CHTR\4_2024-03-06' --> 'data\processed_data\CHTR\4_2024-03-06.md'


2025-11-14 15:55:31,326 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:31,362 - INFO - Going to convert document batch...
2025-11-14 15:55:31,363 - INFO - Processing document 4_2024-04-05
2025-11-14 15:55:31,461 - INFO - Finished converting document 4_2024-04-05 in 0.16 sec.
2025-11-14 15:55:31,540 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:31,554 - INFO - Going to convert document batch...
2025-11-14 15:55:31,555 - INFO - Processing document 4_2024-04-25
2025-11-14 15:55:31,590 - INFO - Finished converting document 4_2024-04-25 in 0.08 sec.
2025-11-14 15:55:31,653 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:31,668 - INFO - Going to convert document batch...
2025-11-14 15:55:31,669 - INFO - Processing document 4_2024-05-06
2025-11-14 15:55:31,705 - INFO - Finished converting document 4_2024-05-06 in 0.08 sec.


Converted 'data\edgar_documents\CHTR\4_2024-04-05' --> 'data\processed_data\CHTR\4_2024-04-05.md'
Converted 'data\edgar_documents\CHTR\4_2024-04-25' --> 'data\processed_data\CHTR\4_2024-04-25.md'


2025-11-14 15:55:31,760 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:31,777 - INFO - Going to convert document batch...
2025-11-14 15:55:31,778 - INFO - Processing document 4_2024-06-10
2025-11-14 15:55:31,818 - INFO - Finished converting document 4_2024-06-10 in 0.08 sec.
2025-11-14 15:55:31,885 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:31,903 - INFO - Going to convert document batch...
2025-11-14 15:55:31,904 - INFO - Processing document 4_2024-06-14


Converted 'data\edgar_documents\CHTR\4_2024-05-06' --> 'data\processed_data\CHTR\4_2024-05-06.md'
Converted 'data\edgar_documents\CHTR\4_2024-06-10' --> 'data\processed_data\CHTR\4_2024-06-10.md'


2025-11-14 15:55:31,947 - INFO - Finished converting document 4_2024-06-14 in 0.08 sec.
2025-11-14 15:55:32,010 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:32,024 - INFO - Going to convert document batch...
2025-11-14 15:55:32,025 - INFO - Processing document 4_2024-06-17
2025-11-14 15:55:32,058 - INFO - Finished converting document 4_2024-06-17 in 0.08 sec.
2025-11-14 15:55:32,104 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:32,121 - INFO - Going to convert document batch...
2025-11-14 15:55:32,122 - INFO - Processing document 4_2024-06-25
2025-11-14 15:55:32,161 - INFO - Finished converting document 4_2024-06-25 in 0.06 sec.


Converted 'data\edgar_documents\CHTR\4_2024-06-14' --> 'data\processed_data\CHTR\4_2024-06-14.md'
Converted 'data\edgar_documents\CHTR\4_2024-06-17' --> 'data\processed_data\CHTR\4_2024-06-17.md'


2025-11-14 15:55:32,225 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:32,246 - INFO - Going to convert document batch...
2025-11-14 15:55:32,247 - INFO - Processing document 4_2024-07-02
2025-11-14 15:55:32,295 - INFO - Finished converting document 4_2024-07-02 in 0.09 sec.


Converted 'data\edgar_documents\CHTR\4_2024-06-25' --> 'data\processed_data\CHTR\4_2024-06-25.md'
Converted 'data\edgar_documents\CHTR\4_2024-07-02' --> 'data\processed_data\CHTR\4_2024-07-02.md'


2025-11-14 15:55:32,416 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:32,431 - INFO - Going to convert document batch...
2025-11-14 15:55:32,433 - INFO - Processing document 4_2024-07-08
2025-11-14 15:55:32,465 - INFO - Finished converting document 4_2024-07-08 in 0.08 sec.
2025-11-14 15:55:32,523 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:32,540 - INFO - Going to convert document batch...
2025-11-14 15:55:32,541 - INFO - Processing document 4_2024-07-16
2025-11-14 15:55:33,147 - INFO - Finished converting document 4_2024-07-16 in 0.64 sec.


Converted 'data\edgar_documents\CHTR\4_2024-07-08' --> 'data\processed_data\CHTR\4_2024-07-08.md'


2025-11-14 15:55:33,203 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:33,222 - INFO - Going to convert document batch...
2025-11-14 15:55:33,223 - INFO - Processing document 4_2024-07-17
2025-11-14 15:55:33,268 - INFO - Finished converting document 4_2024-07-17 in 0.08 sec.
2025-11-14 15:55:33,327 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:33,358 - INFO - Going to convert document batch...
2025-11-14 15:55:33,359 - INFO - Processing document 4_2024-07-26


Converted 'data\edgar_documents\CHTR\4_2024-07-16' --> 'data\processed_data\CHTR\4_2024-07-16.md'
Converted 'data\edgar_documents\CHTR\4_2024-07-17' --> 'data\processed_data\CHTR\4_2024-07-17.md'


2025-11-14 15:55:33,438 - INFO - Finished converting document 4_2024-07-26 in 0.12 sec.
2025-11-14 15:55:33,526 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:33,559 - INFO - Going to convert document batch...
2025-11-14 15:55:33,561 - INFO - Processing document 4_2024-07-30
2025-11-14 15:55:33,635 - INFO - Finished converting document 4_2024-07-30 in 0.14 sec.


Converted 'data\edgar_documents\CHTR\4_2024-07-26' --> 'data\processed_data\CHTR\4_2024-07-26.md'
Converted 'data\edgar_documents\CHTR\4_2024-07-30' --> 'data\processed_data\CHTR\4_2024-07-30.md'


2025-11-14 15:55:33,708 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:33,733 - INFO - Going to convert document batch...
2025-11-14 15:55:33,734 - INFO - Processing document 4_2024-08-07
2025-11-14 15:55:33,773 - INFO - Finished converting document 4_2024-08-07 in 0.08 sec.
2025-11-14 15:55:33,824 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:33,838 - INFO - Going to convert document batch...
2025-11-14 15:55:33,840 - INFO - Processing document 4_2024-08-15
2025-11-14 15:55:33,880 - INFO - Finished converting document 4_2024-08-15 in 0.06 sec.
2025-11-14 15:55:33,935 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:33,959 - INFO - Going to convert document batch...
2025-11-14 15:55:33,961 - INFO - Processing document 4_2024-09-13
2025-11-14 15:55:33,999 - INFO - Finished converting document 4_2024-09-13 in 0.09 sec.


Converted 'data\edgar_documents\CHTR\4_2024-08-07' --> 'data\processed_data\CHTR\4_2024-08-07.md'
Converted 'data\edgar_documents\CHTR\4_2024-08-15' --> 'data\processed_data\CHTR\4_2024-08-15.md'


2025-11-14 15:55:34,050 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:34,064 - INFO - Going to convert document batch...
2025-11-14 15:55:34,065 - INFO - Processing document 4_2024-09-17
2025-11-14 15:55:34,098 - INFO - Finished converting document 4_2024-09-17 in 0.06 sec.
2025-11-14 15:55:34,145 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:55:34,146 - ERROR - Input document 4_2024-09-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:55

Converted 'data\edgar_documents\CHTR\4_2024-09-13' --> 'data\processed_data\CHTR\4_2024-09-13.md'
Converted 'data\edgar_documents\CHTR\4_2024-09-17' --> 'data\processed_data\CHTR\4_2024-09-17.md'
Error processing data\edgar_documents\CHTR\4_2024-09-23: File format not allowed: data\edgar_documents\CHTR\4_2024-09-23


2025-11-14 15:55:34,277 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:34,294 - INFO - Going to convert document batch...
2025-11-14 15:55:34,295 - INFO - Processing document 4_2024-10-15
2025-11-14 15:55:34,333 - INFO - Finished converting document 4_2024-10-15 in 0.08 sec.
2025-11-14 15:55:34,377 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:34,394 - INFO - Going to convert document batch...
2025-11-14 15:55:34,396 - INFO - Processing document 4_2024-10-22


Converted 'data\edgar_documents\CHTR\4_2024-10-09' --> 'data\processed_data\CHTR\4_2024-10-09.md'
Converted 'data\edgar_documents\CHTR\4_2024-10-15' --> 'data\processed_data\CHTR\4_2024-10-15.md'


2025-11-14 15:55:34,476 - INFO - Finished converting document 4_2024-10-22 in 0.11 sec.
2025-11-14 15:55:34,554 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:34,589 - INFO - Going to convert document batch...
2025-11-14 15:55:34,590 - INFO - Processing document 4_2024-11-07
2025-11-14 15:55:34,657 - INFO - Finished converting document 4_2024-11-07 in 0.12 sec.


Converted 'data\edgar_documents\CHTR\4_2024-10-22' --> 'data\processed_data\CHTR\4_2024-10-22.md'
Converted 'data\edgar_documents\CHTR\4_2024-11-07' --> 'data\processed_data\CHTR\4_2024-11-07.md'


2025-11-14 15:55:34,754 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:55:34,755 - ERROR - Input document 4_2024-11-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:55:34,757 - INFO - Going to convert document batch...
2025-11-14 15:55:34,774 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:55:34,775 - ERROR - Input document 4_2024-11-14 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\CHTR\4_2024-11-13: File format not allowed: data\edgar_documents\CHTR\4_2024-11-13
Error processing data\edgar_documents\CHTR\4_2024-11-14: File format not allowed: data\edgar_documents\CHTR\4_2024-11-14
Converted 'data\edgar_documents\CHTR\4_2024-11-18' --> 'data\processed_data\CHTR\4_2024-11-18.md'
Error processing data\edgar_documents\CHTR\4_2024-11-20: File format not allowed: data\edgar_documents\CHTR\4_2024-11-20


2025-11-14 15:55:34,963 - INFO - Going to convert document batch...
2025-11-14 15:55:34,964 - INFO - Processing document 4_2024-12-05
2025-11-14 15:55:35,003 - INFO - Finished converting document 4_2024-12-05 in 0.08 sec.
2025-11-14 15:55:35,055 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:35,069 - INFO - Going to convert document batch...
2025-11-14 15:55:35,070 - INFO - Processing document 4_2024-12-13
2025-11-14 15:55:35,116 - INFO - Finished converting document 4_2024-12-13 in 0.08 sec.
2025-11-14 15:55:35,185 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:35,206 - INFO - Going to convert document batch...
2025-11-14 15:55:35,210 - INFO - Processing document 4_2025-01-08


Converted 'data\edgar_documents\CHTR\4_2024-12-05' --> 'data\processed_data\CHTR\4_2024-12-05.md'
Converted 'data\edgar_documents\CHTR\4_2024-12-13' --> 'data\processed_data\CHTR\4_2024-12-13.md'


2025-11-14 15:55:35,253 - INFO - Finished converting document 4_2025-01-08 in 0.09 sec.
2025-11-14 15:55:35,313 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:35,328 - INFO - Going to convert document batch...
2025-11-14 15:55:35,329 - INFO - Processing document 4_2025-01-14
2025-11-14 15:55:35,371 - INFO - Finished converting document 4_2025-01-14 in 0.08 sec.
2025-11-14 15:55:35,448 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:35,479 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CHTR\4_2025-01-08' --> 'data\processed_data\CHTR\4_2025-01-08.md'
Converted 'data\edgar_documents\CHTR\4_2025-01-14' --> 'data\processed_data\CHTR\4_2025-01-14.md'


2025-11-14 15:55:35,481 - INFO - Processing document 4_2025-01-17
2025-11-14 15:55:35,542 - INFO - Finished converting document 4_2025-01-17 in 0.12 sec.
2025-11-14 15:55:35,595 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:55:35,596 - ERROR - Input document 4_2025-01-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:55:35,598 - INFO - Going to convert document batch...
2025-11-14 15:55:35,630 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55

Converted 'data\edgar_documents\CHTR\4_2025-01-17' --> 'data\processed_data\CHTR\4_2025-01-17.md'
Error processing data\edgar_documents\CHTR\4_2025-01-22: File format not allowed: data\edgar_documents\CHTR\4_2025-01-22
Converted 'data\edgar_documents\CHTR\4_2025-02-07' --> 'data\processed_data\CHTR\4_2025-02-07.md'


2025-11-14 15:55:35,779 - ERROR - Input document 4_2025-02-19 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:55:35,782 - INFO - Going to convert document batch...
2025-11-14 15:55:35,802 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:35,828 - INFO - Going to convert document batch...
2025-11-14 15:55:35,830 - INFO - Processing document 4_2025-03-10
2025-11-14 15:55:35,895 - INFO - Finished converting document 4_2025-03-10 in 0.11 sec.
2025-11-14 15:55:35,971 - INFO - detec

Error processing data\edgar_documents\CHTR\4_2025-02-19: File format not allowed: data\edgar_documents\CHTR\4_2025-02-19
Converted 'data\edgar_documents\CHTR\4_2025-03-10' --> 'data\processed_data\CHTR\4_2025-03-10.md'


2025-11-14 15:55:36,001 - INFO - Going to convert document batch...
2025-11-14 15:55:36,004 - INFO - Processing document 4_2025-03-13
2025-11-14 15:55:36,051 - INFO - Finished converting document 4_2025-03-13 in 0.09 sec.
2025-11-14 15:55:36,110 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:36,127 - INFO - Going to convert document batch...
2025-11-14 15:55:36,128 - INFO - Processing document 4_2025-03-20
2025-11-14 15:55:36,170 - INFO - Finished converting document 4_2025-03-20 in 0.08 sec.
2025-11-14 15:55:36,224 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:36,238 - INFO - Going to convert document batch...
2025-11-14 15:55:36,239 - INFO - Processing document 4_2025-03-26
2025-11-14 15:55:36,274 - INFO - Finished converting document 4_2025-03-26 in 0.05 sec.


Converted 'data\edgar_documents\CHTR\4_2025-03-13' --> 'data\processed_data\CHTR\4_2025-03-13.md'
Converted 'data\edgar_documents\CHTR\4_2025-03-20' --> 'data\processed_data\CHTR\4_2025-03-20.md'


2025-11-14 15:55:36,348 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:36,368 - INFO - Going to convert document batch...
2025-11-14 15:55:36,369 - INFO - Processing document 4_2025-04-01
2025-11-14 15:55:36,437 - INFO - Finished converting document 4_2025-04-01 in 0.11 sec.
2025-11-14 15:55:36,510 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\4_2025-03-26' --> 'data\processed_data\CHTR\4_2025-03-26.md'
Converted 'data\edgar_documents\CHTR\4_2025-04-01' --> 'data\processed_data\CHTR\4_2025-04-01.md'


2025-11-14 15:55:36,541 - INFO - Going to convert document batch...
2025-11-14 15:55:36,543 - INFO - Processing document 4_2025-04-04
2025-11-14 15:55:36,588 - INFO - Finished converting document 4_2025-04-04 in 0.09 sec.
2025-11-14 15:55:36,638 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:36,652 - INFO - Going to convert document batch...
2025-11-14 15:55:36,653 - INFO - Processing document 4_2025-04-11
2025-11-14 15:55:36,691 - INFO - Finished converting document 4_2025-04-11 in 0.06 sec.
2025-11-14 15:55:36,765 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:36,794 - INFO - Going to convert document batch...
2025-11-14 15:55:36,796 - INFO - Processing document 4_2025-04-24


Converted 'data\edgar_documents\CHTR\4_2025-04-04' --> 'data\processed_data\CHTR\4_2025-04-04.md'
Converted 'data\edgar_documents\CHTR\4_2025-04-11' --> 'data\processed_data\CHTR\4_2025-04-11.md'


2025-11-14 15:55:36,848 - INFO - Finished converting document 4_2025-04-24 in 0.11 sec.
2025-11-14 15:55:36,929 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:36,950 - INFO - Going to convert document batch...
2025-11-14 15:55:36,951 - INFO - Processing document 4_2025-05-07
2025-11-14 15:55:37,002 - INFO - Finished converting document 4_2025-05-07 in 0.09 sec.
2025-11-14 15:55:37,056 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:37,080 - INFO - Going to convert document batch...
2025-11-14 15:55:37,082 - INFO - Processing document 4_2025-05-13


Converted 'data\edgar_documents\CHTR\4_2025-04-24' --> 'data\processed_data\CHTR\4_2025-04-24.md'
Converted 'data\edgar_documents\CHTR\4_2025-05-07' --> 'data\processed_data\CHTR\4_2025-05-07.md'


2025-11-14 15:55:37,144 - INFO - Finished converting document 4_2025-05-13 in 0.09 sec.
2025-11-14 15:55:37,202 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:37,222 - INFO - Going to convert document batch...
2025-11-14 15:55:37,223 - INFO - Processing document 4_2025-05-20
2025-11-14 15:55:37,285 - INFO - Finished converting document 4_2025-05-20 in 0.09 sec.
2025-11-14 15:55:37,359 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:37,373 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CHTR\4_2025-05-13' --> 'data\processed_data\CHTR\4_2025-05-13.md'
Converted 'data\edgar_documents\CHTR\4_2025-05-20' --> 'data\processed_data\CHTR\4_2025-05-20.md'


2025-11-14 15:55:37,375 - INFO - Processing document 4_2025-06-10
2025-11-14 15:55:37,434 - INFO - Finished converting document 4_2025-06-10 in 0.09 sec.
2025-11-14 15:55:37,506 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:37,531 - INFO - Going to convert document batch...
2025-11-14 15:55:37,532 - INFO - Processing document 4_2025-06-12
2025-11-14 15:55:37,574 - INFO - Finished converting document 4_2025-06-12 in 0.08 sec.
2025-11-14 15:55:37,655 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:37,716 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CHTR\4_2025-06-10' --> 'data\processed_data\CHTR\4_2025-06-10.md'
Converted 'data\edgar_documents\CHTR\4_2025-06-12' --> 'data\processed_data\CHTR\4_2025-06-12.md'


2025-11-14 15:55:37,718 - INFO - Processing document 4_2025-06-20
2025-11-14 15:55:37,853 - INFO - Finished converting document 4_2025-06-20 in 0.22 sec.
2025-11-14 15:55:37,941 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:38,003 - INFO - Going to convert document batch...
2025-11-14 15:55:38,006 - INFO - Processing document 4_2025-07-03


Converted 'data\edgar_documents\CHTR\4_2025-06-20' --> 'data\processed_data\CHTR\4_2025-06-20.md'


2025-11-14 15:55:38,119 - INFO - Finished converting document 4_2025-07-03 in 0.19 sec.
2025-11-14 15:55:38,204 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:38,221 - INFO - Going to convert document batch...
2025-11-14 15:55:38,222 - INFO - Processing document 4_2025-07-08
2025-11-14 15:55:38,267 - INFO - Finished converting document 4_2025-07-08 in 0.08 sec.
2025-11-14 15:55:38,357 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\4_2025-07-03' --> 'data\processed_data\CHTR\4_2025-07-03.md'
Converted 'data\edgar_documents\CHTR\4_2025-07-08' --> 'data\processed_data\CHTR\4_2025-07-08.md'


2025-11-14 15:55:38,382 - INFO - Going to convert document batch...
2025-11-14 15:55:38,385 - INFO - Processing document 4_2025-07-15
2025-11-14 15:55:38,465 - INFO - Finished converting document 4_2025-07-15 in 0.14 sec.
2025-11-14 15:55:38,537 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:38,570 - INFO - Going to convert document batch...
2025-11-14 15:55:38,572 - INFO - Processing document 4_2025-07-29
2025-11-14 15:55:38,639 - INFO - Finished converting document 4_2025-07-29 in 0.14 sec.


Converted 'data\edgar_documents\CHTR\4_2025-07-15' --> 'data\processed_data\CHTR\4_2025-07-15.md'


2025-11-14 15:55:38,724 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:38,742 - INFO - Going to convert document batch...
2025-11-14 15:55:38,744 - INFO - Processing document 4_2025-07-31
2025-11-14 15:55:38,803 - INFO - Finished converting document 4_2025-07-31 in 0.09 sec.
2025-11-14 15:55:38,862 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:38,888 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CHTR\4_2025-07-29' --> 'data\processed_data\CHTR\4_2025-07-29.md'
Converted 'data\edgar_documents\CHTR\4_2025-07-31' --> 'data\processed_data\CHTR\4_2025-07-31.md'


2025-11-14 15:55:38,890 - INFO - Processing document 4_2025-08-04
2025-11-14 15:55:38,950 - INFO - Finished converting document 4_2025-08-04 in 0.11 sec.
2025-11-14 15:55:39,035 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:39,065 - INFO - Going to convert document batch...
2025-11-14 15:55:39,067 - INFO - Processing document 4_2025-08-05
2025-11-14 15:55:39,130 - INFO - Finished converting document 4_2025-08-05 in 0.12 sec.


Converted 'data\edgar_documents\CHTR\4_2025-08-04' --> 'data\processed_data\CHTR\4_2025-08-04.md'
Converted 'data\edgar_documents\CHTR\4_2025-08-05' --> 'data\processed_data\CHTR\4_2025-08-05.md'


2025-11-14 15:55:39,211 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:39,230 - INFO - Going to convert document batch...
2025-11-14 15:55:39,231 - INFO - Processing document 4_2025-08-07
2025-11-14 15:55:39,307 - INFO - Finished converting document 4_2025-08-07 in 0.12 sec.
2025-11-14 15:55:39,392 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:39,407 - INFO - Going to convert document batch...
2025-11-14 15:55:39,409 - INFO - Processing document 4_2025-08-13
2025-11-14 15:55:39,461 - INFO - Finished converting document 4_2025-08-13 in 0.08 sec.


Converted 'data\edgar_documents\CHTR\4_2025-08-07' --> 'data\processed_data\CHTR\4_2025-08-07.md'
Converted 'data\edgar_documents\CHTR\4_2025-08-13' --> 'data\processed_data\CHTR\4_2025-08-13.md'


2025-11-14 15:55:39,557 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:55:39,560 - ERROR - Input document 4_2025-08-18 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:55:39,562 - INFO - Going to convert document batch...
2025-11-14 15:55:39,592 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:39,619 - INFO - Going to convert document batch...
2025-11-14 15:55:39,621 - INFO - Processing document 4_2025-09-12
2025-11-14 15:55:39,682 - INFO - Fin

Error processing data\edgar_documents\CHTR\4_2025-08-18: File format not allowed: data\edgar_documents\CHTR\4_2025-08-18
Converted 'data\edgar_documents\CHTR\4_2025-09-12' --> 'data\processed_data\CHTR\4_2025-09-12.md'


2025-11-14 15:55:39,808 - INFO - Going to convert document batch...
2025-11-14 15:55:39,811 - INFO - Processing document 4_2025-09-23
2025-11-14 15:55:39,887 - INFO - Finished converting document 4_2025-09-23 in 0.16 sec.
2025-11-14 15:55:39,958 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:39,983 - INFO - Going to convert document batch...
2025-11-14 15:55:39,985 - INFO - Processing document 4_2025-10-14
2025-11-14 15:55:40,027 - INFO - Finished converting document 4_2025-10-14 in 0.11 sec.


Converted 'data\edgar_documents\CHTR\4_2025-09-23' --> 'data\processed_data\CHTR\4_2025-09-23.md'
Converted 'data\edgar_documents\CHTR\4_2025-10-14' --> 'data\processed_data\CHTR\4_2025-10-14.md'


2025-11-14 15:55:40,106 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:40,130 - INFO - Going to convert document batch...
2025-11-14 15:55:40,132 - INFO - Processing document 4_2025-11-07
2025-11-14 15:55:40,188 - INFO - Finished converting document 4_2025-11-07 in 0.12 sec.
2025-11-14 15:55:40,306 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:40,333 - INFO - Going to convert document batch...
2025-11-14 15:55:40,335 - INFO - Processing document 8-K_2023-01-27
2025-11-14 15:55:40,374 - INFO - Finished converting document 8-K_2023-01-27 in 0.09 sec.
2025-11-14 15:55:40,451 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\4_2025-11-07' --> 'data\processed_data\CHTR\4_2025-11-07.md'
Converted 'data\edgar_documents\CHTR\8-K_2023-01-27' --> 'data\processed_data\CHTR\8-K_2023-01-27.md'


2025-11-14 15:55:40,521 - INFO - Going to convert document batch...
2025-11-14 15:55:40,522 - INFO - Processing document 8-K_2023-02-16
2025-11-14 15:55:40,636 - INFO - Finished converting document 8-K_2023-02-16 in 0.23 sec.
2025-11-14 15:55:40,767 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:40,848 - INFO - Going to convert document batch...
2025-11-14 15:55:40,850 - INFO - Processing document 8-K_2023-02-24


Converted 'data\edgar_documents\CHTR\8-K_2023-02-16' --> 'data\processed_data\CHTR\8-K_2023-02-16.md'


2025-11-14 15:55:40,945 - INFO - Finished converting document 8-K_2023-02-24 in 0.22 sec.
2025-11-14 15:55:41,031 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:41,086 - INFO - Going to convert document batch...
2025-11-14 15:55:41,088 - INFO - Processing document 8-K_2023-03-29


Converted 'data\edgar_documents\CHTR\8-K_2023-02-24' --> 'data\processed_data\CHTR\8-K_2023-02-24.md'


2025-11-14 15:55:41,636 - INFO - Finished converting document 8-K_2023-03-29 in 0.64 sec.
2025-11-14 15:55:41,725 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:41,767 - INFO - Going to convert document batch...
2025-11-14 15:55:41,768 - INFO - Processing document 8-K_2023-04-06
2025-11-14 15:55:41,830 - INFO - Finished converting document 8-K_2023-04-06 in 0.14 sec.
2025-11-14 15:55:41,902 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\8-K_2023-03-29' --> 'data\processed_data\CHTR\8-K_2023-03-29.md'
Converted 'data\edgar_documents\CHTR\8-K_2023-04-06' --> 'data\processed_data\CHTR\8-K_2023-04-06.md'


2025-11-14 15:55:41,933 - INFO - Going to convert document batch...
2025-11-14 15:55:41,935 - INFO - Processing document 8-K_2023-04-21
2025-11-14 15:55:41,991 - INFO - Finished converting document 8-K_2023-04-21 in 0.14 sec.
2025-11-14 15:55:42,070 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:42,116 - INFO - Going to convert document batch...
2025-11-14 15:55:42,118 - INFO - Processing document 8-K_2023-04-28
2025-11-14 15:55:42,161 - INFO - Finished converting document 8-K_2023-04-28 in 0.12 sec.


Converted 'data\edgar_documents\CHTR\8-K_2023-04-21' --> 'data\processed_data\CHTR\8-K_2023-04-21.md'
Converted 'data\edgar_documents\CHTR\8-K_2023-04-28' --> 'data\processed_data\CHTR\8-K_2023-04-28.md'


2025-11-14 15:55:42,217 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:42,273 - INFO - Going to convert document batch...
2025-11-14 15:55:42,274 - INFO - Processing document 8-K_2023-05-01
2025-11-14 15:55:42,343 - INFO - Finished converting document 8-K_2023-05-01 in 0.16 sec.
2025-11-14 15:55:42,414 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:42,444 - INFO - Going to convert document batch...
2025-11-14 15:55:42,445 - INFO - Processing document 8-K_2023-06-29
2025-11-14 15:55:42,480 - INFO - Finished converting document 8-K_2023-06-29 in 0.11 sec.
2025-11-14 15:55:42,548 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\8-K_2023-05-01' --> 'data\processed_data\CHTR\8-K_2023-05-01.md'
Converted 'data\edgar_documents\CHTR\8-K_2023-06-29' --> 'data\processed_data\CHTR\8-K_2023-06-29.md'


2025-11-14 15:55:42,580 - INFO - Going to convert document batch...
2025-11-14 15:55:42,582 - INFO - Processing document 8-K_2023-07-28
2025-11-14 15:55:42,619 - INFO - Finished converting document 8-K_2023-07-28 in 0.11 sec.
2025-11-14 15:55:42,670 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:42,695 - INFO - Going to convert document batch...
2025-11-14 15:55:42,696 - INFO - Processing document 8-K_2023-08-21
2025-11-14 15:55:42,729 - INFO - Finished converting document 8-K_2023-08-21 in 0.06 sec.
2025-11-14 15:55:42,795 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\8-K_2023-07-28' --> 'data\processed_data\CHTR\8-K_2023-07-28.md'
Converted 'data\edgar_documents\CHTR\8-K_2023-08-21' --> 'data\processed_data\CHTR\8-K_2023-08-21.md'


2025-11-14 15:55:42,847 - INFO - Going to convert document batch...
2025-11-14 15:55:42,850 - INFO - Processing document 8-K_2023-09-01
2025-11-14 15:55:42,920 - INFO - Finished converting document 8-K_2023-09-01 in 0.17 sec.
2025-11-14 15:55:42,987 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:43,027 - INFO - Going to convert document batch...
2025-11-14 15:55:43,028 - INFO - Processing document 8-K_2023-09-11
2025-11-14 15:55:43,067 - INFO - Finished converting document 8-K_2023-09-11 in 0.11 sec.
2025-11-14 15:55:43,148 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\8-K_2023-09-01' --> 'data\processed_data\CHTR\8-K_2023-09-01.md'
Converted 'data\edgar_documents\CHTR\8-K_2023-09-11' --> 'data\processed_data\CHTR\8-K_2023-09-11.md'


2025-11-14 15:55:43,181 - INFO - Going to convert document batch...
2025-11-14 15:55:43,182 - INFO - Processing document 8-K_2023-10-25
2025-11-14 15:55:43,226 - INFO - Finished converting document 8-K_2023-10-25 in 0.12 sec.
2025-11-14 15:55:43,296 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:43,322 - INFO - Going to convert document batch...
2025-11-14 15:55:43,323 - INFO - Processing document 8-K_2023-10-27
2025-11-14 15:55:43,360 - INFO - Finished converting document 8-K_2023-10-27 in 0.11 sec.
2025-11-14 15:55:43,425 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\8-K_2023-10-25' --> 'data\processed_data\CHTR\8-K_2023-10-25.md'
Converted 'data\edgar_documents\CHTR\8-K_2023-10-27' --> 'data\processed_data\CHTR\8-K_2023-10-27.md'


2025-11-14 15:55:43,471 - INFO - Going to convert document batch...
2025-11-14 15:55:43,472 - INFO - Processing document 8-K_2023-11-13
2025-11-14 15:55:43,574 - INFO - Finished converting document 8-K_2023-11-13 in 0.19 sec.
2025-11-14 15:55:43,669 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:43,720 - INFO - Going to convert document batch...
2025-11-14 15:55:43,721 - INFO - Processing document 8-K_2023-12-13


Converted 'data\edgar_documents\CHTR\8-K_2023-11-13' --> 'data\processed_data\CHTR\8-K_2023-11-13.md'


2025-11-14 15:55:43,822 - INFO - Finished converting document 8-K_2023-12-13 in 0.17 sec.
2025-11-14 15:55:43,919 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:43,963 - INFO - Going to convert document batch...
2025-11-14 15:55:43,966 - INFO - Processing document 8-K_2024-02-02
2025-11-14 15:55:44,025 - INFO - Finished converting document 8-K_2024-02-02 in 0.14 sec.


Converted 'data\edgar_documents\CHTR\8-K_2023-12-13' --> 'data\processed_data\CHTR\8-K_2023-12-13.md'


2025-11-14 15:55:44,133 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:44,165 - INFO - Going to convert document batch...
2025-11-14 15:55:44,166 - INFO - Processing document 8-K_2024-02-05
2025-11-14 15:55:44,208 - INFO - Finished converting document 8-K_2024-02-05 in 0.12 sec.
2025-11-14 15:55:44,277 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\8-K_2024-02-02' --> 'data\processed_data\CHTR\8-K_2024-02-02.md'
Converted 'data\edgar_documents\CHTR\8-K_2024-02-05' --> 'data\processed_data\CHTR\8-K_2024-02-05.md'


2025-11-14 15:55:44,361 - INFO - Going to convert document batch...
2025-11-14 15:55:44,364 - INFO - Processing document 8-K_2024-04-26
2025-11-14 15:55:44,482 - INFO - Finished converting document 8-K_2024-04-26 in 0.25 sec.
2025-11-14 15:55:44,551 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:44,576 - INFO - Going to convert document batch...
2025-11-14 15:55:44,577 - INFO - Processing document 8-K_2024-05-09
2025-11-14 15:55:44,643 - INFO - Finished converting document 8-K_2024-05-09 in 0.11 sec.


Converted 'data\edgar_documents\CHTR\8-K_2024-04-26' --> 'data\processed_data\CHTR\8-K_2024-04-26.md'
Converted 'data\edgar_documents\CHTR\8-K_2024-05-09' --> 'data\processed_data\CHTR\8-K_2024-05-09.md'


2025-11-14 15:55:44,755 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:44,807 - INFO - Going to convert document batch...
2025-11-14 15:55:44,809 - INFO - Processing document 8-K_2024-05-10
2025-11-14 15:55:44,871 - INFO - Finished converting document 8-K_2024-05-10 in 0.17 sec.
2025-11-14 15:55:44,926 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:44,959 - INFO - Going to convert document batch...
2025-11-14 15:55:44,960 - INFO - Processing document 8-K_2024-05-14
2025-11-14 15:55:45,076 - INFO - Finished converting document 8-K_2024-05-14 in 0.17 sec.


Converted 'data\edgar_documents\CHTR\8-K_2024-05-10' --> 'data\processed_data\CHTR\8-K_2024-05-10.md'


2025-11-14 15:55:45,188 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:45,222 - INFO - Going to convert document batch...
2025-11-14 15:55:45,223 - INFO - Processing document 8-K_2024-07-26
2025-11-14 15:55:45,282 - INFO - Finished converting document 8-K_2024-07-26 in 0.11 sec.
2025-11-14 15:55:45,362 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\8-K_2024-05-14' --> 'data\processed_data\CHTR\8-K_2024-05-14.md'
Converted 'data\edgar_documents\CHTR\8-K_2024-07-26' --> 'data\processed_data\CHTR\8-K_2024-07-26.md'


2025-11-14 15:55:45,399 - INFO - Going to convert document batch...
2025-11-14 15:55:45,400 - INFO - Processing document 8-K_2024-11-01
2025-11-14 15:55:45,440 - INFO - Finished converting document 8-K_2024-11-01 in 0.12 sec.
2025-11-14 15:55:45,499 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:55:45,500 - ERROR - Input document 8-K_2024-11-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:55:45,501 - INFO - Going to convert docu

Converted 'data\edgar_documents\CHTR\8-K_2024-11-01' --> 'data\processed_data\CHTR\8-K_2024-11-01.md'
Error processing data\edgar_documents\CHTR\8-K_2024-11-13: File format not allowed: data\edgar_documents\CHTR\8-K_2024-11-13


2025-11-14 15:55:45,667 - INFO - Finished converting document 8-K_2024-12-09 in 0.17 sec.
2025-11-14 15:55:45,774 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:55:45,775 - ERROR - Input document 8-K_2024-12-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:55:45,776 - INFO - Going to convert document batch...
2025-11-14 15:55:45,802 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:45,829 - INFO - Going to 

Converted 'data\edgar_documents\CHTR\8-K_2024-12-09' --> 'data\processed_data\CHTR\8-K_2024-12-09.md'
Error processing data\edgar_documents\CHTR\8-K_2024-12-13: File format not allowed: data\edgar_documents\CHTR\8-K_2024-12-13
Converted 'data\edgar_documents\CHTR\8-K_2025-01-31' --> 'data\processed_data\CHTR\8-K_2025-01-31.md'


2025-11-14 15:55:45,932 - ERROR - Input document 8-K_2025-02-19 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:55:45,934 - INFO - Going to convert document batch...
2025-11-14 15:55:45,947 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:45,984 - INFO - Going to convert document batch...
2025-11-14 15:55:45,985 - INFO - Processing document 8-K_2025-02-27
2025-11-14 15:55:46,041 - INFO - Finished converting document 8-K_2025-02-27 in 0.11 sec.
2025-11-14 15:55:46,114 - INFO -

Error processing data\edgar_documents\CHTR\8-K_2025-02-19: File format not allowed: data\edgar_documents\CHTR\8-K_2025-02-19
Converted 'data\edgar_documents\CHTR\8-K_2025-02-27' --> 'data\processed_data\CHTR\8-K_2025-02-27.md'


2025-11-14 15:55:46,158 - INFO - Going to convert document batch...
2025-11-14 15:55:46,159 - INFO - Processing document 8-K_2025-04-25
2025-11-14 15:55:46,238 - INFO - Finished converting document 8-K_2025-04-25 in 0.17 sec.
2025-11-14 15:55:46,333 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:55:46,335 - ERROR - Input document 8-K_2025-05-16 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:55:46,336 - INFO - Going to convert docu

Converted 'data\edgar_documents\CHTR\8-K_2025-04-25' --> 'data\processed_data\CHTR\8-K_2025-04-25.md'
Error processing data\edgar_documents\CHTR\8-K_2025-05-16: File format not allowed: data\edgar_documents\CHTR\8-K_2025-05-16
Error processing data\edgar_documents\CHTR\8-K_2025-05-19: File format not allowed: data\edgar_documents\CHTR\8-K_2025-05-19
Error processing data\edgar_documents\CHTR\8-K_2025-07-21: File format not allowed: data\edgar_documents\CHTR\8-K_2025-07-21


2025-11-14 15:55:46,449 - INFO - Processing document 8-K_2025-07-25
2025-11-14 15:55:46,487 - INFO - Finished converting document 8-K_2025-07-25 in 0.08 sec.
2025-11-14 15:55:46,532 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:46,570 - INFO - Going to convert document batch...
2025-11-14 15:55:46,571 - INFO - Processing document 8-K_2025-08-01
2025-11-14 15:55:46,642 - INFO - Finished converting document 8-K_2025-08-01 in 0.14 sec.


Converted 'data\edgar_documents\CHTR\8-K_2025-07-25' --> 'data\processed_data\CHTR\8-K_2025-07-25.md'
Converted 'data\edgar_documents\CHTR\8-K_2025-08-01' --> 'data\processed_data\CHTR\8-K_2025-08-01.md'


2025-11-14 15:55:46,719 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:46,743 - INFO - Going to convert document batch...
2025-11-14 15:55:46,745 - INFO - Processing document 8-K_2025-08-04
2025-11-14 15:55:46,799 - INFO - Finished converting document 8-K_2025-08-04 in 0.11 sec.
2025-11-14 15:55:46,853 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:46,877 - INFO - Going to convert document batch...
2025-11-14 15:55:46,878 - INFO - Processing document 8-K_2025-08-05
2025-11-14 15:55:46,912 - INFO - Finished converting document 8-K_2025-08-05 in 0.08 sec.
2025-11-14 15:55:46,971 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CHTR\8-K_2025-08-04' --> 'data\processed_data\CHTR\8-K_2025-08-04.md'
Converted 'data\edgar_documents\CHTR\8-K_2025-08-05' --> 'data\processed_data\CHTR\8-K_2025-08-05.md'


2025-11-14 15:55:47,026 - INFO - Going to convert document batch...
2025-11-14 15:55:47,027 - INFO - Processing document 8-K_2025-08-18
2025-11-14 15:55:47,136 - INFO - Finished converting document 8-K_2025-08-18 in 0.22 sec.
2025-11-14 15:55:47,246 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:47,313 - INFO - Going to convert document batch...
2025-11-14 15:55:47,315 - INFO - Processing document 8-K_2025-08-20


Converted 'data\edgar_documents\CHTR\8-K_2025-08-18' --> 'data\processed_data\CHTR\8-K_2025-08-18.md'


2025-11-14 15:55:47,437 - INFO - Finished converting document 8-K_2025-08-20 in 0.23 sec.
2025-11-14 15:55:47,550 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:47,609 - INFO - Going to convert document batch...
2025-11-14 15:55:47,611 - INFO - Processing document 8-K_2025-09-02


Converted 'data\edgar_documents\CHTR\8-K_2025-08-20' --> 'data\processed_data\CHTR\8-K_2025-08-20.md'


2025-11-14 15:55:47,757 - INFO - Finished converting document 8-K_2025-09-02 in 0.25 sec.
2025-11-14 15:55:47,875 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:55:47,912 - INFO - Going to convert document batch...
2025-11-14 15:55:47,913 - INFO - Processing document 8-K_2025-10-31
2025-11-14 15:55:47,951 - INFO - Finished converting document 8-K_2025-10-31 in 0.11 sec.


Converted 'data\edgar_documents\CHTR\8-K_2025-09-02' --> 'data\processed_data\CHTR\8-K_2025-09-02.md'
Converted 'data\edgar_documents\CHTR\8-K_2025-10-31' --> 'data\processed_data\CHTR\8-K_2025-10-31.md'


2025-11-14 15:55:48,064 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:55:48,065 - ERROR - Input document DEF-14A_2023-03-16 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:55:48,069 - INFO - Going to convert document batch...
2025-11-14 15:55:48,150 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:55:48,151 - ERROR - Input document DEF-14A_2024-03-14 with format No

Error processing data\edgar_documents\CHTR\DEF-14A_2023-03-16: File format not allowed: data\edgar_documents\CHTR\DEF-14A_2023-03-16
Error processing data\edgar_documents\CHTR\DEF-14A_2024-03-14: File format not allowed: data\edgar_documents\CHTR\DEF-14A_2024-03-14


2025-11-14 15:55:48,252 - ERROR - Input document DEF-14A_2025-03-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:55:48,254 - INFO - Going to convert document batch...
2025-11-14 15:55:48,348 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Error processing data\edgar_documents\CHTR\DEF-14A_2025-03-13: File format not allowed: data\edgar_documents\CHTR\DEF-14A_2025-03-13
Processed 152 new files. Errors: 16
Found 111 files to process in data\edgar_documents\CL


2025-11-14 15:55:50,782 - INFO - Going to convert document batch...
2025-11-14 15:55:50,785 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:55:50,785 - INFO - Processing document 10-K_2023-02-16
2025-11-14 15:55:56,952 - INFO - Finished converting document 10-K_2023-02-16 in 8.69 sec.
2025-11-14 15:55:58,498 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\10-K_2023-02-16' --> 'data\processed_data\CL\10-K_2023-02-16.md'


2025-11-14 15:56:00,210 - INFO - Going to convert document batch...
2025-11-14 15:56:00,212 - INFO - Processing document 10-K_2024-02-15
2025-11-14 15:56:06,165 - INFO - Finished converting document 10-K_2024-02-15 in 7.75 sec.
2025-11-14 15:56:07,422 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\10-K_2024-02-15' --> 'data\processed_data\CL\10-K_2024-02-15.md'


2025-11-14 15:56:08,975 - INFO - Going to convert document batch...
2025-11-14 15:56:08,977 - INFO - Processing document 10-K_2025-02-13
2025-11-14 15:56:14,230 - INFO - Finished converting document 10-K_2025-02-13 in 6.86 sec.
2025-11-14 15:56:15,070 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\10-K_2025-02-13' --> 'data\processed_data\CL\10-K_2025-02-13.md'


2025-11-14 15:56:15,802 - INFO - Going to convert document batch...
2025-11-14 15:56:15,803 - INFO - Processing document 10-Q_2023-04-28
2025-11-14 15:56:16,346 - INFO - Finished converting document 10-Q_2023-04-28 in 1.31 sec.
2025-11-14 15:56:16,675 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\10-Q_2023-04-28' --> 'data\processed_data\CL\10-Q_2023-04-28.md'


2025-11-14 15:56:17,094 - INFO - Going to convert document batch...
2025-11-14 15:56:17,095 - INFO - Processing document 10-Q_2023-07-28
2025-11-14 15:56:18,234 - INFO - Finished converting document 10-Q_2023-07-28 in 1.61 sec.
2025-11-14 15:56:18,688 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\10-Q_2023-07-28' --> 'data\processed_data\CL\10-Q_2023-07-28.md'


2025-11-14 15:56:19,140 - INFO - Going to convert document batch...
2025-11-14 15:56:19,140 - INFO - Processing document 10-Q_2023-10-27
2025-11-14 15:56:20,007 - INFO - Finished converting document 10-Q_2023-10-27 in 1.34 sec.
2025-11-14 15:56:20,457 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\10-Q_2023-10-27' --> 'data\processed_data\CL\10-Q_2023-10-27.md'


2025-11-14 15:56:21,275 - INFO - Going to convert document batch...
2025-11-14 15:56:21,276 - INFO - Processing document 10-Q_2024-04-26
2025-11-14 15:56:22,648 - INFO - Finished converting document 10-Q_2024-04-26 in 2.22 sec.
2025-11-14 15:56:23,361 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\10-Q_2024-04-26' --> 'data\processed_data\CL\10-Q_2024-04-26.md'


2025-11-14 15:56:24,399 - INFO - Going to convert document batch...
2025-11-14 15:56:24,401 - INFO - Processing document 10-Q_2024-07-26
2025-11-14 15:56:26,449 - INFO - Finished converting document 10-Q_2024-07-26 in 3.14 sec.
2025-11-14 15:56:27,197 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\10-Q_2024-07-26' --> 'data\processed_data\CL\10-Q_2024-07-26.md'


2025-11-14 15:56:28,862 - INFO - Going to convert document batch...
2025-11-14 15:56:28,864 - INFO - Processing document 10-Q_2024-10-25
2025-11-14 15:56:30,715 - INFO - Finished converting document 10-Q_2024-10-25 in 3.58 sec.
2025-11-14 15:56:31,682 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\10-Q_2024-10-25' --> 'data\processed_data\CL\10-Q_2024-10-25.md'


2025-11-14 15:56:32,394 - INFO - Going to convert document batch...
2025-11-14 15:56:32,396 - INFO - Processing document 10-Q_2025-04-25
2025-11-14 15:56:33,645 - INFO - Finished converting document 10-Q_2025-04-25 in 2.02 sec.
2025-11-14 15:56:34,263 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\10-Q_2025-04-25' --> 'data\processed_data\CL\10-Q_2025-04-25.md'


2025-11-14 15:56:35,850 - INFO - Going to convert document batch...
2025-11-14 15:56:35,851 - INFO - Processing document 10-Q_2025-08-01
2025-11-14 15:56:37,428 - INFO - Finished converting document 10-Q_2025-08-01 in 3.23 sec.
2025-11-14 15:56:38,210 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\10-Q_2025-08-01' --> 'data\processed_data\CL\10-Q_2025-08-01.md'


2025-11-14 15:56:39,328 - INFO - Going to convert document batch...
2025-11-14 15:56:39,330 - INFO - Processing document 10-Q_2025-10-31
2025-11-14 15:56:42,062 - INFO - Finished converting document 10-Q_2025-10-31 in 3.92 sec.
2025-11-14 15:56:43,027 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:43,057 - INFO - Going to convert document batch...
2025-11-14 15:56:43,058 - INFO - Processing document 4_2023-01-05
2025-11-14 15:56:43,118 - INFO - Finished converting document 4_2023-01-05 in 0.09 sec.


Converted 'data\edgar_documents\CL\10-Q_2025-10-31' --> 'data\processed_data\CL\10-Q_2025-10-31.md'
Converted 'data\edgar_documents\CL\4_2023-01-05' --> 'data\processed_data\CL\4_2023-01-05.md'


2025-11-14 15:56:43,218 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:43,250 - INFO - Going to convert document batch...
2025-11-14 15:56:43,252 - INFO - Processing document 4_2023-02-03
2025-11-14 15:56:43,326 - INFO - Finished converting document 4_2023-02-03 in 0.14 sec.
2025-11-14 15:56:43,415 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:43,445 - INFO - Going to convert document batch...
2025-11-14 15:56:43,446 - INFO - Processing document 4_2023-02-17
2025-11-14 15:56:43,489 - INFO - Finished converting document 4_2023-02-17 in 0.09 sec.
2025-11-14 15:56:43,552 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:43,572 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CL\4_2023-02-03' --> 'data\processed_data\CL\4_2023-02-03.md'
Converted 'data\edgar_documents\CL\4_2023-02-17' --> 'data\processed_data\CL\4_2023-02-17.md'


2025-11-14 15:56:43,575 - INFO - Processing document 4_2023-02-21
2025-11-14 15:56:43,646 - INFO - Finished converting document 4_2023-02-21 in 0.12 sec.
2025-11-14 15:56:43,714 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:43,734 - INFO - Going to convert document batch...
2025-11-14 15:56:43,735 - INFO - Processing document 4_2023-02-23
2025-11-14 15:56:43,793 - INFO - Finished converting document 4_2023-02-23 in 0.12 sec.


Converted 'data\edgar_documents\CL\4_2023-02-21' --> 'data\processed_data\CL\4_2023-02-21.md'
Converted 'data\edgar_documents\CL\4_2023-02-23' --> 'data\processed_data\CL\4_2023-02-23.md'


2025-11-14 15:56:43,897 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:56:43,899 - ERROR - Input document 4_2023-02-27 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:56:43,902 - INFO - Going to convert document batch...
2025-11-14 15:56:43,925 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:43,952 - INFO - Going to convert document batch...
2025-11-14 15:56:43,953 - INFO - Processing document 4_2023-03-01


Error processing data\edgar_documents\CL\4_2023-02-27: File format not allowed: data\edgar_documents\CL\4_2023-02-27
Converted 'data\edgar_documents\CL\4_2023-03-01' --> 'data\processed_data\CL\4_2023-03-01.md'


2025-11-14 15:56:44,098 - INFO - Going to convert document batch...
2025-11-14 15:56:44,100 - INFO - Processing document 4_2023-03-15
2025-11-14 15:56:44,132 - INFO - Finished converting document 4_2023-03-15 in 0.08 sec.
2025-11-14 15:56:44,196 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:44,220 - INFO - Going to convert document batch...
2025-11-14 15:56:44,222 - INFO - Processing document 4_2023-04-05
2025-11-14 15:56:44,276 - INFO - Finished converting document 4_2023-04-05 in 0.12 sec.


Converted 'data\edgar_documents\CL\4_2023-03-15' --> 'data\processed_data\CL\4_2023-03-15.md'


2025-11-14 15:56:44,382 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:44,421 - INFO - Going to convert document batch...
2025-11-14 15:56:44,422 - INFO - Processing document 4_2023-05-05
2025-11-14 15:56:44,486 - INFO - Finished converting document 4_2023-05-05 in 0.14 sec.


Converted 'data\edgar_documents\CL\4_2023-04-05' --> 'data\processed_data\CL\4_2023-04-05.md'
Converted 'data\edgar_documents\CL\4_2023-05-05' --> 'data\processed_data\CL\4_2023-05-05.md'


2025-11-14 15:56:44,588 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:44,616 - INFO - Going to convert document batch...
2025-11-14 15:56:44,617 - INFO - Processing document 4_2023-05-10
2025-11-14 15:56:44,661 - INFO - Finished converting document 4_2023-05-10 in 0.09 sec.
2025-11-14 15:56:44,758 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:44,793 - INFO - Going to convert document batch...
2025-11-14 15:56:44,794 - INFO - Processing document 4_2023-05-12
2025-11-14 15:56:44,868 - INFO - Finished converting document 4_2023-05-12 in 0.12 sec.


Converted 'data\edgar_documents\CL\4_2023-05-10' --> 'data\processed_data\CL\4_2023-05-10.md'


2025-11-14 15:56:44,986 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:45,029 - INFO - Going to convert document batch...
2025-11-14 15:56:45,031 - INFO - Processing document 4_2023-05-17
2025-11-14 15:56:45,088 - INFO - Finished converting document 4_2023-05-17 in 0.14 sec.


Converted 'data\edgar_documents\CL\4_2023-05-12' --> 'data\processed_data\CL\4_2023-05-12.md'


2025-11-14 15:56:45,187 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:45,209 - INFO - Going to convert document batch...
2025-11-14 15:56:45,212 - INFO - Processing document 4_2023-05-23
2025-11-14 15:56:45,262 - INFO - Finished converting document 4_2023-05-23 in 0.11 sec.


Converted 'data\edgar_documents\CL\4_2023-05-17' --> 'data\processed_data\CL\4_2023-05-17.md'
Converted 'data\edgar_documents\CL\4_2023-05-23' --> 'data\processed_data\CL\4_2023-05-23.md'


2025-11-14 15:56:45,364 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:45,379 - INFO - Going to convert document batch...
2025-11-14 15:56:45,380 - INFO - Processing document 4_2023-07-06
2025-11-14 15:56:45,420 - INFO - Finished converting document 4_2023-07-06 in 0.09 sec.
2025-11-14 15:56:45,520 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:45,539 - INFO - Going to convert document batch...
2025-11-14 15:56:45,540 - INFO - Processing document 4_2023-08-04
2025-11-14 15:56:45,581 - INFO - Finished converting document 4_2023-08-04 in 0.09 sec.
2025-11-14 15:56:45,636 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:45,655 - INFO - Going to convert document batch...
2025-11-14 15:56:45,656 - INFO - Processing document 4_2023-09-01


Converted 'data\edgar_documents\CL\4_2023-07-06' --> 'data\processed_data\CL\4_2023-07-06.md'
Converted 'data\edgar_documents\CL\4_2023-08-04' --> 'data\processed_data\CL\4_2023-08-04.md'


2025-11-14 15:56:45,696 - INFO - Finished converting document 4_2023-09-01 in 0.06 sec.
2025-11-14 15:56:45,763 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:45,779 - INFO - Going to convert document batch...
2025-11-14 15:56:45,780 - INFO - Processing document 4_2023-09-12
2025-11-14 15:56:45,814 - INFO - Finished converting document 4_2023-09-12 in 0.08 sec.
2025-11-14 15:56:45,868 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:45,887 - INFO - Going to convert document batch...
2025-11-14 15:56:45,889 - INFO - Processing document 4_2023-09-13
2025-11-14 15:56:45,936 - INFO - Finished converting document 4_2023-09-13 in 0.09 sec.


Converted 'data\edgar_documents\CL\4_2023-09-01' --> 'data\processed_data\CL\4_2023-09-01.md'
Converted 'data\edgar_documents\CL\4_2023-09-12' --> 'data\processed_data\CL\4_2023-09-12.md'


2025-11-14 15:56:45,996 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:46,013 - INFO - Going to convert document batch...
2025-11-14 15:56:46,014 - INFO - Processing document 4_2023-09-15
2025-11-14 15:56:46,057 - INFO - Finished converting document 4_2023-09-15 in 0.09 sec.
2025-11-14 15:56:46,122 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:46,149 - INFO - Going to convert document batch...
2025-11-14 15:56:46,150 - INFO - Processing document 4_2023-10-04


Converted 'data\edgar_documents\CL\4_2023-09-13' --> 'data\processed_data\CL\4_2023-09-13.md'
Converted 'data\edgar_documents\CL\4_2023-09-15' --> 'data\processed_data\CL\4_2023-09-15.md'


2025-11-14 15:56:46,203 - INFO - Finished converting document 4_2023-10-04 in 0.11 sec.
2025-11-14 15:56:46,265 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:46,281 - INFO - Going to convert document batch...
2025-11-14 15:56:46,283 - INFO - Processing document 4_2023-10-17
2025-11-14 15:56:46,319 - INFO - Finished converting document 4_2023-10-17 in 0.08 sec.
2025-11-14 15:56:46,400 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\4_2023-10-04' --> 'data\processed_data\CL\4_2023-10-04.md'
Converted 'data\edgar_documents\CL\4_2023-10-17' --> 'data\processed_data\CL\4_2023-10-17.md'


2025-11-14 15:56:46,426 - INFO - Going to convert document batch...
2025-11-14 15:56:46,428 - INFO - Processing document 4_2023-11-06
2025-11-14 15:56:46,468 - INFO - Finished converting document 4_2023-11-06 in 0.09 sec.
2025-11-14 15:56:46,526 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:46,556 - INFO - Going to convert document batch...
2025-11-14 15:56:46,557 - INFO - Processing document 4_2023-11-07
2025-11-14 15:56:46,605 - INFO - Finished converting document 4_2023-11-07 in 0.11 sec.


Converted 'data\edgar_documents\CL\4_2023-11-06' --> 'data\processed_data\CL\4_2023-11-06.md'
Converted 'data\edgar_documents\CL\4_2023-11-07' --> 'data\processed_data\CL\4_2023-11-07.md'


2025-11-14 15:56:46,685 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:46,708 - INFO - Going to convert document batch...
2025-11-14 15:56:46,710 - INFO - Processing document 4_2023-11-13
2025-11-14 15:56:46,746 - INFO - Finished converting document 4_2023-11-13 in 0.11 sec.
2025-11-14 15:56:46,791 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:46,810 - INFO - Going to convert document batch...
2025-11-14 15:56:46,811 - INFO - Processing document 4_2023-11-14
2025-11-14 15:56:46,891 - INFO - Finished converting document 4_2023-11-14 in 0.11 sec.
2025-11-14 15:56:46,967 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\4_2023-11-13' --> 'data\processed_data\CL\4_2023-11-13.md'
Converted 'data\edgar_documents\CL\4_2023-11-14' --> 'data\processed_data\CL\4_2023-11-14.md'


2025-11-14 15:56:46,993 - INFO - Going to convert document batch...
2025-11-14 15:56:46,994 - INFO - Processing document 4_2023-11-17
2025-11-14 15:56:47,042 - INFO - Finished converting document 4_2023-11-17 in 0.11 sec.
2025-11-14 15:56:47,107 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:47,157 - INFO - Going to convert document batch...
2025-11-14 15:56:47,159 - INFO - Processing document 4_2023-11-30
2025-11-14 15:56:47,209 - INFO - Finished converting document 4_2023-11-30 in 0.12 sec.


Converted 'data\edgar_documents\CL\4_2023-11-17' --> 'data\processed_data\CL\4_2023-11-17.md'


2025-11-14 15:56:47,321 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:47,353 - INFO - Going to convert document batch...
2025-11-14 15:56:47,355 - INFO - Processing document 4_2023-12-04
2025-11-14 15:56:47,427 - INFO - Finished converting document 4_2023-12-04 in 0.14 sec.


Converted 'data\edgar_documents\CL\4_2023-11-30' --> 'data\processed_data\CL\4_2023-11-30.md'
Converted 'data\edgar_documents\CL\4_2023-12-04' --> 'data\processed_data\CL\4_2023-12-04.md'


2025-11-14 15:56:47,499 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:47,516 - INFO - Going to convert document batch...
2025-11-14 15:56:47,517 - INFO - Processing document 4_2023-12-08
2025-11-14 15:56:47,550 - INFO - Finished converting document 4_2023-12-08 in 0.08 sec.
2025-11-14 15:56:47,598 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:47,626 - INFO - Going to convert document batch...
2025-11-14 15:56:47,628 - INFO - Processing document 4_2024-01-04
2025-11-14 15:56:47,664 - INFO - Finished converting document 4_2024-01-04 in 0.08 sec.
2025-11-14 15:56:47,750 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:47,781 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CL\4_2023-12-08' --> 'data\processed_data\CL\4_2023-12-08.md'
Converted 'data\edgar_documents\CL\4_2024-01-04' --> 'data\processed_data\CL\4_2024-01-04.md'


2025-11-14 15:56:47,782 - INFO - Processing document 4_2024-02-02
2025-11-14 15:56:47,846 - INFO - Finished converting document 4_2024-02-02 in 0.14 sec.
2025-11-14 15:56:47,905 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:47,938 - INFO - Going to convert document batch...
2025-11-14 15:56:47,940 - INFO - Processing document 4_2024-02-07
2025-11-14 15:56:47,993 - INFO - Finished converting document 4_2024-02-07 in 0.09 sec.


Converted 'data\edgar_documents\CL\4_2024-02-02' --> 'data\processed_data\CL\4_2024-02-02.md'
Converted 'data\edgar_documents\CL\4_2024-02-07' --> 'data\processed_data\CL\4_2024-02-07.md'


2025-11-14 15:56:48,094 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:48,131 - INFO - Going to convert document batch...
2025-11-14 15:56:48,134 - INFO - Processing document 4_2024-02-13
2025-11-14 15:56:48,194 - INFO - Finished converting document 4_2024-02-13 in 0.14 sec.
2025-11-14 15:56:48,324 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:48,360 - INFO - Going to convert document batch...
2025-11-14 15:56:48,361 - INFO - Processing document 4_2024-02-14
2025-11-14 15:56:48,429 - INFO - Finished converting document 4_2024-02-14 in 0.17 sec.


Converted 'data\edgar_documents\CL\4_2024-02-13' --> 'data\processed_data\CL\4_2024-02-13.md'


2025-11-14 15:56:48,524 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:48,556 - INFO - Going to convert document batch...
2025-11-14 15:56:48,558 - INFO - Processing document 4_2024-02-15
2025-11-14 15:56:48,601 - INFO - Finished converting document 4_2024-02-15 in 0.11 sec.
2025-11-14 15:56:48,655 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:48,673 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CL\4_2024-02-14' --> 'data\processed_data\CL\4_2024-02-14.md'
Converted 'data\edgar_documents\CL\4_2024-02-15' --> 'data\processed_data\CL\4_2024-02-15.md'


2025-11-14 15:56:48,674 - INFO - Processing document 4_2024-02-20
2025-11-14 15:56:48,714 - INFO - Finished converting document 4_2024-02-20 in 0.06 sec.
2025-11-14 15:56:48,772 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:48,787 - INFO - Going to convert document batch...
2025-11-14 15:56:48,788 - INFO - Processing document 4_2024-04-03
2025-11-14 15:56:48,819 - INFO - Finished converting document 4_2024-04-03 in 0.06 sec.
2025-11-14 15:56:48,893 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:48,918 - INFO - Going to convert document batch...
2025-11-14 15:56:48,919 - INFO - Processing document 4_2024-05-03
2025-11-14 15:56:48,960 - INFO - Finished converting document 4_2024-05-03 in 0.09 sec.


Converted 'data\edgar_documents\CL\4_2024-02-20' --> 'data\processed_data\CL\4_2024-02-20.md'
Converted 'data\edgar_documents\CL\4_2024-04-03' --> 'data\processed_data\CL\4_2024-04-03.md'


2025-11-14 15:56:49,027 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:49,041 - INFO - Going to convert document batch...
2025-11-14 15:56:49,042 - INFO - Processing document 4_2024-05-09
2025-11-14 15:56:49,073 - INFO - Finished converting document 4_2024-05-09 in 0.08 sec.
2025-11-14 15:56:49,135 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:49,159 - INFO - Going to convert document batch...
2025-11-14 15:56:49,160 - INFO - Processing document 4_2024-05-10
2025-11-14 15:56:49,202 - INFO - Finished converting document 4_2024-05-10 in 0.09 sec.


Converted 'data\edgar_documents\CL\4_2024-05-03' --> 'data\processed_data\CL\4_2024-05-03.md'
Converted 'data\edgar_documents\CL\4_2024-05-09' --> 'data\processed_data\CL\4_2024-05-09.md'


2025-11-14 15:56:49,252 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:49,262 - INFO - Going to convert document batch...
2025-11-14 15:56:49,262 - INFO - Processing document 4_2024-05-15
2025-11-14 15:56:49,300 - INFO - Finished converting document 4_2024-05-15 in 0.06 sec.
2025-11-14 15:56:49,379 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:49,397 - INFO - Going to convert document batch...
2025-11-14 15:56:49,399 - INFO - Processing document 4_2024-05-16


Converted 'data\edgar_documents\CL\4_2024-05-10' --> 'data\processed_data\CL\4_2024-05-10.md'
Converted 'data\edgar_documents\CL\4_2024-05-15' --> 'data\processed_data\CL\4_2024-05-15.md'


2025-11-14 15:56:49,459 - INFO - Finished converting document 4_2024-05-16 in 0.09 sec.
2025-11-14 15:56:49,525 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:49,548 - INFO - Going to convert document batch...
2025-11-14 15:56:49,550 - INFO - Processing document 4_2024-07-03
2025-11-14 15:56:49,630 - INFO - Finished converting document 4_2024-07-03 in 0.12 sec.
2025-11-14 15:56:49,682 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\4_2024-05-16' --> 'data\processed_data\CL\4_2024-05-16.md'
Converted 'data\edgar_documents\CL\4_2024-07-03' --> 'data\processed_data\CL\4_2024-07-03.md'


2025-11-14 15:56:49,709 - INFO - Going to convert document batch...
2025-11-14 15:56:49,711 - INFO - Processing document 4_2024-08-02
2025-11-14 15:56:49,750 - INFO - Finished converting document 4_2024-08-02 in 0.09 sec.
2025-11-14 15:56:49,807 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:49,819 - INFO - Going to convert document batch...
2025-11-14 15:56:49,819 - INFO - Processing document 4_2024-08-08
2025-11-14 15:56:49,845 - INFO - Finished converting document 4_2024-08-08 in 0.06 sec.
2025-11-14 15:56:49,895 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:49,910 - INFO - Going to convert document batch...
2025-11-14 15:56:49,911 - INFO - Processing document 4_2024-08-12
2025-11-14 15:56:49,938 - INFO - Finished converting document 4_2024-08-12 in 0.06 sec.


Converted 'data\edgar_documents\CL\4_2024-08-02' --> 'data\processed_data\CL\4_2024-08-02.md'
Converted 'data\edgar_documents\CL\4_2024-08-08' --> 'data\processed_data\CL\4_2024-08-08.md'


2025-11-14 15:56:49,983 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:49,993 - INFO - Going to convert document batch...
2025-11-14 15:56:49,994 - INFO - Processing document 4_2024-08-27
2025-11-14 15:56:50,016 - INFO - Finished converting document 4_2024-08-27 in 0.05 sec.
2025-11-14 15:56:50,066 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:50,074 - INFO - Going to convert document batch...
2025-11-14 15:56:50,075 - INFO - Processing document 4_2024-09-12
2025-11-14 15:56:50,095 - INFO - Finished converting document 4_2024-09-12 in 0.05 sec.
2025-11-14 15:56:50,135 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:50,147 - INFO - Going to convert document batch...
2025-11-14 15:56:50,147 - INFO - Processing document 4_2024-09-16
2025-11-14 15:56:50,170 - INFO - Finished converting document 4_2024-09-16 in 0.06 sec.


Converted 'data\edgar_documents\CL\4_2024-08-12' --> 'data\processed_data\CL\4_2024-08-12.md'
Converted 'data\edgar_documents\CL\4_2024-08-27' --> 'data\processed_data\CL\4_2024-08-27.md'
Converted 'data\edgar_documents\CL\4_2024-09-12' --> 'data\processed_data\CL\4_2024-09-12.md'


2025-11-14 15:56:50,217 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:50,226 - INFO - Going to convert document batch...
2025-11-14 15:56:50,227 - INFO - Processing document 4_2024-10-03
2025-11-14 15:56:50,245 - INFO - Finished converting document 4_2024-10-03 in 0.06 sec.
2025-11-14 15:56:50,301 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:50,316 - INFO - Going to convert document batch...
2025-11-14 15:56:50,317 - INFO - Processing document 4_2024-11-05
2025-11-14 15:56:50,336 - INFO - Finished converting document 4_2024-11-05 in 0.06 sec.
2025-11-14 15:56:50,366 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:50,376 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CL\4_2024-09-16' --> 'data\processed_data\CL\4_2024-09-16.md'
Converted 'data\edgar_documents\CL\4_2024-10-03' --> 'data\processed_data\CL\4_2024-10-03.md'
Converted 'data\edgar_documents\CL\4_2024-11-05' --> 'data\processed_data\CL\4_2024-11-05.md'


2025-11-14 15:56:50,377 - INFO - Processing document 4_2024-11-07
2025-11-14 15:56:50,399 - INFO - Finished converting document 4_2024-11-07 in 0.03 sec.
2025-11-14 15:56:50,446 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:50,454 - INFO - Going to convert document batch...
2025-11-14 15:56:50,455 - INFO - Processing document 4_2024-11-26
2025-11-14 15:56:50,473 - INFO - Finished converting document 4_2024-11-26 in 0.05 sec.
2025-11-14 15:56:50,517 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:50,525 - INFO - Going to convert document batch...
2025-11-14 15:56:50,527 - INFO - Processing document 4_2024-11-27
2025-11-14 15:56:50,543 - INFO - Finished converting document 4_2024-11-27 in 0.06 sec.
2025-11-14 15:56:50,590 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:50,597 - INFO - Going to convert document batch...
2025-11-14 15:56:50,598 - INFO - Processing document 4_2024-12-05


Converted 'data\edgar_documents\CL\4_2024-11-07' --> 'data\processed_data\CL\4_2024-11-07.md'
Converted 'data\edgar_documents\CL\4_2024-11-26' --> 'data\processed_data\CL\4_2024-11-26.md'
Converted 'data\edgar_documents\CL\4_2024-11-27' --> 'data\processed_data\CL\4_2024-11-27.md'


2025-11-14 15:56:50,615 - INFO - Finished converting document 4_2024-12-05 in 0.05 sec.
2025-11-14 15:56:50,658 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:50,665 - INFO - Going to convert document batch...
2025-11-14 15:56:50,665 - INFO - Processing document 4_2025-01-06
2025-11-14 15:56:50,682 - INFO - Finished converting document 4_2025-01-06 in 0.05 sec.
2025-11-14 15:56:50,717 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:50,727 - INFO - Going to convert document batch...
2025-11-14 15:56:50,728 - INFO - Processing document 4_2025-02-18
2025-11-14 15:56:50,747 - INFO - Finished converting document 4_2025-02-18 in 0.05 sec.
2025-11-14 15:56:50,789 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:50,796 - INFO - Going to convert document batch...
2025-11-14 15:56:50,797 - INFO - Processing document 4_2025-02-27
2025-11-14 15:56:50,815 - INFO - Finished converting document 4_2025-02-27 in 0.05 sec.


Converted 'data\edgar_documents\CL\4_2024-12-05' --> 'data\processed_data\CL\4_2024-12-05.md'
Converted 'data\edgar_documents\CL\4_2025-01-06' --> 'data\processed_data\CL\4_2025-01-06.md'
Converted 'data\edgar_documents\CL\4_2025-02-18' --> 'data\processed_data\CL\4_2025-02-18.md'


2025-11-14 15:56:50,859 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:50,867 - INFO - Going to convert document batch...
2025-11-14 15:56:50,868 - INFO - Processing document 4_2025-04-03
2025-11-14 15:56:50,887 - INFO - Finished converting document 4_2025-04-03 in 0.06 sec.
2025-11-14 15:56:50,936 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:56:50,936 - ERROR - Input document 4_2025-04-28 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:56

Converted 'data\edgar_documents\CL\4_2025-02-27' --> 'data\processed_data\CL\4_2025-02-27.md'
Converted 'data\edgar_documents\CL\4_2025-04-03' --> 'data\processed_data\CL\4_2025-04-03.md'
Error processing data\edgar_documents\CL\4_2025-04-28: File format not allowed: data\edgar_documents\CL\4_2025-04-28
Error processing data\edgar_documents\CL\4_2025-04-30: File format not allowed: data\edgar_documents\CL\4_2025-04-30


2025-11-14 15:56:51,071 - INFO - Finished converting document 4_2025-05-14 in 0.11 sec.
2025-11-14 15:56:51,161 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:51,181 - INFO - Going to convert document batch...
2025-11-14 15:56:51,183 - INFO - Processing document 4_2025-05-19
2025-11-14 15:56:51,222 - INFO - Finished converting document 4_2025-05-19 in 0.08 sec.
2025-11-14 15:56:51,284 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:51,300 - INFO - Going to convert document batch...
2025-11-14 15:56:51,301 - INFO - Processing document 4_2025-06-18


Converted 'data\edgar_documents\CL\4_2025-05-14' --> 'data\processed_data\CL\4_2025-05-14.md'
Converted 'data\edgar_documents\CL\4_2025-05-19' --> 'data\processed_data\CL\4_2025-05-19.md'


2025-11-14 15:56:51,335 - INFO - Finished converting document 4_2025-06-18 in 0.06 sec.
2025-11-14 15:56:51,392 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:51,415 - INFO - Going to convert document batch...
2025-11-14 15:56:51,416 - INFO - Processing document 4_2025-07-02
2025-11-14 15:56:51,451 - INFO - Finished converting document 4_2025-07-02 in 0.08 sec.
2025-11-14 15:56:51,497 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:51,517 - INFO - Going to convert document batch...
2025-11-14 15:56:51,518 - INFO - Processing document 4_2025-09-12
2025-11-14 15:56:51,562 - INFO - Finished converting document 4_2025-09-12 in 0.08 sec.


Converted 'data\edgar_documents\CL\4_2025-06-18' --> 'data\processed_data\CL\4_2025-06-18.md'
Converted 'data\edgar_documents\CL\4_2025-07-02' --> 'data\processed_data\CL\4_2025-07-02.md'


2025-11-14 15:56:51,627 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\4_2025-09-12' --> 'data\processed_data\CL\4_2025-09-12.md'


2025-11-14 15:56:52,421 - INFO - Going to convert document batch...
2025-11-14 15:56:52,423 - INFO - Processing document 4_2025-09-16
2025-11-14 15:56:52,466 - INFO - Finished converting document 4_2025-09-16 in 0.88 sec.
2025-11-14 15:56:52,536 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:52,553 - INFO - Going to convert document batch...
2025-11-14 15:56:52,554 - INFO - Processing document 4_2025-10-03
2025-11-14 15:56:52,600 - INFO - Finished converting document 4_2025-10-03 in 0.08 sec.
2025-11-14 15:56:52,677 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:56:52,678 - ERROR - Input document 4_2025-11-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <Input

Converted 'data\edgar_documents\CL\4_2025-09-16' --> 'data\processed_data\CL\4_2025-09-16.md'
Converted 'data\edgar_documents\CL\4_2025-10-03' --> 'data\processed_data\CL\4_2025-10-03.md'
Error processing data\edgar_documents\CL\4_2025-11-03: File format not allowed: data\edgar_documents\CL\4_2025-11-03


2025-11-14 15:56:52,700 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:56:52,702 - ERROR - Input document 4_2025-11-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:56:52,703 - INFO - Going to convert document batch...
2025-11-14 15:56:52,718 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:52,755 - INFO - Going to convert document batch...
2025-11-14 15:56:52,757 - INFO - Processing document 8-K_2023-01-12
2025-11-14 15:56:52,800 - INFO - F

Error processing data\edgar_documents\CL\4_2025-11-05: File format not allowed: data\edgar_documents\CL\4_2025-11-05
Converted 'data\edgar_documents\CL\8-K_2023-01-12' --> 'data\processed_data\CL\8-K_2023-01-12.md'


2025-11-14 15:56:52,911 - INFO - Finished converting document 8-K_2023-01-27 in 0.09 sec.
2025-11-14 15:56:52,945 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:52,971 - INFO - Going to convert document batch...
2025-11-14 15:56:52,972 - INFO - Processing document 8-K_2023-01-30
2025-11-14 15:56:53,005 - INFO - Finished converting document 8-K_2023-01-30 in 0.08 sec.
2025-11-14 15:56:53,063 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:56:53,064 - ERROR - Input document 8-K_2023-03-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS:

Converted 'data\edgar_documents\CL\8-K_2023-01-27' --> 'data\processed_data\CL\8-K_2023-01-27.md'
Converted 'data\edgar_documents\CL\8-K_2023-01-30' --> 'data\processed_data\CL\8-K_2023-01-30.md'
Error processing data\edgar_documents\CL\8-K_2023-03-01: File format not allowed: data\edgar_documents\CL\8-K_2023-03-01


2025-11-14 15:56:53,133 - INFO - Processing document 8-K_2023-04-28
2025-11-14 15:56:53,188 - INFO - Finished converting document 8-K_2023-04-28 in 0.12 sec.
2025-11-14 15:56:53,230 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:53,323 - INFO - Going to convert document batch...
2025-11-14 15:56:53,325 - INFO - Processing document 8-K_2023-05-17
2025-11-14 15:56:53,399 - INFO - Finished converting document 8-K_2023-05-17 in 0.19 sec.


Converted 'data\edgar_documents\CL\8-K_2023-04-28' --> 'data\processed_data\CL\8-K_2023-04-28.md'


2025-11-14 15:56:53,461 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:53,489 - INFO - Going to convert document batch...
2025-11-14 15:56:53,490 - INFO - Processing document 8-K_2023-07-28
2025-11-14 15:56:53,535 - INFO - Finished converting document 8-K_2023-07-28 in 0.09 sec.
2025-11-14 15:56:53,592 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:53,616 - INFO - Going to convert document batch...
2025-11-14 15:56:53,617 - INFO - Processing document 8-K_2023-08-18


Converted 'data\edgar_documents\CL\8-K_2023-05-17' --> 'data\processed_data\CL\8-K_2023-05-17.md'
Converted 'data\edgar_documents\CL\8-K_2023-07-28' --> 'data\processed_data\CL\8-K_2023-07-28.md'


2025-11-14 15:56:53,660 - INFO - Finished converting document 8-K_2023-08-18 in 0.09 sec.
2025-11-14 15:56:53,711 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:53,742 - INFO - Going to convert document batch...
2025-11-14 15:56:53,744 - INFO - Processing document 8-K_2023-09-15
2025-11-14 15:56:53,784 - INFO - Finished converting document 8-K_2023-09-15 in 0.11 sec.
2025-11-14 15:56:53,817 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:53,844 - INFO - Going to convert document batch...
2025-11-14 15:56:53,845 - INFO - Processing document 8-K_2023-10-27


Converted 'data\edgar_documents\CL\8-K_2023-08-18' --> 'data\processed_data\CL\8-K_2023-08-18.md'
Converted 'data\edgar_documents\CL\8-K_2023-09-15' --> 'data\processed_data\CL\8-K_2023-09-15.md'


2025-11-14 15:56:53,896 - INFO - Finished converting document 8-K_2023-10-27 in 0.09 sec.
2025-11-14 15:56:53,935 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:53,968 - INFO - Going to convert document batch...
2025-11-14 15:56:53,969 - INFO - Processing document 8-K_2024-01-26
2025-11-14 15:56:54,015 - INFO - Finished converting document 8-K_2024-01-26 in 0.09 sec.
2025-11-14 15:56:54,116 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\CL\8-K_2023-10-27' --> 'data\processed_data\CL\8-K_2023-10-27.md'
Converted 'data\edgar_documents\CL\8-K_2024-01-26' --> 'data\processed_data\CL\8-K_2024-01-26.md'


2025-11-14 15:56:54,120 - ERROR - Input document 8-K_2024-02-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:56:54,123 - INFO - Going to convert document batch...
2025-11-14 15:56:54,169 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:54,206 - INFO - Going to convert document batch...
2025-11-14 15:56:54,207 - INFO - Processing document 8-K_2024-04-26
2025-11-14 15:56:54,247 - INFO - Finished converting document 8-K_2024-04-26 in 0.12 sec.
2025-11-14 15:56:54,297 - INFO -

Error processing data\edgar_documents\CL\8-K_2024-02-15: File format not allowed: data\edgar_documents\CL\8-K_2024-02-15
Converted 'data\edgar_documents\CL\8-K_2024-04-26' --> 'data\processed_data\CL\8-K_2024-04-26.md'


2025-11-14 15:56:54,356 - INFO - Going to convert document batch...
2025-11-14 15:56:54,359 - INFO - Processing document 8-K_2024-05-15
2025-11-14 15:56:54,429 - INFO - Finished converting document 8-K_2024-05-15 in 0.14 sec.
2025-11-14 15:56:54,488 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:54,522 - INFO - Going to convert document batch...
2025-11-14 15:56:54,524 - INFO - Processing document 8-K_2024-07-26
2025-11-14 15:56:54,574 - INFO - Finished converting document 8-K_2024-07-26 in 0.12 sec.
2025-11-14 15:56:54,637 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\8-K_2024-05-15' --> 'data\processed_data\CL\8-K_2024-05-15.md'
Converted 'data\edgar_documents\CL\8-K_2024-07-26' --> 'data\processed_data\CL\8-K_2024-07-26.md'


2025-11-14 15:56:54,663 - INFO - Going to convert document batch...
2025-11-14 15:56:54,663 - INFO - Processing document 8-K_2024-10-25
2025-11-14 15:56:54,727 - INFO - Finished converting document 8-K_2024-10-25 in 0.12 sec.
2025-11-14 15:56:54,809 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:54,854 - INFO - Going to convert document batch...
2025-11-14 15:56:54,856 - INFO - Processing document 8-K_2025-01-24
2025-11-14 15:56:54,937 - INFO - Finished converting document 8-K_2025-01-24 in 0.19 sec.


Converted 'data\edgar_documents\CL\8-K_2024-10-25' --> 'data\processed_data\CL\8-K_2024-10-25.md'


2025-11-14 15:56:55,006 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:55,041 - INFO - Going to convert document batch...
2025-11-14 15:56:55,043 - INFO - Processing document 8-K_2025-01-31
2025-11-14 15:56:55,109 - INFO - Finished converting document 8-K_2025-01-31 in 0.12 sec.


Converted 'data\edgar_documents\CL\8-K_2025-01-24' --> 'data\processed_data\CL\8-K_2025-01-24.md'
Converted 'data\edgar_documents\CL\8-K_2025-01-31' --> 'data\processed_data\CL\8-K_2025-01-31.md'


2025-11-14 15:56:55,194 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:55,243 - INFO - Going to convert document batch...
2025-11-14 15:56:55,244 - INFO - Processing document 8-K_2025-04-25
2025-11-14 15:56:55,371 - INFO - Finished converting document 8-K_2025-04-25 in 0.22 sec.
2025-11-14 15:56:55,438 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:55,465 - INFO - Going to convert document batch...
2025-11-14 15:56:55,467 - INFO - Processing document 8-K_2025-05-02
2025-11-14 15:56:55,510 - INFO - Finished converting document 8-K_2025-05-02 in 0.11 sec.
2025-11-14 15:56:55,574 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\8-K_2025-04-25' --> 'data\processed_data\CL\8-K_2025-04-25.md'
Converted 'data\edgar_documents\CL\8-K_2025-05-02' --> 'data\processed_data\CL\8-K_2025-05-02.md'


2025-11-14 15:56:55,616 - INFO - Going to convert document batch...
2025-11-14 15:56:55,617 - INFO - Processing document 8-K_2025-05-14
2025-11-14 15:56:55,688 - INFO - Finished converting document 8-K_2025-05-14 in 0.16 sec.
2025-11-14 15:56:55,738 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:55,762 - INFO - Going to convert document batch...
2025-11-14 15:56:55,763 - INFO - Processing document 8-K_2025-05-29
2025-11-14 15:56:55,798 - INFO - Finished converting document 8-K_2025-05-29 in 0.08 sec.
2025-11-14 15:56:55,827 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:55,853 - INFO - Going to convert document batch...
2025-11-14 15:56:55,854 - INFO - Processing document 8-K_2025-08-01
2025-11-14 15:56:55,889 - INFO - Finished converting document 8-K_2025-08-01 in 0.08 sec.


Converted 'data\edgar_documents\CL\8-K_2025-05-14' --> 'data\processed_data\CL\8-K_2025-05-14.md'
Converted 'data\edgar_documents\CL\8-K_2025-05-29' --> 'data\processed_data\CL\8-K_2025-05-29.md'


2025-11-14 15:56:55,938 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:56:55,978 - INFO - Going to convert document batch...
2025-11-14 15:56:55,980 - INFO - Processing document 8-K_2025-10-31
2025-11-14 15:56:56,035 - INFO - Finished converting document 8-K_2025-10-31 in 0.11 sec.
2025-11-14 15:56:56,106 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\8-K_2025-08-01' --> 'data\processed_data\CL\8-K_2025-08-01.md'
Converted 'data\edgar_documents\CL\8-K_2025-10-31' --> 'data\processed_data\CL\8-K_2025-10-31.md'


2025-11-14 15:56:56,146 - INFO - Going to convert document batch...
2025-11-14 15:56:56,148 - INFO - Processing document 8-K_2025-11-10
2025-11-14 15:56:56,206 - INFO - Finished converting document 8-K_2025-11-10 in 0.12 sec.
2025-11-14 15:56:56,332 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:56:56,333 - ERROR - Input document DEF-14A_2023-03-29 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:56:56,336 - INFO - Going to convert 

Converted 'data\edgar_documents\CL\8-K_2025-11-10' --> 'data\processed_data\CL\8-K_2025-11-10.md'
Error processing data\edgar_documents\CL\DEF-14A_2023-03-29: File format not allowed: data\edgar_documents\CL\DEF-14A_2023-03-29


2025-11-14 15:56:57,799 - INFO - Going to convert document batch...
2025-11-14 15:56:57,800 - INFO - Processing document DEF-14A_2024-03-27
2025-11-14 15:57:17,015 - INFO - Finished converting document DEF-14A_2024-03-27 in 20.67 sec.
2025-11-14 15:57:19,197 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\DEF-14A_2024-03-27' --> 'data\processed_data\CL\DEF-14A_2024-03-27.md'


2025-11-14 15:57:21,316 - INFO - Going to convert document batch...
2025-11-14 15:57:21,318 - INFO - Processing document DEF-14A_2025-03-26
2025-11-14 15:57:52,496 - INFO - Finished converting document DEF-14A_2025-03-26 in 33.39 sec.
2025-11-14 15:57:53,555 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CL\DEF-14A_2025-03-26' --> 'data\processed_data\CL\DEF-14A_2025-03-26.md'
Processed 103 new files. Errors: 8
Found 141 files to process in data\edgar_documents\CMCSA


2025-11-14 15:57:54,413 - INFO - Going to convert document batch...
2025-11-14 15:57:54,414 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:57:54,415 - INFO - Processing document 10-K_2023-02-03
2025-11-14 15:57:55,912 - INFO - Finished converting document 10-K_2023-02-03 in 2.41 sec.
2025-11-14 15:57:56,710 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\10-K_2023-02-03' --> 'data\processed_data\CMCSA\10-K_2023-02-03.md'


2025-11-14 15:57:57,281 - INFO - Going to convert document batch...
2025-11-14 15:57:57,282 - INFO - Processing document 10-K_2024-01-31
2025-11-14 15:57:58,775 - INFO - Finished converting document 10-K_2024-01-31 in 2.11 sec.
2025-11-14 15:57:59,716 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\10-K_2024-01-31' --> 'data\processed_data\CMCSA\10-K_2024-01-31.md'


2025-11-14 15:58:00,265 - INFO - Going to convert document batch...
2025-11-14 15:58:00,266 - INFO - Processing document 10-K_2025-01-31
2025-11-14 15:58:01,791 - INFO - Finished converting document 10-K_2025-01-31 in 2.12 sec.
2025-11-14 15:58:02,416 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\10-K_2025-01-31' --> 'data\processed_data\CMCSA\10-K_2025-01-31.md'


2025-11-14 15:58:03,074 - INFO - Going to convert document batch...
2025-11-14 15:58:03,074 - INFO - Processing document 10-Q_2023-04-27
2025-11-14 15:58:03,684 - INFO - Finished converting document 10-Q_2023-04-27 in 1.30 sec.
2025-11-14 15:58:04,040 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\10-Q_2023-04-27' --> 'data\processed_data\CMCSA\10-Q_2023-04-27.md'


2025-11-14 15:58:04,424 - INFO - Going to convert document batch...
2025-11-14 15:58:04,426 - INFO - Processing document 10-Q_2023-07-27
2025-11-14 15:58:05,513 - INFO - Finished converting document 10-Q_2023-07-27 in 1.52 sec.
2025-11-14 15:58:05,940 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\10-Q_2023-07-27' --> 'data\processed_data\CMCSA\10-Q_2023-07-27.md'


2025-11-14 15:58:06,325 - INFO - Going to convert document batch...
2025-11-14 15:58:06,326 - INFO - Processing document 10-Q_2023-10-26
2025-11-14 15:58:07,066 - INFO - Finished converting document 10-Q_2023-10-26 in 1.16 sec.
2025-11-14 15:58:07,474 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\10-Q_2023-10-26' --> 'data\processed_data\CMCSA\10-Q_2023-10-26.md'


2025-11-14 15:58:07,735 - INFO - Going to convert document batch...
2025-11-14 15:58:07,736 - INFO - Processing document 10-Q_2024-04-25
2025-11-14 15:58:08,568 - INFO - Finished converting document 10-Q_2024-04-25 in 1.12 sec.
2025-11-14 15:58:08,898 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\10-Q_2024-04-25' --> 'data\processed_data\CMCSA\10-Q_2024-04-25.md'


2025-11-14 15:58:09,237 - INFO - Going to convert document batch...
2025-11-14 15:58:09,237 - INFO - Processing document 10-Q_2024-07-23
2025-11-14 15:58:09,888 - INFO - Finished converting document 10-Q_2024-07-23 in 1.03 sec.
2025-11-14 15:58:10,260 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\10-Q_2024-07-23' --> 'data\processed_data\CMCSA\10-Q_2024-07-23.md'


2025-11-14 15:58:10,933 - INFO - Going to convert document batch...
2025-11-14 15:58:10,933 - INFO - Processing document 10-Q_2024-10-31
2025-11-14 15:58:11,579 - INFO - Finished converting document 10-Q_2024-10-31 in 1.38 sec.
2025-11-14 15:58:11,937 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\10-Q_2024-10-31' --> 'data\processed_data\CMCSA\10-Q_2024-10-31.md'


2025-11-14 15:58:12,185 - INFO - Going to convert document batch...
2025-11-14 15:58:12,186 - INFO - Processing document 10-Q_2025-04-24
2025-11-14 15:58:12,707 - INFO - Finished converting document 10-Q_2025-04-24 in 0.80 sec.
2025-11-14 15:58:13,011 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\10-Q_2025-04-24' --> 'data\processed_data\CMCSA\10-Q_2025-04-24.md'


2025-11-14 15:58:13,659 - INFO - Going to convert document batch...
2025-11-14 15:58:13,660 - INFO - Processing document 10-Q_2025-07-31
2025-11-14 15:58:14,301 - INFO - Finished converting document 10-Q_2025-07-31 in 1.33 sec.
2025-11-14 15:58:14,655 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\10-Q_2025-07-31' --> 'data\processed_data\CMCSA\10-Q_2025-07-31.md'


2025-11-14 15:58:15,047 - INFO - Going to convert document batch...
2025-11-14 15:58:15,047 - INFO - Processing document 10-Q_2025-10-30
2025-11-14 15:58:15,723 - INFO - Finished converting document 10-Q_2025-10-30 in 1.09 sec.
2025-11-14 15:58:16,094 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:16,109 - INFO - Going to convert document batch...
2025-11-14 15:58:16,109 - INFO - Processing document 4_2023-01-04
2025-11-14 15:58:16,127 - INFO - Finished converting document 4_2023-01-04 in 0.06 sec.
2025-11-14 15:58:16,172 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:16,182 - INFO - Going to convert document batch...
2025-11-14 15:58:16,183 - INFO - Processing document 4_2023-01-05
2025-11-14 15:58:16,201 - INFO - Finished converting document 4_2023-01-05 in 0.06 sec.
2025-11-14 15:58:16,229 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:16,238 - INFO - Going to convert document batch...
2025-11-14 15:58:16,

Converted 'data\edgar_documents\CMCSA\10-Q_2025-10-30' --> 'data\processed_data\CMCSA\10-Q_2025-10-30.md'
Converted 'data\edgar_documents\CMCSA\4_2023-01-04' --> 'data\processed_data\CMCSA\4_2023-01-04.md'
Converted 'data\edgar_documents\CMCSA\4_2023-01-05' --> 'data\processed_data\CMCSA\4_2023-01-05.md'


2025-11-14 15:58:16,289 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:16,297 - INFO - Going to convert document batch...
2025-11-14 15:58:16,299 - INFO - Processing document 4_2023-01-09
2025-11-14 15:58:16,317 - INFO - Finished converting document 4_2023-01-09 in 0.03 sec.
2025-11-14 15:58:16,360 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:16,372 - INFO - Going to convert document batch...
2025-11-14 15:58:16,373 - INFO - Processing document 4_2023-01-27
2025-11-14 15:58:16,389 - INFO - Finished converting document 4_2023-01-27 in 0.06 sec.
2025-11-14 15:58:16,434 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:16,453 - INFO - Going to convert document batch...
2025-11-14 15:58:16,454 - INFO - Processing document 4_2023-01-30


Converted 'data\edgar_documents\CMCSA\4_2023-01-06' --> 'data\processed_data\CMCSA\4_2023-01-06.md'
Converted 'data\edgar_documents\CMCSA\4_2023-01-09' --> 'data\processed_data\CMCSA\4_2023-01-09.md'
Converted 'data\edgar_documents\CMCSA\4_2023-01-27' --> 'data\processed_data\CMCSA\4_2023-01-27.md'


2025-11-14 15:58:16,481 - INFO - Finished converting document 4_2023-01-30 in 0.08 sec.
2025-11-14 15:58:16,512 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:16,525 - INFO - Going to convert document batch...
2025-11-14 15:58:16,526 - INFO - Processing document 4_2023-02-01
2025-11-14 15:58:16,558 - INFO - Finished converting document 4_2023-02-01 in 0.06 sec.
2025-11-14 15:58:16,595 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:16,607 - INFO - Going to convert document batch...
2025-11-14 15:58:16,608 - INFO - Processing document 4_2023-02-06
2025-11-14 15:58:16,640 - INFO - Finished converting document 4_2023-02-06 in 0.06 sec.


Converted 'data\edgar_documents\CMCSA\4_2023-01-30' --> 'data\processed_data\CMCSA\4_2023-01-30.md'
Converted 'data\edgar_documents\CMCSA\4_2023-02-01' --> 'data\processed_data\CMCSA\4_2023-02-01.md'
Converted 'data\edgar_documents\CMCSA\4_2023-02-06' --> 'data\processed_data\CMCSA\4_2023-02-06.md'


2025-11-14 15:58:16,710 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:58:16,711 - ERROR - Input document 4_2023-02-07 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:58:16,713 - INFO - Going to convert document batch...
2025-11-14 15:58:16,735 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:58:16,736 - ERROR - Input document 4_2023-02-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\CMCSA\4_2023-02-07: File format not allowed: data\edgar_documents\CMCSA\4_2023-02-07
Error processing data\edgar_documents\CMCSA\4_2023-02-08: File format not allowed: data\edgar_documents\CMCSA\4_2023-02-08
Converted 'data\edgar_documents\CMCSA\4_2023-02-16' --> 'data\processed_data\CMCSA\4_2023-02-16.md'


2025-11-14 15:58:17,091 - INFO - Going to convert document batch...
2025-11-14 15:58:17,091 - INFO - Processing document 4_2023-02-21
2025-11-14 15:58:17,124 - INFO - Finished converting document 4_2023-02-21 in 0.33 sec.
2025-11-14 15:58:17,163 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:17,173 - INFO - Going to convert document batch...
2025-11-14 15:58:17,173 - INFO - Processing document 4_2023-03-03
2025-11-14 15:58:17,196 - INFO - Finished converting document 4_2023-03-03 in 0.03 sec.
2025-11-14 15:58:17,225 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:17,233 - INFO - Going to convert document batch...
2025-11-14 15:58:17,234 - INFO - Processing document 4_2023-03-09
2025-11-14 15:58:17,251 - INFO - Finished converting document 4_2023-03-09 in 0.03 sec.
2025-11-14 15:58:17,280 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:17,287 - INFO - Going to convert document batch...
2025-11-14 15:58:17,288 - 

Converted 'data\edgar_documents\CMCSA\4_2023-02-21' --> 'data\processed_data\CMCSA\4_2023-02-21.md'
Converted 'data\edgar_documents\CMCSA\4_2023-03-03' --> 'data\processed_data\CMCSA\4_2023-03-03.md'
Converted 'data\edgar_documents\CMCSA\4_2023-03-09' --> 'data\processed_data\CMCSA\4_2023-03-09.md'
Converted 'data\edgar_documents\CMCSA\4_2023-03-17' --> 'data\processed_data\CMCSA\4_2023-03-17.md'


2025-11-14 15:58:17,353 - INFO - Going to convert document batch...
2025-11-14 15:58:17,355 - INFO - Processing document 4_2023-03-30
2025-11-14 15:58:17,373 - INFO - Finished converting document 4_2023-03-30 in 0.06 sec.
2025-11-14 15:58:17,410 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:17,417 - INFO - Going to convert document batch...
2025-11-14 15:58:17,418 - INFO - Processing document 4_2023-04-04
2025-11-14 15:58:17,435 - INFO - Finished converting document 4_2023-04-04 in 0.05 sec.
2025-11-14 15:58:17,473 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:58:17,474 - ERROR - Input document 4_2023-05-02 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <Input

Converted 'data\edgar_documents\CMCSA\4_2023-03-30' --> 'data\processed_data\CMCSA\4_2023-03-30.md'
Converted 'data\edgar_documents\CMCSA\4_2023-04-04' --> 'data\processed_data\CMCSA\4_2023-04-04.md'
Error processing data\edgar_documents\CMCSA\4_2023-05-02: File format not allowed: data\edgar_documents\CMCSA\4_2023-05-02
Converted 'data\edgar_documents\CMCSA\4_2023-05-24' --> 'data\processed_data\CMCSA\4_2023-05-24.md'


2025-11-14 15:58:17,579 - INFO - Processing document 4_2023-06-06
2025-11-14 15:58:17,599 - INFO - Finished converting document 4_2023-06-06 in 0.05 sec.
2025-11-14 15:58:17,634 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:17,642 - INFO - Going to convert document batch...
2025-11-14 15:58:17,643 - INFO - Processing document 4_2023-06-14
2025-11-14 15:58:17,660 - INFO - Finished converting document 4_2023-06-14 in 0.03 sec.
2025-11-14 15:58:17,692 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:17,701 - INFO - Going to convert document batch...
2025-11-14 15:58:17,701 - INFO - Processing document 4_2023-06-21
2025-11-14 15:58:17,721 - INFO - Finished converting document 4_2023-06-21 in 0.03 sec.
2025-11-14 15:58:17,772 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:17,785 - INFO - Going to convert document batch...
2025-11-14 15:58:17,786 - INFO - Processing document 4_2023-07-05
2025-11-14 15:58:17,805 - IN

Converted 'data\edgar_documents\CMCSA\4_2023-06-06' --> 'data\processed_data\CMCSA\4_2023-06-06.md'
Converted 'data\edgar_documents\CMCSA\4_2023-06-14' --> 'data\processed_data\CMCSA\4_2023-06-14.md'
Converted 'data\edgar_documents\CMCSA\4_2023-06-21' --> 'data\processed_data\CMCSA\4_2023-06-21.md'
Converted 'data\edgar_documents\CMCSA\4_2023-07-05' --> 'data\processed_data\CMCSA\4_2023-07-05.md'


2025-11-14 15:58:17,853 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:17,868 - INFO - Going to convert document batch...
2025-11-14 15:58:17,870 - INFO - Processing document 4_2023-08-07
2025-11-14 15:58:17,890 - INFO - Finished converting document 4_2023-08-07 in 0.06 sec.
2025-11-14 15:58:17,921 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:17,928 - INFO - Going to convert document batch...
2025-11-14 15:58:17,929 - INFO - Processing document 4_2023-08-30
2025-11-14 15:58:17,944 - INFO - Finished converting document 4_2023-08-30 in 0.03 sec.
2025-11-14 15:58:17,971 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:17,980 - INFO - Going to convert document batch...
2025-11-14 15:58:17,980 - INFO - Processing document 4_2023-10-03
2025-11-14 15:58:17,997 - INFO - Finished converting document 4_2023-10-03 in 0.05 sec.
2025-11-14 15:58:18,042 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\CMCSA\4_2023-08-07' --> 'data\processed_data\CMCSA\4_2023-08-07.md'
Converted 'data\edgar_documents\CMCSA\4_2023-08-30' --> 'data\processed_data\CMCSA\4_2023-08-30.md'
Converted 'data\edgar_documents\CMCSA\4_2023-10-03' --> 'data\processed_data\CMCSA\4_2023-10-03.md'
Converted 'data\edgar_documents\CMCSA\4_2023-10-05' --> 'data\processed_data\CMCSA\4_2023-10-05.md'


2025-11-14 15:58:18,104 - INFO - Going to convert document batch...
2025-11-14 15:58:18,105 - INFO - Processing document 4_2023-11-15
2025-11-14 15:58:18,124 - INFO - Finished converting document 4_2023-11-15 in 0.05 sec.
2025-11-14 15:58:18,160 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:18,172 - INFO - Going to convert document batch...
2025-11-14 15:58:18,174 - INFO - Processing document 4_2023-11-22
2025-11-14 15:58:18,202 - INFO - Finished converting document 4_2023-11-22 in 0.06 sec.
2025-11-14 15:58:18,231 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:18,244 - INFO - Going to convert document batch...
2025-11-14 15:58:18,245 - INFO - Processing document 4_2023-12-06
2025-11-14 15:58:18,278 - INFO - Finished converting document 4_2023-12-06 in 0.06 sec.
2025-11-14 15:58:18,318 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:18,326 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CMCSA\4_2023-11-15' --> 'data\processed_data\CMCSA\4_2023-11-15.md'
Converted 'data\edgar_documents\CMCSA\4_2023-11-22' --> 'data\processed_data\CMCSA\4_2023-11-22.md'
Converted 'data\edgar_documents\CMCSA\4_2023-12-06' --> 'data\processed_data\CMCSA\4_2023-12-06.md'


2025-11-14 15:58:18,327 - INFO - Processing document 4_2023-12-18
2025-11-14 15:58:18,345 - INFO - Finished converting document 4_2023-12-18 in 0.03 sec.
2025-11-14 15:58:18,374 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:18,382 - INFO - Going to convert document batch...
2025-11-14 15:58:18,383 - INFO - Processing document 4_2024-01-03
2025-11-14 15:58:18,401 - INFO - Finished converting document 4_2024-01-03 in 0.05 sec.
2025-11-14 15:58:18,429 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:18,437 - INFO - Going to convert document batch...
2025-11-14 15:58:18,438 - INFO - Processing document 4_2024-01-04
2025-11-14 15:58:18,454 - INFO - Finished converting document 4_2024-01-04 in 0.03 sec.
2025-11-14 15:58:18,485 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:18,494 - INFO - Going to convert document batch...
2025-11-14 15:58:18,495 - INFO - Processing document 4_2024-01-08
2025-11-14 15:58:18,513 - IN

Converted 'data\edgar_documents\CMCSA\4_2023-12-18' --> 'data\processed_data\CMCSA\4_2023-12-18.md'
Converted 'data\edgar_documents\CMCSA\4_2024-01-03' --> 'data\processed_data\CMCSA\4_2024-01-03.md'
Converted 'data\edgar_documents\CMCSA\4_2024-01-04' --> 'data\processed_data\CMCSA\4_2024-01-04.md'
Converted 'data\edgar_documents\CMCSA\4_2024-01-08' --> 'data\processed_data\CMCSA\4_2024-01-08.md'


2025-11-14 15:58:18,555 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:18,564 - INFO - Going to convert document batch...
2025-11-14 15:58:18,565 - INFO - Processing document 4_2024-01-16
2025-11-14 15:58:18,586 - INFO - Finished converting document 4_2024-01-16 in 0.05 sec.
2025-11-14 15:58:18,618 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:18,625 - INFO - Going to convert document batch...
2025-11-14 15:58:18,626 - INFO - Processing document 4_2024-01-29
2025-11-14 15:58:18,642 - INFO - Finished converting document 4_2024-01-29 in 0.03 sec.
2025-11-14 15:58:18,685 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:18,700 - INFO - Going to convert document batch...
2025-11-14 15:58:18,701 - INFO - Processing document 4_2024-01-30
2025-11-14 15:58:18,725 - INFO - Finished converting document 4_2024-01-30 in 0.06 sec.
2025-11-14 15:58:18,752 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\CMCSA\4_2024-01-16' --> 'data\processed_data\CMCSA\4_2024-01-16.md'
Converted 'data\edgar_documents\CMCSA\4_2024-01-29' --> 'data\processed_data\CMCSA\4_2024-01-29.md'
Converted 'data\edgar_documents\CMCSA\4_2024-01-30' --> 'data\processed_data\CMCSA\4_2024-01-30.md'
Converted 'data\edgar_documents\CMCSA\4_2024-01-31' --> 'data\processed_data\CMCSA\4_2024-01-31.md'


2025-11-14 15:58:18,822 - INFO - Going to convert document batch...
2025-11-14 15:58:18,822 - INFO - Processing document 4_2024-02-16
2025-11-14 15:58:18,840 - INFO - Finished converting document 4_2024-02-16 in 0.05 sec.
2025-11-14 15:58:18,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:18,882 - INFO - Going to convert document batch...
2025-11-14 15:58:18,883 - INFO - Processing document 4_2024-03-05
2025-11-14 15:58:18,907 - INFO - Finished converting document 4_2024-03-05 in 0.05 sec.
2025-11-14 15:58:18,960 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:18,972 - INFO - Going to convert document batch...
2025-11-14 15:58:18,973 - INFO - Processing document 4_2024-03-11
2025-11-14 15:58:18,991 - INFO - Finished converting document 4_2024-03-11 in 0.06 sec.
2025-11-14 15:58:19,034 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:19,047 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CMCSA\4_2024-02-16' --> 'data\processed_data\CMCSA\4_2024-02-16.md'
Converted 'data\edgar_documents\CMCSA\4_2024-03-05' --> 'data\processed_data\CMCSA\4_2024-03-05.md'
Converted 'data\edgar_documents\CMCSA\4_2024-03-11' --> 'data\processed_data\CMCSA\4_2024-03-11.md'


2025-11-14 15:58:19,048 - INFO - Processing document 4_2024-03-19
2025-11-14 15:58:19,069 - INFO - Finished converting document 4_2024-03-19 in 0.06 sec.
2025-11-14 15:58:19,100 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:19,109 - INFO - Going to convert document batch...
2025-11-14 15:58:19,109 - INFO - Processing document 4_2024-04-01
2025-11-14 15:58:19,131 - INFO - Finished converting document 4_2024-04-01 in 0.03 sec.
2025-11-14 15:58:19,177 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:19,185 - INFO - Going to convert document batch...
2025-11-14 15:58:19,185 - INFO - Processing document 4_2024-04-02
2025-11-14 15:58:19,201 - INFO - Finished converting document 4_2024-04-02 in 0.05 sec.
2025-11-14 15:58:19,232 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:19,239 - INFO - Going to convert document batch...
2025-11-14 15:58:19,239 - INFO - Processing document 4_2024-04-17
2025-11-14 15:58:19,257 - IN

Converted 'data\edgar_documents\CMCSA\4_2024-03-19' --> 'data\processed_data\CMCSA\4_2024-03-19.md'
Converted 'data\edgar_documents\CMCSA\4_2024-04-01' --> 'data\processed_data\CMCSA\4_2024-04-01.md'
Converted 'data\edgar_documents\CMCSA\4_2024-04-02' --> 'data\processed_data\CMCSA\4_2024-04-02.md'
Converted 'data\edgar_documents\CMCSA\4_2024-04-17' --> 'data\processed_data\CMCSA\4_2024-04-17.md'


2025-11-14 15:58:19,293 - INFO - Going to convert document batch...
2025-11-14 15:58:19,294 - INFO - Processing document 4_2024-05-13
2025-11-14 15:58:19,312 - INFO - Finished converting document 4_2024-05-13 in 0.03 sec.
2025-11-14 15:58:19,347 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:58:19,348 - ERROR - Input document 4_2024-05-21 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 15:58:19,349 - INFO - Going to convert document batch...
2025-11-14 15:58:19,359 - IN

Converted 'data\edgar_documents\CMCSA\4_2024-05-13' --> 'data\processed_data\CMCSA\4_2024-05-13.md'
Error processing data\edgar_documents\CMCSA\4_2024-05-21: File format not allowed: data\edgar_documents\CMCSA\4_2024-05-21
Converted 'data\edgar_documents\CMCSA\4_2024-05-23' --> 'data\processed_data\CMCSA\4_2024-05-23.md'
Converted 'data\edgar_documents\CMCSA\4_2024-06-07' --> 'data\processed_data\CMCSA\4_2024-06-07.md'


2025-11-14 15:58:19,516 - INFO - Processing document 4_2024-06-20
2025-11-14 15:58:19,535 - INFO - Finished converting document 4_2024-06-20 in 0.05 sec.
2025-11-14 15:58:19,566 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:19,573 - INFO - Going to convert document batch...
2025-11-14 15:58:19,574 - INFO - Processing document 4_2024-07-01
2025-11-14 15:58:19,589 - INFO - Finished converting document 4_2024-07-01 in 0.05 sec.
2025-11-14 15:58:19,632 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:19,644 - INFO - Going to convert document batch...
2025-11-14 15:58:19,644 - INFO - Processing document 4_2024-09-18
2025-11-14 15:58:19,661 - INFO - Finished converting document 4_2024-09-18 in 0.05 sec.
2025-11-14 15:58:19,698 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:58:19,699 - ERROR - Input document 4_2024-09-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>

Converted 'data\edgar_documents\CMCSA\4_2024-06-20' --> 'data\processed_data\CMCSA\4_2024-06-20.md'
Converted 'data\edgar_documents\CMCSA\4_2024-07-01' --> 'data\processed_data\CMCSA\4_2024-07-01.md'
Converted 'data\edgar_documents\CMCSA\4_2024-09-18' --> 'data\processed_data\CMCSA\4_2024-09-18.md'
Error processing data\edgar_documents\CMCSA\4_2024-09-23: File format not allowed: data\edgar_documents\CMCSA\4_2024-09-23
Error processing data\edgar_documents\CMCSA\4_2024-09-25: File format not allowed: data\edgar_documents\CMCSA\4_2024-09-25


2025-11-14 15:58:19,730 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:19,739 - INFO - Going to convert document batch...
2025-11-14 15:58:19,740 - INFO - Processing document 4_2024-10-01
2025-11-14 15:58:19,778 - INFO - Finished converting document 4_2024-10-01 in 0.06 sec.
2025-11-14 15:58:19,813 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:19,821 - INFO - Going to convert document batch...
2025-11-14 15:58:19,822 - INFO - Processing document 4_2024-11-05
2025-11-14 15:58:19,839 - INFO - Finished converting document 4_2024-11-05 in 0.05 sec.
2025-11-14 15:58:19,893 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:19,906 - INFO - Going to convert document batch...
2025-11-14 15:58:19,907 - INFO - Processing document 4_2024-11-07
2025-11-14 15:58:19,929 - INFO - Finished converting document 4_2024-11-07 in 0.06 sec.
2025-11-14 15:58:19,960 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:

Converted 'data\edgar_documents\CMCSA\4_2024-10-01' --> 'data\processed_data\CMCSA\4_2024-10-01.md'
Converted 'data\edgar_documents\CMCSA\4_2024-11-05' --> 'data\processed_data\CMCSA\4_2024-11-05.md'
Converted 'data\edgar_documents\CMCSA\4_2024-11-07' --> 'data\processed_data\CMCSA\4_2024-11-07.md'


2025-11-14 15:58:20,013 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:20,020 - INFO - Going to convert document batch...
2025-11-14 15:58:20,021 - INFO - Processing document 4_2024-11-25
2025-11-14 15:58:20,038 - INFO - Finished converting document 4_2024-11-25 in 0.03 sec.
2025-11-14 15:58:20,081 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:20,096 - INFO - Going to convert document batch...
2025-11-14 15:58:20,097 - INFO - Processing document 4_2024-11-29
2025-11-14 15:58:20,115 - INFO - Finished converting document 4_2024-11-29 in 0.06 sec.
2025-11-14 15:58:20,144 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:20,151 - INFO - Going to convert document batch...
2025-11-14 15:58:20,153 - INFO - Processing document 4_2024-12-03
2025-11-14 15:58:20,170 - INFO - Finished converting document 4_2024-12-03 in 0.05 sec.
2025-11-14 15:58:20,201 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\4_2024-11-22' --> 'data\processed_data\CMCSA\4_2024-11-22.md'
Converted 'data\edgar_documents\CMCSA\4_2024-11-25' --> 'data\processed_data\CMCSA\4_2024-11-25.md'
Converted 'data\edgar_documents\CMCSA\4_2024-11-29' --> 'data\processed_data\CMCSA\4_2024-11-29.md'
Converted 'data\edgar_documents\CMCSA\4_2024-12-03' --> 'data\processed_data\CMCSA\4_2024-12-03.md'


2025-11-14 15:58:20,207 - INFO - Going to convert document batch...
2025-11-14 15:58:20,209 - INFO - Processing document 4_2025-01-03
2025-11-14 15:58:20,225 - INFO - Finished converting document 4_2025-01-03 in 0.03 sec.
2025-11-14 15:58:20,254 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:20,264 - INFO - Going to convert document batch...
2025-11-14 15:58:20,264 - INFO - Processing document 4_2025-01-06
2025-11-14 15:58:20,288 - INFO - Finished converting document 4_2025-01-06 in 0.05 sec.
2025-11-14 15:58:20,321 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:20,329 - INFO - Going to convert document batch...
2025-11-14 15:58:20,330 - INFO - Processing document 4_2025-01-15
2025-11-14 15:58:20,349 - INFO - Finished converting document 4_2025-01-15 in 0.03 sec.
2025-11-14 15:58:20,394 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:20,404 - INFO - Going to convert document batch...
2025-11-14 15:58:20,404 - 

Converted 'data\edgar_documents\CMCSA\4_2025-01-03' --> 'data\processed_data\CMCSA\4_2025-01-03.md'
Converted 'data\edgar_documents\CMCSA\4_2025-01-06' --> 'data\processed_data\CMCSA\4_2025-01-06.md'
Converted 'data\edgar_documents\CMCSA\4_2025-01-15' --> 'data\processed_data\CMCSA\4_2025-01-15.md'


2025-11-14 15:58:20,452 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:20,463 - INFO - Going to convert document batch...
2025-11-14 15:58:20,464 - INFO - Processing document 4_2025-03-04
2025-11-14 15:58:20,485 - INFO - Finished converting document 4_2025-03-04 in 0.05 sec.
2025-11-14 15:58:20,516 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:20,525 - INFO - Going to convert document batch...
2025-11-14 15:58:20,526 - INFO - Processing document 4_2025-03-07
2025-11-14 15:58:20,546 - INFO - Finished converting document 4_2025-03-07 in 0.05 sec.
2025-11-14 15:58:20,578 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:20,585 - INFO - Going to convert document batch...
2025-11-14 15:58:20,586 - INFO - Processing document 4_2025-03-10
2025-11-14 15:58:20,602 - INFO - Finished converting document 4_2025-03-10 in 0.03 sec.
2025-11-14 15:58:20,630 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\4_2025-02-27' --> 'data\processed_data\CMCSA\4_2025-02-27.md'
Converted 'data\edgar_documents\CMCSA\4_2025-03-04' --> 'data\processed_data\CMCSA\4_2025-03-04.md'
Converted 'data\edgar_documents\CMCSA\4_2025-03-07' --> 'data\processed_data\CMCSA\4_2025-03-07.md'
Converted 'data\edgar_documents\CMCSA\4_2025-03-10' --> 'data\processed_data\CMCSA\4_2025-03-10.md'


2025-11-14 15:58:20,636 - INFO - Going to convert document batch...
2025-11-14 15:58:20,637 - INFO - Processing document 4_2025-03-19
2025-11-14 15:58:20,654 - INFO - Finished converting document 4_2025-03-19 in 0.03 sec.
2025-11-14 15:58:20,686 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:20,694 - INFO - Going to convert document batch...
2025-11-14 15:58:20,695 - INFO - Processing document 4_2025-04-02
2025-11-14 15:58:20,712 - INFO - Finished converting document 4_2025-04-02 in 0.03 sec.
2025-11-14 15:58:20,749 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 15:58:20,750 - ERROR - Input document 4_2025-05-06 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <Input

Converted 'data\edgar_documents\CMCSA\4_2025-03-19' --> 'data\processed_data\CMCSA\4_2025-03-19.md'
Converted 'data\edgar_documents\CMCSA\4_2025-04-02' --> 'data\processed_data\CMCSA\4_2025-04-02.md'
Error processing data\edgar_documents\CMCSA\4_2025-05-06: File format not allowed: data\edgar_documents\CMCSA\4_2025-05-06
Converted 'data\edgar_documents\CMCSA\4_2025-05-07' --> 'data\processed_data\CMCSA\4_2025-05-07.md'
Converted 'data\edgar_documents\CMCSA\4_2025-05-15' --> 'data\processed_data\CMCSA\4_2025-05-15.md'


2025-11-14 15:58:20,881 - INFO - Going to convert document batch...
2025-11-14 15:58:20,882 - INFO - Processing document 4_2025-05-23
2025-11-14 15:58:20,901 - INFO - Finished converting document 4_2025-05-23 in 0.05 sec.
2025-11-14 15:58:20,933 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:20,941 - INFO - Going to convert document batch...
2025-11-14 15:58:20,942 - INFO - Processing document 4_2025-06-06


Converted 'data\edgar_documents\CMCSA\4_2025-05-23' --> 'data\processed_data\CMCSA\4_2025-05-23.md'


2025-11-14 15:58:21,160 - INFO - Finished converting document 4_2025-06-06 in 0.23 sec.
2025-11-14 15:58:21,191 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:21,199 - INFO - Going to convert document batch...
2025-11-14 15:58:21,199 - INFO - Processing document 4_2025-06-20
2025-11-14 15:58:21,217 - INFO - Finished converting document 4_2025-06-20 in 0.05 sec.
2025-11-14 15:58:21,262 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:21,270 - INFO - Going to convert document batch...
2025-11-14 15:58:21,271 - INFO - Processing document 4_2025-07-02
2025-11-14 15:58:21,288 - INFO - Finished converting document 4_2025-07-02 in 0.05 sec.
2025-11-14 15:58:21,319 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:21,331 - INFO - Going to convert document batch...
2025-11-14 15:58:21,331 - INFO - Processing document 4_2025-08-07
2025-11-14 15:58:21,358 - INFO - Finished converting document 4_2025-08-07 in 0.05 sec.


Converted 'data\edgar_documents\CMCSA\4_2025-06-06' --> 'data\processed_data\CMCSA\4_2025-06-06.md'
Converted 'data\edgar_documents\CMCSA\4_2025-06-20' --> 'data\processed_data\CMCSA\4_2025-06-20.md'
Converted 'data\edgar_documents\CMCSA\4_2025-07-02' --> 'data\processed_data\CMCSA\4_2025-07-02.md'


2025-11-14 15:58:21,394 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:21,404 - INFO - Going to convert document batch...
2025-11-14 15:58:21,405 - INFO - Processing document 4_2025-08-21
2025-11-14 15:58:21,422 - INFO - Finished converting document 4_2025-08-21 in 0.05 sec.
2025-11-14 15:58:21,451 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:21,457 - INFO - Going to convert document batch...
2025-11-14 15:58:21,458 - INFO - Processing document 4_2025-09-04
2025-11-14 15:58:21,475 - INFO - Finished converting document 4_2025-09-04 in 0.03 sec.
2025-11-14 15:58:21,504 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:21,512 - INFO - Going to convert document batch...
2025-11-14 15:58:21,513 - INFO - Processing document 4_2025-10-02
2025-11-14 15:58:21,530 - INFO - Finished converting document 4_2025-10-02 in 0.05 sec.
2025-11-14 15:58:21,557 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\4_2025-08-07' --> 'data\processed_data\CMCSA\4_2025-08-07.md'
Converted 'data\edgar_documents\CMCSA\4_2025-08-21' --> 'data\processed_data\CMCSA\4_2025-08-21.md'
Converted 'data\edgar_documents\CMCSA\4_2025-09-04' --> 'data\processed_data\CMCSA\4_2025-09-04.md'
Converted 'data\edgar_documents\CMCSA\4_2025-10-02' --> 'data\processed_data\CMCSA\4_2025-10-02.md'


2025-11-14 15:58:21,567 - INFO - Going to convert document batch...
2025-11-14 15:58:21,568 - INFO - Processing document 4_2025-11-05
2025-11-14 15:58:21,604 - INFO - Finished converting document 4_2025-11-05 in 0.05 sec.
2025-11-14 15:58:21,649 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:21,664 - INFO - Going to convert document batch...
2025-11-14 15:58:21,664 - INFO - Processing document 8-K_2023-01-06
2025-11-14 15:58:21,693 - INFO - Finished converting document 8-K_2023-01-06 in 0.06 sec.
2025-11-14 15:58:21,724 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:21,741 - INFO - Going to convert document batch...
2025-11-14 15:58:21,741 - INFO - Processing document 8-K_2023-01-26
2025-11-14 15:58:21,765 - INFO - Finished converting document 8-K_2023-01-26 in 0.06 sec.
2025-11-14 15:58:21,795 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:21,810 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CMCSA\4_2025-11-05' --> 'data\processed_data\CMCSA\4_2025-11-05.md'
Converted 'data\edgar_documents\CMCSA\8-K_2023-01-06' --> 'data\processed_data\CMCSA\8-K_2023-01-06.md'
Converted 'data\edgar_documents\CMCSA\8-K_2023-01-26' --> 'data\processed_data\CMCSA\8-K_2023-01-26.md'


2025-11-14 15:58:21,811 - INFO - Processing document 8-K_2023-02-09
2025-11-14 15:58:21,834 - INFO - Finished converting document 8-K_2023-02-09 in 0.05 sec.
2025-11-14 15:58:21,860 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:21,878 - INFO - Going to convert document batch...
2025-11-14 15:58:21,879 - INFO - Processing document 8-K_2023-03-13
2025-11-14 15:58:21,904 - INFO - Finished converting document 8-K_2023-03-13 in 0.06 sec.
2025-11-14 15:58:21,970 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:21,995 - INFO - Going to convert document batch...
2025-11-14 15:58:21,995 - INFO - Processing document 8-K_2023-03-15
2025-11-14 15:58:22,018 - INFO - Finished converting document 8-K_2023-03-15 in 0.09 sec.
2025-11-14 15:58:22,046 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\8-K_2023-02-09' --> 'data\processed_data\CMCSA\8-K_2023-02-09.md'
Converted 'data\edgar_documents\CMCSA\8-K_2023-03-13' --> 'data\processed_data\CMCSA\8-K_2023-03-13.md'
Converted 'data\edgar_documents\CMCSA\8-K_2023-03-15' --> 'data\processed_data\CMCSA\8-K_2023-03-15.md'


2025-11-14 15:58:22,059 - INFO - Going to convert document batch...
2025-11-14 15:58:22,060 - INFO - Processing document 8-K_2023-04-21
2025-11-14 15:58:22,079 - INFO - Finished converting document 8-K_2023-04-21 in 0.05 sec.
2025-11-14 15:58:22,105 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:22,118 - INFO - Going to convert document batch...
2025-11-14 15:58:22,118 - INFO - Processing document 8-K_2023-04-24
2025-11-14 15:58:22,138 - INFO - Finished converting document 8-K_2023-04-24 in 0.05 sec.
2025-11-14 15:58:22,165 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:22,181 - INFO - Going to convert document batch...
2025-11-14 15:58:22,181 - INFO - Processing document 8-K_2023-04-27
2025-11-14 15:58:22,205 - INFO - Finished converting document 8-K_2023-04-27 in 0.05 sec.
2025-11-14 15:58:22,235 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:22,248 - INFO - Going to convert document batch...
2025-11-14 15:

Converted 'data\edgar_documents\CMCSA\8-K_2023-04-21' --> 'data\processed_data\CMCSA\8-K_2023-04-21.md'
Converted 'data\edgar_documents\CMCSA\8-K_2023-04-24' --> 'data\processed_data\CMCSA\8-K_2023-04-24.md'
Converted 'data\edgar_documents\CMCSA\8-K_2023-04-27' --> 'data\processed_data\CMCSA\8-K_2023-04-27.md'
Converted 'data\edgar_documents\CMCSA\8-K_2023-05-01' --> 'data\processed_data\CMCSA\8-K_2023-05-01.md'


2025-11-14 15:58:22,311 - INFO - Going to convert document batch...
2025-11-14 15:58:22,311 - INFO - Processing document 8-K_2023-05-08
2025-11-14 15:58:22,335 - INFO - Finished converting document 8-K_2023-05-08 in 0.05 sec.
2025-11-14 15:58:22,364 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:22,378 - INFO - Going to convert document batch...
2025-11-14 15:58:22,378 - INFO - Processing document 8-K_2023-05-09
2025-11-14 15:58:22,405 - INFO - Finished converting document 8-K_2023-05-09 in 0.06 sec.
2025-11-14 15:58:22,437 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:22,461 - INFO - Going to convert document batch...
2025-11-14 15:58:22,462 - INFO - Processing document 8-K_2023-06-09
2025-11-14 15:58:22,524 - INFO - Finished converting document 8-K_2023-06-09 in 0.09 sec.


Converted 'data\edgar_documents\CMCSA\8-K_2023-05-08' --> 'data\processed_data\CMCSA\8-K_2023-05-08.md'
Converted 'data\edgar_documents\CMCSA\8-K_2023-05-09' --> 'data\processed_data\CMCSA\8-K_2023-05-09.md'


2025-11-14 15:58:22,569 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:22,587 - INFO - Going to convert document batch...
2025-11-14 15:58:22,588 - INFO - Processing document 8-K_2023-07-27
2025-11-14 15:58:22,613 - INFO - Finished converting document 8-K_2023-07-27 in 0.06 sec.
2025-11-14 15:58:22,643 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:22,657 - INFO - Going to convert document batch...
2025-11-14 15:58:22,658 - INFO - Processing document 8-K_2023-09-11
2025-11-14 15:58:22,681 - INFO - Finished converting document 8-K_2023-09-11 in 0.05 sec.
2025-11-14 15:58:22,733 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\8-K_2023-06-09' --> 'data\processed_data\CMCSA\8-K_2023-06-09.md'
Converted 'data\edgar_documents\CMCSA\8-K_2023-07-27' --> 'data\processed_data\CMCSA\8-K_2023-07-27.md'
Converted 'data\edgar_documents\CMCSA\8-K_2023-09-11' --> 'data\processed_data\CMCSA\8-K_2023-09-11.md'


2025-11-14 15:58:22,755 - INFO - Going to convert document batch...
2025-11-14 15:58:22,756 - INFO - Processing document 8-K_2023-10-03
2025-11-14 15:58:22,780 - INFO - Finished converting document 8-K_2023-10-03 in 0.08 sec.
2025-11-14 15:58:22,811 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:22,827 - INFO - Going to convert document batch...
2025-11-14 15:58:22,828 - INFO - Processing document 8-K_2023-10-26
2025-11-14 15:58:22,851 - INFO - Finished converting document 8-K_2023-10-26 in 0.05 sec.
2025-11-14 15:58:22,881 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:22,896 - INFO - Going to convert document batch...
2025-11-14 15:58:22,896 - INFO - Processing document 8-K_2023-12-06
2025-11-14 15:58:22,921 - INFO - Finished converting document 8-K_2023-12-06 in 0.06 sec.
2025-11-14 15:58:22,970 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:22,993 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CMCSA\8-K_2023-10-03' --> 'data\processed_data\CMCSA\8-K_2023-10-03.md'
Converted 'data\edgar_documents\CMCSA\8-K_2023-10-26' --> 'data\processed_data\CMCSA\8-K_2023-10-26.md'
Converted 'data\edgar_documents\CMCSA\8-K_2023-12-06' --> 'data\processed_data\CMCSA\8-K_2023-12-06.md'


2025-11-14 15:58:22,994 - INFO - Processing document 8-K_2024-01-25
2025-11-14 15:58:23,028 - INFO - Finished converting document 8-K_2024-01-25 in 0.09 sec.
2025-11-14 15:58:23,077 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:23,090 - INFO - Going to convert document batch...
2025-11-14 15:58:23,091 - INFO - Processing document 8-K_2024-04-15
2025-11-14 15:58:23,112 - INFO - Finished converting document 8-K_2024-04-15 in 0.05 sec.
2025-11-14 15:58:23,142 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:23,155 - INFO - Going to convert document batch...
2025-11-14 15:58:23,157 - INFO - Processing document 8-K_2024-04-25
2025-11-14 15:58:23,181 - INFO - Finished converting document 8-K_2024-04-25 in 0.05 sec.
2025-11-14 15:58:23,212 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:23,226 - INFO - Going to convert document batch...
2025-11-14 15:58:23,227 - INFO - Processing document 8-K_2024-05-17
2025-11-14 15:

Converted 'data\edgar_documents\CMCSA\8-K_2024-01-25' --> 'data\processed_data\CMCSA\8-K_2024-01-25.md'
Converted 'data\edgar_documents\CMCSA\8-K_2024-04-15' --> 'data\processed_data\CMCSA\8-K_2024-04-15.md'
Converted 'data\edgar_documents\CMCSA\8-K_2024-04-25' --> 'data\processed_data\CMCSA\8-K_2024-04-25.md'


2025-11-14 15:58:23,286 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:23,300 - INFO - Going to convert document batch...
2025-11-14 15:58:23,301 - INFO - Processing document 8-K_2024-05-22
2025-11-14 15:58:23,323 - INFO - Finished converting document 8-K_2024-05-22 in 0.06 sec.
2025-11-14 15:58:23,367 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:23,396 - INFO - Going to convert document batch...
2025-11-14 15:58:23,397 - INFO - Processing document 8-K_2024-06-12
2025-11-14 15:58:23,434 - INFO - Finished converting document 8-K_2024-06-12 in 0.11 sec.


Converted 'data\edgar_documents\CMCSA\8-K_2024-05-17' --> 'data\processed_data\CMCSA\8-K_2024-05-17.md'
Converted 'data\edgar_documents\CMCSA\8-K_2024-05-22' --> 'data\processed_data\CMCSA\8-K_2024-05-22.md'


2025-11-14 15:58:23,466 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:23,480 - INFO - Going to convert document batch...
2025-11-14 15:58:23,481 - INFO - Processing document 8-K_2024-07-23
2025-11-14 15:58:23,507 - INFO - Finished converting document 8-K_2024-07-23 in 0.05 sec.
2025-11-14 15:58:23,554 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:23,566 - INFO - Going to convert document batch...
2025-11-14 15:58:23,567 - INFO - Processing document 8-K_2024-09-23
2025-11-14 15:58:23,583 - INFO - Finished converting document 8-K_2024-09-23 in 0.06 sec.
2025-11-14 15:58:23,605 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:23,618 - INFO - Going to convert document batch...
2025-11-14 15:58:23,618 - INFO - Processing document 8-K_2024-09-26
2025-11-14 15:58:23,638 - INFO - Finished converting document 8-K_2024-09-26 in 0.05 sec.


Converted 'data\edgar_documents\CMCSA\8-K_2024-06-12' --> 'data\processed_data\CMCSA\8-K_2024-06-12.md'
Converted 'data\edgar_documents\CMCSA\8-K_2024-07-23' --> 'data\processed_data\CMCSA\8-K_2024-07-23.md'
Converted 'data\edgar_documents\CMCSA\8-K_2024-09-23' --> 'data\processed_data\CMCSA\8-K_2024-09-23.md'


2025-11-14 15:58:23,663 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:23,679 - INFO - Going to convert document batch...
2025-11-14 15:58:23,679 - INFO - Processing document 8-K_2024-10-31
2025-11-14 15:58:23,705 - INFO - Finished converting document 8-K_2024-10-31 in 0.06 sec.
2025-11-14 15:58:23,735 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:23,750 - INFO - Going to convert document batch...
2025-11-14 15:58:23,750 - INFO - Processing document 8-K_2025-01-30
2025-11-14 15:58:23,774 - INFO - Finished converting document 8-K_2025-01-30 in 0.05 sec.
2025-11-14 15:58:23,804 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:23,819 - INFO - Going to convert document batch...
2025-11-14 15:58:23,820 - INFO - Processing document 8-K_2025-03-19


Converted 'data\edgar_documents\CMCSA\8-K_2024-09-26' --> 'data\processed_data\CMCSA\8-K_2024-09-26.md'
Converted 'data\edgar_documents\CMCSA\8-K_2024-10-31' --> 'data\processed_data\CMCSA\8-K_2024-10-31.md'
Converted 'data\edgar_documents\CMCSA\8-K_2025-01-30' --> 'data\processed_data\CMCSA\8-K_2025-01-30.md'


2025-11-14 15:58:24,046 - INFO - Finished converting document 8-K_2025-03-19 in 0.25 sec.
2025-11-14 15:58:24,075 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:24,088 - INFO - Going to convert document batch...
2025-11-14 15:58:24,089 - INFO - Processing document 8-K_2025-04-24
2025-11-14 15:58:24,114 - INFO - Finished converting document 8-K_2025-04-24 in 0.05 sec.
2025-11-14 15:58:24,144 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:24,157 - INFO - Going to convert document batch...
2025-11-14 15:58:24,158 - INFO - Processing document 8-K_2025-05-05
2025-11-14 15:58:24,177 - INFO - Finished converting document 8-K_2025-05-05 in 0.05 sec.
2025-11-14 15:58:24,197 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:24,210 - INFO - Going to convert document batch...
2025-11-14 15:58:24,211 - INFO - Processing document 8-K_2025-05-08
2025-11-14 15:58:24,232 - INFO - Finished converting document 8-K_2025-05-08 in 0.

Converted 'data\edgar_documents\CMCSA\8-K_2025-03-19' --> 'data\processed_data\CMCSA\8-K_2025-03-19.md'
Converted 'data\edgar_documents\CMCSA\8-K_2025-04-24' --> 'data\processed_data\CMCSA\8-K_2025-04-24.md'
Converted 'data\edgar_documents\CMCSA\8-K_2025-05-05' --> 'data\processed_data\CMCSA\8-K_2025-05-05.md'
Converted 'data\edgar_documents\CMCSA\8-K_2025-05-08' --> 'data\processed_data\CMCSA\8-K_2025-05-08.md'


2025-11-14 15:58:24,280 - INFO - Going to convert document batch...
2025-11-14 15:58:24,280 - INFO - Processing document 8-K_2025-06-20
2025-11-14 15:58:24,323 - INFO - Finished converting document 8-K_2025-06-20 in 0.09 sec.
2025-11-14 15:58:24,360 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:24,374 - INFO - Going to convert document batch...
2025-11-14 15:58:24,374 - INFO - Processing document 8-K_2025-07-31
2025-11-14 15:58:24,400 - INFO - Finished converting document 8-K_2025-07-31 in 0.05 sec.
2025-11-14 15:58:24,431 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:24,449 - INFO - Going to convert document batch...
2025-11-14 15:58:24,450 - INFO - Processing document 8-K_2025-08-22
2025-11-14 15:58:24,474 - INFO - Finished converting document 8-K_2025-08-22 in 0.05 sec.
2025-11-14 15:58:24,501 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:24,514 - INFO - Going to convert document batch...
2025-11-14 15:

Converted 'data\edgar_documents\CMCSA\8-K_2025-06-20' --> 'data\processed_data\CMCSA\8-K_2025-06-20.md'
Converted 'data\edgar_documents\CMCSA\8-K_2025-07-31' --> 'data\processed_data\CMCSA\8-K_2025-07-31.md'
Converted 'data\edgar_documents\CMCSA\8-K_2025-08-22' --> 'data\processed_data\CMCSA\8-K_2025-08-22.md'


2025-11-14 15:58:24,539 - INFO - Finished converting document 8-K_2025-09-22 in 0.05 sec.
2025-11-14 15:58:24,568 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:24,610 - INFO - Going to convert document batch...
2025-11-14 15:58:24,612 - INFO - Processing document 8-K_2025-09-26
2025-11-14 15:58:24,641 - INFO - Finished converting document 8-K_2025-09-26 in 0.09 sec.
2025-11-14 15:58:24,668 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:24,682 - INFO - Going to convert document batch...
2025-11-14 15:58:24,682 - INFO - Processing document 8-K_2025-09-29
2025-11-14 15:58:24,705 - INFO - Finished converting document 8-K_2025-09-29 in 0.05 sec.
2025-11-14 15:58:24,735 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\8-K_2025-09-22' --> 'data\processed_data\CMCSA\8-K_2025-09-22.md'
Converted 'data\edgar_documents\CMCSA\8-K_2025-09-26' --> 'data\processed_data\CMCSA\8-K_2025-09-26.md'
Converted 'data\edgar_documents\CMCSA\8-K_2025-09-29' --> 'data\processed_data\CMCSA\8-K_2025-09-29.md'


2025-11-14 15:58:24,749 - INFO - Going to convert document batch...
2025-11-14 15:58:24,751 - INFO - Processing document 8-K_2025-10-01
2025-11-14 15:58:24,777 - INFO - Finished converting document 8-K_2025-10-01 in 0.06 sec.
2025-11-14 15:58:24,827 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:24,847 - INFO - Going to convert document batch...
2025-11-14 15:58:24,848 - INFO - Processing document 8-K_2025-10-02
2025-11-14 15:58:24,875 - INFO - Finished converting document 8-K_2025-10-02 in 0.08 sec.
2025-11-14 15:58:24,927 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:24,946 - INFO - Going to convert document batch...
2025-11-14 15:58:24,947 - INFO - Processing document 8-K_2025-10-06
2025-11-14 15:58:24,971 - INFO - Finished converting document 8-K_2025-10-06 in 0.08 sec.
2025-11-14 15:58:24,999 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\8-K_2025-10-01' --> 'data\processed_data\CMCSA\8-K_2025-10-01.md'
Converted 'data\edgar_documents\CMCSA\8-K_2025-10-02' --> 'data\processed_data\CMCSA\8-K_2025-10-02.md'
Converted 'data\edgar_documents\CMCSA\8-K_2025-10-06' --> 'data\processed_data\CMCSA\8-K_2025-10-06.md'


2025-11-14 15:58:25,013 - INFO - Going to convert document batch...
2025-11-14 15:58:25,014 - INFO - Processing document 8-K_2025-10-08
2025-11-14 15:58:25,039 - INFO - Finished converting document 8-K_2025-10-08 in 0.05 sec.
2025-11-14 15:58:25,069 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:25,083 - INFO - Going to convert document batch...
2025-11-14 15:58:25,083 - INFO - Processing document 8-K_2025-10-09
2025-11-14 15:58:25,112 - INFO - Finished converting document 8-K_2025-10-09 in 0.06 sec.
2025-11-14 15:58:25,162 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:25,180 - INFO - Going to convert document batch...
2025-11-14 15:58:25,181 - INFO - Processing document 8-K_2025-10-30
2025-11-14 15:58:25,205 - INFO - Finished converting document 8-K_2025-10-30 in 0.08 sec.


Converted 'data\edgar_documents\CMCSA\8-K_2025-10-08' --> 'data\processed_data\CMCSA\8-K_2025-10-08.md'
Converted 'data\edgar_documents\CMCSA\8-K_2025-10-09' --> 'data\processed_data\CMCSA\8-K_2025-10-09.md'
Converted 'data\edgar_documents\CMCSA\8-K_2025-10-30' --> 'data\processed_data\CMCSA\8-K_2025-10-30.md'


2025-11-14 15:58:25,255 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:58:25,872 - INFO - Going to convert document batch...
2025-11-14 15:58:25,874 - INFO - Processing document DEF-14A_2023-04-28
2025-11-14 15:58:32,164 - INFO - Finished converting document DEF-14A_2023-04-28 in 6.94 sec.
2025-11-14 15:58:33,155 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\DEF-14A_2023-04-28' --> 'data\processed_data\CMCSA\DEF-14A_2023-04-28.md'


2025-11-14 15:58:33,678 - INFO - Going to convert document batch...
2025-11-14 15:58:33,679 - INFO - Processing document DEF-14A_2024-04-26
2025-11-14 15:58:38,579 - INFO - Finished converting document DEF-14A_2024-04-26 in 5.50 sec.
2025-11-14 15:58:39,267 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\DEF-14A_2024-04-26' --> 'data\processed_data\CMCSA\DEF-14A_2024-04-26.md'


2025-11-14 15:58:39,683 - INFO - Going to convert document batch...
2025-11-14 15:58:39,683 - INFO - Processing document DEF-14A_2025-04-25
2025-11-14 15:58:46,691 - INFO - Finished converting document DEF-14A_2025-04-25 in 7.45 sec.
2025-11-14 15:58:47,768 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CMCSA\DEF-14A_2025-04-25' --> 'data\processed_data\CMCSA\DEF-14A_2025-04-25.md'
Processed 134 new files. Errors: 7
Found 186 files to process in data\edgar_documents\COF


2025-11-14 15:58:49,953 - INFO - Going to convert document batch...
2025-11-14 15:58:49,953 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 15:58:49,954 - INFO - Processing document 10-K_2023-02-24
2025-11-14 15:59:04,935 - INFO - Finished converting document 10-K_2023-02-24 in 17.34 sec.


Converted 'data\edgar_documents\COF\10-K_2023-02-24' --> 'data\processed_data\COF\10-K_2023-02-24.md'


2025-11-14 15:59:09,692 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:59:15,242 - INFO - Going to convert document batch...
2025-11-14 15:59:15,244 - INFO - Processing document 10-K_2024-02-23
2025-11-14 15:59:30,339 - INFO - Finished converting document 10-K_2024-02-23 in 20.84 sec.


Converted 'data\edgar_documents\COF\10-K_2024-02-23' --> 'data\processed_data\COF\10-K_2024-02-23.md'


2025-11-14 15:59:34,989 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 15:59:39,181 - INFO - Going to convert document batch...
2025-11-14 15:59:39,182 - INFO - Processing document 10-K_2025-02-20
2025-11-14 15:59:55,743 - INFO - Finished converting document 10-K_2025-02-20 in 20.95 sec.
2025-11-14 16:00:01,008 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\10-K_2025-02-20' --> 'data\processed_data\COF\10-K_2025-02-20.md'


2025-11-14 16:00:07,347 - INFO - Going to convert document batch...
2025-11-14 16:00:07,348 - INFO - Processing document 10-Q_2023-05-05
2025-11-14 16:00:17,523 - INFO - Finished converting document 10-Q_2023-05-05 in 16.62 sec.
2025-11-14 16:00:21,420 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\10-Q_2023-05-05' --> 'data\processed_data\COF\10-Q_2023-05-05.md'


2025-11-14 16:00:23,836 - INFO - Going to convert document batch...
2025-11-14 16:00:23,837 - INFO - Processing document 10-Q_2023-07-27
2025-11-14 16:00:29,023 - INFO - Finished converting document 10-Q_2023-07-27 in 7.80 sec.
2025-11-14 16:00:31,025 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\10-Q_2023-07-27' --> 'data\processed_data\COF\10-Q_2023-07-27.md'


2025-11-14 16:00:33,840 - INFO - Going to convert document batch...
2025-11-14 16:00:33,841 - INFO - Processing document 10-Q_2023-11-02
2025-11-14 16:00:38,662 - INFO - Finished converting document 10-Q_2023-11-02 in 7.80 sec.
2025-11-14 16:00:40,682 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\10-Q_2023-11-02' --> 'data\processed_data\COF\10-Q_2023-11-02.md'


2025-11-14 16:00:42,976 - INFO - Going to convert document batch...
2025-11-14 16:00:42,977 - INFO - Processing document 10-Q_2024-05-02
2025-11-14 16:00:49,911 - INFO - Finished converting document 10-Q_2024-05-02 in 9.34 sec.


Converted 'data\edgar_documents\COF\10-Q_2024-05-02' --> 'data\processed_data\COF\10-Q_2024-05-02.md'


2025-11-14 16:00:54,536 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:01:02,359 - INFO - Going to convert document batch...
2025-11-14 16:01:02,360 - INFO - Processing document 10-Q_2024-08-01
2025-11-14 16:01:17,373 - INFO - Finished converting document 10-Q_2024-08-01 in 23.03 sec.


Converted 'data\edgar_documents\COF\10-Q_2024-08-01' --> 'data\processed_data\COF\10-Q_2024-08-01.md'


2025-11-14 16:01:22,639 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:01:30,995 - INFO - Going to convert document batch...
2025-11-14 16:01:30,998 - INFO - Processing document 10-Q_2024-10-31
2025-11-14 16:01:44,426 - INFO - Finished converting document 10-Q_2024-10-31 in 21.97 sec.
2025-11-14 16:01:49,723 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\10-Q_2024-10-31' --> 'data\processed_data\COF\10-Q_2024-10-31.md'


2025-11-14 16:01:55,396 - INFO - Going to convert document batch...
2025-11-14 16:01:55,397 - INFO - Processing document 10-Q_2025-05-07
2025-11-14 16:01:59,481 - INFO - Finished converting document 10-Q_2025-05-07 in 9.89 sec.
2025-11-14 16:02:02,447 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\10-Q_2025-05-07' --> 'data\processed_data\COF\10-Q_2025-05-07.md'


2025-11-14 16:02:04,860 - INFO - Going to convert document batch...
2025-11-14 16:02:04,861 - INFO - Processing document 10-Q_2025-07-31
2025-11-14 16:02:13,233 - INFO - Finished converting document 10-Q_2025-07-31 in 10.98 sec.


Converted 'data\edgar_documents\COF\10-Q_2025-07-31' --> 'data\processed_data\COF\10-Q_2025-07-31.md'


2025-11-14 16:02:19,720 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:27,768 - INFO - Going to convert document batch...
2025-11-14 16:02:27,769 - INFO - Processing document 10-Q_2025-11-03
2025-11-14 16:02:44,022 - INFO - Finished converting document 10-Q_2025-11-03 in 24.50 sec.
2025-11-14 16:02:52,601 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:52,602 - ERROR - Input document 4_2023-01-25 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-1

Converted 'data\edgar_documents\COF\10-Q_2025-11-03' --> 'data\processed_data\COF\10-Q_2025-11-03.md'
Error processing data\edgar_documents\COF\4_2023-01-25: File format not allowed: data\edgar_documents\COF\4_2023-01-25
Error processing data\edgar_documents\COF\4_2023-01-26: File format not allowed: data\edgar_documents\COF\4_2023-01-26


2025-11-14 16:02:52,796 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:52,827 - INFO - Going to convert document batch...
2025-11-14 16:02:52,829 - INFO - Processing document 4_2023-02-02
2025-11-14 16:02:52,869 - INFO - Finished converting document 4_2023-02-02 in 0.08 sec.
2025-11-14 16:02:52,922 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:52,936 - INFO - Going to convert document batch...
2025-11-14 16:02:52,936 - INFO - Processing document 4_2023-02-16
2025-11-14 16:02:52,966 - INFO - Finished converting document 4_2023-02-16 in 0.06 sec.


Converted 'data\edgar_documents\COF\4_2023-01-30' --> 'data\processed_data\COF\4_2023-01-30.md'
Converted 'data\edgar_documents\COF\4_2023-02-02' --> 'data\processed_data\COF\4_2023-02-02.md'


2025-11-14 16:02:53,029 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:53,066 - INFO - Going to convert document batch...
2025-11-14 16:02:53,068 - INFO - Processing document 4_2023-02-17
2025-11-14 16:02:53,126 - INFO - Finished converting document 4_2023-02-17 in 0.11 sec.
2025-11-14 16:02:53,178 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:53,194 - INFO - Going to convert document batch...
2025-11-14 16:02:53,196 - INFO - Processing document 4_2023-03-03


Converted 'data\edgar_documents\COF\4_2023-02-16' --> 'data\processed_data\COF\4_2023-02-16.md'
Converted 'data\edgar_documents\COF\4_2023-02-17' --> 'data\processed_data\COF\4_2023-02-17.md'


2025-11-14 16:02:53,232 - INFO - Finished converting document 4_2023-03-03 in 0.08 sec.
2025-11-14 16:02:53,280 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:53,297 - INFO - Going to convert document batch...
2025-11-14 16:02:53,299 - INFO - Processing document 4_2023-05-08
2025-11-14 16:02:53,337 - INFO - Finished converting document 4_2023-05-08 in 0.06 sec.
2025-11-14 16:02:53,409 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:53,410 - ERROR - Input document 4_2023-06-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'js

Converted 'data\edgar_documents\COF\4_2023-03-03' --> 'data\processed_data\COF\4_2023-03-03.md'
Converted 'data\edgar_documents\COF\4_2023-05-08' --> 'data\processed_data\COF\4_2023-05-08.md'
Error processing data\edgar_documents\COF\4_2023-06-05: File format not allowed: data\edgar_documents\COF\4_2023-06-05
Error processing data\edgar_documents\COF\4_2023-06-06: File format not allowed: data\edgar_documents\COF\4_2023-06-06


2025-11-14 16:02:53,465 - INFO - Going to convert document batch...
2025-11-14 16:02:53,466 - INFO - Processing document 4_2023-07-20
2025-11-14 16:02:53,511 - INFO - Finished converting document 4_2023-07-20 in 0.08 sec.
2025-11-14 16:02:53,583 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:53,604 - INFO - Going to convert document batch...
2025-11-14 16:02:53,605 - INFO - Processing document 4_2023-07-26
2025-11-14 16:02:53,648 - INFO - Finished converting document 4_2023-07-26 in 0.08 sec.
2025-11-14 16:02:53,737 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:53,755 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COF\4_2023-07-20' --> 'data\processed_data\COF\4_2023-07-20.md'
Converted 'data\edgar_documents\COF\4_2023-07-26' --> 'data\processed_data\COF\4_2023-07-26.md'


2025-11-14 16:02:53,756 - INFO - Processing document 4_2023-07-27
2025-11-14 16:02:53,795 - INFO - Finished converting document 4_2023-07-27 in 0.09 sec.
2025-11-14 16:02:53,853 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:53,874 - INFO - Going to convert document batch...
2025-11-14 16:02:53,875 - INFO - Processing document 4_2023-07-28
2025-11-14 16:02:53,937 - INFO - Finished converting document 4_2023-07-28 in 0.11 sec.
2025-11-14 16:02:54,007 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:54,029 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COF\4_2023-07-27' --> 'data\processed_data\COF\4_2023-07-27.md'
Converted 'data\edgar_documents\COF\4_2023-07-28' --> 'data\processed_data\COF\4_2023-07-28.md'


2025-11-14 16:02:54,030 - INFO - Processing document 4_2023-08-01
2025-11-14 16:02:54,079 - INFO - Finished converting document 4_2023-08-01 in 0.09 sec.
2025-11-14 16:02:54,139 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:54,164 - INFO - Going to convert document batch...
2025-11-14 16:02:54,165 - INFO - Processing document 4_2023-08-03
2025-11-14 16:02:54,215 - INFO - Finished converting document 4_2023-08-03 in 0.09 sec.
2025-11-14 16:02:54,298 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:54,326 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COF\4_2023-08-01' --> 'data\processed_data\COF\4_2023-08-01.md'
Converted 'data\edgar_documents\COF\4_2023-08-03' --> 'data\processed_data\COF\4_2023-08-03.md'


2025-11-14 16:02:54,328 - INFO - Processing document 4_2023-08-04
2025-11-14 16:02:54,372 - INFO - Finished converting document 4_2023-08-04 in 0.11 sec.
2025-11-14 16:02:54,427 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:54,455 - INFO - Going to convert document batch...
2025-11-14 16:02:54,456 - INFO - Processing document 4_2023-08-08
2025-11-14 16:02:54,507 - INFO - Finished converting document 4_2023-08-08 in 0.09 sec.
2025-11-14 16:02:54,586 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\4_2023-08-04' --> 'data\processed_data\COF\4_2023-08-04.md'
Converted 'data\edgar_documents\COF\4_2023-08-08' --> 'data\processed_data\COF\4_2023-08-08.md'


2025-11-14 16:02:54,636 - INFO - Going to convert document batch...
2025-11-14 16:02:54,639 - INFO - Processing document 4_2023-08-11
2025-11-14 16:02:54,719 - INFO - Finished converting document 4_2023-08-11 in 0.16 sec.
2025-11-14 16:02:54,790 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:54,808 - INFO - Going to convert document batch...
2025-11-14 16:02:54,809 - INFO - Processing document 4_2023-08-15
2025-11-14 16:02:54,847 - INFO - Finished converting document 4_2023-08-15 in 0.08 sec.
2025-11-14 16:02:54,911 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:54,911 - ERROR - Input document 4_2023-10-27 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <Input

Converted 'data\edgar_documents\COF\4_2023-08-11' --> 'data\processed_data\COF\4_2023-08-11.md'
Converted 'data\edgar_documents\COF\4_2023-08-15' --> 'data\processed_data\COF\4_2023-08-15.md'
Error processing data\edgar_documents\COF\4_2023-10-27: File format not allowed: data\edgar_documents\COF\4_2023-10-27
Error processing data\edgar_documents\COF\4_2023-10-30: File format not allowed: data\edgar_documents\COF\4_2023-10-30


2025-11-14 16:02:54,973 - INFO - Going to convert document batch...
2025-11-14 16:02:54,974 - INFO - Processing document 4_2023-11-01
2025-11-14 16:02:55,055 - INFO - Finished converting document 4_2023-11-01 in 0.11 sec.
2025-11-14 16:02:55,128 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:55,165 - INFO - Going to convert document batch...
2025-11-14 16:02:55,166 - INFO - Processing document 4_2023-11-03
2025-11-14 16:02:55,277 - INFO - Finished converting document 4_2023-11-03 in 0.17 sec.


Converted 'data\edgar_documents\COF\4_2023-11-01' --> 'data\processed_data\COF\4_2023-11-01.md'


2025-11-14 16:02:55,386 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:55,422 - INFO - Going to convert document batch...
2025-11-14 16:02:55,423 - INFO - Processing document 4_2023-11-07
2025-11-14 16:02:55,512 - INFO - Finished converting document 4_2023-11-07 in 0.16 sec.


Converted 'data\edgar_documents\COF\4_2023-11-03' --> 'data\processed_data\COF\4_2023-11-03.md'


2025-11-14 16:02:55,592 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:55,614 - INFO - Going to convert document batch...
2025-11-14 16:02:55,615 - INFO - Processing document 4_2023-11-09
2025-11-14 16:02:55,676 - INFO - Finished converting document 4_2023-11-09 in 0.09 sec.
2025-11-14 16:02:55,762 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\4_2023-11-07' --> 'data\processed_data\COF\4_2023-11-07.md'
Converted 'data\edgar_documents\COF\4_2023-11-09' --> 'data\processed_data\COF\4_2023-11-09.md'


2025-11-14 16:02:55,812 - INFO - Going to convert document batch...
2025-11-14 16:02:55,813 - INFO - Processing document 4_2023-11-14
2025-11-14 16:02:55,870 - INFO - Finished converting document 4_2023-11-14 in 0.14 sec.
2025-11-14 16:02:55,939 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:55,957 - INFO - Going to convert document batch...
2025-11-14 16:02:55,958 - INFO - Processing document 4_2023-11-17
2025-11-14 16:02:55,996 - INFO - Finished converting document 4_2023-11-17 in 0.08 sec.
2025-11-14 16:02:56,067 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:56,084 - INFO - Going to convert document batch...
2025-11-14 16:02:56,086 - INFO - Processing document 4_2023-12-14
2025-11-14 16:02:56,127 - INFO - Finished converting document 4_2023-12-14 in 0.09 sec.


Converted 'data\edgar_documents\COF\4_2023-11-14' --> 'data\processed_data\COF\4_2023-11-14.md'
Converted 'data\edgar_documents\COF\4_2023-11-17' --> 'data\processed_data\COF\4_2023-11-17.md'


2025-11-14 16:02:56,191 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:56,224 - INFO - Going to convert document batch...
2025-11-14 16:02:56,226 - INFO - Processing document 4_2023-12-18
2025-11-14 16:02:56,294 - INFO - Finished converting document 4_2023-12-18 in 0.12 sec.


Converted 'data\edgar_documents\COF\4_2023-12-14' --> 'data\processed_data\COF\4_2023-12-14.md'
Converted 'data\edgar_documents\COF\4_2023-12-18' --> 'data\processed_data\COF\4_2023-12-18.md'


2025-11-14 16:02:56,383 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:56,384 - ERROR - Input document 4_2024-01-29 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:02:56,388 - INFO - Going to convert document batch...
2025-11-14 16:02:56,419 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:56,422 - ERROR - Input document 4_2024-01-30 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\COF\4_2024-01-29: File format not allowed: data\edgar_documents\COF\4_2024-01-29
Error processing data\edgar_documents\COF\4_2024-01-30: File format not allowed: data\edgar_documents\COF\4_2024-01-30


2025-11-14 16:02:56,613 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:56,645 - INFO - Going to convert document batch...
2025-11-14 16:02:56,647 - INFO - Processing document 4_2024-02-05
2025-11-14 16:02:56,692 - INFO - Finished converting document 4_2024-02-05 in 0.09 sec.
2025-11-14 16:02:56,760 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:56,761 - ERROR - Input document 4_2024-02-20 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:02

Converted 'data\edgar_documents\COF\4_2024-02-02' --> 'data\processed_data\COF\4_2024-02-02.md'
Converted 'data\edgar_documents\COF\4_2024-02-05' --> 'data\processed_data\COF\4_2024-02-05.md'
Error processing data\edgar_documents\COF\4_2024-02-20: File format not allowed: data\edgar_documents\COF\4_2024-02-20


2025-11-14 16:02:56,793 - ERROR - Input document 4_2024-02-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:02:56,795 - INFO - Going to convert document batch...
2025-11-14 16:02:56,813 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:56,815 - ERROR - Input document 4_2024-02-27 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\COF\4_2024-02-22: File format not allowed: data\edgar_documents\COF\4_2024-02-22
Error processing data\edgar_documents\COF\4_2024-02-27: File format not allowed: data\edgar_documents\COF\4_2024-02-27
Error processing data\edgar_documents\COF\4_2024-03-06: File format not allowed: data\edgar_documents\COF\4_2024-03-06
Error processing data\edgar_documents\COF\4_2024-03-11: File format not allowed: data\edgar_documents\COF\4_2024-03-11


2025-11-14 16:02:57,079 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:57,082 - ERROR - Input document 4_2024-03-21 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:02:57,085 - INFO - Going to convert document batch...
2025-11-14 16:02:57,112 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:57,135 - INFO - Going to convert document batch...
2025-11-14 16:02:57,138 - INFO - Processing document 4_2024-04-03
2025-11-14 16:02:57,210 - INFO - Fin

Converted 'data\edgar_documents\COF\4_2024-03-13' --> 'data\processed_data\COF\4_2024-03-13.md'
Error processing data\edgar_documents\COF\4_2024-03-21: File format not allowed: data\edgar_documents\COF\4_2024-03-21
Converted 'data\edgar_documents\COF\4_2024-04-03' --> 'data\processed_data\COF\4_2024-04-03.md'


2025-11-14 16:02:57,275 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:57,276 - ERROR - Input document 4_2024-04-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:02:57,277 - INFO - Going to convert document batch...
2025-11-14 16:02:57,294 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:57,295 - ERROR - Input document 4_2024-04-26 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\COF\4_2024-04-22: File format not allowed: data\edgar_documents\COF\4_2024-04-22
Error processing data\edgar_documents\COF\4_2024-04-26: File format not allowed: data\edgar_documents\COF\4_2024-04-26
Converted 'data\edgar_documents\COF\4_2024-05-02' --> 'data\processed_data\COF\4_2024-05-02.md'


2025-11-14 16:02:57,475 - INFO - Processing document 4_2024-05-03
2025-11-14 16:02:57,534 - INFO - Finished converting document 4_2024-05-03 in 0.11 sec.
2025-11-14 16:02:57,583 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:57,607 - INFO - Going to convert document batch...
2025-11-14 16:02:57,609 - INFO - Processing document 4_2024-05-06
2025-11-14 16:02:57,687 - INFO - Finished converting document 4_2024-05-06 in 0.12 sec.


Converted 'data\edgar_documents\COF\4_2024-05-03' --> 'data\processed_data\COF\4_2024-05-03.md'


2025-11-14 16:02:57,775 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:57,805 - INFO - Going to convert document batch...
2025-11-14 16:02:57,806 - INFO - Processing document 4_2024-05-09
2025-11-14 16:02:57,844 - INFO - Finished converting document 4_2024-05-09 in 0.09 sec.
2025-11-14 16:02:57,908 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:57,908 - ERROR - Input document 4_2024-07-17 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:02

Converted 'data\edgar_documents\COF\4_2024-05-06' --> 'data\processed_data\COF\4_2024-05-06.md'
Converted 'data\edgar_documents\COF\4_2024-05-09' --> 'data\processed_data\COF\4_2024-05-09.md'
Error processing data\edgar_documents\COF\4_2024-07-17: File format not allowed: data\edgar_documents\COF\4_2024-07-17


2025-11-14 16:02:57,953 - INFO - Processing document 4_2024-07-19
2025-11-14 16:02:58,003 - INFO - Finished converting document 4_2024-07-19 in 0.09 sec.
2025-11-14 16:02:58,089 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:58,091 - ERROR - Input document 4_2024-07-24 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:02:58,093 - INFO - Going to convert document batch...
2025-11-14 16:02:58,125 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-1

Converted 'data\edgar_documents\COF\4_2024-07-19' --> 'data\processed_data\COF\4_2024-07-19.md'
Error processing data\edgar_documents\COF\4_2024-07-24: File format not allowed: data\edgar_documents\COF\4_2024-07-24
Error processing data\edgar_documents\COF\4_2024-07-25: File format not allowed: data\edgar_documents\COF\4_2024-07-25


2025-11-14 16:02:58,269 - INFO - Finished converting document 4_2024-08-06 in 0.14 sec.
2025-11-14 16:02:58,353 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:58,397 - INFO - Going to convert document batch...
2025-11-14 16:02:58,399 - INFO - Processing document 4_2024-08-08
2025-11-14 16:02:58,496 - INFO - Finished converting document 4_2024-08-08 in 0.16 sec.


Converted 'data\edgar_documents\COF\4_2024-08-06' --> 'data\processed_data\COF\4_2024-08-06.md'


2025-11-14 16:02:58,582 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:58,583 - ERROR - Input document 4_2024-09-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:02:58,585 - INFO - Going to convert document batch...
2025-11-14 16:02:58,602 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:58,620 - INFO - Going to convert document batch...
2025-11-14 16:02:58,621 - INFO - Processing document 4_2024-10-21
2025-11-14 16:02:58,662 - INFO - Fin

Converted 'data\edgar_documents\COF\4_2024-08-08' --> 'data\processed_data\COF\4_2024-08-08.md'
Error processing data\edgar_documents\COF\4_2024-09-13: File format not allowed: data\edgar_documents\COF\4_2024-09-13
Converted 'data\edgar_documents\COF\4_2024-10-21' --> 'data\processed_data\COF\4_2024-10-21.md'
Error processing data\edgar_documents\COF\4_2024-10-25: File format not allowed: data\edgar_documents\COF\4_2024-10-25


2025-11-14 16:02:58,752 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:58,773 - INFO - Going to convert document batch...
2025-11-14 16:02:58,774 - INFO - Processing document 4_2024-11-07
2025-11-14 16:02:58,812 - INFO - Finished converting document 4_2024-11-07 in 0.08 sec.
2025-11-14 16:02:58,862 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:58,880 - INFO - Going to convert document batch...
2025-11-14 16:02:58,881 - INFO - Processing document 4_2024-11-12
2025-11-14 16:02:58,922 - INFO - Finished converting document 4_2024-11-12 in 0.08 sec.
2025-11-14 16:02:58,992 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:59,010 - INFO - Going to convert document batch...
2025-11-14 16:02:59,012 - INFO - Processing document 4_2024-11-13


Converted 'data\edgar_documents\COF\4_2024-11-07' --> 'data\processed_data\COF\4_2024-11-07.md'
Converted 'data\edgar_documents\COF\4_2024-11-12' --> 'data\processed_data\COF\4_2024-11-12.md'


2025-11-14 16:02:59,050 - INFO - Finished converting document 4_2024-11-13 in 0.08 sec.
2025-11-14 16:02:59,112 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:59,141 - INFO - Going to convert document batch...
2025-11-14 16:02:59,143 - INFO - Processing document 4_2024-11-14
2025-11-14 16:02:59,213 - INFO - Finished converting document 4_2024-11-14 in 0.12 sec.


Converted 'data\edgar_documents\COF\4_2024-11-13' --> 'data\processed_data\COF\4_2024-11-13.md'


2025-11-14 16:02:59,310 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:59,312 - ERROR - Input document 4_2024-12-17 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:02:59,317 - INFO - Going to convert document batch...
2025-11-14 16:02:59,341 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:59,344 - ERROR - Input document 4_2024-12-19 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\COF\4_2024-11-14' --> 'data\processed_data\COF\4_2024-11-14.md'
Error processing data\edgar_documents\COF\4_2024-12-17: File format not allowed: data\edgar_documents\COF\4_2024-12-17
Error processing data\edgar_documents\COF\4_2024-12-19: File format not allowed: data\edgar_documents\COF\4_2024-12-19
Error processing data\edgar_documents\COF\4_2025-01-06: File format not allowed: data\edgar_documents\COF\4_2025-01-06
Error processing data\edgar_documents\COF\4_2025-01-23: File format not allowed: data\edgar_documents\COF\4_2025-01-23


2025-11-14 16:02:59,578 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:59,579 - ERROR - Input document 4_2025-01-24 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:02:59,586 - INFO - Going to convert document batch...
2025-11-14 16:02:59,614 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:02:59,615 - ERROR - Input document 4_2025-01-28 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\COF\4_2025-01-24: File format not allowed: data\edgar_documents\COF\4_2025-01-24
Error processing data\edgar_documents\COF\4_2025-01-28: File format not allowed: data\edgar_documents\COF\4_2025-01-28
Error processing data\edgar_documents\COF\4_2025-01-29: File format not allowed: data\edgar_documents\COF\4_2025-01-29


2025-11-14 16:02:59,837 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:02:59,869 - INFO - Going to convert document batch...
2025-11-14 16:02:59,871 - INFO - Processing document 4_2025-02-06
2025-11-14 16:02:59,936 - INFO - Finished converting document 4_2025-02-06 in 0.12 sec.


Converted 'data\edgar_documents\COF\4_2025-02-04' --> 'data\processed_data\COF\4_2025-02-04.md'
Converted 'data\edgar_documents\COF\4_2025-02-06' --> 'data\processed_data\COF\4_2025-02-06.md'


2025-11-14 16:03:00,018 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:00,066 - INFO - Going to convert document batch...
2025-11-14 16:03:00,071 - INFO - Processing document 4_2025-02-10
2025-11-14 16:03:00,127 - INFO - Finished converting document 4_2025-02-10 in 0.14 sec.
2025-11-14 16:03:00,177 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:00,197 - INFO - Going to convert document batch...
2025-11-14 16:03:00,199 - INFO - Processing document 4_2025-02-19
2025-11-14 16:03:00,239 - INFO - Finished converting document 4_2025-02-19 in 0.08 sec.
2025-11-14 16:03:00,330 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:00,349 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COF\4_2025-02-10' --> 'data\processed_data\COF\4_2025-02-10.md'
Converted 'data\edgar_documents\COF\4_2025-02-19' --> 'data\processed_data\COF\4_2025-02-19.md'


2025-11-14 16:03:00,351 - INFO - Processing document 4_2025-03-12
2025-11-14 16:03:00,403 - INFO - Finished converting document 4_2025-03-12 in 0.09 sec.
2025-11-14 16:03:00,468 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:00,484 - INFO - Going to convert document batch...
2025-11-14 16:03:00,486 - INFO - Processing document 4_2025-05-12
2025-11-14 16:03:00,522 - INFO - Finished converting document 4_2025-05-12 in 0.06 sec.
2025-11-14 16:03:00,576 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:00,604 - INFO - Going to convert document batch...
2025-11-14 16:03:00,605 - INFO - Processing document 4_2025-05-14


Converted 'data\edgar_documents\COF\4_2025-03-12' --> 'data\processed_data\COF\4_2025-03-12.md'
Converted 'data\edgar_documents\COF\4_2025-05-12' --> 'data\processed_data\COF\4_2025-05-12.md'


2025-11-14 16:03:00,647 - INFO - Finished converting document 4_2025-05-14 in 0.08 sec.
2025-11-14 16:03:00,706 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:00,723 - INFO - Going to convert document batch...
2025-11-14 16:03:00,724 - INFO - Processing document 4_2025-05-20
2025-11-14 16:03:00,760 - INFO - Finished converting document 4_2025-05-20 in 0.08 sec.
2025-11-14 16:03:00,809 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:00,826 - INFO - Going to convert document batch...
2025-11-14 16:03:00,827 - INFO - Processing document 4_2025-06-05
2025-11-14 16:03:00,860 - INFO - Finished converting document 4_2025-06-05 in 0.06 sec.


Converted 'data\edgar_documents\COF\4_2025-05-14' --> 'data\processed_data\COF\4_2025-05-14.md'
Converted 'data\edgar_documents\COF\4_2025-05-20' --> 'data\processed_data\COF\4_2025-05-20.md'


2025-11-14 16:03:00,907 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:00,936 - INFO - Going to convert document batch...
2025-11-14 16:03:00,937 - INFO - Processing document 4_2025-07-25
2025-11-14 16:03:00,972 - INFO - Finished converting document 4_2025-07-25 in 0.08 sec.
2025-11-14 16:03:01,030 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:01,057 - INFO - Going to convert document batch...
2025-11-14 16:03:01,059 - INFO - Processing document 4_2025-08-05


Converted 'data\edgar_documents\COF\4_2025-06-05' --> 'data\processed_data\COF\4_2025-06-05.md'
Converted 'data\edgar_documents\COF\4_2025-07-25' --> 'data\processed_data\COF\4_2025-07-25.md'


2025-11-14 16:03:01,149 - INFO - Finished converting document 4_2025-08-05 in 0.12 sec.
2025-11-14 16:03:01,213 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:01,235 - INFO - Going to convert document batch...
2025-11-14 16:03:01,236 - INFO - Processing document 4_2025-08-06
2025-11-14 16:03:01,275 - INFO - Finished converting document 4_2025-08-06 in 0.06 sec.
2025-11-14 16:03:01,338 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:01,354 - INFO - Going to convert document batch...
2025-11-14 16:03:01,356 - INFO - Processing document 4_2025-08-13
2025-11-14 16:03:01,399 - INFO - Finished converting document 4_2025-08-13 in 0.08 sec.


Converted 'data\edgar_documents\COF\4_2025-08-05' --> 'data\processed_data\COF\4_2025-08-05.md'
Converted 'data\edgar_documents\COF\4_2025-08-06' --> 'data\processed_data\COF\4_2025-08-06.md'


2025-11-14 16:03:01,472 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:01,490 - INFO - Going to convert document batch...
2025-11-14 16:03:01,491 - INFO - Processing document 4_2025-08-20
2025-11-14 16:03:01,527 - INFO - Finished converting document 4_2025-08-20 in 0.08 sec.
2025-11-14 16:03:01,574 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:01,588 - INFO - Going to convert document batch...
2025-11-14 16:03:01,591 - INFO - Processing document 4_2025-09-03
2025-11-14 16:03:01,633 - INFO - Finished converting document 4_2025-09-03 in 0.06 sec.


Converted 'data\edgar_documents\COF\4_2025-08-13' --> 'data\processed_data\COF\4_2025-08-13.md'
Converted 'data\edgar_documents\COF\4_2025-08-20' --> 'data\processed_data\COF\4_2025-08-20.md'


2025-11-14 16:03:01,755 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:03:01,757 - ERROR - Input document 4_2025-09-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:03:01,761 - INFO - Going to convert document batch...
2025-11-14 16:03:01,788 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:03:01,789 - ERROR - Input document 4_2025-09-10 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\COF\4_2025-09-03' --> 'data\processed_data\COF\4_2025-09-03.md'
Error processing data\edgar_documents\COF\4_2025-09-08: File format not allowed: data\edgar_documents\COF\4_2025-09-08
Error processing data\edgar_documents\COF\4_2025-09-10: File format not allowed: data\edgar_documents\COF\4_2025-09-10


2025-11-14 16:03:01,903 - INFO - Finished converting document 4_2025-10-03 in 0.11 sec.
2025-11-14 16:03:01,978 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:02,005 - INFO - Going to convert document batch...
2025-11-14 16:03:02,006 - INFO - Processing document 4_2025-10-29
2025-11-14 16:03:02,100 - INFO - Finished converting document 4_2025-10-29 in 0.12 sec.


Converted 'data\edgar_documents\COF\4_2025-10-03' --> 'data\processed_data\COF\4_2025-10-03.md'


2025-11-14 16:03:02,231 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:02,254 - INFO - Going to convert document batch...
2025-11-14 16:03:02,255 - INFO - Processing document 4_2025-11-06
2025-11-14 16:03:02,292 - INFO - Finished converting document 4_2025-11-06 in 0.11 sec.
2025-11-14 16:03:02,362 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\4_2025-10-29' --> 'data\processed_data\COF\4_2025-10-29.md'
Converted 'data\edgar_documents\COF\4_2025-11-06' --> 'data\processed_data\COF\4_2025-11-06.md'


2025-11-14 16:03:02,383 - INFO - Going to convert document batch...
2025-11-14 16:03:02,386 - INFO - Processing document 4_2025-11-07
2025-11-14 16:03:02,451 - INFO - Finished converting document 4_2025-11-07 in 0.12 sec.
2025-11-14 16:03:02,523 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:02,553 - INFO - Going to convert document batch...
2025-11-14 16:03:02,554 - INFO - Processing document 8-K_2023-01-24
2025-11-14 16:03:02,619 - INFO - Finished converting document 8-K_2023-01-24 in 0.12 sec.
2025-11-14 16:03:02,680 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\4_2025-11-07' --> 'data\processed_data\COF\4_2025-11-07.md'
Converted 'data\edgar_documents\COF\8-K_2023-01-24' --> 'data\processed_data\COF\8-K_2023-01-24.md'


2025-11-14 16:03:02,733 - INFO - Going to convert document batch...
2025-11-14 16:03:02,734 - INFO - Processing document 8-K_2023-01-30
2025-11-14 16:03:02,776 - INFO - Finished converting document 8-K_2023-01-30 in 0.14 sec.
2025-11-14 16:03:02,821 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:02,915 - INFO - Going to convert document batch...
2025-11-14 16:03:02,916 - INFO - Processing document 8-K_2023-01-31
2025-11-14 16:03:02,970 - INFO - Finished converting document 8-K_2023-01-31 in 0.17 sec.


Converted 'data\edgar_documents\COF\8-K_2023-01-30' --> 'data\processed_data\COF\8-K_2023-01-30.md'


2025-11-14 16:03:03,005 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:03,033 - INFO - Going to convert document batch...
2025-11-14 16:03:03,034 - INFO - Processing document 8-K_2023-02-01
2025-11-14 16:03:03,084 - INFO - Finished converting document 8-K_2023-02-01 in 0.09 sec.
2025-11-14 16:03:03,143 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:03,171 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COF\8-K_2023-01-31' --> 'data\processed_data\COF\8-K_2023-01-31.md'
Converted 'data\edgar_documents\COF\8-K_2023-02-01' --> 'data\processed_data\COF\8-K_2023-02-01.md'


2025-11-14 16:03:03,173 - INFO - Processing document 8-K_2023-02-13
2025-11-14 16:03:03,228 - INFO - Finished converting document 8-K_2023-02-13 in 0.11 sec.
2025-11-14 16:03:03,262 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:03,317 - INFO - Going to convert document batch...
2025-11-14 16:03:03,319 - INFO - Processing document 8-K_2023-02-15
2025-11-14 16:03:03,377 - INFO - Finished converting document 8-K_2023-02-15 in 0.12 sec.


Converted 'data\edgar_documents\COF\8-K_2023-02-13' --> 'data\processed_data\COF\8-K_2023-02-13.md'
Converted 'data\edgar_documents\COF\8-K_2023-02-15' --> 'data\processed_data\COF\8-K_2023-02-15.md'


2025-11-14 16:03:03,457 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:03,503 - INFO - Going to convert document batch...
2025-11-14 16:03:03,504 - INFO - Processing document 8-K_2023-02-16
2025-11-14 16:03:03,546 - INFO - Finished converting document 8-K_2023-02-16 in 0.14 sec.
2025-11-14 16:03:03,596 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:03,644 - INFO - Going to convert document batch...
2025-11-14 16:03:03,645 - INFO - Processing document 8-K_2023-03-07
2025-11-14 16:03:03,693 - INFO - Finished converting document 8-K_2023-03-07 in 0.12 sec.
2025-11-14 16:03:03,754 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\8-K_2023-02-16' --> 'data\processed_data\COF\8-K_2023-02-16.md'
Converted 'data\edgar_documents\COF\8-K_2023-03-07' --> 'data\processed_data\COF\8-K_2023-03-07.md'


2025-11-14 16:03:03,804 - INFO - Going to convert document batch...
2025-11-14 16:03:03,805 - INFO - Processing document 8-K_2023-03-15
2025-11-14 16:03:03,848 - INFO - Finished converting document 8-K_2023-03-15 in 0.12 sec.
2025-11-14 16:03:03,884 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:03,910 - INFO - Going to convert document batch...
2025-11-14 16:03:03,911 - INFO - Processing document 8-K_2023-04-07
2025-11-14 16:03:03,977 - INFO - Finished converting document 8-K_2023-04-07 in 0.11 sec.
2025-11-14 16:03:04,050 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\8-K_2023-03-15' --> 'data\processed_data\COF\8-K_2023-03-15.md'
Converted 'data\edgar_documents\COF\8-K_2023-04-07' --> 'data\processed_data\COF\8-K_2023-04-07.md'


2025-11-14 16:03:04,080 - INFO - Going to convert document batch...
2025-11-14 16:03:04,081 - INFO - Processing document 8-K_2023-04-27
2025-11-14 16:03:04,114 - INFO - Finished converting document 8-K_2023-04-27 in 0.09 sec.
2025-11-14 16:03:04,157 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:04,189 - INFO - Going to convert document batch...
2025-11-14 16:03:04,191 - INFO - Processing document 8-K_2023-05-08
2025-11-14 16:03:04,240 - INFO - Finished converting document 8-K_2023-05-08 in 0.09 sec.
2025-11-14 16:03:04,292 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:04,335 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COF\8-K_2023-04-27' --> 'data\processed_data\COF\8-K_2023-04-27.md'
Converted 'data\edgar_documents\COF\8-K_2023-05-08' --> 'data\processed_data\COF\8-K_2023-05-08.md'


2025-11-14 16:03:04,337 - INFO - Processing document 8-K_2023-05-09
2025-11-14 16:03:04,403 - INFO - Finished converting document 8-K_2023-05-09 in 0.16 sec.
2025-11-14 16:03:04,464 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:04,523 - INFO - Going to convert document batch...
2025-11-14 16:03:04,524 - INFO - Processing document 8-K_2023-05-12
2025-11-14 16:03:04,561 - INFO - Finished converting document 8-K_2023-05-12 in 0.14 sec.


Converted 'data\edgar_documents\COF\8-K_2023-05-09' --> 'data\processed_data\COF\8-K_2023-05-09.md'
Converted 'data\edgar_documents\COF\8-K_2023-05-12' --> 'data\processed_data\COF\8-K_2023-05-12.md'


2025-11-14 16:03:04,616 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:04,669 - INFO - Going to convert document batch...
2025-11-14 16:03:04,671 - INFO - Processing document 8-K_2023-06-08
2025-11-14 16:03:04,750 - INFO - Finished converting document 8-K_2023-06-08 in 0.17 sec.
2025-11-14 16:03:04,811 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:04,860 - INFO - Going to convert document batch...
2025-11-14 16:03:04,862 - INFO - Processing document 8-K_2023-06-12
2025-11-14 16:03:04,929 - INFO - Finished converting document 8-K_2023-06-12 in 0.12 sec.
2025-11-14 16:03:04,999 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\8-K_2023-06-08' --> 'data\processed_data\COF\8-K_2023-06-08.md'
Converted 'data\edgar_documents\COF\8-K_2023-06-12' --> 'data\processed_data\COF\8-K_2023-06-12.md'


2025-11-14 16:03:05,056 - INFO - Going to convert document batch...
2025-11-14 16:03:05,057 - INFO - Processing document 8-K_2023-06-15
2025-11-14 16:03:05,096 - INFO - Finished converting document 8-K_2023-06-15 in 0.14 sec.
2025-11-14 16:03:05,154 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:05,195 - INFO - Going to convert document batch...
2025-11-14 16:03:05,195 - INFO - Processing document 8-K_2023-06-30
2025-11-14 16:03:05,229 - INFO - Finished converting document 8-K_2023-06-30 in 0.09 sec.
2025-11-14 16:03:05,279 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\8-K_2023-06-15' --> 'data\processed_data\COF\8-K_2023-06-15.md'
Converted 'data\edgar_documents\COF\8-K_2023-06-30' --> 'data\processed_data\COF\8-K_2023-06-30.md'


2025-11-14 16:03:05,342 - INFO - Going to convert document batch...
2025-11-14 16:03:05,343 - INFO - Processing document 8-K_2023-07-20
2025-11-14 16:03:05,402 - INFO - Finished converting document 8-K_2023-07-20 in 0.16 sec.
2025-11-14 16:03:05,442 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:05,472 - INFO - Going to convert document batch...
2025-11-14 16:03:05,473 - INFO - Processing document 8-K_2023-07-26
2025-11-14 16:03:05,512 - INFO - Finished converting document 8-K_2023-07-26 in 0.09 sec.
2025-11-14 16:03:05,567 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:05,611 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COF\8-K_2023-07-20' --> 'data\processed_data\COF\8-K_2023-07-20.md'
Converted 'data\edgar_documents\COF\8-K_2023-07-26' --> 'data\processed_data\COF\8-K_2023-07-26.md'


2025-11-14 16:03:05,613 - INFO - Processing document 8-K_2023-08-15
2025-11-14 16:03:05,681 - INFO - Finished converting document 8-K_2023-08-15 in 0.14 sec.
2025-11-14 16:03:05,722 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:05,757 - INFO - Going to convert document batch...
2025-11-14 16:03:05,758 - INFO - Processing document 8-K_2023-09-08
2025-11-14 16:03:05,795 - INFO - Finished converting document 8-K_2023-09-08 in 0.09 sec.
2025-11-14 16:03:05,848 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:05,892 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COF\8-K_2023-08-15' --> 'data\processed_data\COF\8-K_2023-08-15.md'
Converted 'data\edgar_documents\COF\8-K_2023-09-08' --> 'data\processed_data\COF\8-K_2023-09-08.md'


2025-11-14 16:03:05,893 - INFO - Processing document 8-K_2023-09-15
2025-11-14 16:03:05,932 - INFO - Finished converting document 8-K_2023-09-15 in 0.11 sec.
2025-11-14 16:03:05,966 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:06,009 - INFO - Going to convert document batch...
2025-11-14 16:03:06,010 - INFO - Processing document 8-K_2023-10-26
2025-11-14 16:03:06,045 - INFO - Finished converting document 8-K_2023-10-26 in 0.09 sec.
2025-11-14 16:03:06,078 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:06,108 - INFO - Going to convert document batch...
2025-11-14 16:03:06,110 - INFO - Processing document 8-K_2023-11-01


Converted 'data\edgar_documents\COF\8-K_2023-09-15' --> 'data\processed_data\COF\8-K_2023-09-15.md'
Converted 'data\edgar_documents\COF\8-K_2023-10-26' --> 'data\processed_data\COF\8-K_2023-10-26.md'


2025-11-14 16:03:06,210 - INFO - Finished converting document 8-K_2023-11-01 in 0.14 sec.
2025-11-14 16:03:06,302 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:06,344 - INFO - Going to convert document batch...
2025-11-14 16:03:06,347 - INFO - Processing document 8-K_2023-11-15
2025-11-14 16:03:06,388 - INFO - Finished converting document 8-K_2023-11-15 in 0.12 sec.
2025-11-14 16:03:06,438 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\8-K_2023-11-01' --> 'data\processed_data\COF\8-K_2023-11-01.md'
Converted 'data\edgar_documents\COF\8-K_2023-11-15' --> 'data\processed_data\COF\8-K_2023-11-15.md'


2025-11-14 16:03:06,468 - INFO - Going to convert document batch...
2025-11-14 16:03:06,469 - INFO - Processing document 8-K_2023-12-04
2025-11-14 16:03:06,508 - INFO - Finished converting document 8-K_2023-12-04 in 0.09 sec.
2025-11-14 16:03:06,542 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:06,569 - INFO - Going to convert document batch...
2025-11-14 16:03:06,570 - INFO - Processing document 8-K_2023-12-15
2025-11-14 16:03:06,625 - INFO - Finished converting document 8-K_2023-12-15 in 0.09 sec.
2025-11-14 16:03:06,670 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:06,710 - INFO - Going to convert document batch...
2025-11-14 16:03:06,711 - INFO - Processing document 8-K_2024-01-25
2025-11-14 16:03:06,744 - INFO - Finished converting document 8-K_2024-01-25 in 0.08 sec.


Converted 'data\edgar_documents\COF\8-K_2023-12-04' --> 'data\processed_data\COF\8-K_2023-12-04.md'
Converted 'data\edgar_documents\COF\8-K_2023-12-15' --> 'data\processed_data\COF\8-K_2023-12-15.md'


2025-11-14 16:03:06,780 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:06,813 - INFO - Going to convert document batch...
2025-11-14 16:03:06,815 - INFO - Processing document 8-K_2024-02-01
2025-11-14 16:03:06,872 - INFO - Finished converting document 8-K_2024-02-01 in 0.11 sec.
2025-11-14 16:03:06,911 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:06,954 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COF\8-K_2024-01-25' --> 'data\processed_data\COF\8-K_2024-01-25.md'
Converted 'data\edgar_documents\COF\8-K_2024-02-01' --> 'data\processed_data\COF\8-K_2024-02-01.md'


2025-11-14 16:03:06,955 - INFO - Processing document 8-K_2024-02-05
2025-11-14 16:03:07,016 - INFO - Finished converting document 8-K_2024-02-05 in 0.12 sec.
2025-11-14 16:03:07,075 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:07,116 - INFO - Going to convert document batch...
2025-11-14 16:03:07,118 - INFO - Processing document 8-K_2024-02-15
2025-11-14 16:03:07,167 - INFO - Finished converting document 8-K_2024-02-15 in 0.12 sec.


Converted 'data\edgar_documents\COF\8-K_2024-02-05' --> 'data\processed_data\COF\8-K_2024-02-05.md'
Converted 'data\edgar_documents\COF\8-K_2024-02-15' --> 'data\processed_data\COF\8-K_2024-02-15.md'


2025-11-14 16:03:07,240 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:07,275 - INFO - Going to convert document batch...
2025-11-14 16:03:07,276 - INFO - Processing document 8-K_2024-02-20
2025-11-14 16:03:07,334 - INFO - Finished converting document 8-K_2024-02-20 in 0.12 sec.
2025-11-14 16:03:07,376 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:07,439 - INFO - Going to convert document batch...
2025-11-14 16:03:07,442 - INFO - Processing document 8-K_2024-02-22


Converted 'data\edgar_documents\COF\8-K_2024-02-20' --> 'data\processed_data\COF\8-K_2024-02-20.md'


2025-11-14 16:03:07,576 - INFO - Finished converting document 8-K_2024-02-22 in 0.22 sec.
2025-11-14 16:03:07,619 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\8-K_2024-02-22' --> 'data\processed_data\COF\8-K_2024-02-22.md'


2025-11-14 16:03:09,198 - INFO - Going to convert document batch...
2025-11-14 16:03:09,199 - INFO - Processing document 8-K_2024-02-26
2025-11-14 16:03:09,235 - INFO - Finished converting document 8-K_2024-02-26 in 1.62 sec.
2025-11-14 16:03:09,272 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:09,296 - INFO - Going to convert document batch...
2025-11-14 16:03:09,298 - INFO - Processing document 8-K_2024-02-29
2025-11-14 16:03:09,334 - INFO - Finished converting document 8-K_2024-02-29 in 0.08 sec.
2025-11-14 16:03:09,387 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:09,413 - INFO - Going to convert document batch...
2025-11-14 16:03:09,415 - INFO - Processing document 8-K_2024-03-04


Converted 'data\edgar_documents\COF\8-K_2024-02-26' --> 'data\processed_data\COF\8-K_2024-02-26.md'
Converted 'data\edgar_documents\COF\8-K_2024-02-29' --> 'data\processed_data\COF\8-K_2024-02-29.md'


2025-11-14 16:03:09,454 - INFO - Finished converting document 8-K_2024-03-04 in 0.11 sec.
2025-11-14 16:03:09,500 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:09,530 - INFO - Going to convert document batch...
2025-11-14 16:03:09,533 - INFO - Processing document 8-K_2024-03-11
2025-11-14 16:03:09,581 - INFO - Finished converting document 8-K_2024-03-11 in 0.11 sec.
2025-11-14 16:03:09,644 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:09,682 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COF\8-K_2024-03-04' --> 'data\processed_data\COF\8-K_2024-03-04.md'
Converted 'data\edgar_documents\COF\8-K_2024-03-11' --> 'data\processed_data\COF\8-K_2024-03-11.md'


2025-11-14 16:03:09,684 - INFO - Processing document 8-K_2024-03-15
2025-11-14 16:03:09,747 - INFO - Finished converting document 8-K_2024-03-15 in 0.14 sec.
2025-11-14 16:03:09,789 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:09,832 - INFO - Going to convert document batch...
2025-11-14 16:03:09,834 - INFO - Processing document 8-K_2024-04-25
2025-11-14 16:03:09,898 - INFO - Finished converting document 8-K_2024-04-25 in 0.12 sec.
2025-11-14 16:03:09,956 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\8-K_2024-03-15' --> 'data\processed_data\COF\8-K_2024-03-15.md'
Converted 'data\edgar_documents\COF\8-K_2024-04-25' --> 'data\processed_data\COF\8-K_2024-04-25.md'


2025-11-14 16:03:10,002 - INFO - Going to convert document batch...
2025-11-14 16:03:10,003 - INFO - Processing document 8-K_2024-05-03
2025-11-14 16:03:10,080 - INFO - Finished converting document 8-K_2024-05-03 in 0.16 sec.
2025-11-14 16:03:10,151 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:10,176 - INFO - Going to convert document batch...
2025-11-14 16:03:10,177 - INFO - Processing document 8-K_2024-05-15
2025-11-14 16:03:10,209 - INFO - Finished converting document 8-K_2024-05-15 in 0.08 sec.
2025-11-14 16:03:10,261 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:10,302 - INFO - Going to convert document batch...
2025-11-14 16:03:10,304 - INFO - Processing document 8-K_2024-05-24


Converted 'data\edgar_documents\COF\8-K_2024-05-03' --> 'data\processed_data\COF\8-K_2024-05-03.md'
Converted 'data\edgar_documents\COF\8-K_2024-05-15' --> 'data\processed_data\COF\8-K_2024-05-15.md'


2025-11-14 16:03:10,352 - INFO - Finished converting document 8-K_2024-05-24 in 0.12 sec.
2025-11-14 16:03:10,405 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:10,440 - INFO - Going to convert document batch...
2025-11-14 16:03:10,442 - INFO - Processing document 8-K_2024-06-10
2025-11-14 16:03:10,492 - INFO - Finished converting document 8-K_2024-06-10 in 0.11 sec.
2025-11-14 16:03:10,531 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:10,562 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COF\8-K_2024-05-24' --> 'data\processed_data\COF\8-K_2024-05-24.md'
Converted 'data\edgar_documents\COF\8-K_2024-06-10' --> 'data\processed_data\COF\8-K_2024-06-10.md'


2025-11-14 16:03:10,564 - INFO - Processing document 8-K_2024-06-17
2025-11-14 16:03:10,604 - INFO - Finished converting document 8-K_2024-06-17 in 0.09 sec.
2025-11-14 16:03:10,643 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:10,670 - INFO - Going to convert document batch...
2025-11-14 16:03:10,671 - INFO - Processing document 8-K_2024-06-28
2025-11-14 16:03:10,705 - INFO - Finished converting document 8-K_2024-06-28 in 0.08 sec.
2025-11-14 16:03:10,759 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:10,802 - INFO - Going to convert document batch...
2025-11-14 16:03:10,803 - INFO - Processing document 8-K_2024-07-23


Converted 'data\edgar_documents\COF\8-K_2024-06-17' --> 'data\processed_data\COF\8-K_2024-06-17.md'
Converted 'data\edgar_documents\COF\8-K_2024-06-28' --> 'data\processed_data\COF\8-K_2024-06-28.md'


2025-11-14 16:03:10,852 - INFO - Finished converting document 8-K_2024-07-23 in 0.12 sec.
2025-11-14 16:03:10,894 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:10,932 - INFO - Going to convert document batch...
2025-11-14 16:03:10,933 - INFO - Processing document 8-K_2024-07-24
2025-11-14 16:03:10,979 - INFO - Finished converting document 8-K_2024-07-24 in 0.11 sec.
2025-11-14 16:03:11,036 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:11,070 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COF\8-K_2024-07-23' --> 'data\processed_data\COF\8-K_2024-07-23.md'
Converted 'data\edgar_documents\COF\8-K_2024-07-24' --> 'data\processed_data\COF\8-K_2024-07-24.md'


2025-11-14 16:03:11,071 - INFO - Processing document 8-K_2024-07-26
2025-11-14 16:03:11,128 - INFO - Finished converting document 8-K_2024-07-26 in 0.12 sec.
2025-11-14 16:03:11,181 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:11,205 - INFO - Going to convert document batch...
2025-11-14 16:03:11,206 - INFO - Processing document 8-K_2024-08-15
2025-11-14 16:03:11,249 - INFO - Finished converting document 8-K_2024-08-15 in 0.09 sec.
2025-11-14 16:03:11,299 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:11,323 - INFO - Going to convert document batch...
2025-11-14 16:03:11,324 - INFO - Processing document 8-K_2024-09-09
2025-11-14 16:03:11,357 - INFO - Finished converting document 8-K_2024-09-09 in 0.09 sec.


Converted 'data\edgar_documents\COF\8-K_2024-07-26' --> 'data\processed_data\COF\8-K_2024-07-26.md'
Converted 'data\edgar_documents\COF\8-K_2024-08-15' --> 'data\processed_data\COF\8-K_2024-08-15.md'


2025-11-14 16:03:11,392 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:11,417 - INFO - Going to convert document batch...
2025-11-14 16:03:11,418 - INFO - Processing document 8-K_2024-09-16
2025-11-14 16:03:11,451 - INFO - Finished converting document 8-K_2024-09-16 in 0.08 sec.
2025-11-14 16:03:11,498 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:11,524 - INFO - Going to convert document batch...
2025-11-14 16:03:11,525 - INFO - Processing document 8-K_2024-10-24


Converted 'data\edgar_documents\COF\8-K_2024-09-09' --> 'data\processed_data\COF\8-K_2024-09-09.md'
Converted 'data\edgar_documents\COF\8-K_2024-09-16' --> 'data\processed_data\COF\8-K_2024-09-16.md'


2025-11-14 16:03:11,562 - INFO - Finished converting document 8-K_2024-10-24 in 0.09 sec.
2025-11-14 16:03:11,596 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:11,621 - INFO - Going to convert document batch...
2025-11-14 16:03:11,622 - INFO - Processing document 8-K_2024-11-15
2025-11-14 16:03:11,658 - INFO - Finished converting document 8-K_2024-11-15 in 0.08 sec.
2025-11-14 16:03:11,693 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:11,717 - INFO - Going to convert document batch...
2025-11-14 16:03:11,718 - INFO - Processing document 8-K_2024-12-09
2025-11-14 16:03:11,752 - INFO - Finished converting document 8-K_2024-12-09 in 0.08 sec.


Converted 'data\edgar_documents\COF\8-K_2024-10-24' --> 'data\processed_data\COF\8-K_2024-10-24.md'
Converted 'data\edgar_documents\COF\8-K_2024-11-15' --> 'data\processed_data\COF\8-K_2024-11-15.md'


2025-11-14 16:03:11,789 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:11,813 - INFO - Going to convert document batch...
2025-11-14 16:03:11,814 - INFO - Processing document 8-K_2024-12-16
2025-11-14 16:03:11,850 - INFO - Finished converting document 8-K_2024-12-16 in 0.08 sec.
2025-11-14 16:03:11,903 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:11,930 - INFO - Going to convert document batch...
2025-11-14 16:03:11,931 - INFO - Processing document 8-K_2025-01-21
2025-11-14 16:03:11,963 - INFO - Finished converting document 8-K_2025-01-21 in 0.09 sec.


Converted 'data\edgar_documents\COF\8-K_2024-12-09' --> 'data\processed_data\COF\8-K_2024-12-09.md'
Converted 'data\edgar_documents\COF\8-K_2024-12-16' --> 'data\processed_data\COF\8-K_2024-12-16.md'


2025-11-14 16:03:11,997 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:12,032 - INFO - Going to convert document batch...
2025-11-14 16:03:12,034 - INFO - Processing document 8-K_2025-01-24
2025-11-14 16:03:12,122 - INFO - Finished converting document 8-K_2025-01-24 in 0.14 sec.


Converted 'data\edgar_documents\COF\8-K_2025-01-21' --> 'data\processed_data\COF\8-K_2025-01-21.md'
Converted 'data\edgar_documents\COF\8-K_2025-01-24' --> 'data\processed_data\COF\8-K_2025-01-24.md'


2025-11-14 16:03:12,188 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:12,216 - INFO - Going to convert document batch...
2025-11-14 16:03:12,218 - INFO - Processing document 8-K_2025-01-30
2025-11-14 16:03:12,263 - INFO - Finished converting document 8-K_2025-01-30 in 0.11 sec.
2025-11-14 16:03:12,306 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:12,333 - INFO - Going to convert document batch...
2025-11-14 16:03:12,334 - INFO - Processing document 8-K_2025-02-07
2025-11-14 16:03:12,371 - INFO - Finished converting document 8-K_2025-02-07 in 0.08 sec.
2025-11-14 16:03:12,409 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:12,438 - INFO - Going to convert document batch...
2025-11-14 16:03:12,439 - INFO - Processing document 8-K_2025-02-10
2025-11-14 16:03:12,483 - INFO - Finished converting document 8-K_2025-02-10 in 0.09 sec.


Converted 'data\edgar_documents\COF\8-K_2025-01-30' --> 'data\processed_data\COF\8-K_2025-01-30.md'
Converted 'data\edgar_documents\COF\8-K_2025-02-07' --> 'data\processed_data\COF\8-K_2025-02-07.md'


2025-11-14 16:03:12,521 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:12,558 - INFO - Going to convert document batch...
2025-11-14 16:03:12,560 - INFO - Processing document 8-K_2025-02-18
2025-11-14 16:03:12,612 - INFO - Finished converting document 8-K_2025-02-18 in 0.11 sec.
2025-11-14 16:03:12,647 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:12,669 - INFO - Going to convert document batch...
2025-11-14 16:03:12,671 - INFO - Processing document 8-K_2025-03-17


Converted 'data\edgar_documents\COF\8-K_2025-02-10' --> 'data\processed_data\COF\8-K_2025-02-10.md'
Converted 'data\edgar_documents\COF\8-K_2025-02-18' --> 'data\processed_data\COF\8-K_2025-02-18.md'


2025-11-14 16:03:12,715 - INFO - Finished converting document 8-K_2025-03-17 in 0.09 sec.
2025-11-14 16:03:12,750 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:12,780 - INFO - Going to convert document batch...
2025-11-14 16:03:12,782 - INFO - Processing document 8-K_2025-04-18
2025-11-14 16:03:12,817 - INFO - Finished converting document 8-K_2025-04-18 in 0.08 sec.
2025-11-14 16:03:12,854 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:12,882 - INFO - Going to convert document batch...
2025-11-14 16:03:12,884 - INFO - Processing document 8-K_2025-04-22
2025-11-14 16:03:12,925 - INFO - Finished converting document 8-K_2025-04-22 in 0.08 sec.


Converted 'data\edgar_documents\COF\8-K_2025-03-17' --> 'data\processed_data\COF\8-K_2025-03-17.md'
Converted 'data\edgar_documents\COF\8-K_2025-04-18' --> 'data\processed_data\COF\8-K_2025-04-18.md'


2025-11-14 16:03:12,973 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:13,025 - INFO - Going to convert document batch...
2025-11-14 16:03:13,026 - INFO - Processing document 8-K_2025-05-08
2025-11-14 16:03:13,092 - INFO - Finished converting document 8-K_2025-05-08 in 0.14 sec.
2025-11-14 16:03:13,135 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\8-K_2025-04-22' --> 'data\processed_data\COF\8-K_2025-04-22.md'
Converted 'data\edgar_documents\COF\8-K_2025-05-08' --> 'data\processed_data\COF\8-K_2025-05-08.md'


2025-11-14 16:03:13,156 - INFO - Going to convert document batch...
2025-11-14 16:03:13,158 - INFO - Processing document 8-K_2025-05-15
2025-11-14 16:03:13,191 - INFO - Finished converting document 8-K_2025-05-15 in 0.06 sec.
2025-11-14 16:03:13,226 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:13,264 - INFO - Going to convert document batch...
2025-11-14 16:03:13,266 - INFO - Processing document 8-K_2025-05-19
2025-11-14 16:03:13,324 - INFO - Finished converting document 8-K_2025-05-19 in 0.12 sec.


Converted 'data\edgar_documents\COF\8-K_2025-05-15' --> 'data\processed_data\COF\8-K_2025-05-15.md'
Converted 'data\edgar_documents\COF\8-K_2025-05-19' --> 'data\processed_data\COF\8-K_2025-05-19.md'


2025-11-14 16:03:13,396 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:13,444 - INFO - Going to convert document batch...
2025-11-14 16:03:13,447 - INFO - Processing document 8-K_2025-05-22
2025-11-14 16:03:13,508 - INFO - Finished converting document 8-K_2025-05-22 in 0.12 sec.
2025-11-14 16:03:13,569 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:13,604 - INFO - Going to convert document batch...
2025-11-14 16:03:13,605 - INFO - Processing document 8-K_2025-06-05
2025-11-14 16:03:13,642 - INFO - Finished converting document 8-K_2025-06-05 in 0.09 sec.
2025-11-14 16:03:13,691 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COF\8-K_2025-05-22' --> 'data\processed_data\COF\8-K_2025-05-22.md'
Converted 'data\edgar_documents\COF\8-K_2025-06-05' --> 'data\processed_data\COF\8-K_2025-06-05.md'


2025-11-14 16:03:13,736 - INFO - Going to convert document batch...
2025-11-14 16:03:13,738 - INFO - Processing document 8-K_2025-06-09
2025-11-14 16:03:13,795 - INFO - Finished converting document 8-K_2025-06-09 in 0.14 sec.
2025-11-14 16:03:13,849 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:13,888 - INFO - Going to convert document batch...
2025-11-14 16:03:13,888 - INFO - Processing document 8-K_2025-06-16
2025-11-14 16:03:13,942 - INFO - Finished converting document 8-K_2025-06-16 in 0.11 sec.


Converted 'data\edgar_documents\COF\8-K_2025-06-09' --> 'data\processed_data\COF\8-K_2025-06-09.md'
Converted 'data\edgar_documents\COF\8-K_2025-06-16' --> 'data\processed_data\COF\8-K_2025-06-16.md'


2025-11-14 16:03:14,018 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:14,048 - INFO - Going to convert document batch...
2025-11-14 16:03:14,050 - INFO - Processing document 8-K_2025-06-25
2025-11-14 16:03:14,093 - INFO - Finished converting document 8-K_2025-06-25 in 0.11 sec.
2025-11-14 16:03:14,132 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:14,155 - INFO - Going to convert document batch...
2025-11-14 16:03:14,156 - INFO - Processing document 8-K_2025-06-30
2025-11-14 16:03:14,212 - INFO - Finished converting document 8-K_2025-06-30 in 0.09 sec.
2025-11-14 16:03:14,249 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:14,274 - INFO - Going to convert document batch...
2025-11-14 16:03:14,275 - INFO - Processing document 8-K_2025-07-01
2025-11-14 16:03:14,311 - INFO - Finished converting document 8-K_2025-07-01 in 0.08 sec.


Converted 'data\edgar_documents\COF\8-K_2025-06-25' --> 'data\processed_data\COF\8-K_2025-06-25.md'
Converted 'data\edgar_documents\COF\8-K_2025-06-30' --> 'data\processed_data\COF\8-K_2025-06-30.md'


2025-11-14 16:03:14,351 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:14,374 - INFO - Going to convert document batch...
2025-11-14 16:03:14,375 - INFO - Processing document 8-K_2025-07-22
2025-11-14 16:03:14,409 - INFO - Finished converting document 8-K_2025-07-22 in 0.08 sec.
2025-11-14 16:03:14,461 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:14,484 - INFO - Going to convert document batch...
2025-11-14 16:03:14,485 - INFO - Processing document 8-K_2025-08-15
2025-11-14 16:03:14,519 - INFO - Finished converting document 8-K_2025-08-15 in 0.09 sec.


Converted 'data\edgar_documents\COF\8-K_2025-07-01' --> 'data\processed_data\COF\8-K_2025-07-01.md'
Converted 'data\edgar_documents\COF\8-K_2025-07-22' --> 'data\processed_data\COF\8-K_2025-07-22.md'


2025-11-14 16:03:14,563 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:14,584 - INFO - Going to convert document batch...
2025-11-14 16:03:14,585 - INFO - Processing document 8-K_2025-09-08
2025-11-14 16:03:14,639 - INFO - Finished converting document 8-K_2025-09-08 in 0.11 sec.
2025-11-14 16:03:14,689 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:14,734 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COF\8-K_2025-08-15' --> 'data\processed_data\COF\8-K_2025-08-15.md'
Converted 'data\edgar_documents\COF\8-K_2025-09-08' --> 'data\processed_data\COF\8-K_2025-09-08.md'


2025-11-14 16:03:14,735 - INFO - Processing document 8-K_2025-09-11
2025-11-14 16:03:14,800 - INFO - Finished converting document 8-K_2025-09-11 in 0.14 sec.
2025-11-14 16:03:14,853 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:14,876 - INFO - Going to convert document batch...
2025-11-14 16:03:14,878 - INFO - Processing document 8-K_2025-09-15
2025-11-14 16:03:14,914 - INFO - Finished converting document 8-K_2025-09-15 in 0.08 sec.
2025-11-14 16:03:14,963 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:14,987 - INFO - Going to convert document batch...
2025-11-14 16:03:14,988 - INFO - Processing document 8-K_2025-10-21
2025-11-14 16:03:15,020 - INFO - Finished converting document 8-K_2025-10-21 in 0.08 sec.


Converted 'data\edgar_documents\COF\8-K_2025-09-11' --> 'data\processed_data\COF\8-K_2025-09-11.md'
Converted 'data\edgar_documents\COF\8-K_2025-09-15' --> 'data\processed_data\COF\8-K_2025-09-15.md'


2025-11-14 16:03:15,055 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:15,091 - INFO - Going to convert document batch...
2025-11-14 16:03:15,092 - INFO - Processing document 8-K_2025-11-07
2025-11-14 16:03:15,130 - INFO - Finished converting document 8-K_2025-11-07 in 0.09 sec.


Converted 'data\edgar_documents\COF\8-K_2025-10-21' --> 'data\processed_data\COF\8-K_2025-10-21.md'
Converted 'data\edgar_documents\COF\8-K_2025-11-07' --> 'data\processed_data\COF\8-K_2025-11-07.md'


2025-11-14 16:03:15,266 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:03:15,267 - ERROR - Input document DEF-14A_2023-03-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:03:15,271 - INFO - Going to convert document batch...
2025-11-14 16:03:15,321 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:03:15,323 - ERROR - Input document DEF-14A_2024-03-20 with format No

Error processing data\edgar_documents\COF\DEF-14A_2023-03-22: File format not allowed: data\edgar_documents\COF\DEF-14A_2023-03-22
Error processing data\edgar_documents\COF\DEF-14A_2024-03-20: File format not allowed: data\edgar_documents\COF\DEF-14A_2024-03-20
Error processing data\edgar_documents\COF\DEF-14A_2025-03-27: File format not allowed: data\edgar_documents\COF\DEF-14A_2025-03-27
Processed 153 new files. Errors: 33
Found 124 files to process in data\edgar_documents\COP


2025-11-14 16:03:15,519 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:03:20,709 - INFO - Going to convert document batch...
2025-11-14 16:03:20,712 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:03:20,713 - INFO - Processing document 10-K_2023-02-16
2025-11-14 16:03:33,030 - INFO - Finished converting document 10-K_2023-02-16 in 17.64 sec.
2025-11-14 16:03:36,297 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\10-K_2023-02-16' --> 'data\processed_data\COP\10-K_2023-02-16.md'


2025-11-14 16:03:40,338 - INFO - Going to convert document batch...
2025-11-14 16:03:40,339 - INFO - Processing document 10-K_2024-02-15
2025-11-14 16:03:52,073 - INFO - Finished converting document 10-K_2024-02-15 in 15.91 sec.
2025-11-14 16:03:55,394 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\10-K_2024-02-15' --> 'data\processed_data\COP\10-K_2024-02-15.md'


2025-11-14 16:04:00,131 - INFO - Going to convert document batch...
2025-11-14 16:04:00,133 - INFO - Processing document 10-K_2025-02-18
2025-11-14 16:04:11,729 - INFO - Finished converting document 10-K_2025-02-18 in 16.45 sec.
2025-11-14 16:04:15,219 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\10-K_2025-02-18' --> 'data\processed_data\COP\10-K_2025-02-18.md'


2025-11-14 16:04:16,221 - INFO - Going to convert document batch...
2025-11-14 16:04:16,223 - INFO - Processing document 10-Q_2023-05-04
2025-11-14 16:04:18,577 - INFO - Finished converting document 10-Q_2023-05-04 in 3.44 sec.
2025-11-14 16:04:19,386 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\10-Q_2023-05-04' --> 'data\processed_data\COP\10-Q_2023-05-04.md'


2025-11-14 16:04:19,813 - INFO - Going to convert document batch...
2025-11-14 16:04:19,813 - INFO - Processing document 10-Q_2023-08-03
2025-11-14 16:04:21,637 - INFO - Finished converting document 10-Q_2023-08-03 in 2.30 sec.
2025-11-14 16:04:22,434 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:04:22,436 - ERROR - Input document 10-Q_2023-11-02 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:04:22,441 - INFO - Going to convert d

Converted 'data\edgar_documents\COP\10-Q_2023-08-03' --> 'data\processed_data\COP\10-Q_2023-08-03.md'
Error processing data\edgar_documents\COP\10-Q_2023-11-02: File format not allowed: data\edgar_documents\COP\10-Q_2023-11-02


2025-11-14 16:04:23,386 - INFO - Going to convert document batch...
2025-11-14 16:04:23,388 - INFO - Processing document 10-Q_2024-05-02
2025-11-14 16:04:27,561 - INFO - Finished converting document 10-Q_2024-05-02 in 5.12 sec.
2025-11-14 16:04:28,773 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\10-Q_2024-05-02' --> 'data\processed_data\COP\10-Q_2024-05-02.md'


2025-11-14 16:04:30,193 - INFO - Going to convert document batch...
2025-11-14 16:04:30,198 - INFO - Processing document 10-Q_2024-08-01
2025-11-14 16:04:33,042 - INFO - Finished converting document 10-Q_2024-08-01 in 4.36 sec.
2025-11-14 16:04:34,101 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\10-Q_2024-08-01' --> 'data\processed_data\COP\10-Q_2024-08-01.md'


2025-11-14 16:04:36,284 - INFO - Going to convert document batch...
2025-11-14 16:04:36,286 - INFO - Processing document 10-Q_2024-10-31
2025-11-14 16:04:39,086 - INFO - Finished converting document 10-Q_2024-10-31 in 5.08 sec.
2025-11-14 16:04:40,431 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\10-Q_2024-10-31' --> 'data\processed_data\COP\10-Q_2024-10-31.md'


2025-11-14 16:04:41,730 - INFO - Going to convert document batch...
2025-11-14 16:04:41,733 - INFO - Processing document 10-Q_2025-05-08
2025-11-14 16:04:44,357 - INFO - Finished converting document 10-Q_2025-05-08 in 3.97 sec.
2025-11-14 16:04:46,852 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\10-Q_2025-05-08' --> 'data\processed_data\COP\10-Q_2025-05-08.md'


2025-11-14 16:04:48,455 - INFO - Going to convert document batch...
2025-11-14 16:04:48,457 - INFO - Processing document 10-Q_2025-08-07
2025-11-14 16:04:51,648 - INFO - Finished converting document 10-Q_2025-08-07 in 4.88 sec.
2025-11-14 16:04:53,461 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\10-Q_2025-08-07' --> 'data\processed_data\COP\10-Q_2025-08-07.md'


2025-11-14 16:04:55,844 - INFO - Going to convert document batch...
2025-11-14 16:04:55,846 - INFO - Processing document 10-Q_2025-11-06
2025-11-14 16:04:59,367 - INFO - Finished converting document 10-Q_2025-11-06 in 5.95 sec.
2025-11-14 16:05:01,315 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:01,345 - INFO - Going to convert document batch...
2025-11-14 16:05:01,348 - INFO - Processing document 4_2023-01-04
2025-11-14 16:05:01,414 - INFO - Finished converting document 4_2023-01-04 in 0.11 sec.
2025-11-14 16:05:01,493 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\10-Q_2025-11-06' --> 'data\processed_data\COP\10-Q_2025-11-06.md'
Converted 'data\edgar_documents\COP\4_2023-01-04' --> 'data\processed_data\COP\4_2023-01-04.md'


2025-11-14 16:05:01,507 - INFO - Going to convert document batch...
2025-11-14 16:05:01,509 - INFO - Processing document 4_2023-01-06
2025-11-14 16:05:01,547 - INFO - Finished converting document 4_2023-01-06 in 0.08 sec.
2025-11-14 16:05:01,599 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:01,616 - INFO - Going to convert document batch...
2025-11-14 16:05:01,617 - INFO - Processing document 4_2023-01-18
2025-11-14 16:05:01,654 - INFO - Finished converting document 4_2023-01-18 in 0.08 sec.
2025-11-14 16:05:01,738 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:01,766 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COP\4_2023-01-06' --> 'data\processed_data\COP\4_2023-01-06.md'
Converted 'data\edgar_documents\COP\4_2023-01-18' --> 'data\processed_data\COP\4_2023-01-18.md'


2025-11-14 16:05:01,767 - INFO - Processing document 4_2023-02-02
2025-11-14 16:05:01,837 - INFO - Finished converting document 4_2023-02-02 in 0.12 sec.
2025-11-14 16:05:01,932 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:01,969 - INFO - Going to convert document batch...
2025-11-14 16:05:01,972 - INFO - Processing document 4_2023-02-14
2025-11-14 16:05:02,063 - INFO - Finished converting document 4_2023-02-14 in 0.16 sec.


Converted 'data\edgar_documents\COP\4_2023-02-02' --> 'data\processed_data\COP\4_2023-02-02.md'


2025-11-14 16:05:02,170 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:02,193 - INFO - Going to convert document batch...
2025-11-14 16:05:02,197 - INFO - Processing document 4_2023-02-16
2025-11-14 16:05:02,252 - INFO - Finished converting document 4_2023-02-16 in 0.11 sec.


Converted 'data\edgar_documents\COP\4_2023-02-14' --> 'data\processed_data\COP\4_2023-02-14.md'
Converted 'data\edgar_documents\COP\4_2023-02-16' --> 'data\processed_data\COP\4_2023-02-16.md'


2025-11-14 16:05:02,337 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:02,370 - INFO - Going to convert document batch...
2025-11-14 16:05:02,372 - INFO - Processing document 4_2023-02-21
2025-11-14 16:05:02,428 - INFO - Finished converting document 4_2023-02-21 in 0.11 sec.
2025-11-14 16:05:02,525 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:02,565 - INFO - Going to convert document batch...
2025-11-14 16:05:02,568 - INFO - Processing document 4_2023-02-22
2025-11-14 16:05:02,646 - INFO - Finished converting document 4_2023-02-22 in 0.14 sec.


Converted 'data\edgar_documents\COP\4_2023-02-21' --> 'data\processed_data\COP\4_2023-02-21.md'


2025-11-14 16:05:02,742 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:02,779 - INFO - Going to convert document batch...
2025-11-14 16:05:02,781 - INFO - Processing document 4_2023-02-23
2025-11-14 16:05:02,843 - INFO - Finished converting document 4_2023-02-23 in 0.12 sec.


Converted 'data\edgar_documents\COP\4_2023-02-22' --> 'data\processed_data\COP\4_2023-02-22.md'
Converted 'data\edgar_documents\COP\4_2023-02-23' --> 'data\processed_data\COP\4_2023-02-23.md'


2025-11-14 16:05:02,942 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:02,970 - INFO - Going to convert document batch...
2025-11-14 16:05:02,971 - INFO - Processing document 4_2023-03-02
2025-11-14 16:05:03,019 - INFO - Finished converting document 4_2023-03-02 in 0.11 sec.
2025-11-14 16:05:03,113 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:03,141 - INFO - Going to convert document batch...
2025-11-14 16:05:03,144 - INFO - Processing document 4_2023-04-04
2025-11-14 16:05:03,209 - INFO - Finished converting document 4_2023-04-04 in 0.12 sec.


Converted 'data\edgar_documents\COP\4_2023-03-02' --> 'data\processed_data\COP\4_2023-03-02.md'


2025-11-14 16:05:03,285 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:03,305 - INFO - Going to convert document batch...
2025-11-14 16:05:03,306 - INFO - Processing document 4_2023-04-19
2025-11-14 16:05:03,357 - INFO - Finished converting document 4_2023-04-19 in 0.09 sec.
2025-11-14 16:05:03,431 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:03,452 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COP\4_2023-04-04' --> 'data\processed_data\COP\4_2023-04-04.md'
Converted 'data\edgar_documents\COP\4_2023-04-19' --> 'data\processed_data\COP\4_2023-04-19.md'


2025-11-14 16:05:03,456 - INFO - Processing document 4_2023-05-02
2025-11-14 16:05:03,518 - INFO - Finished converting document 4_2023-05-02 in 0.11 sec.
2025-11-14 16:05:03,585 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:03,602 - INFO - Going to convert document batch...
2025-11-14 16:05:03,603 - INFO - Processing document 4_2023-05-09
2025-11-14 16:05:03,637 - INFO - Finished converting document 4_2023-05-09 in 0.08 sec.
2025-11-14 16:05:03,732 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:05:03,734 - ERROR - Input document 4_2023-05-10 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, 

Converted 'data\edgar_documents\COP\4_2023-05-02' --> 'data\processed_data\COP\4_2023-05-02.md'
Converted 'data\edgar_documents\COP\4_2023-05-09' --> 'data\processed_data\COP\4_2023-05-09.md'
Error processing data\edgar_documents\COP\4_2023-05-10: File format not allowed: data\edgar_documents\COP\4_2023-05-10


2025-11-14 16:05:03,807 - INFO - Going to convert document batch...
2025-11-14 16:05:03,809 - INFO - Processing document 4_2023-06-01
2025-11-14 16:05:03,878 - INFO - Finished converting document 4_2023-06-01 in 0.14 sec.
2025-11-14 16:05:03,944 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:03,959 - INFO - Going to convert document batch...
2025-11-14 16:05:03,959 - INFO - Processing document 4_2023-07-05
2025-11-14 16:05:03,995 - INFO - Finished converting document 4_2023-07-05 in 0.08 sec.
2025-11-14 16:05:04,064 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:04,087 - INFO - Going to convert document batch...
2025-11-14 16:05:04,092 - INFO - Processing document 4_2023-08-02


Converted 'data\edgar_documents\COP\4_2023-06-01' --> 'data\processed_data\COP\4_2023-06-01.md'
Converted 'data\edgar_documents\COP\4_2023-07-05' --> 'data\processed_data\COP\4_2023-07-05.md'


2025-11-14 16:05:04,136 - INFO - Finished converting document 4_2023-08-02 in 0.11 sec.
2025-11-14 16:05:04,233 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:05:04,235 - ERROR - Input document 4_2023-08-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:05:04,237 - INFO - Going to convert document batch...
2025-11-14 16:05:04,277 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:05:04,278 - ERROR - Input document 4_2023-08-09 with forma

Converted 'data\edgar_documents\COP\4_2023-08-02' --> 'data\processed_data\COP\4_2023-08-02.md'
Error processing data\edgar_documents\COP\4_2023-08-08: File format not allowed: data\edgar_documents\COP\4_2023-08-08
Error processing data\edgar_documents\COP\4_2023-08-09: File format not allowed: data\edgar_documents\COP\4_2023-08-09


2025-11-14 16:05:04,403 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:04,421 - INFO - Going to convert document batch...
2025-11-14 16:05:04,422 - INFO - Processing document 4_2023-09-06
2025-11-14 16:05:04,466 - INFO - Finished converting document 4_2023-09-06 in 0.08 sec.
2025-11-14 16:05:04,536 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:04,551 - INFO - Going to convert document batch...
2025-11-14 16:05:04,552 - INFO - Processing document 4_2023-09-19


Converted 'data\edgar_documents\COP\4_2023-09-05' --> 'data\processed_data\COP\4_2023-09-05.md'
Converted 'data\edgar_documents\COP\4_2023-09-06' --> 'data\processed_data\COP\4_2023-09-06.md'


2025-11-14 16:05:04,586 - INFO - Finished converting document 4_2023-09-19 in 0.06 sec.
2025-11-14 16:05:04,635 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:04,653 - INFO - Going to convert document batch...
2025-11-14 16:05:04,654 - INFO - Processing document 4_2023-09-20
2025-11-14 16:05:04,690 - INFO - Finished converting document 4_2023-09-20 in 0.06 sec.
2025-11-14 16:05:04,775 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\4_2023-09-19' --> 'data\processed_data\COP\4_2023-09-19.md'
Converted 'data\edgar_documents\COP\4_2023-09-20' --> 'data\processed_data\COP\4_2023-09-20.md'


2025-11-14 16:05:04,808 - INFO - Going to convert document batch...
2025-11-14 16:05:04,811 - INFO - Processing document 4_2023-09-28
2025-11-14 16:05:04,883 - INFO - Finished converting document 4_2023-09-28 in 0.14 sec.
2025-11-14 16:05:04,939 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:04,957 - INFO - Going to convert document batch...
2025-11-14 16:05:04,959 - INFO - Processing document 4_2023-10-03
2025-11-14 16:05:04,995 - INFO - Finished converting document 4_2023-10-03 in 0.08 sec.
2025-11-14 16:05:05,047 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:05,060 - INFO - Going to convert document batch...
2025-11-14 16:05:05,063 - INFO - Processing document 4_2023-11-02


Converted 'data\edgar_documents\COP\4_2023-09-28' --> 'data\processed_data\COP\4_2023-09-28.md'
Converted 'data\edgar_documents\COP\4_2023-10-03' --> 'data\processed_data\COP\4_2023-10-03.md'


2025-11-14 16:05:05,109 - INFO - Finished converting document 4_2023-11-02 in 0.08 sec.
2025-11-14 16:05:05,165 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:05,181 - INFO - Going to convert document batch...
2025-11-14 16:05:05,182 - INFO - Processing document 4_2023-11-13
2025-11-14 16:05:05,216 - INFO - Finished converting document 4_2023-11-13 in 0.08 sec.
2025-11-14 16:05:05,264 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:05,287 - INFO - Going to convert document batch...
2025-11-14 16:05:05,290 - INFO - Processing document 4_2023-12-04
2025-11-14 16:05:05,325 - INFO - Finished converting document 4_2023-12-04 in 0.08 sec.


Converted 'data\edgar_documents\COP\4_2023-11-02' --> 'data\processed_data\COP\4_2023-11-02.md'
Converted 'data\edgar_documents\COP\4_2023-11-13' --> 'data\processed_data\COP\4_2023-11-13.md'


2025-11-14 16:05:05,379 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:05,394 - INFO - Going to convert document batch...
2025-11-14 16:05:05,395 - INFO - Processing document 4_2023-12-18
2025-11-14 16:05:05,437 - INFO - Finished converting document 4_2023-12-18 in 0.08 sec.
2025-11-14 16:05:05,502 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\4_2023-12-04' --> 'data\processed_data\COP\4_2023-12-04.md'
Converted 'data\edgar_documents\COP\4_2023-12-18' --> 'data\processed_data\COP\4_2023-12-18.md'


2025-11-14 16:05:06,238 - INFO - Going to convert document batch...
2025-11-14 16:05:06,240 - INFO - Processing document 4_2024-01-02
2025-11-14 16:05:06,276 - INFO - Finished converting document 4_2024-01-02 in 0.81 sec.
2025-11-14 16:05:06,467 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:06,500 - INFO - Going to convert document batch...
2025-11-14 16:05:06,502 - INFO - Processing document 4_2024-01-04


Converted 'data\edgar_documents\COP\4_2024-01-02' --> 'data\processed_data\COP\4_2024-01-02.md'


2025-11-14 16:05:06,558 - INFO - Finished converting document 4_2024-01-04 in 0.23 sec.
2025-11-14 16:05:06,639 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:06,656 - INFO - Going to convert document batch...
2025-11-14 16:05:06,657 - INFO - Processing document 4_2024-01-05
2025-11-14 16:05:06,691 - INFO - Finished converting document 4_2024-01-05 in 0.08 sec.
2025-11-14 16:05:06,749 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:06,759 - INFO - Going to convert document batch...
2025-11-14 16:05:06,760 - INFO - Processing document 4_2024-01-17
2025-11-14 16:05:06,781 - INFO - Finished converting document 4_2024-01-17 in 0.06 sec.


Converted 'data\edgar_documents\COP\4_2024-01-04' --> 'data\processed_data\COP\4_2024-01-04.md'
Converted 'data\edgar_documents\COP\4_2024-01-05' --> 'data\processed_data\COP\4_2024-01-05.md'
Converted 'data\edgar_documents\COP\4_2024-01-17' --> 'data\processed_data\COP\4_2024-01-17.md'


2025-11-14 16:05:06,834 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:06,874 - INFO - Going to convert document batch...
2025-11-14 16:05:06,890 - INFO - Processing document 4_2024-02-02
2025-11-14 16:05:06,927 - INFO - Finished converting document 4_2024-02-02 in 0.11 sec.
2025-11-14 16:05:06,990 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:07,007 - INFO - Going to convert document batch...
2025-11-14 16:05:07,008 - INFO - Processing document 4_2024-02-13
2025-11-14 16:05:07,077 - INFO - Finished converting document 4_2024-02-13 in 0.11 sec.


Converted 'data\edgar_documents\COP\4_2024-02-02' --> 'data\processed_data\COP\4_2024-02-02.md'
Converted 'data\edgar_documents\COP\4_2024-02-13' --> 'data\processed_data\COP\4_2024-02-13.md'


2025-11-14 16:05:07,173 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:07,203 - INFO - Going to convert document batch...
2025-11-14 16:05:07,206 - INFO - Processing document 4_2024-02-14
2025-11-14 16:05:07,286 - INFO - Finished converting document 4_2024-02-14 in 0.14 sec.
2025-11-14 16:05:07,342 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:07,357 - INFO - Going to convert document batch...
2025-11-14 16:05:07,358 - INFO - Processing document 4_2024-02-22
2025-11-14 16:05:07,390 - INFO - Finished converting document 4_2024-02-22 in 0.06 sec.
2025-11-14 16:05:07,457 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:07,471 - INFO - Going to convert document batch...
2025-11-14 16:05:07,472 - INFO - Processing document 4_2024-02-29
2025-11-14 16:05:07,505 - INFO - Finished converting document 4_2024-02-29 in 0.08 sec.


Converted 'data\edgar_documents\COP\4_2024-02-14' --> 'data\processed_data\COP\4_2024-02-14.md'
Converted 'data\edgar_documents\COP\4_2024-02-22' --> 'data\processed_data\COP\4_2024-02-22.md'


2025-11-14 16:05:07,570 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:07,591 - INFO - Going to convert document batch...
2025-11-14 16:05:07,593 - INFO - Processing document 4_2024-03-04
2025-11-14 16:05:07,628 - INFO - Finished converting document 4_2024-03-04 in 0.08 sec.
2025-11-14 16:05:07,690 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:07,713 - INFO - Going to convert document batch...
2025-11-14 16:05:07,714 - INFO - Processing document 4_2024-03-25


Converted 'data\edgar_documents\COP\4_2024-02-29' --> 'data\processed_data\COP\4_2024-02-29.md'
Converted 'data\edgar_documents\COP\4_2024-03-04' --> 'data\processed_data\COP\4_2024-03-04.md'


2025-11-14 16:05:07,762 - INFO - Finished converting document 4_2024-03-25 in 0.11 sec.
2025-11-14 16:05:07,841 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:07,877 - INFO - Going to convert document batch...
2025-11-14 16:05:07,879 - INFO - Processing document 4_2024-03-26
2025-11-14 16:05:07,951 - INFO - Finished converting document 4_2024-03-26 in 0.12 sec.


Converted 'data\edgar_documents\COP\4_2024-03-25' --> 'data\processed_data\COP\4_2024-03-25.md'
Converted 'data\edgar_documents\COP\4_2024-03-26' --> 'data\processed_data\COP\4_2024-03-26.md'


2025-11-14 16:05:08,049 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:08,064 - INFO - Going to convert document batch...
2025-11-14 16:05:08,066 - INFO - Processing document 4_2024-04-02
2025-11-14 16:05:08,104 - INFO - Finished converting document 4_2024-04-02 in 0.09 sec.
2025-11-14 16:05:08,154 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:08,170 - INFO - Going to convert document batch...
2025-11-14 16:05:08,178 - INFO - Processing document 4_2024-04-17
2025-11-14 16:05:08,226 - INFO - Finished converting document 4_2024-04-17 in 0.08 sec.
2025-11-14 16:05:08,312 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\4_2024-04-02' --> 'data\processed_data\COP\4_2024-04-02.md'
Converted 'data\edgar_documents\COP\4_2024-04-17' --> 'data\processed_data\COP\4_2024-04-17.md'


2025-11-14 16:05:08,343 - INFO - Going to convert document batch...
2025-11-14 16:05:08,346 - INFO - Processing document 4_2024-05-02
2025-11-14 16:05:08,398 - INFO - Finished converting document 4_2024-05-02 in 0.09 sec.
2025-11-14 16:05:08,479 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:05:08,481 - ERROR - Input document 4_2024-05-29 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:05:08,483 - INFO - Going to convert document batch...
2025-11-14 16:05:08,505 - IN

Converted 'data\edgar_documents\COP\4_2024-05-02' --> 'data\processed_data\COP\4_2024-05-02.md'
Error processing data\edgar_documents\COP\4_2024-05-29: File format not allowed: data\edgar_documents\COP\4_2024-05-29
Converted 'data\edgar_documents\COP\4_2024-06-04' --> 'data\processed_data\COP\4_2024-06-04.md'


2025-11-14 16:05:08,664 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:08,715 - INFO - Going to convert document batch...
2025-11-14 16:05:08,718 - INFO - Processing document 4_2024-07-02
2025-11-14 16:05:08,842 - INFO - Finished converting document 4_2024-07-02 in 0.20 sec.
2025-11-14 16:05:08,905 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:05:08,907 - ERROR - Input document 4_2024-07-12 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:05

Converted 'data\edgar_documents\COP\4_2024-07-02' --> 'data\processed_data\COP\4_2024-07-02.md'
Error processing data\edgar_documents\COP\4_2024-07-12: File format not allowed: data\edgar_documents\COP\4_2024-07-12
Error processing data\edgar_documents\COP\4_2024-07-29: File format not allowed: data\edgar_documents\COP\4_2024-07-29
Error processing data\edgar_documents\COP\4_2024-08-01: File format not allowed: data\edgar_documents\COP\4_2024-08-01


2025-11-14 16:05:09,100 - INFO - Going to convert document batch...
2025-11-14 16:05:09,102 - INFO - Processing document 4_2024-08-02
2025-11-14 16:05:09,163 - INFO - Finished converting document 4_2024-08-02 in 0.11 sec.
2025-11-14 16:05:09,227 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:09,257 - INFO - Going to convert document batch...
2025-11-14 16:05:09,259 - INFO - Processing document 4_2024-08-14
2025-11-14 16:05:09,327 - INFO - Finished converting document 4_2024-08-14 in 0.12 sec.
2025-11-14 16:05:09,402 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\4_2024-08-02' --> 'data\processed_data\COP\4_2024-08-02.md'
Converted 'data\edgar_documents\COP\4_2024-08-14' --> 'data\processed_data\COP\4_2024-08-14.md'


2025-11-14 16:05:09,459 - INFO - Going to convert document batch...
2025-11-14 16:05:09,462 - INFO - Processing document 4_2024-09-04
2025-11-14 16:05:09,506 - INFO - Finished converting document 4_2024-09-04 in 0.11 sec.
2025-11-14 16:05:09,581 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:09,609 - INFO - Going to convert document batch...
2025-11-14 16:05:09,611 - INFO - Processing document 4_2024-10-02
2025-11-14 16:05:09,674 - INFO - Finished converting document 4_2024-10-02 in 0.11 sec.


Converted 'data\edgar_documents\COP\4_2024-09-04' --> 'data\processed_data\COP\4_2024-09-04.md'


2025-11-14 16:05:09,788 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:09,822 - INFO - Going to convert document batch...
2025-11-14 16:05:09,824 - INFO - Processing document 4_2024-11-04
2025-11-14 16:05:09,876 - INFO - Finished converting document 4_2024-11-04 in 0.11 sec.


Converted 'data\edgar_documents\COP\4_2024-10-02' --> 'data\processed_data\COP\4_2024-10-02.md'
Converted 'data\edgar_documents\COP\4_2024-11-04' --> 'data\processed_data\COP\4_2024-11-04.md'


2025-11-14 16:05:09,961 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:09,998 - INFO - Going to convert document batch...
2025-11-14 16:05:10,000 - INFO - Processing document 4_2024-11-22
2025-11-14 16:05:10,086 - INFO - Finished converting document 4_2024-11-22 in 0.16 sec.
2025-11-14 16:05:10,192 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:05:10,193 - ERROR - Input document 4_2024-11-25 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:05

Converted 'data\edgar_documents\COP\4_2024-11-22' --> 'data\processed_data\COP\4_2024-11-22.md'
Error processing data\edgar_documents\COP\4_2024-11-25: File format not allowed: data\edgar_documents\COP\4_2024-11-25
Error processing data\edgar_documents\COP\4_2024-11-26: File format not allowed: data\edgar_documents\COP\4_2024-11-26


2025-11-14 16:05:10,441 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:10,467 - INFO - Going to convert document batch...
2025-11-14 16:05:10,469 - INFO - Processing document 4_2024-12-16
2025-11-14 16:05:10,542 - INFO - Finished converting document 4_2024-12-16 in 0.12 sec.


Converted 'data\edgar_documents\COP\4_2024-12-02' --> 'data\processed_data\COP\4_2024-12-02.md'
Converted 'data\edgar_documents\COP\4_2024-12-16' --> 'data\processed_data\COP\4_2024-12-16.md'


2025-11-14 16:05:10,631 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:10,656 - INFO - Going to convert document batch...
2025-11-14 16:05:10,657 - INFO - Processing document 4_2024-12-18
2025-11-14 16:05:10,711 - INFO - Finished converting document 4_2024-12-18 in 0.11 sec.
2025-11-14 16:05:10,784 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:10,814 - INFO - Going to convert document batch...
2025-11-14 16:05:10,817 - INFO - Processing document 4_2024-12-20
2025-11-14 16:05:10,881 - INFO - Finished converting document 4_2024-12-20 in 0.11 sec.
2025-11-14 16:05:10,960 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\4_2024-12-18' --> 'data\processed_data\COP\4_2024-12-18.md'
Converted 'data\edgar_documents\COP\4_2024-12-20' --> 'data\processed_data\COP\4_2024-12-20.md'


2025-11-14 16:05:10,992 - INFO - Going to convert document batch...
2025-11-14 16:05:10,994 - INFO - Processing document 4_2024-12-30
2025-11-14 16:05:11,047 - INFO - Finished converting document 4_2024-12-30 in 0.11 sec.
2025-11-14 16:05:11,107 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:11,117 - INFO - Going to convert document batch...
2025-11-14 16:05:11,117 - INFO - Processing document 4_2025-01-02
2025-11-14 16:05:11,180 - INFO - Finished converting document 4_2025-01-02 in 0.09 sec.


Converted 'data\edgar_documents\COP\4_2024-12-30' --> 'data\processed_data\COP\4_2024-12-30.md'
Converted 'data\edgar_documents\COP\4_2025-01-02' --> 'data\processed_data\COP\4_2025-01-02.md'


2025-11-14 16:05:11,273 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:11,303 - INFO - Going to convert document batch...
2025-11-14 16:05:11,306 - INFO - Processing document 4_2025-01-17
2025-11-14 16:05:11,373 - INFO - Finished converting document 4_2025-01-17 in 0.14 sec.
2025-11-14 16:05:11,452 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:11,480 - INFO - Going to convert document batch...
2025-11-14 16:05:11,482 - INFO - Processing document 4_2025-02-04
2025-11-14 16:05:11,547 - INFO - Finished converting document 4_2025-02-04 in 0.11 sec.
2025-11-14 16:05:11,642 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\4_2025-01-17' --> 'data\processed_data\COP\4_2025-01-17.md'
Converted 'data\edgar_documents\COP\4_2025-02-04' --> 'data\processed_data\COP\4_2025-02-04.md'


2025-11-14 16:05:11,685 - INFO - Going to convert document batch...
2025-11-14 16:05:11,686 - INFO - Processing document 4_2025-02-11
2025-11-14 16:05:11,727 - INFO - Finished converting document 4_2025-02-11 in 0.11 sec.
2025-11-14 16:05:11,799 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:11,821 - INFO - Going to convert document batch...
2025-11-14 16:05:11,822 - INFO - Processing document 4_2025-02-13
2025-11-14 16:05:11,858 - INFO - Finished converting document 4_2025-02-13 in 0.09 sec.
2025-11-14 16:05:11,949 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\4_2025-02-11' --> 'data\processed_data\COP\4_2025-02-11.md'
Converted 'data\edgar_documents\COP\4_2025-02-13' --> 'data\processed_data\COP\4_2025-02-13.md'


2025-11-14 16:05:11,981 - INFO - Going to convert document batch...
2025-11-14 16:05:11,984 - INFO - Processing document 4_2025-03-04
2025-11-14 16:05:12,053 - INFO - Finished converting document 4_2025-03-04 in 0.12 sec.
2025-11-14 16:05:12,128 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:12,146 - INFO - Going to convert document batch...
2025-11-14 16:05:12,148 - INFO - Processing document 4_2025-04-02
2025-11-14 16:05:12,201 - INFO - Finished converting document 4_2025-04-02 in 0.09 sec.
2025-11-14 16:05:12,272 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\4_2025-03-04' --> 'data\processed_data\COP\4_2025-03-04.md'
Converted 'data\edgar_documents\COP\4_2025-04-02' --> 'data\processed_data\COP\4_2025-04-02.md'


2025-11-14 16:05:12,301 - INFO - Going to convert document batch...
2025-11-14 16:05:12,305 - INFO - Processing document 4_2025-05-01
2025-11-14 16:05:12,376 - INFO - Finished converting document 4_2025-05-01 in 0.14 sec.
2025-11-14 16:05:12,464 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:05:12,466 - ERROR - Input document 4_2025-05-16 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:05:12,468 - INFO - Going to convert document batch...
2025-11-14 16:05:12,488 - IN

Converted 'data\edgar_documents\COP\4_2025-05-01' --> 'data\processed_data\COP\4_2025-05-01.md'
Error processing data\edgar_documents\COP\4_2025-05-16: File format not allowed: data\edgar_documents\COP\4_2025-05-16


2025-11-14 16:05:12,688 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:12,713 - INFO - Going to convert document batch...
2025-11-14 16:05:12,715 - INFO - Processing document 4_2025-06-17
2025-11-14 16:05:12,758 - INFO - Finished converting document 4_2025-06-17 in 0.09 sec.
2025-11-14 16:05:12,812 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:12,829 - INFO - Going to convert document batch...
2025-11-14 16:05:12,830 - INFO - Processing document 4_2025-07-02


Converted 'data\edgar_documents\COP\4_2025-06-02' --> 'data\processed_data\COP\4_2025-06-02.md'
Converted 'data\edgar_documents\COP\4_2025-06-17' --> 'data\processed_data\COP\4_2025-06-17.md'


2025-11-14 16:05:12,867 - INFO - Finished converting document 4_2025-07-02 in 0.06 sec.
2025-11-14 16:05:12,957 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:12,996 - INFO - Going to convert document batch...
2025-11-14 16:05:13,002 - INFO - Processing document 4_2025-08-04
2025-11-14 16:05:13,051 - INFO - Finished converting document 4_2025-08-04 in 0.12 sec.
2025-11-14 16:05:13,116 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\4_2025-07-02' --> 'data\processed_data\COP\4_2025-07-02.md'
Converted 'data\edgar_documents\COP\4_2025-08-04' --> 'data\processed_data\COP\4_2025-08-04.md'


2025-11-14 16:05:13,131 - INFO - Going to convert document batch...
2025-11-14 16:05:13,132 - INFO - Processing document 4_2025-09-03
2025-11-14 16:05:13,169 - INFO - Finished converting document 4_2025-09-03 in 0.08 sec.
2025-11-14 16:05:13,214 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:13,239 - INFO - Going to convert document batch...
2025-11-14 16:05:13,242 - INFO - Processing document 4_2025-10-02
2025-11-14 16:05:13,317 - INFO - Finished converting document 4_2025-10-02 in 0.11 sec.


Converted 'data\edgar_documents\COP\4_2025-09-03' --> 'data\processed_data\COP\4_2025-09-03.md'
Converted 'data\edgar_documents\COP\4_2025-10-02' --> 'data\processed_data\COP\4_2025-10-02.md'


2025-11-14 16:05:13,394 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:13,415 - INFO - Going to convert document batch...
2025-11-14 16:05:13,416 - INFO - Processing document 4_2025-11-10
2025-11-14 16:05:13,457 - INFO - Finished converting document 4_2025-11-10 in 0.09 sec.
2025-11-14 16:05:13,534 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:13,574 - INFO - Going to convert document batch...
2025-11-14 16:05:13,576 - INFO - Processing document 8-K_2023-02-02
2025-11-14 16:05:13,622 - INFO - Finished converting document 8-K_2023-02-02 in 0.12 sec.


Converted 'data\edgar_documents\COP\4_2025-11-10' --> 'data\processed_data\COP\4_2025-11-10.md'
Converted 'data\edgar_documents\COP\8-K_2023-02-02' --> 'data\processed_data\COP\8-K_2023-02-02.md'


2025-11-14 16:05:13,683 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:13,724 - INFO - Going to convert document batch...
2025-11-14 16:05:13,727 - INFO - Processing document 8-K_2023-05-04
2025-11-14 16:05:13,791 - INFO - Finished converting document 8-K_2023-05-04 in 0.16 sec.
2025-11-14 16:05:13,842 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:13,915 - INFO - Going to convert document batch...
2025-11-14 16:05:13,917 - INFO - Processing document 8-K_2023-05-18


Converted 'data\edgar_documents\COP\8-K_2023-05-04' --> 'data\processed_data\COP\8-K_2023-05-04.md'


2025-11-14 16:05:14,094 - INFO - Finished converting document 8-K_2023-05-18 in 0.27 sec.
2025-11-14 16:05:14,296 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:14,325 - INFO - Going to convert document batch...
2025-11-14 16:05:14,326 - INFO - Processing document 8-K_2023-05-23
2025-11-14 16:05:14,362 - INFO - Finished converting document 8-K_2023-05-23 in 0.09 sec.
2025-11-14 16:05:14,432 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\8-K_2023-05-18' --> 'data\processed_data\COP\8-K_2023-05-18.md'
Converted 'data\edgar_documents\COP\8-K_2023-05-23' --> 'data\processed_data\COP\8-K_2023-05-23.md'


2025-11-14 16:05:14,474 - INFO - Going to convert document batch...
2025-11-14 16:05:14,477 - INFO - Processing document 8-K_2023-08-03
2025-11-14 16:05:14,529 - INFO - Finished converting document 8-K_2023-08-03 in 0.14 sec.
2025-11-14 16:05:14,583 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:14,621 - INFO - Going to convert document batch...
2025-11-14 16:05:14,622 - INFO - Processing document 8-K_2023-08-17
2025-11-14 16:05:14,675 - INFO - Finished converting document 8-K_2023-08-17 in 0.12 sec.


Converted 'data\edgar_documents\COP\8-K_2023-08-03' --> 'data\processed_data\COP\8-K_2023-08-03.md'
Converted 'data\edgar_documents\COP\8-K_2023-08-17' --> 'data\processed_data\COP\8-K_2023-08-17.md'


2025-11-14 16:05:14,761 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:14,805 - INFO - Going to convert document batch...
2025-11-14 16:05:14,806 - INFO - Processing document 8-K_2023-11-02
2025-11-14 16:05:14,844 - INFO - Finished converting document 8-K_2023-11-02 in 0.12 sec.
2025-11-14 16:05:14,888 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:14,915 - INFO - Going to convert document batch...
2025-11-14 16:05:14,917 - INFO - Processing document 8-K_2024-02-08
2025-11-14 16:05:14,965 - INFO - Finished converting document 8-K_2024-02-08 in 0.09 sec.
2025-11-14 16:05:15,038 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\8-K_2023-11-02' --> 'data\processed_data\COP\8-K_2023-11-02.md'
Converted 'data\edgar_documents\COP\8-K_2024-02-08' --> 'data\processed_data\COP\8-K_2024-02-08.md'


2025-11-14 16:05:15,072 - INFO - Going to convert document batch...
2025-11-14 16:05:15,076 - INFO - Processing document 8-K_2024-02-15
2025-11-14 16:05:15,138 - INFO - Finished converting document 8-K_2024-02-15 in 0.14 sec.
2025-11-14 16:05:15,188 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:15,219 - INFO - Going to convert document batch...
2025-11-14 16:05:15,223 - INFO - Processing document 8-K_2024-05-02
2025-11-14 16:05:15,272 - INFO - Finished converting document 8-K_2024-05-02 in 0.09 sec.
2025-11-14 16:05:15,344 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\8-K_2024-02-15' --> 'data\processed_data\COP\8-K_2024-02-15.md'
Converted 'data\edgar_documents\COP\8-K_2024-05-02' --> 'data\processed_data\COP\8-K_2024-05-02.md'


2025-11-14 16:05:15,411 - INFO - Going to convert document batch...
2025-11-14 16:05:15,413 - INFO - Processing document 8-K_2024-05-16
2025-11-14 16:05:15,535 - INFO - Finished converting document 8-K_2024-05-16 in 0.23 sec.
2025-11-14 16:05:15,610 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:15,636 - INFO - Going to convert document batch...
2025-11-14 16:05:15,638 - INFO - Processing document 8-K_2024-05-29
2025-11-14 16:05:15,711 - INFO - Finished converting document 8-K_2024-05-29 in 0.12 sec.


Converted 'data\edgar_documents\COP\8-K_2024-05-16' --> 'data\processed_data\COP\8-K_2024-05-16.md'


2025-11-14 16:05:15,812 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:15,847 - INFO - Going to convert document batch...
2025-11-14 16:05:15,850 - INFO - Processing document 8-K_2024-07-02
2025-11-14 16:05:15,888 - INFO - Finished converting document 8-K_2024-07-02 in 0.09 sec.
2025-11-14 16:05:15,939 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:15,969 - INFO - Going to convert document batch...
2025-11-14 16:05:15,971 - INFO - Processing document 8-K_2024-07-12


Converted 'data\edgar_documents\COP\8-K_2024-05-29' --> 'data\processed_data\COP\8-K_2024-05-29.md'
Converted 'data\edgar_documents\COP\8-K_2024-07-02' --> 'data\processed_data\COP\8-K_2024-07-02.md'


2025-11-14 16:05:16,021 - INFO - Finished converting document 8-K_2024-07-12 in 0.11 sec.
2025-11-14 16:05:16,475 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:16,494 - INFO - Going to convert document batch...
2025-11-14 16:05:16,495 - INFO - Processing document 8-K_2024-08-01
2025-11-14 16:05:16,524 - INFO - Finished converting document 8-K_2024-08-01 in 0.06 sec.
2025-11-14 16:05:16,582 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:16,611 - INFO - Going to convert document batch...
2025-11-14 16:05:16,612 - INFO - Processing document 8-K_2024-09-03


Converted 'data\edgar_documents\COP\8-K_2024-07-12' --> 'data\processed_data\COP\8-K_2024-07-12.md'
Converted 'data\edgar_documents\COP\8-K_2024-08-01' --> 'data\processed_data\COP\8-K_2024-08-01.md'


2025-11-14 16:05:16,673 - INFO - Finished converting document 8-K_2024-09-03 in 0.14 sec.
2025-11-14 16:05:16,731 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:16,749 - INFO - Going to convert document batch...
2025-11-14 16:05:16,750 - INFO - Processing document 8-K_2024-10-31
2025-11-14 16:05:16,787 - INFO - Finished converting document 8-K_2024-10-31 in 0.06 sec.
2025-11-14 16:05:16,843 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\8-K_2024-09-03' --> 'data\processed_data\COP\8-K_2024-09-03.md'
Converted 'data\edgar_documents\COP\8-K_2024-10-31' --> 'data\processed_data\COP\8-K_2024-10-31.md'


2025-11-14 16:05:16,912 - INFO - Going to convert document batch...
2025-11-14 16:05:16,914 - INFO - Processing document 8-K_2024-11-22
2025-11-14 16:05:17,066 - INFO - Finished converting document 8-K_2024-11-22 in 0.25 sec.
2025-11-14 16:05:17,185 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:17,202 - INFO - Going to convert document batch...
2025-11-14 16:05:17,203 - INFO - Processing document 8-K_2024-11-25
2025-11-14 16:05:17,271 - INFO - Finished converting document 8-K_2024-11-25 in 0.11 sec.


Converted 'data\edgar_documents\COP\8-K_2024-11-22' --> 'data\processed_data\COP\8-K_2024-11-22.md'
Converted 'data\edgar_documents\COP\8-K_2024-11-25' --> 'data\processed_data\COP\8-K_2024-11-25.md'


2025-11-14 16:05:17,351 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:17,387 - INFO - Going to convert document batch...
2025-11-14 16:05:17,389 - INFO - Processing document 8-K_2024-12-05
2025-11-14 16:05:17,485 - INFO - Finished converting document 8-K_2024-12-05 in 0.17 sec.
2025-11-14 16:05:17,585 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:17,625 - INFO - Going to convert document batch...
2025-11-14 16:05:17,627 - INFO - Processing document 8-K_2024-12-10
2025-11-14 16:05:17,696 - INFO - Finished converting document 8-K_2024-12-10 in 0.16 sec.


Converted 'data\edgar_documents\COP\8-K_2024-12-05' --> 'data\processed_data\COP\8-K_2024-12-05.md'


2025-11-14 16:05:17,778 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:17,828 - INFO - Going to convert document batch...
2025-11-14 16:05:17,830 - INFO - Processing document 8-K_2024-12-30
2025-11-14 16:05:17,891 - INFO - Finished converting document 8-K_2024-12-30 in 0.16 sec.


Converted 'data\edgar_documents\COP\8-K_2024-12-10' --> 'data\processed_data\COP\8-K_2024-12-10.md'


2025-11-14 16:05:17,964 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:18,002 - INFO - Going to convert document batch...
2025-11-14 16:05:18,002 - INFO - Processing document 8-K_2025-01-28
2025-11-14 16:05:18,048 - INFO - Finished converting document 8-K_2025-01-28 in 0.09 sec.
2025-11-14 16:05:18,110 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:18,129 - INFO - Going to convert document batch...
2025-11-14 16:05:18,130 - INFO - Processing document 8-K_2025-02-06
2025-11-14 16:05:18,154 - INFO - Finished converting document 8-K_2025-02-06 in 0.08 sec.


Converted 'data\edgar_documents\COP\8-K_2024-12-30' --> 'data\processed_data\COP\8-K_2024-12-30.md'
Converted 'data\edgar_documents\COP\8-K_2025-01-28' --> 'data\processed_data\COP\8-K_2025-01-28.md'


2025-11-14 16:05:18,180 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:18,199 - INFO - Going to convert document batch...
2025-11-14 16:05:18,201 - INFO - Processing document 8-K_2025-05-08
2025-11-14 16:05:18,232 - INFO - Finished converting document 8-K_2025-05-08 in 0.06 sec.
2025-11-14 16:05:18,292 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\8-K_2025-02-06' --> 'data\processed_data\COP\8-K_2025-02-06.md'
Converted 'data\edgar_documents\COP\8-K_2025-05-08' --> 'data\processed_data\COP\8-K_2025-05-08.md'


2025-11-14 16:05:18,357 - INFO - Going to convert document batch...
2025-11-14 16:05:18,359 - INFO - Processing document 8-K_2025-05-15
2025-11-14 16:05:18,450 - INFO - Finished converting document 8-K_2025-05-15 in 0.20 sec.
2025-11-14 16:05:18,519 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:18,553 - INFO - Going to convert document batch...
2025-11-14 16:05:18,553 - INFO - Processing document 8-K_2025-07-01
2025-11-14 16:05:18,595 - INFO - Finished converting document 8-K_2025-07-01 in 0.09 sec.


Converted 'data\edgar_documents\COP\8-K_2025-05-15' --> 'data\processed_data\COP\8-K_2025-05-15.md'
Converted 'data\edgar_documents\COP\8-K_2025-07-01' --> 'data\processed_data\COP\8-K_2025-07-01.md'


2025-11-14 16:05:18,695 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:18,723 - INFO - Going to convert document batch...
2025-11-14 16:05:18,725 - INFO - Processing document 8-K_2025-08-07
2025-11-14 16:05:18,769 - INFO - Finished converting document 8-K_2025-08-07 in 0.11 sec.
2025-11-14 16:05:18,805 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:05:18,831 - INFO - Going to convert document batch...
2025-11-14 16:05:18,833 - INFO - Processing document 8-K_2025-11-06
2025-11-14 16:05:18,882 - INFO - Finished converting document 8-K_2025-11-06 in 0.09 sec.


Converted 'data\edgar_documents\COP\8-K_2025-08-07' --> 'data\processed_data\COP\8-K_2025-08-07.md'
Converted 'data\edgar_documents\COP\8-K_2025-11-06' --> 'data\processed_data\COP\8-K_2025-11-06.md'


2025-11-14 16:05:19,021 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:05:19,021 - ERROR - Input document DEF-14A_2023-04-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:05:19,025 - INFO - Going to convert document batch...
2025-11-14 16:05:19,095 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Error processing data\edgar_documents\COP\DEF-14A_2023-04-03: File format not allowed: data\edgar_documents\COP\DEF-14A_2023-04-03


2025-11-14 16:05:21,252 - INFO - Going to convert document batch...
2025-11-14 16:05:21,254 - INFO - Processing document DEF-14A_2024-04-01
2025-11-14 16:05:49,662 - INFO - Finished converting document DEF-14A_2024-04-01 in 30.62 sec.
2025-11-14 16:05:52,525 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\DEF-14A_2024-04-01' --> 'data\processed_data\COP\DEF-14A_2024-04-01.md'


2025-11-14 16:05:55,434 - INFO - Going to convert document batch...
2025-11-14 16:05:55,436 - INFO - Processing document DEF-14A_2025-03-31
2025-11-14 16:06:55,526 - INFO - Finished converting document DEF-14A_2025-03-31 in 63.11 sec.
2025-11-14 16:06:59,278 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COP\DEF-14A_2025-03-31' --> 'data\processed_data\COP\DEF-14A_2025-03-31.md'
Processed 112 new files. Errors: 12
Found 104 files to process in data\edgar_documents\COST


2025-11-14 16:07:00,365 - INFO - Going to convert document batch...
2025-11-14 16:07:00,366 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:07:00,368 - INFO - Processing document 10-K_2023-10-11
2025-11-14 16:07:02,295 - INFO - Finished converting document 10-K_2023-10-11 in 3.06 sec.
2025-11-14 16:07:03,139 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\10-K_2023-10-11' --> 'data\processed_data\COST\10-K_2023-10-11.md'


2025-11-14 16:07:03,930 - INFO - Going to convert document batch...
2025-11-14 16:07:03,931 - INFO - Processing document 10-K_2024-10-09
2025-11-14 16:07:06,813 - INFO - Finished converting document 10-K_2024-10-09 in 3.70 sec.
2025-11-14 16:07:07,683 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\10-K_2024-10-09' --> 'data\processed_data\COST\10-K_2024-10-09.md'


2025-11-14 16:07:08,554 - INFO - Going to convert document batch...
2025-11-14 16:07:08,557 - INFO - Processing document 10-K_2025-10-08
2025-11-14 16:07:10,380 - INFO - Finished converting document 10-K_2025-10-08 in 2.73 sec.
2025-11-14 16:07:11,324 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\10-K_2025-10-08' --> 'data\processed_data\COST\10-K_2025-10-08.md'


2025-11-14 16:07:12,017 - INFO - Going to convert document batch...
2025-11-14 16:07:12,018 - INFO - Processing document 10-Q_2023-03-09
2025-11-14 16:07:13,017 - INFO - Finished converting document 10-Q_2023-03-09 in 1.72 sec.
2025-11-14 16:07:13,564 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\10-Q_2023-03-09' --> 'data\processed_data\COST\10-Q_2023-03-09.md'


2025-11-14 16:07:14,842 - INFO - Going to convert document batch...
2025-11-14 16:07:14,844 - INFO - Processing document 10-Q_2023-06-01
2025-11-14 16:07:15,940 - INFO - Finished converting document 10-Q_2023-06-01 in 2.41 sec.
2025-11-14 16:07:16,458 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\10-Q_2023-06-01' --> 'data\processed_data\COST\10-Q_2023-06-01.md'


2025-11-14 16:07:16,856 - INFO - Going to convert document batch...
2025-11-14 16:07:16,858 - INFO - Processing document 10-Q_2023-12-20
2025-11-14 16:07:17,576 - INFO - Finished converting document 10-Q_2023-12-20 in 1.14 sec.
2025-11-14 16:07:17,991 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\10-Q_2023-12-20' --> 'data\processed_data\COST\10-Q_2023-12-20.md'


2025-11-14 16:07:18,420 - INFO - Going to convert document batch...
2025-11-14 16:07:18,421 - INFO - Processing document 10-Q_2024-03-13
2025-11-14 16:07:19,289 - INFO - Finished converting document 10-Q_2024-03-13 in 1.34 sec.
2025-11-14 16:07:19,759 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\10-Q_2024-03-13' --> 'data\processed_data\COST\10-Q_2024-03-13.md'


2025-11-14 16:07:20,788 - INFO - Going to convert document batch...
2025-11-14 16:07:20,790 - INFO - Processing document 10-Q_2024-06-06
2025-11-14 16:07:21,734 - INFO - Finished converting document 10-Q_2024-06-06 in 2.00 sec.
2025-11-14 16:07:22,503 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\10-Q_2024-06-06' --> 'data\processed_data\COST\10-Q_2024-06-06.md'


2025-11-14 16:07:22,875 - INFO - Going to convert document batch...
2025-11-14 16:07:22,877 - INFO - Processing document 10-Q_2024-12-19
2025-11-14 16:07:23,634 - INFO - Finished converting document 10-Q_2024-12-19 in 1.19 sec.
2025-11-14 16:07:24,147 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\10-Q_2024-12-19' --> 'data\processed_data\COST\10-Q_2024-12-19.md'


2025-11-14 16:07:24,617 - INFO - Going to convert document batch...
2025-11-14 16:07:24,618 - INFO - Processing document 10-Q_2025-03-13
2025-11-14 16:07:25,674 - INFO - Finished converting document 10-Q_2025-03-13 in 1.56 sec.
2025-11-14 16:07:26,309 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\10-Q_2025-03-13' --> 'data\processed_data\COST\10-Q_2025-03-13.md'


2025-11-14 16:07:27,233 - INFO - Going to convert document batch...
2025-11-14 16:07:27,235 - INFO - Processing document 10-Q_2025-06-05
2025-11-14 16:07:28,404 - INFO - Finished converting document 10-Q_2025-06-05 in 2.16 sec.
2025-11-14 16:07:28,952 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:28,971 - INFO - Going to convert document batch...
2025-11-14 16:07:28,975 - INFO - Processing document 4_2023-01-31
2025-11-14 16:07:29,014 - INFO - Finished converting document 4_2023-01-31 in 0.08 sec.
2025-11-14 16:07:29,110 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:29,144 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COST\10-Q_2025-06-05' --> 'data\processed_data\COST\10-Q_2025-06-05.md'
Converted 'data\edgar_documents\COST\4_2023-01-31' --> 'data\processed_data\COST\4_2023-01-31.md'


2025-11-14 16:07:29,146 - INFO - Processing document 4_2023-03-07
2025-11-14 16:07:29,201 - INFO - Finished converting document 4_2023-03-07 in 0.12 sec.
2025-11-14 16:07:29,258 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:29,275 - INFO - Going to convert document batch...
2025-11-14 16:07:29,277 - INFO - Processing document 4_2023-03-08
2025-11-14 16:07:29,343 - INFO - Finished converting document 4_2023-03-08 in 0.11 sec.
2025-11-14 16:07:29,434 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\4_2023-03-07' --> 'data\processed_data\COST\4_2023-03-07.md'
Converted 'data\edgar_documents\COST\4_2023-03-08' --> 'data\processed_data\COST\4_2023-03-08.md'


2025-11-14 16:07:29,459 - INFO - Going to convert document batch...
2025-11-14 16:07:29,461 - INFO - Processing document 4_2023-03-15
2025-11-14 16:07:29,549 - INFO - Finished converting document 4_2023-03-15 in 0.14 sec.
2025-11-14 16:07:29,650 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:29,680 - INFO - Going to convert document batch...
2025-11-14 16:07:29,681 - INFO - Processing document 4_2023-04-13
2025-11-14 16:07:29,737 - INFO - Finished converting document 4_2023-04-13 in 0.12 sec.


Converted 'data\edgar_documents\COST\4_2023-03-15' --> 'data\processed_data\COST\4_2023-03-15.md'
Converted 'data\edgar_documents\COST\4_2023-04-13' --> 'data\processed_data\COST\4_2023-04-13.md'


2025-11-14 16:07:29,833 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:29,865 - INFO - Going to convert document batch...
2025-11-14 16:07:29,867 - INFO - Processing document 4_2023-06-09
2025-11-14 16:07:29,935 - INFO - Finished converting document 4_2023-06-09 in 0.14 sec.
2025-11-14 16:07:30,000 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:30,015 - INFO - Going to convert document batch...
2025-11-14 16:07:30,016 - INFO - Processing document 4_2023-06-15
2025-11-14 16:07:30,058 - INFO - Finished converting document 4_2023-06-15 in 0.08 sec.
2025-11-14 16:07:30,147 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:30,165 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COST\4_2023-06-09' --> 'data\processed_data\COST\4_2023-06-09.md'
Converted 'data\edgar_documents\COST\4_2023-06-15' --> 'data\processed_data\COST\4_2023-06-15.md'


2025-11-14 16:07:30,167 - INFO - Processing document 4_2023-06-26
2025-11-14 16:07:30,208 - INFO - Finished converting document 4_2023-06-26 in 0.09 sec.
2025-11-14 16:07:30,267 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:30,289 - INFO - Going to convert document batch...
2025-11-14 16:07:30,292 - INFO - Processing document 4_2023-06-29
2025-11-14 16:07:30,325 - INFO - Finished converting document 4_2023-06-29 in 0.08 sec.
2025-11-14 16:07:30,403 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:30,421 - INFO - Going to convert document batch...
2025-11-14 16:07:30,423 - INFO - Processing document 4_2023-09-19


Converted 'data\edgar_documents\COST\4_2023-06-26' --> 'data\processed_data\COST\4_2023-06-26.md'
Converted 'data\edgar_documents\COST\4_2023-06-29' --> 'data\processed_data\COST\4_2023-06-29.md'


2025-11-14 16:07:30,470 - INFO - Finished converting document 4_2023-09-19 in 0.09 sec.
2025-11-14 16:07:30,561 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:30,580 - INFO - Going to convert document batch...
2025-11-14 16:07:30,582 - INFO - Processing document 4_2023-09-28
2025-11-14 16:07:30,618 - INFO - Finished converting document 4_2023-09-28 in 0.08 sec.
2025-11-14 16:07:30,682 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:30,706 - INFO - Going to convert document batch...
2025-11-14 16:07:30,708 - INFO - Processing document 4_2023-10-11


Converted 'data\edgar_documents\COST\4_2023-09-19' --> 'data\processed_data\COST\4_2023-09-19.md'
Converted 'data\edgar_documents\COST\4_2023-09-28' --> 'data\processed_data\COST\4_2023-09-28.md'


2025-11-14 16:07:30,784 - INFO - Finished converting document 4_2023-10-11 in 0.12 sec.
2025-11-14 16:07:30,867 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:30,890 - INFO - Going to convert document batch...
2025-11-14 16:07:30,891 - INFO - Processing document 4_2023-10-12
2025-11-14 16:07:30,931 - INFO - Finished converting document 4_2023-10-12 in 0.08 sec.
2025-11-14 16:07:31,015 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\4_2023-10-11' --> 'data\processed_data\COST\4_2023-10-11.md'
Converted 'data\edgar_documents\COST\4_2023-10-12' --> 'data\processed_data\COST\4_2023-10-12.md'


2025-11-14 16:07:31,060 - INFO - Going to convert document batch...
2025-11-14 16:07:31,062 - INFO - Processing document 4_2023-10-24
2025-11-14 16:07:31,137 - INFO - Finished converting document 4_2023-10-24 in 0.16 sec.
2025-11-14 16:07:31,195 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:31,220 - INFO - Going to convert document batch...
2025-11-14 16:07:31,222 - INFO - Processing document 4_2023-11-06
2025-11-14 16:07:31,268 - INFO - Finished converting document 4_2023-11-06 in 0.09 sec.
2025-11-14 16:07:31,327 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:31,350 - INFO - Going to convert document batch...
2025-11-14 16:07:31,352 - INFO - Processing document 4_2023-11-08


Converted 'data\edgar_documents\COST\4_2023-10-24' --> 'data\processed_data\COST\4_2023-10-24.md'
Converted 'data\edgar_documents\COST\4_2023-11-06' --> 'data\processed_data\COST\4_2023-11-06.md'


2025-11-14 16:07:31,386 - INFO - Finished converting document 4_2023-11-08 in 0.08 sec.
2025-11-14 16:07:31,443 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:31,462 - INFO - Going to convert document batch...
2025-11-14 16:07:31,463 - INFO - Processing document 4_2023-11-13
2025-11-14 16:07:31,509 - INFO - Finished converting document 4_2023-11-13 in 0.08 sec.
2025-11-14 16:07:31,565 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:31,593 - INFO - Going to convert document batch...
2025-11-14 16:07:31,594 - INFO - Processing document 4_2023-12-20


Converted 'data\edgar_documents\COST\4_2023-11-08' --> 'data\processed_data\COST\4_2023-11-08.md'
Converted 'data\edgar_documents\COST\4_2023-11-13' --> 'data\processed_data\COST\4_2023-11-13.md'


2025-11-14 16:07:31,665 - INFO - Finished converting document 4_2023-12-20 in 0.11 sec.
2025-11-14 16:07:31,744 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:31,769 - INFO - Going to convert document batch...
2025-11-14 16:07:31,770 - INFO - Processing document 4_2023-12-28
2025-11-14 16:07:31,811 - INFO - Finished converting document 4_2023-12-28 in 0.09 sec.
2025-11-14 16:07:31,868 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:31,890 - INFO - Going to convert document batch...
2025-11-14 16:07:31,892 - INFO - Processing document 4_2024-01-02


Converted 'data\edgar_documents\COST\4_2023-12-20' --> 'data\processed_data\COST\4_2023-12-20.md'
Converted 'data\edgar_documents\COST\4_2023-12-28' --> 'data\processed_data\COST\4_2023-12-28.md'


2025-11-14 16:07:31,932 - INFO - Finished converting document 4_2024-01-02 in 0.09 sec.
2025-11-14 16:07:32,003 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:32,025 - INFO - Going to convert document batch...
2025-11-14 16:07:32,026 - INFO - Processing document 4_2024-01-10
2025-11-14 16:07:32,068 - INFO - Finished converting document 4_2024-01-10 in 0.08 sec.
2025-11-14 16:07:32,132 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:32,147 - INFO - Going to convert document batch...
2025-11-14 16:07:32,149 - INFO - Processing document 4_2024-01-12
2025-11-14 16:07:32,187 - INFO - Finished converting document 4_2024-01-12 in 0.08 sec.


Converted 'data\edgar_documents\COST\4_2024-01-02' --> 'data\processed_data\COST\4_2024-01-02.md'
Converted 'data\edgar_documents\COST\4_2024-01-10' --> 'data\processed_data\COST\4_2024-01-10.md'


2025-11-14 16:07:32,234 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:32,249 - INFO - Going to convert document batch...
2025-11-14 16:07:32,250 - INFO - Processing document 4_2024-01-16
2025-11-14 16:07:32,289 - INFO - Finished converting document 4_2024-01-16 in 0.06 sec.
2025-11-14 16:07:32,346 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:32,362 - INFO - Going to convert document batch...
2025-11-14 16:07:32,364 - INFO - Processing document 4_2024-01-18
2025-11-14 16:07:32,398 - INFO - Finished converting document 4_2024-01-18 in 0.06 sec.


Converted 'data\edgar_documents\COST\4_2024-01-12' --> 'data\processed_data\COST\4_2024-01-12.md'
Converted 'data\edgar_documents\COST\4_2024-01-16' --> 'data\processed_data\COST\4_2024-01-16.md'


2025-11-14 16:07:32,457 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:32,475 - INFO - Going to convert document batch...
2025-11-14 16:07:32,477 - INFO - Processing document 4_2024-01-23
2025-11-14 16:07:32,536 - INFO - Finished converting document 4_2024-01-23 in 0.11 sec.
2025-11-14 16:07:32,603 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\4_2024-01-18' --> 'data\processed_data\COST\4_2024-01-18.md'
Converted 'data\edgar_documents\COST\4_2024-01-23' --> 'data\processed_data\COST\4_2024-01-23.md'


2025-11-14 16:07:32,617 - INFO - Going to convert document batch...
2025-11-14 16:07:32,618 - INFO - Processing document 4_2024-02-12
2025-11-14 16:07:32,652 - INFO - Finished converting document 4_2024-02-12 in 0.08 sec.
2025-11-14 16:07:32,702 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:32,720 - INFO - Going to convert document batch...
2025-11-14 16:07:32,721 - INFO - Processing document 4_2024-02-22
2025-11-14 16:07:32,772 - INFO - Finished converting document 4_2024-02-22 in 0.08 sec.
2025-11-14 16:07:32,827 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:32,844 - INFO - Going to convert document batch...
2025-11-14 16:07:32,845 - INFO - Processing document 4_2024-03-13


Converted 'data\edgar_documents\COST\4_2024-02-12' --> 'data\processed_data\COST\4_2024-02-12.md'
Converted 'data\edgar_documents\COST\4_2024-02-22' --> 'data\processed_data\COST\4_2024-02-22.md'


2025-11-14 16:07:32,879 - INFO - Finished converting document 4_2024-03-13 in 0.06 sec.
2025-11-14 16:07:32,937 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:32,969 - INFO - Going to convert document batch...
2025-11-14 16:07:32,971 - INFO - Processing document 4_2024-04-09
2025-11-14 16:07:33,037 - INFO - Finished converting document 4_2024-04-09 in 0.11 sec.


Converted 'data\edgar_documents\COST\4_2024-03-13' --> 'data\processed_data\COST\4_2024-03-13.md'
Converted 'data\edgar_documents\COST\4_2024-04-09' --> 'data\processed_data\COST\4_2024-04-09.md'


2025-11-14 16:07:33,107 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:33,133 - INFO - Going to convert document batch...
2025-11-14 16:07:33,135 - INFO - Processing document 4_2024-04-18
2025-11-14 16:07:33,177 - INFO - Finished converting document 4_2024-04-18 in 0.09 sec.
2025-11-14 16:07:33,227 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:33,241 - INFO - Going to convert document batch...
2025-11-14 16:07:33,242 - INFO - Processing document 4_2024-07-15
2025-11-14 16:07:33,297 - INFO - Finished converting document 4_2024-07-15 in 0.09 sec.


Converted 'data\edgar_documents\COST\4_2024-04-18' --> 'data\processed_data\COST\4_2024-04-18.md'
Converted 'data\edgar_documents\COST\4_2024-07-15' --> 'data\processed_data\COST\4_2024-07-15.md'


2025-11-14 16:07:33,395 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:33,421 - INFO - Going to convert document batch...
2025-11-14 16:07:33,425 - INFO - Processing document 4_2024-07-17
2025-11-14 16:07:33,474 - INFO - Finished converting document 4_2024-07-17 in 0.09 sec.
2025-11-14 16:07:33,537 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:33,569 - INFO - Going to convert document batch...
2025-11-14 16:07:33,570 - INFO - Processing document 4_2024-07-22
2025-11-14 16:07:33,618 - INFO - Finished converting document 4_2024-07-22 in 0.08 sec.
2025-11-14 16:07:33,684 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:33,725 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COST\4_2024-07-17' --> 'data\processed_data\COST\4_2024-07-17.md'
Converted 'data\edgar_documents\COST\4_2024-07-22' --> 'data\processed_data\COST\4_2024-07-22.md'


2025-11-14 16:07:33,727 - INFO - Processing document 4_2024-08-15
2025-11-14 16:07:33,781 - INFO - Finished converting document 4_2024-08-15 in 0.12 sec.
2025-11-14 16:07:33,835 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:33,852 - INFO - Going to convert document batch...
2025-11-14 16:07:33,854 - INFO - Processing document 4_2024-08-29
2025-11-14 16:07:33,891 - INFO - Finished converting document 4_2024-08-29 in 0.06 sec.
2025-11-14 16:07:33,940 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:33,958 - INFO - Going to convert document batch...
2025-11-14 16:07:33,959 - INFO - Processing document 4_2024-09-18
2025-11-14 16:07:34,001 - INFO - Finished converting document 4_2024-09-18 in 0.08 sec.


Converted 'data\edgar_documents\COST\4_2024-08-15' --> 'data\processed_data\COST\4_2024-08-15.md'
Converted 'data\edgar_documents\COST\4_2024-08-29' --> 'data\processed_data\COST\4_2024-08-29.md'


2025-11-14 16:07:34,064 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:34,084 - INFO - Going to convert document batch...
2025-11-14 16:07:34,086 - INFO - Processing document 4_2024-09-26
2025-11-14 16:07:34,125 - INFO - Finished converting document 4_2024-09-26 in 0.08 sec.
2025-11-14 16:07:34,191 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:34,207 - INFO - Going to convert document batch...
2025-11-14 16:07:34,208 - INFO - Processing document 4_2024-10-02


Converted 'data\edgar_documents\COST\4_2024-09-18' --> 'data\processed_data\COST\4_2024-09-18.md'
Converted 'data\edgar_documents\COST\4_2024-09-26' --> 'data\processed_data\COST\4_2024-09-26.md'


2025-11-14 16:07:34,245 - INFO - Finished converting document 4_2024-10-02 in 0.09 sec.
2025-11-14 16:07:34,294 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:34,309 - INFO - Going to convert document batch...
2025-11-14 16:07:34,310 - INFO - Processing document 4_2024-10-15
2025-11-14 16:07:34,343 - INFO - Finished converting document 4_2024-10-15 in 0.06 sec.
2025-11-14 16:07:34,391 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:34,421 - INFO - Going to convert document batch...
2025-11-14 16:07:34,423 - INFO - Processing document 4_2024-10-24


Converted 'data\edgar_documents\COST\4_2024-10-02' --> 'data\processed_data\COST\4_2024-10-02.md'
Converted 'data\edgar_documents\COST\4_2024-10-15' --> 'data\processed_data\COST\4_2024-10-15.md'


2025-11-14 16:07:34,478 - INFO - Finished converting document 4_2024-10-24 in 0.09 sec.
2025-11-14 16:07:34,552 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:34,576 - INFO - Going to convert document batch...
2025-11-14 16:07:34,579 - INFO - Processing document 4_2024-12-18
2025-11-14 16:07:34,618 - INFO - Finished converting document 4_2024-12-18 in 0.09 sec.
2025-11-14 16:07:34,685 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:34,704 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\COST\4_2024-10-24' --> 'data\processed_data\COST\4_2024-10-24.md'
Converted 'data\edgar_documents\COST\4_2024-12-18' --> 'data\processed_data\COST\4_2024-12-18.md'


2025-11-14 16:07:34,705 - INFO - Processing document 4_2024-12-23
2025-11-14 16:07:34,773 - INFO - Finished converting document 4_2024-12-23 in 0.11 sec.
2025-11-14 16:07:34,829 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:34,856 - INFO - Going to convert document batch...
2025-11-14 16:07:34,858 - INFO - Processing document 4_2025-03-13
2025-11-14 16:07:34,944 - INFO - Finished converting document 4_2025-03-13 in 0.12 sec.


Converted 'data\edgar_documents\COST\4_2024-12-23' --> 'data\processed_data\COST\4_2024-12-23.md'
Converted 'data\edgar_documents\COST\4_2025-03-13' --> 'data\processed_data\COST\4_2025-03-13.md'


2025-11-14 16:07:35,026 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:35,065 - INFO - Going to convert document batch...
2025-11-14 16:07:35,069 - INFO - Processing document 4_2025-03-20
2025-11-14 16:07:35,129 - INFO - Finished converting document 4_2025-03-20 in 0.12 sec.
2025-11-14 16:07:35,207 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:35,233 - INFO - Going to convert document batch...
2025-11-14 16:07:35,235 - INFO - Processing document 4_2025-03-25
2025-11-14 16:07:35,300 - INFO - Finished converting document 4_2025-03-25 in 0.11 sec.
2025-11-14 16:07:35,377 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\4_2025-03-20' --> 'data\processed_data\COST\4_2025-03-20.md'
Converted 'data\edgar_documents\COST\4_2025-03-25' --> 'data\processed_data\COST\4_2025-03-25.md'


2025-11-14 16:07:35,404 - INFO - Going to convert document batch...
2025-11-14 16:07:35,406 - INFO - Processing document 4_2025-03-27
2025-11-14 16:07:35,453 - INFO - Finished converting document 4_2025-03-27 in 0.11 sec.
2025-11-14 16:07:35,506 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:35,525 - INFO - Going to convert document batch...
2025-11-14 16:07:35,526 - INFO - Processing document 4_2025-04-21
2025-11-14 16:07:35,562 - INFO - Finished converting document 4_2025-04-21 in 0.08 sec.
2025-11-14 16:07:35,624 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:35,646 - INFO - Going to convert document batch...
2025-11-14 16:07:35,649 - INFO - Processing document 4_2025-06-09
2025-11-14 16:07:35,709 - INFO - Finished converting document 4_2025-06-09 in 0.11 sec.


Converted 'data\edgar_documents\COST\4_2025-03-27' --> 'data\processed_data\COST\4_2025-03-27.md'
Converted 'data\edgar_documents\COST\4_2025-04-21' --> 'data\processed_data\COST\4_2025-04-21.md'


2025-11-14 16:07:35,796 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:35,822 - INFO - Going to convert document batch...
2025-11-14 16:07:35,824 - INFO - Processing document 4_2025-06-10
2025-11-14 16:07:35,861 - INFO - Finished converting document 4_2025-06-10 in 0.08 sec.
2025-11-14 16:07:35,926 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:35,947 - INFO - Going to convert document batch...
2025-11-14 16:07:35,948 - INFO - Processing document 4_2025-06-20


Converted 'data\edgar_documents\COST\4_2025-06-09' --> 'data\processed_data\COST\4_2025-06-09.md'
Converted 'data\edgar_documents\COST\4_2025-06-10' --> 'data\processed_data\COST\4_2025-06-10.md'


2025-11-14 16:07:36,041 - INFO - Finished converting document 4_2025-06-20 in 0.14 sec.
2025-11-14 16:07:36,096 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:36,125 - INFO - Going to convert document batch...
2025-11-14 16:07:36,126 - INFO - Processing document 4_2025-07-15
2025-11-14 16:07:36,184 - INFO - Finished converting document 4_2025-07-15 in 0.11 sec.
2025-11-14 16:07:36,263 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\4_2025-06-20' --> 'data\processed_data\COST\4_2025-06-20.md'
Converted 'data\edgar_documents\COST\4_2025-07-15' --> 'data\processed_data\COST\4_2025-07-15.md'


2025-11-14 16:07:36,310 - INFO - Going to convert document batch...
2025-11-14 16:07:36,311 - INFO - Processing document 4_2025-08-22
2025-11-14 16:07:36,361 - INFO - Finished converting document 4_2025-08-22 in 0.11 sec.
2025-11-14 16:07:36,440 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:36,455 - INFO - Going to convert document batch...
2025-11-14 16:07:36,457 - INFO - Processing document 4_2025-09-04
2025-11-14 16:07:36,491 - INFO - Finished converting document 4_2025-09-04 in 0.06 sec.
2025-11-14 16:07:36,546 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:36,576 - INFO - Going to convert document batch...
2025-11-14 16:07:36,578 - INFO - Processing document 4_2025-09-12
2025-11-14 16:07:36,616 - INFO - Finished converting document 4_2025-09-12 in 0.08 sec.


Converted 'data\edgar_documents\COST\4_2025-08-22' --> 'data\processed_data\COST\4_2025-08-22.md'
Converted 'data\edgar_documents\COST\4_2025-09-04' --> 'data\processed_data\COST\4_2025-09-04.md'


2025-11-14 16:07:36,699 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:36,729 - INFO - Going to convert document batch...
2025-11-14 16:07:36,732 - INFO - Processing document 4_2025-09-24
2025-11-14 16:07:36,784 - INFO - Finished converting document 4_2025-09-24 in 0.09 sec.


Converted 'data\edgar_documents\COST\4_2025-09-12' --> 'data\processed_data\COST\4_2025-09-12.md'
Converted 'data\edgar_documents\COST\4_2025-09-24' --> 'data\processed_data\COST\4_2025-09-24.md'


2025-11-14 16:07:36,857 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:36,882 - INFO - Going to convert document batch...
2025-11-14 16:07:36,884 - INFO - Processing document 4_2025-09-30
2025-11-14 16:07:36,944 - INFO - Finished converting document 4_2025-09-30 in 0.11 sec.
2025-11-14 16:07:36,998 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\4_2025-09-30' --> 'data\processed_data\COST\4_2025-09-30.md'


2025-11-14 16:07:37,754 - INFO - Going to convert document batch...
2025-11-14 16:07:37,756 - INFO - Processing document 4_2025-10-01
2025-11-14 16:07:37,803 - INFO - Finished converting document 4_2025-10-01 in 0.81 sec.
2025-11-14 16:07:37,956 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:37,977 - INFO - Going to convert document batch...
2025-11-14 16:07:37,978 - INFO - Processing document 4_2025-10-24
2025-11-14 16:07:38,014 - INFO - Finished converting document 4_2025-10-24 in 0.08 sec.
2025-11-14 16:07:38,111 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\4_2025-10-01' --> 'data\processed_data\COST\4_2025-10-01.md'
Converted 'data\edgar_documents\COST\4_2025-10-24' --> 'data\processed_data\COST\4_2025-10-24.md'


2025-11-14 16:07:38,149 - INFO - Going to convert document batch...
2025-11-14 16:07:38,151 - INFO - Processing document 8-K_2023-01-19
2025-11-14 16:07:38,210 - INFO - Finished converting document 8-K_2023-01-19 in 0.12 sec.
2025-11-14 16:07:38,264 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:38,316 - INFO - Going to convert document batch...
2025-11-14 16:07:38,317 - INFO - Processing document 8-K_2023-01-25
2025-11-14 16:07:38,384 - INFO - Finished converting document 8-K_2023-01-25 in 0.14 sec.


Converted 'data\edgar_documents\COST\8-K_2023-01-19' --> 'data\processed_data\COST\8-K_2023-01-19.md'


2025-11-14 16:07:38,464 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:38,496 - INFO - Going to convert document batch...
2025-11-14 16:07:38,498 - INFO - Processing document 8-K_2023-03-03
2025-11-14 16:07:38,535 - INFO - Finished converting document 8-K_2023-03-03 in 0.11 sec.
2025-11-14 16:07:38,568 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:38,591 - INFO - Going to convert document batch...
2025-11-14 16:07:38,592 - INFO - Processing document 8-K_2023-04-19


Converted 'data\edgar_documents\COST\8-K_2023-01-25' --> 'data\processed_data\COST\8-K_2023-01-25.md'
Converted 'data\edgar_documents\COST\8-K_2023-03-03' --> 'data\processed_data\COST\8-K_2023-03-03.md'


2025-11-14 16:07:38,634 - INFO - Finished converting document 8-K_2023-04-19 in 0.08 sec.
2025-11-14 16:07:38,681 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:38,731 - INFO - Going to convert document batch...
2025-11-14 16:07:38,733 - INFO - Processing document 8-K_2023-05-25
2025-11-14 16:07:38,772 - INFO - Finished converting document 8-K_2023-05-25 in 0.11 sec.
2025-11-14 16:07:38,835 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\8-K_2023-04-19' --> 'data\processed_data\COST\8-K_2023-04-19.md'
Converted 'data\edgar_documents\COST\8-K_2023-05-25' --> 'data\processed_data\COST\8-K_2023-05-25.md'


2025-11-14 16:07:38,883 - INFO - Going to convert document batch...
2025-11-14 16:07:38,885 - INFO - Processing document 8-K_2023-08-10
2025-11-14 16:07:38,962 - INFO - Finished converting document 8-K_2023-08-10 in 0.16 sec.
2025-11-14 16:07:39,028 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:39,064 - INFO - Going to convert document batch...
2025-11-14 16:07:39,065 - INFO - Processing document 8-K_2023-08-17
2025-11-14 16:07:39,101 - INFO - Finished converting document 8-K_2023-08-17 in 0.09 sec.
2025-11-14 16:07:39,159 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\8-K_2023-08-10' --> 'data\processed_data\COST\8-K_2023-08-10.md'
Converted 'data\edgar_documents\COST\8-K_2023-08-17' --> 'data\processed_data\COST\8-K_2023-08-17.md'


2025-11-14 16:07:39,200 - INFO - Going to convert document batch...
2025-11-14 16:07:39,205 - INFO - Processing document 8-K_2023-09-26
2025-11-14 16:07:39,265 - INFO - Finished converting document 8-K_2023-09-26 in 0.14 sec.
2025-11-14 16:07:39,314 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:39,335 - INFO - Going to convert document batch...
2025-11-14 16:07:39,337 - INFO - Processing document 8-K_2023-10-20
2025-11-14 16:07:39,365 - INFO - Finished converting document 8-K_2023-10-20 in 0.08 sec.
2025-11-14 16:07:39,407 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:39,428 - INFO - Going to convert document batch...
2025-11-14 16:07:39,430 - INFO - Processing document 8-K_2023-11-24
2025-11-14 16:07:39,459 - INFO - Finished converting document 8-K_2023-11-24 in 0.08 sec.


Converted 'data\edgar_documents\COST\8-K_2023-09-26' --> 'data\processed_data\COST\8-K_2023-09-26.md'
Converted 'data\edgar_documents\COST\8-K_2023-10-20' --> 'data\processed_data\COST\8-K_2023-10-20.md'


2025-11-14 16:07:39,498 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:39,543 - INFO - Going to convert document batch...
2025-11-14 16:07:39,545 - INFO - Processing document 8-K_2023-12-14
2025-11-14 16:07:39,582 - INFO - Finished converting document 8-K_2023-12-14 in 0.11 sec.
2025-11-14 16:07:39,613 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:39,647 - INFO - Going to convert document batch...
2025-11-14 16:07:39,648 - INFO - Processing document 8-K_2024-01-22


Converted 'data\edgar_documents\COST\8-K_2023-11-24' --> 'data\processed_data\COST\8-K_2023-11-24.md'
Converted 'data\edgar_documents\COST\8-K_2023-12-14' --> 'data\processed_data\COST\8-K_2023-12-14.md'


2025-11-14 16:07:39,675 - INFO - Finished converting document 8-K_2024-01-22 in 0.08 sec.
2025-11-14 16:07:39,712 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:39,734 - INFO - Going to convert document batch...
2025-11-14 16:07:39,735 - INFO - Processing document 8-K_2024-02-09
2025-11-14 16:07:39,784 - INFO - Finished converting document 8-K_2024-02-09 in 0.09 sec.
2025-11-14 16:07:39,836 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:39,857 - INFO - Going to convert document batch...
2025-11-14 16:07:39,859 - INFO - Processing document 8-K_2024-03-07


Converted 'data\edgar_documents\COST\8-K_2024-01-22' --> 'data\processed_data\COST\8-K_2024-01-22.md'
Converted 'data\edgar_documents\COST\8-K_2024-02-09' --> 'data\processed_data\COST\8-K_2024-02-09.md'


2025-11-14 16:07:39,898 - INFO - Finished converting document 8-K_2024-03-07 in 0.09 sec.
2025-11-14 16:07:39,948 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:39,964 - INFO - Going to convert document batch...
2025-11-14 16:07:39,966 - INFO - Processing document 8-K_2024-04-10
2025-11-14 16:07:39,992 - INFO - Finished converting document 8-K_2024-04-10 in 0.05 sec.
2025-11-14 16:07:40,050 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:40,081 - INFO - Going to convert document batch...
2025-11-14 16:07:40,083 - INFO - Processing document 8-K_2024-05-30
2025-11-14 16:07:40,116 - INFO - Finished converting document 8-K_2024-05-30 in 0.09 sec.


Converted 'data\edgar_documents\COST\8-K_2024-03-07' --> 'data\processed_data\COST\8-K_2024-03-07.md'
Converted 'data\edgar_documents\COST\8-K_2024-04-10' --> 'data\processed_data\COST\8-K_2024-04-10.md'
Converted 'data\edgar_documents\COST\8-K_2024-05-30' --> 'data\processed_data\COST\8-K_2024-05-30.md'


2025-11-14 16:07:40,165 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:40,187 - INFO - Going to convert document batch...
2025-11-14 16:07:40,189 - INFO - Processing document 8-K_2024-07-10
2025-11-14 16:07:40,219 - INFO - Finished converting document 8-K_2024-07-10 in 0.09 sec.
2025-11-14 16:07:40,280 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:40,307 - INFO - Going to convert document batch...
2025-11-14 16:07:40,309 - INFO - Processing document 8-K_2024-09-20
2025-11-14 16:07:40,352 - INFO - Finished converting document 8-K_2024-09-20 in 0.09 sec.
2025-11-14 16:07:40,406 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\8-K_2024-07-10' --> 'data\processed_data\COST\8-K_2024-07-10.md'
Converted 'data\edgar_documents\COST\8-K_2024-09-20' --> 'data\processed_data\COST\8-K_2024-09-20.md'


2025-11-14 16:07:40,432 - INFO - Going to convert document batch...
2025-11-14 16:07:40,436 - INFO - Processing document 8-K_2024-09-26
2025-11-14 16:07:40,482 - INFO - Finished converting document 8-K_2024-09-26 in 0.11 sec.
2025-11-14 16:07:40,516 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:40,532 - INFO - Going to convert document batch...
2025-11-14 16:07:40,533 - INFO - Processing document 8-K_2024-10-17
2025-11-14 16:07:40,561 - INFO - Finished converting document 8-K_2024-10-17 in 0.06 sec.
2025-11-14 16:07:40,598 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:40,614 - INFO - Going to convert document batch...
2025-11-14 16:07:40,616 - INFO - Processing document 8-K_2024-11-07
2025-11-14 16:07:40,677 - INFO - Finished converting document 8-K_2024-11-07 in 0.09 sec.


Converted 'data\edgar_documents\COST\8-K_2024-09-26' --> 'data\processed_data\COST\8-K_2024-09-26.md'
Converted 'data\edgar_documents\COST\8-K_2024-10-17' --> 'data\processed_data\COST\8-K_2024-10-17.md'
Converted 'data\edgar_documents\COST\8-K_2024-11-07' --> 'data\processed_data\COST\8-K_2024-11-07.md'


2025-11-14 16:07:40,725 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:40,766 - INFO - Going to convert document batch...
2025-11-14 16:07:40,770 - INFO - Processing document 8-K_2024-12-12
2025-11-14 16:07:40,895 - INFO - Finished converting document 8-K_2024-12-12 in 0.20 sec.
2025-11-14 16:07:40,957 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:41,007 - INFO - Going to convert document batch...
2025-11-14 16:07:41,009 - INFO - Processing document 8-K_2025-01-27
2025-11-14 16:07:41,096 - INFO - Finished converting document 8-K_2025-01-27 in 0.17 sec.


Converted 'data\edgar_documents\COST\8-K_2024-12-12' --> 'data\processed_data\COST\8-K_2024-12-12.md'
Converted 'data\edgar_documents\COST\8-K_2025-01-27' --> 'data\processed_data\COST\8-K_2025-01-27.md'


2025-11-14 16:07:41,168 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:41,183 - INFO - Going to convert document batch...
2025-11-14 16:07:41,184 - INFO - Processing document 8-K_2025-02-03
2025-11-14 16:07:41,232 - INFO - Finished converting document 8-K_2025-02-03 in 0.09 sec.
2025-11-14 16:07:41,289 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:41,310 - INFO - Going to convert document batch...
2025-11-14 16:07:41,312 - INFO - Processing document 8-K_2025-03-06
2025-11-14 16:07:41,360 - INFO - Finished converting document 8-K_2025-03-06 in 0.09 sec.
2025-11-14 16:07:41,419 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\8-K_2025-02-03' --> 'data\processed_data\COST\8-K_2025-02-03.md'
Converted 'data\edgar_documents\COST\8-K_2025-03-06' --> 'data\processed_data\COST\8-K_2025-03-06.md'


2025-11-14 16:07:41,449 - INFO - Going to convert document batch...
2025-11-14 16:07:41,452 - INFO - Processing document 8-K_2025-04-16
2025-11-14 16:07:41,482 - INFO - Finished converting document 8-K_2025-04-16 in 0.09 sec.
2025-11-14 16:07:41,513 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:41,529 - INFO - Going to convert document batch...
2025-11-14 16:07:41,530 - INFO - Processing document 8-K_2025-05-29
2025-11-14 16:07:41,561 - INFO - Finished converting document 8-K_2025-05-29 in 0.06 sec.
2025-11-14 16:07:41,598 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:41,618 - INFO - Going to convert document batch...
2025-11-14 16:07:41,619 - INFO - Processing document 8-K_2025-06-11
2025-11-14 16:07:41,671 - INFO - Finished converting document 8-K_2025-06-11 in 0.09 sec.


Converted 'data\edgar_documents\COST\8-K_2025-04-16' --> 'data\processed_data\COST\8-K_2025-04-16.md'
Converted 'data\edgar_documents\COST\8-K_2025-05-29' --> 'data\processed_data\COST\8-K_2025-05-29.md'
Converted 'data\edgar_documents\COST\8-K_2025-06-11' --> 'data\processed_data\COST\8-K_2025-06-11.md'


2025-11-14 16:07:41,735 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:41,765 - INFO - Going to convert document batch...
2025-11-14 16:07:41,767 - INFO - Processing document 8-K_2025-07-16
2025-11-14 16:07:41,798 - INFO - Finished converting document 8-K_2025-07-16 in 0.09 sec.
2025-11-14 16:07:41,832 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:41,859 - INFO - Going to convert document batch...
2025-11-14 16:07:41,861 - INFO - Processing document 8-K_2025-08-07
2025-11-14 16:07:41,905 - INFO - Finished converting document 8-K_2025-08-07 in 0.09 sec.
2025-11-14 16:07:41,959 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:41,980 - INFO - Going to convert document batch...
2025-11-14 16:07:41,982 - INFO - Processing document 8-K_2025-09-25


Converted 'data\edgar_documents\COST\8-K_2025-07-16' --> 'data\processed_data\COST\8-K_2025-07-16.md'
Converted 'data\edgar_documents\COST\8-K_2025-08-07' --> 'data\processed_data\COST\8-K_2025-08-07.md'


2025-11-14 16:07:42,033 - INFO - Finished converting document 8-K_2025-09-25 in 0.09 sec.
2025-11-14 16:07:42,072 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:42,087 - INFO - Going to convert document batch...
2025-11-14 16:07:42,089 - INFO - Processing document 8-K_2025-10-15
2025-11-14 16:07:42,117 - INFO - Finished converting document 8-K_2025-10-15 in 0.06 sec.
2025-11-14 16:07:42,152 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:42,169 - INFO - Going to convert document batch...
2025-11-14 16:07:42,171 - INFO - Processing document 8-K_2025-10-20
2025-11-14 16:07:42,200 - INFO - Finished converting document 8-K_2025-10-20 in 0.06 sec.


Converted 'data\edgar_documents\COST\8-K_2025-09-25' --> 'data\processed_data\COST\8-K_2025-09-25.md'
Converted 'data\edgar_documents\COST\8-K_2025-10-15' --> 'data\processed_data\COST\8-K_2025-10-15.md'
Converted 'data\edgar_documents\COST\8-K_2025-10-20' --> 'data\processed_data\COST\8-K_2025-10-20.md'


2025-11-14 16:07:42,274 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:07:42,610 - INFO - Going to convert document batch...
2025-11-14 16:07:42,611 - INFO - Processing document DEF-14A_2023-12-07
2025-11-14 16:07:43,360 - INFO - Finished converting document DEF-14A_2023-12-07 in 1.14 sec.
2025-11-14 16:07:43,723 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\DEF-14A_2023-12-07' --> 'data\processed_data\COST\DEF-14A_2023-12-07.md'


2025-11-14 16:07:44,106 - INFO - Going to convert document batch...
2025-11-14 16:07:44,108 - INFO - Processing document DEF-14A_2024-12-11
2025-11-14 16:07:44,705 - INFO - Finished converting document DEF-14A_2024-12-11 in 1.02 sec.
2025-11-14 16:07:45,136 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\COST\DEF-14A_2024-12-11' --> 'data\processed_data\COST\DEF-14A_2024-12-11.md'
Processed 104 new files. Errors: 0
Found 511 files to process in data\edgar_documents\CRM


2025-11-14 16:07:47,260 - INFO - Going to convert document batch...
2025-11-14 16:07:47,262 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:07:47,264 - INFO - Processing document 10-K_2023-03-08
2025-11-14 16:07:50,017 - INFO - Finished converting document 10-K_2023-03-08 in 4.98 sec.
2025-11-14 16:07:51,384 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\10-K_2023-03-08' --> 'data\processed_data\CRM\10-K_2023-03-08.md'


2025-11-14 16:07:53,370 - INFO - Going to convert document batch...
2025-11-14 16:07:53,372 - INFO - Processing document 10-K_2024-03-06
2025-11-14 16:07:56,385 - INFO - Finished converting document 10-K_2024-03-06 in 5.06 sec.
2025-11-14 16:07:57,865 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\10-K_2024-03-06' --> 'data\processed_data\CRM\10-K_2024-03-06.md'


2025-11-14 16:07:59,177 - INFO - Going to convert document batch...
2025-11-14 16:07:59,178 - INFO - Processing document 10-K_2025-03-05
2025-11-14 16:08:00,341 - INFO - Finished converting document 10-K_2025-03-05 in 2.53 sec.
2025-11-14 16:08:00,854 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\10-K_2025-03-05' --> 'data\processed_data\CRM\10-K_2025-03-05.md'


2025-11-14 16:08:01,220 - INFO - Going to convert document batch...
2025-11-14 16:08:01,221 - INFO - Processing document 10-Q_2023-06-01
2025-11-14 16:08:01,932 - INFO - Finished converting document 10-Q_2023-06-01 in 1.11 sec.
2025-11-14 16:08:02,679 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\10-Q_2023-06-01' --> 'data\processed_data\CRM\10-Q_2023-06-01.md'


2025-11-14 16:08:03,105 - INFO - Going to convert document batch...
2025-11-14 16:08:03,106 - INFO - Processing document 10-Q_2023-08-31
2025-11-14 16:08:03,930 - INFO - Finished converting document 10-Q_2023-08-31 in 1.28 sec.
2025-11-14 16:08:04,444 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\10-Q_2023-08-31' --> 'data\processed_data\CRM\10-Q_2023-08-31.md'


2025-11-14 16:08:05,154 - INFO - Going to convert document batch...
2025-11-14 16:08:05,155 - INFO - Processing document 10-Q_2023-11-30
2025-11-14 16:08:06,128 - INFO - Finished converting document 10-Q_2023-11-30 in 1.72 sec.
2025-11-14 16:08:06,642 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\10-Q_2023-11-30' --> 'data\processed_data\CRM\10-Q_2023-11-30.md'


2025-11-14 16:08:07,399 - INFO - Going to convert document batch...
2025-11-14 16:08:07,400 - INFO - Processing document 10-Q_2024-05-30
2025-11-14 16:08:08,233 - INFO - Finished converting document 10-Q_2024-05-30 in 1.62 sec.
2025-11-14 16:08:08,726 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\10-Q_2024-05-30' --> 'data\processed_data\CRM\10-Q_2024-05-30.md'


2025-11-14 16:08:09,296 - INFO - Going to convert document batch...
2025-11-14 16:08:09,298 - INFO - Processing document 10-Q_2024-08-29
2025-11-14 16:08:10,440 - INFO - Finished converting document 10-Q_2024-08-29 in 1.75 sec.
2025-11-14 16:08:11,029 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\10-Q_2024-08-29' --> 'data\processed_data\CRM\10-Q_2024-08-29.md'


2025-11-14 16:08:11,828 - INFO - Going to convert document batch...
2025-11-14 16:08:11,829 - INFO - Processing document 10-Q_2024-12-04
2025-11-14 16:08:12,817 - INFO - Finished converting document 10-Q_2024-12-04 in 1.83 sec.
2025-11-14 16:08:13,317 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\10-Q_2024-12-04' --> 'data\processed_data\CRM\10-Q_2024-12-04.md'


2025-11-14 16:08:14,003 - INFO - Going to convert document batch...
2025-11-14 16:08:14,004 - INFO - Processing document 10-Q_2025-05-29
2025-11-14 16:08:14,690 - INFO - Finished converting document 10-Q_2025-05-29 in 1.41 sec.
2025-11-14 16:08:15,769 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\10-Q_2025-05-29' --> 'data\processed_data\CRM\10-Q_2025-05-29.md'


2025-11-14 16:08:16,905 - INFO - Going to convert document batch...
2025-11-14 16:08:16,906 - INFO - Processing document 10-Q_2025-09-04
2025-11-14 16:08:19,765 - INFO - Finished converting document 10-Q_2025-09-04 in 4.06 sec.
2025-11-14 16:08:21,152 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:21,282 - INFO - Going to convert document batch...
2025-11-14 16:08:21,286 - INFO - Processing document 4_2023-01-04
2025-11-14 16:08:21,368 - INFO - Finished converting document 4_2023-01-04 in 0.25 sec.


Converted 'data\edgar_documents\CRM\10-Q_2025-09-04' --> 'data\processed_data\CRM\10-Q_2025-09-04.md'


2025-11-14 16:08:21,441 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:21,464 - INFO - Going to convert document batch...
2025-11-14 16:08:21,465 - INFO - Processing document 4_2023-01-05
2025-11-14 16:08:21,524 - INFO - Finished converting document 4_2023-01-05 in 0.09 sec.
2025-11-14 16:08:21,592 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:21,620 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-01-04' --> 'data\processed_data\CRM\4_2023-01-04.md'
Converted 'data\edgar_documents\CRM\4_2023-01-05' --> 'data\processed_data\CRM\4_2023-01-05.md'


2025-11-14 16:08:21,621 - INFO - Processing document 4_2023-01-09
2025-11-14 16:08:21,684 - INFO - Finished converting document 4_2023-01-09 in 0.11 sec.
2025-11-14 16:08:21,757 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:21,783 - INFO - Going to convert document batch...
2025-11-14 16:08:21,784 - INFO - Processing document 4_2023-01-10
2025-11-14 16:08:21,848 - INFO - Finished converting document 4_2023-01-10 in 0.09 sec.


Converted 'data\edgar_documents\CRM\4_2023-01-09' --> 'data\processed_data\CRM\4_2023-01-09.md'
Converted 'data\edgar_documents\CRM\4_2023-01-10' --> 'data\processed_data\CRM\4_2023-01-10.md'


2025-11-14 16:08:21,939 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:21,965 - INFO - Going to convert document batch...
2025-11-14 16:08:21,967 - INFO - Processing document 4_2023-01-11
2025-11-14 16:08:22,016 - INFO - Finished converting document 4_2023-01-11 in 0.11 sec.
2025-11-14 16:08:22,077 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:22,101 - INFO - Going to convert document batch...
2025-11-14 16:08:22,102 - INFO - Processing document 4_2023-01-12
2025-11-14 16:08:22,153 - INFO - Finished converting document 4_2023-01-12 in 0.09 sec.
2025-11-14 16:08:22,228 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-01-11' --> 'data\processed_data\CRM\4_2023-01-11.md'
Converted 'data\edgar_documents\CRM\4_2023-01-12' --> 'data\processed_data\CRM\4_2023-01-12.md'


2025-11-14 16:08:22,276 - INFO - Going to convert document batch...
2025-11-14 16:08:22,278 - INFO - Processing document 4_2023-01-13
2025-11-14 16:08:22,346 - INFO - Finished converting document 4_2023-01-13 in 0.12 sec.
2025-11-14 16:08:22,412 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:22,435 - INFO - Going to convert document batch...
2025-11-14 16:08:22,435 - INFO - Processing document 4_2023-01-18
2025-11-14 16:08:22,494 - INFO - Finished converting document 4_2023-01-18 in 0.11 sec.
2025-11-14 16:08:22,564 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:22,586 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-01-13' --> 'data\processed_data\CRM\4_2023-01-13.md'
Converted 'data\edgar_documents\CRM\4_2023-01-18' --> 'data\processed_data\CRM\4_2023-01-18.md'


2025-11-14 16:08:22,588 - INFO - Processing document 4_2023-01-19
2025-11-14 16:08:22,647 - INFO - Finished converting document 4_2023-01-19 in 0.09 sec.
2025-11-14 16:08:22,710 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:22,745 - INFO - Going to convert document batch...
2025-11-14 16:08:22,747 - INFO - Processing document 4_2023-01-20
2025-11-14 16:08:22,844 - INFO - Finished converting document 4_2023-01-20 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2023-01-19' --> 'data\processed_data\CRM\4_2023-01-19.md'


2025-11-14 16:08:22,923 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:22,978 - INFO - Going to convert document batch...
2025-11-14 16:08:22,980 - INFO - Processing document 4_2023-01-23
2025-11-14 16:08:23,046 - INFO - Finished converting document 4_2023-01-23 in 0.14 sec.
2025-11-14 16:08:23,110 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-01-20' --> 'data\processed_data\CRM\4_2023-01-20.md'
Converted 'data\edgar_documents\CRM\4_2023-01-23' --> 'data\processed_data\CRM\4_2023-01-23.md'


2025-11-14 16:08:23,132 - INFO - Going to convert document batch...
2025-11-14 16:08:23,133 - INFO - Processing document 4_2023-01-24
2025-11-14 16:08:23,203 - INFO - Finished converting document 4_2023-01-24 in 0.12 sec.
2025-11-14 16:08:23,312 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:23,346 - INFO - Going to convert document batch...
2025-11-14 16:08:23,346 - INFO - Processing document 4_2023-01-25
2025-11-14 16:08:23,407 - INFO - Finished converting document 4_2023-01-25 in 0.11 sec.
2025-11-14 16:08:23,464 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-01-24' --> 'data\processed_data\CRM\4_2023-01-24.md'
Converted 'data\edgar_documents\CRM\4_2023-01-25' --> 'data\processed_data\CRM\4_2023-01-25.md'


2025-11-14 16:08:23,516 - INFO - Going to convert document batch...
2025-11-14 16:08:23,516 - INFO - Processing document 4_2023-01-27
2025-11-14 16:08:23,614 - INFO - Finished converting document 4_2023-01-27 in 0.16 sec.
2025-11-14 16:08:23,708 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:23,744 - INFO - Going to convert document batch...
2025-11-14 16:08:23,746 - INFO - Processing document 4_2023-01-30
2025-11-14 16:08:23,804 - INFO - Finished converting document 4_2023-01-30 in 0.11 sec.
2025-11-14 16:08:23,868 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:23,892 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-01-27' --> 'data\processed_data\CRM\4_2023-01-27.md'
Converted 'data\edgar_documents\CRM\4_2023-01-30' --> 'data\processed_data\CRM\4_2023-01-30.md'


2025-11-14 16:08:23,894 - INFO - Processing document 4_2023-01-31
2025-11-14 16:08:23,944 - INFO - Finished converting document 4_2023-01-31 in 0.09 sec.
2025-11-14 16:08:24,001 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:24,027 - INFO - Going to convert document batch...
2025-11-14 16:08:24,028 - INFO - Processing document 4_2023-02-01
2025-11-14 16:08:24,086 - INFO - Finished converting document 4_2023-02-01 in 0.09 sec.
2025-11-14 16:08:24,151 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-01-31' --> 'data\processed_data\CRM\4_2023-01-31.md'
Converted 'data\edgar_documents\CRM\4_2023-02-01' --> 'data\processed_data\CRM\4_2023-02-01.md'


2025-11-14 16:08:24,195 - INFO - Going to convert document batch...
2025-11-14 16:08:24,197 - INFO - Processing document 4_2023-02-02
2025-11-14 16:08:24,292 - INFO - Finished converting document 4_2023-02-02 in 0.17 sec.
2025-11-14 16:08:24,385 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:24,411 - INFO - Going to convert document batch...
2025-11-14 16:08:24,412 - INFO - Processing document 4_2023-02-03
2025-11-14 16:08:24,470 - INFO - Finished converting document 4_2023-02-03 in 0.09 sec.
2025-11-14 16:08:24,548 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-02-02' --> 'data\processed_data\CRM\4_2023-02-02.md'
Converted 'data\edgar_documents\CRM\4_2023-02-03' --> 'data\processed_data\CRM\4_2023-02-03.md'


2025-11-14 16:08:24,570 - INFO - Going to convert document batch...
2025-11-14 16:08:24,574 - INFO - Processing document 4_2023-02-06
2025-11-14 16:08:24,629 - INFO - Finished converting document 4_2023-02-06 in 0.11 sec.
2025-11-14 16:08:24,703 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:24,726 - INFO - Going to convert document batch...
2025-11-14 16:08:24,727 - INFO - Processing document 4_2023-02-07
2025-11-14 16:08:24,780 - INFO - Finished converting document 4_2023-02-07 in 0.11 sec.
2025-11-14 16:08:24,867 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-02-06' --> 'data\processed_data\CRM\4_2023-02-06.md'
Converted 'data\edgar_documents\CRM\4_2023-02-07' --> 'data\processed_data\CRM\4_2023-02-07.md'


2025-11-14 16:08:24,909 - INFO - Going to convert document batch...
2025-11-14 16:08:24,912 - INFO - Processing document 4_2023-02-08
2025-11-14 16:08:24,985 - INFO - Finished converting document 4_2023-02-08 in 0.14 sec.
2025-11-14 16:08:25,098 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:25,120 - INFO - Going to convert document batch...
2025-11-14 16:08:25,122 - INFO - Processing document 4_2023-02-09
2025-11-14 16:08:25,169 - INFO - Finished converting document 4_2023-02-09 in 0.09 sec.
2025-11-14 16:08:25,238 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:25,262 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-02-08' --> 'data\processed_data\CRM\4_2023-02-08.md'
Converted 'data\edgar_documents\CRM\4_2023-02-09' --> 'data\processed_data\CRM\4_2023-02-09.md'


2025-11-14 16:08:25,263 - INFO - Processing document 4_2023-02-10
2025-11-14 16:08:25,318 - INFO - Finished converting document 4_2023-02-10 in 0.09 sec.
2025-11-14 16:08:25,380 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:25,401 - INFO - Going to convert document batch...
2025-11-14 16:08:25,402 - INFO - Processing document 4_2023-02-13
2025-11-14 16:08:25,452 - INFO - Finished converting document 4_2023-02-13 in 0.09 sec.
2025-11-14 16:08:25,548 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-02-10' --> 'data\processed_data\CRM\4_2023-02-10.md'
Converted 'data\edgar_documents\CRM\4_2023-02-13' --> 'data\processed_data\CRM\4_2023-02-13.md'


2025-11-14 16:08:25,594 - INFO - Going to convert document batch...
2025-11-14 16:08:25,595 - INFO - Processing document 4_2023-02-14
2025-11-14 16:08:25,685 - INFO - Finished converting document 4_2023-02-14 in 0.16 sec.
2025-11-14 16:08:25,747 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:25,768 - INFO - Going to convert document batch...
2025-11-14 16:08:25,769 - INFO - Processing document 4_2023-02-15
2025-11-14 16:08:25,863 - INFO - Finished converting document 4_2023-02-15 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2023-02-14' --> 'data\processed_data\CRM\4_2023-02-14.md'


2025-11-14 16:08:25,987 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:26,037 - INFO - Going to convert document batch...
2025-11-14 16:08:26,039 - INFO - Processing document 4_2023-02-16
2025-11-14 16:08:26,133 - INFO - Finished converting document 4_2023-02-16 in 0.17 sec.


Converted 'data\edgar_documents\CRM\4_2023-02-15' --> 'data\processed_data\CRM\4_2023-02-15.md'


2025-11-14 16:08:26,198 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:26,213 - INFO - Going to convert document batch...
2025-11-14 16:08:26,214 - INFO - Processing document 4_2023-02-17
2025-11-14 16:08:26,251 - INFO - Finished converting document 4_2023-02-17 in 0.06 sec.
2025-11-14 16:08:26,302 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:26,325 - INFO - Going to convert document batch...
2025-11-14 16:08:26,326 - INFO - Processing document 4_2023-02-21
2025-11-14 16:08:26,381 - INFO - Finished converting document 4_2023-02-21 in 0.09 sec.


Converted 'data\edgar_documents\CRM\4_2023-02-16' --> 'data\processed_data\CRM\4_2023-02-16.md'
Converted 'data\edgar_documents\CRM\4_2023-02-17' --> 'data\processed_data\CRM\4_2023-02-17.md'


2025-11-14 16:08:26,455 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:26,501 - INFO - Going to convert document batch...
2025-11-14 16:08:26,502 - INFO - Processing document 4_2023-02-22
2025-11-14 16:08:26,577 - INFO - Finished converting document 4_2023-02-22 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-02-21' --> 'data\processed_data\CRM\4_2023-02-21.md'
Converted 'data\edgar_documents\CRM\4_2023-02-22' --> 'data\processed_data\CRM\4_2023-02-22.md'


2025-11-14 16:08:26,656 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:26,674 - INFO - Going to convert document batch...
2025-11-14 16:08:26,675 - INFO - Processing document 4_2023-02-23
2025-11-14 16:08:26,717 - INFO - Finished converting document 4_2023-02-23 in 0.09 sec.
2025-11-14 16:08:26,768 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:26,791 - INFO - Going to convert document batch...
2025-11-14 16:08:26,792 - INFO - Processing document 4_2023-02-24
2025-11-14 16:08:26,843 - INFO - Finished converting document 4_2023-02-24 in 0.09 sec.
2025-11-14 16:08:26,906 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:26,932 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-02-23' --> 'data\processed_data\CRM\4_2023-02-23.md'
Converted 'data\edgar_documents\CRM\4_2023-02-24' --> 'data\processed_data\CRM\4_2023-02-24.md'


2025-11-14 16:08:26,933 - INFO - Processing document 4_2023-02-27
2025-11-14 16:08:26,985 - INFO - Finished converting document 4_2023-02-27 in 0.09 sec.
2025-11-14 16:08:27,046 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:27,066 - INFO - Going to convert document batch...
2025-11-14 16:08:27,067 - INFO - Processing document 4_2023-02-28
2025-11-14 16:08:27,116 - INFO - Finished converting document 4_2023-02-28 in 0.08 sec.
2025-11-14 16:08:27,213 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-02-27' --> 'data\processed_data\CRM\4_2023-02-27.md'
Converted 'data\edgar_documents\CRM\4_2023-02-28' --> 'data\processed_data\CRM\4_2023-02-28.md'


2025-11-14 16:08:27,257 - INFO - Going to convert document batch...
2025-11-14 16:08:27,259 - INFO - Processing document 4_2023-03-01
2025-11-14 16:08:27,424 - INFO - Finished converting document 4_2023-03-01 in 0.25 sec.
2025-11-14 16:08:27,518 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:27,556 - INFO - Going to convert document batch...
2025-11-14 16:08:27,557 - INFO - Processing document 4_2023-03-02
2025-11-14 16:08:27,668 - INFO - Finished converting document 4_2023-03-02 in 0.17 sec.


Converted 'data\edgar_documents\CRM\4_2023-03-01' --> 'data\processed_data\CRM\4_2023-03-01.md'


2025-11-14 16:08:27,782 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:27,822 - INFO - Going to convert document batch...
2025-11-14 16:08:27,823 - INFO - Processing document 4_2023-03-03
2025-11-14 16:08:27,904 - INFO - Finished converting document 4_2023-03-03 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-03-02' --> 'data\processed_data\CRM\4_2023-03-02.md'


2025-11-14 16:08:28,021 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:28,070 - INFO - Going to convert document batch...
2025-11-14 16:08:28,072 - INFO - Processing document 4_2023-03-06
2025-11-14 16:08:28,173 - INFO - Finished converting document 4_2023-03-06 in 0.17 sec.


Converted 'data\edgar_documents\CRM\4_2023-03-03' --> 'data\processed_data\CRM\4_2023-03-03.md'


2025-11-14 16:08:28,292 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:28,337 - INFO - Going to convert document batch...
2025-11-14 16:08:28,339 - INFO - Processing document 4_2023-03-07
2025-11-14 16:08:28,409 - INFO - Finished converting document 4_2023-03-07 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-03-06' --> 'data\processed_data\CRM\4_2023-03-06.md'
Converted 'data\edgar_documents\CRM\4_2023-03-07' --> 'data\processed_data\CRM\4_2023-03-07.md'


2025-11-14 16:08:28,498 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:28,523 - INFO - Going to convert document batch...
2025-11-14 16:08:28,524 - INFO - Processing document 4_2023-03-08
2025-11-14 16:08:28,575 - INFO - Finished converting document 4_2023-03-08 in 0.11 sec.
2025-11-14 16:08:28,633 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:28,658 - INFO - Going to convert document batch...
2025-11-14 16:08:28,659 - INFO - Processing document 4_2023-03-09
2025-11-14 16:08:28,709 - INFO - Finished converting document 4_2023-03-09 in 0.08 sec.
2025-11-14 16:08:28,781 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:28,797 - INFO - Going to convert document batch...
2025-11-14 16:08:28,798 - INFO - Processing document 4_2023-03-10
2025-11-14 16:08:28,831 - INFO - Finished converting document 4_2023-03-10 in 0.08 sec.


Converted 'data\edgar_documents\CRM\4_2023-03-08' --> 'data\processed_data\CRM\4_2023-03-08.md'
Converted 'data\edgar_documents\CRM\4_2023-03-09' --> 'data\processed_data\CRM\4_2023-03-09.md'


2025-11-14 16:08:28,881 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:28,908 - INFO - Going to convert document batch...
2025-11-14 16:08:28,910 - INFO - Processing document 4_2023-03-13


Converted 'data\edgar_documents\CRM\4_2023-03-10' --> 'data\processed_data\CRM\4_2023-03-10.md'


2025-11-14 16:08:30,002 - INFO - Finished converting document 4_2023-03-13 in 1.14 sec.
2025-11-14 16:08:30,150 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:30,204 - INFO - Going to convert document batch...
2025-11-14 16:08:30,207 - INFO - Processing document 4_2023-03-14
2025-11-14 16:08:30,282 - INFO - Finished converting document 4_2023-03-14 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2023-03-13' --> 'data\processed_data\CRM\4_2023-03-13.md'


2025-11-14 16:08:30,399 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:30,439 - INFO - Going to convert document batch...
2025-11-14 16:08:30,441 - INFO - Processing document 4_2023-03-15
2025-11-14 16:08:30,539 - INFO - Finished converting document 4_2023-03-15 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2023-03-14' --> 'data\processed_data\CRM\4_2023-03-14.md'


2025-11-14 16:08:30,647 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:30,685 - INFO - Going to convert document batch...
2025-11-14 16:08:30,689 - INFO - Processing document 4_2023-03-16


Converted 'data\edgar_documents\CRM\4_2023-03-15' --> 'data\processed_data\CRM\4_2023-03-15.md'


2025-11-14 16:08:30,853 - INFO - Finished converting document 4_2023-03-16 in 0.22 sec.
2025-11-14 16:08:30,953 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:30,974 - INFO - Going to convert document batch...
2025-11-14 16:08:30,976 - INFO - Processing document 4_2023-03-17
2025-11-14 16:08:31,031 - INFO - Finished converting document 4_2023-03-17 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2023-03-16' --> 'data\processed_data\CRM\4_2023-03-16.md'
Converted 'data\edgar_documents\CRM\4_2023-03-17' --> 'data\processed_data\CRM\4_2023-03-17.md'


2025-11-14 16:08:31,139 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:31,170 - INFO - Going to convert document batch...
2025-11-14 16:08:31,172 - INFO - Processing document 4_2023-03-20
2025-11-14 16:08:31,223 - INFO - Finished converting document 4_2023-03-20 in 0.11 sec.
2025-11-14 16:08:31,330 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:31,365 - INFO - Going to convert document batch...
2025-11-14 16:08:31,366 - INFO - Processing document 4_2023-03-21
2025-11-14 16:08:31,430 - INFO - Finished converting document 4_2023-03-21 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2023-03-20' --> 'data\processed_data\CRM\4_2023-03-20.md'
Converted 'data\edgar_documents\CRM\4_2023-03-21' --> 'data\processed_data\CRM\4_2023-03-21.md'


2025-11-14 16:08:31,526 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:31,573 - INFO - Going to convert document batch...
2025-11-14 16:08:31,575 - INFO - Processing document 4_2023-03-22
2025-11-14 16:08:31,650 - INFO - Finished converting document 4_2023-03-22 in 0.14 sec.
2025-11-14 16:08:31,754 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:31,808 - INFO - Going to convert document batch...
2025-11-14 16:08:31,809 - INFO - Processing document 4_2023-03-23
2025-11-14 16:08:31,916 - INFO - Finished converting document 4_2023-03-23 in 0.19 sec.


Converted 'data\edgar_documents\CRM\4_2023-03-22' --> 'data\processed_data\CRM\4_2023-03-22.md'


2025-11-14 16:08:32,000 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:32,019 - INFO - Going to convert document batch...
2025-11-14 16:08:32,022 - INFO - Processing document 4_2023-03-24
2025-11-14 16:08:32,073 - INFO - Finished converting document 4_2023-03-24 in 0.09 sec.
2025-11-14 16:08:32,164 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:32,188 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-03-23' --> 'data\processed_data\CRM\4_2023-03-23.md'
Converted 'data\edgar_documents\CRM\4_2023-03-24' --> 'data\processed_data\CRM\4_2023-03-24.md'


2025-11-14 16:08:32,189 - INFO - Processing document 4_2023-03-27
2025-11-14 16:08:32,256 - INFO - Finished converting document 4_2023-03-27 in 0.11 sec.
2025-11-14 16:08:32,327 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:32,350 - INFO - Going to convert document batch...
2025-11-14 16:08:32,351 - INFO - Processing document 4_2023-03-28
2025-11-14 16:08:32,430 - INFO - Finished converting document 4_2023-03-28 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2023-03-27' --> 'data\processed_data\CRM\4_2023-03-27.md'


2025-11-14 16:08:32,562 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:32,605 - INFO - Going to convert document batch...
2025-11-14 16:08:32,608 - INFO - Processing document 4_2023-03-29
2025-11-14 16:08:32,679 - INFO - Finished converting document 4_2023-03-29 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-03-28' --> 'data\processed_data\CRM\4_2023-03-28.md'


2025-11-14 16:08:32,814 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:32,859 - INFO - Going to convert document batch...
2025-11-14 16:08:32,861 - INFO - Processing document 4_2023-03-30
2025-11-14 16:08:32,985 - INFO - Finished converting document 4_2023-03-30 in 0.20 sec.


Converted 'data\edgar_documents\CRM\4_2023-03-29' --> 'data\processed_data\CRM\4_2023-03-29.md'


2025-11-14 16:08:33,067 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:33,109 - INFO - Going to convert document batch...
2025-11-14 16:08:33,110 - INFO - Processing document 4_2023-04-03
2025-11-14 16:08:33,231 - INFO - Finished converting document 4_2023-04-03 in 0.19 sec.


Converted 'data\edgar_documents\CRM\4_2023-03-30' --> 'data\processed_data\CRM\4_2023-03-30.md'


2025-11-14 16:08:33,408 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:33,443 - INFO - Going to convert document batch...
2025-11-14 16:08:33,445 - INFO - Processing document 4_2023-04-05
2025-11-14 16:08:33,547 - INFO - Finished converting document 4_2023-04-05 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2023-04-03' --> 'data\processed_data\CRM\4_2023-04-03.md'


2025-11-14 16:08:33,691 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:33,712 - INFO - Going to convert document batch...
2025-11-14 16:08:33,713 - INFO - Processing document 4_2023-04-11
2025-11-14 16:08:33,764 - INFO - Finished converting document 4_2023-04-11 in 0.09 sec.
2025-11-14 16:08:33,835 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:33,863 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-04-05' --> 'data\processed_data\CRM\4_2023-04-05.md'
Converted 'data\edgar_documents\CRM\4_2023-04-11' --> 'data\processed_data\CRM\4_2023-04-11.md'


2025-11-14 16:08:33,865 - INFO - Processing document 4_2023-04-12
2025-11-14 16:08:33,928 - INFO - Finished converting document 4_2023-04-12 in 0.11 sec.
2025-11-14 16:08:34,008 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:34,031 - INFO - Going to convert document batch...
2025-11-14 16:08:34,033 - INFO - Processing document 4_2023-04-19
2025-11-14 16:08:34,097 - INFO - Finished converting document 4_2023-04-19 in 0.11 sec.
2025-11-14 16:08:34,191 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-04-12' --> 'data\processed_data\CRM\4_2023-04-12.md'
Converted 'data\edgar_documents\CRM\4_2023-04-19' --> 'data\processed_data\CRM\4_2023-04-19.md'


2025-11-14 16:08:34,214 - INFO - Going to convert document batch...
2025-11-14 16:08:34,215 - INFO - Processing document 4_2023-04-24
2025-11-14 16:08:34,280 - INFO - Finished converting document 4_2023-04-24 in 0.12 sec.
2025-11-14 16:08:34,375 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:34,409 - INFO - Going to convert document batch...
2025-11-14 16:08:34,410 - INFO - Processing document 4_2023-04-26
2025-11-14 16:08:34,464 - INFO - Finished converting document 4_2023-04-26 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2023-04-24' --> 'data\processed_data\CRM\4_2023-04-24.md'
Converted 'data\edgar_documents\CRM\4_2023-04-26' --> 'data\processed_data\CRM\4_2023-04-26.md'


2025-11-14 16:08:34,564 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:34,621 - INFO - Going to convert document batch...
2025-11-14 16:08:34,622 - INFO - Processing document 4_2023-05-03
2025-11-14 16:08:34,709 - INFO - Finished converting document 4_2023-05-03 in 0.17 sec.
2025-11-14 16:08:34,782 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:34,824 - INFO - Going to convert document batch...
2025-11-14 16:08:34,825 - INFO - Processing document 4_2023-05-10
2025-11-14 16:08:34,916 - INFO - Finished converting document 4_2023-05-10 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2023-05-03' --> 'data\processed_data\CRM\4_2023-05-03.md'


2025-11-14 16:08:35,019 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:35,060 - INFO - Going to convert document batch...
2025-11-14 16:08:35,062 - INFO - Processing document 4_2023-05-17
2025-11-14 16:08:35,144 - INFO - Finished converting document 4_2023-05-17 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-05-10' --> 'data\processed_data\CRM\4_2023-05-10.md'
Converted 'data\edgar_documents\CRM\4_2023-05-17' --> 'data\processed_data\CRM\4_2023-05-17.md'


2025-11-14 16:08:35,228 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:35,283 - INFO - Going to convert document batch...
2025-11-14 16:08:35,284 - INFO - Processing document 4_2023-05-23
2025-11-14 16:08:35,416 - INFO - Finished converting document 4_2023-05-23 in 0.20 sec.
2025-11-14 16:08:35,531 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:35,557 - INFO - Going to convert document batch...
2025-11-14 16:08:35,558 - INFO - Processing document 4_2023-05-24
2025-11-14 16:08:35,615 - INFO - Finished converting document 4_2023-05-24 in 0.09 sec.
2025-11-14 16:08:35,704 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-05-23' --> 'data\processed_data\CRM\4_2023-05-23.md'
Converted 'data\edgar_documents\CRM\4_2023-05-24' --> 'data\processed_data\CRM\4_2023-05-24.md'


2025-11-14 16:08:35,748 - INFO - Going to convert document batch...
2025-11-14 16:08:35,752 - INFO - Processing document 4_2023-05-31
2025-11-14 16:08:35,818 - INFO - Finished converting document 4_2023-05-31 in 0.14 sec.
2025-11-14 16:08:35,912 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:35,938 - INFO - Going to convert document batch...
2025-11-14 16:08:35,940 - INFO - Processing document 4_2023-06-01
2025-11-14 16:08:35,996 - INFO - Finished converting document 4_2023-06-01 in 0.11 sec.
2025-11-14 16:08:36,083 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-05-31' --> 'data\processed_data\CRM\4_2023-05-31.md'
Converted 'data\edgar_documents\CRM\4_2023-06-01' --> 'data\processed_data\CRM\4_2023-06-01.md'


2025-11-14 16:08:36,117 - INFO - Going to convert document batch...
2025-11-14 16:08:36,117 - INFO - Processing document 4_2023-06-06
2025-11-14 16:08:36,173 - INFO - Finished converting document 4_2023-06-06 in 0.12 sec.
2025-11-14 16:08:36,261 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:36,293 - INFO - Going to convert document batch...
2025-11-14 16:08:36,296 - INFO - Processing document 4_2023-06-07
2025-11-14 16:08:36,379 - INFO - Finished converting document 4_2023-06-07 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-06-06' --> 'data\processed_data\CRM\4_2023-06-06.md'


2025-11-14 16:08:36,495 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:36,536 - INFO - Going to convert document batch...
2025-11-14 16:08:36,537 - INFO - Processing document 4_2023-06-09
2025-11-14 16:08:36,589 - INFO - Finished converting document 4_2023-06-09 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2023-06-07' --> 'data\processed_data\CRM\4_2023-06-07.md'
Converted 'data\edgar_documents\CRM\4_2023-06-09' --> 'data\processed_data\CRM\4_2023-06-09.md'


2025-11-14 16:08:36,704 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:36,769 - INFO - Going to convert document batch...
2025-11-14 16:08:36,771 - INFO - Processing document 4_2023-06-14
2025-11-14 16:08:36,928 - INFO - Finished converting document 4_2023-06-14 in 0.25 sec.
2025-11-14 16:08:37,009 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:37,044 - INFO - Going to convert document batch...
2025-11-14 16:08:37,046 - INFO - Processing document 4_2023-06-16
2025-11-14 16:08:37,122 - INFO - Finished converting document 4_2023-06-16 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-06-14' --> 'data\processed_data\CRM\4_2023-06-14.md'


2025-11-14 16:08:37,245 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:37,300 - INFO - Going to convert document batch...
2025-11-14 16:08:37,302 - INFO - Processing document 4_2023-06-20
2025-11-14 16:08:37,376 - INFO - Finished converting document 4_2023-06-20 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-06-16' --> 'data\processed_data\CRM\4_2023-06-16.md'


2025-11-14 16:08:37,469 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:37,509 - INFO - Going to convert document batch...
2025-11-14 16:08:37,510 - INFO - Processing document 4_2023-06-21


Converted 'data\edgar_documents\CRM\4_2023-06-20' --> 'data\processed_data\CRM\4_2023-06-20.md'


2025-11-14 16:08:38,057 - INFO - Finished converting document 4_2023-06-21 in 0.62 sec.
2025-11-14 16:08:38,215 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:38,262 - INFO - Going to convert document batch...
2025-11-14 16:08:38,264 - INFO - Processing document 4_2023-06-23
2025-11-14 16:08:38,336 - INFO - Finished converting document 4_2023-06-23 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2023-06-21' --> 'data\processed_data\CRM\4_2023-06-21.md'


2025-11-14 16:08:38,408 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:38,427 - INFO - Going to convert document batch...
2025-11-14 16:08:38,429 - INFO - Processing document 4_2023-06-27
2025-11-14 16:08:38,472 - INFO - Finished converting document 4_2023-06-27 in 0.08 sec.
2025-11-14 16:08:38,553 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:38,578 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-06-23' --> 'data\processed_data\CRM\4_2023-06-23.md'
Converted 'data\edgar_documents\CRM\4_2023-06-27' --> 'data\processed_data\CRM\4_2023-06-27.md'


2025-11-14 16:08:38,579 - INFO - Processing document 4_2023-06-28
2025-11-14 16:08:38,644 - INFO - Finished converting document 4_2023-06-28 in 0.12 sec.
2025-11-14 16:08:38,744 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:38,764 - INFO - Going to convert document batch...
2025-11-14 16:08:38,766 - INFO - Processing document 4_2023-06-30
2025-11-14 16:08:38,809 - INFO - Finished converting document 4_2023-06-30 in 0.08 sec.
2025-11-14 16:08:38,907 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:38,956 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-06-28' --> 'data\processed_data\CRM\4_2023-06-28.md'
Converted 'data\edgar_documents\CRM\4_2023-06-30' --> 'data\processed_data\CRM\4_2023-06-30.md'


2025-11-14 16:08:38,957 - INFO - Processing document 4_2023-07-03
2025-11-14 16:08:39,036 - INFO - Finished converting document 4_2023-07-03 in 0.16 sec.
2025-11-14 16:08:39,144 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:39,166 - INFO - Going to convert document batch...
2025-11-14 16:08:39,167 - INFO - Processing document 4_2023-07-05
2025-11-14 16:08:39,216 - INFO - Finished converting document 4_2023-07-05 in 0.09 sec.
2025-11-14 16:08:39,304 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-07-03' --> 'data\processed_data\CRM\4_2023-07-03.md'
Converted 'data\edgar_documents\CRM\4_2023-07-05' --> 'data\processed_data\CRM\4_2023-07-05.md'


2025-11-14 16:08:39,343 - INFO - Going to convert document batch...
2025-11-14 16:08:39,346 - INFO - Processing document 4_2023-07-06
2025-11-14 16:08:39,423 - INFO - Finished converting document 4_2023-07-06 in 0.16 sec.
2025-11-14 16:08:39,499 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:39,543 - INFO - Going to convert document batch...
2025-11-14 16:08:39,544 - INFO - Processing document 4_2023-07-07
2025-11-14 16:08:39,608 - INFO - Finished converting document 4_2023-07-07 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2023-07-06' --> 'data\processed_data\CRM\4_2023-07-06.md'
Converted 'data\edgar_documents\CRM\4_2023-07-07' --> 'data\processed_data\CRM\4_2023-07-07.md'


2025-11-14 16:08:39,701 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:39,740 - INFO - Going to convert document batch...
2025-11-14 16:08:39,742 - INFO - Processing document 4_2023-07-10
2025-11-14 16:08:39,847 - INFO - Finished converting document 4_2023-07-10 in 0.17 sec.
2025-11-14 16:08:39,964 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:40,021 - INFO - Going to convert document batch...
2025-11-14 16:08:40,024 - INFO - Processing document 4_2023-07-11
2025-11-14 16:08:40,118 - INFO - Finished converting document 4_2023-07-11 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2023-07-10' --> 'data\processed_data\CRM\4_2023-07-10.md'


2025-11-14 16:08:40,192 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:40,227 - INFO - Going to convert document batch...
2025-11-14 16:08:40,228 - INFO - Processing document 4_2023-07-12
2025-11-14 16:08:40,278 - INFO - Finished converting document 4_2023-07-12 in 0.11 sec.
2025-11-14 16:08:40,348 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-07-11' --> 'data\processed_data\CRM\4_2023-07-11.md'
Converted 'data\edgar_documents\CRM\4_2023-07-12' --> 'data\processed_data\CRM\4_2023-07-12.md'


2025-11-14 16:08:40,394 - INFO - Going to convert document batch...
2025-11-14 16:08:40,396 - INFO - Processing document 4_2023-07-13
2025-11-14 16:08:40,477 - INFO - Finished converting document 4_2023-07-13 in 0.14 sec.
2025-11-14 16:08:40,598 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:40,647 - INFO - Going to convert document batch...
2025-11-14 16:08:40,649 - INFO - Processing document 4_2023-07-14
2025-11-14 16:08:40,742 - INFO - Finished converting document 4_2023-07-14 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2023-07-13' --> 'data\processed_data\CRM\4_2023-07-13.md'


2025-11-14 16:08:40,882 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:40,910 - INFO - Going to convert document batch...
2025-11-14 16:08:40,911 - INFO - Processing document 4_2023-07-17
2025-11-14 16:08:40,965 - INFO - Finished converting document 4_2023-07-17 in 0.12 sec.
2025-11-14 16:08:41,043 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-07-14' --> 'data\processed_data\CRM\4_2023-07-14.md'
Converted 'data\edgar_documents\CRM\4_2023-07-17' --> 'data\processed_data\CRM\4_2023-07-17.md'


2025-11-14 16:08:41,108 - INFO - Going to convert document batch...
2025-11-14 16:08:41,109 - INFO - Processing document 4_2023-07-18
2025-11-14 16:08:41,156 - INFO - Finished converting document 4_2023-07-18 in 0.14 sec.
2025-11-14 16:08:41,220 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:41,242 - INFO - Going to convert document batch...
2025-11-14 16:08:41,244 - INFO - Processing document 4_2023-07-19
2025-11-14 16:08:41,299 - INFO - Finished converting document 4_2023-07-19 in 0.09 sec.
2025-11-14 16:08:41,361 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:41,384 - INFO - Going to convert document batch...
2025-11-14 16:08:41,385 - INFO - Processing document 4_2023-07-20


Converted 'data\edgar_documents\CRM\4_2023-07-18' --> 'data\processed_data\CRM\4_2023-07-18.md'
Converted 'data\edgar_documents\CRM\4_2023-07-19' --> 'data\processed_data\CRM\4_2023-07-19.md'


2025-11-14 16:08:41,443 - INFO - Finished converting document 4_2023-07-20 in 0.09 sec.
2025-11-14 16:08:41,524 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:41,553 - INFO - Going to convert document batch...
2025-11-14 16:08:41,554 - INFO - Processing document 4_2023-07-21
2025-11-14 16:08:41,608 - INFO - Finished converting document 4_2023-07-21 in 0.11 sec.
2025-11-14 16:08:41,688 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-07-20' --> 'data\processed_data\CRM\4_2023-07-20.md'
Converted 'data\edgar_documents\CRM\4_2023-07-21' --> 'data\processed_data\CRM\4_2023-07-21.md'


2025-11-14 16:08:41,729 - INFO - Going to convert document batch...
2025-11-14 16:08:41,732 - INFO - Processing document 4_2023-07-24
2025-11-14 16:08:41,788 - INFO - Finished converting document 4_2023-07-24 in 0.12 sec.
2025-11-14 16:08:41,846 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:41,866 - INFO - Going to convert document batch...
2025-11-14 16:08:41,867 - INFO - Processing document 4_2023-07-25
2025-11-14 16:08:41,910 - INFO - Finished converting document 4_2023-07-25 in 0.08 sec.
2025-11-14 16:08:41,976 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:41,993 - INFO - Going to convert document batch...
2025-11-14 16:08:41,994 - INFO - Processing document 4_2023-07-26


Converted 'data\edgar_documents\CRM\4_2023-07-24' --> 'data\processed_data\CRM\4_2023-07-24.md'
Converted 'data\edgar_documents\CRM\4_2023-07-25' --> 'data\processed_data\CRM\4_2023-07-25.md'


2025-11-14 16:08:42,040 - INFO - Finished converting document 4_2023-07-26 in 0.06 sec.
2025-11-14 16:08:42,102 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:42,136 - INFO - Going to convert document batch...
2025-11-14 16:08:42,139 - INFO - Processing document 4_2023-07-27
2025-11-14 16:08:42,229 - INFO - Finished converting document 4_2023-07-27 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2023-07-26' --> 'data\processed_data\CRM\4_2023-07-26.md'


2025-11-14 16:08:42,350 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:42,395 - INFO - Going to convert document batch...
2025-11-14 16:08:42,396 - INFO - Processing document 4_2023-07-28
2025-11-14 16:08:42,475 - INFO - Finished converting document 4_2023-07-28 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2023-07-27' --> 'data\processed_data\CRM\4_2023-07-27.md'


2025-11-14 16:08:42,541 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:42,565 - INFO - Going to convert document batch...
2025-11-14 16:08:42,565 - INFO - Processing document 4_2023-07-31
2025-11-14 16:08:42,619 - INFO - Finished converting document 4_2023-07-31 in 0.09 sec.


Converted 'data\edgar_documents\CRM\4_2023-07-28' --> 'data\processed_data\CRM\4_2023-07-28.md'
Converted 'data\edgar_documents\CRM\4_2023-07-31' --> 'data\processed_data\CRM\4_2023-07-31.md'


2025-11-14 16:08:42,699 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:42,724 - INFO - Going to convert document batch...
2025-11-14 16:08:42,726 - INFO - Processing document 4_2023-08-01
2025-11-14 16:08:42,801 - INFO - Finished converting document 4_2023-08-01 in 0.12 sec.
2025-11-14 16:08:42,875 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:42,906 - INFO - Going to convert document batch...
2025-11-14 16:08:42,908 - INFO - Processing document 4_2023-08-02
2025-11-14 16:08:42,960 - INFO - Finished converting document 4_2023-08-02 in 0.09 sec.


Converted 'data\edgar_documents\CRM\4_2023-08-01' --> 'data\processed_data\CRM\4_2023-08-01.md'
Converted 'data\edgar_documents\CRM\4_2023-08-02' --> 'data\processed_data\CRM\4_2023-08-02.md'


2025-11-14 16:08:43,049 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:43,094 - INFO - Going to convert document batch...
2025-11-14 16:08:43,096 - INFO - Processing document 4_2023-08-03
2025-11-14 16:08:43,160 - INFO - Finished converting document 4_2023-08-03 in 0.14 sec.
2025-11-14 16:08:43,223 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:43,259 - INFO - Going to convert document batch...
2025-11-14 16:08:43,260 - INFO - Processing document 4_2023-08-04
2025-11-14 16:08:43,327 - INFO - Finished converting document 4_2023-08-04 in 0.12 sec.
2025-11-14 16:08:43,404 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-08-03' --> 'data\processed_data\CRM\4_2023-08-03.md'
Converted 'data\edgar_documents\CRM\4_2023-08-04' --> 'data\processed_data\CRM\4_2023-08-04.md'


2025-11-14 16:08:43,426 - INFO - Going to convert document batch...
2025-11-14 16:08:43,427 - INFO - Processing document 4_2023-08-07
2025-11-14 16:08:43,479 - INFO - Finished converting document 4_2023-08-07 in 0.09 sec.
2025-11-14 16:08:43,551 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:43,574 - INFO - Going to convert document batch...
2025-11-14 16:08:43,576 - INFO - Processing document 4_2023-08-08
2025-11-14 16:08:43,671 - INFO - Finished converting document 4_2023-08-08 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2023-08-07' --> 'data\processed_data\CRM\4_2023-08-07.md'


2025-11-14 16:08:43,755 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:43,778 - INFO - Going to convert document batch...
2025-11-14 16:08:43,779 - INFO - Processing document 4_2023-08-09
2025-11-14 16:08:43,843 - INFO - Finished converting document 4_2023-08-09 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2023-08-08' --> 'data\processed_data\CRM\4_2023-08-08.md'
Converted 'data\edgar_documents\CRM\4_2023-08-09' --> 'data\processed_data\CRM\4_2023-08-09.md'


2025-11-14 16:08:43,927 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:43,953 - INFO - Going to convert document batch...
2025-11-14 16:08:43,954 - INFO - Processing document 4_2023-08-10
2025-11-14 16:08:44,010 - INFO - Finished converting document 4_2023-08-10 in 0.11 sec.
2025-11-14 16:08:44,089 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:44,124 - INFO - Going to convert document batch...
2025-11-14 16:08:44,126 - INFO - Processing document 4_2023-08-11
2025-11-14 16:08:44,178 - INFO - Finished converting document 4_2023-08-11 in 0.09 sec.
2025-11-14 16:08:44,269 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-08-10' --> 'data\processed_data\CRM\4_2023-08-10.md'
Converted 'data\edgar_documents\CRM\4_2023-08-11' --> 'data\processed_data\CRM\4_2023-08-11.md'


2025-11-14 16:08:44,307 - INFO - Going to convert document batch...
2025-11-14 16:08:44,308 - INFO - Processing document 4_2023-08-14
2025-11-14 16:08:44,357 - INFO - Finished converting document 4_2023-08-14 in 0.11 sec.
2025-11-14 16:08:44,418 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:44,440 - INFO - Going to convert document batch...
2025-11-14 16:08:44,441 - INFO - Processing document 4_2023-08-15
2025-11-14 16:08:44,492 - INFO - Finished converting document 4_2023-08-15 in 0.08 sec.
2025-11-14 16:08:44,582 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:44,612 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-08-14' --> 'data\processed_data\CRM\4_2023-08-14.md'
Converted 'data\edgar_documents\CRM\4_2023-08-15' --> 'data\processed_data\CRM\4_2023-08-15.md'


2025-11-14 16:08:44,614 - INFO - Processing document 4_2023-08-16
2025-11-14 16:08:44,696 - INFO - Finished converting document 4_2023-08-16 in 0.14 sec.
2025-11-14 16:08:44,769 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:44,788 - INFO - Going to convert document batch...
2025-11-14 16:08:44,789 - INFO - Processing document 4_2023-08-17
2025-11-14 16:08:44,845 - INFO - Finished converting document 4_2023-08-17 in 0.09 sec.
2025-11-14 16:08:44,919 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-08-16' --> 'data\processed_data\CRM\4_2023-08-16.md'
Converted 'data\edgar_documents\CRM\4_2023-08-17' --> 'data\processed_data\CRM\4_2023-08-17.md'


2025-11-14 16:08:45,695 - INFO - Going to convert document batch...
2025-11-14 16:08:45,700 - INFO - Processing document 4_2023-08-18
2025-11-14 16:08:45,777 - INFO - Finished converting document 4_2023-08-18 in 0.88 sec.
2025-11-14 16:08:45,846 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:45,883 - INFO - Going to convert document batch...
2025-11-14 16:08:45,887 - INFO - Processing document 4_2023-08-21
2025-11-14 16:08:45,945 - INFO - Finished converting document 4_2023-08-21 in 0.11 sec.
2025-11-14 16:08:46,027 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-08-18' --> 'data\processed_data\CRM\4_2023-08-18.md'
Converted 'data\edgar_documents\CRM\4_2023-08-21' --> 'data\processed_data\CRM\4_2023-08-21.md'


2025-11-14 16:08:46,068 - INFO - Going to convert document batch...
2025-11-14 16:08:46,070 - INFO - Processing document 4_2023-08-22
2025-11-14 16:08:46,158 - INFO - Finished converting document 4_2023-08-22 in 0.16 sec.
2025-11-14 16:08:46,222 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:46,238 - INFO - Going to convert document batch...
2025-11-14 16:08:46,240 - INFO - Processing document 4_2023-08-23
2025-11-14 16:08:46,275 - INFO - Finished converting document 4_2023-08-23 in 0.06 sec.
2025-11-14 16:08:46,343 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:46,372 - INFO - Going to convert document batch...
2025-11-14 16:08:46,374 - INFO - Processing document 4_2023-08-24


Converted 'data\edgar_documents\CRM\4_2023-08-22' --> 'data\processed_data\CRM\4_2023-08-22.md'
Converted 'data\edgar_documents\CRM\4_2023-08-23' --> 'data\processed_data\CRM\4_2023-08-23.md'


2025-11-14 16:08:46,440 - INFO - Finished converting document 4_2023-08-24 in 0.11 sec.
2025-11-14 16:08:46,506 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:46,529 - INFO - Going to convert document batch...
2025-11-14 16:08:46,531 - INFO - Processing document 4_2023-08-25
2025-11-14 16:08:46,589 - INFO - Finished converting document 4_2023-08-25 in 0.11 sec.
2025-11-14 16:08:46,674 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-08-24' --> 'data\processed_data\CRM\4_2023-08-24.md'
Converted 'data\edgar_documents\CRM\4_2023-08-25' --> 'data\processed_data\CRM\4_2023-08-25.md'


2025-11-14 16:08:46,725 - INFO - Going to convert document batch...
2025-11-14 16:08:46,726 - INFO - Processing document 4_2023-08-28
2025-11-14 16:08:46,788 - INFO - Finished converting document 4_2023-08-28 in 0.14 sec.
2025-11-14 16:08:46,859 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:46,888 - INFO - Going to convert document batch...
2025-11-14 16:08:46,889 - INFO - Processing document 4_2023-08-29
2025-11-14 16:08:46,940 - INFO - Finished converting document 4_2023-08-29 in 0.09 sec.
2025-11-14 16:08:47,014 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:47,036 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-08-28' --> 'data\processed_data\CRM\4_2023-08-28.md'
Converted 'data\edgar_documents\CRM\4_2023-08-29' --> 'data\processed_data\CRM\4_2023-08-29.md'


2025-11-14 16:08:47,037 - INFO - Processing document 4_2023-08-30
2025-11-14 16:08:47,107 - INFO - Finished converting document 4_2023-08-30 in 0.12 sec.
2025-11-14 16:08:47,169 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:47,211 - INFO - Going to convert document batch...
2025-11-14 16:08:47,214 - INFO - Processing document 4_2023-08-31
2025-11-14 16:08:47,296 - INFO - Finished converting document 4_2023-08-31 in 0.14 sec.
2025-11-14 16:08:47,361 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-08-30' --> 'data\processed_data\CRM\4_2023-08-30.md'
Converted 'data\edgar_documents\CRM\4_2023-08-31' --> 'data\processed_data\CRM\4_2023-08-31.md'


2025-11-14 16:08:47,409 - INFO - Going to convert document batch...
2025-11-14 16:08:47,412 - INFO - Processing document 4_2023-09-01
2025-11-14 16:08:47,502 - INFO - Finished converting document 4_2023-09-01 in 0.16 sec.
2025-11-14 16:08:47,582 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:47,622 - INFO - Going to convert document batch...
2025-11-14 16:08:47,624 - INFO - Processing document 4_2023-09-05
2025-11-14 16:08:47,716 - INFO - Finished converting document 4_2023-09-05 in 0.17 sec.


Converted 'data\edgar_documents\CRM\4_2023-09-01' --> 'data\processed_data\CRM\4_2023-09-01.md'


2025-11-14 16:08:47,781 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:47,806 - INFO - Going to convert document batch...
2025-11-14 16:08:47,807 - INFO - Processing document 4_2023-09-06
2025-11-14 16:08:47,868 - INFO - Finished converting document 4_2023-09-06 in 0.09 sec.
2025-11-14 16:08:47,942 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-09-05' --> 'data\processed_data\CRM\4_2023-09-05.md'
Converted 'data\edgar_documents\CRM\4_2023-09-06' --> 'data\processed_data\CRM\4_2023-09-06.md'


2025-11-14 16:08:47,976 - INFO - Going to convert document batch...
2025-11-14 16:08:47,978 - INFO - Processing document 4_2023-09-07
2025-11-14 16:08:48,055 - INFO - Finished converting document 4_2023-09-07 in 0.14 sec.
2025-11-14 16:08:48,122 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:48,142 - INFO - Going to convert document batch...
2025-11-14 16:08:48,142 - INFO - Processing document 4_2023-09-08
2025-11-14 16:08:48,189 - INFO - Finished converting document 4_2023-09-08 in 0.08 sec.
2025-11-14 16:08:48,259 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:48,286 - INFO - Going to convert document batch...
2025-11-14 16:08:48,287 - INFO - Processing document 4_2023-09-11


Converted 'data\edgar_documents\CRM\4_2023-09-07' --> 'data\processed_data\CRM\4_2023-09-07.md'
Converted 'data\edgar_documents\CRM\4_2023-09-08' --> 'data\processed_data\CRM\4_2023-09-08.md'


2025-11-14 16:08:48,351 - INFO - Finished converting document 4_2023-09-11 in 0.11 sec.
2025-11-14 16:08:48,420 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:48,438 - INFO - Going to convert document batch...
2025-11-14 16:08:48,439 - INFO - Processing document 4_2023-09-12
2025-11-14 16:08:48,483 - INFO - Finished converting document 4_2023-09-12 in 0.08 sec.
2025-11-14 16:08:48,553 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:48,593 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-09-11' --> 'data\processed_data\CRM\4_2023-09-11.md'
Converted 'data\edgar_documents\CRM\4_2023-09-12' --> 'data\processed_data\CRM\4_2023-09-12.md'


2025-11-14 16:08:48,595 - INFO - Processing document 4_2023-09-13
2025-11-14 16:08:48,675 - INFO - Finished converting document 4_2023-09-13 in 0.16 sec.
2025-11-14 16:08:48,738 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:48,761 - INFO - Going to convert document batch...
2025-11-14 16:08:48,763 - INFO - Processing document 4_2023-09-14
2025-11-14 16:08:48,814 - INFO - Finished converting document 4_2023-09-14 in 0.09 sec.


Converted 'data\edgar_documents\CRM\4_2023-09-13' --> 'data\processed_data\CRM\4_2023-09-13.md'
Converted 'data\edgar_documents\CRM\4_2023-09-14' --> 'data\processed_data\CRM\4_2023-09-14.md'


2025-11-14 16:08:48,905 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:48,939 - INFO - Going to convert document batch...
2025-11-14 16:08:48,941 - INFO - Processing document 4_2023-09-15
2025-11-14 16:08:49,006 - INFO - Finished converting document 4_2023-09-15 in 0.12 sec.
2025-11-14 16:08:49,091 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:49,186 - INFO - Going to convert document batch...
2025-11-14 16:08:49,189 - INFO - Processing document 4_2023-09-18


Converted 'data\edgar_documents\CRM\4_2023-09-15' --> 'data\processed_data\CRM\4_2023-09-15.md'


2025-11-14 16:08:49,303 - INFO - Finished converting document 4_2023-09-18 in 0.23 sec.
2025-11-14 16:08:49,367 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:49,386 - INFO - Going to convert document batch...
2025-11-14 16:08:49,388 - INFO - Processing document 4_2023-09-19
2025-11-14 16:08:49,440 - INFO - Finished converting document 4_2023-09-19 in 0.09 sec.
2025-11-14 16:08:49,538 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-09-18' --> 'data\processed_data\CRM\4_2023-09-18.md'
Converted 'data\edgar_documents\CRM\4_2023-09-19' --> 'data\processed_data\CRM\4_2023-09-19.md'


2025-11-14 16:08:49,584 - INFO - Going to convert document batch...
2025-11-14 16:08:49,585 - INFO - Processing document 4_2023-09-20
2025-11-14 16:08:49,658 - INFO - Finished converting document 4_2023-09-20 in 0.14 sec.
2025-11-14 16:08:49,738 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:49,776 - INFO - Going to convert document batch...
2025-11-14 16:08:49,782 - INFO - Processing document 4_2023-09-21
2025-11-14 16:08:49,869 - INFO - Finished converting document 4_2023-09-21 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2023-09-20' --> 'data\processed_data\CRM\4_2023-09-20.md'


2025-11-14 16:08:49,960 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:49,985 - INFO - Going to convert document batch...
2025-11-14 16:08:49,986 - INFO - Processing document 4_2023-09-22
2025-11-14 16:08:50,038 - INFO - Finished converting document 4_2023-09-22 in 0.09 sec.
2025-11-14 16:08:50,113 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:50,150 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-09-21' --> 'data\processed_data\CRM\4_2023-09-21.md'
Converted 'data\edgar_documents\CRM\4_2023-09-22' --> 'data\processed_data\CRM\4_2023-09-22.md'


2025-11-14 16:08:50,151 - INFO - Processing document 4_2023-09-25
2025-11-14 16:08:50,230 - INFO - Finished converting document 4_2023-09-25 in 0.16 sec.
2025-11-14 16:08:50,305 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:50,333 - INFO - Going to convert document batch...
2025-11-14 16:08:50,334 - INFO - Processing document 4_2023-09-26
2025-11-14 16:08:50,391 - INFO - Finished converting document 4_2023-09-26 in 0.11 sec.
2025-11-14 16:08:50,477 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-09-25' --> 'data\processed_data\CRM\4_2023-09-25.md'
Converted 'data\edgar_documents\CRM\4_2023-09-26' --> 'data\processed_data\CRM\4_2023-09-26.md'


2025-11-14 16:08:50,502 - INFO - Going to convert document batch...
2025-11-14 16:08:50,503 - INFO - Processing document 4_2023-09-27
2025-11-14 16:08:50,556 - INFO - Finished converting document 4_2023-09-27 in 0.09 sec.
2025-11-14 16:08:50,633 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:50,667 - INFO - Going to convert document batch...
2025-11-14 16:08:50,669 - INFO - Processing document 4_2023-09-28
2025-11-14 16:08:50,752 - INFO - Finished converting document 4_2023-09-28 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-09-27' --> 'data\processed_data\CRM\4_2023-09-27.md'


2025-11-14 16:08:50,838 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:50,877 - INFO - Going to convert document batch...
2025-11-14 16:08:50,878 - INFO - Processing document 4_2023-09-29
2025-11-14 16:08:50,941 - INFO - Finished converting document 4_2023-09-29 in 0.11 sec.
2025-11-14 16:08:51,005 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:51,030 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-09-28' --> 'data\processed_data\CRM\4_2023-09-28.md'
Converted 'data\edgar_documents\CRM\4_2023-09-29' --> 'data\processed_data\CRM\4_2023-09-29.md'


2025-11-14 16:08:51,032 - INFO - Processing document 4_2023-10-02
2025-11-14 16:08:51,086 - INFO - Finished converting document 4_2023-10-02 in 0.09 sec.
2025-11-14 16:08:51,156 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:51,196 - INFO - Going to convert document batch...
2025-11-14 16:08:51,198 - INFO - Processing document 4_2023-10-03
2025-11-14 16:08:51,270 - INFO - Finished converting document 4_2023-10-03 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2023-10-02' --> 'data\processed_data\CRM\4_2023-10-02.md'
Converted 'data\edgar_documents\CRM\4_2023-10-03' --> 'data\processed_data\CRM\4_2023-10-03.md'


2025-11-14 16:08:51,384 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:51,420 - INFO - Going to convert document batch...
2025-11-14 16:08:51,421 - INFO - Processing document 4_2023-10-04
2025-11-14 16:08:51,492 - INFO - Finished converting document 4_2023-10-04 in 0.14 sec.
2025-11-14 16:08:51,593 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:51,621 - INFO - Going to convert document batch...
2025-11-14 16:08:51,622 - INFO - Processing document 4_2023-10-05
2025-11-14 16:08:51,666 - INFO - Finished converting document 4_2023-10-05 in 0.09 sec.
2025-11-14 16:08:51,722 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:51,744 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-10-04' --> 'data\processed_data\CRM\4_2023-10-04.md'
Converted 'data\edgar_documents\CRM\4_2023-10-05' --> 'data\processed_data\CRM\4_2023-10-05.md'


2025-11-14 16:08:51,745 - INFO - Processing document 4_2023-10-06
2025-11-14 16:08:51,798 - INFO - Finished converting document 4_2023-10-06 in 0.09 sec.
2025-11-14 16:08:51,875 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:51,896 - INFO - Going to convert document batch...
2025-11-14 16:08:51,897 - INFO - Processing document 4_2023-10-10
2025-11-14 16:08:51,945 - INFO - Finished converting document 4_2023-10-10 in 0.09 sec.
2025-11-14 16:08:52,022 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:52,046 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-10-06' --> 'data\processed_data\CRM\4_2023-10-06.md'
Converted 'data\edgar_documents\CRM\4_2023-10-10' --> 'data\processed_data\CRM\4_2023-10-10.md'


2025-11-14 16:08:52,047 - INFO - Processing document 4_2023-10-11
2025-11-14 16:08:52,103 - INFO - Finished converting document 4_2023-10-11 in 0.11 sec.
2025-11-14 16:08:52,159 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:52,190 - INFO - Going to convert document batch...
2025-11-14 16:08:52,191 - INFO - Processing document 4_2023-10-12
2025-11-14 16:08:52,242 - INFO - Finished converting document 4_2023-10-12 in 0.09 sec.
2025-11-14 16:08:52,334 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-10-11' --> 'data\processed_data\CRM\4_2023-10-11.md'
Converted 'data\edgar_documents\CRM\4_2023-10-12' --> 'data\processed_data\CRM\4_2023-10-12.md'


2025-11-14 16:08:52,381 - INFO - Going to convert document batch...
2025-11-14 16:08:52,383 - INFO - Processing document 4_2023-10-13
2025-11-14 16:08:53,097 - INFO - Finished converting document 4_2023-10-13 in 0.78 sec.
2025-11-14 16:08:53,200 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:53,237 - INFO - Going to convert document batch...
2025-11-14 16:08:53,239 - INFO - Processing document 4_2023-10-16
2025-11-14 16:08:53,309 - INFO - Finished converting document 4_2023-10-16 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-10-13' --> 'data\processed_data\CRM\4_2023-10-13.md'
Converted 'data\edgar_documents\CRM\4_2023-10-16' --> 'data\processed_data\CRM\4_2023-10-16.md'


2025-11-14 16:08:53,395 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:53,420 - INFO - Going to convert document batch...
2025-11-14 16:08:53,421 - INFO - Processing document 4_2023-10-17
2025-11-14 16:08:53,473 - INFO - Finished converting document 4_2023-10-17 in 0.11 sec.
2025-11-14 16:08:53,548 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:53,570 - INFO - Going to convert document batch...
2025-11-14 16:08:53,571 - INFO - Processing document 4_2023-10-18
2025-11-14 16:08:53,620 - INFO - Finished converting document 4_2023-10-18 in 0.09 sec.
2025-11-14 16:08:53,704 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-10-17' --> 'data\processed_data\CRM\4_2023-10-17.md'
Converted 'data\edgar_documents\CRM\4_2023-10-18' --> 'data\processed_data\CRM\4_2023-10-18.md'


2025-11-14 16:08:53,745 - INFO - Going to convert document batch...
2025-11-14 16:08:53,747 - INFO - Processing document 4_2023-10-19
2025-11-14 16:08:53,843 - INFO - Finished converting document 4_2023-10-19 in 0.16 sec.
2025-11-14 16:08:53,916 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:53,938 - INFO - Going to convert document batch...
2025-11-14 16:08:53,939 - INFO - Processing document 4_2023-10-20
2025-11-14 16:08:53,990 - INFO - Finished converting document 4_2023-10-20 in 0.09 sec.
2025-11-14 16:08:54,064 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:54,088 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-10-19' --> 'data\processed_data\CRM\4_2023-10-19.md'
Converted 'data\edgar_documents\CRM\4_2023-10-20' --> 'data\processed_data\CRM\4_2023-10-20.md'


2025-11-14 16:08:54,090 - INFO - Processing document 4_2023-10-23
2025-11-14 16:08:54,170 - INFO - Finished converting document 4_2023-10-23 in 0.12 sec.
2025-11-14 16:08:54,264 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:54,283 - INFO - Going to convert document batch...
2025-11-14 16:08:54,284 - INFO - Processing document 4_2023-10-24
2025-11-14 16:08:54,330 - INFO - Finished converting document 4_2023-10-24 in 0.09 sec.
2025-11-14 16:08:54,390 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:54,415 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-10-23' --> 'data\processed_data\CRM\4_2023-10-23.md'
Converted 'data\edgar_documents\CRM\4_2023-10-24' --> 'data\processed_data\CRM\4_2023-10-24.md'


2025-11-14 16:08:54,417 - INFO - Processing document 4_2023-10-25
2025-11-14 16:08:54,474 - INFO - Finished converting document 4_2023-10-25 in 0.09 sec.
2025-11-14 16:08:54,567 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:54,598 - INFO - Going to convert document batch...
2025-11-14 16:08:54,599 - INFO - Processing document 4_2023-10-26
2025-11-14 16:08:54,657 - INFO - Finished converting document 4_2023-10-26 in 0.11 sec.
2025-11-14 16:08:54,736 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-10-25' --> 'data\processed_data\CRM\4_2023-10-25.md'
Converted 'data\edgar_documents\CRM\4_2023-10-26' --> 'data\processed_data\CRM\4_2023-10-26.md'


2025-11-14 16:08:54,786 - INFO - Going to convert document batch...
2025-11-14 16:08:54,787 - INFO - Processing document 4_2023-10-27
2025-11-14 16:08:54,869 - INFO - Finished converting document 4_2023-10-27 in 0.16 sec.
2025-11-14 16:08:54,960 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:54,980 - INFO - Going to convert document batch...
2025-11-14 16:08:54,981 - INFO - Processing document 4_2023-10-30
2025-11-14 16:08:55,023 - INFO - Finished converting document 4_2023-10-30 in 0.08 sec.
2025-11-14 16:08:55,107 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-10-27' --> 'data\processed_data\CRM\4_2023-10-27.md'
Converted 'data\edgar_documents\CRM\4_2023-10-30' --> 'data\processed_data\CRM\4_2023-10-30.md'


2025-11-14 16:08:55,144 - INFO - Going to convert document batch...
2025-11-14 16:08:55,147 - INFO - Processing document 4_2023-10-31
2025-11-14 16:08:55,201 - INFO - Finished converting document 4_2023-10-31 in 0.11 sec.
2025-11-14 16:08:55,261 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:55,307 - INFO - Going to convert document batch...
2025-11-14 16:08:55,309 - INFO - Processing document 4_2023-11-01
2025-11-14 16:08:55,416 - INFO - Finished converting document 4_2023-11-01 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2023-10-31' --> 'data\processed_data\CRM\4_2023-10-31.md'


2025-11-14 16:08:55,526 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:55,561 - INFO - Going to convert document batch...
2025-11-14 16:08:55,565 - INFO - Processing document 4_2023-11-02


Converted 'data\edgar_documents\CRM\4_2023-11-01' --> 'data\processed_data\CRM\4_2023-11-01.md'


2025-11-14 16:08:55,739 - INFO - Finished converting document 4_2023-11-02 in 0.23 sec.
2025-11-14 16:08:55,800 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:55,817 - INFO - Going to convert document batch...
2025-11-14 16:08:55,818 - INFO - Processing document 4_2023-11-03
2025-11-14 16:08:55,862 - INFO - Finished converting document 4_2023-11-03 in 0.08 sec.
2025-11-14 16:08:55,918 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:55,941 - INFO - Going to convert document batch...
2025-11-14 16:08:55,941 - INFO - Processing document 4_2023-11-06
2025-11-14 16:08:55,987 - INFO - Finished converting document 4_2023-11-06 in 0.08 sec.


Converted 'data\edgar_documents\CRM\4_2023-11-02' --> 'data\processed_data\CRM\4_2023-11-02.md'
Converted 'data\edgar_documents\CRM\4_2023-11-03' --> 'data\processed_data\CRM\4_2023-11-03.md'


2025-11-14 16:08:56,046 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:56,067 - INFO - Going to convert document batch...
2025-11-14 16:08:56,069 - INFO - Processing document 4_2023-11-07
2025-11-14 16:08:56,158 - INFO - Finished converting document 4_2023-11-07 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2023-11-06' --> 'data\processed_data\CRM\4_2023-11-06.md'


2025-11-14 16:08:56,267 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:56,327 - INFO - Going to convert document batch...
2025-11-14 16:08:56,329 - INFO - Processing document 4_2023-11-08
2025-11-14 16:08:56,390 - INFO - Finished converting document 4_2023-11-08 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-11-07' --> 'data\processed_data\CRM\4_2023-11-07.md'


2025-11-14 16:08:56,502 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:56,566 - INFO - Going to convert document batch...
2025-11-14 16:08:56,567 - INFO - Processing document 4_2023-11-09
2025-11-14 16:08:56,629 - INFO - Finished converting document 4_2023-11-09 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2023-11-08' --> 'data\processed_data\CRM\4_2023-11-08.md'


2025-11-14 16:08:56,697 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:56,745 - INFO - Going to convert document batch...
2025-11-14 16:08:56,747 - INFO - Processing document 4_2023-11-13
2025-11-14 16:08:56,818 - INFO - Finished converting document 4_2023-11-13 in 0.12 sec.
2025-11-14 16:08:56,895 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-11-09' --> 'data\processed_data\CRM\4_2023-11-09.md'
Converted 'data\edgar_documents\CRM\4_2023-11-13' --> 'data\processed_data\CRM\4_2023-11-13.md'


2025-11-14 16:08:56,917 - INFO - Going to convert document batch...
2025-11-14 16:08:56,918 - INFO - Processing document 4_2023-11-14
2025-11-14 16:08:56,968 - INFO - Finished converting document 4_2023-11-14 in 0.11 sec.
2025-11-14 16:08:57,024 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:57,066 - INFO - Going to convert document batch...
2025-11-14 16:08:57,067 - INFO - Processing document 4_2023-11-15
2025-11-14 16:08:57,162 - INFO - Finished converting document 4_2023-11-15 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-11-14' --> 'data\processed_data\CRM\4_2023-11-14.md'


2025-11-14 16:08:57,272 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:57,316 - INFO - Going to convert document batch...
2025-11-14 16:08:57,318 - INFO - Processing document 4_2023-11-16
2025-11-14 16:08:57,395 - INFO - Finished converting document 4_2023-11-16 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-11-15' --> 'data\processed_data\CRM\4_2023-11-15.md'


2025-11-14 16:08:57,476 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:57,518 - INFO - Going to convert document batch...
2025-11-14 16:08:57,520 - INFO - Processing document 4_2023-11-17
2025-11-14 16:08:57,603 - INFO - Finished converting document 4_2023-11-17 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-11-16' --> 'data\processed_data\CRM\4_2023-11-16.md'
Converted 'data\edgar_documents\CRM\4_2023-11-17' --> 'data\processed_data\CRM\4_2023-11-17.md'


2025-11-14 16:08:57,681 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:57,718 - INFO - Going to convert document batch...
2025-11-14 16:08:57,720 - INFO - Processing document 4_2023-11-20
2025-11-14 16:08:57,790 - INFO - Finished converting document 4_2023-11-20 in 0.12 sec.
2025-11-14 16:08:57,892 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:57,936 - INFO - Going to convert document batch...
2025-11-14 16:08:57,939 - INFO - Processing document 4_2023-11-21
2025-11-14 16:08:58,003 - INFO - Finished converting document 4_2023-11-21 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2023-11-20' --> 'data\processed_data\CRM\4_2023-11-20.md'
Converted 'data\edgar_documents\CRM\4_2023-11-21' --> 'data\processed_data\CRM\4_2023-11-21.md'


2025-11-14 16:08:58,080 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:58,111 - INFO - Going to convert document batch...
2025-11-14 16:08:58,112 - INFO - Processing document 4_2023-11-22
2025-11-14 16:08:58,159 - INFO - Finished converting document 4_2023-11-22 in 0.11 sec.
2025-11-14 16:08:58,258 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:58,294 - INFO - Going to convert document batch...
2025-11-14 16:08:58,296 - INFO - Processing document 4_2023-11-24
2025-11-14 16:08:58,338 - INFO - Finished converting document 4_2023-11-24 in 0.12 sec.
2025-11-14 16:08:58,408 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-11-22' --> 'data\processed_data\CRM\4_2023-11-22.md'
Converted 'data\edgar_documents\CRM\4_2023-11-24' --> 'data\processed_data\CRM\4_2023-11-24.md'


2025-11-14 16:08:58,463 - INFO - Going to convert document batch...
2025-11-14 16:08:58,464 - INFO - Processing document 4_2023-11-27
2025-11-14 16:08:58,587 - INFO - Finished converting document 4_2023-11-27 in 0.20 sec.
2025-11-14 16:08:58,697 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:58,723 - INFO - Going to convert document batch...
2025-11-14 16:08:58,724 - INFO - Processing document 4_2023-11-28
2025-11-14 16:08:58,780 - INFO - Finished converting document 4_2023-11-28 in 0.11 sec.
2025-11-14 16:08:58,849 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:58,867 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-11-27' --> 'data\processed_data\CRM\4_2023-11-27.md'
Converted 'data\edgar_documents\CRM\4_2023-11-28' --> 'data\processed_data\CRM\4_2023-11-28.md'


2025-11-14 16:08:58,868 - INFO - Processing document 4_2023-11-29
2025-11-14 16:08:58,916 - INFO - Finished converting document 4_2023-11-29 in 0.09 sec.
2025-11-14 16:08:58,980 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:59,000 - INFO - Going to convert document batch...
2025-11-14 16:08:59,001 - INFO - Processing document 4_2023-11-30
2025-11-14 16:08:59,055 - INFO - Finished converting document 4_2023-11-30 in 0.09 sec.
2025-11-14 16:08:59,141 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-11-29' --> 'data\processed_data\CRM\4_2023-11-29.md'
Converted 'data\edgar_documents\CRM\4_2023-11-30' --> 'data\processed_data\CRM\4_2023-11-30.md'


2025-11-14 16:08:59,191 - INFO - Going to convert document batch...
2025-11-14 16:08:59,193 - INFO - Processing document 4_2023-12-01
2025-11-14 16:08:59,282 - INFO - Finished converting document 4_2023-12-01 in 0.17 sec.
2025-11-14 16:08:59,346 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:59,371 - INFO - Going to convert document batch...
2025-11-14 16:08:59,373 - INFO - Processing document 4_2023-12-04
2025-11-14 16:08:59,432 - INFO - Finished converting document 4_2023-12-04 in 0.11 sec.
2025-11-14 16:08:59,491 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:59,515 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-12-01' --> 'data\processed_data\CRM\4_2023-12-01.md'
Converted 'data\edgar_documents\CRM\4_2023-12-04' --> 'data\processed_data\CRM\4_2023-12-04.md'


2025-11-14 16:08:59,516 - INFO - Processing document 4_2023-12-05
2025-11-14 16:08:59,565 - INFO - Finished converting document 4_2023-12-05 in 0.09 sec.
2025-11-14 16:08:59,627 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:59,648 - INFO - Going to convert document batch...
2025-11-14 16:08:59,650 - INFO - Processing document 4_2023-12-06
2025-11-14 16:08:59,703 - INFO - Finished converting document 4_2023-12-06 in 0.09 sec.
2025-11-14 16:08:59,762 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:08:59,784 - INFO - Going to convert document batch...
2025-11-14 16:08:59,786 - INFO - Processing document 4_2023-12-07


Converted 'data\edgar_documents\CRM\4_2023-12-05' --> 'data\processed_data\CRM\4_2023-12-05.md'
Converted 'data\edgar_documents\CRM\4_2023-12-06' --> 'data\processed_data\CRM\4_2023-12-06.md'


2025-11-14 16:08:59,838 - INFO - Finished converting document 4_2023-12-07 in 0.09 sec.
2025-11-14 16:08:59,924 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-12-07' --> 'data\processed_data\CRM\4_2023-12-07.md'


2025-11-14 16:09:00,464 - INFO - Going to convert document batch...
2025-11-14 16:09:00,467 - INFO - Processing document 4_2023-12-08
2025-11-14 16:09:00,573 - INFO - Finished converting document 4_2023-12-08 in 0.69 sec.
2025-11-14 16:09:00,675 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:00,717 - INFO - Going to convert document batch...
2025-11-14 16:09:00,719 - INFO - Processing document 4_2023-12-11
2025-11-14 16:09:00,806 - INFO - Finished converting document 4_2023-12-11 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-12-08' --> 'data\processed_data\CRM\4_2023-12-08.md'


2025-11-14 16:09:00,907 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:00,945 - INFO - Going to convert document batch...
2025-11-14 16:09:00,947 - INFO - Processing document 4_2023-12-12
2025-11-14 16:09:01,030 - INFO - Finished converting document 4_2023-12-12 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2023-12-11' --> 'data\processed_data\CRM\4_2023-12-11.md'


2025-11-14 16:09:01,130 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:01,171 - INFO - Going to convert document batch...
2025-11-14 16:09:01,173 - INFO - Processing document 4_2023-12-13
2025-11-14 16:09:01,243 - INFO - Finished converting document 4_2023-12-13 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2023-12-12' --> 'data\processed_data\CRM\4_2023-12-12.md'


2025-11-14 16:09:01,331 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:01,350 - INFO - Going to convert document batch...
2025-11-14 16:09:01,351 - INFO - Processing document 4_2023-12-14
2025-11-14 16:09:01,403 - INFO - Finished converting document 4_2023-12-14 in 0.09 sec.
2025-11-14 16:09:01,483 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2023-12-13' --> 'data\processed_data\CRM\4_2023-12-13.md'
Converted 'data\edgar_documents\CRM\4_2023-12-14' --> 'data\processed_data\CRM\4_2023-12-14.md'


2025-11-14 16:09:01,523 - INFO - Going to convert document batch...
2025-11-14 16:09:01,526 - INFO - Processing document 4_2023-12-15
2025-11-14 16:09:01,603 - INFO - Finished converting document 4_2023-12-15 in 0.14 sec.
2025-11-14 16:09:01,669 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:01,691 - INFO - Going to convert document batch...
2025-11-14 16:09:01,693 - INFO - Processing document 4_2023-12-18
2025-11-14 16:09:01,747 - INFO - Finished converting document 4_2023-12-18 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2023-12-15' --> 'data\processed_data\CRM\4_2023-12-15.md'
Converted 'data\edgar_documents\CRM\4_2023-12-18' --> 'data\processed_data\CRM\4_2023-12-18.md'


2025-11-14 16:09:01,851 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:01,897 - INFO - Going to convert document batch...
2025-11-14 16:09:01,899 - INFO - Processing document 4_2023-12-19
2025-11-14 16:09:01,952 - INFO - Finished converting document 4_2023-12-19 in 0.14 sec.
2025-11-14 16:09:02,029 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:02,062 - INFO - Going to convert document batch...
2025-11-14 16:09:02,064 - INFO - Processing document 4_2023-12-20
2025-11-14 16:09:02,107 - INFO - Finished converting document 4_2023-12-20 in 0.09 sec.
2025-11-14 16:09:02,191 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:02,232 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-12-19' --> 'data\processed_data\CRM\4_2023-12-19.md'
Converted 'data\edgar_documents\CRM\4_2023-12-20' --> 'data\processed_data\CRM\4_2023-12-20.md'


2025-11-14 16:09:02,234 - INFO - Processing document 4_2023-12-21
2025-11-14 16:09:02,327 - INFO - Finished converting document 4_2023-12-21 in 0.17 sec.
2025-11-14 16:09:02,403 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:02,426 - INFO - Going to convert document batch...
2025-11-14 16:09:02,429 - INFO - Processing document 4_2023-12-22
2025-11-14 16:09:02,484 - INFO - Finished converting document 4_2023-12-22 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2023-12-21' --> 'data\processed_data\CRM\4_2023-12-21.md'
Converted 'data\edgar_documents\CRM\4_2023-12-22' --> 'data\processed_data\CRM\4_2023-12-22.md'


2025-11-14 16:09:02,588 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:02,637 - INFO - Going to convert document batch...
2025-11-14 16:09:02,638 - INFO - Processing document 4_2023-12-26
2025-11-14 16:09:02,720 - INFO - Finished converting document 4_2023-12-26 in 0.17 sec.
2025-11-14 16:09:02,824 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:02,864 - INFO - Going to convert document batch...
2025-11-14 16:09:02,867 - INFO - Processing document 4_2023-12-27
2025-11-14 16:09:02,948 - INFO - Finished converting document 4_2023-12-27 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2023-12-26' --> 'data\processed_data\CRM\4_2023-12-26.md'


2025-11-14 16:09:03,043 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:03,062 - INFO - Going to convert document batch...
2025-11-14 16:09:03,063 - INFO - Processing document 4_2023-12-28
2025-11-14 16:09:03,102 - INFO - Finished converting document 4_2023-12-28 in 0.08 sec.
2025-11-14 16:09:03,170 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:03,204 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-12-27' --> 'data\processed_data\CRM\4_2023-12-27.md'
Converted 'data\edgar_documents\CRM\4_2023-12-28' --> 'data\processed_data\CRM\4_2023-12-28.md'


2025-11-14 16:09:03,205 - INFO - Processing document 4_2023-12-29
2025-11-14 16:09:03,269 - INFO - Finished converting document 4_2023-12-29 in 0.12 sec.
2025-11-14 16:09:03,345 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:03,367 - INFO - Going to convert document batch...
2025-11-14 16:09:03,368 - INFO - Processing document 4_2024-01-03
2025-11-14 16:09:03,419 - INFO - Finished converting document 4_2024-01-03 in 0.09 sec.
2025-11-14 16:09:03,485 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:03,518 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2023-12-29' --> 'data\processed_data\CRM\4_2023-12-29.md'
Converted 'data\edgar_documents\CRM\4_2024-01-03' --> 'data\processed_data\CRM\4_2024-01-03.md'


2025-11-14 16:09:03,520 - INFO - Processing document 4_2024-01-04
2025-11-14 16:09:03,585 - INFO - Finished converting document 4_2024-01-04 in 0.11 sec.
2025-11-14 16:09:03,658 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:03,688 - INFO - Going to convert document batch...
2025-11-14 16:09:03,690 - INFO - Processing document 4_2024-01-05
2025-11-14 16:09:03,747 - INFO - Finished converting document 4_2024-01-05 in 0.11 sec.
2025-11-14 16:09:03,834 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-01-04' --> 'data\processed_data\CRM\4_2024-01-04.md'
Converted 'data\edgar_documents\CRM\4_2024-01-05' --> 'data\processed_data\CRM\4_2024-01-05.md'


2025-11-14 16:09:03,876 - INFO - Going to convert document batch...
2025-11-14 16:09:03,877 - INFO - Processing document 4_2024-01-08
2025-11-14 16:09:03,946 - INFO - Finished converting document 4_2024-01-08 in 0.14 sec.
2025-11-14 16:09:04,004 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:04,025 - INFO - Going to convert document batch...
2025-11-14 16:09:04,026 - INFO - Processing document 4_2024-01-09
2025-11-14 16:09:04,111 - INFO - Finished converting document 4_2024-01-09 in 0.12 sec.
2025-11-14 16:09:04,181 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-01-08' --> 'data\processed_data\CRM\4_2024-01-08.md'
Converted 'data\edgar_documents\CRM\4_2024-01-09' --> 'data\processed_data\CRM\4_2024-01-09.md'


2025-11-14 16:09:04,205 - INFO - Going to convert document batch...
2025-11-14 16:09:04,207 - INFO - Processing document 4_2024-01-10
2025-11-14 16:09:04,266 - INFO - Finished converting document 4_2024-01-10 in 0.11 sec.
2025-11-14 16:09:04,347 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:04,376 - INFO - Going to convert document batch...
2025-11-14 16:09:04,378 - INFO - Processing document 4_2024-01-11
2025-11-14 16:09:04,450 - INFO - Finished converting document 4_2024-01-11 in 0.12 sec.
2025-11-14 16:09:04,521 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-01-10' --> 'data\processed_data\CRM\4_2024-01-10.md'
Converted 'data\edgar_documents\CRM\4_2024-01-11' --> 'data\processed_data\CRM\4_2024-01-11.md'


2025-11-14 16:09:04,549 - INFO - Going to convert document batch...
2025-11-14 16:09:04,550 - INFO - Processing document 4_2024-01-12
2025-11-14 16:09:04,612 - INFO - Finished converting document 4_2024-01-12 in 0.11 sec.
2025-11-14 16:09:04,678 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:04,701 - INFO - Going to convert document batch...
2025-11-14 16:09:04,702 - INFO - Processing document 4_2024-01-16
2025-11-14 16:09:04,760 - INFO - Finished converting document 4_2024-01-16 in 0.11 sec.
2025-11-14 16:09:04,826 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:04,852 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2024-01-12' --> 'data\processed_data\CRM\4_2024-01-12.md'
Converted 'data\edgar_documents\CRM\4_2024-01-16' --> 'data\processed_data\CRM\4_2024-01-16.md'


2025-11-14 16:09:04,855 - INFO - Processing document 4_2024-01-17
2025-11-14 16:09:04,908 - INFO - Finished converting document 4_2024-01-17 in 0.09 sec.
2025-11-14 16:09:05,009 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:05,053 - INFO - Going to convert document batch...
2025-11-14 16:09:05,054 - INFO - Processing document 4_2024-01-18
2025-11-14 16:09:05,136 - INFO - Finished converting document 4_2024-01-18 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2024-01-17' --> 'data\processed_data\CRM\4_2024-01-17.md'


2025-11-14 16:09:05,220 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:05,261 - INFO - Going to convert document batch...
2025-11-14 16:09:05,262 - INFO - Processing document 4_2024-01-19
2025-11-14 16:09:05,316 - INFO - Finished converting document 4_2024-01-19 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2024-01-18' --> 'data\processed_data\CRM\4_2024-01-18.md'
Converted 'data\edgar_documents\CRM\4_2024-01-19' --> 'data\processed_data\CRM\4_2024-01-19.md'


2025-11-14 16:09:05,419 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:05,453 - INFO - Going to convert document batch...
2025-11-14 16:09:05,455 - INFO - Processing document 4_2024-01-22
2025-11-14 16:09:05,505 - INFO - Finished converting document 4_2024-01-22 in 0.11 sec.
2025-11-14 16:09:05,567 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:05,599 - INFO - Going to convert document batch...
2025-11-14 16:09:05,600 - INFO - Processing document 4_2024-01-23
2025-11-14 16:09:05,664 - INFO - Finished converting document 4_2024-01-23 in 0.11 sec.
2025-11-14 16:09:05,726 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-01-22' --> 'data\processed_data\CRM\4_2024-01-22.md'
Converted 'data\edgar_documents\CRM\4_2024-01-23' --> 'data\processed_data\CRM\4_2024-01-23.md'


2025-11-14 16:09:05,759 - INFO - Going to convert document batch...
2025-11-14 16:09:05,760 - INFO - Processing document 4_2024-01-24
2025-11-14 16:09:05,835 - INFO - Finished converting document 4_2024-01-24 in 0.12 sec.
2025-11-14 16:09:05,908 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:05,922 - INFO - Going to convert document batch...
2025-11-14 16:09:05,924 - INFO - Processing document 4_2024-01-25
2025-11-14 16:09:05,970 - INFO - Finished converting document 4_2024-01-25 in 0.08 sec.
2025-11-14 16:09:06,046 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:06,069 - INFO - Going to convert document batch...
2025-11-14 16:09:06,070 - INFO - Processing document 4_2024-01-26


Converted 'data\edgar_documents\CRM\4_2024-01-24' --> 'data\processed_data\CRM\4_2024-01-24.md'
Converted 'data\edgar_documents\CRM\4_2024-01-25' --> 'data\processed_data\CRM\4_2024-01-25.md'


2025-11-14 16:09:06,113 - INFO - Finished converting document 4_2024-01-26 in 0.08 sec.
2025-11-14 16:09:06,171 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:06,196 - INFO - Going to convert document batch...
2025-11-14 16:09:06,197 - INFO - Processing document 4_2024-01-29
2025-11-14 16:09:06,258 - INFO - Finished converting document 4_2024-01-29 in 0.09 sec.
2025-11-14 16:09:06,340 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-01-26' --> 'data\processed_data\CRM\4_2024-01-26.md'
Converted 'data\edgar_documents\CRM\4_2024-01-29' --> 'data\processed_data\CRM\4_2024-01-29.md'


2025-11-14 16:09:06,369 - INFO - Going to convert document batch...
2025-11-14 16:09:06,371 - INFO - Processing document 4_2024-01-30
2025-11-14 16:09:06,422 - INFO - Finished converting document 4_2024-01-30 in 0.11 sec.
2025-11-14 16:09:06,484 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:06,513 - INFO - Going to convert document batch...
2025-11-14 16:09:06,514 - INFO - Processing document 4_2024-01-31
2025-11-14 16:09:06,576 - INFO - Finished converting document 4_2024-01-31 in 0.11 sec.
2025-11-14 16:09:06,655 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-01-30' --> 'data\processed_data\CRM\4_2024-01-30.md'
Converted 'data\edgar_documents\CRM\4_2024-01-31' --> 'data\processed_data\CRM\4_2024-01-31.md'


2025-11-14 16:09:06,682 - INFO - Going to convert document batch...
2025-11-14 16:09:06,685 - INFO - Processing document 4_2024-02-01
2025-11-14 16:09:06,743 - INFO - Finished converting document 4_2024-02-01 in 0.11 sec.
2025-11-14 16:09:06,803 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:06,827 - INFO - Going to convert document batch...
2025-11-14 16:09:06,829 - INFO - Processing document 4_2024-02-02
2025-11-14 16:09:06,893 - INFO - Finished converting document 4_2024-02-02 in 0.11 sec.
2025-11-14 16:09:06,972 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-02-01' --> 'data\processed_data\CRM\4_2024-02-01.md'
Converted 'data\edgar_documents\CRM\4_2024-02-02' --> 'data\processed_data\CRM\4_2024-02-02.md'


2025-11-14 16:09:07,007 - INFO - Going to convert document batch...
2025-11-14 16:09:07,009 - INFO - Processing document 4_2024-02-05
2025-11-14 16:09:07,088 - INFO - Finished converting document 4_2024-02-05 in 0.16 sec.
2025-11-14 16:09:07,178 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:07,210 - INFO - Going to convert document batch...
2025-11-14 16:09:07,211 - INFO - Processing document 4_2024-02-06


Converted 'data\edgar_documents\CRM\4_2024-02-05' --> 'data\processed_data\CRM\4_2024-02-05.md'


2025-11-14 16:09:07,837 - INFO - Finished converting document 4_2024-02-06 in 0.67 sec.
2025-11-14 16:09:07,912 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:07,935 - INFO - Going to convert document batch...
2025-11-14 16:09:07,936 - INFO - Processing document 4_2024-02-07
2025-11-14 16:09:07,994 - INFO - Finished converting document 4_2024-02-07 in 0.09 sec.
2025-11-14 16:09:08,065 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:08,085 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2024-02-06' --> 'data\processed_data\CRM\4_2024-02-06.md'
Converted 'data\edgar_documents\CRM\4_2024-02-07' --> 'data\processed_data\CRM\4_2024-02-07.md'


2025-11-14 16:09:08,086 - INFO - Processing document 4_2024-02-08
2025-11-14 16:09:08,139 - INFO - Finished converting document 4_2024-02-08 in 0.09 sec.
2025-11-14 16:09:08,228 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:08,250 - INFO - Going to convert document batch...
2025-11-14 16:09:08,251 - INFO - Processing document 4_2024-02-09
2025-11-14 16:09:08,298 - INFO - Finished converting document 4_2024-02-09 in 0.09 sec.
2025-11-14 16:09:08,377 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-02-08' --> 'data\processed_data\CRM\4_2024-02-08.md'
Converted 'data\edgar_documents\CRM\4_2024-02-09' --> 'data\processed_data\CRM\4_2024-02-09.md'


2025-11-14 16:09:08,408 - INFO - Going to convert document batch...
2025-11-14 16:09:08,411 - INFO - Processing document 4_2024-02-12
2025-11-14 16:09:08,473 - INFO - Finished converting document 4_2024-02-12 in 0.12 sec.
2025-11-14 16:09:08,533 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:08,558 - INFO - Going to convert document batch...
2025-11-14 16:09:08,562 - INFO - Processing document 4_2024-02-13
2025-11-14 16:09:08,613 - INFO - Finished converting document 4_2024-02-13 in 0.09 sec.
2025-11-14 16:09:08,693 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-02-12' --> 'data\processed_data\CRM\4_2024-02-12.md'
Converted 'data\edgar_documents\CRM\4_2024-02-13' --> 'data\processed_data\CRM\4_2024-02-13.md'


2025-11-14 16:09:08,754 - INFO - Going to convert document batch...
2025-11-14 16:09:08,757 - INFO - Processing document 4_2024-02-14
2025-11-14 16:09:08,849 - INFO - Finished converting document 4_2024-02-14 in 0.17 sec.
2025-11-14 16:09:08,947 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:08,987 - INFO - Going to convert document batch...
2025-11-14 16:09:08,989 - INFO - Processing document 4_2024-02-15
2025-11-14 16:09:09,077 - INFO - Finished converting document 4_2024-02-15 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2024-02-14' --> 'data\processed_data\CRM\4_2024-02-14.md'
Converted 'data\edgar_documents\CRM\4_2024-02-15' --> 'data\processed_data\CRM\4_2024-02-15.md'


2025-11-14 16:09:09,152 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:09,178 - INFO - Going to convert document batch...
2025-11-14 16:09:09,179 - INFO - Processing document 4_2024-02-16
2025-11-14 16:09:09,234 - INFO - Finished converting document 4_2024-02-16 in 0.11 sec.
2025-11-14 16:09:09,325 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:09,346 - INFO - Going to convert document batch...
2025-11-14 16:09:09,347 - INFO - Processing document 4_2024-02-20
2025-11-14 16:09:09,398 - INFO - Finished converting document 4_2024-02-20 in 0.09 sec.
2025-11-14 16:09:09,462 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-02-16' --> 'data\processed_data\CRM\4_2024-02-16.md'
Converted 'data\edgar_documents\CRM\4_2024-02-20' --> 'data\processed_data\CRM\4_2024-02-20.md'


2025-11-14 16:09:09,490 - INFO - Going to convert document batch...
2025-11-14 16:09:09,492 - INFO - Processing document 4_2024-02-21
2025-11-14 16:09:09,559 - INFO - Finished converting document 4_2024-02-21 in 0.12 sec.
2025-11-14 16:09:09,626 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:09,650 - INFO - Going to convert document batch...
2025-11-14 16:09:09,652 - INFO - Processing document 4_2024-02-22
2025-11-14 16:09:09,734 - INFO - Finished converting document 4_2024-02-22 in 0.12 sec.
2025-11-14 16:09:09,810 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-02-21' --> 'data\processed_data\CRM\4_2024-02-21.md'
Converted 'data\edgar_documents\CRM\4_2024-02-22' --> 'data\processed_data\CRM\4_2024-02-22.md'


2025-11-14 16:09:09,828 - INFO - Going to convert document batch...
2025-11-14 16:09:09,829 - INFO - Processing document 4_2024-02-23
2025-11-14 16:09:09,869 - INFO - Finished converting document 4_2024-02-23 in 0.08 sec.
2025-11-14 16:09:09,919 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:09,948 - INFO - Going to convert document batch...
2025-11-14 16:09:09,949 - INFO - Processing document 4_2024-02-26
2025-11-14 16:09:10,015 - INFO - Finished converting document 4_2024-02-26 in 0.11 sec.
2025-11-14 16:09:10,089 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-02-23' --> 'data\processed_data\CRM\4_2024-02-23.md'
Converted 'data\edgar_documents\CRM\4_2024-02-26' --> 'data\processed_data\CRM\4_2024-02-26.md'


2025-11-14 16:09:10,107 - INFO - Going to convert document batch...
2025-11-14 16:09:10,109 - INFO - Processing document 4_2024-02-27
2025-11-14 16:09:10,156 - INFO - Finished converting document 4_2024-02-27 in 0.08 sec.
2025-11-14 16:09:10,213 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:10,235 - INFO - Going to convert document batch...
2025-11-14 16:09:10,236 - INFO - Processing document 4_2024-02-28
2025-11-14 16:09:10,304 - INFO - Finished converting document 4_2024-02-28 in 0.09 sec.
2025-11-14 16:09:10,365 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-02-27' --> 'data\processed_data\CRM\4_2024-02-27.md'
Converted 'data\edgar_documents\CRM\4_2024-02-28' --> 'data\processed_data\CRM\4_2024-02-28.md'


2025-11-14 16:09:10,392 - INFO - Going to convert document batch...
2025-11-14 16:09:10,394 - INFO - Processing document 4_2024-02-29
2025-11-14 16:09:10,469 - INFO - Finished converting document 4_2024-02-29 in 0.12 sec.
2025-11-14 16:09:10,552 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:10,596 - INFO - Going to convert document batch...
2025-11-14 16:09:10,597 - INFO - Processing document 4_2024-03-01
2025-11-14 16:09:10,724 - INFO - Finished converting document 4_2024-03-01 in 0.20 sec.


Converted 'data\edgar_documents\CRM\4_2024-02-29' --> 'data\processed_data\CRM\4_2024-02-29.md'


2025-11-14 16:09:10,814 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:10,863 - INFO - Going to convert document batch...
2025-11-14 16:09:10,865 - INFO - Processing document 4_2024-03-04
2025-11-14 16:09:10,949 - INFO - Finished converting document 4_2024-03-04 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2024-03-01' --> 'data\processed_data\CRM\4_2024-03-01.md'


2025-11-14 16:09:11,061 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:11,080 - INFO - Going to convert document batch...
2025-11-14 16:09:11,081 - INFO - Processing document 4_2024-03-05
2025-11-14 16:09:11,133 - INFO - Finished converting document 4_2024-03-05 in 0.09 sec.
2025-11-14 16:09:11,190 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-03-04' --> 'data\processed_data\CRM\4_2024-03-04.md'
Converted 'data\edgar_documents\CRM\4_2024-03-05' --> 'data\processed_data\CRM\4_2024-03-05.md'


2025-11-14 16:09:11,249 - INFO - Going to convert document batch...
2025-11-14 16:09:11,250 - INFO - Processing document 4_2024-03-06
2025-11-14 16:09:11,379 - INFO - Finished converting document 4_2024-03-06 in 0.20 sec.
2025-11-14 16:09:11,535 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:11,574 - INFO - Going to convert document batch...
2025-11-14 16:09:11,577 - INFO - Processing document 4_2024-03-07
2025-11-14 16:09:11,628 - INFO - Finished converting document 4_2024-03-07 in 0.11 sec.
2025-11-14 16:09:11,695 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:11,717 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2024-03-06' --> 'data\processed_data\CRM\4_2024-03-06.md'
Converted 'data\edgar_documents\CRM\4_2024-03-07' --> 'data\processed_data\CRM\4_2024-03-07.md'


2025-11-14 16:09:11,718 - INFO - Processing document 4_2024-03-08
2025-11-14 16:09:11,775 - INFO - Finished converting document 4_2024-03-08 in 0.09 sec.
2025-11-14 16:09:11,834 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:11,859 - INFO - Going to convert document batch...
2025-11-14 16:09:11,859 - INFO - Processing document 4_2024-03-11
2025-11-14 16:09:11,922 - INFO - Finished converting document 4_2024-03-11 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2024-03-08' --> 'data\processed_data\CRM\4_2024-03-08.md'


2025-11-14 16:09:12,012 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:12,051 - INFO - Going to convert document batch...
2025-11-14 16:09:12,054 - INFO - Processing document 4_2024-03-12
2025-11-14 16:09:12,119 - INFO - Finished converting document 4_2024-03-12 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2024-03-11' --> 'data\processed_data\CRM\4_2024-03-11.md'
Converted 'data\edgar_documents\CRM\4_2024-03-12' --> 'data\processed_data\CRM\4_2024-03-12.md'


2025-11-14 16:09:12,197 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:12,259 - INFO - Going to convert document batch...
2025-11-14 16:09:12,260 - INFO - Processing document 4_2024-03-13
2025-11-14 16:09:12,439 - INFO - Finished converting document 4_2024-03-13 in 0.27 sec.
2025-11-14 16:09:12,515 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:12,535 - INFO - Going to convert document batch...
2025-11-14 16:09:12,536 - INFO - Processing document 4_2024-03-14
2025-11-14 16:09:12,581 - INFO - Finished converting document 4_2024-03-14 in 0.09 sec.
2025-11-14 16:09:12,657 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:12,682 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2024-03-13' --> 'data\processed_data\CRM\4_2024-03-13.md'
Converted 'data\edgar_documents\CRM\4_2024-03-14' --> 'data\processed_data\CRM\4_2024-03-14.md'


2025-11-14 16:09:12,683 - INFO - Processing document 4_2024-03-15
2025-11-14 16:09:12,745 - INFO - Finished converting document 4_2024-03-15 in 0.12 sec.
2025-11-14 16:09:12,814 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:12,851 - INFO - Going to convert document batch...
2025-11-14 16:09:12,853 - INFO - Processing document 4_2024-03-18
2025-11-14 16:09:12,917 - INFO - Finished converting document 4_2024-03-18 in 0.12 sec.
2025-11-14 16:09:12,994 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-03-15' --> 'data\processed_data\CRM\4_2024-03-15.md'
Converted 'data\edgar_documents\CRM\4_2024-03-18' --> 'data\processed_data\CRM\4_2024-03-18.md'


2025-11-14 16:09:13,014 - INFO - Going to convert document batch...
2025-11-14 16:09:13,016 - INFO - Processing document 4_2024-03-19
2025-11-14 16:09:13,069 - INFO - Finished converting document 4_2024-03-19 in 0.09 sec.
2025-11-14 16:09:13,136 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:13,167 - INFO - Going to convert document batch...
2025-11-14 16:09:13,168 - INFO - Processing document 4_2024-03-20
2025-11-14 16:09:13,240 - INFO - Finished converting document 4_2024-03-20 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2024-03-19' --> 'data\processed_data\CRM\4_2024-03-19.md'
Converted 'data\edgar_documents\CRM\4_2024-03-20' --> 'data\processed_data\CRM\4_2024-03-20.md'


2025-11-14 16:09:13,324 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:13,348 - INFO - Going to convert document batch...
2025-11-14 16:09:13,350 - INFO - Processing document 4_2024-03-21
2025-11-14 16:09:13,400 - INFO - Finished converting document 4_2024-03-21 in 0.09 sec.
2025-11-14 16:09:13,565 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:13,598 - INFO - Going to convert document batch...
2025-11-14 16:09:13,599 - INFO - Processing document 4_2024-03-22
2025-11-14 16:09:13,639 - INFO - Finished converting document 4_2024-03-22 in 0.12 sec.
2025-11-14 16:09:13,705 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-03-21' --> 'data\processed_data\CRM\4_2024-03-21.md'
Converted 'data\edgar_documents\CRM\4_2024-03-22' --> 'data\processed_data\CRM\4_2024-03-22.md'


2025-11-14 16:09:13,742 - INFO - Going to convert document batch...
2025-11-14 16:09:13,745 - INFO - Processing document 4_2024-03-25
2025-11-14 16:09:13,816 - INFO - Finished converting document 4_2024-03-25 in 0.14 sec.
2025-11-14 16:09:13,874 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:13,899 - INFO - Going to convert document batch...
2025-11-14 16:09:13,900 - INFO - Processing document 4_2024-03-26
2025-11-14 16:09:13,974 - INFO - Finished converting document 4_2024-03-26 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2024-03-25' --> 'data\processed_data\CRM\4_2024-03-25.md'


2025-11-14 16:09:14,084 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-03-26' --> 'data\processed_data\CRM\4_2024-03-26.md'


2025-11-14 16:09:14,661 - INFO - Going to convert document batch...
2025-11-14 16:09:14,662 - INFO - Processing document 4_2024-03-27
2025-11-14 16:09:14,737 - INFO - Finished converting document 4_2024-03-27 in 0.67 sec.
2025-11-14 16:09:14,801 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:14,830 - INFO - Going to convert document batch...
2025-11-14 16:09:14,831 - INFO - Processing document 4_2024-03-28
2025-11-14 16:09:14,902 - INFO - Finished converting document 4_2024-03-28 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2024-03-27' --> 'data\processed_data\CRM\4_2024-03-27.md'


2025-11-14 16:09:14,989 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:15,010 - INFO - Going to convert document batch...
2025-11-14 16:09:15,011 - INFO - Processing document 4_2024-03-29
2025-11-14 16:09:15,055 - INFO - Finished converting document 4_2024-03-29 in 0.08 sec.
2025-11-14 16:09:15,126 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:15,148 - INFO - Going to convert document batch...
2025-11-14 16:09:15,150 - INFO - Processing document 4_2024-04-02


Converted 'data\edgar_documents\CRM\4_2024-03-28' --> 'data\processed_data\CRM\4_2024-03-28.md'
Converted 'data\edgar_documents\CRM\4_2024-03-29' --> 'data\processed_data\CRM\4_2024-03-29.md'


2025-11-14 16:09:15,229 - INFO - Finished converting document 4_2024-04-02 in 0.14 sec.
2025-11-14 16:09:15,304 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:15,345 - INFO - Going to convert document batch...
2025-11-14 16:09:15,346 - INFO - Processing document 4_2024-04-03
2025-11-14 16:09:15,431 - INFO - Finished converting document 4_2024-04-03 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2024-04-02' --> 'data\processed_data\CRM\4_2024-04-02.md'


2025-11-14 16:09:15,515 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:15,550 - INFO - Going to convert document batch...
2025-11-14 16:09:15,551 - INFO - Processing document 4_2024-04-04
2025-11-14 16:09:15,636 - INFO - Finished converting document 4_2024-04-04 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2024-04-03' --> 'data\processed_data\CRM\4_2024-04-03.md'
Converted 'data\edgar_documents\CRM\4_2024-04-04' --> 'data\processed_data\CRM\4_2024-04-04.md'


2025-11-14 16:09:15,730 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:15,770 - INFO - Going to convert document batch...
2025-11-14 16:09:15,772 - INFO - Processing document 4_2024-04-05
2025-11-14 16:09:15,861 - INFO - Finished converting document 4_2024-04-05 in 0.16 sec.
2025-11-14 16:09:15,996 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:16,052 - INFO - Going to convert document batch...
2025-11-14 16:09:16,055 - INFO - Processing document 4_2024-04-08
2025-11-14 16:09:16,155 - INFO - Finished converting document 4_2024-04-08 in 0.17 sec.


Converted 'data\edgar_documents\CRM\4_2024-04-05' --> 'data\processed_data\CRM\4_2024-04-05.md'


2025-11-14 16:09:16,232 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:16,254 - INFO - Going to convert document batch...
2025-11-14 16:09:16,255 - INFO - Processing document 4_2024-04-09
2025-11-14 16:09:16,312 - INFO - Finished converting document 4_2024-04-09 in 0.09 sec.
2025-11-14 16:09:16,376 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:16,395 - INFO - Going to convert document batch...
2025-11-14 16:09:16,396 - INFO - Processing document 4_2024-04-10


Converted 'data\edgar_documents\CRM\4_2024-04-08' --> 'data\processed_data\CRM\4_2024-04-08.md'
Converted 'data\edgar_documents\CRM\4_2024-04-09' --> 'data\processed_data\CRM\4_2024-04-09.md'


2025-11-14 16:09:16,429 - INFO - Finished converting document 4_2024-04-10 in 0.06 sec.
2025-11-14 16:09:16,500 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:16,528 - INFO - Going to convert document batch...
2025-11-14 16:09:16,529 - INFO - Processing document 4_2024-04-11
2025-11-14 16:09:16,576 - INFO - Finished converting document 4_2024-04-11 in 0.11 sec.
2025-11-14 16:09:16,648 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:16,666 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2024-04-10' --> 'data\processed_data\CRM\4_2024-04-10.md'
Converted 'data\edgar_documents\CRM\4_2024-04-11' --> 'data\processed_data\CRM\4_2024-04-11.md'


2025-11-14 16:09:16,668 - INFO - Processing document 4_2024-04-12
2025-11-14 16:09:16,730 - INFO - Finished converting document 4_2024-04-12 in 0.11 sec.
2025-11-14 16:09:16,853 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:16,898 - INFO - Going to convert document batch...
2025-11-14 16:09:16,899 - INFO - Processing document 4_2024-04-15
2025-11-14 16:09:16,955 - INFO - Finished converting document 4_2024-04-15 in 0.12 sec.
2025-11-14 16:09:17,036 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-04-12' --> 'data\processed_data\CRM\4_2024-04-12.md'
Converted 'data\edgar_documents\CRM\4_2024-04-15' --> 'data\processed_data\CRM\4_2024-04-15.md'


2025-11-14 16:09:17,099 - INFO - Going to convert document batch...
2025-11-14 16:09:17,100 - INFO - Processing document 4_2024-04-16
2025-11-14 16:09:17,222 - INFO - Finished converting document 4_2024-04-16 in 0.22 sec.
2025-11-14 16:09:17,337 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:17,362 - INFO - Going to convert document batch...
2025-11-14 16:09:17,364 - INFO - Processing document 4_2024-04-17
2025-11-14 16:09:17,432 - INFO - Finished converting document 4_2024-04-17 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2024-04-16' --> 'data\processed_data\CRM\4_2024-04-16.md'
Converted 'data\edgar_documents\CRM\4_2024-04-17' --> 'data\processed_data\CRM\4_2024-04-17.md'


2025-11-14 16:09:17,524 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:17,567 - INFO - Going to convert document batch...
2025-11-14 16:09:17,570 - INFO - Processing document 4_2024-04-18
2025-11-14 16:09:17,671 - INFO - Finished converting document 4_2024-04-18 in 0.17 sec.
2025-11-14 16:09:17,794 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:17,818 - INFO - Going to convert document batch...
2025-11-14 16:09:17,820 - INFO - Processing document 4_2024-04-19
2025-11-14 16:09:17,895 - INFO - Finished converting document 4_2024-04-19 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2024-04-18' --> 'data\processed_data\CRM\4_2024-04-18.md'
Converted 'data\edgar_documents\CRM\4_2024-04-19' --> 'data\processed_data\CRM\4_2024-04-19.md'


2025-11-14 16:09:17,973 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:17,993 - INFO - Going to convert document batch...
2025-11-14 16:09:17,994 - INFO - Processing document 4_2024-04-22
2025-11-14 16:09:18,043 - INFO - Finished converting document 4_2024-04-22 in 0.09 sec.
2025-11-14 16:09:18,137 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:18,178 - INFO - Going to convert document batch...
2025-11-14 16:09:18,179 - INFO - Processing document 4_2024-04-23
2025-11-14 16:09:18,281 - INFO - Finished converting document 4_2024-04-23 in 0.17 sec.


Converted 'data\edgar_documents\CRM\4_2024-04-22' --> 'data\processed_data\CRM\4_2024-04-22.md'


2025-11-14 16:09:18,371 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:18,416 - INFO - Going to convert document batch...
2025-11-14 16:09:18,417 - INFO - Processing document 4_2024-04-24
2025-11-14 16:09:18,494 - INFO - Finished converting document 4_2024-04-24 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2024-04-23' --> 'data\processed_data\CRM\4_2024-04-23.md'
Converted 'data\edgar_documents\CRM\4_2024-04-24' --> 'data\processed_data\CRM\4_2024-04-24.md'


2025-11-14 16:09:18,582 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:18,602 - INFO - Going to convert document batch...
2025-11-14 16:09:18,603 - INFO - Processing document 4_2024-04-25
2025-11-14 16:09:18,638 - INFO - Finished converting document 4_2024-04-25 in 0.08 sec.
2025-11-14 16:09:18,685 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:18,706 - INFO - Going to convert document batch...
2025-11-14 16:09:18,708 - INFO - Processing document 4_2024-04-26
2025-11-14 16:09:18,756 - INFO - Finished converting document 4_2024-04-26 in 0.08 sec.
2025-11-14 16:09:18,841 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:18,865 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2024-04-25' --> 'data\processed_data\CRM\4_2024-04-25.md'
Converted 'data\edgar_documents\CRM\4_2024-04-26' --> 'data\processed_data\CRM\4_2024-04-26.md'


2025-11-14 16:09:18,867 - INFO - Processing document 4_2024-04-29
2025-11-14 16:09:18,916 - INFO - Finished converting document 4_2024-04-29 in 0.09 sec.
2025-11-14 16:09:18,982 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:19,005 - INFO - Going to convert document batch...
2025-11-14 16:09:19,006 - INFO - Processing document 4_2024-04-30
2025-11-14 16:09:19,072 - INFO - Finished converting document 4_2024-04-30 in 0.09 sec.


Converted 'data\edgar_documents\CRM\4_2024-04-29' --> 'data\processed_data\CRM\4_2024-04-29.md'
Converted 'data\edgar_documents\CRM\4_2024-04-30' --> 'data\processed_data\CRM\4_2024-04-30.md'


2025-11-14 16:09:19,193 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:19,248 - INFO - Going to convert document batch...
2025-11-14 16:09:19,249 - INFO - Processing document 4_2024-05-01
2025-11-14 16:09:19,367 - INFO - Finished converting document 4_2024-05-01 in 0.20 sec.
2025-11-14 16:09:19,518 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:19,541 - INFO - Going to convert document batch...
2025-11-14 16:09:19,542 - INFO - Processing document 4_2024-05-02
2025-11-14 16:09:19,598 - INFO - Finished converting document 4_2024-05-02 in 0.09 sec.
2025-11-14 16:09:19,671 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:19,694 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2024-05-01' --> 'data\processed_data\CRM\4_2024-05-01.md'
Converted 'data\edgar_documents\CRM\4_2024-05-02' --> 'data\processed_data\CRM\4_2024-05-02.md'


2025-11-14 16:09:19,695 - INFO - Processing document 4_2024-05-03
2025-11-14 16:09:19,750 - INFO - Finished converting document 4_2024-05-03 in 0.11 sec.
2025-11-14 16:09:19,814 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:19,841 - INFO - Going to convert document batch...
2025-11-14 16:09:19,842 - INFO - Processing document 4_2024-05-06
2025-11-14 16:09:19,900 - INFO - Finished converting document 4_2024-05-06 in 0.09 sec.
2025-11-14 16:09:19,961 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:19,981 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2024-05-03' --> 'data\processed_data\CRM\4_2024-05-03.md'
Converted 'data\edgar_documents\CRM\4_2024-05-06' --> 'data\processed_data\CRM\4_2024-05-06.md'


2025-11-14 16:09:19,982 - INFO - Processing document 4_2024-05-07
2025-11-14 16:09:20,027 - INFO - Finished converting document 4_2024-05-07 in 0.08 sec.
2025-11-14 16:09:20,094 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:20,126 - INFO - Going to convert document batch...
2025-11-14 16:09:20,127 - INFO - Processing document 4_2024-05-08
2025-11-14 16:09:20,280 - INFO - Finished converting document 4_2024-05-08 in 0.20 sec.


Converted 'data\edgar_documents\CRM\4_2024-05-07' --> 'data\processed_data\CRM\4_2024-05-07.md'


2025-11-14 16:09:20,349 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:20,367 - INFO - Going to convert document batch...
2025-11-14 16:09:20,369 - INFO - Processing document 4_2024-05-09
2025-11-14 16:09:20,413 - INFO - Finished converting document 4_2024-05-09 in 0.08 sec.
2025-11-14 16:09:20,484 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:20,509 - INFO - Going to convert document batch...
2025-11-14 16:09:20,510 - INFO - Processing document 4_2024-05-10


Converted 'data\edgar_documents\CRM\4_2024-05-08' --> 'data\processed_data\CRM\4_2024-05-08.md'
Converted 'data\edgar_documents\CRM\4_2024-05-09' --> 'data\processed_data\CRM\4_2024-05-09.md'


2025-11-14 16:09:20,567 - INFO - Finished converting document 4_2024-05-10 in 0.11 sec.
2025-11-14 16:09:20,640 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:20,664 - INFO - Going to convert document batch...
2025-11-14 16:09:20,665 - INFO - Processing document 4_2024-05-13
2025-11-14 16:09:20,715 - INFO - Finished converting document 4_2024-05-13 in 0.09 sec.
2025-11-14 16:09:20,774 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:20,800 - INFO - Going to convert document batch...
2025-11-14 16:09:20,801 - INFO - Processing document 4_2024-05-14


Converted 'data\edgar_documents\CRM\4_2024-05-10' --> 'data\processed_data\CRM\4_2024-05-10.md'
Converted 'data\edgar_documents\CRM\4_2024-05-13' --> 'data\processed_data\CRM\4_2024-05-13.md'


2025-11-14 16:09:20,856 - INFO - Finished converting document 4_2024-05-14 in 0.11 sec.
2025-11-14 16:09:20,942 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:20,990 - INFO - Going to convert document batch...
2025-11-14 16:09:20,992 - INFO - Processing document 4_2024-05-15
2025-11-14 16:09:21,058 - INFO - Finished converting document 4_2024-05-15 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2024-05-14' --> 'data\processed_data\CRM\4_2024-05-14.md'
Converted 'data\edgar_documents\CRM\4_2024-05-15' --> 'data\processed_data\CRM\4_2024-05-15.md'


2025-11-14 16:09:21,135 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:21,158 - INFO - Going to convert document batch...
2025-11-14 16:09:21,160 - INFO - Processing document 4_2024-05-16
2025-11-14 16:09:21,200 - INFO - Finished converting document 4_2024-05-16 in 0.09 sec.
2025-11-14 16:09:21,255 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-05-16' --> 'data\processed_data\CRM\4_2024-05-16.md'


2025-11-14 16:09:21,933 - INFO - Going to convert document batch...
2025-11-14 16:09:21,936 - INFO - Processing document 4_2024-05-17
2025-11-14 16:09:22,000 - INFO - Finished converting document 4_2024-05-17 in 0.77 sec.
2025-11-14 16:09:22,072 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:22,097 - INFO - Going to convert document batch...
2025-11-14 16:09:22,098 - INFO - Processing document 4_2024-05-20
2025-11-14 16:09:22,152 - INFO - Finished converting document 4_2024-05-20 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2024-05-17' --> 'data\processed_data\CRM\4_2024-05-17.md'


2025-11-14 16:09:22,305 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:22,324 - INFO - Going to convert document batch...
2025-11-14 16:09:22,325 - INFO - Processing document 4_2024-05-21
2025-11-14 16:09:22,380 - INFO - Finished converting document 4_2024-05-21 in 0.09 sec.
2025-11-14 16:09:22,449 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-05-20' --> 'data\processed_data\CRM\4_2024-05-20.md'
Converted 'data\edgar_documents\CRM\4_2024-05-21' --> 'data\processed_data\CRM\4_2024-05-21.md'


2025-11-14 16:09:22,476 - INFO - Going to convert document batch...
2025-11-14 16:09:22,479 - INFO - Processing document 4_2024-05-22
2025-11-14 16:09:22,561 - INFO - Finished converting document 4_2024-05-22 in 0.14 sec.
2025-11-14 16:09:22,646 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:22,682 - INFO - Going to convert document batch...
2025-11-14 16:09:22,683 - INFO - Processing document 4_2024-05-23
2025-11-14 16:09:22,749 - INFO - Finished converting document 4_2024-05-23 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2024-05-22' --> 'data\processed_data\CRM\4_2024-05-22.md'
Converted 'data\edgar_documents\CRM\4_2024-05-23' --> 'data\processed_data\CRM\4_2024-05-23.md'


2025-11-14 16:09:22,838 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:22,868 - INFO - Going to convert document batch...
2025-11-14 16:09:22,870 - INFO - Processing document 4_2024-05-24
2025-11-14 16:09:22,965 - INFO - Finished converting document 4_2024-05-24 in 0.16 sec.
2025-11-14 16:09:23,043 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:23,067 - INFO - Going to convert document batch...
2025-11-14 16:09:23,068 - INFO - Processing document 4_2024-05-28
2025-11-14 16:09:23,132 - INFO - Finished converting document 4_2024-05-28 in 0.09 sec.
2025-11-14 16:09:23,213 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-05-24' --> 'data\processed_data\CRM\4_2024-05-24.md'
Converted 'data\edgar_documents\CRM\4_2024-05-28' --> 'data\processed_data\CRM\4_2024-05-28.md'


2025-11-14 16:09:23,269 - INFO - Going to convert document batch...
2025-11-14 16:09:23,272 - INFO - Processing document 4_2024-05-29
2025-11-14 16:09:23,353 - INFO - Finished converting document 4_2024-05-29 in 0.16 sec.
2025-11-14 16:09:23,437 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:23,473 - INFO - Going to convert document batch...
2025-11-14 16:09:23,479 - INFO - Processing document 4_2024-05-30
2025-11-14 16:09:23,555 - INFO - Finished converting document 4_2024-05-30 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2024-05-29' --> 'data\processed_data\CRM\4_2024-05-29.md'
Converted 'data\edgar_documents\CRM\4_2024-05-30' --> 'data\processed_data\CRM\4_2024-05-30.md'


2025-11-14 16:09:23,627 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:23,678 - INFO - Going to convert document batch...
2025-11-14 16:09:23,679 - INFO - Processing document 4_2024-05-31
2025-11-14 16:09:23,757 - INFO - Finished converting document 4_2024-05-31 in 0.16 sec.
2025-11-14 16:09:23,871 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:23,944 - INFO - Going to convert document batch...
2025-11-14 16:09:23,946 - INFO - Processing document 4_2024-06-03


Converted 'data\edgar_documents\CRM\4_2024-05-31' --> 'data\processed_data\CRM\4_2024-05-31.md'


2025-11-14 16:09:24,059 - INFO - Finished converting document 4_2024-06-03 in 0.22 sec.
2025-11-14 16:09:24,244 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:24,283 - INFO - Going to convert document batch...
2025-11-14 16:09:24,284 - INFO - Processing document 4_2024-06-04
2025-11-14 16:09:24,350 - INFO - Finished converting document 4_2024-06-04 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2024-06-03' --> 'data\processed_data\CRM\4_2024-06-03.md'


2025-11-14 16:09:24,476 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:24,557 - INFO - Going to convert document batch...
2025-11-14 16:09:24,559 - INFO - Processing document 4_2024-06-05


Converted 'data\edgar_documents\CRM\4_2024-06-04' --> 'data\processed_data\CRM\4_2024-06-04.md'


2025-11-14 16:09:24,672 - INFO - Finished converting document 4_2024-06-05 in 0.23 sec.
2025-11-14 16:09:24,762 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:24,806 - INFO - Going to convert document batch...
2025-11-14 16:09:24,808 - INFO - Processing document 4_2024-06-06
2025-11-14 16:09:24,877 - INFO - Finished converting document 4_2024-06-06 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2024-06-05' --> 'data\processed_data\CRM\4_2024-06-05.md'


2025-11-14 16:09:24,973 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:25,056 - INFO - Going to convert document batch...
2025-11-14 16:09:25,060 - INFO - Processing document 4_2024-06-07


Converted 'data\edgar_documents\CRM\4_2024-06-06' --> 'data\processed_data\CRM\4_2024-06-06.md'


2025-11-14 16:09:25,146 - INFO - Finished converting document 4_2024-06-07 in 0.20 sec.
2025-11-14 16:09:25,224 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:25,249 - INFO - Going to convert document batch...
2025-11-14 16:09:25,251 - INFO - Processing document 4_2024-06-10
2025-11-14 16:09:25,307 - INFO - Finished converting document 4_2024-06-10 in 0.09 sec.
2025-11-14 16:09:25,383 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:25,403 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2024-06-07' --> 'data\processed_data\CRM\4_2024-06-07.md'
Converted 'data\edgar_documents\CRM\4_2024-06-10' --> 'data\processed_data\CRM\4_2024-06-10.md'


2025-11-14 16:09:25,404 - INFO - Processing document 4_2024-06-11
2025-11-14 16:09:25,449 - INFO - Finished converting document 4_2024-06-11 in 0.09 sec.
2025-11-14 16:09:25,510 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:25,527 - INFO - Going to convert document batch...
2025-11-14 16:09:25,528 - INFO - Processing document 4_2024-06-12
2025-11-14 16:09:25,569 - INFO - Finished converting document 4_2024-06-12 in 0.06 sec.
2025-11-14 16:09:25,676 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-06-11' --> 'data\processed_data\CRM\4_2024-06-11.md'
Converted 'data\edgar_documents\CRM\4_2024-06-12' --> 'data\processed_data\CRM\4_2024-06-12.md'


2025-11-14 16:09:25,718 - INFO - Going to convert document batch...
2025-11-14 16:09:25,724 - INFO - Processing document 4_2024-06-20
2025-11-14 16:09:25,809 - INFO - Finished converting document 4_2024-06-20 in 0.17 sec.
2025-11-14 16:09:25,902 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:25,946 - INFO - Going to convert document batch...
2025-11-14 16:09:25,948 - INFO - Processing document 4_2024-06-24
2025-11-14 16:09:26,001 - INFO - Finished converting document 4_2024-06-24 in 0.12 sec.
2025-11-14 16:09:26,073 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-06-20' --> 'data\processed_data\CRM\4_2024-06-20.md'
Converted 'data\edgar_documents\CRM\4_2024-06-24' --> 'data\processed_data\CRM\4_2024-06-24.md'


2025-11-14 16:09:26,090 - INFO - Going to convert document batch...
2025-11-14 16:09:26,092 - INFO - Processing document 4_2024-06-25
2025-11-14 16:09:26,131 - INFO - Finished converting document 4_2024-06-25 in 0.08 sec.
2025-11-14 16:09:26,186 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:26,208 - INFO - Going to convert document batch...
2025-11-14 16:09:26,209 - INFO - Processing document 4_2024-06-26
2025-11-14 16:09:26,247 - INFO - Finished converting document 4_2024-06-26 in 0.08 sec.
2025-11-14 16:09:26,304 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:26,328 - INFO - Going to convert document batch...
2025-11-14 16:09:26,330 - INFO - Processing document 4_2024-06-28


Converted 'data\edgar_documents\CRM\4_2024-06-25' --> 'data\processed_data\CRM\4_2024-06-25.md'
Converted 'data\edgar_documents\CRM\4_2024-06-26' --> 'data\processed_data\CRM\4_2024-06-26.md'


2025-11-14 16:09:26,389 - INFO - Finished converting document 4_2024-06-28 in 0.11 sec.
2025-11-14 16:09:26,480 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:26,522 - INFO - Going to convert document batch...
2025-11-14 16:09:26,525 - INFO - Processing document 4_2024-07-01
2025-11-14 16:09:26,606 - INFO - Finished converting document 4_2024-07-01 in 0.14 sec.
2025-11-14 16:09:26,672 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-06-28' --> 'data\processed_data\CRM\4_2024-06-28.md'
Converted 'data\edgar_documents\CRM\4_2024-07-01' --> 'data\processed_data\CRM\4_2024-07-01.md'


2025-11-14 16:09:26,704 - INFO - Going to convert document batch...
2025-11-14 16:09:26,706 - INFO - Processing document 4_2024-07-03
2025-11-14 16:09:26,769 - INFO - Finished converting document 4_2024-07-03 in 0.12 sec.
2025-11-14 16:09:26,840 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:26,869 - INFO - Going to convert document batch...
2025-11-14 16:09:26,871 - INFO - Processing document 4_2024-07-10
2025-11-14 16:09:26,932 - INFO - Finished converting document 4_2024-07-10 in 0.09 sec.


Converted 'data\edgar_documents\CRM\4_2024-07-03' --> 'data\processed_data\CRM\4_2024-07-03.md'
Converted 'data\edgar_documents\CRM\4_2024-07-10' --> 'data\processed_data\CRM\4_2024-07-10.md'


2025-11-14 16:09:27,037 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:27,067 - INFO - Going to convert document batch...
2025-11-14 16:09:27,068 - INFO - Processing document 4_2024-07-17
2025-11-14 16:09:27,132 - INFO - Finished converting document 4_2024-07-17 in 0.12 sec.
2025-11-14 16:09:27,200 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:27,221 - INFO - Going to convert document batch...
2025-11-14 16:09:27,222 - INFO - Processing document 4_2024-07-23
2025-11-14 16:09:27,263 - INFO - Finished converting document 4_2024-07-23 in 0.08 sec.
2025-11-14 16:09:27,335 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:27,367 - INFO - Going to convert document batch...
2025-11-14 16:09:27,368 - INFO - Processing document 4_2024-07-24


Converted 'data\edgar_documents\CRM\4_2024-07-17' --> 'data\processed_data\CRM\4_2024-07-17.md'
Converted 'data\edgar_documents\CRM\4_2024-07-23' --> 'data\processed_data\CRM\4_2024-07-23.md'


2025-11-14 16:09:27,429 - INFO - Finished converting document 4_2024-07-24 in 0.12 sec.
2025-11-14 16:09:27,494 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:27,510 - INFO - Going to convert document batch...
2025-11-14 16:09:27,512 - INFO - Processing document 4_2024-07-25
2025-11-14 16:09:27,549 - INFO - Finished converting document 4_2024-07-25 in 0.08 sec.
2025-11-14 16:09:27,619 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:27,639 - INFO - Going to convert document batch...
2025-11-14 16:09:27,641 - INFO - Processing document 4_2024-07-26


Converted 'data\edgar_documents\CRM\4_2024-07-24' --> 'data\processed_data\CRM\4_2024-07-24.md'
Converted 'data\edgar_documents\CRM\4_2024-07-25' --> 'data\processed_data\CRM\4_2024-07-25.md'


2025-11-14 16:09:27,683 - INFO - Finished converting document 4_2024-07-26 in 0.09 sec.
2025-11-14 16:09:27,741 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:27,774 - INFO - Going to convert document batch...
2025-11-14 16:09:27,775 - INFO - Processing document 4_2024-07-31
2025-11-14 16:09:27,858 - INFO - Finished converting document 4_2024-07-31 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2024-07-26' --> 'data\processed_data\CRM\4_2024-07-26.md'


2025-11-14 16:09:27,930 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:27,969 - INFO - Going to convert document batch...
2025-11-14 16:09:28,424 - INFO - Processing document 4_2024-08-07


Converted 'data\edgar_documents\CRM\4_2024-07-31' --> 'data\processed_data\CRM\4_2024-07-31.md'


2025-11-14 16:09:28,583 - INFO - Finished converting document 4_2024-08-07 in 0.66 sec.
2025-11-14 16:09:28,675 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:28,700 - INFO - Going to convert document batch...
2025-11-14 16:09:28,701 - INFO - Processing document 4_2024-08-12
2025-11-14 16:09:28,755 - INFO - Finished converting document 4_2024-08-12 in 0.09 sec.
2025-11-14 16:09:28,836 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:28,863 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2024-08-07' --> 'data\processed_data\CRM\4_2024-08-07.md'
Converted 'data\edgar_documents\CRM\4_2024-08-12' --> 'data\processed_data\CRM\4_2024-08-12.md'


2025-11-14 16:09:28,864 - INFO - Processing document 4_2024-08-14
2025-11-14 16:09:28,938 - INFO - Finished converting document 4_2024-08-14 in 0.12 sec.
2025-11-14 16:09:29,030 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:29,066 - INFO - Going to convert document batch...
2025-11-14 16:09:29,068 - INFO - Processing document 4_2024-08-21


Converted 'data\edgar_documents\CRM\4_2024-08-14' --> 'data\processed_data\CRM\4_2024-08-14.md'


2025-11-14 16:09:29,264 - INFO - Finished converting document 4_2024-08-21 in 0.25 sec.
2025-11-14 16:09:29,360 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:29,378 - INFO - Going to convert document batch...
2025-11-14 16:09:29,379 - INFO - Processing document 4_2024-08-23
2025-11-14 16:09:29,416 - INFO - Finished converting document 4_2024-08-23 in 0.09 sec.
2025-11-14 16:09:29,481 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:29,511 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2024-08-21' --> 'data\processed_data\CRM\4_2024-08-21.md'
Converted 'data\edgar_documents\CRM\4_2024-08-23' --> 'data\processed_data\CRM\4_2024-08-23.md'


2025-11-14 16:09:29,512 - INFO - Processing document 4_2024-08-28
2025-11-14 16:09:29,579 - INFO - Finished converting document 4_2024-08-28 in 0.12 sec.
2025-11-14 16:09:29,652 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:29,683 - INFO - Going to convert document batch...
2025-11-14 16:09:29,685 - INFO - Processing document 4_2024-09-05
2025-11-14 16:09:29,756 - INFO - Finished converting document 4_2024-09-05 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2024-08-28' --> 'data\processed_data\CRM\4_2024-08-28.md'


2025-11-14 16:09:29,830 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:29,859 - INFO - Going to convert document batch...
2025-11-14 16:09:29,860 - INFO - Processing document 4_2024-09-11
2025-11-14 16:09:29,946 - INFO - Finished converting document 4_2024-09-11 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2024-09-05' --> 'data\processed_data\CRM\4_2024-09-05.md'


2025-11-14 16:09:30,035 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:30,050 - INFO - Going to convert document batch...
2025-11-14 16:09:30,052 - INFO - Processing document 4_2024-09-12
2025-11-14 16:09:30,086 - INFO - Finished converting document 4_2024-09-12 in 0.06 sec.
2025-11-14 16:09:30,142 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:30,175 - INFO - Going to convert document batch...
2025-11-14 16:09:30,176 - INFO - Processing document 4_2024-09-18


Converted 'data\edgar_documents\CRM\4_2024-09-11' --> 'data\processed_data\CRM\4_2024-09-11.md'
Converted 'data\edgar_documents\CRM\4_2024-09-12' --> 'data\processed_data\CRM\4_2024-09-12.md'


2025-11-14 16:09:30,245 - INFO - Finished converting document 4_2024-09-18 in 0.14 sec.
2025-11-14 16:09:30,331 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:30,369 - INFO - Going to convert document batch...
2025-11-14 16:09:30,372 - INFO - Processing document 4_2024-09-23
2025-11-14 16:09:30,435 - INFO - Finished converting document 4_2024-09-23 in 0.12 sec.
2025-11-14 16:09:30,490 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:30,506 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2024-09-18' --> 'data\processed_data\CRM\4_2024-09-18.md'
Converted 'data\edgar_documents\CRM\4_2024-09-23' --> 'data\processed_data\CRM\4_2024-09-23.md'


2025-11-14 16:09:30,507 - INFO - Processing document 4_2024-09-25
2025-11-14 16:09:30,541 - INFO - Finished converting document 4_2024-09-25 in 0.06 sec.
2025-11-14 16:09:30,591 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:30,607 - INFO - Going to convert document batch...
2025-11-14 16:09:30,608 - INFO - Processing document 4_2024-09-27
2025-11-14 16:09:30,645 - INFO - Finished converting document 4_2024-09-27 in 0.06 sec.
2025-11-14 16:09:30,697 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:30,734 - INFO - Going to convert document batch...
2025-11-14 16:09:30,738 - INFO - Processing document 4_2024-10-02


Converted 'data\edgar_documents\CRM\4_2024-09-25' --> 'data\processed_data\CRM\4_2024-09-25.md'
Converted 'data\edgar_documents\CRM\4_2024-09-27' --> 'data\processed_data\CRM\4_2024-09-27.md'


2025-11-14 16:09:30,820 - INFO - Finished converting document 4_2024-10-02 in 0.12 sec.
2025-11-14 16:09:30,892 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:30,906 - INFO - Going to convert document batch...
2025-11-14 16:09:30,907 - INFO - Processing document 4_2024-10-03
2025-11-14 16:09:30,940 - INFO - Finished converting document 4_2024-10-03 in 0.06 sec.
2025-11-14 16:09:30,991 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:31,028 - INFO - Going to convert document batch...
2025-11-14 16:09:31,030 - INFO - Processing document 4_2024-10-09


Converted 'data\edgar_documents\CRM\4_2024-10-02' --> 'data\processed_data\CRM\4_2024-10-02.md'
Converted 'data\edgar_documents\CRM\4_2024-10-03' --> 'data\processed_data\CRM\4_2024-10-03.md'


2025-11-14 16:09:31,150 - INFO - Finished converting document 4_2024-10-09 in 0.17 sec.
2025-11-14 16:09:31,255 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:31,294 - INFO - Going to convert document batch...
2025-11-14 16:09:31,295 - INFO - Processing document 4_2024-10-16
2025-11-14 16:09:31,360 - INFO - Finished converting document 4_2024-10-16 in 0.12 sec.
2025-11-14 16:09:31,436 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-10-09' --> 'data\processed_data\CRM\4_2024-10-09.md'
Converted 'data\edgar_documents\CRM\4_2024-10-16' --> 'data\processed_data\CRM\4_2024-10-16.md'


2025-11-14 16:09:31,459 - INFO - Going to convert document batch...
2025-11-14 16:09:31,461 - INFO - Processing document 4_2024-10-22
2025-11-14 16:09:31,520 - INFO - Finished converting document 4_2024-10-22 in 0.09 sec.
2025-11-14 16:09:31,579 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:31,596 - INFO - Going to convert document batch...
2025-11-14 16:09:31,596 - INFO - Processing document 4_2024-10-23
2025-11-14 16:09:31,639 - INFO - Finished converting document 4_2024-10-23 in 0.08 sec.
2025-11-14 16:09:31,703 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:31,719 - INFO - Going to convert document batch...
2025-11-14 16:09:31,723 - INFO - Processing document 4_2024-10-25
2025-11-14 16:09:31,766 - INFO - Finished converting document 4_2024-10-25 in 0.09 sec.


Converted 'data\edgar_documents\CRM\4_2024-10-22' --> 'data\processed_data\CRM\4_2024-10-22.md'
Converted 'data\edgar_documents\CRM\4_2024-10-23' --> 'data\processed_data\CRM\4_2024-10-23.md'


2025-11-14 16:09:31,824 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:31,843 - INFO - Going to convert document batch...
2025-11-14 16:09:31,844 - INFO - Processing document 4_2024-10-30
2025-11-14 16:09:31,885 - INFO - Finished converting document 4_2024-10-30 in 0.09 sec.
2025-11-14 16:09:31,956 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:31,974 - INFO - Going to convert document batch...
2025-11-14 16:09:31,975 - INFO - Processing document 4_2024-11-04


Converted 'data\edgar_documents\CRM\4_2024-10-25' --> 'data\processed_data\CRM\4_2024-10-25.md'
Converted 'data\edgar_documents\CRM\4_2024-10-30' --> 'data\processed_data\CRM\4_2024-10-30.md'


2025-11-14 16:09:32,014 - INFO - Finished converting document 4_2024-11-04 in 0.08 sec.
2025-11-14 16:09:32,069 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:32,096 - INFO - Going to convert document batch...
2025-11-14 16:09:32,097 - INFO - Processing document 4_2024-11-06
2025-11-14 16:09:32,160 - INFO - Finished converting document 4_2024-11-06 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2024-11-04' --> 'data\processed_data\CRM\4_2024-11-04.md'
Converted 'data\edgar_documents\CRM\4_2024-11-06' --> 'data\processed_data\CRM\4_2024-11-06.md'


2025-11-14 16:09:32,249 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:32,275 - INFO - Going to convert document batch...
2025-11-14 16:09:32,277 - INFO - Processing document 4_2024-11-22
2025-11-14 16:09:32,370 - INFO - Finished converting document 4_2024-11-22 in 0.16 sec.
2025-11-14 16:09:32,441 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:32,460 - INFO - Going to convert document batch...
2025-11-14 16:09:32,461 - INFO - Processing document 4_2024-11-25
2025-11-14 16:09:32,512 - INFO - Finished converting document 4_2024-11-25 in 0.09 sec.
2025-11-14 16:09:32,613 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2024-11-22' --> 'data\processed_data\CRM\4_2024-11-22.md'
Converted 'data\edgar_documents\CRM\4_2024-11-25' --> 'data\processed_data\CRM\4_2024-11-25.md'


2025-11-14 16:09:32,638 - INFO - Going to convert document batch...
2025-11-14 16:09:32,640 - INFO - Processing document 4_2024-11-26
2025-11-14 16:09:32,677 - INFO - Finished converting document 4_2024-11-26 in 0.09 sec.
2025-11-14 16:09:32,751 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:32,800 - INFO - Going to convert document batch...
2025-11-14 16:09:32,801 - INFO - Processing document 4_2024-12-20
2025-11-14 16:09:32,927 - INFO - Finished converting document 4_2024-12-20 in 0.19 sec.


Converted 'data\edgar_documents\CRM\4_2024-11-26' --> 'data\processed_data\CRM\4_2024-11-26.md'


2025-11-14 16:09:33,102 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:33,158 - INFO - Going to convert document batch...
2025-11-14 16:09:33,159 - INFO - Processing document 4_2024-12-23
2025-11-14 16:09:33,228 - INFO - Finished converting document 4_2024-12-23 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2024-12-20' --> 'data\processed_data\CRM\4_2024-12-20.md'


2025-11-14 16:09:33,295 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:33,316 - INFO - Going to convert document batch...
2025-11-14 16:09:33,317 - INFO - Processing document 4_2024-12-26
2025-11-14 16:09:33,366 - INFO - Finished converting document 4_2024-12-26 in 0.08 sec.


Converted 'data\edgar_documents\CRM\4_2024-12-23' --> 'data\processed_data\CRM\4_2024-12-23.md'
Converted 'data\edgar_documents\CRM\4_2024-12-26' --> 'data\processed_data\CRM\4_2024-12-26.md'


2025-11-14 16:09:33,489 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:33,506 - INFO - Going to convert document batch...
2025-11-14 16:09:33,507 - INFO - Processing document 4_2024-12-27
2025-11-14 16:09:33,539 - INFO - Finished converting document 4_2024-12-27 in 0.08 sec.
2025-11-14 16:09:33,596 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:33,637 - INFO - Going to convert document batch...
2025-11-14 16:09:33,640 - INFO - Processing document 4_2025-01-03
2025-11-14 16:09:33,721 - INFO - Finished converting document 4_2025-01-03 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2024-12-27' --> 'data\processed_data\CRM\4_2024-12-27.md'
Converted 'data\edgar_documents\CRM\4_2025-01-03' --> 'data\processed_data\CRM\4_2025-01-03.md'


2025-11-14 16:09:33,817 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:33,840 - INFO - Going to convert document batch...
2025-11-14 16:09:33,841 - INFO - Processing document 4_2025-01-16
2025-11-14 16:09:33,886 - INFO - Finished converting document 4_2025-01-16 in 0.09 sec.
2025-11-14 16:09:33,955 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:33,978 - INFO - Going to convert document batch...
2025-11-14 16:09:33,979 - INFO - Processing document 4_2025-01-23
2025-11-14 16:09:34,039 - INFO - Finished converting document 4_2025-01-23 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2025-01-16' --> 'data\processed_data\CRM\4_2025-01-16.md'
Converted 'data\edgar_documents\CRM\4_2025-01-23' --> 'data\processed_data\CRM\4_2025-01-23.md'


2025-11-14 16:09:34,107 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:34,123 - INFO - Going to convert document batch...
2025-11-14 16:09:34,125 - INFO - Processing document 4_2025-02-03
2025-11-14 16:09:34,176 - INFO - Finished converting document 4_2025-02-03 in 0.09 sec.
2025-11-14 16:09:34,234 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:34,249 - INFO - Going to convert document batch...
2025-11-14 16:09:34,250 - INFO - Processing document 4_2025-02-04
2025-11-14 16:09:34,310 - INFO - Finished converting document 4_2025-02-04 in 0.09 sec.
2025-11-14 16:09:34,378 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:34,409 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2025-02-03' --> 'data\processed_data\CRM\4_2025-02-03.md'
Converted 'data\edgar_documents\CRM\4_2025-02-04' --> 'data\processed_data\CRM\4_2025-02-04.md'


2025-11-14 16:09:34,410 - INFO - Processing document 4_2025-02-19
2025-11-14 16:09:34,468 - INFO - Finished converting document 4_2025-02-19 in 0.11 sec.
2025-11-14 16:09:34,529 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:34,558 - INFO - Going to convert document batch...
2025-11-14 16:09:34,560 - INFO - Processing document 4_2025-02-24
2025-11-14 16:09:34,611 - INFO - Finished converting document 4_2025-02-24 in 0.09 sec.
2025-11-14 16:09:34,668 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:34,689 - INFO - Going to convert document batch...
2025-11-14 16:09:34,690 - INFO - Processing document 4_2025-02-25


Converted 'data\edgar_documents\CRM\4_2025-02-19' --> 'data\processed_data\CRM\4_2025-02-19.md'
Converted 'data\edgar_documents\CRM\4_2025-02-24' --> 'data\processed_data\CRM\4_2025-02-24.md'


2025-11-14 16:09:34,739 - INFO - Finished converting document 4_2025-02-25 in 0.08 sec.
2025-11-14 16:09:34,812 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:34,838 - INFO - Going to convert document batch...
2025-11-14 16:09:34,840 - INFO - Processing document 4_2025-02-26
2025-11-14 16:09:34,882 - INFO - Finished converting document 4_2025-02-26 in 0.08 sec.
2025-11-14 16:09:34,944 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:34,960 - INFO - Going to convert document batch...
2025-11-14 16:09:34,962 - INFO - Processing document 4_2025-03-03
2025-11-14 16:09:34,997 - INFO - Finished converting document 4_2025-03-03 in 0.08 sec.


Converted 'data\edgar_documents\CRM\4_2025-02-25' --> 'data\processed_data\CRM\4_2025-02-25.md'
Converted 'data\edgar_documents\CRM\4_2025-02-26' --> 'data\processed_data\CRM\4_2025-02-26.md'


2025-11-14 16:09:35,048 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:35,071 - INFO - Going to convert document batch...
2025-11-14 16:09:35,073 - INFO - Processing document 4_2025-03-04


Converted 'data\edgar_documents\CRM\4_2025-03-03' --> 'data\processed_data\CRM\4_2025-03-03.md'


2025-11-14 16:09:35,659 - INFO - Finished converting document 4_2025-03-04 in 0.62 sec.
2025-11-14 16:09:35,751 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:35,769 - INFO - Going to convert document batch...
2025-11-14 16:09:35,771 - INFO - Processing document 4_2025-03-17
2025-11-14 16:09:35,819 - INFO - Finished converting document 4_2025-03-17 in 0.09 sec.
2025-11-14 16:09:35,887 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:35,908 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2025-03-04' --> 'data\processed_data\CRM\4_2025-03-04.md'
Converted 'data\edgar_documents\CRM\4_2025-03-17' --> 'data\processed_data\CRM\4_2025-03-17.md'


2025-11-14 16:09:35,909 - INFO - Processing document 4_2025-03-18
2025-11-14 16:09:35,951 - INFO - Finished converting document 4_2025-03-18 in 0.09 sec.
2025-11-14 16:09:36,015 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:36,052 - INFO - Going to convert document batch...
2025-11-14 16:09:36,053 - INFO - Processing document 4_2025-03-25
2025-11-14 16:09:36,142 - INFO - Finished converting document 4_2025-03-25 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2025-03-18' --> 'data\processed_data\CRM\4_2025-03-18.md'


2025-11-14 16:09:36,228 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:36,244 - INFO - Going to convert document batch...
2025-11-14 16:09:36,245 - INFO - Processing document 4_2025-03-27
2025-11-14 16:09:36,304 - INFO - Finished converting document 4_2025-03-27 in 0.08 sec.
2025-11-14 16:09:36,369 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:36,386 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2025-03-25' --> 'data\processed_data\CRM\4_2025-03-25.md'
Converted 'data\edgar_documents\CRM\4_2025-03-27' --> 'data\processed_data\CRM\4_2025-03-27.md'


2025-11-14 16:09:36,387 - INFO - Processing document 4_2025-04-04
2025-11-14 16:09:36,422 - INFO - Finished converting document 4_2025-04-04 in 0.08 sec.
2025-11-14 16:09:36,472 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:36,496 - INFO - Going to convert document batch...
2025-11-14 16:09:36,497 - INFO - Processing document 4_2025-04-10
2025-11-14 16:09:36,544 - INFO - Finished converting document 4_2025-04-10 in 0.09 sec.
2025-11-14 16:09:36,621 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:36,647 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2025-04-04' --> 'data\processed_data\CRM\4_2025-04-04.md'
Converted 'data\edgar_documents\CRM\4_2025-04-10' --> 'data\processed_data\CRM\4_2025-04-10.md'


2025-11-14 16:09:36,649 - INFO - Processing document 4_2025-04-17
2025-11-14 16:09:36,711 - INFO - Finished converting document 4_2025-04-17 in 0.09 sec.
2025-11-14 16:09:36,788 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:36,820 - INFO - Going to convert document batch...
2025-11-14 16:09:36,821 - INFO - Processing document 4_2025-04-24
2025-11-14 16:09:36,889 - INFO - Finished converting document 4_2025-04-24 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2025-04-17' --> 'data\processed_data\CRM\4_2025-04-17.md'
Converted 'data\edgar_documents\CRM\4_2025-04-24' --> 'data\processed_data\CRM\4_2025-04-24.md'


2025-11-14 16:09:36,976 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:36,992 - INFO - Going to convert document batch...
2025-11-14 16:09:36,994 - INFO - Processing document 4_2025-05-05
2025-11-14 16:09:37,029 - INFO - Finished converting document 4_2025-05-05 in 0.09 sec.
2025-11-14 16:09:37,107 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:37,137 - INFO - Going to convert document batch...
2025-11-14 16:09:37,139 - INFO - Processing document 4_2025-05-15
2025-11-14 16:09:37,191 - INFO - Finished converting document 4_2025-05-15 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2025-05-05' --> 'data\processed_data\CRM\4_2025-05-05.md'
Converted 'data\edgar_documents\CRM\4_2025-05-15' --> 'data\processed_data\CRM\4_2025-05-15.md'


2025-11-14 16:09:37,281 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:37,313 - INFO - Going to convert document batch...
2025-11-14 16:09:37,316 - INFO - Processing document 4_2025-05-23
2025-11-14 16:09:37,389 - INFO - Finished converting document 4_2025-05-23 in 0.14 sec.
2025-11-14 16:09:37,491 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:37,520 - INFO - Going to convert document batch...
2025-11-14 16:09:37,522 - INFO - Processing document 4_2025-05-28
2025-11-14 16:09:37,594 - INFO - Finished converting document 4_2025-05-28 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2025-05-23' --> 'data\processed_data\CRM\4_2025-05-23.md'
Converted 'data\edgar_documents\CRM\4_2025-05-28' --> 'data\processed_data\CRM\4_2025-05-28.md'


2025-11-14 16:09:37,705 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:37,765 - INFO - Going to convert document batch...
2025-11-14 16:09:37,766 - INFO - Processing document 4_2025-06-24
2025-11-14 16:09:37,895 - INFO - Finished converting document 4_2025-06-24 in 0.22 sec.
2025-11-14 16:09:38,004 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:38,038 - INFO - Going to convert document batch...
2025-11-14 16:09:38,039 - INFO - Processing document 4_2025-07-01
2025-11-14 16:09:38,094 - INFO - Finished converting document 4_2025-07-01 in 0.11 sec.
2025-11-14 16:09:38,182 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2025-06-24' --> 'data\processed_data\CRM\4_2025-06-24.md'
Converted 'data\edgar_documents\CRM\4_2025-07-01' --> 'data\processed_data\CRM\4_2025-07-01.md'


2025-11-14 16:09:38,208 - INFO - Going to convert document batch...
2025-11-14 16:09:38,210 - INFO - Processing document 4_2025-07-03
2025-11-14 16:09:38,313 - INFO - Finished converting document 4_2025-07-03 in 0.16 sec.
2025-11-14 16:09:38,395 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:38,435 - INFO - Going to convert document batch...
2025-11-14 16:09:38,437 - INFO - Processing document 4_2025-07-07
2025-11-14 16:09:38,530 - INFO - Finished converting document 4_2025-07-07 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2025-07-03' --> 'data\processed_data\CRM\4_2025-07-03.md'


2025-11-14 16:09:38,648 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:38,676 - INFO - Going to convert document batch...
2025-11-14 16:09:38,677 - INFO - Processing document 4_2025-07-08
2025-11-14 16:09:38,757 - INFO - Finished converting document 4_2025-07-08 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2025-07-07' --> 'data\processed_data\CRM\4_2025-07-07.md'


2025-11-14 16:09:38,851 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:38,913 - INFO - Going to convert document batch...
2025-11-14 16:09:38,915 - INFO - Processing document 4_2025-07-09


Converted 'data\edgar_documents\CRM\4_2025-07-08' --> 'data\processed_data\CRM\4_2025-07-08.md'


2025-11-14 16:09:39,046 - INFO - Finished converting document 4_2025-07-09 in 0.22 sec.
2025-11-14 16:09:39,177 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:39,236 - INFO - Going to convert document batch...
2025-11-14 16:09:39,237 - INFO - Processing document 4_2025-07-10
2025-11-14 16:09:39,334 - INFO - Finished converting document 4_2025-07-10 in 0.17 sec.


Converted 'data\edgar_documents\CRM\4_2025-07-09' --> 'data\processed_data\CRM\4_2025-07-09.md'


2025-11-14 16:09:39,427 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:39,471 - INFO - Going to convert document batch...
2025-11-14 16:09:39,472 - INFO - Processing document 4_2025-07-11
2025-11-14 16:09:39,564 - INFO - Finished converting document 4_2025-07-11 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2025-07-10' --> 'data\processed_data\CRM\4_2025-07-10.md'


2025-11-14 16:09:39,642 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:39,670 - INFO - Going to convert document batch...
2025-11-14 16:09:39,671 - INFO - Processing document 4_2025-07-14
2025-11-14 16:09:39,734 - INFO - Finished converting document 4_2025-07-14 in 0.11 sec.
2025-11-14 16:09:39,822 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2025-07-11' --> 'data\processed_data\CRM\4_2025-07-11.md'
Converted 'data\edgar_documents\CRM\4_2025-07-14' --> 'data\processed_data\CRM\4_2025-07-14.md'


2025-11-14 16:09:39,860 - INFO - Going to convert document batch...
2025-11-14 16:09:39,861 - INFO - Processing document 4_2025-07-15
2025-11-14 16:09:39,941 - INFO - Finished converting document 4_2025-07-15 in 0.14 sec.
2025-11-14 16:09:40,021 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:40,063 - INFO - Going to convert document batch...
2025-11-14 16:09:40,066 - INFO - Processing document 4_2025-07-16
2025-11-14 16:09:40,166 - INFO - Finished converting document 4_2025-07-16 in 0.17 sec.


Converted 'data\edgar_documents\CRM\4_2025-07-15' --> 'data\processed_data\CRM\4_2025-07-15.md'


2025-11-14 16:09:40,307 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:40,388 - INFO - Going to convert document batch...
2025-11-14 16:09:40,390 - INFO - Processing document 4_2025-07-17
2025-11-14 16:09:40,485 - INFO - Finished converting document 4_2025-07-17 in 0.20 sec.


Converted 'data\edgar_documents\CRM\4_2025-07-16' --> 'data\processed_data\CRM\4_2025-07-16.md'


2025-11-14 16:09:40,562 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:40,586 - INFO - Going to convert document batch...
2025-11-14 16:09:40,587 - INFO - Processing document 4_2025-07-18
2025-11-14 16:09:40,647 - INFO - Finished converting document 4_2025-07-18 in 0.09 sec.


Converted 'data\edgar_documents\CRM\4_2025-07-17' --> 'data\processed_data\CRM\4_2025-07-17.md'
Converted 'data\edgar_documents\CRM\4_2025-07-18' --> 'data\processed_data\CRM\4_2025-07-18.md'


2025-11-14 16:09:40,728 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:40,762 - INFO - Going to convert document batch...
2025-11-14 16:09:40,763 - INFO - Processing document 4_2025-07-21
2025-11-14 16:09:40,852 - INFO - Finished converting document 4_2025-07-21 in 0.14 sec.
2025-11-14 16:09:40,939 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:40,972 - INFO - Going to convert document batch...
2025-11-14 16:09:40,973 - INFO - Processing document 4_2025-07-22
2025-11-14 16:09:41,053 - INFO - Finished converting document 4_2025-07-22 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2025-07-21' --> 'data\processed_data\CRM\4_2025-07-21.md'


2025-11-14 16:09:41,134 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:41,155 - INFO - Going to convert document batch...
2025-11-14 16:09:41,156 - INFO - Processing document 4_2025-07-23
2025-11-14 16:09:41,211 - INFO - Finished converting document 4_2025-07-23 in 0.08 sec.
2025-11-14 16:09:41,292 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:41,319 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CRM\4_2025-07-22' --> 'data\processed_data\CRM\4_2025-07-22.md'
Converted 'data\edgar_documents\CRM\4_2025-07-23' --> 'data\processed_data\CRM\4_2025-07-23.md'


2025-11-14 16:09:41,321 - INFO - Processing document 4_2025-07-24
2025-11-14 16:09:41,401 - INFO - Finished converting document 4_2025-07-24 in 0.14 sec.
2025-11-14 16:09:41,497 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:41,529 - INFO - Going to convert document batch...
2025-11-14 16:09:41,530 - INFO - Processing document 4_2025-07-25
2025-11-14 16:09:41,584 - INFO - Finished converting document 4_2025-07-25 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2025-07-24' --> 'data\processed_data\CRM\4_2025-07-24.md'
Converted 'data\edgar_documents\CRM\4_2025-07-25' --> 'data\processed_data\CRM\4_2025-07-25.md'


2025-11-14 16:09:41,675 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:41,716 - INFO - Going to convert document batch...
2025-11-14 16:09:41,720 - INFO - Processing document 4_2025-07-28
2025-11-14 16:09:41,786 - INFO - Finished converting document 4_2025-07-28 in 0.14 sec.
2025-11-14 16:09:41,856 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:41,888 - INFO - Going to convert document batch...
2025-11-14 16:09:41,889 - INFO - Processing document 4_2025-07-29
2025-11-14 16:09:41,969 - INFO - Finished converting document 4_2025-07-29 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2025-07-28' --> 'data\processed_data\CRM\4_2025-07-28.md'
Converted 'data\edgar_documents\CRM\4_2025-07-29' --> 'data\processed_data\CRM\4_2025-07-29.md'


2025-11-14 16:09:42,072 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:42,105 - INFO - Going to convert document batch...
2025-11-14 16:09:42,106 - INFO - Processing document 4_2025-07-30
2025-11-14 16:09:42,201 - INFO - Finished converting document 4_2025-07-30 in 0.16 sec.
2025-11-14 16:09:42,312 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:42,343 - INFO - Going to convert document batch...
2025-11-14 16:09:42,344 - INFO - Processing document 4_2025-07-31
2025-11-14 16:09:42,436 - INFO - Finished converting document 4_2025-07-31 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2025-07-30' --> 'data\processed_data\CRM\4_2025-07-30.md'


2025-11-14 16:09:42,536 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:42,566 - INFO - Going to convert document batch...
2025-11-14 16:09:42,567 - INFO - Processing document 4_2025-08-01
2025-11-14 16:09:42,639 - INFO - Finished converting document 4_2025-08-01 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2025-07-31' --> 'data\processed_data\CRM\4_2025-07-31.md'


2025-11-14 16:09:42,758 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:42,786 - INFO - Going to convert document batch...
2025-11-14 16:09:42,787 - INFO - Processing document 4_2025-08-04


Converted 'data\edgar_documents\CRM\4_2025-08-01' --> 'data\processed_data\CRM\4_2025-08-01.md'


2025-11-14 16:09:43,434 - INFO - Finished converting document 4_2025-08-04 in 0.70 sec.
2025-11-14 16:09:43,519 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:43,544 - INFO - Going to convert document batch...
2025-11-14 16:09:43,545 - INFO - Processing document 4_2025-08-05
2025-11-14 16:09:43,604 - INFO - Finished converting document 4_2025-08-05 in 0.11 sec.
2025-11-14 16:09:43,671 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2025-08-04' --> 'data\processed_data\CRM\4_2025-08-04.md'
Converted 'data\edgar_documents\CRM\4_2025-08-05' --> 'data\processed_data\CRM\4_2025-08-05.md'


2025-11-14 16:09:43,711 - INFO - Going to convert document batch...
2025-11-14 16:09:43,714 - INFO - Processing document 4_2025-08-06
2025-11-14 16:09:43,803 - INFO - Finished converting document 4_2025-08-06 in 0.14 sec.
2025-11-14 16:09:43,928 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:43,967 - INFO - Going to convert document batch...
2025-11-14 16:09:43,968 - INFO - Processing document 4_2025-08-07
2025-11-14 16:09:44,044 - INFO - Finished converting document 4_2025-08-07 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2025-08-06' --> 'data\processed_data\CRM\4_2025-08-06.md'


2025-11-14 16:09:44,141 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:44,299 - INFO - Going to convert document batch...
2025-11-14 16:09:44,303 - INFO - Processing document 4_2025-08-08


Converted 'data\edgar_documents\CRM\4_2025-08-07' --> 'data\processed_data\CRM\4_2025-08-07.md'


2025-11-14 16:09:44,488 - INFO - Finished converting document 4_2025-08-08 in 0.36 sec.
2025-11-14 16:09:44,590 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:44,634 - INFO - Going to convert document batch...
2025-11-14 16:09:44,636 - INFO - Processing document 4_2025-08-11
2025-11-14 16:09:44,737 - INFO - Finished converting document 4_2025-08-11 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2025-08-08' --> 'data\processed_data\CRM\4_2025-08-08.md'


2025-11-14 16:09:44,873 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:44,939 - INFO - Going to convert document batch...
2025-11-14 16:09:44,941 - INFO - Processing document 4_2025-08-12


Converted 'data\edgar_documents\CRM\4_2025-08-11' --> 'data\processed_data\CRM\4_2025-08-11.md'


2025-11-14 16:09:45,090 - INFO - Finished converting document 4_2025-08-12 in 0.25 sec.
2025-11-14 16:09:45,232 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:45,274 - INFO - Going to convert document batch...
2025-11-14 16:09:45,276 - INFO - Processing document 4_2025-08-13
2025-11-14 16:09:45,361 - INFO - Finished converting document 4_2025-08-13 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2025-08-12' --> 'data\processed_data\CRM\4_2025-08-12.md'


2025-11-14 16:09:45,484 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:45,596 - INFO - Going to convert document batch...
2025-11-14 16:09:45,601 - INFO - Processing document 4_2025-08-14


Converted 'data\edgar_documents\CRM\4_2025-08-13' --> 'data\processed_data\CRM\4_2025-08-13.md'


2025-11-14 16:09:45,736 - INFO - Finished converting document 4_2025-08-14 in 0.26 sec.
2025-11-14 16:09:45,817 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:45,847 - INFO - Going to convert document batch...
2025-11-14 16:09:45,849 - INFO - Processing document 4_2025-08-15
2025-11-14 16:09:45,916 - INFO - Finished converting document 4_2025-08-15 in 0.12 sec.
2025-11-14 16:09:46,005 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2025-08-14' --> 'data\processed_data\CRM\4_2025-08-14.md'
Converted 'data\edgar_documents\CRM\4_2025-08-15' --> 'data\processed_data\CRM\4_2025-08-15.md'


2025-11-14 16:09:46,050 - INFO - Going to convert document batch...
2025-11-14 16:09:46,052 - INFO - Processing document 4_2025-08-18
2025-11-14 16:09:46,288 - INFO - Finished converting document 4_2025-08-18 in 0.31 sec.
2025-11-14 16:09:46,420 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:46,467 - INFO - Going to convert document batch...
2025-11-14 16:09:46,469 - INFO - Processing document 4_2025-08-19
2025-11-14 16:09:46,586 - INFO - Finished converting document 4_2025-08-19 in 0.17 sec.


Converted 'data\edgar_documents\CRM\4_2025-08-18' --> 'data\processed_data\CRM\4_2025-08-18.md'


2025-11-14 16:09:46,708 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:46,754 - INFO - Going to convert document batch...
2025-11-14 16:09:46,756 - INFO - Processing document 4_2025-08-20
2025-11-14 16:09:46,835 - INFO - Finished converting document 4_2025-08-20 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2025-08-19' --> 'data\processed_data\CRM\4_2025-08-19.md'


2025-11-14 16:09:46,938 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:46,975 - INFO - Going to convert document batch...
2025-11-14 16:09:46,977 - INFO - Processing document 4_2025-08-21
2025-11-14 16:09:47,052 - INFO - Finished converting document 4_2025-08-21 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2025-08-20' --> 'data\processed_data\CRM\4_2025-08-20.md'
Converted 'data\edgar_documents\CRM\4_2025-08-21' --> 'data\processed_data\CRM\4_2025-08-21.md'


2025-11-14 16:09:47,149 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:47,198 - INFO - Going to convert document batch...
2025-11-14 16:09:47,200 - INFO - Processing document 4_2025-08-22
2025-11-14 16:09:47,305 - INFO - Finished converting document 4_2025-08-22 in 0.19 sec.
2025-11-14 16:09:47,402 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:47,421 - INFO - Going to convert document batch...
2025-11-14 16:09:47,422 - INFO - Processing document 4_2025-08-25
2025-11-14 16:09:47,462 - INFO - Finished converting document 4_2025-08-25 in 0.08 sec.
2025-11-14 16:09:47,514 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:47,555 - INFO - Going to convert document batch...
2025-11-14 16:09:47,556 - INFO - Processing document 4_2025-08-26


Converted 'data\edgar_documents\CRM\4_2025-08-22' --> 'data\processed_data\CRM\4_2025-08-22.md'
Converted 'data\edgar_documents\CRM\4_2025-08-25' --> 'data\processed_data\CRM\4_2025-08-25.md'


2025-11-14 16:09:47,666 - INFO - Finished converting document 4_2025-08-26 in 0.17 sec.
2025-11-14 16:09:47,771 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:47,820 - INFO - Going to convert document batch...
2025-11-14 16:09:47,822 - INFO - Processing document 4_2025-08-27
2025-11-14 16:09:47,923 - INFO - Finished converting document 4_2025-08-27 in 0.17 sec.


Converted 'data\edgar_documents\CRM\4_2025-08-26' --> 'data\processed_data\CRM\4_2025-08-26.md'


2025-11-14 16:09:48,033 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:48,057 - INFO - Going to convert document batch...
2025-11-14 16:09:48,059 - INFO - Processing document 4_2025-08-28
2025-11-14 16:09:48,154 - INFO - Finished converting document 4_2025-08-28 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2025-08-27' --> 'data\processed_data\CRM\4_2025-08-27.md'


2025-11-14 16:09:48,272 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:48,322 - INFO - Going to convert document batch...
2025-11-14 16:09:48,324 - INFO - Processing document 4_2025-08-29
2025-11-14 16:09:48,393 - INFO - Finished converting document 4_2025-08-29 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2025-08-28' --> 'data\processed_data\CRM\4_2025-08-28.md'


2025-11-14 16:09:48,477 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:48,550 - INFO - Going to convert document batch...
2025-11-14 16:09:48,553 - INFO - Processing document 4_2025-09-02


Converted 'data\edgar_documents\CRM\4_2025-08-29' --> 'data\processed_data\CRM\4_2025-08-29.md'


2025-11-14 16:09:48,718 - INFO - Finished converting document 4_2025-09-02 in 0.25 sec.
2025-11-14 16:09:48,814 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:48,865 - INFO - Going to convert document batch...
2025-11-14 16:09:48,867 - INFO - Processing document 4_2025-09-03


Converted 'data\edgar_documents\CRM\4_2025-09-02' --> 'data\processed_data\CRM\4_2025-09-02.md'


2025-11-14 16:09:48,993 - INFO - Finished converting document 4_2025-09-03 in 0.20 sec.
2025-11-14 16:09:49,123 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:49,166 - INFO - Going to convert document batch...
2025-11-14 16:09:49,167 - INFO - Processing document 4_2025-09-04
2025-11-14 16:09:49,290 - INFO - Finished converting document 4_2025-09-04 in 0.19 sec.


Converted 'data\edgar_documents\CRM\4_2025-09-03' --> 'data\processed_data\CRM\4_2025-09-03.md'


2025-11-14 16:09:49,398 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:49,460 - INFO - Going to convert document batch...
2025-11-14 16:09:49,462 - INFO - Processing document 4_2025-09-05
2025-11-14 16:09:49,587 - INFO - Finished converting document 4_2025-09-05 in 0.19 sec.


Converted 'data\edgar_documents\CRM\4_2025-09-04' --> 'data\processed_data\CRM\4_2025-09-04.md'


2025-11-14 16:09:49,667 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:49,711 - INFO - Going to convert document batch...
2025-11-14 16:09:49,713 - INFO - Processing document 4_2025-09-08
2025-11-14 16:09:49,825 - INFO - Finished converting document 4_2025-09-08 in 0.17 sec.


Converted 'data\edgar_documents\CRM\4_2025-09-05' --> 'data\processed_data\CRM\4_2025-09-05.md'


2025-11-14 16:09:49,940 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:49,986 - INFO - Going to convert document batch...
2025-11-14 16:09:49,987 - INFO - Processing document 4_2025-09-09
2025-11-14 16:09:50,100 - INFO - Finished converting document 4_2025-09-09 in 0.19 sec.


Converted 'data\edgar_documents\CRM\4_2025-09-08' --> 'data\processed_data\CRM\4_2025-09-08.md'


2025-11-14 16:09:50,213 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:50,244 - INFO - Going to convert document batch...
2025-11-14 16:09:50,245 - INFO - Processing document 4_2025-09-10
2025-11-14 16:09:50,306 - INFO - Finished converting document 4_2025-09-10 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2025-09-09' --> 'data\processed_data\CRM\4_2025-09-09.md'
Converted 'data\edgar_documents\CRM\4_2025-09-10' --> 'data\processed_data\CRM\4_2025-09-10.md'


2025-11-14 16:09:50,411 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:50,473 - INFO - Going to convert document batch...
2025-11-14 16:09:50,475 - INFO - Processing document 4_2025-09-11
2025-11-14 16:09:50,599 - INFO - Finished converting document 4_2025-09-11 in 0.24 sec.
2025-11-14 16:09:50,676 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:50,702 - INFO - Going to convert document batch...
2025-11-14 16:09:50,703 - INFO - Processing document 4_2025-09-12
2025-11-14 16:09:50,769 - INFO - Finished converting document 4_2025-09-12 in 0.11 sec.
2025-11-14 16:09:50,857 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2025-09-11' --> 'data\processed_data\CRM\4_2025-09-11.md'
Converted 'data\edgar_documents\CRM\4_2025-09-12' --> 'data\processed_data\CRM\4_2025-09-12.md'


2025-11-14 16:09:50,899 - INFO - Going to convert document batch...
2025-11-14 16:09:50,901 - INFO - Processing document 4_2025-09-15
2025-11-14 16:09:51,011 - INFO - Finished converting document 4_2025-09-15 in 0.19 sec.
2025-11-14 16:09:51,118 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2025-09-15' --> 'data\processed_data\CRM\4_2025-09-15.md'


2025-11-14 16:09:51,630 - INFO - Going to convert document batch...
2025-11-14 16:09:51,632 - INFO - Processing document 4_2025-09-16
2025-11-14 16:09:51,702 - INFO - Finished converting document 4_2025-09-16 in 0.59 sec.
2025-11-14 16:09:51,770 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:51,818 - INFO - Going to convert document batch...
2025-11-14 16:09:51,819 - INFO - Processing document 4_2025-09-17
2025-11-14 16:09:51,902 - INFO - Finished converting document 4_2025-09-17 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2025-09-16' --> 'data\processed_data\CRM\4_2025-09-16.md'


2025-11-14 16:09:51,986 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:52,006 - INFO - Going to convert document batch...
2025-11-14 16:09:52,008 - INFO - Processing document 4_2025-09-18
2025-11-14 16:09:52,071 - INFO - Finished converting document 4_2025-09-18 in 0.09 sec.
2025-11-14 16:09:52,149 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2025-09-17' --> 'data\processed_data\CRM\4_2025-09-17.md'
Converted 'data\edgar_documents\CRM\4_2025-09-18' --> 'data\processed_data\CRM\4_2025-09-18.md'


2025-11-14 16:09:52,187 - INFO - Going to convert document batch...
2025-11-14 16:09:52,188 - INFO - Processing document 4_2025-09-19
2025-11-14 16:09:52,282 - INFO - Finished converting document 4_2025-09-19 in 0.14 sec.
2025-11-14 16:09:52,402 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:52,438 - INFO - Going to convert document batch...
2025-11-14 16:09:52,439 - INFO - Processing document 4_2025-09-22
2025-11-14 16:09:52,539 - INFO - Finished converting document 4_2025-09-22 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2025-09-19' --> 'data\processed_data\CRM\4_2025-09-19.md'


2025-11-14 16:09:52,625 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:52,669 - INFO - Going to convert document batch...
2025-11-14 16:09:52,671 - INFO - Processing document 4_2025-09-23
2025-11-14 16:09:52,748 - INFO - Finished converting document 4_2025-09-23 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2025-09-22' --> 'data\processed_data\CRM\4_2025-09-22.md'
Converted 'data\edgar_documents\CRM\4_2025-09-23' --> 'data\processed_data\CRM\4_2025-09-23.md'


2025-11-14 16:09:52,826 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:52,860 - INFO - Going to convert document batch...
2025-11-14 16:09:52,861 - INFO - Processing document 4_2025-09-24
2025-11-14 16:09:52,931 - INFO - Finished converting document 4_2025-09-24 in 0.12 sec.
2025-11-14 16:09:53,082 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:53,132 - INFO - Going to convert document batch...
2025-11-14 16:09:53,133 - INFO - Processing document 4_2025-09-25


Converted 'data\edgar_documents\CRM\4_2025-09-24' --> 'data\processed_data\CRM\4_2025-09-24.md'


2025-11-14 16:09:53,226 - INFO - Finished converting document 4_2025-09-25 in 0.20 sec.
2025-11-14 16:09:53,307 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:53,339 - INFO - Going to convert document batch...
2025-11-14 16:09:53,340 - INFO - Processing document 4_2025-09-26
2025-11-14 16:09:53,418 - INFO - Finished converting document 4_2025-09-26 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2025-09-25' --> 'data\processed_data\CRM\4_2025-09-25.md'
Converted 'data\edgar_documents\CRM\4_2025-09-26' --> 'data\processed_data\CRM\4_2025-09-26.md'


2025-11-14 16:09:53,503 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:53,534 - INFO - Going to convert document batch...
2025-11-14 16:09:53,535 - INFO - Processing document 4_2025-09-29
2025-11-14 16:09:53,612 - INFO - Finished converting document 4_2025-09-29 in 0.14 sec.
2025-11-14 16:09:53,732 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:53,770 - INFO - Going to convert document batch...
2025-11-14 16:09:53,771 - INFO - Processing document 4_2025-09-30
2025-11-14 16:09:53,863 - INFO - Finished converting document 4_2025-09-30 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2025-09-29' --> 'data\processed_data\CRM\4_2025-09-29.md'
Converted 'data\edgar_documents\CRM\4_2025-09-30' --> 'data\processed_data\CRM\4_2025-09-30.md'


2025-11-14 16:09:53,943 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:53,982 - INFO - Going to convert document batch...
2025-11-14 16:09:53,984 - INFO - Processing document 4_2025-10-01
2025-11-14 16:09:54,094 - INFO - Finished converting document 4_2025-10-01 in 0.19 sec.
2025-11-14 16:09:54,175 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:54,211 - INFO - Going to convert document batch...
2025-11-14 16:09:54,212 - INFO - Processing document 4_2025-10-02
2025-11-14 16:09:54,323 - INFO - Finished converting document 4_2025-10-02 in 0.17 sec.


Converted 'data\edgar_documents\CRM\4_2025-10-01' --> 'data\processed_data\CRM\4_2025-10-01.md'


2025-11-14 16:09:54,430 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:54,457 - INFO - Going to convert document batch...
2025-11-14 16:09:54,459 - INFO - Processing document 4_2025-10-03
2025-11-14 16:09:54,533 - INFO - Finished converting document 4_2025-10-03 in 0.11 sec.
2025-11-14 16:09:54,619 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2025-10-02' --> 'data\processed_data\CRM\4_2025-10-02.md'
Converted 'data\edgar_documents\CRM\4_2025-10-03' --> 'data\processed_data\CRM\4_2025-10-03.md'


2025-11-14 16:09:54,644 - INFO - Going to convert document batch...
2025-11-14 16:09:54,645 - INFO - Processing document 4_2025-10-06
2025-11-14 16:09:54,706 - INFO - Finished converting document 4_2025-10-06 in 0.11 sec.
2025-11-14 16:09:54,899 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:54,933 - INFO - Going to convert document batch...
2025-11-14 16:09:54,934 - INFO - Processing document 4_2025-10-07
2025-11-14 16:09:55,026 - INFO - Finished converting document 4_2025-10-07 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2025-10-06' --> 'data\processed_data\CRM\4_2025-10-06.md'


2025-11-14 16:09:55,157 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:55,215 - INFO - Going to convert document batch...
2025-11-14 16:09:55,217 - INFO - Processing document 4_2025-10-08


Converted 'data\edgar_documents\CRM\4_2025-10-07' --> 'data\processed_data\CRM\4_2025-10-07.md'


2025-11-14 16:09:55,366 - INFO - Finished converting document 4_2025-10-08 in 0.22 sec.
2025-11-14 16:09:55,577 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:55,644 - INFO - Going to convert document batch...
2025-11-14 16:09:55,645 - INFO - Processing document 4_2025-10-09


Converted 'data\edgar_documents\CRM\4_2025-10-08' --> 'data\processed_data\CRM\4_2025-10-08.md'


2025-11-14 16:09:55,721 - INFO - Finished converting document 4_2025-10-09 in 0.20 sec.
2025-11-14 16:09:55,810 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:55,843 - INFO - Going to convert document batch...
2025-11-14 16:09:55,844 - INFO - Processing document 4_2025-10-10
2025-11-14 16:09:55,911 - INFO - Finished converting document 4_2025-10-10 in 0.11 sec.


Converted 'data\edgar_documents\CRM\4_2025-10-09' --> 'data\processed_data\CRM\4_2025-10-09.md'
Converted 'data\edgar_documents\CRM\4_2025-10-10' --> 'data\processed_data\CRM\4_2025-10-10.md'


2025-11-14 16:09:56,005 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:56,053 - INFO - Going to convert document batch...
2025-11-14 16:09:56,054 - INFO - Processing document 4_2025-10-14
2025-11-14 16:09:56,196 - INFO - Finished converting document 4_2025-10-14 in 0.20 sec.
2025-11-14 16:09:56,306 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:56,335 - INFO - Going to convert document batch...
2025-11-14 16:09:56,336 - INFO - Processing document 4_2025-10-15
2025-11-14 16:09:56,436 - INFO - Finished converting document 4_2025-10-15 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2025-10-14' --> 'data\processed_data\CRM\4_2025-10-14.md'


2025-11-14 16:09:56,584 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:56,622 - INFO - Going to convert document batch...
2025-11-14 16:09:56,623 - INFO - Processing document 4_2025-10-16
2025-11-14 16:09:56,700 - INFO - Finished converting document 4_2025-10-16 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2025-10-15' --> 'data\processed_data\CRM\4_2025-10-15.md'


2025-11-14 16:09:56,770 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:56,807 - INFO - Going to convert document batch...
2025-11-14 16:09:56,809 - INFO - Processing document 4_2025-10-17
2025-11-14 16:09:56,891 - INFO - Finished converting document 4_2025-10-17 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2025-10-16' --> 'data\processed_data\CRM\4_2025-10-16.md'


2025-11-14 16:09:57,003 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:57,045 - INFO - Going to convert document batch...
2025-11-14 16:09:57,046 - INFO - Processing document 4_2025-10-20
2025-11-14 16:09:57,136 - INFO - Finished converting document 4_2025-10-20 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2025-10-17' --> 'data\processed_data\CRM\4_2025-10-17.md'


2025-11-14 16:09:57,230 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:57,261 - INFO - Going to convert document batch...
2025-11-14 16:09:57,262 - INFO - Processing document 4_2025-10-21
2025-11-14 16:09:57,354 - INFO - Finished converting document 4_2025-10-21 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2025-10-20' --> 'data\processed_data\CRM\4_2025-10-20.md'
Converted 'data\edgar_documents\CRM\4_2025-10-21' --> 'data\processed_data\CRM\4_2025-10-21.md'


2025-11-14 16:09:57,457 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:57,497 - INFO - Going to convert document batch...
2025-11-14 16:09:57,498 - INFO - Processing document 4_2025-10-22
2025-11-14 16:09:57,673 - INFO - Finished converting document 4_2025-10-22 in 0.25 sec.
2025-11-14 16:09:57,780 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:57,811 - INFO - Going to convert document batch...
2025-11-14 16:09:57,813 - INFO - Processing document 4_2025-10-23
2025-11-14 16:09:57,878 - INFO - Finished converting document 4_2025-10-23 in 0.12 sec.
2025-11-14 16:09:57,949 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\4_2025-10-22' --> 'data\processed_data\CRM\4_2025-10-22.md'
Converted 'data\edgar_documents\CRM\4_2025-10-23' --> 'data\processed_data\CRM\4_2025-10-23.md'


2025-11-14 16:09:58,482 - INFO - Going to convert document batch...
2025-11-14 16:09:58,484 - INFO - Processing document 4_2025-10-24
2025-11-14 16:09:58,577 - INFO - Finished converting document 4_2025-10-24 in 0.66 sec.
2025-11-14 16:09:58,655 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:58,690 - INFO - Going to convert document batch...
2025-11-14 16:09:58,692 - INFO - Processing document 4_2025-10-27
2025-11-14 16:09:58,788 - INFO - Finished converting document 4_2025-10-27 in 0.16 sec.


Converted 'data\edgar_documents\CRM\4_2025-10-24' --> 'data\processed_data\CRM\4_2025-10-24.md'


2025-11-14 16:09:58,891 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:58,932 - INFO - Going to convert document batch...
2025-11-14 16:09:58,934 - INFO - Processing document 4_2025-10-28


Converted 'data\edgar_documents\CRM\4_2025-10-27' --> 'data\processed_data\CRM\4_2025-10-27.md'


2025-11-14 16:09:59,084 - INFO - Finished converting document 4_2025-10-28 in 0.22 sec.
2025-11-14 16:09:59,166 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:59,196 - INFO - Going to convert document batch...
2025-11-14 16:09:59,198 - INFO - Processing document 4_2025-10-29
2025-11-14 16:09:59,263 - INFO - Finished converting document 4_2025-10-29 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2025-10-28' --> 'data\processed_data\CRM\4_2025-10-28.md'
Converted 'data\edgar_documents\CRM\4_2025-10-29' --> 'data\processed_data\CRM\4_2025-10-29.md'


2025-11-14 16:09:59,340 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:59,392 - INFO - Going to convert document batch...
2025-11-14 16:09:59,394 - INFO - Processing document 4_2025-10-30
2025-11-14 16:09:59,484 - INFO - Finished converting document 4_2025-10-30 in 0.16 sec.
2025-11-14 16:09:59,549 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:59,592 - INFO - Going to convert document batch...
2025-11-14 16:09:59,594 - INFO - Processing document 4_2025-10-31
2025-11-14 16:09:59,680 - INFO - Finished converting document 4_2025-10-31 in 0.14 sec.


Converted 'data\edgar_documents\CRM\4_2025-10-30' --> 'data\processed_data\CRM\4_2025-10-30.md'


2025-11-14 16:09:59,801 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:09:59,852 - INFO - Going to convert document batch...
2025-11-14 16:09:59,853 - INFO - Processing document 4_2025-11-03
2025-11-14 16:09:59,956 - INFO - Finished converting document 4_2025-11-03 in 0.17 sec.


Converted 'data\edgar_documents\CRM\4_2025-10-31' --> 'data\processed_data\CRM\4_2025-10-31.md'


2025-11-14 16:10:00,047 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:00,072 - INFO - Going to convert document batch...
2025-11-14 16:10:00,074 - INFO - Processing document 4_2025-11-04
2025-11-14 16:10:00,138 - INFO - Finished converting document 4_2025-11-04 in 0.12 sec.


Converted 'data\edgar_documents\CRM\4_2025-11-03' --> 'data\processed_data\CRM\4_2025-11-03.md'
Converted 'data\edgar_documents\CRM\4_2025-11-04' --> 'data\processed_data\CRM\4_2025-11-04.md'


2025-11-14 16:10:00,240 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:00,282 - INFO - Going to convert document batch...
2025-11-14 16:10:00,283 - INFO - Processing document 8-K_2023-01-04
2025-11-14 16:10:00,331 - INFO - Finished converting document 8-K_2023-01-04 in 0.12 sec.
2025-11-14 16:10:00,364 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:00,389 - INFO - Going to convert document batch...
2025-11-14 16:10:00,391 - INFO - Processing document 8-K_2023-01-27
2025-11-14 16:10:00,434 - INFO - Finished converting document 8-K_2023-01-27 in 0.09 sec.
2025-11-14 16:10:00,493 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:00,516 - INFO - Going to convert document batch...
2025-11-14 16:10:00,517 - INFO - Processing document 8-K_2023-03-01
2025-11-14 16:10:00,550 - INFO - Finished converting document 8-K_2023-03-01 in 0.09 sec.


Converted 'data\edgar_documents\CRM\8-K_2023-01-04' --> 'data\processed_data\CRM\8-K_2023-01-04.md'
Converted 'data\edgar_documents\CRM\8-K_2023-01-27' --> 'data\processed_data\CRM\8-K_2023-01-27.md'


2025-11-14 16:10:00,583 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:00,609 - INFO - Going to convert document batch...
2025-11-14 16:10:00,610 - INFO - Processing document 8-K_2023-05-31
2025-11-14 16:10:00,650 - INFO - Finished converting document 8-K_2023-05-31 in 0.08 sec.
2025-11-14 16:10:00,705 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\8-K_2023-03-01' --> 'data\processed_data\CRM\8-K_2023-03-01.md'
Converted 'data\edgar_documents\CRM\8-K_2023-05-31' --> 'data\processed_data\CRM\8-K_2023-05-31.md'


2025-11-14 16:10:00,793 - INFO - Going to convert document batch...
2025-11-14 16:10:00,794 - INFO - Processing document 8-K_2023-06-12
2025-11-14 16:10:00,884 - INFO - Finished converting document 8-K_2023-06-12 in 0.20 sec.
2025-11-14 16:10:00,961 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:01,010 - INFO - Going to convert document batch...
2025-11-14 16:10:01,012 - INFO - Processing document 8-K_2023-08-30
2025-11-14 16:10:01,051 - INFO - Finished converting document 8-K_2023-08-30 in 0.12 sec.
2025-11-14 16:10:01,088 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\8-K_2023-06-12' --> 'data\processed_data\CRM\8-K_2023-06-12.md'
Converted 'data\edgar_documents\CRM\8-K_2023-08-30' --> 'data\processed_data\CRM\8-K_2023-08-30.md'


2025-11-14 16:10:01,121 - INFO - Going to convert document batch...
2025-11-14 16:10:01,123 - INFO - Processing document 8-K_2023-11-29
2025-11-14 16:10:01,164 - INFO - Finished converting document 8-K_2023-11-29 in 0.09 sec.
2025-11-14 16:10:01,197 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:01,214 - INFO - Going to convert document batch...
2025-11-14 16:10:01,215 - INFO - Processing document 8-K_2024-02-28
2025-11-14 16:10:01,249 - INFO - Finished converting document 8-K_2024-02-28 in 0.06 sec.
2025-11-14 16:10:01,301 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:01,332 - INFO - Going to convert document batch...
2025-11-14 16:10:01,334 - INFO - Processing document 8-K_2024-05-29
2025-11-14 16:10:01,379 - INFO - Finished converting document 8-K_2024-05-29 in 0.09 sec.


Converted 'data\edgar_documents\CRM\8-K_2023-11-29' --> 'data\processed_data\CRM\8-K_2023-11-29.md'
Converted 'data\edgar_documents\CRM\8-K_2024-02-28' --> 'data\processed_data\CRM\8-K_2024-02-28.md'


2025-11-14 16:10:01,417 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:01,488 - INFO - Going to convert document batch...
2025-11-14 16:10:01,490 - INFO - Processing document 8-K_2024-07-01


Converted 'data\edgar_documents\CRM\8-K_2024-05-29' --> 'data\processed_data\CRM\8-K_2024-05-29.md'


2025-11-14 16:10:01,612 - INFO - Finished converting document 8-K_2024-07-01 in 0.20 sec.
2025-11-14 16:10:01,681 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:01,705 - INFO - Going to convert document batch...
2025-11-14 16:10:01,707 - INFO - Processing document 8-K_2024-08-28
2025-11-14 16:10:01,784 - INFO - Finished converting document 8-K_2024-08-28 in 0.11 sec.
2025-11-14 16:10:01,840 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\8-K_2024-07-01' --> 'data\processed_data\CRM\8-K_2024-07-01.md'
Converted 'data\edgar_documents\CRM\8-K_2024-08-28' --> 'data\processed_data\CRM\8-K_2024-08-28.md'


2025-11-14 16:10:01,861 - INFO - Going to convert document batch...
2025-11-14 16:10:01,862 - INFO - Processing document 8-K_2024-09-05
2025-11-14 16:10:01,903 - INFO - Finished converting document 8-K_2024-09-05 in 0.09 sec.
2025-11-14 16:10:01,946 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:01,965 - INFO - Going to convert document batch...
2025-11-14 16:10:01,966 - INFO - Processing document 8-K_2024-11-05
2025-11-14 16:10:02,001 - INFO - Finished converting document 8-K_2024-11-05 in 0.08 sec.
2025-11-14 16:10:02,069 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:02,094 - INFO - Going to convert document batch...
2025-11-14 16:10:02,095 - INFO - Processing document 8-K_2024-12-03


Converted 'data\edgar_documents\CRM\8-K_2024-09-05' --> 'data\processed_data\CRM\8-K_2024-09-05.md'
Converted 'data\edgar_documents\CRM\8-K_2024-11-05' --> 'data\processed_data\CRM\8-K_2024-11-05.md'


2025-11-14 16:10:02,135 - INFO - Finished converting document 8-K_2024-12-03 in 0.11 sec.
2025-11-14 16:10:02,171 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:02,192 - INFO - Going to convert document batch...
2025-11-14 16:10:02,193 - INFO - Processing document 8-K_2024-12-10
2025-11-14 16:10:02,232 - INFO - Finished converting document 8-K_2024-12-10 in 0.08 sec.
2025-11-14 16:10:02,285 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:02,306 - INFO - Going to convert document batch...
2025-11-14 16:10:02,310 - INFO - Processing document 8-K_2025-02-05
2025-11-14 16:10:02,347 - INFO - Finished converting document 8-K_2025-02-05 in 0.09 sec.


Converted 'data\edgar_documents\CRM\8-K_2024-12-03' --> 'data\processed_data\CRM\8-K_2024-12-03.md'
Converted 'data\edgar_documents\CRM\8-K_2024-12-10' --> 'data\processed_data\CRM\8-K_2024-12-10.md'


2025-11-14 16:10:02,392 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:02,413 - INFO - Going to convert document batch...
2025-11-14 16:10:02,414 - INFO - Processing document 8-K_2025-02-26
2025-11-14 16:10:02,463 - INFO - Finished converting document 8-K_2025-02-26 in 0.09 sec.
2025-11-14 16:10:02,526 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:02,541 - INFO - Going to convert document batch...
2025-11-14 16:10:02,542 - INFO - Processing document 8-K_2025-05-27
2025-11-14 16:10:02,570 - INFO - Finished converting document 8-K_2025-05-27 in 0.06 sec.


Converted 'data\edgar_documents\CRM\8-K_2025-02-05' --> 'data\processed_data\CRM\8-K_2025-02-05.md'
Converted 'data\edgar_documents\CRM\8-K_2025-02-26' --> 'data\processed_data\CRM\8-K_2025-02-26.md'


2025-11-14 16:10:02,605 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:02,625 - INFO - Going to convert document batch...
2025-11-14 16:10:02,626 - INFO - Processing document 8-K_2025-05-28
2025-11-14 16:10:02,659 - INFO - Finished converting document 8-K_2025-05-28 in 0.08 sec.
2025-11-14 16:10:02,698 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:02,738 - INFO - Going to convert document batch...
2025-11-14 16:10:02,740 - INFO - Processing document 8-K_2025-06-09


Converted 'data\edgar_documents\CRM\8-K_2025-05-27' --> 'data\processed_data\CRM\8-K_2025-05-27.md'
Converted 'data\edgar_documents\CRM\8-K_2025-05-28' --> 'data\processed_data\CRM\8-K_2025-05-28.md'


2025-11-14 16:10:02,828 - INFO - Finished converting document 8-K_2025-06-09 in 0.14 sec.
2025-11-14 16:10:02,886 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:02,911 - INFO - Going to convert document batch...
2025-11-14 16:10:02,912 - INFO - Processing document 8-K_2025-06-24
2025-11-14 16:10:02,950 - INFO - Finished converting document 8-K_2025-06-24 in 0.09 sec.
2025-11-14 16:10:02,996 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:03,022 - INFO - Going to convert document batch...
2025-11-14 16:10:03,023 - INFO - Processing document 8-K_2025-07-09


Converted 'data\edgar_documents\CRM\8-K_2025-06-09' --> 'data\processed_data\CRM\8-K_2025-06-09.md'
Converted 'data\edgar_documents\CRM\8-K_2025-06-24' --> 'data\processed_data\CRM\8-K_2025-06-24.md'


2025-11-14 16:10:03,059 - INFO - Finished converting document 8-K_2025-07-09 in 0.09 sec.
2025-11-14 16:10:03,115 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:03,148 - INFO - Going to convert document batch...
2025-11-14 16:10:03,151 - INFO - Processing document 8-K_2025-09-03
2025-11-14 16:10:03,232 - INFO - Finished converting document 8-K_2025-09-03 in 0.14 sec.
2025-11-14 16:10:03,285 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\8-K_2025-07-09' --> 'data\processed_data\CRM\8-K_2025-07-09.md'
Converted 'data\edgar_documents\CRM\8-K_2025-09-03' --> 'data\processed_data\CRM\8-K_2025-09-03.md'


2025-11-14 16:10:03,330 - INFO - Going to convert document batch...
2025-11-14 16:10:03,331 - INFO - Processing document 8-K_2025-10-16
2025-11-14 16:10:03,389 - INFO - Finished converting document 8-K_2025-10-16 in 0.14 sec.
2025-11-14 16:10:03,465 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:10:03,466 - ERROR - Input document DEF-14A_2023-04-27 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:10:03,469 - INFO - Going to convert 

Converted 'data\edgar_documents\CRM\8-K_2025-10-16' --> 'data\processed_data\CRM\8-K_2025-10-16.md'
Error processing data\edgar_documents\CRM\DEF-14A_2023-04-27: File format not allowed: data\edgar_documents\CRM\DEF-14A_2023-04-27
Error processing data\edgar_documents\CRM\DEF-14A_2024-05-16: File format not allowed: data\edgar_documents\CRM\DEF-14A_2024-05-16


2025-11-14 16:10:03,650 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:10:05,898 - INFO - Going to convert document batch...
2025-11-14 16:10:05,900 - INFO - Processing document DEF-14A_2025-04-24
2025-11-14 16:10:50,592 - INFO - Finished converting document DEF-14A_2025-04-24 in 47.06 sec.
2025-11-14 16:10:52,231 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CRM\DEF-14A_2025-04-24' --> 'data\processed_data\CRM\DEF-14A_2025-04-24.md'
Processed 509 new files. Errors: 2
Found 128 files to process in data\edgar_documents\CSCO


2025-11-14 16:10:53,216 - INFO - Going to convert document batch...
2025-11-14 16:10:53,218 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:10:53,218 - INFO - Processing document 10-K_2023-09-07
2025-11-14 16:10:55,011 - INFO - Finished converting document 10-K_2023-09-07 in 2.86 sec.
2025-11-14 16:10:55,662 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\10-K_2023-09-07' --> 'data\processed_data\CSCO\10-K_2023-09-07.md'


2025-11-14 16:10:56,617 - INFO - Going to convert document batch...
2025-11-14 16:10:56,618 - INFO - Processing document 10-K_2024-09-05
2025-11-14 16:10:58,499 - INFO - Finished converting document 10-K_2024-09-05 in 2.91 sec.
2025-11-14 16:10:59,234 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\10-K_2024-09-05' --> 'data\processed_data\CSCO\10-K_2024-09-05.md'


2025-11-14 16:11:00,380 - INFO - Going to convert document batch...
2025-11-14 16:11:00,380 - INFO - Processing document 10-K_2025-09-03
2025-11-14 16:11:02,250 - INFO - Finished converting document 10-K_2025-09-03 in 3.09 sec.
2025-11-14 16:11:02,935 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\10-K_2025-09-03' --> 'data\processed_data\CSCO\10-K_2025-09-03.md'


2025-11-14 16:11:03,523 - INFO - Going to convert document batch...
2025-11-14 16:11:03,524 - INFO - Processing document 10-Q_2023-02-21
2025-11-14 16:11:05,454 - INFO - Finished converting document 10-Q_2023-02-21 in 2.59 sec.
2025-11-14 16:11:06,080 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\10-Q_2023-02-21' --> 'data\processed_data\CSCO\10-Q_2023-02-21.md'


2025-11-14 16:11:06,671 - INFO - Going to convert document batch...
2025-11-14 16:11:06,672 - INFO - Processing document 10-Q_2023-05-24
2025-11-14 16:11:08,187 - INFO - Finished converting document 10-Q_2023-05-24 in 2.17 sec.
2025-11-14 16:11:08,830 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\10-Q_2023-05-24' --> 'data\processed_data\CSCO\10-Q_2023-05-24.md'


2025-11-14 16:11:09,807 - INFO - Going to convert document batch...
2025-11-14 16:11:09,808 - INFO - Processing document 10-Q_2023-11-21
2025-11-14 16:11:11,031 - INFO - Finished converting document 10-Q_2023-11-21 in 2.25 sec.
2025-11-14 16:11:11,525 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\10-Q_2023-11-21' --> 'data\processed_data\CSCO\10-Q_2023-11-21.md'


2025-11-14 16:11:12,499 - INFO - Going to convert document batch...
2025-11-14 16:11:12,500 - INFO - Processing document 10-Q_2024-02-20
2025-11-14 16:11:15,895 - INFO - Finished converting document 10-Q_2024-02-20 in 4.42 sec.
2025-11-14 16:11:17,323 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\10-Q_2024-02-20' --> 'data\processed_data\CSCO\10-Q_2024-02-20.md'


2025-11-14 16:11:20,243 - INFO - Going to convert document batch...
2025-11-14 16:11:20,245 - INFO - Processing document 10-Q_2024-05-21
2025-11-14 16:11:24,307 - INFO - Finished converting document 10-Q_2024-05-21 in 7.05 sec.
2025-11-14 16:11:25,795 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\10-Q_2024-05-21' --> 'data\processed_data\CSCO\10-Q_2024-05-21.md'


2025-11-14 16:11:26,925 - INFO - Going to convert document batch...
2025-11-14 16:11:26,927 - INFO - Processing document 10-Q_2024-11-19
2025-11-14 16:11:29,859 - INFO - Finished converting document 10-Q_2024-11-19 in 4.09 sec.
2025-11-14 16:11:31,982 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\10-Q_2024-11-19' --> 'data\processed_data\CSCO\10-Q_2024-11-19.md'


2025-11-14 16:11:33,735 - INFO - Going to convert document batch...
2025-11-14 16:11:33,737 - INFO - Processing document 10-Q_2025-02-18
2025-11-14 16:11:37,528 - INFO - Finished converting document 10-Q_2025-02-18 in 5.62 sec.
2025-11-14 16:11:39,494 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\10-Q_2025-02-18' --> 'data\processed_data\CSCO\10-Q_2025-02-18.md'


2025-11-14 16:11:40,919 - INFO - Going to convert document batch...
2025-11-14 16:11:40,920 - INFO - Processing document 10-Q_2025-05-20
2025-11-14 16:11:44,629 - INFO - Finished converting document 10-Q_2025-05-20 in 5.22 sec.
2025-11-14 16:11:46,979 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:47,004 - INFO - Going to convert document batch...
2025-11-14 16:11:47,006 - INFO - Processing document 4_2023-02-14
2025-11-14 16:11:47,059 - INFO - Finished converting document 4_2023-02-14 in 0.11 sec.


Converted 'data\edgar_documents\CSCO\10-Q_2025-05-20' --> 'data\processed_data\CSCO\10-Q_2025-05-20.md'
Converted 'data\edgar_documents\CSCO\4_2023-02-14' --> 'data\processed_data\CSCO\4_2023-02-14.md'


2025-11-14 16:11:47,146 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:47,177 - INFO - Going to convert document batch...
2025-11-14 16:11:47,179 - INFO - Processing document 4_2023-02-22
2025-11-14 16:11:47,234 - INFO - Finished converting document 4_2023-02-22 in 0.11 sec.
2025-11-14 16:11:47,310 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:47,339 - INFO - Going to convert document batch...
2025-11-14 16:11:47,341 - INFO - Processing document 4_2023-02-24
2025-11-14 16:11:47,405 - INFO - Finished converting document 4_2023-02-24 in 0.12 sec.


Converted 'data\edgar_documents\CSCO\4_2023-02-22' --> 'data\processed_data\CSCO\4_2023-02-22.md'
Converted 'data\edgar_documents\CSCO\4_2023-02-24' --> 'data\processed_data\CSCO\4_2023-02-24.md'


2025-11-14 16:11:47,497 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:47,533 - INFO - Going to convert document batch...
2025-11-14 16:11:47,536 - INFO - Processing document 4_2023-03-14
2025-11-14 16:11:47,602 - INFO - Finished converting document 4_2023-03-14 in 0.12 sec.
2025-11-14 16:11:47,676 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:47,690 - INFO - Going to convert document batch...
2025-11-14 16:11:47,691 - INFO - Processing document 4_2023-03-17
2025-11-14 16:11:47,753 - INFO - Finished converting document 4_2023-03-17 in 0.09 sec.
2025-11-14 16:11:47,830 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\4_2023-03-14' --> 'data\processed_data\CSCO\4_2023-03-14.md'
Converted 'data\edgar_documents\CSCO\4_2023-03-17' --> 'data\processed_data\CSCO\4_2023-03-17.md'


2025-11-14 16:11:47,857 - INFO - Going to convert document batch...
2025-11-14 16:11:47,861 - INFO - Processing document 4_2023-05-12
2025-11-14 16:11:47,924 - INFO - Finished converting document 4_2023-05-12 in 0.12 sec.
2025-11-14 16:11:48,008 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:48,030 - INFO - Going to convert document batch...
2025-11-14 16:11:48,031 - INFO - Processing document 4_2023-05-23
2025-11-14 16:11:48,086 - INFO - Finished converting document 4_2023-05-23 in 0.09 sec.


Converted 'data\edgar_documents\CSCO\4_2023-05-12' --> 'data\processed_data\CSCO\4_2023-05-12.md'
Converted 'data\edgar_documents\CSCO\4_2023-05-23' --> 'data\processed_data\CSCO\4_2023-05-23.md'


2025-11-14 16:11:48,189 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:48,218 - INFO - Going to convert document batch...
2025-11-14 16:11:48,220 - INFO - Processing document 4_2023-06-08
2025-11-14 16:11:48,256 - INFO - Finished converting document 4_2023-06-08 in 0.09 sec.
2025-11-14 16:11:48,336 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:48,362 - INFO - Going to convert document batch...
2025-11-14 16:11:48,365 - INFO - Processing document 4_2023-06-13
2025-11-14 16:11:48,422 - INFO - Finished converting document 4_2023-06-13 in 0.11 sec.


Converted 'data\edgar_documents\CSCO\4_2023-06-08' --> 'data\processed_data\CSCO\4_2023-06-08.md'
Converted 'data\edgar_documents\CSCO\4_2023-06-13' --> 'data\processed_data\CSCO\4_2023-06-13.md'


2025-11-14 16:11:48,507 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:48,545 - INFO - Going to convert document batch...
2025-11-14 16:11:48,547 - INFO - Processing document 4_2023-06-14
2025-11-14 16:11:48,605 - INFO - Finished converting document 4_2023-06-14 in 0.14 sec.
2025-11-14 16:11:48,675 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:48,691 - INFO - Going to convert document batch...
2025-11-14 16:11:48,693 - INFO - Processing document 4_2023-06-16
2025-11-14 16:11:48,727 - INFO - Finished converting document 4_2023-06-16 in 0.06 sec.
2025-11-14 16:11:48,802 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:48,821 - INFO - Going to convert document batch...
2025-11-14 16:11:48,823 - INFO - Processing document 4_2023-06-23


Converted 'data\edgar_documents\CSCO\4_2023-06-14' --> 'data\processed_data\CSCO\4_2023-06-14.md'
Converted 'data\edgar_documents\CSCO\4_2023-06-16' --> 'data\processed_data\CSCO\4_2023-06-16.md'


2025-11-14 16:11:48,862 - INFO - Finished converting document 4_2023-06-23 in 0.09 sec.
2025-11-14 16:11:48,941 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:48,957 - INFO - Going to convert document batch...
2025-11-14 16:11:48,958 - INFO - Processing document 4_2023-08-14
2025-11-14 16:11:48,999 - INFO - Finished converting document 4_2023-08-14 in 0.08 sec.
2025-11-14 16:11:49,064 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:49,094 - INFO - Going to convert document batch...
2025-11-14 16:11:49,096 - INFO - Processing document 4_2023-08-22


Converted 'data\edgar_documents\CSCO\4_2023-06-23' --> 'data\processed_data\CSCO\4_2023-06-23.md'
Converted 'data\edgar_documents\CSCO\4_2023-08-14' --> 'data\processed_data\CSCO\4_2023-08-14.md'


2025-11-14 16:11:49,144 - INFO - Finished converting document 4_2023-08-22 in 0.11 sec.
2025-11-14 16:11:49,258 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:49,321 - INFO - Going to convert document batch...
2025-11-14 16:11:49,324 - INFO - Processing document 4_2023-08-23
2025-11-14 16:11:49,407 - INFO - Finished converting document 4_2023-08-23 in 0.19 sec.


Converted 'data\edgar_documents\CSCO\4_2023-08-22' --> 'data\processed_data\CSCO\4_2023-08-22.md'


2025-11-14 16:11:49,455 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:49,468 - INFO - Going to convert document batch...
2025-11-14 16:11:49,470 - INFO - Processing document 4_2023-09-12
2025-11-14 16:11:49,493 - INFO - Finished converting document 4_2023-09-12 in 0.05 sec.
2025-11-14 16:11:49,572 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:49,599 - INFO - Going to convert document batch...
2025-11-14 16:11:49,601 - INFO - Processing document 4_2023-09-14
2025-11-14 16:11:49,642 - INFO - Finished converting document 4_2023-09-14 in 0.09 sec.


Converted 'data\edgar_documents\CSCO\4_2023-08-23' --> 'data\processed_data\CSCO\4_2023-08-23.md'
Converted 'data\edgar_documents\CSCO\4_2023-09-12' --> 'data\processed_data\CSCO\4_2023-09-12.md'


2025-11-14 16:11:49,727 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:49,761 - INFO - Going to convert document batch...
2025-11-14 16:11:49,764 - INFO - Processing document 4_2023-09-19
2025-11-14 16:11:49,814 - INFO - Finished converting document 4_2023-09-19 in 0.11 sec.
2025-11-14 16:11:49,878 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:11:49,880 - ERROR - Input document 4_2023-09-21 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:11

Converted 'data\edgar_documents\CSCO\4_2023-09-14' --> 'data\processed_data\CSCO\4_2023-09-14.md'
Converted 'data\edgar_documents\CSCO\4_2023-09-19' --> 'data\processed_data\CSCO\4_2023-09-19.md'
Error processing data\edgar_documents\CSCO\4_2023-09-21: File format not allowed: data\edgar_documents\CSCO\4_2023-09-21


2025-11-14 16:11:49,908 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:49,947 - INFO - Going to convert document batch...
2025-11-14 16:11:49,950 - INFO - Processing document 4_2023-09-25
2025-11-14 16:11:49,994 - INFO - Finished converting document 4_2023-09-25 in 0.12 sec.
2025-11-14 16:11:50,040 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:50,055 - INFO - Going to convert document batch...
2025-11-14 16:11:50,055 - INFO - Processing document 4_2023-10-12
2025-11-14 16:11:50,088 - INFO - Finished converting document 4_2023-10-12 in 0.05 sec.
2025-11-14 16:11:50,176 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:50,204 - INFO - Going to convert document batch...
2025-11-14 16:11:50,206 - INFO - Processing document 4_2023-11-14
2025-11-14 16:11:50,261 - INFO - Finished converting document 4_2023-11-14 in 0.12 sec.


Converted 'data\edgar_documents\CSCO\4_2023-09-25' --> 'data\processed_data\CSCO\4_2023-09-25.md'
Converted 'data\edgar_documents\CSCO\4_2023-10-12' --> 'data\processed_data\CSCO\4_2023-10-12.md'


2025-11-14 16:11:50,347 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:50,359 - INFO - Going to convert document batch...
2025-11-14 16:11:50,360 - INFO - Processing document 4_2023-11-21
2025-11-14 16:11:50,399 - INFO - Finished converting document 4_2023-11-21 in 0.06 sec.
2025-11-14 16:11:50,489 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\4_2023-11-14' --> 'data\processed_data\CSCO\4_2023-11-14.md'
Converted 'data\edgar_documents\CSCO\4_2023-11-21' --> 'data\processed_data\CSCO\4_2023-11-21.md'


2025-11-14 16:11:50,526 - INFO - Going to convert document batch...
2025-11-14 16:11:50,529 - INFO - Processing document 4_2023-11-30
2025-11-14 16:11:50,606 - INFO - Finished converting document 4_2023-11-30 in 0.16 sec.
2025-11-14 16:11:50,678 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:50,707 - INFO - Going to convert document batch...
2025-11-14 16:11:50,708 - INFO - Processing document 4_2023-12-08
2025-11-14 16:11:50,778 - INFO - Finished converting document 4_2023-12-08 in 0.12 sec.


Converted 'data\edgar_documents\CSCO\4_2023-11-30' --> 'data\processed_data\CSCO\4_2023-11-30.md'
Converted 'data\edgar_documents\CSCO\4_2023-12-08' --> 'data\processed_data\CSCO\4_2023-12-08.md'


2025-11-14 16:11:50,879 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:50,911 - INFO - Going to convert document batch...
2025-11-14 16:11:50,913 - INFO - Processing document 4_2023-12-12
2025-11-14 16:11:50,968 - INFO - Finished converting document 4_2023-12-12 in 0.12 sec.
2025-11-14 16:11:51,020 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:51,044 - INFO - Going to convert document batch...
2025-11-14 16:11:51,045 - INFO - Processing document 4_2023-12-15
2025-11-14 16:11:51,101 - INFO - Finished converting document 4_2023-12-15 in 0.09 sec.
2025-11-14 16:11:51,180 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\4_2023-12-12' --> 'data\processed_data\CSCO\4_2023-12-12.md'
Converted 'data\edgar_documents\CSCO\4_2023-12-15' --> 'data\processed_data\CSCO\4_2023-12-15.md'


2025-11-14 16:11:51,201 - INFO - Going to convert document batch...
2025-11-14 16:11:51,203 - INFO - Processing document 4_2023-12-18
2025-11-14 16:11:51,274 - INFO - Finished converting document 4_2023-12-18 in 0.12 sec.
2025-11-14 16:11:51,325 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:51,339 - INFO - Going to convert document batch...
2025-11-14 16:11:51,341 - INFO - Processing document 4_2024-02-13
2025-11-14 16:11:51,387 - INFO - Finished converting document 4_2024-02-13 in 0.08 sec.
2025-11-14 16:11:51,463 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:51,492 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CSCO\4_2023-12-18' --> 'data\processed_data\CSCO\4_2023-12-18.md'
Converted 'data\edgar_documents\CSCO\4_2024-02-13' --> 'data\processed_data\CSCO\4_2024-02-13.md'


2025-11-14 16:11:51,495 - INFO - Processing document 4_2024-02-21
2025-11-14 16:11:51,541 - INFO - Finished converting document 4_2024-02-21 in 0.09 sec.
2025-11-14 16:11:51,623 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:11:51,624 - ERROR - Input document 4_2024-02-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:11:51,627 - INFO - Going to convert document batch...
2025-11-14 16:11:51,658 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11

Converted 'data\edgar_documents\CSCO\4_2024-02-21' --> 'data\processed_data\CSCO\4_2024-02-21.md'
Error processing data\edgar_documents\CSCO\4_2024-02-22: File format not allowed: data\edgar_documents\CSCO\4_2024-02-22
Converted 'data\edgar_documents\CSCO\4_2024-03-07' --> 'data\processed_data\CSCO\4_2024-03-07.md'


2025-11-14 16:11:51,784 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:51,819 - INFO - Going to convert document batch...
2025-11-14 16:11:51,822 - INFO - Processing document 4_2024-03-12
2025-11-14 16:11:51,871 - INFO - Finished converting document 4_2024-03-12 in 0.11 sec.
2025-11-14 16:11:51,946 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:51,972 - INFO - Going to convert document batch...
2025-11-14 16:11:51,974 - INFO - Processing document 4_2024-03-14
2025-11-14 16:11:52,029 - INFO - Finished converting document 4_2024-03-14 in 0.12 sec.


Converted 'data\edgar_documents\CSCO\4_2024-03-12' --> 'data\processed_data\CSCO\4_2024-03-12.md'
Converted 'data\edgar_documents\CSCO\4_2024-03-14' --> 'data\processed_data\CSCO\4_2024-03-14.md'


2025-11-14 16:11:52,100 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:52,123 - INFO - Going to convert document batch...
2025-11-14 16:11:52,124 - INFO - Processing document 4_2024-03-19
2025-11-14 16:11:52,175 - INFO - Finished converting document 4_2024-03-19 in 0.11 sec.
2025-11-14 16:11:52,229 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:52,256 - INFO - Going to convert document batch...
2025-11-14 16:11:52,257 - INFO - Processing document 4_2024-05-14
2025-11-14 16:11:52,297 - INFO - Finished converting document 4_2024-05-14 in 0.08 sec.
2025-11-14 16:11:52,375 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:52,391 - INFO - Going to convert document batch...
2025-11-14 16:11:52,393 - INFO - Processing document 4_2024-05-21


Converted 'data\edgar_documents\CSCO\4_2024-03-19' --> 'data\processed_data\CSCO\4_2024-03-19.md'
Converted 'data\edgar_documents\CSCO\4_2024-05-14' --> 'data\processed_data\CSCO\4_2024-05-14.md'


2025-11-14 16:11:52,452 - INFO - Finished converting document 4_2024-05-21 in 0.11 sec.
2025-11-14 16:11:52,519 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:52,534 - INFO - Going to convert document batch...
2025-11-14 16:11:52,535 - INFO - Processing document 4_2024-05-31
2025-11-14 16:11:52,578 - INFO - Finished converting document 4_2024-05-31 in 0.08 sec.
2025-11-14 16:11:52,640 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:52,660 - INFO - Going to convert document batch...
2025-11-14 16:11:52,661 - INFO - Processing document 4_2024-06-12


Converted 'data\edgar_documents\CSCO\4_2024-05-21' --> 'data\processed_data\CSCO\4_2024-05-21.md'
Converted 'data\edgar_documents\CSCO\4_2024-05-31' --> 'data\processed_data\CSCO\4_2024-05-31.md'


2025-11-14 16:11:52,719 - INFO - Finished converting document 4_2024-06-12 in 0.11 sec.
2025-11-14 16:11:52,822 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:52,847 - INFO - Going to convert document batch...
2025-11-14 16:11:52,850 - INFO - Processing document 4_2024-06-14
2025-11-14 16:11:52,889 - INFO - Finished converting document 4_2024-06-14 in 0.08 sec.
2025-11-14 16:11:52,956 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:52,982 - INFO - Going to convert document batch...
2025-11-14 16:11:52,984 - INFO - Processing document 4_2024-06-18


Converted 'data\edgar_documents\CSCO\4_2024-06-12' --> 'data\processed_data\CSCO\4_2024-06-12.md'
Converted 'data\edgar_documents\CSCO\4_2024-06-14' --> 'data\processed_data\CSCO\4_2024-06-14.md'


2025-11-14 16:11:53,038 - INFO - Finished converting document 4_2024-06-18 in 0.09 sec.
2025-11-14 16:11:53,118 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:53,147 - INFO - Going to convert document batch...
2025-11-14 16:11:53,149 - INFO - Processing document 4_2024-08-13
2025-11-14 16:11:53,204 - INFO - Finished converting document 4_2024-08-13 in 0.09 sec.


Converted 'data\edgar_documents\CSCO\4_2024-06-18' --> 'data\processed_data\CSCO\4_2024-06-18.md'
Converted 'data\edgar_documents\CSCO\4_2024-08-13' --> 'data\processed_data\CSCO\4_2024-08-13.md'


2025-11-14 16:11:53,294 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:53,321 - INFO - Going to convert document batch...
2025-11-14 16:11:53,324 - INFO - Processing document 4_2024-08-20
2025-11-14 16:11:53,395 - INFO - Finished converting document 4_2024-08-20 in 0.12 sec.
2025-11-14 16:11:53,473 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:53,495 - INFO - Going to convert document batch...
2025-11-14 16:11:53,497 - INFO - Processing document 4_2024-08-22
2025-11-14 16:11:53,555 - INFO - Finished converting document 4_2024-08-22 in 0.09 sec.
2025-11-14 16:11:53,640 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\4_2024-08-20' --> 'data\processed_data\CSCO\4_2024-08-20.md'
Converted 'data\edgar_documents\CSCO\4_2024-08-22' --> 'data\processed_data\CSCO\4_2024-08-22.md'


2025-11-14 16:11:53,655 - INFO - Going to convert document batch...
2025-11-14 16:11:53,656 - INFO - Processing document 4_2024-08-28
2025-11-14 16:11:53,692 - INFO - Finished converting document 4_2024-08-28 in 0.08 sec.
2025-11-14 16:11:53,783 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:53,807 - INFO - Going to convert document batch...
2025-11-14 16:11:53,809 - INFO - Processing document 4_2024-09-12
2025-11-14 16:11:53,857 - INFO - Finished converting document 4_2024-09-12 in 0.09 sec.
2025-11-14 16:11:53,915 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:53,942 - INFO - Going to convert document batch...
2025-11-14 16:11:53,944 - INFO - Processing document 4_2024-09-18


Converted 'data\edgar_documents\CSCO\4_2024-08-28' --> 'data\processed_data\CSCO\4_2024-08-28.md'
Converted 'data\edgar_documents\CSCO\4_2024-09-12' --> 'data\processed_data\CSCO\4_2024-09-12.md'


2025-11-14 16:11:54,006 - INFO - Finished converting document 4_2024-09-18 in 0.11 sec.
2025-11-14 16:11:54,090 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:54,123 - INFO - Going to convert document batch...
2025-11-14 16:11:54,125 - INFO - Processing document 4_2024-09-23
2025-11-14 16:11:54,175 - INFO - Finished converting document 4_2024-09-23 in 0.11 sec.
2025-11-14 16:11:54,230 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:54,245 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CSCO\4_2024-09-18' --> 'data\processed_data\CSCO\4_2024-09-18.md'
Converted 'data\edgar_documents\CSCO\4_2024-09-23' --> 'data\processed_data\CSCO\4_2024-09-23.md'


2025-11-14 16:11:54,246 - INFO - Processing document 4_2024-11-06
2025-11-14 16:11:54,321 - INFO - Finished converting document 4_2024-11-06 in 0.09 sec.
2025-11-14 16:11:54,372 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:54,396 - INFO - Going to convert document batch...
2025-11-14 16:11:54,397 - INFO - Processing document 4_2024-11-13
2025-11-14 16:11:54,439 - INFO - Finished converting document 4_2024-11-13 in 0.08 sec.
2025-11-14 16:11:54,501 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:54,529 - INFO - Going to convert document batch...
2025-11-14 16:11:54,531 - INFO - Processing document 4_2024-11-19


Converted 'data\edgar_documents\CSCO\4_2024-11-06' --> 'data\processed_data\CSCO\4_2024-11-06.md'
Converted 'data\edgar_documents\CSCO\4_2024-11-13' --> 'data\processed_data\CSCO\4_2024-11-13.md'


2025-11-14 16:11:54,587 - INFO - Finished converting document 4_2024-11-19 in 0.11 sec.
2025-11-14 16:11:54,661 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:54,693 - INFO - Going to convert document batch...
2025-11-14 16:11:54,695 - INFO - Processing document 4_2024-11-21
2025-11-14 16:11:54,749 - INFO - Finished converting document 4_2024-11-21 in 0.11 sec.
2025-11-14 16:11:54,830 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\4_2024-11-19' --> 'data\processed_data\CSCO\4_2024-11-19.md'
Converted 'data\edgar_documents\CSCO\4_2024-11-21' --> 'data\processed_data\CSCO\4_2024-11-21.md'


2025-11-14 16:11:54,864 - INFO - Going to convert document batch...
2025-11-14 16:11:54,866 - INFO - Processing document 4_2024-12-02
2025-11-14 16:11:54,908 - INFO - Finished converting document 4_2024-12-02 in 0.09 sec.
2025-11-14 16:11:54,963 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:54,977 - INFO - Going to convert document batch...
2025-11-14 16:11:54,977 - INFO - Processing document 4_2024-12-06
2025-11-14 16:11:55,006 - INFO - Finished converting document 4_2024-12-06 in 0.06 sec.
2025-11-14 16:11:55,067 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:55,096 - INFO - Going to convert document batch...
2025-11-14 16:11:55,098 - INFO - Processing document 4_2024-12-11


Converted 'data\edgar_documents\CSCO\4_2024-12-02' --> 'data\processed_data\CSCO\4_2024-12-02.md'
Converted 'data\edgar_documents\CSCO\4_2024-12-06' --> 'data\processed_data\CSCO\4_2024-12-06.md'


2025-11-14 16:11:55,160 - INFO - Finished converting document 4_2024-12-11 in 0.12 sec.
2025-11-14 16:11:55,245 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:55,268 - INFO - Going to convert document batch...
2025-11-14 16:11:55,269 - INFO - Processing document 4_2024-12-12
2025-11-14 16:11:55,311 - INFO - Finished converting document 4_2024-12-12 in 0.09 sec.
2025-11-14 16:11:55,383 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\4_2024-12-11' --> 'data\processed_data\CSCO\4_2024-12-11.md'
Converted 'data\edgar_documents\CSCO\4_2024-12-12' --> 'data\processed_data\CSCO\4_2024-12-12.md'


2025-11-14 16:11:55,407 - INFO - Going to convert document batch...
2025-11-14 16:11:55,410 - INFO - Processing document 4_2025-02-12
2025-11-14 16:11:55,469 - INFO - Finished converting document 4_2025-02-12 in 0.11 sec.
2025-11-14 16:11:55,544 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:55,572 - INFO - Going to convert document batch...
2025-11-14 16:11:55,573 - INFO - Processing document 4_2025-02-18
2025-11-14 16:11:55,627 - INFO - Finished converting document 4_2025-02-18 in 0.11 sec.


Converted 'data\edgar_documents\CSCO\4_2025-02-12' --> 'data\processed_data\CSCO\4_2025-02-12.md'
Converted 'data\edgar_documents\CSCO\4_2025-02-18' --> 'data\processed_data\CSCO\4_2025-02-18.md'


2025-11-14 16:11:55,698 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:11:55,700 - ERROR - Input document 4_2025-02-19 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:11:55,703 - INFO - Going to convert document batch...
2025-11-14 16:11:55,736 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:11:55,739 - ERROR - Input document 4_2025-02-21 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\CSCO\4_2025-02-19: File format not allowed: data\edgar_documents\CSCO\4_2025-02-19
Error processing data\edgar_documents\CSCO\4_2025-02-21: File format not allowed: data\edgar_documents\CSCO\4_2025-02-21


2025-11-14 16:11:55,934 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:55,956 - INFO - Going to convert document batch...
2025-11-14 16:11:55,957 - INFO - Processing document 4_2025-02-27
2025-11-14 16:11:55,990 - INFO - Finished converting document 4_2025-02-27 in 0.06 sec.
2025-11-14 16:11:56,053 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:56,083 - INFO - Going to convert document batch...
2025-11-14 16:11:56,085 - INFO - Processing document 4_2025-03-12


Converted 'data\edgar_documents\CSCO\4_2025-02-24' --> 'data\processed_data\CSCO\4_2025-02-24.md'
Converted 'data\edgar_documents\CSCO\4_2025-02-27' --> 'data\processed_data\CSCO\4_2025-02-27.md'


2025-11-14 16:11:56,147 - INFO - Finished converting document 4_2025-03-12 in 0.12 sec.
2025-11-14 16:11:56,230 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:56,247 - INFO - Going to convert document batch...
2025-11-14 16:11:56,251 - INFO - Processing document 4_2025-03-18
2025-11-14 16:11:56,321 - INFO - Finished converting document 4_2025-03-18 in 0.09 sec.
2025-11-14 16:11:56,415 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\4_2025-03-12' --> 'data\processed_data\CSCO\4_2025-03-12.md'
Converted 'data\edgar_documents\CSCO\4_2025-03-18' --> 'data\processed_data\CSCO\4_2025-03-18.md'


2025-11-14 16:11:56,431 - INFO - Going to convert document batch...
2025-11-14 16:11:56,434 - INFO - Processing document 4_2025-05-13
2025-11-14 16:11:56,492 - INFO - Finished converting document 4_2025-05-13 in 0.09 sec.
2025-11-14 16:11:56,547 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:56,571 - INFO - Going to convert document batch...
2025-11-14 16:11:56,575 - INFO - Processing document 4_2025-05-20
2025-11-14 16:11:56,635 - INFO - Finished converting document 4_2025-05-20 in 0.09 sec.


Converted 'data\edgar_documents\CSCO\4_2025-05-13' --> 'data\processed_data\CSCO\4_2025-05-13.md'
Converted 'data\edgar_documents\CSCO\4_2025-05-20' --> 'data\processed_data\CSCO\4_2025-05-20.md'


2025-11-14 16:11:56,731 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:56,748 - INFO - Going to convert document batch...
2025-11-14 16:11:56,750 - INFO - Processing document 4_2025-05-29
2025-11-14 16:11:56,787 - INFO - Finished converting document 4_2025-05-29 in 0.08 sec.
2025-11-14 16:11:56,858 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:56,884 - INFO - Going to convert document batch...
2025-11-14 16:11:56,886 - INFO - Processing document 4_2025-06-06
2025-11-14 16:11:56,943 - INFO - Finished converting document 4_2025-06-06 in 0.09 sec.
2025-11-14 16:11:57,020 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\4_2025-05-29' --> 'data\processed_data\CSCO\4_2025-05-29.md'
Converted 'data\edgar_documents\CSCO\4_2025-06-06' --> 'data\processed_data\CSCO\4_2025-06-06.md'


2025-11-14 16:11:57,041 - INFO - Going to convert document batch...
2025-11-14 16:11:57,045 - INFO - Processing document 4_2025-06-09
2025-11-14 16:11:57,100 - INFO - Finished converting document 4_2025-06-09 in 0.09 sec.
2025-11-14 16:11:57,196 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:57,215 - INFO - Going to convert document batch...
2025-11-14 16:11:57,216 - INFO - Processing document 4_2025-06-12
2025-11-14 16:11:57,290 - INFO - Finished converting document 4_2025-06-12 in 0.11 sec.
2025-11-14 16:11:57,352 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\4_2025-06-09' --> 'data\processed_data\CSCO\4_2025-06-09.md'
Converted 'data\edgar_documents\CSCO\4_2025-06-12' --> 'data\processed_data\CSCO\4_2025-06-12.md'


2025-11-14 16:11:57,381 - INFO - Going to convert document batch...
2025-11-14 16:11:57,383 - INFO - Processing document 4_2025-06-18
2025-11-14 16:11:57,432 - INFO - Finished converting document 4_2025-06-18 in 0.11 sec.
2025-11-14 16:11:57,494 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:57,513 - INFO - Going to convert document batch...
2025-11-14 16:11:57,514 - INFO - Processing document 4_2025-06-20
2025-11-14 16:11:57,569 - INFO - Finished converting document 4_2025-06-20 in 0.09 sec.
2025-11-14 16:11:57,633 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:57,649 - INFO - Going to convert document batch...
2025-11-14 16:11:57,650 - INFO - Processing document 4_2025-07-14


Converted 'data\edgar_documents\CSCO\4_2025-06-18' --> 'data\processed_data\CSCO\4_2025-06-18.md'
Converted 'data\edgar_documents\CSCO\4_2025-06-20' --> 'data\processed_data\CSCO\4_2025-06-20.md'


2025-11-14 16:11:57,686 - INFO - Finished converting document 4_2025-07-14 in 0.08 sec.
2025-11-14 16:11:57,742 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:57,772 - INFO - Going to convert document batch...
2025-11-14 16:11:57,773 - INFO - Processing document 4_2025-08-12
2025-11-14 16:11:57,838 - INFO - Finished converting document 4_2025-08-12 in 0.12 sec.


Converted 'data\edgar_documents\CSCO\4_2025-07-14' --> 'data\processed_data\CSCO\4_2025-07-14.md'
Converted 'data\edgar_documents\CSCO\4_2025-08-12' --> 'data\processed_data\CSCO\4_2025-08-12.md'


2025-11-14 16:11:57,930 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:57,963 - INFO - Going to convert document batch...
2025-11-14 16:11:57,965 - INFO - Processing document 4_2025-08-19
2025-11-14 16:11:58,038 - INFO - Finished converting document 4_2025-08-19 in 0.12 sec.
2025-11-14 16:11:58,124 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:58,142 - INFO - Going to convert document batch...
2025-11-14 16:11:58,144 - INFO - Processing document 4_2025-08-20
2025-11-14 16:11:58,189 - INFO - Finished converting document 4_2025-08-20 in 0.08 sec.


Converted 'data\edgar_documents\CSCO\4_2025-08-19' --> 'data\processed_data\CSCO\4_2025-08-19.md'
Converted 'data\edgar_documents\CSCO\4_2025-08-20' --> 'data\processed_data\CSCO\4_2025-08-20.md'


2025-11-14 16:11:58,311 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:58,337 - INFO - Going to convert document batch...
2025-11-14 16:11:58,339 - INFO - Processing document 4_2025-08-27
2025-11-14 16:11:58,405 - INFO - Finished converting document 4_2025-08-27 in 0.12 sec.
2025-11-14 16:11:58,485 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:58,506 - INFO - Going to convert document batch...
2025-11-14 16:11:58,507 - INFO - Processing document 4_2025-09-11
2025-11-14 16:11:58,558 - INFO - Finished converting document 4_2025-09-11 in 0.09 sec.
2025-11-14 16:11:58,610 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:58,624 - INFO - Going to convert document batch...
2025-11-14 16:11:58,628 - INFO - Processing document 4_2025-09-15


Converted 'data\edgar_documents\CSCO\4_2025-08-27' --> 'data\processed_data\CSCO\4_2025-08-27.md'
Converted 'data\edgar_documents\CSCO\4_2025-09-11' --> 'data\processed_data\CSCO\4_2025-09-11.md'


2025-11-14 16:11:58,698 - INFO - Finished converting document 4_2025-09-15 in 0.11 sec.
2025-11-14 16:11:58,769 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:58,796 - INFO - Going to convert document batch...
2025-11-14 16:11:58,799 - INFO - Processing document 4_2025-09-17
2025-11-14 16:11:58,861 - INFO - Finished converting document 4_2025-09-17 in 0.12 sec.


Converted 'data\edgar_documents\CSCO\4_2025-09-15' --> 'data\processed_data\CSCO\4_2025-09-15.md'
Converted 'data\edgar_documents\CSCO\4_2025-09-17' --> 'data\processed_data\CSCO\4_2025-09-17.md'


2025-11-14 16:11:58,941 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:58,970 - INFO - Going to convert document batch...
2025-11-14 16:11:58,972 - INFO - Processing document 4_2025-09-18
2025-11-14 16:11:59,010 - INFO - Finished converting document 4_2025-09-18 in 0.11 sec.
2025-11-14 16:11:59,066 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:59,087 - INFO - Going to convert document batch...
2025-11-14 16:11:59,088 - INFO - Processing document 4_2025-09-22
2025-11-14 16:11:59,128 - INFO - Finished converting document 4_2025-09-22 in 0.08 sec.
2025-11-14 16:11:59,195 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:59,220 - INFO - Going to convert document batch...
2025-11-14 16:11:59,222 - INFO - Processing document 4_2025-10-14


Converted 'data\edgar_documents\CSCO\4_2025-09-18' --> 'data\processed_data\CSCO\4_2025-09-18.md'
Converted 'data\edgar_documents\CSCO\4_2025-09-22' --> 'data\processed_data\CSCO\4_2025-09-22.md'


2025-11-14 16:11:59,263 - INFO - Finished converting document 4_2025-10-14 in 0.11 sec.
2025-11-14 16:11:59,322 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:59,343 - INFO - Going to convert document batch...
2025-11-14 16:11:59,344 - INFO - Processing document 8-K_2023-02-15
2025-11-14 16:11:59,379 - INFO - Finished converting document 8-K_2023-02-15 in 0.08 sec.
2025-11-14 16:11:59,436 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:59,470 - INFO - Going to convert document batch...
2025-11-14 16:11:59,471 - INFO - Processing document 8-K_2023-02-21


Converted 'data\edgar_documents\CSCO\4_2025-10-14' --> 'data\processed_data\CSCO\4_2025-10-14.md'
Converted 'data\edgar_documents\CSCO\8-K_2023-02-15' --> 'data\processed_data\CSCO\8-K_2023-02-15.md'


2025-11-14 16:11:59,497 - INFO - Finished converting document 8-K_2023-02-21 in 0.09 sec.
2025-11-14 16:11:59,533 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:59,558 - INFO - Going to convert document batch...
2025-11-14 16:11:59,559 - INFO - Processing document 8-K_2023-03-10
2025-11-14 16:11:59,590 - INFO - Finished converting document 8-K_2023-03-10 in 0.08 sec.
2025-11-14 16:11:59,649 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:59,680 - INFO - Going to convert document batch...
2025-11-14 16:11:59,683 - INFO - Processing document 8-K_2023-05-17


Converted 'data\edgar_documents\CSCO\8-K_2023-02-21' --> 'data\processed_data\CSCO\8-K_2023-02-21.md'
Converted 'data\edgar_documents\CSCO\8-K_2023-03-10' --> 'data\processed_data\CSCO\8-K_2023-03-10.md'


2025-11-14 16:11:59,753 - INFO - Finished converting document 8-K_2023-05-17 in 0.14 sec.
2025-11-14 16:11:59,804 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:11:59,832 - INFO - Going to convert document batch...
2025-11-14 16:11:59,834 - INFO - Processing document 8-K_2023-07-19
2025-11-14 16:11:59,874 - INFO - Finished converting document 8-K_2023-07-19 in 0.09 sec.
2025-11-14 16:11:59,938 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\8-K_2023-05-17' --> 'data\processed_data\CSCO\8-K_2023-05-17.md'
Converted 'data\edgar_documents\CSCO\8-K_2023-07-19' --> 'data\processed_data\CSCO\8-K_2023-07-19.md'


2025-11-14 16:11:59,971 - INFO - Going to convert document batch...
2025-11-14 16:11:59,973 - INFO - Processing document 8-K_2023-08-16
2025-11-14 16:12:00,018 - INFO - Finished converting document 8-K_2023-08-16 in 0.11 sec.
2025-11-14 16:12:00,080 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\8-K_2023-08-16' --> 'data\processed_data\CSCO\8-K_2023-08-16.md'


2025-11-14 16:12:01,155 - INFO - Going to convert document batch...
2025-11-14 16:12:01,156 - INFO - Processing document 8-K_2023-09-21
2025-11-14 16:12:01,224 - INFO - Finished converting document 8-K_2023-09-21 in 1.16 sec.
2025-11-14 16:12:01,275 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:01,291 - INFO - Going to convert document batch...
2025-11-14 16:12:01,292 - INFO - Processing document 8-K_2023-09-25
2025-11-14 16:12:01,318 - INFO - Finished converting document 8-K_2023-09-25 in 0.06 sec.
2025-11-14 16:12:01,373 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:01,402 - INFO - Going to convert document batch...
2025-11-14 16:12:01,403 - INFO - Processing document 8-K_2023-10-10
2025-11-14 16:12:01,432 - INFO - Finished converting document 8-K_2023-10-10 in 0.09 sec.


Converted 'data\edgar_documents\CSCO\8-K_2023-09-21' --> 'data\processed_data\CSCO\8-K_2023-09-21.md'
Converted 'data\edgar_documents\CSCO\8-K_2023-09-25' --> 'data\processed_data\CSCO\8-K_2023-09-25.md'


2025-11-14 16:12:01,463 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:01,483 - INFO - Going to convert document batch...
2025-11-14 16:12:01,484 - INFO - Processing document 8-K_2023-11-15
2025-11-14 16:12:01,521 - INFO - Finished converting document 8-K_2023-11-15 in 0.06 sec.
2025-11-14 16:12:01,565 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:01,609 - INFO - Going to convert document batch...
2025-11-14 16:12:01,611 - INFO - Processing document 8-K_2023-12-08


Converted 'data\edgar_documents\CSCO\8-K_2023-10-10' --> 'data\processed_data\CSCO\8-K_2023-10-10.md'
Converted 'data\edgar_documents\CSCO\8-K_2023-11-15' --> 'data\processed_data\CSCO\8-K_2023-11-15.md'


2025-11-14 16:12:01,682 - INFO - Finished converting document 8-K_2023-12-08 in 0.14 sec.
2025-11-14 16:12:01,733 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:01,770 - INFO - Going to convert document batch...
2025-11-14 16:12:01,771 - INFO - Processing document 8-K_2024-02-08
2025-11-14 16:12:01,834 - INFO - Finished converting document 8-K_2024-02-08 in 0.11 sec.
2025-11-14 16:12:01,892 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:01,917 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CSCO\8-K_2023-12-08' --> 'data\processed_data\CSCO\8-K_2023-12-08.md'
Converted 'data\edgar_documents\CSCO\8-K_2024-02-08' --> 'data\processed_data\CSCO\8-K_2024-02-08.md'


2025-11-14 16:12:01,918 - INFO - Processing document 8-K_2024-02-14
2025-11-14 16:12:01,951 - INFO - Finished converting document 8-K_2024-02-14 in 0.09 sec.
2025-11-14 16:12:01,988 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:02,013 - INFO - Going to convert document batch...
2025-11-14 16:12:02,015 - INFO - Processing document 8-K_2024-02-26
2025-11-14 16:12:02,076 - INFO - Finished converting document 8-K_2024-02-26 in 0.11 sec.
2025-11-14 16:12:02,137 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:02,168 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CSCO\8-K_2024-02-14' --> 'data\processed_data\CSCO\8-K_2024-02-14.md'
Converted 'data\edgar_documents\CSCO\8-K_2024-02-26' --> 'data\processed_data\CSCO\8-K_2024-02-26.md'


2025-11-14 16:12:02,169 - INFO - Processing document 8-K_2024-03-18
2025-11-14 16:12:02,224 - INFO - Finished converting document 8-K_2024-03-18 in 0.11 sec.
2025-11-14 16:12:02,262 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:02,305 - INFO - Going to convert document batch...
2025-11-14 16:12:02,307 - INFO - Processing document 8-K_2024-05-15
2025-11-14 16:12:02,369 - INFO - Finished converting document 8-K_2024-05-15 in 0.12 sec.


Converted 'data\edgar_documents\CSCO\8-K_2024-03-18' --> 'data\processed_data\CSCO\8-K_2024-03-18.md'
Converted 'data\edgar_documents\CSCO\8-K_2024-05-15' --> 'data\processed_data\CSCO\8-K_2024-05-15.md'


2025-11-14 16:12:02,435 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:02,460 - INFO - Going to convert document batch...
2025-11-14 16:12:02,463 - INFO - Processing document 8-K_2024-06-14
2025-11-14 16:12:02,501 - INFO - Finished converting document 8-K_2024-06-14 in 0.09 sec.
2025-11-14 16:12:02,542 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:02,567 - INFO - Going to convert document batch...
2025-11-14 16:12:02,568 - INFO - Processing document 8-K_2024-07-19
2025-11-14 16:12:02,603 - INFO - Finished converting document 8-K_2024-07-19 in 0.08 sec.
2025-11-14 16:12:02,664 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:02,681 - INFO - Going to convert document batch...
2025-11-14 16:12:02,682 - INFO - Processing document 8-K_2024-08-14


Converted 'data\edgar_documents\CSCO\8-K_2024-06-14' --> 'data\processed_data\CSCO\8-K_2024-06-14.md'
Converted 'data\edgar_documents\CSCO\8-K_2024-07-19' --> 'data\processed_data\CSCO\8-K_2024-07-19.md'


2025-11-14 16:12:02,733 - INFO - Finished converting document 8-K_2024-08-14 in 0.11 sec.
2025-11-14 16:12:02,780 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:02,803 - INFO - Going to convert document batch...
2025-11-14 16:12:02,806 - INFO - Processing document 8-K_2024-10-11
2025-11-14 16:12:02,834 - INFO - Finished converting document 8-K_2024-10-11 in 0.08 sec.
2025-11-14 16:12:02,884 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:02,921 - INFO - Going to convert document batch...
2025-11-14 16:12:02,924 - INFO - Processing document 8-K_2024-11-13


Converted 'data\edgar_documents\CSCO\8-K_2024-08-14' --> 'data\processed_data\CSCO\8-K_2024-08-14.md'
Converted 'data\edgar_documents\CSCO\8-K_2024-10-11' --> 'data\processed_data\CSCO\8-K_2024-10-11.md'


2025-11-14 16:12:02,981 - INFO - Finished converting document 8-K_2024-11-13 in 0.14 sec.
2025-11-14 16:12:03,033 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:03,086 - INFO - Going to convert document batch...
2025-11-14 16:12:03,087 - INFO - Processing document 8-K_2024-12-11
2025-11-14 16:12:03,164 - INFO - Finished converting document 8-K_2024-12-11 in 0.14 sec.


Converted 'data\edgar_documents\CSCO\8-K_2024-11-13' --> 'data\processed_data\CSCO\8-K_2024-11-13.md'


2025-11-14 16:12:03,224 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:03,234 - INFO - Going to convert document batch...
2025-11-14 16:12:03,235 - INFO - Processing document 8-K_2025-02-12
2025-11-14 16:12:03,284 - INFO - Finished converting document 8-K_2025-02-12 in 0.06 sec.
2025-11-14 16:12:03,350 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\8-K_2024-12-11' --> 'data\processed_data\CSCO\8-K_2024-12-11.md'
Converted 'data\edgar_documents\CSCO\8-K_2025-02-12' --> 'data\processed_data\CSCO\8-K_2025-02-12.md'


2025-11-14 16:12:03,392 - INFO - Going to convert document batch...
2025-11-14 16:12:03,394 - INFO - Processing document 8-K_2025-02-24
2025-11-14 16:12:03,468 - INFO - Finished converting document 8-K_2025-02-24 in 0.16 sec.
2025-11-14 16:12:03,519 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:03,535 - INFO - Going to convert document batch...
2025-11-14 16:12:03,537 - INFO - Processing document 8-K_2025-02-27
2025-11-14 16:12:03,583 - INFO - Finished converting document 8-K_2025-02-27 in 0.08 sec.
2025-11-14 16:12:03,642 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:03,661 - INFO - Going to convert document batch...
2025-11-14 16:12:03,663 - INFO - Processing document 8-K_2025-05-13
2025-11-14 16:12:03,705 - INFO - Finished converting document 8-K_2025-05-13 in 0.09 sec.


Converted 'data\edgar_documents\CSCO\8-K_2025-02-24' --> 'data\processed_data\CSCO\8-K_2025-02-24.md'
Converted 'data\edgar_documents\CSCO\8-K_2025-02-27' --> 'data\processed_data\CSCO\8-K_2025-02-27.md'


2025-11-14 16:12:03,742 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:03,758 - INFO - Going to convert document batch...
2025-11-14 16:12:03,758 - INFO - Processing document 8-K_2025-05-14
2025-11-14 16:12:03,783 - INFO - Finished converting document 8-K_2025-05-14 in 0.06 sec.
2025-11-14 16:12:03,824 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:03,842 - INFO - Going to convert document batch...
2025-11-14 16:12:03,844 - INFO - Processing document 8-K_2025-06-09
2025-11-14 16:12:03,869 - INFO - Finished converting document 8-K_2025-06-09 in 0.06 sec.


Converted 'data\edgar_documents\CSCO\8-K_2025-05-13' --> 'data\processed_data\CSCO\8-K_2025-05-13.md'
Converted 'data\edgar_documents\CSCO\8-K_2025-05-14' --> 'data\processed_data\CSCO\8-K_2025-05-14.md'
Converted 'data\edgar_documents\CSCO\8-K_2025-06-09' --> 'data\processed_data\CSCO\8-K_2025-06-09.md'


2025-11-14 16:12:03,933 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:03,967 - INFO - Going to convert document batch...
2025-11-14 16:12:03,968 - INFO - Processing document 8-K_2025-08-13
2025-11-14 16:12:04,004 - INFO - Finished converting document 8-K_2025-08-13 in 0.11 sec.
2025-11-14 16:12:04,041 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:04,056 - INFO - Going to convert document batch...
2025-11-14 16:12:04,058 - INFO - Processing document 8-K_2025-08-25
2025-11-14 16:12:04,110 - INFO - Finished converting document 8-K_2025-08-25 in 0.09 sec.
2025-11-14 16:12:04,170 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:12:04,195 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CSCO\8-K_2025-08-13' --> 'data\processed_data\CSCO\8-K_2025-08-13.md'
Converted 'data\edgar_documents\CSCO\8-K_2025-08-25' --> 'data\processed_data\CSCO\8-K_2025-08-25.md'


2025-11-14 16:12:04,197 - INFO - Processing document 8-K_2025-10-17
2025-11-14 16:12:04,254 - INFO - Finished converting document 8-K_2025-10-17 in 0.11 sec.
2025-11-14 16:12:04,376 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:12:04,379 - ERROR - Input document DEF-14A_2023-10-17 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:12:04,385 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CSCO\8-K_2025-10-17' --> 'data\processed_data\CSCO\8-K_2025-10-17.md'
Error processing data\edgar_documents\CSCO\DEF-14A_2023-10-17: File format not allowed: data\edgar_documents\CSCO\DEF-14A_2023-10-17


2025-11-14 16:12:04,463 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:12:04,466 - ERROR - Input document DEF-14A_2024-10-18 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:12:04,472 - INFO - Going to convert document batch...
2025-11-14 16:12:04,571 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Error processing data\edgar_documents\CSCO\DEF-14A_2024-10-18: File format not allowed: data\edgar_documents\CSCO\DEF-14A_2024-10-18


2025-11-14 16:12:05,673 - INFO - Going to convert document batch...
2025-11-14 16:12:05,674 - INFO - Processing document DEF-14A_2025-10-28
2025-11-14 16:12:10,551 - INFO - Finished converting document DEF-14A_2025-10-28 in 6.08 sec.
2025-11-14 16:12:12,503 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CSCO\DEF-14A_2025-10-28' --> 'data\processed_data\CSCO\DEF-14A_2025-10-28.md'
Processed 122 new files. Errors: 6
Found 112 files to process in data\edgar_documents\CVS


2025-11-14 16:12:15,996 - INFO - Going to convert document batch...
2025-11-14 16:12:15,998 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:12:15,999 - INFO - Processing document 10-K_2023-02-08
2025-11-14 16:12:27,447 - INFO - Finished converting document 10-K_2023-02-08 in 15.08 sec.
2025-11-14 16:12:30,467 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\10-K_2023-02-08' --> 'data\processed_data\CVS\10-K_2023-02-08.md'


2025-11-14 16:12:34,438 - INFO - Going to convert document batch...
2025-11-14 16:12:34,439 - INFO - Processing document 10-K_2024-02-07
2025-11-14 16:12:48,257 - INFO - Finished converting document 10-K_2024-02-07 in 17.92 sec.
2025-11-14 16:12:51,052 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\10-K_2024-02-07' --> 'data\processed_data\CVS\10-K_2024-02-07.md'


2025-11-14 16:12:55,097 - INFO - Going to convert document batch...
2025-11-14 16:12:55,099 - INFO - Processing document 10-K_2025-02-12
2025-11-14 16:13:08,019 - INFO - Finished converting document 10-K_2025-02-12 in 17.09 sec.
2025-11-14 16:13:10,751 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\10-K_2025-02-12' --> 'data\processed_data\CVS\10-K_2025-02-12.md'


2025-11-14 16:13:13,657 - INFO - Going to convert document batch...
2025-11-14 16:13:13,658 - INFO - Processing document 10-Q_2023-05-03
2025-11-14 16:13:17,618 - INFO - Finished converting document 10-Q_2023-05-03 in 6.97 sec.
2025-11-14 16:13:19,295 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\10-Q_2023-05-03' --> 'data\processed_data\CVS\10-Q_2023-05-03.md'


2025-11-14 16:13:22,814 - INFO - Going to convert document batch...
2025-11-14 16:13:22,816 - INFO - Processing document 10-Q_2023-08-02
2025-11-14 16:13:27,696 - INFO - Finished converting document 10-Q_2023-08-02 in 8.50 sec.
2025-11-14 16:13:29,796 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\10-Q_2023-08-02' --> 'data\processed_data\CVS\10-Q_2023-08-02.md'


2025-11-14 16:13:33,210 - INFO - Going to convert document batch...
2025-11-14 16:13:33,212 - INFO - Processing document 10-Q_2023-11-01
2025-11-14 16:13:38,186 - INFO - Finished converting document 10-Q_2023-11-01 in 8.52 sec.
2025-11-14 16:13:40,163 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\10-Q_2023-11-01' --> 'data\processed_data\CVS\10-Q_2023-11-01.md'


2025-11-14 16:13:42,657 - INFO - Going to convert document batch...
2025-11-14 16:13:42,659 - INFO - Processing document 10-Q_2024-05-01
2025-11-14 16:13:45,620 - INFO - Finished converting document 10-Q_2024-05-01 in 5.52 sec.
2025-11-14 16:13:47,089 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\10-Q_2024-05-01' --> 'data\processed_data\CVS\10-Q_2024-05-01.md'


2025-11-14 16:13:49,737 - INFO - Going to convert document batch...
2025-11-14 16:13:49,738 - INFO - Processing document 10-Q_2024-08-07
2025-11-14 16:13:53,358 - INFO - Finished converting document 10-Q_2024-08-07 in 6.33 sec.
2025-11-14 16:13:55,020 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\10-Q_2024-08-07' --> 'data\processed_data\CVS\10-Q_2024-08-07.md'


2025-11-14 16:13:57,423 - INFO - Going to convert document batch...
2025-11-14 16:13:57,424 - INFO - Processing document 10-Q_2024-11-06
2025-11-14 16:14:01,715 - INFO - Finished converting document 10-Q_2024-11-06 in 6.80 sec.
2025-11-14 16:14:03,391 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\10-Q_2024-11-06' --> 'data\processed_data\CVS\10-Q_2024-11-06.md'


2025-11-14 16:14:04,843 - INFO - Going to convert document batch...
2025-11-14 16:14:04,846 - INFO - Processing document 10-Q_2025-05-01
2025-11-14 16:14:07,475 - INFO - Finished converting document 10-Q_2025-05-01 in 4.12 sec.
2025-11-14 16:14:10,060 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\10-Q_2025-05-01' --> 'data\processed_data\CVS\10-Q_2025-05-01.md'


2025-11-14 16:14:11,916 - INFO - Going to convert document batch...
2025-11-14 16:14:11,918 - INFO - Processing document 10-Q_2025-07-31
2025-11-14 16:14:16,629 - INFO - Finished converting document 10-Q_2025-07-31 in 6.62 sec.
2025-11-14 16:14:18,508 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\10-Q_2025-07-31' --> 'data\processed_data\CVS\10-Q_2025-07-31.md'


2025-11-14 16:14:20,534 - INFO - Going to convert document batch...
2025-11-14 16:14:20,536 - INFO - Processing document 10-Q_2025-10-29
2025-11-14 16:14:25,955 - INFO - Finished converting document 10-Q_2025-10-29 in 7.55 sec.
2025-11-14 16:14:27,924 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:27,961 - INFO - Going to convert document batch...
2025-11-14 16:14:27,962 - INFO - Processing document 4_2023-01-04
2025-11-14 16:14:28,049 - INFO - Finished converting document 4_2023-01-04 in 0.14 sec.


Converted 'data\edgar_documents\CVS\10-Q_2025-10-29' --> 'data\processed_data\CVS\10-Q_2025-10-29.md'


2025-11-14 16:14:28,160 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:28,197 - INFO - Going to convert document batch...
2025-11-14 16:14:28,199 - INFO - Processing document 4_2023-02-03
2025-11-14 16:14:28,279 - INFO - Finished converting document 4_2023-02-03 in 0.14 sec.


Converted 'data\edgar_documents\CVS\4_2023-01-04' --> 'data\processed_data\CVS\4_2023-01-04.md'
Converted 'data\edgar_documents\CVS\4_2023-02-03' --> 'data\processed_data\CVS\4_2023-02-03.md'


2025-11-14 16:14:28,387 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:14:28,389 - ERROR - Input document 4_2023-02-13 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:14:28,392 - INFO - Going to convert document batch...
2025-11-14 16:14:28,434 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:14:28,438 - ERROR - Input document 4_2023-02-15 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Error processing data\edgar_documents\CVS\4_2023-02-13: File format not allowed: data\edgar_documents\CVS\4_2023-02-13
Error processing data\edgar_documents\CVS\4_2023-02-15: File format not allowed: data\edgar_documents\CVS\4_2023-02-15
Converted 'data\edgar_documents\CVS\4_2023-03-01' --> 'data\processed_data\CVS\4_2023-03-01.md'


2025-11-14 16:14:28,604 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:28,663 - INFO - Going to convert document batch...
2025-11-14 16:14:28,665 - INFO - Processing document 4_2023-04-04
2025-11-14 16:14:28,755 - INFO - Finished converting document 4_2023-04-04 in 0.17 sec.
2025-11-14 16:14:28,845 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:28,886 - INFO - Going to convert document batch...
2025-11-14 16:14:28,888 - INFO - Processing document 4_2023-05-05
2025-11-14 16:14:28,976 - INFO - Finished converting document 4_2023-05-05 in 0.14 sec.


Converted 'data\edgar_documents\CVS\4_2023-04-04' --> 'data\processed_data\CVS\4_2023-04-04.md'


2025-11-14 16:14:29,077 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:29,107 - INFO - Going to convert document batch...
2025-11-14 16:14:29,109 - INFO - Processing document 4_2023-05-19
2025-11-14 16:14:29,167 - INFO - Finished converting document 4_2023-05-19 in 0.11 sec.
2025-11-14 16:14:29,263 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\CVS\4_2023-05-05' --> 'data\processed_data\CVS\4_2023-05-05.md'
Converted 'data\edgar_documents\CVS\4_2023-05-19' --> 'data\processed_data\CVS\4_2023-05-19.md'


2025-11-14 16:14:29,265 - ERROR - Input document 4_2023-05-30 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:14:29,267 - INFO - Going to convert document batch...
2025-11-14 16:14:29,292 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:14:29,299 - ERROR - Input document 4_2023-06-01 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputForm

Error processing data\edgar_documents\CVS\4_2023-05-30: File format not allowed: data\edgar_documents\CVS\4_2023-05-30
Error processing data\edgar_documents\CVS\4_2023-06-01: File format not allowed: data\edgar_documents\CVS\4_2023-06-01


2025-11-14 16:14:29,510 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:29,565 - INFO - Going to convert document batch...
2025-11-14 16:14:29,567 - INFO - Processing document 4_2023-09-01
2025-11-14 16:14:29,649 - INFO - Finished converting document 4_2023-09-01 in 0.14 sec.


Converted 'data\edgar_documents\CVS\4_2023-08-04' --> 'data\processed_data\CVS\4_2023-08-04.md'


2025-11-14 16:14:29,747 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:29,771 - INFO - Going to convert document batch...
2025-11-14 16:14:29,772 - INFO - Processing document 4_2023-10-02
2025-11-14 16:14:29,827 - INFO - Finished converting document 4_2023-10-02 in 0.09 sec.
2025-11-14 16:14:29,909 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:29,927 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CVS\4_2023-09-01' --> 'data\processed_data\CVS\4_2023-09-01.md'
Converted 'data\edgar_documents\CVS\4_2023-10-02' --> 'data\processed_data\CVS\4_2023-10-02.md'


2025-11-14 16:14:29,929 - INFO - Processing document 4_2023-11-06
2025-11-14 16:14:29,997 - INFO - Finished converting document 4_2023-11-06 in 0.12 sec.
2025-11-14 16:14:30,052 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:30,073 - INFO - Going to convert document batch...
2025-11-14 16:14:30,074 - INFO - Processing document 4_2023-11-17
2025-11-14 16:14:30,115 - INFO - Finished converting document 4_2023-11-17 in 0.08 sec.
2025-11-14 16:14:30,205 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\4_2023-11-06' --> 'data\processed_data\CVS\4_2023-11-06.md'
Converted 'data\edgar_documents\CVS\4_2023-11-17' --> 'data\processed_data\CVS\4_2023-11-17.md'


2025-11-14 16:14:30,223 - INFO - Going to convert document batch...
2025-11-14 16:14:30,225 - INFO - Processing document 4_2023-12-01
2025-11-14 16:14:30,296 - INFO - Finished converting document 4_2023-12-01 in 0.12 sec.
2025-11-14 16:14:30,373 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:30,399 - INFO - Going to convert document batch...
2025-11-14 16:14:30,401 - INFO - Processing document 4_2023-12-08
2025-11-14 16:14:30,457 - INFO - Finished converting document 4_2023-12-08 in 0.11 sec.


Converted 'data\edgar_documents\CVS\4_2023-12-01' --> 'data\processed_data\CVS\4_2023-12-01.md'
Converted 'data\edgar_documents\CVS\4_2023-12-08' --> 'data\processed_data\CVS\4_2023-12-08.md'


2025-11-14 16:14:30,554 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:30,596 - INFO - Going to convert document batch...
2025-11-14 16:14:30,598 - INFO - Processing document 4_2023-12-15
2025-11-14 16:14:30,685 - INFO - Finished converting document 4_2023-12-15 in 0.17 sec.
2025-11-14 16:14:30,775 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:30,811 - INFO - Going to convert document batch...
2025-11-14 16:14:30,814 - INFO - Processing document 4_2024-02-14
2025-11-14 16:14:30,892 - INFO - Finished converting document 4_2024-02-14 in 0.14 sec.


Converted 'data\edgar_documents\CVS\4_2023-12-15' --> 'data\processed_data\CVS\4_2023-12-15.md'


2025-11-14 16:14:30,976 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:31,024 - INFO - Going to convert document batch...
2025-11-14 16:14:31,026 - INFO - Processing document 4_2024-02-16
2025-11-14 16:14:31,111 - INFO - Finished converting document 4_2024-02-16 in 0.16 sec.


Converted 'data\edgar_documents\CVS\4_2024-02-14' --> 'data\processed_data\CVS\4_2024-02-14.md'


2025-11-14 16:14:31,197 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:31,225 - INFO - Going to convert document batch...
2025-11-14 16:14:31,227 - INFO - Processing document 4_2024-02-28
2025-11-14 16:14:31,281 - INFO - Finished converting document 4_2024-02-28 in 0.11 sec.


Converted 'data\edgar_documents\CVS\4_2024-02-16' --> 'data\processed_data\CVS\4_2024-02-16.md'
Converted 'data\edgar_documents\CVS\4_2024-02-28' --> 'data\processed_data\CVS\4_2024-02-28.md'


2025-11-14 16:14:31,387 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:31,418 - INFO - Going to convert document batch...
2025-11-14 16:14:31,419 - INFO - Processing document 4_2024-03-01
2025-11-14 16:14:31,464 - INFO - Finished converting document 4_2024-03-01 in 0.12 sec.
2025-11-14 16:14:31,520 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:31,536 - INFO - Going to convert document batch...
2025-11-14 16:14:31,537 - INFO - Processing document 4_2024-04-03
2025-11-14 16:14:31,572 - INFO - Finished converting document 4_2024-04-03 in 0.06 sec.
2025-11-14 16:14:31,639 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:31,665 - INFO - Going to convert document batch...
2025-11-14 16:14:31,668 - INFO - Processing document 4_2024-05-02


Converted 'data\edgar_documents\CVS\4_2024-03-01' --> 'data\processed_data\CVS\4_2024-03-01.md'
Converted 'data\edgar_documents\CVS\4_2024-04-03' --> 'data\processed_data\CVS\4_2024-04-03.md'


2025-11-14 16:14:31,725 - INFO - Finished converting document 4_2024-05-02 in 0.11 sec.
2025-11-14 16:14:31,802 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:14:31,803 - ERROR - Input document 4_2024-05-07 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:14:31,805 - INFO - Going to convert document batch...
2025-11-14 16:14:31,852 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:14:31,854 - ERROR - Input document 4_2024-05-08 with forma

Converted 'data\edgar_documents\CVS\4_2024-05-02' --> 'data\processed_data\CVS\4_2024-05-02.md'
Error processing data\edgar_documents\CVS\4_2024-05-07: File format not allowed: data\edgar_documents\CVS\4_2024-05-07
Error processing data\edgar_documents\CVS\4_2024-05-08: File format not allowed: data\edgar_documents\CVS\4_2024-05-08


2025-11-14 16:14:31,965 - INFO - Finished converting document 4_2024-05-17 in 0.11 sec.
2025-11-14 16:14:32,041 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:32,054 - INFO - Going to convert document batch...
2025-11-14 16:14:32,056 - INFO - Processing document 4_2024-09-03
2025-11-14 16:14:32,108 - INFO - Finished converting document 4_2024-09-03 in 0.08 sec.
2025-11-14 16:14:32,190 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:32,222 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CVS\4_2024-05-17' --> 'data\processed_data\CVS\4_2024-05-17.md'
Converted 'data\edgar_documents\CVS\4_2024-09-03' --> 'data\processed_data\CVS\4_2024-09-03.md'


2025-11-14 16:14:32,224 - INFO - Processing document 4_2024-11-25
2025-11-14 16:14:32,301 - INFO - Finished converting document 4_2024-11-25 in 0.14 sec.
2025-11-14 16:14:32,382 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:32,425 - INFO - Going to convert document batch...
2025-11-14 16:14:32,433 - INFO - Processing document 4_2024-12-03
2025-11-14 16:14:32,532 - INFO - Finished converting document 4_2024-12-03 in 0.17 sec.


Converted 'data\edgar_documents\CVS\4_2024-11-25' --> 'data\processed_data\CVS\4_2024-11-25.md'


2025-11-14 16:14:32,613 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:14:32,614 - ERROR - Input document 4_2024-12-05 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:14:32,616 - INFO - Going to convert document batch...
2025-11-14 16:14:32,632 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:32,676 - INFO - Going to convert document batch...
2025-11-14 16:14:32,678 - INFO - Processing document 4_2024-12-09
2025-11-14 16:14:32,720 - INFO - Fin

Converted 'data\edgar_documents\CVS\4_2024-12-03' --> 'data\processed_data\CVS\4_2024-12-03.md'
Error processing data\edgar_documents\CVS\4_2024-12-05: File format not allowed: data\edgar_documents\CVS\4_2024-12-05


2025-11-14 16:14:32,804 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:32,841 - INFO - Going to convert document batch...
2025-11-14 16:14:32,844 - INFO - Processing document 4_2024-12-26
2025-11-14 16:14:32,921 - INFO - Finished converting document 4_2024-12-26 in 0.14 sec.


Converted 'data\edgar_documents\CVS\4_2024-12-09' --> 'data\processed_data\CVS\4_2024-12-09.md'


2025-11-14 16:14:33,001 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:33,031 - INFO - Going to convert document batch...
2025-11-14 16:14:33,032 - INFO - Processing document 4_2025-02-19
2025-11-14 16:14:33,097 - INFO - Finished converting document 4_2025-02-19 in 0.11 sec.
2025-11-14 16:14:33,178 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\4_2024-12-26' --> 'data\processed_data\CVS\4_2024-12-26.md'
Converted 'data\edgar_documents\CVS\4_2025-02-19' --> 'data\processed_data\CVS\4_2025-02-19.md'


2025-11-14 16:14:33,199 - INFO - Going to convert document batch...
2025-11-14 16:14:33,200 - INFO - Processing document 4_2025-03-03
2025-11-14 16:14:33,243 - INFO - Finished converting document 4_2025-03-03 in 0.08 sec.
2025-11-14 16:14:33,340 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:33,370 - INFO - Going to convert document batch...
2025-11-14 16:14:33,372 - INFO - Processing document 4_2025-03-07
2025-11-14 16:14:33,431 - INFO - Finished converting document 4_2025-03-07 in 0.11 sec.


Converted 'data\edgar_documents\CVS\4_2025-03-03' --> 'data\processed_data\CVS\4_2025-03-03.md'
Converted 'data\edgar_documents\CVS\4_2025-03-07' --> 'data\processed_data\CVS\4_2025-03-07.md'


2025-11-14 16:14:33,519 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:33,540 - INFO - Going to convert document batch...
2025-11-14 16:14:33,541 - INFO - Processing document 4_2025-03-14
2025-11-14 16:14:33,606 - INFO - Finished converting document 4_2025-03-14 in 0.12 sec.
2025-11-14 16:14:33,685 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:33,706 - INFO - Going to convert document batch...
2025-11-14 16:14:33,707 - INFO - Processing document 4_2025-03-18
2025-11-14 16:14:33,739 - INFO - Finished converting document 4_2025-03-18 in 0.06 sec.
2025-11-14 16:14:33,802 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:33,835 - INFO - Going to convert document batch...
2025-11-14 16:14:33,836 - INFO - Processing document 4_2025-04-03


Converted 'data\edgar_documents\CVS\4_2025-03-14' --> 'data\processed_data\CVS\4_2025-03-14.md'
Converted 'data\edgar_documents\CVS\4_2025-03-18' --> 'data\processed_data\CVS\4_2025-03-18.md'


2025-11-14 16:14:33,894 - INFO - Finished converting document 4_2025-04-03 in 0.12 sec.
2025-11-14 16:14:33,976 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:34,020 - INFO - Going to convert document batch...
2025-11-14 16:14:34,022 - INFO - Processing document 4_2025-05-06
2025-11-14 16:14:34,101 - INFO - Finished converting document 4_2025-05-06 in 0.14 sec.


Converted 'data\edgar_documents\CVS\4_2025-04-03' --> 'data\processed_data\CVS\4_2025-04-03.md'


2025-11-14 16:14:34,211 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:34,240 - INFO - Going to convert document batch...
2025-11-14 16:14:34,241 - INFO - Processing document 4_2025-05-09
2025-11-14 16:14:34,304 - INFO - Finished converting document 4_2025-05-09 in 0.12 sec.


Converted 'data\edgar_documents\CVS\4_2025-05-06' --> 'data\processed_data\CVS\4_2025-05-06.md'
Converted 'data\edgar_documents\CVS\4_2025-05-09' --> 'data\processed_data\CVS\4_2025-05-09.md'


2025-11-14 16:14:34,384 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:34,409 - INFO - Going to convert document batch...
2025-11-14 16:14:34,411 - INFO - Processing document 4_2025-05-19
2025-11-14 16:14:34,518 - INFO - Finished converting document 4_2025-05-19 in 0.14 sec.
2025-11-14 16:14:34,628 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:34,643 - INFO - Going to convert document batch...
2025-11-14 16:14:34,643 - INFO - Processing document 4_2025-06-03
2025-11-14 16:14:34,678 - INFO - Finished converting document 4_2025-06-03 in 0.06 sec.
2025-11-14 16:14:34,750 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:34,775 - INFO - Going to convert document batch...
2025-11-14 16:14:34,777 - INFO - Processing document 4_2025-06-09


Converted 'data\edgar_documents\CVS\4_2025-05-19' --> 'data\processed_data\CVS\4_2025-05-19.md'
Converted 'data\edgar_documents\CVS\4_2025-06-03' --> 'data\processed_data\CVS\4_2025-06-03.md'


2025-11-14 16:14:34,830 - INFO - Finished converting document 4_2025-06-09 in 0.11 sec.
2025-11-14 16:14:34,926 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:14:34,928 - ERROR - Input document 4_2025-08-11 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:14:34,932 - INFO - Going to convert document batch...
2025-11-14 16:14:34,967 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:14:34,969 - ERROR - Input document 4_2025-08-12 with forma

Converted 'data\edgar_documents\CVS\4_2025-06-09' --> 'data\processed_data\CVS\4_2025-06-09.md'
Error processing data\edgar_documents\CVS\4_2025-08-11: File format not allowed: data\edgar_documents\CVS\4_2025-08-11
Error processing data\edgar_documents\CVS\4_2025-08-12: File format not allowed: data\edgar_documents\CVS\4_2025-08-12


2025-11-14 16:14:35,080 - INFO - Finished converting document 4_2025-08-29 in 0.11 sec.
2025-11-14 16:14:35,153 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:35,170 - INFO - Going to convert document batch...
2025-11-14 16:14:35,171 - INFO - Processing document 4_2025-09-02
2025-11-14 16:14:35,203 - INFO - Finished converting document 4_2025-09-02 in 0.06 sec.
2025-11-14 16:14:35,263 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:35,292 - INFO - Going to convert document batch...
2025-11-14 16:14:35,293 - INFO - Processing document 4_2025-10-14


Converted 'data\edgar_documents\CVS\4_2025-08-29' --> 'data\processed_data\CVS\4_2025-08-29.md'
Converted 'data\edgar_documents\CVS\4_2025-09-02' --> 'data\processed_data\CVS\4_2025-09-02.md'


2025-11-14 16:14:35,349 - INFO - Finished converting document 4_2025-10-14 in 0.11 sec.
2025-11-14 16:14:35,421 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:35,461 - INFO - Going to convert document batch...
2025-11-14 16:14:35,463 - INFO - Processing document 8-K_2023-01-09
2025-11-14 16:14:35,511 - INFO - Finished converting document 8-K_2023-01-09 in 0.12 sec.
2025-11-14 16:14:35,562 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\4_2025-10-14' --> 'data\processed_data\CVS\4_2025-10-14.md'
Converted 'data\edgar_documents\CVS\8-K_2023-01-09' --> 'data\processed_data\CVS\8-K_2023-01-09.md'


2025-11-14 16:14:35,596 - INFO - Going to convert document batch...
2025-11-14 16:14:35,598 - INFO - Processing document 8-K_2023-01-23
2025-11-14 16:14:35,660 - INFO - Finished converting document 8-K_2023-01-23 in 0.11 sec.
2025-11-14 16:14:35,714 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:35,761 - INFO - Going to convert document batch...
2025-11-14 16:14:35,762 - INFO - Processing document 8-K_2023-02-08
2025-11-14 16:14:35,821 - INFO - Finished converting document 8-K_2023-02-08 in 0.12 sec.


Converted 'data\edgar_documents\CVS\8-K_2023-01-23' --> 'data\processed_data\CVS\8-K_2023-01-23.md'


2025-11-14 16:14:35,919 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:35,967 - INFO - Going to convert document batch...
2025-11-14 16:14:35,968 - INFO - Processing document 8-K_2023-02-15
2025-11-14 16:14:36,026 - INFO - Finished converting document 8-K_2023-02-15 in 0.14 sec.


Converted 'data\edgar_documents\CVS\8-K_2023-02-08' --> 'data\processed_data\CVS\8-K_2023-02-08.md'
Converted 'data\edgar_documents\CVS\8-K_2023-02-15' --> 'data\processed_data\CVS\8-K_2023-02-15.md'


2025-11-14 16:14:36,093 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:36,133 - INFO - Going to convert document batch...
2025-11-14 16:14:36,135 - INFO - Processing document 8-K_2023-02-21
2025-11-14 16:14:36,207 - INFO - Finished converting document 8-K_2023-02-21 in 0.14 sec.
2025-11-14 16:14:36,256 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:36,275 - INFO - Going to convert document batch...
2025-11-14 16:14:36,276 - INFO - Processing document 8-K_2023-03-30
2025-11-14 16:14:36,301 - INFO - Finished converting document 8-K_2023-03-30 in 0.06 sec.
2025-11-14 16:14:36,363 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:36,387 - INFO - Going to convert document batch...
2025-11-14 16:14:36,388 - INFO - Processing document 8-K_2023-05-02


Converted 'data\edgar_documents\CVS\8-K_2023-02-21' --> 'data\processed_data\CVS\8-K_2023-02-21.md'
Converted 'data\edgar_documents\CVS\8-K_2023-03-30' --> 'data\processed_data\CVS\8-K_2023-03-30.md'


2025-11-14 16:14:36,459 - INFO - Finished converting document 8-K_2023-05-02 in 0.12 sec.
2025-11-14 16:14:36,535 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:36,575 - INFO - Going to convert document batch...
2025-11-14 16:14:36,578 - INFO - Processing document 8-K_2023-05-03
2025-11-14 16:14:36,613 - INFO - Finished converting document 8-K_2023-05-03 in 0.09 sec.
2025-11-14 16:14:36,662 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\8-K_2023-05-02' --> 'data\processed_data\CVS\8-K_2023-05-02.md'
Converted 'data\edgar_documents\CVS\8-K_2023-05-03' --> 'data\processed_data\CVS\8-K_2023-05-03.md'


2025-11-14 16:14:36,721 - INFO - Going to convert document batch...
2025-11-14 16:14:36,723 - INFO - Processing document 8-K_2023-05-24
2025-11-14 16:14:36,808 - INFO - Finished converting document 8-K_2023-05-24 in 0.19 sec.
2025-11-14 16:14:36,891 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\8-K_2023-05-24' --> 'data\processed_data\CVS\8-K_2023-05-24.md'


2025-11-14 16:14:37,339 - INFO - Going to convert document batch...
2025-11-14 16:14:37,341 - INFO - Processing document 8-K_2023-05-25
2025-11-14 16:14:38,791 - INFO - Finished converting document 8-K_2023-05-25 in 1.92 sec.
2025-11-14 16:14:38,862 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:38,907 - INFO - Going to convert document batch...
2025-11-14 16:14:38,908 - INFO - Processing document 8-K_2023-05-31
2025-11-14 16:14:38,952 - INFO - Finished converting document 8-K_2023-05-31 in 0.12 sec.


Converted 'data\edgar_documents\CVS\8-K_2023-05-25' --> 'data\processed_data\CVS\8-K_2023-05-25.md'
Converted 'data\edgar_documents\CVS\8-K_2023-05-31' --> 'data\processed_data\CVS\8-K_2023-05-31.md'


2025-11-14 16:14:39,027 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:39,068 - INFO - Going to convert document batch...
2025-11-14 16:14:39,070 - INFO - Processing document 8-K_2023-06-01
2025-11-14 16:14:39,131 - INFO - Finished converting document 8-K_2023-06-01 in 0.14 sec.
2025-11-14 16:14:39,182 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:39,214 - INFO - Going to convert document batch...
2025-11-14 16:14:39,217 - INFO - Processing document 8-K_2023-06-02
2025-11-14 16:14:39,270 - INFO - Finished converting document 8-K_2023-06-02 in 0.11 sec.
2025-11-14 16:14:39,325 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\8-K_2023-06-01' --> 'data\processed_data\CVS\8-K_2023-06-01.md'
Converted 'data\edgar_documents\CVS\8-K_2023-06-02' --> 'data\processed_data\CVS\8-K_2023-06-02.md'


2025-11-14 16:14:39,361 - INFO - Going to convert document batch...
2025-11-14 16:14:39,363 - INFO - Processing document 8-K_2023-07-20
2025-11-14 16:14:39,421 - INFO - Finished converting document 8-K_2023-07-20 in 0.14 sec.
2025-11-14 16:14:39,478 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:39,511 - INFO - Going to convert document batch...
2025-11-14 16:14:39,512 - INFO - Processing document 8-K_2023-08-02
2025-11-14 16:14:39,553 - INFO - Finished converting document 8-K_2023-08-02 in 0.08 sec.
2025-11-14 16:14:39,636 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\8-K_2023-07-20' --> 'data\processed_data\CVS\8-K_2023-07-20.md'
Converted 'data\edgar_documents\CVS\8-K_2023-08-02' --> 'data\processed_data\CVS\8-K_2023-08-02.md'


2025-11-14 16:14:39,669 - INFO - Going to convert document batch...
2025-11-14 16:14:39,672 - INFO - Processing document 8-K_2023-08-17
2025-11-14 16:14:39,729 - INFO - Finished converting document 8-K_2023-08-17 in 0.14 sec.
2025-11-14 16:14:39,805 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:39,847 - INFO - Going to convert document batch...
2025-11-14 16:14:39,849 - INFO - Processing document 8-K_2023-08-23
2025-11-14 16:14:39,929 - INFO - Finished converting document 8-K_2023-08-23 in 0.14 sec.


Converted 'data\edgar_documents\CVS\8-K_2023-08-17' --> 'data\processed_data\CVS\8-K_2023-08-17.md'
Converted 'data\edgar_documents\CVS\8-K_2023-08-23' --> 'data\processed_data\CVS\8-K_2023-08-23.md'


2025-11-14 16:14:40,010 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:40,075 - INFO - Going to convert document batch...
2025-11-14 16:14:40,078 - INFO - Processing document 8-K_2023-09-11
2025-11-14 16:14:40,167 - INFO - Finished converting document 8-K_2023-09-11 in 0.20 sec.
2025-11-14 16:14:40,220 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:40,239 - INFO - Going to convert document batch...
2025-11-14 16:14:40,240 - INFO - Processing document 8-K_2023-09-21
2025-11-14 16:14:40,293 - INFO - Finished converting document 8-K_2023-09-21 in 0.09 sec.
2025-11-14 16:14:40,363 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\8-K_2023-09-11' --> 'data\processed_data\CVS\8-K_2023-09-11.md'
Converted 'data\edgar_documents\CVS\8-K_2023-09-21' --> 'data\processed_data\CVS\8-K_2023-09-21.md'


2025-11-14 16:14:40,403 - INFO - Going to convert document batch...
2025-11-14 16:14:40,405 - INFO - Processing document 8-K_2023-10-13
2025-11-14 16:14:40,452 - INFO - Finished converting document 8-K_2023-10-13 in 0.12 sec.
2025-11-14 16:14:40,499 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:40,546 - INFO - Going to convert document batch...
2025-11-14 16:14:40,547 - INFO - Processing document 8-K_2023-10-16
2025-11-14 16:14:40,619 - INFO - Finished converting document 8-K_2023-10-16 in 0.12 sec.


Converted 'data\edgar_documents\CVS\8-K_2023-10-13' --> 'data\processed_data\CVS\8-K_2023-10-13.md'


2025-11-14 16:14:40,689 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:40,730 - INFO - Going to convert document batch...
2025-11-14 16:14:40,731 - INFO - Processing document 8-K_2023-11-01
2025-11-14 16:14:40,768 - INFO - Finished converting document 8-K_2023-11-01 in 0.09 sec.
2025-11-14 16:14:40,811 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:40,845 - INFO - Going to convert document batch...
2025-11-14 16:14:40,847 - INFO - Processing document 8-K_2023-12-05


Converted 'data\edgar_documents\CVS\8-K_2023-10-16' --> 'data\processed_data\CVS\8-K_2023-10-16.md'
Converted 'data\edgar_documents\CVS\8-K_2023-11-01' --> 'data\processed_data\CVS\8-K_2023-11-01.md'


2025-11-14 16:14:40,890 - INFO - Finished converting document 8-K_2023-12-05 in 0.09 sec.
2025-11-14 16:14:40,961 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:41,015 - INFO - Going to convert document batch...
2025-11-14 16:14:41,017 - INFO - Processing document 8-K_2024-01-05
2025-11-14 16:14:41,102 - INFO - Finished converting document 8-K_2024-01-05 in 0.17 sec.


Converted 'data\edgar_documents\CVS\8-K_2023-12-05' --> 'data\processed_data\CVS\8-K_2023-12-05.md'


2025-11-14 16:14:41,193 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:41,220 - INFO - Going to convert document batch...
2025-11-14 16:14:41,223 - INFO - Processing document 8-K_2024-02-07
2025-11-14 16:14:41,286 - INFO - Finished converting document 8-K_2024-02-07 in 0.11 sec.
2025-11-14 16:14:41,353 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\8-K_2024-01-05' --> 'data\processed_data\CVS\8-K_2024-01-05.md'
Converted 'data\edgar_documents\CVS\8-K_2024-02-07' --> 'data\processed_data\CVS\8-K_2024-02-07.md'


2025-11-14 16:14:41,401 - INFO - Going to convert document batch...
2025-11-14 16:14:41,403 - INFO - Processing document 8-K_2024-03-05
2025-11-14 16:14:41,498 - INFO - Finished converting document 8-K_2024-03-05 in 0.19 sec.
2025-11-14 16:14:41,561 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:41,591 - INFO - Going to convert document batch...
2025-11-14 16:14:41,594 - INFO - Processing document 8-K_2024-05-01
2025-11-14 16:14:41,645 - INFO - Finished converting document 8-K_2024-05-01 in 0.11 sec.
2025-11-14 16:14:41,705 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:41,727 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CVS\8-K_2024-03-05' --> 'data\processed_data\CVS\8-K_2024-03-05.md'
Converted 'data\edgar_documents\CVS\8-K_2024-05-01' --> 'data\processed_data\CVS\8-K_2024-05-01.md'


2025-11-14 16:14:41,729 - INFO - Processing document 8-K_2024-05-08
2025-11-14 16:14:41,798 - INFO - Finished converting document 8-K_2024-05-08 in 0.12 sec.
2025-11-14 16:14:41,835 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:41,878 - INFO - Going to convert document batch...
2025-11-14 16:14:41,879 - INFO - Processing document 8-K_2024-05-09
2025-11-14 16:14:41,937 - INFO - Finished converting document 8-K_2024-05-09 in 0.12 sec.
2025-11-14 16:14:42,003 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\8-K_2024-05-08' --> 'data\processed_data\CVS\8-K_2024-05-08.md'
Converted 'data\edgar_documents\CVS\8-K_2024-05-09' --> 'data\processed_data\CVS\8-K_2024-05-09.md'


2025-11-14 16:14:42,060 - INFO - Going to convert document batch...
2025-11-14 16:14:42,062 - INFO - Processing document 8-K_2024-05-22
2025-11-14 16:14:42,138 - INFO - Finished converting document 8-K_2024-05-22 in 0.17 sec.
2025-11-14 16:14:42,186 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:42,205 - INFO - Going to convert document batch...
2025-11-14 16:14:42,207 - INFO - Processing document 8-K_2024-08-07
2025-11-14 16:14:42,260 - INFO - Finished converting document 8-K_2024-08-07 in 0.08 sec.
2025-11-14 16:14:42,321 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:42,353 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CVS\8-K_2024-05-22' --> 'data\processed_data\CVS\8-K_2024-05-22.md'
Converted 'data\edgar_documents\CVS\8-K_2024-08-07' --> 'data\processed_data\CVS\8-K_2024-08-07.md'


2025-11-14 16:14:42,355 - INFO - Processing document 8-K_2024-10-18
2025-11-14 16:14:42,395 - INFO - Finished converting document 8-K_2024-10-18 in 0.11 sec.
2025-11-14 16:14:42,445 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:42,463 - INFO - Going to convert document batch...
2025-11-14 16:14:42,465 - INFO - Processing document 8-K_2024-11-06
2025-11-14 16:14:42,497 - INFO - Finished converting document 8-K_2024-11-06 in 0.09 sec.
2025-11-14 16:14:42,553 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:42,584 - INFO - Going to convert document batch...
2025-11-14 16:14:42,586 - INFO - Processing document 8-K_2024-11-18


Converted 'data\edgar_documents\CVS\8-K_2024-10-18' --> 'data\processed_data\CVS\8-K_2024-10-18.md'
Converted 'data\edgar_documents\CVS\8-K_2024-11-06' --> 'data\processed_data\CVS\8-K_2024-11-06.md'


2025-11-14 16:14:42,636 - INFO - Finished converting document 8-K_2024-11-18 in 0.12 sec.
2025-11-14 16:14:42,687 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:42,727 - INFO - Going to convert document batch...
2025-11-14 16:14:42,731 - INFO - Processing document 8-K_2024-12-02
2025-11-14 16:14:42,789 - INFO - Finished converting document 8-K_2024-12-02 in 0.11 sec.
2025-11-14 16:14:42,838 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\8-K_2024-11-18' --> 'data\processed_data\CVS\8-K_2024-11-18.md'
Converted 'data\edgar_documents\CVS\8-K_2024-12-02' --> 'data\processed_data\CVS\8-K_2024-12-02.md'


2025-11-14 16:14:42,869 - INFO - Going to convert document batch...
2025-11-14 16:14:42,871 - INFO - Processing document 8-K_2024-12-05
2025-11-14 16:14:42,930 - INFO - Finished converting document 8-K_2024-12-05 in 0.11 sec.
2025-11-14 16:14:42,980 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:43,010 - INFO - Going to convert document batch...
2025-11-14 16:14:43,011 - INFO - Processing document 8-K_2024-12-06
2025-11-14 16:14:43,043 - INFO - Finished converting document 8-K_2024-12-06 in 0.09 sec.
2025-11-14 16:14:43,074 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:43,092 - INFO - Going to convert document batch...
2025-11-14 16:14:43,094 - INFO - Processing document 8-K_2024-12-09
2025-11-14 16:14:43,134 - INFO - Finished converting document 8-K_2024-12-09 in 0.06 sec.


Converted 'data\edgar_documents\CVS\8-K_2024-12-05' --> 'data\processed_data\CVS\8-K_2024-12-05.md'
Converted 'data\edgar_documents\CVS\8-K_2024-12-06' --> 'data\processed_data\CVS\8-K_2024-12-06.md'


2025-11-14 16:14:43,179 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:43,224 - INFO - Going to convert document batch...
2025-11-14 16:14:43,226 - INFO - Processing document 8-K_2024-12-10
2025-11-14 16:14:43,298 - INFO - Finished converting document 8-K_2024-12-10 in 0.14 sec.


Converted 'data\edgar_documents\CVS\8-K_2024-12-09' --> 'data\processed_data\CVS\8-K_2024-12-09.md'
Converted 'data\edgar_documents\CVS\8-K_2024-12-10' --> 'data\processed_data\CVS\8-K_2024-12-10.md'


2025-11-14 16:14:43,362 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:43,393 - INFO - Going to convert document batch...
2025-11-14 16:14:43,395 - INFO - Processing document 8-K_2024-12-17
2025-11-14 16:14:43,455 - INFO - Finished converting document 8-K_2024-12-17 in 0.12 sec.
2025-11-14 16:14:43,507 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:43,530 - INFO - Going to convert document batch...
2025-11-14 16:14:43,531 - INFO - Processing document 8-K_2025-02-12
2025-11-14 16:14:43,577 - INFO - Finished converting document 8-K_2025-02-12 in 0.09 sec.
2025-11-14 16:14:43,646 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\8-K_2024-12-17' --> 'data\processed_data\CVS\8-K_2024-12-17.md'
Converted 'data\edgar_documents\CVS\8-K_2025-02-12' --> 'data\processed_data\CVS\8-K_2025-02-12.md'


2025-11-14 16:14:43,676 - INFO - Going to convert document batch...
2025-11-14 16:14:43,678 - INFO - Processing document 8-K_2025-04-08
2025-11-14 16:14:43,737 - INFO - Finished converting document 8-K_2025-04-08 in 0.12 sec.
2025-11-14 16:14:43,807 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:43,836 - INFO - Going to convert document batch...
2025-11-14 16:14:43,838 - INFO - Processing document 8-K_2025-05-01
2025-11-14 16:14:43,892 - INFO - Finished converting document 8-K_2025-05-01 in 0.12 sec.
2025-11-14 16:14:43,936 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\8-K_2025-04-08' --> 'data\processed_data\CVS\8-K_2025-04-08.md'
Converted 'data\edgar_documents\CVS\8-K_2025-05-01' --> 'data\processed_data\CVS\8-K_2025-05-01.md'


2025-11-14 16:14:43,980 - INFO - Going to convert document batch...
2025-11-14 16:14:43,983 - INFO - Processing document 8-K_2025-05-20
2025-11-14 16:14:44,042 - INFO - Finished converting document 8-K_2025-05-20 in 0.12 sec.
2025-11-14 16:14:44,112 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:44,141 - INFO - Going to convert document batch...
2025-11-14 16:14:44,143 - INFO - Processing document 8-K_2025-07-31
2025-11-14 16:14:44,196 - INFO - Finished converting document 8-K_2025-07-31 in 0.11 sec.


Converted 'data\edgar_documents\CVS\8-K_2025-05-20' --> 'data\processed_data\CVS\8-K_2025-05-20.md'
Converted 'data\edgar_documents\CVS\8-K_2025-07-31' --> 'data\processed_data\CVS\8-K_2025-07-31.md'


2025-11-14 16:14:44,266 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:44,306 - INFO - Going to convert document batch...
2025-11-14 16:14:44,308 - INFO - Processing document 8-K_2025-08-15
2025-11-14 16:14:44,369 - INFO - Finished converting document 8-K_2025-08-15 in 0.12 sec.
2025-11-14 16:14:44,432 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:14:44,452 - INFO - Going to convert document batch...
2025-11-14 16:14:44,452 - INFO - Processing document 8-K_2025-09-22
2025-11-14 16:14:44,498 - INFO - Finished converting document 8-K_2025-09-22 in 0.09 sec.
2025-11-14 16:14:44,562 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\8-K_2025-08-15' --> 'data\processed_data\CVS\8-K_2025-08-15.md'
Converted 'data\edgar_documents\CVS\8-K_2025-09-22' --> 'data\processed_data\CVS\8-K_2025-09-22.md'


2025-11-14 16:14:44,594 - INFO - Going to convert document batch...
2025-11-14 16:14:44,597 - INFO - Processing document 8-K_2025-10-29
2025-11-14 16:14:44,645 - INFO - Finished converting document 8-K_2025-10-29 in 0.11 sec.
2025-11-14 16:14:44,769 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\8-K_2025-10-29' --> 'data\processed_data\CVS\8-K_2025-10-29.md'


2025-11-14 16:14:47,000 - INFO - Going to convert document batch...
2025-11-14 16:14:47,002 - INFO - Processing document DEF-14A_2023-04-07
2025-11-14 16:16:04,149 - INFO - Finished converting document DEF-14A_2023-04-07 in 79.48 sec.
2025-11-14 16:16:09,268 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\DEF-14A_2023-04-07' --> 'data\processed_data\CVS\DEF-14A_2023-04-07.md'


2025-11-14 16:16:11,641 - INFO - Going to convert document batch...
2025-11-14 16:16:11,643 - INFO - Processing document DEF-14A_2024-04-05
2025-11-14 16:16:19,248 - INFO - Finished converting document DEF-14A_2024-04-05 in 10.09 sec.
2025-11-14 16:17:05,258 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\DEF-14A_2024-04-05' --> 'data\processed_data\CVS\DEF-14A_2024-04-05.md'


2025-11-14 16:17:09,088 - INFO - Going to convert document batch...
2025-11-14 16:17:09,090 - INFO - Processing document DEF-14A_2025-04-04
2025-11-14 16:17:16,296 - INFO - Finished converting document DEF-14A_2025-04-04 in 11.16 sec.
2025-11-14 16:17:21,776 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVS\DEF-14A_2025-04-04' --> 'data\processed_data\CVS\DEF-14A_2025-04-04.md'
Processed 103 new files. Errors: 9
Found 106 files to process in data\edgar_documents\CVX


2025-11-14 16:17:27,892 - INFO - Going to convert document batch...
2025-11-14 16:17:27,893 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:17:27,895 - INFO - Processing document 10-K_2023-02-23
2025-11-14 16:17:39,216 - INFO - Finished converting document 10-K_2023-02-23 in 17.59 sec.
2025-11-14 16:17:44,001 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVX\10-K_2023-02-23' --> 'data\processed_data\CVX\10-K_2023-02-23.md'


2025-11-14 16:17:49,306 - INFO - Going to convert document batch...
2025-11-14 16:17:49,309 - INFO - Processing document 10-K_2024-02-26
2025-11-14 16:18:01,471 - INFO - Finished converting document 10-K_2024-02-26 in 17.62 sec.
2025-11-14 16:18:06,454 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVX\10-K_2024-02-26' --> 'data\processed_data\CVX\10-K_2024-02-26.md'


2025-11-14 16:18:11,065 - INFO - Going to convert document batch...
2025-11-14 16:18:11,068 - INFO - Processing document 10-K_2025-02-21
2025-11-14 16:18:25,616 - INFO - Finished converting document 10-K_2025-02-21 in 19.36 sec.
2025-11-14 16:18:30,893 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVX\10-K_2025-02-21' --> 'data\processed_data\CVX\10-K_2025-02-21.md'


2025-11-14 16:18:32,075 - INFO - Going to convert document batch...
2025-11-14 16:18:32,077 - INFO - Processing document 10-Q_2023-05-04
2025-11-14 16:18:34,559 - INFO - Finished converting document 10-Q_2023-05-04 in 3.73 sec.
2025-11-14 16:18:35,706 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVX\10-Q_2023-05-04' --> 'data\processed_data\CVX\10-Q_2023-05-04.md'


2025-11-14 16:18:37,793 - INFO - Going to convert document batch...
2025-11-14 16:18:37,796 - INFO - Processing document 10-Q_2023-08-03
2025-11-14 16:18:41,677 - INFO - Finished converting document 10-Q_2023-08-03 in 6.03 sec.
2025-11-14 16:18:43,620 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVX\10-Q_2023-08-03' --> 'data\processed_data\CVX\10-Q_2023-08-03.md'


2025-11-14 16:18:46,151 - INFO - Going to convert document batch...
2025-11-14 16:18:46,153 - INFO - Processing document 10-Q_2023-11-02
2025-11-14 16:18:49,790 - INFO - Finished converting document 10-Q_2023-11-02 in 6.25 sec.
2025-11-14 16:18:51,633 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVX\10-Q_2023-11-02' --> 'data\processed_data\CVX\10-Q_2023-11-02.md'


2025-11-14 16:18:52,539 - INFO - Going to convert document batch...
2025-11-14 16:18:52,540 - INFO - Processing document 10-Q_2024-05-02
2025-11-14 16:18:55,545 - INFO - Finished converting document 10-Q_2024-05-02 in 3.95 sec.
2025-11-14 16:18:56,827 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVX\10-Q_2024-05-02' --> 'data\processed_data\CVX\10-Q_2024-05-02.md'


2025-11-14 16:18:58,527 - INFO - Going to convert document batch...
2025-11-14 16:18:58,529 - INFO - Processing document 10-Q_2024-08-07
2025-11-14 16:19:01,680 - INFO - Finished converting document 10-Q_2024-08-07 in 4.92 sec.
2025-11-14 16:19:03,591 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVX\10-Q_2024-08-07' --> 'data\processed_data\CVX\10-Q_2024-08-07.md'


2025-11-14 16:19:05,991 - INFO - Going to convert document batch...
2025-11-14 16:19:05,993 - INFO - Processing document 10-Q_2024-11-07
2025-11-14 16:19:09,545 - INFO - Finished converting document 10-Q_2024-11-07 in 6.09 sec.
2025-11-14 16:19:11,734 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVX\10-Q_2024-11-07' --> 'data\processed_data\CVX\10-Q_2024-11-07.md'


2025-11-14 16:19:12,556 - INFO - Going to convert document batch...
2025-11-14 16:19:12,558 - INFO - Processing document 10-Q_2025-05-08
2025-11-14 16:19:14,203 - INFO - Finished converting document 10-Q_2025-05-08 in 2.52 sec.
2025-11-14 16:19:15,658 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVX\10-Q_2025-05-08' --> 'data\processed_data\CVX\10-Q_2025-05-08.md'


2025-11-14 16:19:18,256 - INFO - Going to convert document batch...
2025-11-14 16:19:18,258 - INFO - Processing document 10-Q_2025-08-07
2025-11-14 16:19:21,988 - INFO - Finished converting document 10-Q_2025-08-07 in 6.44 sec.
2025-11-14 16:19:24,308 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVX\10-Q_2025-08-07' --> 'data\processed_data\CVX\10-Q_2025-08-07.md'


2025-11-14 16:19:26,761 - INFO - Going to convert document batch...
2025-11-14 16:19:26,763 - INFO - Processing document 10-Q_2025-11-06
2025-11-14 16:19:30,357 - INFO - Finished converting document 10-Q_2025-11-06 in 6.12 sec.
2025-11-14 16:19:32,657 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:32,708 - INFO - Going to convert document batch...
2025-11-14 16:19:32,710 - INFO - Processing document 4_2023-01-27


Converted 'data\edgar_documents\CVX\10-Q_2025-11-06' --> 'data\processed_data\CVX\10-Q_2025-11-06.md'


2025-11-14 16:19:32,828 - INFO - Finished converting document 4_2023-01-27 in 0.23 sec.
2025-11-14 16:19:33,014 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:33,053 - INFO - Going to convert document batch...
2025-11-14 16:19:33,056 - INFO - Processing document 4_2023-02-01
2025-11-14 16:19:33,136 - INFO - Finished converting document 4_2023-02-01 in 0.17 sec.


Converted 'data\edgar_documents\CVX\4_2023-01-27' --> 'data\processed_data\CVX\4_2023-01-27.md'


2025-11-14 16:19:33,231 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:33,277 - INFO - Going to convert document batch...
2025-11-14 16:19:33,280 - INFO - Processing document 4_2023-02-02
2025-11-14 16:19:33,383 - INFO - Finished converting document 4_2023-02-02 in 0.17 sec.


Converted 'data\edgar_documents\CVX\4_2023-02-01' --> 'data\processed_data\CVX\4_2023-02-01.md'


2025-11-14 16:19:33,508 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:33,553 - INFO - Going to convert document batch...
2025-11-14 16:19:33,555 - INFO - Processing document 4_2023-02-09
2025-11-14 16:19:33,649 - INFO - Finished converting document 4_2023-02-09 in 0.19 sec.


Converted 'data\edgar_documents\CVX\4_2023-02-02' --> 'data\processed_data\CVX\4_2023-02-02.md'


2025-11-14 16:19:33,764 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:33,795 - INFO - Going to convert document batch...
2025-11-14 16:19:33,797 - INFO - Processing document 4_2023-02-27
2025-11-14 16:19:33,867 - INFO - Finished converting document 4_2023-02-27 in 0.12 sec.


Converted 'data\edgar_documents\CVX\4_2023-02-09' --> 'data\processed_data\CVX\4_2023-02-09.md'


2025-11-14 16:19:34,186 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:34,259 - INFO - Going to convert document batch...
2025-11-14 16:19:34,261 - INFO - Processing document 4_2023-03-01


Converted 'data\edgar_documents\CVX\4_2023-02-27' --> 'data\processed_data\CVX\4_2023-02-27.md'


2025-11-14 16:19:34,354 - INFO - Finished converting document 4_2023-03-01 in 0.23 sec.
2025-11-14 16:19:34,512 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:19:34,514 - ERROR - Input document 4_2023-05-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:19:34,517 - INFO - Going to convert document batch...
2025-11-14 16:19:34,536 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:34,568 - INFO - Going to convert document batch...
2025-11-14 16:

Converted 'data\edgar_documents\CVX\4_2023-03-01' --> 'data\processed_data\CVX\4_2023-03-01.md'
Error processing data\edgar_documents\CVX\4_2023-05-22: File format not allowed: data\edgar_documents\CVX\4_2023-05-22


2025-11-14 16:19:34,651 - INFO - Finished converting document 4_2023-05-30 in 0.14 sec.
2025-11-14 16:19:34,822 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:34,853 - INFO - Going to convert document batch...
2025-11-14 16:19:34,855 - INFO - Processing document 4_2023-06-02
2025-11-14 16:19:34,923 - INFO - Finished converting document 4_2023-06-02 in 0.16 sec.


Converted 'data\edgar_documents\CVX\4_2023-05-30' --> 'data\processed_data\CVX\4_2023-05-30.md'


2025-11-14 16:19:35,100 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:19:35,103 - ERROR - Input document 4_2023-07-07 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:19:35,107 - INFO - Going to convert document batch...
2025-11-14 16:19:35,129 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:35,180 - INFO - Going to convert document batch...
2025-11-14 16:19:35,181 - INFO - Processing document 4_2023-08-07


Converted 'data\edgar_documents\CVX\4_2023-06-02' --> 'data\processed_data\CVX\4_2023-06-02.md'
Error processing data\edgar_documents\CVX\4_2023-07-07: File format not allowed: data\edgar_documents\CVX\4_2023-07-07


2025-11-14 16:19:35,447 - INFO - Finished converting document 4_2023-08-07 in 0.33 sec.
2025-11-14 16:19:35,604 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:35,642 - INFO - Going to convert document batch...
2025-11-14 16:19:35,644 - INFO - Processing document 4_2023-08-15
2025-11-14 16:19:35,724 - INFO - Finished converting document 4_2023-08-15 in 0.17 sec.


Converted 'data\edgar_documents\CVX\4_2023-08-07' --> 'data\processed_data\CVX\4_2023-08-07.md'


2025-11-14 16:19:35,861 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:35,901 - INFO - Going to convert document batch...
2025-11-14 16:19:35,903 - INFO - Processing document 4_2023-08-29


Converted 'data\edgar_documents\CVX\4_2023-08-15' --> 'data\processed_data\CVX\4_2023-08-15.md'


2025-11-14 16:19:36,007 - INFO - Finished converting document 4_2023-08-29 in 0.19 sec.
2025-11-14 16:19:36,284 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:19:36,287 - ERROR - Input document 4_2023-10-23 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))


Converted 'data\edgar_documents\CVX\4_2023-08-29' --> 'data\processed_data\CVX\4_2023-08-29.md'


2025-11-14 16:19:36,298 - INFO - Going to convert document batch...
2025-11-14 16:19:36,368 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:19:36,370 - ERROR - Input document 4_2023-10-24 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:19:36,373 - INFO - Going to convert document batch...
2025-11-14 16:19:36,425 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:19:36,427 - ERROR - Input document 4_2023-10-26 with format None does not matc

Error processing data\edgar_documents\CVX\4_2023-10-23: File format not allowed: data\edgar_documents\CVX\4_2023-10-23
Error processing data\edgar_documents\CVX\4_2023-10-24: File format not allowed: data\edgar_documents\CVX\4_2023-10-24
Error processing data\edgar_documents\CVX\4_2023-10-26: File format not allowed: data\edgar_documents\CVX\4_2023-10-26
Error processing data\edgar_documents\CVX\4_2023-10-27: File format not allowed: data\edgar_documents\CVX\4_2023-10-27


2025-11-14 16:19:36,481 - ERROR - Input document 4_2023-11-02 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:19:36,485 - INFO - Going to convert document batch...
2025-11-14 16:19:36,508 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:36,548 - INFO - Going to convert document batch...
2025-11-14 16:19:36,550 - INFO - Processing document 4_2023-11-29
2025-11-14 16:19:36,640 - INFO - Finished converting document 4_2023-11-29 in 0.16 sec.


Error processing data\edgar_documents\CVX\4_2023-11-02: File format not allowed: data\edgar_documents\CVX\4_2023-11-02


2025-11-14 16:19:36,875 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:19:36,876 - ERROR - Input document 4_2023-12-08 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:19:36,881 - INFO - Going to convert document batch...


Converted 'data\edgar_documents\CVX\4_2023-11-29' --> 'data\processed_data\CVX\4_2023-11-29.md'
Error processing data\edgar_documents\CVX\4_2023-12-08: File format not allowed: data\edgar_documents\CVX\4_2023-12-08


2025-11-14 16:19:36,986 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:37,047 - INFO - Going to convert document batch...
2025-11-14 16:19:37,049 - INFO - Processing document 4_2023-12-20
2025-11-14 16:19:37,213 - INFO - Finished converting document 4_2023-12-20 in 0.34 sec.
2025-11-14 16:19:37,371 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:37,406 - INFO - Going to convert document batch...
2025-11-14 16:19:37,408 - INFO - Processing document 4_2024-02-02
2025-11-14 16:19:37,477 - INFO - Finished converting document 4_2024-02-02 in 0.16 sec.


Converted 'data\edgar_documents\CVX\4_2023-12-20' --> 'data\processed_data\CVX\4_2023-12-20.md'


2025-11-14 16:19:37,597 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:37,634 - INFO - Going to convert document batch...
2025-11-14 16:19:37,636 - INFO - Processing document 4_2024-02-08
2025-11-14 16:19:37,730 - INFO - Finished converting document 4_2024-02-08 in 0.19 sec.


Converted 'data\edgar_documents\CVX\4_2024-02-02' --> 'data\processed_data\CVX\4_2024-02-02.md'


2025-11-14 16:19:37,849 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:37,886 - INFO - Going to convert document batch...
2025-11-14 16:19:37,888 - INFO - Processing document 4_2024-03-06
2025-11-14 16:19:38,001 - INFO - Finished converting document 4_2024-03-06 in 0.17 sec.


Converted 'data\edgar_documents\CVX\4_2024-02-08' --> 'data\processed_data\CVX\4_2024-02-08.md'


2025-11-14 16:19:38,143 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:19:38,145 - ERROR - Input document 4_2024-03-22 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:19:38,146 - INFO - Going to convert document batch...
2025-11-14 16:19:38,168 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:19:38,170 - ERROR - Input document 4_2024-04-03 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <Input

Converted 'data\edgar_documents\CVX\4_2024-03-06' --> 'data\processed_data\CVX\4_2024-03-06.md'
Error processing data\edgar_documents\CVX\4_2024-03-22: File format not allowed: data\edgar_documents\CVX\4_2024-03-22
Error processing data\edgar_documents\CVX\4_2024-04-03: File format not allowed: data\edgar_documents\CVX\4_2024-04-03


2025-11-14 16:19:38,333 - INFO - Finished converting document 4_2024-04-04 in 0.16 sec.
2025-11-14 16:19:38,620 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\CVX\4_2024-04-04' --> 'data\processed_data\CVX\4_2024-04-04.md'


2025-11-14 16:19:38,621 - ERROR - Input document 4_2024-04-26 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:19:38,635 - INFO - Going to convert document batch...
2025-11-14 16:19:38,656 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:38,706 - INFO - Going to convert document batch...
2025-11-14 16:19:38,708 - INFO - Processing document 4_2024-04-29
2025-11-14 16:19:38,798 - INFO - Finished converting document 4_2024-04-29 in 0.16 sec.


Error processing data\edgar_documents\CVX\4_2024-04-26: File format not allowed: data\edgar_documents\CVX\4_2024-04-26


2025-11-14 16:19:38,930 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:38,959 - INFO - Going to convert document batch...
2025-11-14 16:19:38,962 - INFO - Processing document 4_2024-05-06
2025-11-14 16:19:39,048 - INFO - Finished converting document 4_2024-05-06 in 0.16 sec.


Converted 'data\edgar_documents\CVX\4_2024-04-29' --> 'data\processed_data\CVX\4_2024-04-29.md'


2025-11-14 16:19:39,167 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:39,202 - INFO - Going to convert document batch...
2025-11-14 16:19:39,204 - INFO - Processing document 4_2024-05-13
2025-11-14 16:19:39,284 - INFO - Finished converting document 4_2024-05-13 in 0.17 sec.


Converted 'data\edgar_documents\CVX\4_2024-05-06' --> 'data\processed_data\CVX\4_2024-05-06.md'


2025-11-14 16:19:39,410 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:39,453 - INFO - Going to convert document batch...
2025-11-14 16:19:39,456 - INFO - Processing document 4_2024-05-23
2025-11-14 16:19:39,552 - INFO - Finished converting document 4_2024-05-23 in 0.19 sec.


Converted 'data\edgar_documents\CVX\4_2024-05-13' --> 'data\processed_data\CVX\4_2024-05-13.md'


2025-11-14 16:19:39,659 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:39,691 - INFO - Going to convert document batch...
2025-11-14 16:19:39,693 - INFO - Processing document 4_2024-05-28
2025-11-14 16:19:39,788 - INFO - Finished converting document 4_2024-05-28 in 0.14 sec.


Converted 'data\edgar_documents\CVX\4_2024-05-23' --> 'data\processed_data\CVX\4_2024-05-23.md'


2025-11-14 16:19:39,898 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:39,925 - INFO - Going to convert document batch...
2025-11-14 16:19:39,927 - INFO - Processing document 4_2024-05-30
2025-11-14 16:19:40,013 - INFO - Finished converting document 4_2024-05-30 in 0.14 sec.


Converted 'data\edgar_documents\CVX\4_2024-05-28' --> 'data\processed_data\CVX\4_2024-05-28.md'


2025-11-14 16:19:40,103 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:40,171 - INFO - Going to convert document batch...
2025-11-14 16:19:40,173 - INFO - Processing document 4_2024-08-08


Converted 'data\edgar_documents\CVX\4_2024-05-30' --> 'data\processed_data\CVX\4_2024-05-30.md'


2025-11-14 16:19:40,514 - INFO - Finished converting document 4_2024-08-08 in 0.42 sec.
2025-11-14 16:19:40,620 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:40,654 - INFO - Going to convert document batch...
2025-11-14 16:19:40,655 - INFO - Processing document 4_2024-08-22
2025-11-14 16:19:40,718 - INFO - Finished converting document 4_2024-08-22 in 0.11 sec.


Converted 'data\edgar_documents\CVX\4_2024-08-08' --> 'data\processed_data\CVX\4_2024-08-08.md'
Converted 'data\edgar_documents\CVX\4_2024-08-22' --> 'data\processed_data\CVX\4_2024-08-22.md'


2025-11-14 16:19:40,821 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:40,857 - INFO - Going to convert document batch...
2025-11-14 16:19:40,859 - INFO - Processing document 4_2024-09-04
2025-11-14 16:19:40,940 - INFO - Finished converting document 4_2024-09-04 in 0.14 sec.
2025-11-14 16:19:41,095 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:41,153 - INFO - Going to convert document batch...
2025-11-14 16:19:41,155 - INFO - Processing document 4_2024-11-18
2025-11-14 16:19:41,233 - INFO - Finished converting document 4_2024-11-18 in 0.16 sec.


Converted 'data\edgar_documents\CVX\4_2024-09-04' --> 'data\processed_data\CVX\4_2024-09-04.md'


2025-11-14 16:19:41,342 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:41,382 - INFO - Going to convert document batch...
2025-11-14 16:19:41,385 - INFO - Processing document 4_2024-12-04
2025-11-14 16:19:41,470 - INFO - Finished converting document 4_2024-12-04 in 0.16 sec.


Converted 'data\edgar_documents\CVX\4_2024-11-18' --> 'data\processed_data\CVX\4_2024-11-18.md'


2025-11-14 16:19:41,566 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:41,642 - INFO - Going to convert document batch...
2025-11-14 16:19:41,644 - INFO - Processing document 4_2024-12-19


Converted 'data\edgar_documents\CVX\4_2024-12-04' --> 'data\processed_data\CVX\4_2024-12-04.md'


2025-11-14 16:19:41,812 - INFO - Finished converting document 4_2024-12-19 in 0.27 sec.
2025-11-14 16:19:42,087 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:42,133 - INFO - Going to convert document batch...
2025-11-14 16:19:42,135 - INFO - Processing document 4_2025-02-04


Converted 'data\edgar_documents\CVX\4_2024-12-19' --> 'data\processed_data\CVX\4_2024-12-19.md'


2025-11-14 16:19:42,248 - INFO - Finished converting document 4_2025-02-04 in 0.22 sec.
2025-11-14 16:19:42,393 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:42,440 - INFO - Going to convert document batch...
2025-11-14 16:19:42,443 - INFO - Processing document 4_2025-02-06
2025-11-14 16:19:42,530 - INFO - Finished converting document 4_2025-02-06 in 0.16 sec.


Converted 'data\edgar_documents\CVX\4_2025-02-04' --> 'data\processed_data\CVX\4_2025-02-04.md'


2025-11-14 16:19:42,670 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:42,778 - INFO - Going to convert document batch...
2025-11-14 16:19:42,781 - INFO - Processing document 4_2025-02-11


Converted 'data\edgar_documents\CVX\4_2025-02-06' --> 'data\processed_data\CVX\4_2025-02-06.md'


2025-11-14 16:19:42,905 - INFO - Finished converting document 4_2025-02-11 in 0.30 sec.
2025-11-14 16:19:43,068 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:43,112 - INFO - Going to convert document batch...
2025-11-14 16:19:43,114 - INFO - Processing document 4_2025-02-12


Converted 'data\edgar_documents\CVX\4_2025-02-11' --> 'data\processed_data\CVX\4_2025-02-11.md'


2025-11-14 16:19:43,228 - INFO - Finished converting document 4_2025-02-12 in 0.22 sec.
2025-11-14 16:19:43,354 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:19:43,356 - ERROR - Input document 4_2025-02-24 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:19:43,359 - INFO - Going to convert document batch...
2025-11-14 16:19:43,383 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:19:43,385 - ERROR - Input document 4_2025-02-25 with forma

Converted 'data\edgar_documents\CVX\4_2025-02-12' --> 'data\processed_data\CVX\4_2025-02-12.md'
Error processing data\edgar_documents\CVX\4_2025-02-24: File format not allowed: data\edgar_documents\CVX\4_2025-02-24
Error processing data\edgar_documents\CVX\4_2025-02-25: File format not allowed: data\edgar_documents\CVX\4_2025-02-25


2025-11-14 16:19:43,544 - INFO - Finished converting document 4_2025-02-27 in 0.16 sec.
2025-11-14 16:19:43,742 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:43,786 - INFO - Going to convert document batch...
2025-11-14 16:19:43,789 - INFO - Processing document 4_2025-03-05
2025-11-14 16:19:43,884 - INFO - Finished converting document 4_2025-03-05 in 0.19 sec.


Converted 'data\edgar_documents\CVX\4_2025-02-27' --> 'data\processed_data\CVX\4_2025-02-27.md'


2025-11-14 16:19:44,031 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:44,061 - INFO - Going to convert document batch...
2025-11-14 16:19:44,063 - INFO - Processing document 4_2025-05-29
2025-11-14 16:19:44,145 - INFO - Finished converting document 4_2025-05-29 in 0.16 sec.


Converted 'data\edgar_documents\CVX\4_2025-03-05' --> 'data\processed_data\CVX\4_2025-03-05.md'


2025-11-14 16:19:44,248 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:44,282 - INFO - Going to convert document batch...
2025-11-14 16:19:44,284 - INFO - Processing document 4_2025-06-04
2025-11-14 16:19:44,363 - INFO - Finished converting document 4_2025-06-04 in 0.12 sec.


Converted 'data\edgar_documents\CVX\4_2025-05-29' --> 'data\processed_data\CVX\4_2025-05-29.md'


2025-11-14 16:19:44,500 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:44,605 - INFO - Going to convert document batch...
2025-11-14 16:19:44,609 - INFO - Processing document 4_2025-07-22


Converted 'data\edgar_documents\CVX\4_2025-06-04' --> 'data\processed_data\CVX\4_2025-06-04.md'


2025-11-14 16:19:44,727 - INFO - Finished converting document 4_2025-07-22 in 0.27 sec.
2025-11-14 16:19:44,839 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:44,884 - INFO - Going to convert document batch...
2025-11-14 16:19:44,886 - INFO - Processing document 4_2025-07-30
2025-11-14 16:19:44,991 - INFO - Finished converting document 4_2025-07-30 in 0.16 sec.


Converted 'data\edgar_documents\CVX\4_2025-07-22' --> 'data\processed_data\CVX\4_2025-07-22.md'


2025-11-14 16:19:45,110 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:45,141 - INFO - Going to convert document batch...
2025-11-14 16:19:45,143 - INFO - Processing document 4_2025-08-08
2025-11-14 16:19:45,212 - INFO - Finished converting document 4_2025-08-08 in 0.11 sec.


Converted 'data\edgar_documents\CVX\4_2025-07-30' --> 'data\processed_data\CVX\4_2025-07-30.md'


2025-11-14 16:19:45,561 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:19:45,564 - ERROR - Input document 4_2025-08-11 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:19:45,569 - INFO - Going to convert document batch...
2025-11-14 16:19:45,596 - INFO - detected formats: [<InputFormat.XML_USPTO: 'xml_uspto'>]


Converted 'data\edgar_documents\CVX\4_2025-08-08' --> 'data\processed_data\CVX\4_2025-08-08.md'
Error processing data\edgar_documents\CVX\4_2025-08-11: File format not allowed: data\edgar_documents\CVX\4_2025-08-11


2025-11-14 16:19:45,597 - ERROR - Input document 4_2025-08-12 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:19:45,602 - INFO - Going to convert document batch...
2025-11-14 16:19:45,625 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:45,673 - INFO - Going to convert document batch...
2025-11-14 16:19:45,675 - INFO - Processing document 4_2025-08-26
2025-11-14 16:19:45,796 - INFO - Finished converting document 4_2025-08-26 in 0.19 sec.


Error processing data\edgar_documents\CVX\4_2025-08-12: File format not allowed: data\edgar_documents\CVX\4_2025-08-12


2025-11-14 16:19:45,938 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:45,974 - INFO - Going to convert document batch...
2025-11-14 16:19:45,975 - INFO - Processing document 4_2025-09-03


Converted 'data\edgar_documents\CVX\4_2025-08-26' --> 'data\processed_data\CVX\4_2025-08-26.md'


2025-11-14 16:19:46,162 - INFO - Finished converting document 4_2025-09-03 in 0.23 sec.
2025-11-14 16:19:46,330 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:46,389 - INFO - Going to convert document batch...
2025-11-14 16:19:46,391 - INFO - Processing document 8-K_2023-01-27
2025-11-14 16:19:46,489 - INFO - Finished converting document 8-K_2023-01-27 in 0.20 sec.


Converted 'data\edgar_documents\CVX\4_2025-09-03' --> 'data\processed_data\CVX\4_2025-09-03.md'


2025-11-14 16:19:46,583 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:46,633 - INFO - Going to convert document batch...
2025-11-14 16:19:46,635 - INFO - Processing document 8-K_2023-04-28


Converted 'data\edgar_documents\CVX\8-K_2023-01-27' --> 'data\processed_data\CVX\8-K_2023-01-27.md'


2025-11-14 16:19:47,658 - INFO - Finished converting document 8-K_2023-04-28 in 1.12 sec.
2025-11-14 16:19:47,752 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:47,793 - INFO - Going to convert document batch...
2025-11-14 16:19:47,795 - INFO - Processing document 8-K_2023-05-22
2025-11-14 16:19:47,868 - INFO - Finished converting document 8-K_2023-05-22 in 0.16 sec.


Converted 'data\edgar_documents\CVX\8-K_2023-04-28' --> 'data\processed_data\CVX\8-K_2023-04-28.md'


2025-11-14 16:19:48,093 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVX\8-K_2023-05-22' --> 'data\processed_data\CVX\8-K_2023-05-22.md'


2025-11-14 16:19:48,211 - INFO - Going to convert document batch...
2025-11-14 16:19:48,212 - INFO - Processing document 8-K_2023-06-02
2025-11-14 16:19:48,427 - INFO - Finished converting document 8-K_2023-06-02 in 0.45 sec.
2025-11-14 16:19:48,679 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:48,707 - INFO - Going to convert document batch...
2025-11-14 16:19:48,709 - INFO - Processing document 8-K_2023-07-24
2025-11-14 16:19:48,767 - INFO - Finished converting document 8-K_2023-07-24 in 0.16 sec.


Converted 'data\edgar_documents\CVX\8-K_2023-06-02' --> 'data\processed_data\CVX\8-K_2023-06-02.md'


2025-11-14 16:19:48,845 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:48,883 - INFO - Going to convert document batch...
2025-11-14 16:19:48,884 - INFO - Processing document 8-K_2023-07-26
2025-11-14 16:19:48,950 - INFO - Finished converting document 8-K_2023-07-26 in 0.14 sec.


Converted 'data\edgar_documents\CVX\8-K_2023-07-24' --> 'data\processed_data\CVX\8-K_2023-07-24.md'
Converted 'data\edgar_documents\CVX\8-K_2023-07-26' --> 'data\processed_data\CVX\8-K_2023-07-26.md'


2025-11-14 16:19:49,022 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:49,070 - INFO - Going to convert document batch...
2025-11-14 16:19:49,072 - INFO - Processing document 8-K_2023-07-28
2025-11-14 16:19:49,151 - INFO - Finished converting document 8-K_2023-07-28 in 0.17 sec.
2025-11-14 16:19:49,212 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:49,239 - INFO - Going to convert document batch...
2025-11-14 16:19:49,240 - INFO - Processing document 8-K_2023-08-07
2025-11-14 16:19:49,292 - INFO - Finished converting document 8-K_2023-08-07 in 0.11 sec.


Converted 'data\edgar_documents\CVX\8-K_2023-07-28' --> 'data\processed_data\CVX\8-K_2023-07-28.md'
Converted 'data\edgar_documents\CVX\8-K_2023-08-07' --> 'data\processed_data\CVX\8-K_2023-08-07.md'


2025-11-14 16:19:49,387 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:49,426 - INFO - Going to convert document batch...
2025-11-14 16:19:49,427 - INFO - Processing document 8-K_2023-10-23
2025-11-14 16:19:49,539 - INFO - Finished converting document 8-K_2023-10-23 in 0.22 sec.
2025-11-14 16:19:49,690 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:49,724 - INFO - Going to convert document batch...
2025-11-14 16:19:49,725 - INFO - Processing document 8-K_2023-10-27
2025-11-14 16:19:49,789 - INFO - Finished converting document 8-K_2023-10-27 in 0.14 sec.


Converted 'data\edgar_documents\CVX\8-K_2023-10-23' --> 'data\processed_data\CVX\8-K_2023-10-23.md'
Converted 'data\edgar_documents\CVX\8-K_2023-10-27' --> 'data\processed_data\CVX\8-K_2023-10-27.md'


2025-11-14 16:19:49,890 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:49,931 - INFO - Going to convert document batch...
2025-11-14 16:19:49,934 - INFO - Processing document 8-K_2023-11-24
2025-11-14 16:19:49,996 - INFO - Finished converting document 8-K_2023-11-24 in 0.17 sec.
2025-11-14 16:19:50,067 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:50,114 - INFO - Going to convert document batch...
2025-11-14 16:19:50,117 - INFO - Processing document 8-K_2023-12-08
2025-11-14 16:19:50,194 - INFO - Finished converting document 8-K_2023-12-08 in 0.14 sec.


Converted 'data\edgar_documents\CVX\8-K_2023-11-24' --> 'data\processed_data\CVX\8-K_2023-11-24.md'


2025-11-14 16:19:50,367 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:50,397 - INFO - Going to convert document batch...
2025-11-14 16:19:50,398 - INFO - Processing document 8-K_2024-01-02
2025-11-14 16:19:50,436 - INFO - Finished converting document 8-K_2024-01-02 in 0.09 sec.
2025-11-14 16:19:50,477 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:50,516 - INFO - Going to convert document batch...
2025-11-14 16:19:50,517 - INFO - Processing document 8-K_2024-02-02


Converted 'data\edgar_documents\CVX\8-K_2023-12-08' --> 'data\processed_data\CVX\8-K_2023-12-08.md'
Converted 'data\edgar_documents\CVX\8-K_2024-01-02' --> 'data\processed_data\CVX\8-K_2024-01-02.md'


2025-11-14 16:19:50,595 - INFO - Finished converting document 8-K_2024-02-02 in 0.14 sec.
2025-11-14 16:19:50,693 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:50,716 - INFO - Going to convert document batch...
2025-11-14 16:19:50,717 - INFO - Processing document 8-K_2024-04-26
2025-11-14 16:19:50,749 - INFO - Finished converting document 8-K_2024-04-26 in 0.11 sec.
2025-11-14 16:19:50,780 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:50,811 - INFO - Going to convert document batch...
2025-11-14 16:19:50,812 - INFO - Processing document 8-K_2024-05-31


Converted 'data\edgar_documents\CVX\8-K_2024-02-02' --> 'data\processed_data\CVX\8-K_2024-02-02.md'
Converted 'data\edgar_documents\CVX\8-K_2024-04-26' --> 'data\processed_data\CVX\8-K_2024-04-26.md'


2025-11-14 16:19:50,867 - INFO - Finished converting document 8-K_2024-05-31 in 0.09 sec.
2025-11-14 16:19:50,978 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:50,995 - INFO - Going to convert document batch...
2025-11-14 16:19:50,996 - INFO - Processing document 8-K_2024-07-31
2025-11-14 16:19:51,023 - INFO - Finished converting document 8-K_2024-07-31 in 0.06 sec.
2025-11-14 16:19:51,082 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:51,097 - INFO - Going to convert document batch...
2025-11-14 16:19:51,098 - INFO - Processing document 8-K_2024-08-02
2025-11-14 16:19:51,133 - INFO - Finished converting document 8-K_2024-08-02 in 0.08 sec.


Converted 'data\edgar_documents\CVX\8-K_2024-05-31' --> 'data\processed_data\CVX\8-K_2024-05-31.md'
Converted 'data\edgar_documents\CVX\8-K_2024-07-31' --> 'data\processed_data\CVX\8-K_2024-07-31.md'


2025-11-14 16:19:51,174 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:51,192 - INFO - Going to convert document batch...
2025-11-14 16:19:51,195 - INFO - Processing document 8-K_2024-09-30
2025-11-14 16:19:51,229 - INFO - Finished converting document 8-K_2024-09-30 in 0.08 sec.
2025-11-14 16:19:51,282 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:51,300 - INFO - Going to convert document batch...
2025-11-14 16:19:51,302 - INFO - Processing document 8-K_2024-10-07
2025-11-14 16:19:51,340 - INFO - Finished converting document 8-K_2024-10-07 in 0.09 sec.


Converted 'data\edgar_documents\CVX\8-K_2024-08-02' --> 'data\processed_data\CVX\8-K_2024-08-02.md'
Converted 'data\edgar_documents\CVX\8-K_2024-09-30' --> 'data\processed_data\CVX\8-K_2024-09-30.md'


2025-11-14 16:19:51,374 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:51,394 - INFO - Going to convert document batch...
2025-11-14 16:19:51,395 - INFO - Processing document 8-K_2024-11-01
2025-11-14 16:19:51,429 - INFO - Finished converting document 8-K_2024-11-01 in 0.06 sec.
2025-11-14 16:19:51,462 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:51,474 - INFO - Going to convert document batch...
2025-11-14 16:19:51,475 - INFO - Processing document 8-K_2024-12-10
2025-11-14 16:19:51,511 - INFO - Finished converting document 8-K_2024-12-10 in 0.08 sec.
2025-11-14 16:19:51,542 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\CVX\8-K_2024-10-07' --> 'data\processed_data\CVX\8-K_2024-10-07.md'
Converted 'data\edgar_documents\CVX\8-K_2024-11-01' --> 'data\processed_data\CVX\8-K_2024-11-01.md'
Converted 'data\edgar_documents\CVX\8-K_2024-12-10' --> 'data\processed_data\CVX\8-K_2024-12-10.md'


2025-11-14 16:19:51,566 - INFO - Going to convert document batch...
2025-11-14 16:19:51,567 - INFO - Processing document 8-K_2025-01-31
2025-11-14 16:19:51,614 - INFO - Finished converting document 8-K_2025-01-31 in 0.08 sec.
2025-11-14 16:19:51,720 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:51,734 - INFO - Going to convert document batch...
2025-11-14 16:19:51,735 - INFO - Processing document 8-K_2025-02-26
2025-11-14 16:19:51,764 - INFO - Finished converting document 8-K_2025-02-26 in 0.11 sec.
2025-11-14 16:19:51,798 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:51,814 - INFO - Going to convert document batch...
2025-11-14 16:19:51,815 - INFO - Processing document 8-K_2025-03-17
2025-11-14 16:19:51,839 - INFO - Finished converting document 8-K_2025-03-17 in 0.06 sec.


Converted 'data\edgar_documents\CVX\8-K_2025-01-31' --> 'data\processed_data\CVX\8-K_2025-01-31.md'
Converted 'data\edgar_documents\CVX\8-K_2025-02-26' --> 'data\processed_data\CVX\8-K_2025-02-26.md'


2025-11-14 16:19:51,878 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:51,898 - INFO - Going to convert document batch...
2025-11-14 16:19:51,899 - INFO - Processing document 8-K_2025-05-02
2025-11-14 16:19:51,947 - INFO - Finished converting document 8-K_2025-05-02 in 0.09 sec.
2025-11-14 16:19:52,000 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:52,034 - INFO - Going to convert document batch...
2025-11-14 16:19:52,035 - INFO - Processing document 8-K_2025-05-30


Converted 'data\edgar_documents\CVX\8-K_2025-03-17' --> 'data\processed_data\CVX\8-K_2025-03-17.md'
Converted 'data\edgar_documents\CVX\8-K_2025-05-02' --> 'data\processed_data\CVX\8-K_2025-05-02.md'


2025-11-14 16:19:52,085 - INFO - Finished converting document 8-K_2025-05-30 in 0.11 sec.
2025-11-14 16:19:52,201 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:52,216 - INFO - Going to convert document batch...
2025-11-14 16:19:52,217 - INFO - Processing document 8-K_2025-07-18
2025-11-14 16:19:52,248 - INFO - Finished converting document 8-K_2025-07-18 in 0.11 sec.
2025-11-14 16:19:52,290 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:52,317 - INFO - Going to convert document batch...
2025-11-14 16:19:52,318 - INFO - Processing document 8-K_2025-07-29


Converted 'data\edgar_documents\CVX\8-K_2025-05-30' --> 'data\processed_data\CVX\8-K_2025-05-30.md'
Converted 'data\edgar_documents\CVX\8-K_2025-07-18' --> 'data\processed_data\CVX\8-K_2025-07-18.md'


2025-11-14 16:19:52,375 - INFO - Finished converting document 8-K_2025-07-29 in 0.11 sec.
2025-11-14 16:19:52,501 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:52,527 - INFO - Going to convert document batch...
2025-11-14 16:19:52,532 - INFO - Processing document 8-K_2025-08-01
2025-11-14 16:19:52,572 - INFO - Finished converting document 8-K_2025-08-01 in 0.16 sec.


Converted 'data\edgar_documents\CVX\8-K_2025-07-29' --> 'data\processed_data\CVX\8-K_2025-07-29.md'
Converted 'data\edgar_documents\CVX\8-K_2025-08-01' --> 'data\processed_data\CVX\8-K_2025-08-01.md'


2025-11-14 16:19:52,619 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:52,640 - INFO - Going to convert document batch...
2025-11-14 16:19:52,642 - INFO - Processing document 8-K_2025-08-13
2025-11-14 16:19:52,679 - INFO - Finished converting document 8-K_2025-08-13 in 0.09 sec.
2025-11-14 16:19:52,714 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:52,732 - INFO - Going to convert document batch...
2025-11-14 16:19:52,732 - INFO - Processing document 8-K_2025-09-25
2025-11-14 16:19:52,763 - INFO - Finished converting document 8-K_2025-09-25 in 0.06 sec.
2025-11-14 16:19:52,798 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:52,812 - INFO - Going to convert document batch...
2025-11-14 16:19:52,813 - INFO - Processing document 8-K_2025-10-31
2025-11-14 16:19:52,841 - INFO - Finished converting document 8-K_2025-10-31 in 0.06 sec.
2025-11-14 16:19:52,874 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
20

Converted 'data\edgar_documents\CVX\8-K_2025-08-13' --> 'data\processed_data\CVX\8-K_2025-08-13.md'
Converted 'data\edgar_documents\CVX\8-K_2025-09-25' --> 'data\processed_data\CVX\8-K_2025-09-25.md'
Converted 'data\edgar_documents\CVX\8-K_2025-10-31' --> 'data\processed_data\CVX\8-K_2025-10-31.md'


2025-11-14 16:19:52,889 - INFO - Processing document 8-K_2025-11-03
2025-11-14 16:19:52,915 - INFO - Finished converting document 8-K_2025-11-03 in 0.05 sec.
2025-11-14 16:19:53,017 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:19:53,018 - ERROR - Input document DEF-14A_2023-04-12 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:19:53,023 - INFO - Going to convert document batch...
2025-11-14 16:19:53,109 - INFO - detected formats:

Converted 'data\edgar_documents\CVX\8-K_2025-11-03' --> 'data\processed_data\CVX\8-K_2025-11-03.md'
Error processing data\edgar_documents\CVX\DEF-14A_2023-04-12: File format not allowed: data\edgar_documents\CVX\DEF-14A_2023-04-12
Error processing data\edgar_documents\CVX\DEF-14A_2024-04-10: File format not allowed: data\edgar_documents\CVX\DEF-14A_2024-04-10


2025-11-14 16:19:53,198 - INFO - detected formats: [<InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.XML_USPTO: 'xml_uspto'>]
2025-11-14 16:19:53,200 - ERROR - Input document DEF-14A_2025-04-09 with format None does not match any allowed format: (dict_keys([<InputFormat.DOCX: 'docx'>, <InputFormat.PPTX: 'pptx'>, <InputFormat.HTML: 'html'>, <InputFormat.IMAGE: 'image'>, <InputFormat.PDF: 'pdf'>, <InputFormat.ASCIIDOC: 'asciidoc'>, <InputFormat.MD: 'md'>, <InputFormat.CSV: 'csv'>, <InputFormat.XLSX: 'xlsx'>, <InputFormat.XML_USPTO: 'xml_uspto'>, <InputFormat.XML_JATS: 'xml_jats'>, <InputFormat.METS_GBS: 'mets_gbs'>, <InputFormat.JSON_DOCLING: 'json_docling'>, <InputFormat.AUDIO: 'audio'>, <InputFormat.VTT: 'vtt'>]))
2025-11-14 16:19:53,204 - INFO - Going to convert document batch...


Error processing data\edgar_documents\CVX\DEF-14A_2025-04-09: File format not allowed: data\edgar_documents\CVX\DEF-14A_2025-04-09
Processed 88 new files. Errors: 18
Found 75 files to process in data\edgar_documents\DE


2025-11-14 16:19:53,501 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:19:57,472 - INFO - Going to convert document batch...
2025-11-14 16:19:57,474 - INFO - Initializing pipeline for SimplePipeline with options hash 995a146ad601044538e6a923bea22f4e
2025-11-14 16:19:57,475 - INFO - Processing document 10-K_2023-12-15
2025-11-14 16:20:09,155 - INFO - Finished converting document 10-K_2023-12-15 in 15.94 sec.


Converted 'data\edgar_documents\DE\10-K_2023-12-15' --> 'data\processed_data\DE\10-K_2023-12-15.md'


2025-11-14 16:20:11,616 - INFO - detected formats: [<InputFormat.HTML: 'html'>]
2025-11-14 16:20:15,862 - INFO - Going to convert document batch...
2025-11-14 16:20:15,863 - INFO - Processing document 10-K_2024-12-12
2025-11-14 16:20:28,879 - INFO - Finished converting document 10-K_2024-12-12 in 17.52 sec.
2025-11-14 16:20:30,563 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DE\10-K_2024-12-12' --> 'data\processed_data\DE\10-K_2024-12-12.md'


2025-11-14 16:20:32,851 - INFO - Going to convert document batch...
2025-11-14 16:20:32,852 - INFO - Processing document 10-Q_2023-02-23
2025-11-14 16:20:35,570 - INFO - Finished converting document 10-Q_2023-02-23 in 5.19 sec.
2025-11-14 16:20:36,236 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DE\10-Q_2023-02-23' --> 'data\processed_data\DE\10-Q_2023-02-23.md'


2025-11-14 16:20:40,030 - INFO - Going to convert document batch...
2025-11-14 16:20:40,031 - INFO - Processing document 10-Q_2023-06-01
2025-11-14 16:20:43,161 - INFO - Finished converting document 10-Q_2023-06-01 in 7.05 sec.
2025-11-14 16:20:44,092 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DE\10-Q_2023-06-01' --> 'data\processed_data\DE\10-Q_2023-06-01.md'


2025-11-14 16:20:47,248 - INFO - Going to convert document batch...
2025-11-14 16:20:47,250 - INFO - Processing document 10-Q_2023-08-31
2025-11-14 16:20:50,657 - INFO - Finished converting document 10-Q_2023-08-31 in 6.75 sec.
2025-11-14 16:20:51,614 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DE\10-Q_2023-08-31' --> 'data\processed_data\DE\10-Q_2023-08-31.md'


2025-11-14 16:20:54,136 - INFO - Going to convert document batch...
2025-11-14 16:20:54,137 - INFO - Processing document 10-Q_2024-02-29
2025-11-14 16:20:56,834 - INFO - Finished converting document 10-Q_2024-02-29 in 5.34 sec.
2025-11-14 16:20:57,530 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DE\10-Q_2024-02-29' --> 'data\processed_data\DE\10-Q_2024-02-29.md'


2025-11-14 16:21:00,567 - INFO - Going to convert document batch...
2025-11-14 16:21:00,568 - INFO - Processing document 10-Q_2024-05-30
2025-11-14 16:21:04,370 - INFO - Finished converting document 10-Q_2024-05-30 in 6.97 sec.
2025-11-14 16:21:05,243 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DE\10-Q_2024-05-30' --> 'data\processed_data\DE\10-Q_2024-05-30.md'


2025-11-14 16:21:08,180 - INFO - Going to convert document batch...
2025-11-14 16:21:08,181 - INFO - Processing document 10-Q_2024-08-29
2025-11-14 16:21:11,398 - INFO - Finished converting document 10-Q_2024-08-29 in 6.31 sec.
2025-11-14 16:21:12,616 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DE\10-Q_2024-08-29' --> 'data\processed_data\DE\10-Q_2024-08-29.md'


2025-11-14 16:21:15,133 - INFO - Going to convert document batch...
2025-11-14 16:21:15,134 - INFO - Processing document 10-Q_2025-02-27
2025-11-14 16:21:17,452 - INFO - Finished converting document 10-Q_2025-02-27 in 4.97 sec.
2025-11-14 16:21:18,319 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DE\10-Q_2025-02-27' --> 'data\processed_data\DE\10-Q_2025-02-27.md'


2025-11-14 16:21:21,070 - INFO - Going to convert document batch...
2025-11-14 16:21:21,072 - INFO - Processing document 10-Q_2025-05-29
2025-11-14 16:21:23,846 - INFO - Finished converting document 10-Q_2025-05-29 in 5.72 sec.
2025-11-14 16:21:24,528 - INFO - detected formats: [<InputFormat.HTML: 'html'>]


Converted 'data\edgar_documents\DE\10-Q_2025-05-29' --> 'data\processed_data\DE\10-Q_2025-05-29.md'
