In [4]:
from docx import Document

def parse_docx1(file_path: str) -> dict:
    """
    Parse tables and lists from a .docx file, returning each list as its own Python list.

    Tables are read from ``doc.tables``; every table becomes a list of rows and
    every row a list of stripped cell texts.

    Lists are detected purely by paragraph style name (case-insensitive):
    a name containing "list number" marks a numbered-list item and a name
    containing "list bullet" marks a bullet-list item. Consecutive items of the
    same kind are grouped into one list; a paragraph of the other kind or of
    any other style closes the list in progress. Paragraphs whose text is empty
    after stripping are skipped entirely, so they neither add an item nor close
    a list. Paragraphs that get their numbering some other way than through one
    of these style names are not recognised as list items.

    :param file_path: Path to the .docx file.
    :return: Dict with keys ``"tables"``, ``"numbered_lists"`` and
        ``"bullet_lists"``.
    """
    doc = Document(file_path)

    parsed_data = {
        "tables": [
            [[cell.text.strip() for cell in row.cells] for row in table.rows]
            for table in doc.tables
        ],
        "numbered_lists": [],
        "bullet_lists": [],
    }

    # Items of the list currently being collected and its kind
    # ("numbered", "bullet", or None when no list is open).
    current_list, current_type = [], None

    def flush() -> None:
        """Store the list in progress (if any) and reset the collector."""
        nonlocal current_list, current_type
        if current_list:
            parsed_data[f"{current_type}_lists"].append(current_list)
        current_list, current_type = [], None

    for paragraph in doc.paragraphs:
        text = paragraph.text.strip()
        if not text:
            continue

        # A paragraph may have no style object, and a style may have no name;
        # treat both as "not a list style" instead of crashing on .lower().
        style = paragraph.style
        style_name = ((style.name if style is not None else None) or "").lower()

        # Numbered takes precedence if a name happens to match both patterns.
        if "list number" in style_name:
            new_type = "numbered"
        elif "list bullet" in style_name:
            new_type = "bullet"
        else:
            new_type = None

        # Any change of kind (including list -> plain text) closes the open list.
        if new_type != current_type:
            flush()
            current_type = new_type
        if new_type is not None:
            current_list.append(text)

    # The document may end while a list is still open.
    flush()

    return parsed_data

In [5]:
# Parse the sample document (relative path) and keep the result for inspection in the next cell.
out = parse_docx1("someshit.docx")

In [6]:
# Show the parsed result as this cell's output.
out

{'tables': [[['Document History', 'Document History', 'Document History'],
   ['Release number', 'Release date', 'Document number'],
   ['1.0', '20 April 2006', 's05pu378.v01.doc'],
   ['2.0', '02 August 2006', 's05pu378.v02.doc'],
   ['3.0', '04 August 2006', 's05pu378.v03.doc'],
   ['4.0', '21 August 2006', 's05pu378.v04.doc'],
   ['4.1', '30 August 2010', 's05pu378.v08.docx'],
   ['4.2', '25 January 2013', 's05pu378.v10.docx'],
   ['4.3 - renumbered only', '27 July 2016', 's05pu378.v13.docx'],
   ['4.4', '24 June 2019', 's05pu378.v20.docx'],
   ['4.5', '24 August 2021', 's05pu378.v23.docx']]],
 'numbered_lists': [],
 'bullet_lists': []}