In [1]:
import re
import os

def split_markdown_by_continuation_phrase(markdown_text, phrase="（待续）"):
    """Split Markdown text into sections that each end with ``phrase``.

    Args:
        markdown_text: The full Markdown document as a single string.
        phrase: Literal marker that terminates a section. It is matched
            verbatim; regex metacharacters in it have no special meaning.

    Returns:
        A list of strings, one per occurrence of ``phrase``. Each item is
        the text preceding the marker with the marker itself appended.
        Text that follows the last marker is discarded, so a document
        without any marker yields an empty list.
    """
    # Escape the phrase so markers such as "(待续)" or "..." are treated as
    # plain text rather than as regex groups/wildcards.
    pattern = f'({re.escape(phrase)})'
    # The capturing group makes re.split keep the markers, producing
    # [text, marker, text, marker, ..., tail].
    pieces = re.split(pattern, markdown_text)
    # Pair each text with the marker that follows it; zip stops at the
    # shorter slice, which leaves out the unterminated tail.
    return [body + marker for body, marker in zip(pieces[0::2], pieces[1::2])]

def find_first_chinese_line_and_add_hash(section_content):
    """Turn the first line containing a CJK ideograph into a Markdown heading.

    The text is split on newlines, the first line that has at least one
    character in the range U+4E00..U+9FFF gets a ``# `` prefix, and the
    lines are joined back together. Leading and trailing whitespace of the
    final result is stripped. If no line qualifies, only the stripping
    is applied.
    """
    rows = section_content.split('\n')
    # Position of the first line with a Chinese character, or None.
    target = next(
        (pos for pos, row in enumerate(rows)
         if re.search(r'[\u4e00-\u9fff]', row)),
        None,
    )
    if target is not None:
        rows[target] = '# ' + rows[target]
    return '\n'.join(rows).strip()

# Load the source Markdown document.
file_path = './output/index.md'
with open(file_path, encoding='utf-8') as source:
    content = source.read()

# Break the document into sections at each continuation marker.
split_sections = split_markdown_by_continuation_phrase(content)

# Make sure the directory for the per-section files exists.
output_dir = 'split_markdown_files'
os.makedirs(output_dir, exist_ok=True)

# Write every section to its own Markdown file.
for index, section_content in enumerate(split_sections):
    # Drop everything up to and including the first newline, then trim
    # the surrounding whitespace.
    remainder = section_content.partition('\n')[2]
    trimmed = remainder.strip()
    # Promote the first line containing Chinese text to a "#" heading.
    section_content = find_first_chinese_line_and_add_hash(trimmed)

    output_file_path = os.path.join(output_dir, f"section_{index + 1}.md")
    with open(output_file_path, 'w', encoding='utf-8') as target:
        target.write(section_content)

    print(f"Section {index + 1} has been saved to '{output_file_path}'.")


Section 1 has been saved to 'split_markdown_files/section_1.md'.
Section 2 has been saved to 'split_markdown_files/section_2.md'.
Section 3 has been saved to 'split_markdown_files/section_3.md'.
Section 4 has been saved to 'split_markdown_files/section_4.md'.
Section 5 has been saved to 'split_markdown_files/section_5.md'.
Section 6 has been saved to 'split_markdown_files/section_6.md'.
Section 7 has been saved to 'split_markdown_files/section_7.md'.
Section 8 has been saved to 'split_markdown_files/section_8.md'.
Section 9 has been saved to 'split_markdown_files/section_9.md'.
Section 10 has been saved to 'split_markdown_files/section_10.md'.
Section 11 has been saved to 'split_markdown_files/section_11.md'.
Section 12 has been saved to 'split_markdown_files/section_12.md'.
Section 13 has been saved to 'split_markdown_files/section_13.md'.
Section 14 has been saved to 'split_markdown_files/section_14.md'.
Section 15 has been saved to 'split_markdown_files/section_15.md'.
Section 16 ha