In [7]:
import csv

# Notion CSV export to read and the Markdown table file to generate from it.
CSV_PATH = 'notion/Comprehensive Collection of LLM-Related Papers and b0fc32542854456cbde923e0adb48845_all.csv'
TABLE_PATH = 'table.md'
# Column labels, in the same order in which _format_row emits its cells.
TABLE_COLUMNS = ('Category', 'Title', 'Links', 'Image')
# A Category line is kept shorter than this many characters before a <br>.
CATEGORY_WRAP_WIDTH = 50


def _clean_cell(value):
    """Return ``value`` as text that fits inside a single Markdown table cell.

    ``None`` (what ``csv.DictReader`` yields for fields missing from a short
    row) becomes an empty string.
    """
    text = value or ''
    # A raw newline would terminate the table row and an unescaped pipe would
    # open an extra column, so neutralise both.
    return ' '.join(text.splitlines()).replace('|', '\\|')


def _wrap_category(category, width=CATEGORY_WRAP_WIDTH):
    """Break ``category`` into ``<br>``-separated lines at word boundaries.

    The length check applies to the line currently being built, not to the
    whole accumulated string, so a long category wraps into several full lines
    instead of one word per line after the first break.
    """
    lines = []
    current = ''
    for word in category.split():
        candidate = f'{current} {word}' if current else word
        if current and len(candidate) >= width:
            lines.append(current)
            current = word
        else:
            current = candidate
    if current:
        lines.append(current)
    return '<br>'.join(lines)


def _format_row(row):
    """Render one CSV record as a Markdown table line (with trailing newline)."""
    category = _wrap_category(_clean_cell(row['Category']))
    title = _clean_cell(row['Title'])

    link_parts = []
    if row['ArXiv Link']:
        link_parts.append(f'[ArXiv]({row["ArXiv Link"]})')
    if row['GitHub']:
        link_parts.append(f'[GitHub]({row["GitHub"]})')
    links = ', '.join(link_parts)

    leading_cells = f'| {category} | {title} | {links} |'
    image_url = row['ImageURL']
    if image_url:
        return f'{leading_cells} <img src="{image_url}" alt="Image" style="width:100px;"> |\n'
    return f'{leading_cells} |\n'


def load_rows(csv_path):
    """Read the CSV at ``csv_path`` and return its records sorted by Category.

    Returns:
        A list with one dict per CSV record, in ascending Category order.
    """
    # utf_8_sig accepts a leading byte-order mark; newline='' lets the csv
    # module handle line endings inside quoted fields itself.
    with open(csv_path, 'r', encoding='utf_8_sig', newline='') as csv_file:
        rows = list(csv.DictReader(csv_file))
    # A short row has None for its missing fields; sort those as empty strings
    # rather than failing on a None/str comparison.
    rows.sort(key=lambda row: row['Category'] or '')
    return rows


def write_table(rows, markdown_path):
    """Write the summary line and the Markdown table for ``rows``.

    Records without a title are left out of both the table and the total, so
    the reported number matches the number of table rows.

    Returns:
        The number of records written to the table.
    """
    listed = [row for row in rows if row['Title']]
    with open(markdown_path, 'w', encoding='utf-8') as markdown_file:
        markdown_file.write(
            f'<div align="center"> Number of papers and repos in total: {len(listed)}</div>\n<br>\n\n'
        )
        markdown_file.write('| ' + ' | '.join(TABLE_COLUMNS) + ' |\n')
        markdown_file.write('| ' + ' | '.join('---' for _ in TABLE_COLUMNS) + ' |\n')
        markdown_file.writelines(_format_row(row) for row in listed)
    return len(listed)


# Notebook cells execute with __name__ == '__main__', so the table is still
# regenerated whenever this cell runs; the guard only keeps the file I/O from
# firing if this code is imported as a module.
if __name__ == '__main__':
    data = load_rows(CSV_PATH)
    num_papers = write_table(data, TABLE_PATH)



In [8]:
def combine_files(header_file, table_file, output_file):
    """Concatenate two UTF-8 text files into ``output_file``.

    The contents of ``header_file`` come first, then a blank-line separator
    (two newline characters), then the contents of ``table_file``. Both inputs
    are read completely before the output file is opened for writing.
    """
    sections = []
    for source_path in (header_file, table_file):
        with open(source_path, 'r', encoding='utf-8') as source:
            sections.append(source.read())

    with open(output_file, 'w', encoding='utf-8') as target:
        target.write('\n\n'.join(sections))

# Build README.md from the header and the generated table.
combine_files(
    header_file='header.md',
    table_file='table.md',
    output_file='README.md',
)
