# Generate Docs

## Imports and definitions

In [1]:
import os
import shutil
import pandas as pd
import markdownify as md

In [2]:
# Directory that the generated files are written into.
output_dir = "output"

## Create DataFrames

In [3]:
# Load the eight CSV files from data/ into DataFrames. The target names and
# the file stems below are listed in the same order, one DataFrame per file.
(
    comments_df,
    posts_questions_df,
    posts_answers_df,
    posts_tag_wiki_df,
    posts_tag_wiki_excerpt_df,
    selected_tags_df,
    tags_df,
    users_df,
) = (
    pd.read_csv(f'data/{stem}.csv')
    for stem in (
        'comments',
        'posts_questions',
        'posts_answers',
        'posts_tag_wiki',
        'posts_tag_wiki_excerpt',
        'selected_tags',
        'tags',
        'users',
    )
)

## Development

In [4]:
def tag_to_title(tag_name):
    """Turn a hyphen-separated tag name into a space-separated title.

    Each hyphen-delimited piece goes through ``str.capitalize`` (first
    character upper-cased, the rest lower-cased) and the pieces are joined
    with single spaces, e.g. ``'machine-learning'`` -> ``'Machine Learning'``.
    """
    pieces = tag_name.split('-')
    return ' '.join(map(str.capitalize, pieces))

def get_header(tag_name):
    """Build the header text that is placed at the top of a tag's page.

    The result is a ``---`` line, one ``key: "value"`` line per attribute
    (currently only ``title``, produced by ``tag_to_title``), and a closing
    ``---`` followed by two newlines.
    """
    attributes = {'title': tag_to_title(tag_name)}

    lines = ['---']
    for name, text in attributes.items():
        lines.append(f'{name}: "{text}"')
    # The closing delimiter carries its own trailing newlines so the page
    # content can be appended directly after the header.
    lines.append('---\n\n')
    return '\n'.join(lines)

In [5]:
# Start from a clean output directory: drop whatever a previous run left
# behind, then recreate it empty.
try:
    shutil.rmtree(output_dir)
except FileNotFoundError:
    # Nothing to remove on a first run. Any other failure (permissions, the
    # path being a regular file, ...) is a real problem and is left to
    # propagate instead of being masked by a later FileExistsError.
    pass

os.mkdir(output_dir)

In [6]:
# Write one Markdown page per selected tag: look up the tag's wiki post,
# run its body through markdownify and prepend the generated header.
for _, row in selected_tags_df.iterrows():
    tag_name = row.tag_name

    # Single .loc call (row mask + column) instead of chained indexing.
    wiki_bodies = posts_tag_wiki_df.loc[posts_tag_wiki_df.id == row.wiki_post_id, 'body']
    if wiki_bodies.empty:
        # Same exception type the bare `.values[0]` lookup raised, but with
        # enough context to find the offending row.
        raise IndexError(
            f"no wiki post with id {row.wiki_post_id!r} found for tag {tag_name!r}"
        )
    content_md = md.markdownify(wiki_bodies.iloc[0])

    # Build the path from output_dir so the pages land in the directory that
    # was just recreated, and pin the encoding so non-ASCII wiki text does not
    # depend on the platform default.
    page_path = os.path.join(output_dir, f"{tag_name}.md")
    with open(page_path, 'w', encoding='utf-8') as f:
        f.write(get_header(tag_name) + content_md)
        