# report_generator

In [58]:
from datetime import datetime, timezone

import pandas as pd

In [59]:
# Read the pipe-delimited occurrence records, then convert the eventDate
# column from text to pandas datetimes in the same chained expression.
df = pd.read_csv('../DwCA/occurrence.txt', sep='|').assign(
    eventDate=lambda frame: pd.to_datetime(frame['eventDate'])
)

In [60]:
def generate_report_html(title_html=None):
    """Build the report landing page as a complete HTML document string.

    Args:
        title_html: HTML fragment inserted at the top of the page container.
            When omitted, the module-level ``title_html`` variable is used if
            it has been set (the original calling convention); failing that,
            ``generate_title_html()`` is called.

    Returns:
        str: The HTML document, styled with the Bulma stylesheet from a CDN.
    """
    if title_html is None:
        # Backward compatibility: earlier callers assigned a global
        # ``title_html`` and then called this function with no arguments.
        title_html = globals().get('title_html')
        if title_html is None:
            title_html = generate_title_html()

    # Document metadata must live in <head> (not <header>, which is a body
    # element), and every <p>, <div> and <section> is explicitly closed.
    html = f'''
        <!DOCTYPE html>
        <html>
            <head>
                <meta charset="utf-8">
                <meta name="viewport" content="width=device-width, initial-scale=1">
                <title>validator2</title>
                <link rel="stylesheet" href="https://cdn.jsdelivr.net/npm/bulma@0.9.3/css/bulma.min.css">
            </head>
            <body>
                <section class="section">
                    <div class="container">
                        {title_html}

                        <p>The objective of this project is to build a public database to facilitate sharing information on new geographical 
                        occurrence records for the coconut rhinoceros beetle (CRB), <i>Oryctes rhinoceros</i>, a major pest of coconut and oil palm. 
                        CRB is currently spreading among Pacific Islands.</p>

                        <p>Instead of building,maintaining, and hosting a custom database, I decided to use the Global Biodiversity Information Facility
                        as the project database which already contains <a href="https://www.gbif.org/species/4995642">occurrence records for CRB</a>.
                        The first step is to build a <a href="https://ipt.gbif.org/manual/en/ipt/latest/dwca-guide">Darwin Core Archive</a> (DwCA) which is 
                        a biodiversity informatics data used for uploading data to GBIF.</p>
                        <p> </p><p> </p>
                        <p class="title is-4">Darwin Core Archive (under construction)</p>

                        <p><a href="DwCA/occurrence.txt">DwCA/occurrence.txt</a></p>
                        <p><a href="DwCA/meta.xml">DwCA/meta.xml</a></p>

                        <p class="title is-4">Data Products</p>

                        <p><a href="data_table.html">Data table</a></p>
                        <p><a href="crb_distribution.gif">Map of new island records for CRB (animated GBIF)</a></p>
                        <p><a href="code/timeline.html">Timeline of new island records for CRB</a></p>
                    </div>
                </section>
            </body>
        </html>
        '''
    return html

In [61]:
def generate_title_html(generated_at=None):
    """Return the HTML fragment holding the report title, subtitle and build stamp.

    Args:
        generated_at: ``datetime`` shown as the generation time. Timezone-aware
            values are converted to UTC; naive values are taken to be UTC
            already. Defaults to the current UTC time.

    Returns:
        str: Three ``<p>`` elements: title, subtitle and a "Generated by ..."
        line ending in the timestamp followed by ``UTC``.
    """
    if generated_at is None:
        # datetime.utcnow() is deprecated since Python 3.12; ask for an aware
        # "now" in UTC instead.
        generated_at = datetime.now(timezone.utc)
    if generated_at.tzinfo is not None:
        # Strip the offset so the stamp renders as "YYYY-MM-DD HH:MM:SS[.ffffff] UTC"
        # (the same text utcnow() produced) rather than "...+00:00 UTC".
        generated_at = generated_at.astimezone(timezone.utc).replace(tzinfo=None)

    html = f'''
        <p class="title is-1">CRB Geographic Distribution Project</p>
        <p class="subtitle is-3">Earliest Recorded Dates</p>
        <p>Generated by <b>crbdist/report_generator.ipynb</b> at {generated_at} UTC</p>
        '''
    return html

In [62]:
# MAIN
# Build the title fragment first: generate_report_html() reads the
# module-level `title_html` when called without arguments.
title_html = generate_title_html()

# Export the occurrence records as a standalone HTML table.
df.to_html('../data_table.html', index=False)

# Write the page as UTF-8 so the bytes on disk match the
# <meta charset="utf-8"> declaration instead of the platform default encoding.
report_html = generate_report_html()
with open('../index.html', 'w', encoding='utf-8') as f:
    f.write(report_html)

print('FINISHED')

FINISHED
