# write_pdf.py

from pathlib import Path

from jinja2 import Template
from xhtml2pdf import pisa

import access        
import create_png
import page_definition

import logging
# Configure the root logger once at import time: DEBUG level, with each record
# prefixed by timestamp, logger name and level name.
logging.basicConfig(
    format='%(asctime)s - %(name)s - %(levelname)s - %(message)s',
    level=logging.DEBUG,
)

# Jinja2 fragment that is spliced into the <body> of template_doc.
# For every entry of `plot_dicts` it emits a header div followed by a div
# holding two images. Each entry is indexed with 'header' and 'filenames';
# only filenames[0] and filenames[1] are referenced, so any further
# filenames in an entry are not rendered.
# NOTE(review): every loop iteration reuses id="section_header" and
# id="images", and the images use class "image" while the stylesheet in
# template_doc defines `.rowimage` - confirm whether this is intended.
table_doc = """
{% for plot in plot_dicts %}

<div id="section_header">
{{plot['header']}}
</div>
<div id="images">
<img class="image" src="{{plot['filenames'][0]}}">
<img class="image" src="{{plot['filenames'][1]}}">
</div>

{% endfor %}
""" 

# NOT TODO: put me back
#{% if loop.index == 4 %}
#<div style="page-break-before: always" id="plot">
#{% else %}


# Previously tried:
#    @font-face { font-family: Arial; src: url('fonts/arial.ttf') }

# Full HTML page used as the Jinja2 template source for the chart listing.
# `%` binds tighter than `+`, so `% table_doc` is applied only to the second
# string literal (the one containing `%s`); the first literal, which holds
# the <head> and CSS, is concatenated unchanged.
# Template variables: `page_header` (used as the page title) plus whatever
# table_doc references.
# NOTE(review): the @font-face rule points at the hard-coded 'D:/arial.ttf';
# the FONT constant defined later in this file is not used here - confirm
# which font location is intended.
template_doc = """<html>
<head>
    <meta http-equiv="content-type" 
          content="text/html; charset=UTF-8">
    <title>{{ page_header }}</title>
<style type="text/css">
    @page { size: A4; margin: 1cm; }
    @font-face { font-family: Arial; src: url('D:/arial.ttf') }
    * {font-family: Arial}
</style>
<style>
.rowimage {
    display: inline-block;
    margin-left: auto;
    margin-right: auto;
    height: 260px; 
}
  </style>""" + \
"""  
</head>
<body>
     %s
</body>
</html>""" % table_doc
    

# NOTE: weasyprint is not Windows-compatible; must use a different PDF renderer
#HTML(string=html_out, base_url=os.path.dirname(os.path.abspath(__file__))).write_pdf("ts.pdf", stylesheets=[CSS(string='@page {size: Letter;  margin: 0.3in 0.3in 0.3in 0.3in;}')])

# alternatives documented at https://gist.github.com/philfreo/44e2e26a65820497db234d0c66ed58ae
# python: weasyprint or xhtml2pdf.pisa

def convertHtmlToPdf(sourceHtml: str, outputFilename: str):
    """Render an HTML string into a PDF file using xhtml2pdf's pisa.

    Args:
        sourceHtml: HTML markup; it is encoded to UTF-8 bytes before being
            handed to ``pisa.CreatePDF``.
        outputFilename: path of the PDF to write. The file is opened in
            ``"w+b"`` mode, so an existing file is truncated.

    Returns:
        The ``err`` attribute of the status object returned by
        ``pisa.CreatePDF``, passed through unchanged.
        NOTE(review): in xhtml2pdf this is presumably falsy on success and
        truthy when errors occurred (i.e. not "True on success") - confirm
        against the library documentation before relying on it.
    """
    with open(outputFilename, "w+b") as pdf_handle:
        html_bytes = sourceHtml.encode('utf-8')
        status = pisa.CreatePDF(
            html_bytes,
            dest=pdf_handle,          # file handle to receive the result
            encoding='utf-8',
            show_error_as_pdf=True,
        )
    return status.err


# Path (as a string) to fonts/arial.ttf in the directory of this module.
FONT = str(Path(__file__).parent / 'fonts' / 'arial.ttf')

# Output directory, located next to this module; locate() resolves file
# names against it.
FOLDER = Path(__file__).parent / 'output'
# Create the directory on import. exist_ok=True replaces the separate
# exists() check, which could race if the directory appeared between the
# check and the mkdir() call.
FOLDER.mkdir(exist_ok=True)

# File naming convention: every generated file lives inside FOLDER.
def locate(filename):
    """Return the path of *filename* inside FOLDER, as a string."""
    target = FOLDER / filename
    return str(target)

def as_uri(filename):
    """Return the URI form (``Path.as_uri()``) of *filename* as placed by locate()."""
    located = Path(locate(filename))
    return located.as_uri()

if __name__ == "__main__":
    # Fetch one dataframe per frequency code in 'aqm'; all three are loaded,
    # but only one of them is charted below.
    dfa, dfq, dfm = [access.get_dataframe(freq) for freq in 'aqm']

    # Select the dataframe frequency to plot.
    df = dfq

    # Derived series: goods exports minus goods imports.
    # Note: `df` is the same object as `dfq`, so the new column is added to it.
    exports = df['EXPORT_GOODS_bln_usd']
    imports = df['IMPORT_GOODS_bln_usd']
    df['TRADE_SURPLUS_bln_usd'] = exports - imports

    # Manual toggle (enabled): write one PNG file per chart definition.
    if True:
        for _header, charts in page_definition.CHARTS_DICT.items():
            for chart in charts:
                data = df[chart.names]
                create_png.plot_long(data, title=chart.title, start=2005)
                create_png.save(locate(chart.filename))

    # Manual toggle (disabled): build the HTML listing and convert it to PDF.
    if False:
        template = Template(template_doc)

        # One dict per section: its header and the URIs of its chart images.
        plot_dicts = []
        for header, charts in page_definition.CHARTS_DICT.items():
            uris = [as_uri(c.filename) for c in charts]
            plot_dicts.append({'header': header, 'filenames': uris})

        template_vars = {
            'page_header': "Macroeconomic charts",
            'plot_dicts': plot_dicts,
        }
        html_out = template.render(template_vars)
        print('Created html:\n', html_out)

        # Save the rendered HTML, then read it back to check how it starts.
        listing_path = Path(locate('listing.html'))
        listing_path.write_text(html_out, encoding='utf-8')
        sig = listing_path.read_bytes()
        assert sig.startswith(b'<html>')

        # ERROR: xhtml2pdf cannot render Russian letters without patching
        convertHtmlToPdf(html_out, locate('out.pdf'))