In [None]:
#| default_exp xml

# XML

> Concise generation of XML.

In [None]:
#| export
from fastcore.utils import *

import types,json

from dataclasses import dataclass, asdict
from typing import Mapping
from functools import partial
from html import escape

In [None]:
from IPython.display import Markdown
from pprint import pprint

In [None]:
#|export
class FT(list):
    "A 'Fast Tag' structure, which is a `list` of `[tag,children,attrs]`"
    def __init__(self, tag, cs, attrs=None, void_=False, **kwargs):
        # Children must already be a tuple; `attrs` and extra keywords are merged (keywords win)
        assert isinstance(cs, tuple)
        super().__init__([tag, cs, {**(attrs or {}), **kwargs}])
        self.void_ = void_

    @property
    def tag(self): return self[0]
    @property
    def children(self): return self[1]
    @property
    def attrs(self): return self[2]

    def __setattr__(self, k, v):
        # Dunder names and the structural names are real Python attributes; everything else
        # is stored as an XML attribute under its normalised name (`data_foo` -> `data-foo`)
        if k.startswith('__') or k in ('tag','cs','attrs','void_'): return super().__setattr__(k,v)
        self.attrs[k.lstrip('_').replace('_', '-')] = v

    def __getattr__(self, k):
        # Only reached when normal lookup fails. Look the name up under the same normalised key
        # that `__setattr__` and `get` use, so a value set as `e.data_foo = 1` reads back as `e.data_foo`
        if k.startswith('__'): raise AttributeError(k)
        attrs = self.attrs
        key = k.lstrip('_').replace('_', '-')
        if key in attrs: return attrs[key]
        # Fall back to the literal name for attrs dicts that were populated directly
        if k in attrs: return attrs[k]
        raise AttributeError(k)

    def get(self, k, default=None):
        "Value of attribute `k` (normalised like `__setattr__`), or `default` if absent"
        return self[2].get(k.lstrip('_').replace('_', '-'), default)

In [None]:
#| export
def attrmap(o):
    "Map a Python keyword name `o` to the attribute name used in the output"
    if o=='_': return o
    # Aliases for names that clash with Python reserved words. `_preproc` lower-cases keys
    # before calling this function, so the camelCase aliases are listed in lower case too.
    o = dict(htmlClass='class', htmlclass='class', cls='class', _class='class', klass='class',
             _for='for', fr='for', htmlFor='for', htmlfor='for').get(o, o)
    # Leading underscores are dropped and remaining underscores become hyphens
    return o.lstrip('_').replace('_', '-')

In [None]:
#| export
def valmap(o):
    "Flatten a list-like or dict attribute value `o` into a string; other values pass through unchanged"
    # Items are stringified so non-string entries (e.g. numbers) do not make `join` raise,
    # matching the dict branch, which already formats values with an f-string
    if is_listy(o): return ' '.join(map(str, o))
    if isinstance(o, dict): return '; '.join(f"{k}:{v}" for k,v in o.items())
    return o

In [None]:
#|export
def _preproc(c, kw, attrmap=attrmap, valmap=valmap):
    "Return `(children, attrs)`: unpack a lone lazy iterable in `c`, and map the keys/values of `kw`"
    lazy_types = (types.GeneratorType, map, filter)
    # A single generator/map/filter argument stands for the children it yields
    if len(c)==1 and isinstance(c[0], lazy_types): c = tuple(c[0])
    attrs = {}
    for name,val in kw.items():
        # `None` means "attribute not given"
        if val is None: continue
        key = attrmap(name.lower())
        attrs[key] = valmap(val)
    return c,attrs

In [None]:
#| export
def ft(tag:str, *c, void_=False, attrmap=attrmap, valmap=valmap, **kw):
    "Create an `FT` structure for `to_xml()`"
    # The tag name is lower-cased; children and keyword attrs are normalised by `_preproc`
    name = tag.lower()
    children,attrs = _preproc(c, kw, attrmap=attrmap, valmap=valmap)
    return FT(name, children, attrs, void_=void_)

In [None]:
#| export
# Tags rendered without a closing tag
voids = set('area base br col command embed hr img input keygen link meta param source track wbr !doctype'.split())
_g = globals()
# Names of the tag constructors defined below (each name listed once)
_all_ = ['Head', 'Title', 'Meta', 'Link', 'Style', 'Body', 'Pre', 'Code',
    'Div', 'Span', 'P', 'H1', 'H2', 'H3', 'H4', 'H5', 'H6', 'Strong', 'Em', 'B',
    'I', 'U', 'S', 'Strike', 'Sub', 'Sup', 'Hr', 'Br', 'Img', 'A', 'Nav',
    'Ul', 'Ol', 'Li', 'Dl', 'Dt', 'Dd', 'Table', 'Thead', 'Tbody', 'Tfoot', 'Tr',
    'Th', 'Td', 'Caption', 'Col', 'Colgroup', 'Form', 'Input', 'Textarea',
    'Button', 'Select', 'Option', 'Label', 'Fieldset', 'Legend', 'Details',
    'Summary', 'Main', 'Header', 'Footer', 'Section', 'Article', 'Aside', 'Figure',
    'Figcaption', 'Mark', 'Small', 'Iframe', 'Object', 'Embed', 'Param', 'Video',
    'Audio', 'Source', 'Canvas', 'Svg', 'Math', 'Script', 'Noscript', 'Template', 'Slot']

# Define each name as `ft` pre-bound to its lower-cased tag, marking void tags
for o in _all_: _g[o] = partial(ft, o.lower(), void_=o.lower() in voids)

The main HTML tags are exported as `ft` partials.

Attributes are passed as keywords. Use 'klass' and 'fr' instead of 'class' and 'for', to avoid Python reserved word clashes.

In [None]:
#| export
def Html(*c, doctype=True, **kwargs)->FT:
    "An HTML tag, optionally preceded by `!DOCTYPE HTML`"
    html_tag = ft('html', *c, **kwargs)
    # With `doctype`, the result is a `(doctype, html)` tuple rather than a single `FT`
    if doctype: return (ft('!DOCTYPE', html=True, void_=True), html_tag)
    return html_tag

In [None]:
# Build a small page. `cls` is given as a list and `style` as a dict;
# both end up as plain strings in the attrs (see the printed structure).
samp = Html(
    Head(Title('Some page')),
    Body(Div('Some text\nanother line', Input(name='me'), Img(src="filename", data=1),
             cls=['myclass', 'another'],
             style={'padding':1, 'margin':2}))
)
pprint(samp)

(['!doctype', (), {'html': True}],
 ['html',
  (['head', (['title', ('Some page',), {}],), {}],
   ['body',
    (['div',
      ('Some text\nanother line',
       ['input', (), {'name': 'me'}],
       ['img', (), {'data': 1, 'src': 'filename'}]),
      {'class': 'myclass another', 'style': 'padding:1; margin:2'}],),
    {}]),
  {}])


The three elements of the list can also be accessed with property names, so you don't have to remember their order.

In [None]:
elem = P('Some text', id="myid")
print(elem.tag)       # same as elem[0]
print(elem.children)  # same as elem[1]
print(elem.attrs)     # same as elem[2]

p
('Some text',)
{'id': 'myid'}


You can also get and set attrs directly:

In [None]:
elem.id = 'newid'  # attribute assignment is stored in `elem.attrs`
# `get` takes an optional default that is returned for a missing attr
print(elem.id, elem.get('id'), elem.get('foo', 'missing'))
elem

newid newid missing


['p', ('Some text',), {'id': 'newid'}]

In [None]:
#| export
class Safe(str):
    "A `str` whose `__html__` returns itself, so `_escape` emits it without escaping"
    def __html__(self):
        return self

In [None]:
#| export
def _escape(s): return '' if s is None else s.__html__() if hasattr(s, '__html__') else escape(s) if isinstance(s, str) else s

In [None]:
#| export
def _to_attr(k,v):
    if isinstance(v,bool):
        if v==True : return str(k)
        if v==False: return ''
    if isinstance(v,str): v = escape(v, quote=True)
    elif isinstance(v, Mapping): v = json.dumps(v)
    else: v = str(v)
    qt = '"'
    if qt in v: qt = "'"
    return f'{k}={qt}{v}{qt}'

In [None]:
#| export
def _to_xml(elm, lvl, indent:bool):
    "Render `elm` (an `FT`-style list, a tuple of elements, an object with `__ft__`, or a scalar) at depth `lvl`"
    nl = '\n'
    # Without indentation nothing is padded and no newlines are added
    if not indent: lvl,nl = 0,''
    if elm is None: return ''
    # A tuple is a run of siblings; pass `lvl` on so siblings nested inside a tag keep their indentation
    if isinstance(elm, tuple): return f'{nl}'.join(to_xml(o, lvl=lvl, indent=indent) for o in elm)
    if hasattr(elm, '__ft__'): elm = elm.__ft__()
    sp = ' ' * lvl
    # Anything that is not a list is text content; it is escaped and emitted without padding
    if not isinstance(elm, list): return f'{_escape(elm)}{nl}'

    tag,cs,attrs = elm
    stag = tag
    if attrs:
        # `_to_attr` returns '' for a `False` attribute; drop those so they leave no stray spaces
        sattrs = [a for a in (_to_attr(k,v) for k,v in attrs.items()) if a]
        if sattrs: stag += ' ' + ' '.join(sattrs)

    isvoid = getattr(elm, 'void_', False)
    cltag = '' if isvoid else f'</{tag}>'
    if not cs: return f'{sp}<{stag}>{cltag}{nl}'
    # A single scalar child is kept on the same line as its tag
    if len(cs)==1 and not isinstance(cs[0],(list,tuple)) and not hasattr(cs[0],'__ft__'):
        return f'{sp}<{stag}>{_escape(cs[0])}{cltag}{nl}'
    res = f'{sp}<{stag}>{nl}'
    res += ''.join(to_xml(c, lvl=lvl+2, indent=indent) for c in cs)
    if not isvoid: res += f'{sp}{cltag}{nl}'
    return Safe(res)

def to_xml(elm, lvl=0, indent:bool=True):
    "Convert `ft` element tree into an XML string"
    rendered = _to_xml(elm, lvl, indent)
    # Wrap in `Safe` so the result is not escaped again when nested or passed to `__html__` consumers
    return Safe(rendered)

# Expose rendering through the `__html__` protocol
FT.__html__ = to_xml

In [None]:
# Default rendering: `indent=True`, nested tags padded two spaces per level
h = to_xml(samp)
print(h)

<!doctype html>

<html>
  <head>
    <title>Some page</title>
  </head>
  <body>
    <div class="myclass another" style="padding:1; margin:2">
Some text
another line
      <input name="me">
      <img src="filename" data="1">
    </div>
  </body>
</html>



In [None]:
# `indent=False` adds no newlines or padding; newlines inside text content are kept
h = to_xml(samp, indent=False)
print(h)

<!doctype html><html><head><title>Some page</title></head><body><div class="myclass another" style="padding:1; margin:2">Some text
another line<input name="me"><img src="filename" data="1"></div></body></html>


Interoperability in both directions with Django and Jinja using the [`__html__()` protocol](https://jinja.palletsprojects.com/en/3.1.x/templates/#jinja-filters.escape):

In [None]:
def _esc(s): return s.__html__() if hasattr(s, '__html__') else Safe(escape(s))

# A string marked safe by another framework is inserted as-is...
r = Safe('<b>Hello from Django</b>')
print(to_xml(Div(r)))
# ...and an `FT` passed to an `__html__`-aware escape function renders itself
print(_esc(Div(P('Hello from fastcore <3'))))

<div><b>Hello from Django</b></div>

<div>
  <p>Hello from fastcore &lt;3</p>
</div>



In [None]:
#| export
def highlight(s, lang='html'):
    "Markdown to syntax-highlight `s` in language `lang`"
    fence = '```'
    # Fenced code block whose body is the rendered XML of `s`
    return f'{fence}{lang}\n{to_xml(s)}\n{fence}'

In [None]:
#| export
def showtags(s):
    "HTML that shows the escaped XML source of `s` inside `<code><pre>`"
    # Closing tags mirror the opening order so the markup is properly nested
    return f"""<code><pre>
{escape(to_xml(s))}
</pre></code>"""

# Notebook display of an `FT` is its highlighted source
FT._repr_markdown_ = highlight

In [None]:
#| export
def __getattr__(tag):
    if tag.startswith('_') or tag[0].islower(): raise AttributeError
    def _f(*c, target_id=None, **kwargs): return ft(tag, *c, target_id=target_id, **kwargs)
    return _f

In [None]:
#|export
@patch
def __call__(self:FT, *c, **kw):
    "Add children `c` and attrs `kw` to this element in place, returning it"
    children,attrs = _preproc(c,kw)
    # Children are appended after the existing ones
    if children: self[1] = self[1] + children
    if attrs:
        # New attrs override existing ones of the same name
        merged = dict(self[2])
        merged.update(attrs)
        self[2] = merged
    return self

You can also reorder the children to come *after* the attrs, if you use this alternative syntax for `FT` where the children are in a second pair of `()` (behind the scenes this is because `FT` implements `__call__` to add children).

In [None]:
# Attrs go in the first call, children in the second
Body(klass='myclass')(
    Div(style='padding:3px')(
        'Some text ',
        I(spurious=True)('in italics'),
        Input(name='me'),
        Img(src="filename", data=1)
    )
)

```html
<body class="myclass">
  <div style="padding:3px">
Some text 
    <i spurious>in italics</i>
    <input name="me">
    <img src="filename" data="1">
  </div>
</body>

```

# Export -

In [None]:
#|hide
import nbdev; nbdev.nbdev_export()