From f8451aa44bf462c477ed19f4a4380c735b16e05e Mon Sep 17 00:00:00 2001
From: Thorsten Vitt
Date: Thu, 9 May 2019 11:58:32 +0200
Subject: [PATCH] Experimental timeline visualisation

---
 src/macrogen/etc/logging.yaml |   1 +
 src/macrogen/graph.py         |  23 +++-
 src/macrogen/report.py        |  73 ++++++----
 src/macrogen/timeline.html    | 243 ++++++++++++++++++++++++++++++++++
 src/macrogen/uris.py          |   5 +-
 src/macrogen/witnesses.py     |  20 ++-
 6 files changed, 332 insertions(+), 33 deletions(-)
 create mode 100644 src/macrogen/timeline.html

diff --git a/src/macrogen/etc/logging.yaml b/src/macrogen/etc/logging.yaml
index 4705bee..fae37d9 100644
--- a/src/macrogen/etc/logging.yaml
+++ b/src/macrogen/etc/logging.yaml
@@ -14,6 +14,7 @@ filters:
   levels:
     macrogen.graph: INFO
     macrogen.fes: INFO
+    macrogen.witnesses: DEBUG
   file:
     (): macrogen.logging.LevelFilter
     default: INFO
diff --git a/src/macrogen/graph.py b/src/macrogen/graph.py
index d773c7e..a279df6 100644
--- a/src/macrogen/graph.py
+++ b/src/macrogen/graph.py
@@ -1,6 +1,7 @@
 """
 Functions to build the graphs and perform their analyses.
 """
+import json
 import pickle
 import re
 from collections import defaultdict, Counter
@@ -76,6 +77,8 @@ def __init__(self, load_from: Optional[Path] = None):
         self.closure: nx.MultiDiGraph = None
         self.conflicts: List[MultiEdge] = []
         self.simple_cycles: Set[Sequence[Tuple[Node, Node]]] = set()
+        self.order: List[Reference] = None
+        self.index: Dict[Reference, int] = None

         if load_from:
             self._load_from(load_from)
@@ -214,8 +217,8 @@ def run_analysis(self):
         self._augment_details()

     def order_refs(self):
-        if hasattr(self, '_order'):
-            return self._order
+        if self.order:
+            return self.order

         logger.info('Creating sort order from DAG')

@@ -229,12 +232,17 @@ def secondary_key(node):
         nodes = nx.lexicographical_topological_sort(self.dag, key=secondary_key)
         refs = [node for node in nodes if isinstance(node, Reference)]
-        self._order = refs
-        for index, ref in enumerate(refs):
+        self.order = refs
+        self._build_index()
+        for ref, index in self.index.items():
             if ref in self.base.node:
                 self.base.node[ref]['index'] = index
+                ref.index = index
         return refs

+    def _build_index(self):
+        self.index = {ref: i for (i, ref) in enumerate(self.order, start=1)}
+
     def _augment_details(self):
         logger.info('Augmenting refs with data from graphs')
         for index, ref in enumerate(self.order_refs(), start=1):
@@ -277,6 +285,9 @@ def save(self, outfile: Path):
                 nx.write_gpickle(self.base, base_entry)
             with zip.open('simple_cycles.pickle', 'w') as sc_entry:
                 pickle.dump(self.simple_cycles, sc_entry)
+            with zip.open('order.json', 'w') as order_entry:
+                text = TextIOWrapper(order_entry, encoding='utf-8')
+                json.dump([ref.uri for ref in self.order], text)
             with zip.open('config.yaml', 'w') as config_entry:
                 config.save_config(config_entry)
             with zip.open('base.yaml', 'w') as base_entry:
@@ -291,6 +302,10 @@ def _load_from(self, load_from: Path):
                 self.base = nx.read_gpickle(base_entry)
             with zip.open('simple_cycles.pickle', 'r') as sc_entry:
                 self.simple_cycles = pickle.load(sc_entry)
+            with zip.open('order.json', 'r') as order_entry:
+                uris = json.load(order_entry)
+                self.order = [Witness.get(uri) for uri in uris]
+                self._build_index()

         # Now reconstruct the other data:
         self.working: nx.MultiDiGraph = self.base.copy()
diff --git a/src/macrogen/report.py b/src/macrogen/report.py
index 002e59b..41b68cf 100644
--- a/src/macrogen/report.py
+++ b/src/macrogen/report.py
@@ -13,6 +13,7 @@
 import networkx as nx
 import pandas as pd
+import pkg_resources
 import requests
 from lxml import etree
 from lxml.builder import ElementMaker
@@ -222,7 +223,8 @@ def write_html(filename: Path, content: str, head: str = None, breadcrumbs: List
     if head is not None:
         breadcrumbs = breadcrumbs + [dict(caption=head)]
     breadcrumbs = [dict(caption='Makrogenese-Lab', link='/macrogenesis')] + breadcrumbs
-    prefix = """
+    prefix = f"""
+
     """
     require = "requirejs(['faust_common', 'svg-pan-zoom'], function(Faust, svgPanZoom)"
     if graph_id is not None:
@@ -361,7 +363,7 @@ class RefTable(HtmlTable):
     Builds a table of references.
     """

-    def __init__(self, base: nx.MultiDiGraph, **table_attrs):
+    def __init__(self, graphs: MacrogenesisInfo, **table_attrs):
         super().__init__(data_sortable="true", **table_attrs)
         (self.column('Nr.', data_sortable="numericplus")
          .column('Knoten davor', data_sortable="numericplus")
@@ -372,7 +374,8 @@ def __init__(self, base: nx.MultiDiGraph, **table_attrs):
          .column('erster Vers', data_sortable="numericplus")
          .column('Aussagen', data_sortable="numericplus")
          .column('Konflikte', data_sortable="numericplus"))
-        self.base = base
+        self.graphs = graphs
+        self.base = graphs.base

     def reference(self, ref: Reference, index: Optional[int] = None, write_subpage: bool = False):
         """
@@ -385,7 +388,7 @@ def reference(self, ref: Reference, index: Optional[int] = None, write_subpage:
         """
         if ref in self.base:
             if index is None:
-                index = ref.rank  # self.base.node[ref]['index']
+                index = self.graphs.index.get(ref, -1)
             assertions = list(chain(self.base.in_edges(ref, data=True), self.base.out_edges(ref, data=True)))
             conflicts = [assertion for assertion in assertions if 'delete' in assertion[2] and assertion[2]['delete']]
             self.row((f'{index}', ref.rank, ref, ref, ref.earliest, ref.latest,
@@ -632,7 +635,7 @@ def report_refs(graphs: MacrogenesisInfo):
     nx.write_gpickle(graphs.base, str(target / 'base.gpickle'))

     refs = graphs.order_refs()
-    overview = RefTable(graphs.base)
+    overview = RefTable(graphs)

     for index, ref in enumerate(refs, start=1):
         overview.reference(ref, index, write_subpage=True)
@@ -1027,13 +1030,13 @@ def report_scenes(graphs: MacrogenesisInfo):
                   .column('Gesamt'))
     for scene in SceneInfo.get().scenes:
         items = WitInscrInfo.get().by_scene[scene]
-        witnessTable = RefTable(graphs.base)
+        witnessTable = RefTable(graphs)
         scene_docs = [doc for doc in items if isinstance(doc, DocumentCoverage)]
         scene_inscr = [inscr for inscr in items if isinstance(inscr, InscriptionCoverage)]
         scene_refs = scene_docs + scene_inscr
         scene_wits = {graphs.node(doc.uri, default=None) for doc in scene_refs} - {None}
         scene_graph = graphs.subgraph(*scene_wits, context=False, abs_dates=True)
-        for wit in sorted(scene_wits, key=attrgetter('rank')):
+        for wit in sorted(scene_wits, key=lambda ref: graphs.index.get(ref, 0)):
             witnessTable.reference(wit)
         basename = 'scene_' + scene.n.replace('.', '-')
         subgraph_page = Path(basename + '-subgraph.php')
@@ -1057,6 +1060,26 @@ def report_scenes(graphs: MacrogenesisInfo):
     write_html(target / "scenes.php", sceneTable.format_table(), head='nach Szene')


+def report_unused(graphs: MacrogenesisInfo):
+    unused_nodes = set(node for node in graphs.base.node if isinstance(node, Reference)) - set(graphs.dag.node)
+    not_in_dag_table = RefTable(graphs)
+    for node in unused_nodes:
+        not_in_dag_table.reference(node)
+
+    unindexed = [node for node in graphs.base.node if isinstance(node, Reference) and node not in graphs.index]
+    unindexed_table = RefTable(graphs)
+    for node in unindexed:
+        unindexed_table.reference(node)
+
+    write_html(config.path.report_dir / 'unused.php',
+               f"""
+               {len(unused_nodes)} Zeugen existieren im Ausgangsgraphen, aber nicht im DAG:
+               {not_in_dag_table.format_table()}
+               {len(unindexed)} Knoten haben auf unerklärliche Weise keinen Index:
+               {unindexed_table.format_table()}
+               """,
+               "Nicht eingeordnete Zeugen")
+
+
 def write_order_xml(graphs):
     target: Path = config.path.report_dir
@@ -1174,24 +1197,25 @@ def _dating_table():
     return stat, dating_stat, edge_df


-def report_timeline(info: MacrogenesisInfo):
-    refs = info.order_refs()
+def report_timeline(graphs: MacrogenesisInfo):
+    witinfo = WitInscrInfo.get()
+
+    def rel_scenes(ref: Reference) -> List[str]:
+        info = witinfo.get().by_uri.get(ref.uri, None)
+        if info:
+            return sorted([scene.n for scene in info.max_scenes])
+        else:
+            return []
+
+    refs = graphs.order_refs()
     data = [dict(start=ref.earliest.isoformat(), end=ref.latest.isoformat(),
-                 content=_fmt_node(ref))
+                 content=_fmt_node(ref), id=ref.filename.stem, scenes=rel_scenes(ref),
+                 index=graphs.index[ref])
             for ref in refs
             if ref.earliest > EARLIEST and ref.latest < LATEST]
-    (config.path.report_dir / 'timeline.html').write_text(f"""
-    Zeitstrahl
-    Lade Zeitstrahl ...
[… the remaining removed lines of the old inline timeline HTML are not legible in this copy …]
-    """)
+    with (config.path.report_dir / 'timeline.json').open("wt") as data_out:
+        json.dump(data, data_out)
+    (config.path.report_dir / 'timeline.html').write_bytes(pkg_resources.resource_string('macrogen', 'timeline.html'))


 def report_inscriptions(info: MacrogenesisInfo):
@@ -1213,10 +1237,10 @@ def report_inscriptions(info: MacrogenesisInfo):
                                lambda _, __, attr: attr.get('copy') or attr.get('kind') in ['inscription', 'orphan'])
     table = (HtmlTable()
-             .column('Dokument', lambda uri: _fmt_node(Witness.get(uri)))
+             .column('Dokument', lambda uri: _fmt_node(Witness.get(uri)), data_sortable_type='sigil')
              .column('Inskriptionen Makrogenese')
              .column('Inskriptionen Transkript')
-             .column('Dok.-Aussagen')
+             .column('Dok.-Aussagen', data_sortable_type='numericplus')
              .column('Graph'))

     def uri_idx(uri):
@@ -1303,4 +1327,5 @@ def ghlink(path: Path):
 def generate_reports(info: MacrogenesisInfo):
     report_functions = [fn for name, fn in globals().items() if name.startswith('report_')]
     for report in report_functions:
+        logger.info('Running %s', report.__name__)
         report(info)
diff --git a/src/macrogen/timeline.html b/src/macrogen/timeline.html
new file mode 100644
index 0000000..cd65be0
--- /dev/null
+++ b/src/macrogen/timeline.html
@@ -0,0 +1,243 @@
+Faustedition – Zeitstrahl
+Zeitstrahl wird geladen …
[… the remaining added lines of timeline.html (page markup, styles and scripts; 243 added lines in total) are not legible in this copy …]
diff --git a/src/macrogen/uris.py b/src/macrogen/uris.py
index 50beb4e..f6bfd74 100644
--- a/src/macrogen/uris.py
+++ b/src/macrogen/uris.py
@@ -164,7 +164,7 @@ class UnknownRef(Reference):
     """

     def __init__(self, uri):
-        self.uri = uri
+        super().__init__(uri)
         self.status = "unknown"

@@ -174,7 +174,7 @@ class AmbiguousRef(Reference):
     """

     def __init__(self, uri, wits):
-        self.uri = uri
+        super().__init__(uri)
         self.witnesses = frozenset(wits)
         self.status = 'ambiguous: ' + ", ".join(str(wit) for wit in sorted(self.witnesses))

@@ -207,6 +207,7 @@ class Witness(Reference):

     def __init__(self, doc_record):
         if isinstance(doc_record, dict):
+            super().__init__(doc_record.get('uri', '?'))
             self.__dict__.update(doc_record)
             self.status = '(ok)'
         else:
diff --git a/src/macrogen/witnesses.py b/src/macrogen/witnesses.py
index e7e5505..27df3d5 100644
--- a/src/macrogen/witnesses.py
+++ b/src/macrogen/witnesses.py
@@ -2,7 +2,7 @@
 from collections import defaultdict
 from itertools import chain
 from pathlib import Path
-from typing import List, Optional, Dict, Union
+from typing import List, Optional, Dict, Union, Set
 import reprlib

 from .config import config
@@ -18,6 +18,8 @@
 """

+logger = config.getLogger(__name__)
+

 def encode_sigil(sigil: str) -> str:
     """
@@ -157,6 +159,7 @@ def get(cls) -> 'SceneInfo':
         return cls._instance

     def __init__(self, et=None):
+        logger.debug('Reading scene info ...')
         if et is None:
             et = config.scenes_xml
         self.toplevel = [Scene(el) for el in et.xpath('/*/*')]
@@ -182,7 +185,6 @@ def is_relevant_for(self, first: int, last: int):
                    first <= interval['start'] and interval['end'] <= last
                    for interval in self.intervals)

-
     def _init_relevant_scenes(self):
         relevant_scenes = set()
         for scene in SceneInfo.get().scenes:
@@ -191,6 +193,16 @@ def _init_relevant_scenes(self):
             elif self.is_relevant_for(scene.first, scene.last):
                 relevant_scenes.add(scene)
         self.relevant_scenes = frozenset(relevant_scenes)
+        self.max_scenes = self._reduce_scenes(relevant_scenes)
+
+    @staticmethod
+    def _reduce_scenes(scenes: Set[Scene]) -> Set[Scene]:
+        result = set(scenes)
+        while len(result) > 1 and any(scene.parent for scene in result):
+            result = {scene.parent if scene.parent else scene for scene in result}
+        return result
+
+


 class InscriptionCoverage(IntervalsMixin):
@@ -222,11 +234,12 @@ def __init__(self, json):

 class WitInscrInfo:
     def __init__(self):
+        logger.debug('Loading document and witness coverage from bargraph ...')
         bargraph = config.genetic_bar_graph
         self.documents = [DocumentCoverage(doc) for doc in bargraph]
         self.by_scene: Dict[Scene, Union[InscriptionCoverage, DocumentCoverage]] = defaultdict(list)
         self.by_uri: Dict[str, Union[InscriptionCoverage, DocumentCoverage]] = dict()
-        for doc in self.documents:
+        for doc in config.progress(self.documents, desc='Analyzing documents', unit=' docs'):
             self.by_uri[doc.uri] = doc
             for inscription in doc.inscriptions:
                 self.by_uri[inscription.uri] = inscription
@@ -256,6 +269,7 @@ def resolve(self, arg: str, inscription: Optional[str]=None):


 def all_documents(path: Optional[Path] = None):
+    logger.debug('Reading inscription info from sources ...')
     if path is None:
         path = config.path.data.joinpath('document')
     return [Document(doc) for doc in config.progress(list(path.rglob('**/*.xml')))]
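
Since the script section of the new timeline.html is not legible in this copy of the patch, the snippet below is only a rough, hypothetical sketch of how such a page could consume the timeline.json that report_timeline() now writes. The use of the vis-timeline library, the element id "visualization" and all option values are assumptions for illustration, not taken from the patch; the sketch presumes vis.js has already been loaded by the page.

    <div id="visualization"></div>
    <script>
      // Hypothetical loader (not the patch's actual script): fetch the records
      // written by report_timeline() and hand them to a vis-timeline instance.
      // Each record carries start, end, content, id, scenes and index, exactly
      // as built in report.py above.
      fetch('timeline.json')
          .then(response => response.json())
          .then(records => {
            const items = new vis.DataSet(records);
            const container = document.getElementById('visualization');
            new vis.Timeline(container, items, {
              stack: true,          // keep overlapping date ranges in separate rows
              zoomKey: 'ctrlKey'    // zoom only while Ctrl is held
            });
          })
          .catch(error => console.error('Could not load timeline.json', error));
    </script>

Because start and end already come from Reference.earliest/latest as ISO dates, no further conversion should be needed on the client; the scenes and index fields are simply carried along for tooltips or sorting.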