# Exploring the typology of abbreviations in Sicily

## Load PyEpiDoc and corpus

In [1]:
from pyepidoc import EpiDoc, EpiDocCorpus
from pyepidoc.epidoc.epidoctypes import AbbrType
from pyepidoc.epidoc.funcs import lang, owner_doc
from pyepidoc.utils import top, listfilter
from pyepidoc.displayutils import show_elems

# Build the corpus object from the local I.Sicily data folder
# (path is relative to the notebook's working directory).
corpus = EpiDocCorpus(
    folderpath='data/isicily_master',
)

## Get all the abbreviations

In [2]:
# Materialise every element yielded by `corpus.expans` into a list so it can be
# counted and re-filtered by the cells below.
abbreviations = list(corpus.expans)
print(
    'Total abbreviations in I.Sicily corpus: ',
    len(abbreviations),
)

Loading epidoc files...
Total abbreviations in I.Sicily corpus:  4366


## Suspensions
### Find all the suspensions

In [3]:
# Keep only the abbreviations whose `abbr_type` is AbbrType.suspension.
suspensions = list(
    filter(
        lambda candidate: candidate.abbr_type == AbbrType.suspension,
        abbreviations,
    )
)

### Count and examples

In [4]:
# Report how many abbreviations were kept as suspensions.
print(
    'Total suspensions in corpus: ',
    len(suspensions),
)

Total suspensions in corpus:  3896


In [5]:
# Suspensions for which `lang()` reports Latin ('la').
latin_susp = list(
    filter(lambda elem: lang(elem) == 'la', suspensions)
)
print('of which Latin: ', len(latin_susp))

of which Latin:  3182


In [6]:
# Suspensions for which `lang()` reports Greek ('grc').
greek_susp = list(
    filter(lambda elem: lang(elem) == 'grc', suspensions)
)
print('of which Greek: ', len(greek_susp))

of which Greek:  711


In [7]:
# Suspensions whose language is neither Greek ('grc') nor Latin ('la').
other_susp = list(
    filter(lambda elem: lang(elem) not in ('grc', 'la'), suspensions)
)
print('of which other: ', len(other_susp))

of which other:  3


### What are these others?!

In [8]:
# List the suspensions that fell outside the Greek/Latin buckets.
other_susp_listing = show_elems(other_susp)
print(other_susp_listing)

- ISic020131: λε̄́(κυθος) (xly-Grek)
- ISic020737: ϝι(ταριον) (scx-Grek)
- ISic020737: wi(tarion) (scx-Latn)


### First 10 examples

In [10]:
# Show a short sample rather than the full list of suspensions.
sample_suspensions = top(suspensions, 10)
print('First 10 examples:')
print(show_elems(sample_suspensions))

First 10 examples:
- ISic000001: man(ibus) (la)
- ISic000001: vix(it) (la)
- ISic000001: a(nnis) (la)
- ISic000002: D(is) (la)
- ISic000002: M(anibus) (la)
- ISic000002: s(acrum) (la)
- ISic000002: vix(it) (la)
- ISic000002: Melant(e) (la)
- ISic000003: Man(ibus) (la)
- ISic000003: vix(it) (la)


In [27]:
# Look up the document that owns the first suspension and print its
# `edition_text` so the abbreviation can be read in context.
first_suspension = suspensions[0]
doc000001 = owner_doc(first_suspension)
print(doc000001.edition_text)


                
                    Dis · manibus
                    · Zethi
                    vixit · annis · VI
                
            


## Contractions

In [11]:
# Keep only the abbreviations whose `abbr_type` is AbbrType.contraction.
contractions = list(
    filter(
        lambda candidate: candidate.abbr_type == AbbrType.contraction,
        abbreviations,
    )
)
print('Total contractions in corpus: ', len(contractions))

Total contractions in corpus:  63


In [12]:
# Contractions for which `lang()` reports Latin ('la').
latin_contractions = list(
    filter(lambda elem: lang(elem) == 'la', contractions)
)
print('of which Latin: ', len(latin_contractions))

of which Latin:  11


In [13]:
# Contractions for which `lang()` reports Greek ('grc').
greek_contractions = list(
    filter(lambda elem: lang(elem) == 'grc', contractions)
)
print('of which Greek: ', len(greek_contractions))

of which Greek:  52


In [14]:
# Contractions whose language is neither Greek ('grc') nor Latin ('la').
other_contractions = [contraction for contraction in contractions
    if lang(contraction) not in ('grc', 'la')]
# This is the residual "other" bucket, so it must not be labelled as Greek
# (the Greek count is reported by the preceding cell).
print('of which other: ', len(other_contractions))

of which Greek:  0


In [15]:
# Copy the first ten contractions returned by `top` into a list for display.
top_10_contractions = list(top(contractions, 10))

print('First 10 examples:')
contraction_listing = show_elems(top_10_contractions)
print(contraction_listing)

First 10 examples:
- ISic000026: m(aiestati)qu (la)
- ISic000038: v(i)xit (la)
- ISic000043: Ian(uaria)s (la)
- ISic000080: D(e)i (la)
- ISic000447: Kal(enda)s (la)
- ISic000575: qu(a)e (la)
- ISic000755: co(n)s(ulibu)s (la)
- ISic000794: ζήσ(ασ)α (grc)
- ISic000881: θ(εο)ῦ (grc)
- ISic000970: Χ(ριστό)ς (grc)


## Contraction with suspension

In [16]:
# Keep only the abbreviations typed as AbbrType.contraction_with_suspension.
c_with_s = list(
    filter(
        lambda candidate: candidate.abbr_type == AbbrType.contraction_with_suspension,
        abbreviations,
    )
)
print(
    'Total contractions with suspension in corpus: ',
    len(c_with_s),
)

Total contractions with suspension in corpus:  62


In [17]:
# Contractions-with-suspension for which `lang()` reports Latin ('la').
latin_c_with_s = listfilter(
    lambda elem: lang(elem) == 'la',
    c_with_s,
)
print('of which Latin: ', len(latin_c_with_s))

of which Latin:  48


In [18]:
# Contractions-with-suspension for which `lang()` reports Greek ('grc').
greek_c_with_s = listfilter(
    lambda elem: lang(elem) == 'grc',
    c_with_s,
)
print('of which Greek: ', len(greek_c_with_s))

of which Greek:  14


In [19]:
# Contractions-with-suspension whose language is neither Greek ('grc') nor
# Latin ('la').
other_c_with_s = listfilter(lambda x: lang(x) not in ('grc', 'la'), c_with_s)
# This is the residual "other" bucket, so it must not be labelled as Greek
# (the Greek count is reported by the preceding cell).
print('of which other: ', len(other_c_with_s))

of which Greek:  0


In [20]:
# Show a short sample of the contractions with suspension.
sample_c_with_s = top(c_with_s, 10)
print(show_elems(sample_c_with_s))

- ISic000007: co(n)s(ule) (la)
- ISic000013: co(n)s(ulis) (la)
- ISic000016: co(n)s(uli) (la)
- ISic000017: co(n)s(ulis) (la)
- ISic000021: co(n)s(uli) (la)
- ISic000024: co(n)s(uli) (la)
- ISic000024: proco(n)s(uli) (la)
- ISic000024: m(aiestati)q(ue) (la)
- ISic000027: me(n)s(ibus) (la)
- ISic000044: c(n)s(ulis) (la)


## Multiplications

In [21]:
# Keep only the abbreviations whose `abbr_type` is AbbrType.multiplication.
multiplications = list(
    filter(
        lambda candidate: candidate.abbr_type == AbbrType.multiplication,
        abbreviations,
    )
)

In [22]:
# Report how many abbreviations were kept as multiplications.
print(
    'Total multiplications in corpus: ',
    len(multiplications),
)

Total multiplications in corpus:  21


In [23]:
# Multiplications for which `lang()` reports Latin ('la').
latin_mult = listfilter(
    lambda elem: lang(elem) == 'la',
    multiplications,
)
print('of which Latin: ', len(latin_mult))

of which Latin:  21


In [24]:
# Multiplications for which `lang()` reports Greek ('grc').
greek_mult = listfilter(
    lambda elem: lang(elem) == 'grc',
    multiplications,
)
print('of which Greek: ', len(greek_mult))

of which Greek:  0


In [25]:
# The multiplication list is short, so display every entry rather than a sample.
multiplication_listing = show_elems(multiplications)
print(multiplication_listing)

- ISic000036: v[v](iris) (la)
- ISic000036: c[c](larissimis) (la)
- ISic000298: d[dd](ominorum) (la)
- ISic000298: n[nn](ostrorum) (la)
- ISic000447: v[v](iris) (la)
- ISic000447: c[c](larissimis) (la)
- ISic000481: d[d](ominorum) (la)
- ISic000481: n[n](ostrorum) (la)
- ISic000481: A[A]u[u]g[g](ustorum) (la)
- ISic000481: v[v](iri) (la)
- ISic000481: c[c](larissimi) (la)
- ISic000501: d[d](ominis) (la)
- ISic000501: n[n](ostris) (la)
- ISic002934: D[D](ominis) (la)
- ISic002934: N[N](ostris) (la)
- ISic002934: A[A]U[U](gustis) (la)
- ISic003462: d[d](ominorum) (la)
- ISic003462: n[n](ostrorum) (la)
- ISic003462: A[A]u[u]g[g](ustorum) (la)
- ISic004376: D[DD](ominis) (la)
- ISic004376: N[NN](ostris) (la)
