# Exploring the typology of abbreviations in Sicily

## Load PyEpiDoc and corpus

In [43]:
from pyepidoc import EpiDoc, EpiDocCorpus
from pyepidoc.epidoc.enums import AbbrType
from pyepidoc.epidoc.dom import lang, owner_doc
from pyepidoc.shared.utils import top, contains, listfilter
from pyepidoc.shared.display import show_elems

# Relative location of the corpus that the rest of the notebook analyses.
CORPUS_PATH = '../example_corpus'
corpus = EpiDocCorpus(inpt=CORPUS_PATH)

## Get all the abbreviations

In [44]:
# Materialise everything yielded by corpus.expans into a list so that it can
# be counted here and filtered again by the later cells.
abbreviations = list(corpus.expans)
abbreviation_total = len(abbreviations)
print('Total abbreviations in I.Sicily corpus: ', abbreviation_total)

Total abbreviations in I.Sicily corpus:  198


## Suspensions
### Find all the suspensions

In [47]:
# Keep the abbreviations for which contains(abbr_types, AbbrType.suspension)
# is truthy.
suspensions = list(filter(
    lambda expan: contains(expan.abbr_types, AbbrType.suspension),
    abbreviations,
))

### Count and examples

In [48]:
# Report how many abbreviations were selected as suspensions.
suspension_total = len(suspensions)
print('Total suspensions in corpus: ', suspension_total)

Total suspensions in corpus:  194


In [50]:
# Suspensions for which lang() reports 'la'.
latin_susp = list(filter(lambda elem: lang(elem) == 'la', suspensions))
latin_susp_total = len(latin_susp)
print('of which Latin: ', latin_susp_total)

of which Latin:  171


In [51]:
# Suspensions for which lang() reports 'grc'.
greek_susp = list(filter(lambda elem: lang(elem) == 'grc', suspensions))
greek_susp_total = len(greek_susp)
print('of which Greek: ', greek_susp_total)

of which Greek:  23


In [52]:
# Suspensions whose lang() value is neither 'grc' nor 'la'.
other_susp = list(filter(
    lambda elem: lang(elem) not in ('grc', 'la'),
    suspensions,
))
other_susp_total = len(other_susp)
print('of which other: ', other_susp_total)

of which other:  0


### Which suspensions are in other languages?

In [53]:
# Render the suspensions that are neither Greek nor Latin, then print them.
other_susp_listing = show_elems(other_susp)
print(other_susp_listing)




### First 10 examples

In [54]:
# Show a short sample of the suspensions under a heading line.
sample_suspensions = top(suspensions, 10)
print('First 10 examples:')
print(show_elems(sample_suspensions))

First 10 examples:
- ISic000001: man(ibus) (la)
- ISic000001: vix(it) (la)
- ISic000001: a(nnis) (la)
- ISic000002: D(is) (la)
- ISic000002: M(anibus) (la)
- ISic000002: s(acrum) (la)
- ISic000002: vix(it) (la)
- ISic000003: Man(ibus) (la)
- ISic000003: vix(it) (la)
- ISic000003: an(nis) (la)


In [55]:
# Look up the document owning the first suspension and print its text_leiden.
first_suspension = suspensions[0]
doc000001 = owner_doc(first_suspension)
print(doc000001.text_leiden)


Dis · man(ibus)
 · Zethi
vix(it) · a(nnis) · VI


## Contractions

In [56]:
# Display every collected abbreviation (the full list, not a sample).
list(abbreviations)

[Expan('man(ibus)'),
 Expan('vix(it)'),
 Expan('a(nnis)'),
 Expan('D(is)'),
 Expan('M(anibus)'),
 Expan('s(acrum)'),
 Expan('vix(it)'),
 Expan('Man(ibus)'),
 Expan('vix(it)'),
 Expan('an(nis)'),
 Expan('Herm(es)'),
 Expan('fe(cerunt)'),
 Expan('P(ubli)'),
 Expan('f(ilius)'),
 Expan('P(ublius)'),
 Expan('P(ubli)'),
 Expan('f(ilius)'),
 Expan('P(ubli)'),
 Expan('n(epos)'),
 Expan('f(ilius)'),
 Expan('{II}(duum)virạtus'),
 Expan('D(is)'),
 Expan('M(anibus)'),
 Expan('S(acrum)'),
 Expan('M(arcus)'),
 Expan('vix(it)'),
 Expan('ann(is)'),
 Expan('mens(is)'),
 Expan('dieb(us)'),
 Expan('C(aius)'),
 Expan('ann(os)'),
 Expan('ann(os)'),
 Expan('Mag(no)'),
 Expan('Mag(ni)'),
 Expan('f(ilio)'),
 Expan('imp(eratore)'),
 Expan('co(n)s(ule)'),
 Expan('desig(nato)'),
 Expan('L(ucius)'),
 Expan('L(uci)'),
 Expan('f(ilius)'),
 Expan('leg(atus)'),
 Expan('pr(aetore)'),
 Expan('pr(aetor)'),
 Expan('des(ignatus)'),
 Expan('f(aciendum)'),
 Expan('c(uravit)'),
 Expan('D(is)'),
 Expan('M(anibus)'),
 Expan('

In [57]:
# Keep the abbreviations for which contains(abbr_types, AbbrType.contraction)
# is truthy, then report how many there are.
contractions = list(filter(
    lambda expan: contains(expan.abbr_types, AbbrType.contraction),
    abbreviations,
))
contraction_total = len(contractions)
print('Total contractions in corpus: ', contraction_total)

Total contractions in corpus:  0


In [58]:
# Contractions for which lang() reports 'la'.
latin_contractions = list(filter(lambda elem: lang(elem) == 'la', contractions))
latin_contraction_total = len(latin_contractions)
print('of which Latin: ', latin_contraction_total)

of which Latin:  0


In [59]:
# Contractions for which lang() reports 'grc'.
greek_contractions = list(filter(lambda elem: lang(elem) == 'grc', contractions))
greek_contraction_total = len(greek_contractions)
print('of which Greek: ', greek_contraction_total)

of which Greek:  0


In [60]:
# Contractions whose lang() value is neither 'grc' nor 'la'.
other_contractions = [contraction for contraction in contractions
    if lang(contraction) not in ['grc', 'la']]
# The label previously read 'of which Greek: ', copied from the cell above;
# this count is the non-Greek, non-Latin remainder.
print('of which other: ', len(other_contractions))

of which Greek:  0


In [61]:
# Copy the leading contractions into a list so they can be rendered below.
top_10_contractions = list(top(contractions, 10))

print('First 10 examples:')
contraction_listing = show_elems(top_10_contractions)
print(contraction_listing)

First 10 examples:



## Contractions with suspension

In [62]:
# Keep the abbreviations for which
# contains(abbr_types, AbbrType.contraction_with_suspension) is truthy.
c_with_s = list(filter(
    lambda expan: contains(expan.abbr_types, AbbrType.contraction_with_suspension),
    abbreviations,
))
c_with_s_total = len(c_with_s)
print('Total contractions with suspension in corpus: ', c_with_s_total)

Total contractions with suspension in corpus:  3


In [63]:
# Contractions with suspension for which lang() reports 'la'.
latin_c_with_s = listfilter(
    lambda expan: lang(expan) == 'la',
    c_with_s,
)
latin_c_with_s_total = len(latin_c_with_s)
print('of which Latin: ', latin_c_with_s_total)

of which Latin:  3


In [64]:
# Contractions with suspension for which lang() reports 'grc'.
greek_c_with_s = listfilter(
    lambda expan: lang(expan) == 'grc',
    c_with_s,
)
greek_c_with_s_total = len(greek_c_with_s)
print('of which Greek: ', greek_c_with_s_total)

of which Greek:  0


In [65]:
# Contractions with suspension whose lang() value is neither 'grc' nor 'la'.
other_c_with_s = listfilter(lambda x: lang(x) not in ['grc', 'la'], c_with_s)
# The label previously read 'of which Greek: ', copied from the cell above;
# this count is the non-Greek, non-Latin remainder.
print('of which other: ', len(other_c_with_s))

of which Greek:  0


In [66]:
# Render a short sample of the contractions with suspension and print it.
sample_c_with_s = top(c_with_s, 10)
print(show_elems(sample_c_with_s))

- ISic000007: co(n)s(ule) (la)
- ISic000017: co(n)s(ulis) (la)
- ISic000805: proco(n)s(uli) (la)


## Multiplications

In [67]:
# Keep the abbreviations for which
# contains(abbr_types, AbbrType.multiplication) is truthy.
multiplications = list(filter(
    lambda expan: contains(expan.abbr_types, AbbrType.multiplication),
    abbreviations,
))

In [68]:
# Report how many abbreviations were selected as multiplications.
multiplication_total = len(multiplications)
print('Total multiplications in corpus: ', multiplication_total)

Total multiplications in corpus:  0


In [69]:
# Multiplications for which lang() reports 'la'.
latin_mult = listfilter(
    lambda expan: lang(expan) == 'la',
    multiplications,
)
latin_mult_total = len(latin_mult)
print('of which Latin: ', latin_mult_total)

of which Latin:  0


In [70]:
# Multiplications for which lang() reports 'grc'.
greek_mult = listfilter(
    lambda expan: lang(expan) == 'grc',
    multiplications,
)
greek_mult_total = len(greek_mult)
print('of which Greek: ', greek_mult_total)

of which Greek:  0


In [71]:
# Render all multiplications found in the corpus and print the result.
multiplication_listing = show_elems(multiplications)
print(multiplication_listing)


