# Time Markers with Marked Tendencies

This notebook examines time markers that show a marked tendency toward a particular tense. For the purposes of this analysis, a time marker has a "marked tendency" when a single tense accounts for more than 50% of its occurrences. The analysis primarily examines the top 50 time markers.

The analysis uses the data initially gathered in `1_exploration.ipynb`.

In [33]:
import pickle, collections
import pandas as pd
from pprint import pprint
from tf.fabric import Fabric

# Create the Text-Fabric handle for the 'hebrew/etcbc4c' data module.
# silent=True is passed to the constructor — presumably to quiet its own
# start-up messages (TODO confirm against the Text-Fabric docs).
TF = Fabric(modules='hebrew/etcbc4c', silent=True)
# Request only the book, chapter and verse features.
api = TF.load('''book chapter verse
              ''')

# Expose the loaded API in this notebook's global namespace.
# NOTE(review): none of the visible cells below use the injected names — confirm
# whether this Text-Fabric setup is still needed here.
api.makeAvailableIn(globals())

  0.00s loading features ...
   |     0.01s B book                 from /Users/Cody/github/text-fabric-data/hebrew/etcbc4c
   |     0.01s B chapter              from /Users/Cody/github/text-fabric-data/hebrew/etcbc4c
   |     0.01s B verse                from /Users/Cody/github/text-fabric-data/hebrew/etcbc4c
   |     0.00s Feature overview: 103 for nodes; 5 for edges; 1 configs; 7 computed
  4.00s All features loaded/computed - for details use loadLog()


In [34]:
# Location of the pickled time-marker data, relative to the working directory
# (presumably written by 1_exploration.ipynb — verify).
tm_data_file = 'data/time_markers.pickle'

# Deserialize the pickle into tm_data.
# NOTE(review): pickle.load can execute arbitrary code while loading, so this
# file must only ever come from a trusted source.
with open(tm_data_file, 'rb') as infile:
    tm_data = pickle.load(infile)

# Show the top-level keys so the reader can see what the pickle provides.
print('data available: ', ', '.join(tm_data.keys()))

data available:  markers, top_markers, stats_rows


In [35]:
# unpack the three collections stored in the pickle into notebook-level names
markers, top_markers, stats_rows = (
    tm_data[key] for key in ('markers', 'top_markers', 'stats_rows')
)

In [43]:
def predominant_table(tense, threshold=50.):
    """Tabulate the top time markers in which one tense predominates.

    A marker from ``top_markers`` is kept when the value stored under
    ``markers[marker]['tense_percents'][tense]`` is strictly greater than
    ``threshold``.

    Args:
        tense: key into each marker's ``tense_percents`` mapping (this
            notebook passes 'impf', 'wayq', 'perf' and 'weqt').
        threshold: percentage share the tense must exceed. Defaults to 50,
            the notebook's definition of a "marked tendency".

    Returns:
        A pandas DataFrame with one row per qualifying marker, in the order
        the markers appear in ``top_markers``, with ``stats_rows['header']``
        as the column labels.
    """
    # top_markers yields (marker, count) pairs; the count is not needed here
    marker_rows = [stats_rows[marker] for marker, _count in top_markers
                   if markers[marker]['tense_percents'][tense] > threshold]

    # take the header from the same stats_rows mapping that supplied the rows
    return pd.DataFrame(marker_rows, columns=stats_rows['header'])

# 1. Yiqtol Predominant Markers

In [44]:
# top markers whose 'impf' (yiqtol) share is above the 50% cut-off
yiqtol_predominant = predominant_table('impf')

# bare expression so the notebook renders the table
yiqtol_predominant

Unnamed: 0,marker,occur,impf,impv,infa,infc,perf,ptca,ptcp,wayq,weqt
0,L <WLM,76,60.5% (46),3.9% (3),0% (0),7.9% (6),11.8% (9),3.9% (3),2.6% (2),2.6% (2),6.6% (5)
1,>Z,57,68.4% (39),0% (0),0% (0),0% (0),29.8% (17),1.8% (1),0% (0),0% (0),0% (0)
2,>XR,31,67.7% (21),0% (0),0% (0),0% (0),32.3% (10),0% (0),0% (0),0% (0),0% (0)
3,MXR,28,64.3% (18),17.9% (5),0% (0),0% (0),0% (0),7.1% (2),3.6% (1),0% (0),7.1% (2)
4,L NYX,24,83.3% (20),0% (0),0% (0),0% (0),16.7% (4),0% (0),0% (0),0% (0),0% (0)
5,<D MTJ,19,78.9% (15),0% (0),0% (0),0% (0),10.5% (2),10.5% (2),0% (0),0% (0),0% (0)
6,CCT JMJM,14,71.4% (10),0% (0),0% (0),0% (0),21.4% (3),0% (0),0% (0),7.1% (1),0% (0)
7,<D >NH,12,75.0% (9),0% (0),0% (0),0% (0),16.7% (2),8.3% (1),0% (0),0% (0),0% (0)
8,B JWM H CMJNJ,12,66.7% (8),0% (0),0% (0),0% (0),8.3% (1),0% (0),0% (0),16.7% (2),8.3% (1)
9,L <D,11,81.8% (9),0% (0),0% (0),0% (0),0% (0),18.2% (2),0% (0),0% (0),0% (0)


# 2. Wayyiqtol Predominant Markers

In [47]:
# top markers whose 'wayq' (wayyiqtol) share is above the 50% cut-off
wayy_predominant = predominant_table('wayq')

# bare expression so the notebook renders the table
wayy_predominant

Unnamed: 0,marker,occur,impf,impv,infa,infc,perf,ptca,ptcp,wayq,weqt
0,B BQR,76,13.2% (10),10.5% (8),1.3% (1),3.9% (3),2.6% (2),3.9% (3),0% (0),55.3% (42),9.2% (7)
1,<D H JWM H ZH,58,5.2% (3),0% (0),0% (0),1.7% (1),29.3% (17),3.4% (2),0% (0),60.3% (35),0% (0)
2,LJLH,33,6.1% (2),3.0% (1),0% (0),3.0% (1),15.2% (5),12.1% (4),0% (0),54.5% (18),6.1% (2)
3,M MXRT,18,0% (0),0% (0),0% (0),0% (0),0% (0),0% (0),0% (0),100.0% (18),0% (0)
4,B <T H HW>,18,0% (0),0% (0),0% (0),0% (0),33.3% (6),5.6% (1),0% (0),61.1% (11),0% (0)
5,JMJM RBJM,16,31.2% (5),0% (0),0% (0),0% (0),6.2% (1),6.2% (1),0% (0),56.2% (9),0% (0)
6,B LJLH H HW>,15,0% (0),0% (0),0% (0),0% (0),13.3% (2),6.7% (1),0% (0),80.0% (12),0% (0)


# 3. Qatal Predominant Markers

In [48]:
# top markers whose 'perf' (qatal) share is above the 50% cut-off
qatal_predominant = predominant_table('perf')

# bare expression so the notebook renders the table
qatal_predominant

Unnamed: 0,marker,occur,impf,impv,infa,infc,perf,ptca,ptcp,wayq,weqt
0,B >DJN,28,0% (0),0% (0),0% (0),0% (0),85.7% (24),14.3% (4),0% (0),0% (0),0% (0)
1,H JWM H ZH,26,26.9% (7),3.8% (1),0% (0),0% (0),53.8% (14),3.8% (1),0% (0),3.8% (1),7.7% (2)
2,>DJN,24,4.2% (1),0% (0),0% (0),0% (0),83.3% (20),12.5% (3),0% (0),0% (0),0% (0)
3,>XRJW,20,5.0% (1),0% (0),0% (0),0% (0),75.0% (15),0% (0),0% (0),20.0% (4),0% (0)
4,B JMJW,12,41.7% (5),0% (0),0% (0),0% (0),58.3% (7),0% (0),0% (0),0% (0),0% (0)


# 4. Weqatal Predominant Markers

In [49]:
# top markers whose 'weqt' share is above the 50% cut-off
weqetal_predominant = predominant_table('weqt')

# bare expression so the notebook renders the table
weqetal_predominant

Unnamed: 0,marker,occur,impf,impv,infa,infc,perf,ptca,ptcp,wayq,weqt
0,<D H <RB,41,29.3% (12),0% (0),0% (0),0% (0),2.4% (1),0% (0),0% (0),14.6% (6),53.7% (22)
