In [None]:
# %%

import pandas as pd

from source.utils import FREQ_DIR, RESULT_DIR, UCS_DIR, confirm_dir
from source.utils.associate import (BINARY_ASSOC_ARGS, add_extra_am,
                                    associate_ucs, confirm_basic_ucs)
from source.utils.associate import convert_ucs_to_csv as ucs2csv
from source.utils.associate import get_associations_csv as init_am, AM_DF_DIR
from source.utils.associate import manipulate_ucs, seek_readable_ucs, adjust_assoc_columns
pd.set_option('display.float_format', '{:,.2f}'.format)



# %% [markdown]

 set parameters:
 - `UNIT` options:
   - `'Bigr'`
   - `'Adv'`
   - `'Adj'`
 - `PAT_DIR` options:
   - any directory in `results/freq_out/` containing a `ucs_format/` subdir with a `Trig*.tsv` frequency table
   - developed with the following in mind:
     - `POSmirror`
     - `NEGmirror`
     - `ANYmirror` (which has been populated by simple concatenation in the shell)

In [None]:
# Unit paired with each trigger; selects the `Trig{UNIT}_*.tsv` frequency table below.
UNIT = 'Adv'
# UNIT = 'Bigr'
# UNIT = 'Adj'
# Pattern directory (relative to FREQ_DIR) that holds the `ucs_format/` frequency table.
PAT_DIR = 'POSmirror'
# PAT_DIR = 'NEGmirror'
# PAT_DIR = 'ANYmirror'
# Frequency floor handed to the UCS helpers further down (`min_freq` / `freq_floor`).
FRQ_FLOOR = 3
# FRQ_FLOOR = 10
# FRQ_FLOOR = 20
# FRQ_FLOOR = 50
# FRQ_FLOOR = 100
# Input frequency table for the selected PAT_DIR + UNIT combination.
TRIG_TSV = FREQ_DIR.joinpath(
    f'{PAT_DIR}/ucs_format/Trig{UNIT}_frq-thrMIN-7.35f.tsv')
# Columns of interest for the abbreviated table; names absent from the
# dataframe are skipped when FOCUS is applied later in the notebook.
FOCUS = ['f', 'unexpected_f',
         'conservative_log_ratio',
         'am_p1_given2', 'am_p2_given1',
         'am_p1_given2_simple', 'am_p2_given1_simple',
         'am_log_likelihood',
        #  'mutual_information', 'am_odds_ratio_disc', 't_score',
         'N', 'f1', 'f2', 'E11',
         'l1', 'l2']

In [None]:
# %%

# Trigger lemmas grouped by polarity label; used to tag each row's `l1` value.
# NOTE(review): 'few' appears in TRIGGER_QUANT['hedged_not_exist'] but has no
# polarity entry here -- confirm whether it belongs under 'negative'.
TRIGGER_POLARITY = {
    'positive': {
        'all', 'always', 'both', 'either',
        'every', 'everybody', 'everyone', 'everything',
        'many', 'often', 'or',
        'some', 'somebody', 'someone', 'something', 'somethings', 'sometimes',
    },
    'negative': {
        'barely', 'hardly', 'neither', 'never',
        'no', 'nobody', 'none', 'nor', 'nothing',
        'rarely', 'scarcely', 'seldom',
    },
}

In [None]:
# %%

# Trigger lemmas grouped by quantification type; used to tag each row's `l1` value.
TRIGGER_QUANT = {
    'existential': {
        'either', 'or',
        'some', 'somebody', 'someone', 'something', 'somethings', 'sometimes',
    },
    'universal': {
        'all', 'always', 'both',
        'every', 'everybody', 'everyone', 'everything',
    },
    'not_exist': {
        'neither', 'never', 'no', 'nobody', 'none', 'nor', 'nothing',
    },
    'hedged_not_exist': {
        'barely', 'few', 'hardly', 'rarely', 'scarcely', 'seldom',
    },
    'hedged_universal': {
        'many', 'often',
    },
}

In [None]:
# %%

def invert_set_dict(d: dict):
    """Flip a ``{label: members}`` mapping into ``{member: label}``.

    Args:
        d: mapping whose values are iterables of hashable members.

    Returns:
        dict mapping every member to the label it was listed under. When a
        member occurs under several labels, the label iterated last wins.
    """
    member_to_label = {}
    for label, members in d.items():
        for member in members:
            member_to_label[member] = label
    return member_to_label

# %% [markdown]

## 1. Run `seek_readable_ucs()` to generate consistent output path

In [None]:
# Resolve the "readable" association table path for TRIG_TSV at the chosen floor.
# The result is used as a path object below (`.relative_to`, `.parent`, `.name`).
# NOTE(review): whether `seek_readable_ucs` also creates missing files is not
# visible in this notebook -- confirm in `source.utils.associate`.
readable = seek_readable_ucs(min_freq=FRQ_FLOOR,
                             ucs_subdir='trigger_eval',
                             contained_counts_path=TRIG_TSV)
# Print relative to RESULT_DIR to keep the displayed path short.
print(readable.relative_to(RESULT_DIR))

    > seeking `trigger_eval/POSmirror/readable/TrigAdv_frq-thrMIN-7.35f_min3x*` frequency data and initial associations...
ucs/trigger_eval/POSmirror/readable/TrigAdv_frq-thrMIN-7.35f_min3x.rsort-view_am-only.csv


# %% [markdown]

 Snippet of frequencies to be analyzed (`TRIG_TSV`)

In [None]:
! head -5 {TRIG_TSV} | column -t

64024  something  more
47547  all        more
45543  or         even
45382  all        too
40833  all        very


# %% [markdown]

## 2. Run `confirm_basic_ucs()`

In [None]:
# Derive the UCS data-set path (`<name>.ds.gz`) that lives one level above `readable/`.
# The readable view may end in `.txt` or `.csv` (the recorded run returned `.csv`),
# so cut the file name at the view tag rather than matching a hard-coded
# `.rsort-view_am-only.txt` ending: that replacement never matched a `.csv` name and
# silently left the view name in place of the intended `.ds.gz` name.
view_tag = '.rsort-view_am-only'
ucs_stem = (readable.name.split(view_tag)[0] if view_tag in readable.name
            else readable.stem)
basic_ucs_path = readable.parent.parent.joinpath(f'{ucs_stem}.ds.gz')
print(f'Creating initial UCS table: `{basic_ucs_path.relative_to(RESULT_DIR)}`')

# `confirm_basic_ucs` returns the path that is used from here on.
basic_ucs_path = confirm_basic_ucs(
    basic_ucs_path,
    freq_floor=FRQ_FLOOR,
    contained_counts_path=TRIG_TSV)

Creating initial UCS table: `ucs/trigger_eval/POSmirror/TrigAdv_frq-thrMIN-7.35f_min3x.rsort-view_am-only.csv
+ existing UCS table found ✓


# %% [markdown]

 Excerpt of initial UCS table

In [None]:
init_readable = UCS_DIR.joinpath(
    f'trigger_eval/{PAT_DIR}/readable'
).joinpath(f'{TRIG_TSV.name.replace(".tsv","")}_min{FRQ_FLOOR}x.init.txt')
! head -7 {init_readable}

         l1  l2                        f      f2      f1        N  
-----------  --------------------  -----  ------  ------  -------  
         or  more                  34344  207924  326614  1472077  
  something  more                  64024  207924  318343  1472077  
        all  more                  47547  207924  249279  1472077  
       some  more                  15949  207924  114929  1472077  
      often  more                  15169  207924   92233  1472077  


# %% [markdown]

## 3. Run `associate_ucs()`

In [None]:
# Compute association measures for the basic UCS table.
associate_ucs(basic_ucs_path)

# Glob for the log file(s) of this PAT_DIR/UNIT/FRQ_FLOOR combination; the log
# name spells the threshold as `7-35f` (hyphen) rather than `7.35f`.
# NOTE(review): this absolute path is machine-specific -- consider deriving it
# from a project path constant instead.
transform_ucs_log = f'/share/compling/projects/sanpi/logs/associate/ucs//ucs-{PAT_DIR}_Trig{UNIT}_frq-thrMIN-7-35f_min{FRQ_FLOOR}x*.log'
# Preview the head and tail of the most recently modified matching log.
! head -15 `ls -t1 {transform_ucs_log} | head -1`
! echo '...'
! tail -2 `ls -t1 {transform_ucs_log} | head -1`


Calculating UCS associations...

```
bash /share/compling/projects/sanpi/script/transform_ucs.sh /share/compling/projects/sanpi/results/ucs/trigger_eval/POSmirror/TrigAdv_frq-thrMIN-7.35f_min3x.rsort-view_am-only.csv
> log will be saved to: /share/compling/projects/sanpi/logs/associate/ucs//ucs-POSmirror_TrigAdv_frq-thrMIN-7-35f_min3x.2024-05-25_2112.log
...
```

+ time elapsed → 00:00:13.10
# Manipulating TrigAdv_frq-thrMIN-7-35f_min3x ucs table
path to this script: /share/compling/projects/sanpi/script/transform_ucs.sh
Sat May 25 21:12:01 EDT 2024
(TMP: /share/compling/projects/sanpi/results/ucs/trigger_eval/POSmirror/tmp/tmp_POSmirror-20240525-211201.TrigAdv_frq-thrMIN-7-35f_min3x)
Caught a SIGPIPE at /usr/share/perl/5.30/Pod/Perldoc.pm line 1910.
Can't close STDOUT: Broken pipe at (eval 44) line 1.
END failed--call queue aborted.
## Initial Contingency Info

DATA SET FILE:  /share/compling/projects/sanpi/results/ucs/trigger_eval/POSmirror/TrigAdv_frq-thrMIN-7.35f_min3x.rsort-view_

# %% [markdown]

### Define dictionary containing relevant vocab sizes
 !!! Warning This is a `#HACK`: \
     Rather than developing a command/code to retrieve the vocab sizes programmatically,
     I simply copied the values given in the log output of `transform_ucs.sh`
     for each `PAT_DIR`+`UNIT` combination

 |      |   ANYmirror |   NEGmirror |   POSmirror |
 |:-----|------------:|------------:|------------:|
 | Bigr |     395,338 |      64,644 |     330,694 |
 | Adv  |      23,125 |       5,004 |      18,121 |
 | Adj  |      83,422 |      21,562 |      61,860 |

In [None]:
VOCABS = {'ANYmirror': {'Adv': 23125, 'Bigr': 395338, 'Adj': 83422},
          'NEGmirror': {'Adv': 5004, 'Bigr': 64644, 'Adj': 21562},
          'POSmirror': {'Adv': 18121, 'Bigr': 330694, 'Adj': 61860}
          }  # HACK
VOCAB = VOCABS[PAT_DIR][UNIT]
pd.DataFrame(VOCABS)

Unnamed: 0,ANYmirror,NEGmirror,POSmirror
Adv,23125,5004,18121
Bigr,395338,64644,330694
Adj,83422,21562,61860


# %% [markdown]

## 4. Run `convert_ucs_to_csv()` (imported as `ucs2csv`) to convert `ucs/[PAT_DIR]/readable/*.txt` to a format that `pandas` can parse as a dataframe

In [None]:
! head -5 {readable}
csv_path = ucs2csv(readable)
print(f'CSV: `{csv_path.relative_to(RESULT_DIR)}`')

         l1  l2                        f            E11  am.log.likelihood  am.odds.ratio.disc   am.p1.given2    am.p2.given1  am.p1.given2.simple  am.p2.given1.simple      f1      f2        N  
-----------  --------------------  -----  -------------  -----------------  ------------------  -------------  --------------  -------------------  -------------------  ------  ------  -------  
         or  more                  34344  46132.7018464       -4777.300943       -0.1818145104  -0.0660225433  -0.04638532985         0.1651757373        0.10515164690  326614  207924  1472077  
  something  more                  64024  44964.4617313       11177.921632        0.2471544354   0.1067428125   0.07639094924         0.3079202016        0.20111640589  318343  207924  1472077  
        all  more                  47547  35209.4943376        5664.083926        0.1935052280   0.0690961153   0.05958232948         0.2286749004        0.19073808865  249279  207924  1472077  
UCS table text converted 

# %% [markdown]

## 5. Load the converted CSV as a dataframe indexed by `l1~l2` keys

In [None]:
trig_amdf = pd.read_csv(csv_path).convert_dtypes()
trig_amdf

Unnamed: 0,l1,l2,f,E11,am_log_likelihood,am_odds_ratio_disc,am_p1_given2,am_p2_given1,am_p1_given2_simple,am_p2_given1_simple,f1,f2,N
0,or,more,34344,46132.70,-4777.30,-0.18,-0.07,-0.05,0.17,0.11,326614,207924,1472077
1,something,more,64024,44964.46,11177.92,0.25,0.11,0.08,0.31,0.20,318343,207924,1472077
2,all,more,47547,35209.49,5664.08,0.19,0.07,0.06,0.23,0.19,249279,207924,1472077
3,some,more,15949,16233.18,-6.31,-0.01,-0.00,-0.00,0.08,0.14,114929,207924,1472077
4,often,more,15169,13027.48,420.10,0.08,0.01,0.02,0.07,0.16,92233,207924,1472077
...,...,...,...,...,...,...,...,...,...,...,...,...,...
8329,all,big-rig,3,0.51,10.66,1.54,0.83,0.00,1.00,0.00,249279,3,1472077
8330,all,conscientiously,3,0.51,10.66,1.54,0.83,0.00,1.00,0.00,249279,3,1472077
8331,all,fantasticly,3,0.51,10.66,1.54,0.83,0.00,1.00,0.00,249279,3,1472077
8332,often,eye-crossingly,3,0.19,16.62,2.02,0.94,0.00,1.00,0.00,92233,3,1472077


In [None]:
# %%

# Index every row by a "trigger~collocate" key built from `l1` and `l2`, e.g. `or~more`.
trig_amdf = (
    trig_amdf
    .assign(key=(trig_amdf.l1 + '~' + trig_amdf.l2).astype('string'))
    .set_index('key')
)
trig_amdf

Unnamed: 0_level_0,l1,l2,f,E11,am_log_likelihood,am_odds_ratio_disc,am_p1_given2,am_p2_given1,am_p1_given2_simple,am_p2_given1_simple,f1,f2,N
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1
or~more,or,more,34344,46132.70,-4777.30,-0.18,-0.07,-0.05,0.17,0.11,326614,207924,1472077
something~more,something,more,64024,44964.46,11177.92,0.25,0.11,0.08,0.31,0.20,318343,207924,1472077
all~more,all,more,47547,35209.49,5664.08,0.19,0.07,0.06,0.23,0.19,249279,207924,1472077
some~more,some,more,15949,16233.18,-6.31,-0.01,-0.00,-0.00,0.08,0.14,114929,207924,1472077
often~more,often,more,15169,13027.48,420.10,0.08,0.01,0.02,0.07,0.16,92233,207924,1472077
...,...,...,...,...,...,...,...,...,...,...,...,...,...
all~big-rig,all,big-rig,3,0.51,10.66,1.54,0.83,0.00,1.00,0.00,249279,3,1472077
all~conscientiously,all,conscientiously,3,0.51,10.66,1.54,0.83,0.00,1.00,0.00,249279,3,1472077
all~fantasticly,all,fantasticly,3,0.51,10.66,1.54,0.83,0.00,1.00,0.00,249279,3,1472077
often~eye-crossingly,often,eye-crossingly,3,0.19,16.62,2.02,0.94,0.00,1.00,0.00,92233,3,1472077


# %% [markdown]

## 6. Save to `./results/assoc_df/`

In [None]:
# Mirror the CSV's location under AM_DF_DIR, dropping the `readable/` level and
# the view tag from the relative path.
relative_csv = str(csv_path.relative_to(UCS_DIR))
for fragment in ('/readable', '.rsort-view_am-only'):
    relative_csv = relative_csv.replace(fragment, '')
df_csv_path = AM_DF_DIR.joinpath(relative_csv)
df_pkl_path = df_csv_path.with_suffix('.pkl.gz')

# Only missing outputs are written; files already on disk are left untouched.
if not df_csv_path.is_file():
    confirm_dir(df_csv_path.parent)
    trig_amdf.to_csv(df_csv_path)

if not df_pkl_path.is_file():
    trig_amdf.to_pickle(df_pkl_path)

# %% [markdown]

## 7. Add additional AM via `add_extra_am()`

In [None]:
ex_trig_amdf = add_extra_am(df=trig_amdf,
                            verbose=True,
                            vocab=VOCAB,
                            metrics=['t_score', 'mutual_information']
                            ).convert_dtypes()


Preview of Extended Measures (rounded)

| key             |   t_score |   mutual_information |   deltaP_min |   deltaP_max |   deltaP_max_abs |   deltaP_product |   unexpected_f |   unexpected_ratio |
|:----------------|----------:|---------------------:|-------------:|-------------:|-----------------:|-----------------:|---------------:|-------------------:|
| or~more         |    -63.61 |                -0.13 |        -0.07 |        -0.05 |             0.07 |             0.00 |     -11,788.70 |              -0.34 |
| something~more  |     75.33 |                 0.15 |         0.08 |         0.11 |             0.11 |             0.01 |      19,059.54 |               0.30 |
| all~more        |     56.58 |                 0.13 |         0.06 |         0.07 |             0.07 |             0.00 |      12,337.51 |               0.26 |
| some~more       |     -2.25 |                -0.01 |        -0.00 |        -0.00 |             0.00 |             0.00 |        -284.18 |              -

#%% [markdown]

 Add trigger features as columns: polarity and quantification type

In [None]:
def add_feature(triggers: pd.Series,
                group_dict: dict) -> pd.Series:
    """Label each trigger with the group it is listed under in ``group_dict``.

    Args:
        triggers: series of trigger values to label.
        group_dict: ``{label: collection_of_triggers}`` mapping.

    Returns:
        Series aligned with ``triggers`` holding the matching label, or the
        empty string for triggers not listed under any label.
    """
    label_of = invert_set_dict(group_dict)
    return triggers.apply(lambda trigger: label_of.get(trigger, ''))

ex_trig_amdf['polarity'] = add_feature(ex_trig_amdf.l1, TRIGGER_POLARITY)
ex_trig_amdf['quant'] = add_feature(ex_trig_amdf.l1, TRIGGER_QUANT)

# %% [markdown]

 Save extended AM tables to `extra/` subdirectory if not already saved

In [None]:
# Extended tables go in an `extra/` folder beside the basic table, with an
# `_extra` tag added to the file name.
extra_dir = df_csv_path.parent.joinpath('extra')
df_extra_csv = extra_dir.joinpath(df_csv_path.name.replace('.csv', '_extra.csv'))
df_extra_pkl = df_extra_csv.with_suffix('.pkl.gz')
print(df_extra_csv)

# Only missing outputs are written; files already on disk are left untouched.
if not df_extra_csv.is_file():
    confirm_dir(df_extra_csv.parent)
    ex_trig_amdf.to_csv(df_extra_csv)

if not df_extra_pkl.is_file():
    ex_trig_amdf.to_pickle(df_extra_pkl)

/share/compling/projects/sanpi/results/assoc_df/trigger_eval/POSmirror/extra/TrigAdv_frq-thrMIN-7.35f_min3x_extra.csv


In [None]:
# %%

# Keep a copy of the full extended table before narrowing the columns.
ex_trig_full = ex_trig_amdf.copy()
# Keep the two feature columns plus whichever FOCUS columns are present, pass
# them through `adjust_assoc_columns`, and sort by 'LRC' (largest first).
# NOTE(review): 'LRC' is presumably the renamed `conservative_log_ratio`
# column produced by `adjust_assoc_columns` -- confirm.
ex_trig_abbr = adjust_assoc_columns(
    ex_trig_amdf[[c for c in ['polarity', 'quant'] + FOCUS if c in ex_trig_amdf.columns]]).sort_values('LRC', ascending=False)
# Column order of the abbreviated table.
cols = ex_trig_abbr.columns

# %% [markdown]

 Define lexical items that showed a given polarity lean in the binary-environment evaluation

In [None]:
# Hand-picked lexical items per unit type, grouped in comments by the metric
# that surfaced them. Each item is listed once per list: an item surfaced by a
# second metric is only noted in a comment, so the lists can be iterated
# without showing the same example twice.
pos_prone = {
    'Adj': [
        'unrelated',
        'unable',
        'akin',
        'larger',
        'different',
        'familiar',
        'similar',
        'likely',
        'brief',
        'unaware',
    ],
    'Adv': [
        'slightly',
        'definitely',
        'utterly',
        # LRC top
        'pretty',
        'rather',
        'plain',
        'fairly',
        'somewhat',
        'otherwise',
        'downright',
        'relatively',
        # G2 top
        # 'very',
        # 'even',
        # 'just',
        # dP1 top (and odds ratio disc); 'plain' is already listed under LRC top
        'maybe',
    ],
    'Bigr': [
        # G2 top
        'completely_different',
        'too_familiar',
        'even_better',
        # dP1 top
        'quite_different',
        'too_real',
        'well_aware',
        # LRC top
        'too_common',
        'entirely_different',
    ],
}
neg_prone = {
    'Bigr': [
        # LRC top
        'quite_sure',
        'really_sure',
        'too_early',
        'too_pleased',
        'too_fancy',
        # dP1 top
        'entirely_sure',
        'ever_easy',
        'ever_perfect',
        'particularly_surprising',
        'particularly_new',
        # G2 top
        'too_late',
        'more_important',
        'so_easy',
        'as_good',
        'too_old',
    ],
    'Adv': [
        'yet',
        # LRC top
        'ever',
        'any',
        'longer',
        'necessarily',
        'that',
        # dP1 top
        'before',
        'wise',  # ? How is this used as an adverb?
        'earthly',
        'remotely',
        'exactly',
        # G2 top
        'particularly',
        'too',
        # 'inherently'
    ],
    'Adj': [
        # LRC top
        'early',
        'late',
        'fancy',
        'alone',
        'sure',
        # dP1 top; 'alone' is already listed under LRC top
        'shabby',
        'demoralizing',
        'aggravating',
        'groundbreaking',
        'eventful',
        # G2 top
        'important',
        'frustrating',
        'evident',
        'certain',
    ],
}
def sort_prone_by_f2(prone_list, amdf):
    """Order the listed ``l2`` items by their ``f2`` value, largest first.

    Args:
        prone_list: ``l2`` values to look for.
        amdf: dataframe with ``l2`` and ``f2`` columns.

    Returns:
        list of the ``l2`` values from ``prone_list`` that occur in ``amdf``,
        sorted by descending ``f2``. Items absent from ``amdf`` are dropped.
    """
    is_listed = amdf.l2.isin(prone_list)
    # One row per distinct (f2, l2) pair among the listed items.
    l2_totals = amdf.loc[is_listed, ['f2', 'l2']].drop_duplicates()
    ranked = (
        l2_totals
        .reset_index(drop=True)
        .set_index('l2')
        .round(1)
        .sort_values(['f2'], ascending=False)
    )
    return ranked.index.to_list()
pos_prone[UNIT] = sort_prone_by_f2(pos_prone[UNIT], ex_trig_abbr)
neg_prone[UNIT] = sort_prone_by_f2(neg_prone[UNIT], ex_trig_abbr)
pos_prone[UNIT]

['pretty',
 'rather',
 'slightly',
 'otherwise',
 'fairly',
 'relatively',
 'plain',
 'downright',
 'somewhat',
 'maybe',
 'utterly',
 'definitely']

# %% [markdown]

## Strongest associations for each polarity by metric

In [None]:
def show_metric_top(amdf: pd.DataFrame,
                    metric: str,
                    k=5, cols=None):
    """Show the ``k`` rows with the largest ``metric`` within each polarity group.

    Args:
        amdf: association table with ``polarity``, ``l1``, ``l2`` and
            ``metric`` columns.
        metric: column to rank by; it is moved to the front of the result.
        k: number of rows to keep per polarity group.
        cols: columns to display (any iterable of names). ``None`` or an
            all-falsy value such as ``[None]`` selects every column of
            ``amdf``. The selection must include ``polarity``, ``l1`` and
            ``l2``, which become the index.

    Returns:
        DataFrame indexed by ``(polarity, l1, l2)`` with ``metric`` as the
        first column. The original index of ``amdf`` is discarded.
    """
    if cols is None or not any(cols):
        cols = amdf.columns
    # Normalise to an Index so lists and tuples work as well as `df.columns`.
    cols = pd.Index(cols)
    ordered_cols = [metric] + cols[cols != metric].to_list()

    top_per_polarity = pd.concat(
        [polar_df.nlargest(k, metric) for _, polar_df in amdf.groupby('polarity')]
    )
    return (top_per_polarity
            .loc[:, ordered_cols]
            .reset_index(drop=True)
            .set_index(['polarity', 'l1', 'l2']))
def update_prone(exdf, pos_prone, neg_prone, unit=None) -> tuple:
    """Add the top two ``l2`` items of each polarity in ``exdf`` to the prone lists.

    Args:
        exdf: table whose first index level is the polarity label and which
            exposes ``l2`` after ``reset_index()``.
        pos_prone: ``{unit: [items]}`` dict extended from the ``'positive'`` rows.
        neg_prone: ``{unit: [items]}`` dict extended from the ``'negative'`` rows.
        unit: key of the list to extend; defaults to the notebook-level ``UNIT``.

    Returns:
        ``(pos_prone, neg_prone)``: the same dict objects that were passed in.
        Their ``unit`` lists are extended in place; items already present are
        not added again. A polarity with no rows in ``exdf`` is skipped.
    """
    if unit is None:
        unit = UNIT
    for polarity, prone in (('positive', pos_prone), ('negative', neg_prone)):
        try:
            polar_ex = exdf.loc[polarity, :]
        except KeyError:
            # No rows for this polarity in the current table.
            continue
        # `.tolist()` always yields a list. `.squeeze()` would collapse a single
        # row to a bare string, and the loop would then append its characters.
        for topw in polar_ex.reset_index()['l2'].head(2).tolist():
            if topw not in prone[unit]:
                prone[unit].append(topw)
    return pos_prone, neg_prone

# %% [markdown]

 Top conservative log ratio $LRC$ values

In [None]:
exdf = show_metric_top(ex_trig_abbr,"LRC")
pos_prone, neg_prone = update_prone(exdf, pos_prone, neg_prone)
exdf

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,LRC,quant,f,unexp_f,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
,everythings,all,5.67,,9,8.94,0.0,0.56,0.0,0.56,79.67,1472077,16,5226,0.06
,somethin,n't,1.51,,6,5.66,0.0,0.23,0.0,0.24,24.59,1472077,25,19938,0.34
,alls,not,0.0,,3,2.42,0.0,0.16,0.0,0.2,5.48,1472077,15,56607,0.58
,somethin,more,0.0,,5,1.47,0.0,0.06,0.0,0.2,0.64,1472077,25,207924,3.53
,everythings,so,0.0,,4,2.86,0.0,0.18,0.0,0.25,4.93,1472077,16,104617,1.14
positive,or,otherwise,6.37,existential,6378,4922.07,0.75,0.02,0.97,0.02,17716.43,1472077,326614,6562,1455.93
positive,everything,humanly,6.23,universal,256,247.54,0.79,0.01,0.81,0.01,1553.24,1472077,39516,315,8.46
positive,every,so-slightly,5.82,universal,4,4.0,1.0,0.01,1.0,0.01,67.15,1472077,335,4,0.0
positive,all,around,5.52,universal,934,768.05,0.78,0.0,0.95,0.0,2966.0,1472077,249279,980,165.95
positive,everything,all,5.21,universal,2819,2678.71,0.51,0.07,0.54,0.07,13506.99,1472077,39516,5226,140.29


# %% [markdown]

 Top $\Delta P(\texttt{trigger}|\texttt{adv})$ values

In [None]:
exdf = show_metric_top(ex_trig_abbr, 'dP1')
pos_prone, neg_prone = update_prone(exdf, pos_prone, neg_prone)
exdf

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,dP1,quant,f,unexp_f,LRC,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
,everythings,all,0.0,,9,8.94,5.67,0.56,0.0,0.56,79.67,1472077,16,5226,0.06
,somethin,n't,0.0,,6,5.66,1.51,0.23,0.0,0.24,24.59,1472077,25,19938,0.34
,alls,not,0.0,,3,2.42,0.0,0.16,0.0,0.2,5.48,1472077,15,56607,0.58
,everythings,so,0.0,,4,2.86,0.0,0.18,0.0,0.25,4.93,1472077,16,104617,1.14
,everyones,so,0.0,,4,2.86,0.0,0.18,0.0,0.25,4.93,1472077,16,104617,1.14
positive,every,so-slightly,1.0,universal,4,4.0,5.82,0.01,1.0,0.01,67.15,1472077,335,4,0.0
positive,everything,peachy,0.97,universal,4,3.89,0.0,0.0,1.0,0.0,28.94,1472077,39516,4,0.11
positive,everything,pixel,0.97,universal,3,2.92,0.0,0.0,1.0,0.0,21.71,1472077,39516,3,0.08
positive,always,bitter,0.94,universal,4,3.78,0.0,0.0,1.0,0.0,23.08,1472077,82200,4,0.22
positive,often,drily,0.94,hedged_universal,4,3.75,0.0,0.0,1.0,0.0,22.16,1472077,92233,4,0.25


# %% [markdown]

 Top conditional probability $P(\texttt{trigger}|\texttt{adv})$ values

In [None]:
exdf = show_metric_top(ex_trig_abbr, 'dP1_simple')
pos_prone, neg_prone = update_prone(exdf, pos_prone, neg_prone)
exdf

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,dP1_simple,quant,f,unexp_f,LRC,dP1,dP2,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
,everythings,all,0.0,,9,8.94,5.67,0.0,0.56,0.56,79.67,1472077,16,5226,0.06
,somethin,n't,0.0,,6,5.66,1.51,0.0,0.23,0.24,24.59,1472077,25,19938,0.34
,alls,not,0.0,,3,2.42,0.0,0.0,0.16,0.2,5.48,1472077,15,56607,0.58
,everythings,so,0.0,,4,2.86,0.0,0.0,0.18,0.25,4.93,1472077,16,104617,1.14
,everyones,so,0.0,,4,2.86,0.0,0.0,0.18,0.25,4.93,1472077,16,104617,1.14
positive,every,so-slightly,1.0,universal,4,4.0,5.82,1.0,0.01,0.01,67.15,1472077,335,4,0.0
positive,something,sizey,1.0,existential,80,62.7,0.72,0.78,0.0,0.0,245.02,1472077,318343,80,17.3
positive,something,primally,1.0,existential,13,10.19,0.0,0.78,0.0,0.0,39.81,1472077,318343,13,2.81
positive,or,second-most,1.0,existential,6,4.67,0.0,0.78,0.0,0.0,18.07,1472077,326614,6,1.33
positive,or,etiologically,1.0,existential,6,4.67,0.0,0.78,0.0,0.0,18.07,1472077,326614,6,1.33


# %% [markdown]

 Top $\Delta P(\texttt{adv}|\texttt{trigger})$ values

In [None]:
exdf = show_metric_top(ex_trig_abbr, 'dP2')
pos_prone, neg_prone = update_prone(exdf, pos_prone, neg_prone)
exdf

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,dP2,quant,f,unexp_f,LRC,dP1,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
,everythings,all,0.56,,9,8.94,5.67,0.0,0.0,0.56,79.67,1472077,16,5226,0.06
,somethin,n't,0.23,,6,5.66,1.51,0.0,0.0,0.24,24.59,1472077,25,19938,0.34
,everythings,so,0.18,,4,2.86,0.0,0.0,0.0,0.25,4.93,1472077,16,104617,1.14
,everyones,so,0.18,,4,2.86,0.0,0.0,0.0,0.25,4.93,1472077,16,104617,1.14
,alls,not,0.16,,3,2.42,0.0,0.0,0.0,0.2,5.48,1472077,15,56607,0.58
positive,either,too,0.21,existential,1110,814.32,1.73,0.01,0.01,0.29,1514.98,1472077,3886,112009,295.68
positive,everyone,so,0.18,universal,8043,5745.6,1.82,0.06,0.08,0.25,10195.44,1472077,32327,104617,2297.4
positive,everybody,so,0.17,universal,1894,1327.95,1.61,0.01,0.02,0.24,2191.44,1472077,7965,104617,566.05
positive,always,very,0.13,universal,19988,10210.23,1.07,0.07,0.11,0.24,10404.38,1472077,82200,175105,9777.77
positive,or,even,0.13,existential,45543,32647.52,3.59,0.58,0.78,0.14,87219.31,1472077,326614,58121,12895.48


# %% [markdown]

 Top conditional probability $P(\texttt{adv}|\texttt{trigger})$ values

In [None]:
exdf = show_metric_top(ex_trig_abbr, 'dP2_simple')
pos_prone, neg_prone = update_prone(exdf, pos_prone, neg_prone)
exdf

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,dP2_simple,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
,everythings,all,0.56,,9,8.94,5.67,0.0,0.56,0.0,79.67,1472077,16,5226,0.06
,everythings,so,0.25,,4,2.86,0.0,0.0,0.18,0.0,4.93,1472077,16,104617,1.14
,everyones,so,0.25,,4,2.86,0.0,0.0,0.18,0.0,4.93,1472077,16,104617,1.14
,somethin,n't,0.24,,6,5.66,1.51,0.0,0.23,0.0,24.59,1472077,25,19938,0.34
,alls,not,0.2,,3,2.42,0.0,0.0,0.16,0.0,5.48,1472077,15,56607,0.58
positive,either,too,0.29,existential,1110,814.32,1.73,0.01,0.21,0.01,1514.98,1472077,3886,112009,295.68
positive,everyone,so,0.25,universal,8043,5745.6,1.82,0.06,0.18,0.08,10195.44,1472077,32327,104617,2297.4
positive,always,very,0.24,universal,19988,10210.23,1.07,0.07,0.13,0.11,10404.38,1472077,82200,175105,9777.77
positive,everybody,so,0.24,universal,1894,1327.95,1.61,0.01,0.17,0.02,2191.44,1472077,7965,104617,566.05
positive,somethings,more,0.21,existential,33,10.82,0.0,0.0,0.07,0.0,5.48,1472077,157,207924,22.18


# %% [markdown]

 Top log-likelihood $G^2$ values

In [None]:
exdf = show_metric_top(ex_trig_abbr, 'G2')
pos_prone, neg_prone = update_prone(exdf, pos_prone, neg_prone)
exdf

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,G2,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
,everythings,all,79.67,,9,8.94,5.67,0.0,0.56,0.0,0.56,1472077,16,5226,0.06
,somethin,n't,24.59,,6,5.66,1.51,0.0,0.23,0.0,0.24,1472077,25,19938,0.34
,alls,not,5.48,,3,2.42,0.0,0.0,0.16,0.0,0.2,1472077,15,56607,0.58
,everythings,so,4.93,,4,2.86,0.0,0.0,0.18,0.0,0.25,1472077,16,104617,1.14
,everyones,so,4.93,,4,2.86,0.0,0.0,0.18,0.0,0.25,1472077,16,104617,1.14
positive,or,even,87219.31,existential,45543,32647.52,3.59,0.58,0.13,0.78,0.14,1472077,326614,58121,12895.48
positive,all,too,38448.8,universal,45382,26414.59,1.7,0.26,0.13,0.41,0.18,1472077,249279,112009,18967.41
positive,or,otherwise,17716.43,existential,6378,4922.07,6.37,0.75,0.02,0.97,0.02,1472077,326614,6562,1455.93
positive,something,as,14184.17,existential,30864,14215.23,1.23,0.19,0.06,0.4,0.1,1472077,318343,76987,16648.77
positive,or,just,13554.55,existential,14940,8810.76,1.96,0.33,0.03,0.54,0.05,1472077,326614,27625,6129.24


In [None]:
# %%

sig_trig_abbr = ex_trig_abbr.loc[ex_trig_abbr.LRC.abs() > 1, :]
def show_prone_ex(amdf, prone_list, list_index):
    """Show the first rows of `amdf` whose index label ends in one `prone_list` item.

    Args:
        amdf: DataFrame whose index labels are strings ending in `~<item>`
            (e.g. `all~too`).
        prone_list: sequence of items to step through.
        list_index: position in `prone_list` of the item to show.

    Returns:
        A `(next_index, result)` tuple. `next_index` is always `list_index + 1`,
        so the caller can feed it back in to step through the list. `result` is
        at most the first 10 matching rows of `amdf`, or a short message string
        when `list_index` is past the end of `prone_list`.
    """
    # Local import keeps this definition self-contained within its cell.
    import re

    try:
        # Read from the argument, not from a notebook-level global.
        example = prone_list[list_index]
    except IndexError:
        return list_index + 1, f'No {list_index}th entry'

    print(f'>> {example} <<')
    # Escape the item so regex metacharacters in it are matched literally.
    pattern = f'~{re.escape(f"{example}")}$'
    return list_index + 1, amdf.filter(regex=pattern, axis=0).iloc[:10, :]

# %% [markdown]

 ---
 Significant Examples for Items demonstrating *Positive* polarity environment lean overall (first 10 rows with $|LRC|>1$)

In [None]:
# Entry of `pos_prone` for the configured `UNIT`; the cells below step through it one item at a time.
# NOTE(review): presumably the items that leaned toward positive environments — confirm against `update_prone`.
prone = pos_prone[UNIT]
prone

['pretty',
 'rather',
 'slightly',
 'otherwise',
 'fairly',
 'relatively',
 'plain',
 'downright',
 'somewhat',
 'maybe',
 'utterly',
 'definitely',
 'humanly',
 'so-slightly',
 'peachy',
 'sizey',
 'too',
 'so',
 'even']

In [None]:
# %%

# Start from the first entry of `prone`. `show_prone_ex` returns the next index, so each
# later cell that repeats the call below steps to the following entry (re-running a cell
# without resetting `ix` therefore advances the position).
ix = 0
ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> pretty <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
everybody~pretty,positive,universal,421,287.9,1.32,0.01,0.04,0.02,0.05,407.97,1472077,7965,24599,133.1,everybody,pretty
some~pretty,positive,existential,4085,2164.49,1.11,0.09,0.02,0.17,0.04,2095.89,1472077,114929,24599,1920.51,some,pretty
all~pretty,positive,universal,7720,3554.45,1.07,0.15,0.02,0.31,0.03,3136.99,1472077,249279,24599,4165.55,all,pretty
someone~pretty,positive,existential,147,-348.66,-1.16,-0.01,-0.01,0.01,0.0,-349.24,1472077,29662,24599,495.66,someone,pretty
or~pretty,positive,existential,1099,-4358.85,-2.38,-0.18,-0.02,0.04,0.0,-6195.67,1472077,326614,24599,5457.85,or,pretty


In [None]:
# %%

ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> rather <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1


In [None]:
# %%

ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> slightly <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
or~slightly,positive,existential,3411,1741.63,1.37,0.23,0.01,0.45,0.01,1982.29,1472077,326614,7524,1669.37,or,slightly
all~slightly,positive,universal,452,-822.1,-1.31,-0.11,-0.0,0.06,0.0,-814.34,1472077,249279,7524,1274.1,all,slightly
many~slightly,positive,hedged_universal,34,-206.9,-1.59,-0.03,-0.0,0.0,0.0,-287.43,1472077,47133,7524,240.9,many,slightly


In [None]:
# %%

ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> otherwise <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
or~otherwise,positive,existential,6378,4922.07,6.37,0.75,0.02,0.97,0.02,17716.43,1472077,326614,6562,1455.93,or,otherwise
someone~otherwise,positive,existential,20,-112.22,-1.09,-0.02,-0.0,0.0,0.0,-151.28,1472077,29662,6562,132.22,someone,otherwise
everyone~otherwise,positive,universal,3,-141.1,-1.34,-0.02,-0.0,0.0,0.0,-262.68,1472077,32327,6562,144.1,everyone,otherwise
many~otherwise,positive,hedged_universal,26,-184.1,-1.6,-0.03,-0.0,0.0,0.0,-265.58,1472077,47133,6562,210.1,many,otherwise
everything~otherwise,positive,universal,6,-170.15,-1.89,-0.03,-0.0,0.0,0.0,-304.99,1472077,39516,6562,176.15,everything,otherwise
both~otherwise,positive,universal,6,-216.91,-2.24,-0.03,-0.0,0.0,0.0,-398.76,1472077,50007,6562,222.91,both,otherwise
often~otherwise,positive,hedged_universal,25,-386.14,-2.64,-0.06,-0.0,0.0,0.0,-657.76,1472077,92233,6562,411.14,often,otherwise
sometimes~otherwise,positive,existential,5,-328.02,-2.81,-0.05,-0.0,0.0,0.0,-632.55,1472077,74707,6562,333.02,sometimes,otherwise
some~otherwise,positive,existential,20,-492.31,-3.13,-0.08,-0.0,0.0,0.0,-896.21,1472077,114929,6562,512.31,some,otherwise
something~otherwise,positive,existential,55,-1364.06,-4.02,-0.21,-0.01,0.01,0.0,-2711.53,1472077,318343,6562,1419.06,something,otherwise


In [None]:
# %%

ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> fairly <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
both~fairly,positive,universal,483,290.12,1.05,0.05,0.01,0.09,0.01,323.86,1472077,50007,5678,192.88,both,fairly
or~fairly,positive,existential,565,-694.79,-1.04,-0.12,-0.0,0.1,0.0,-589.32,1472077,326614,5678,1259.79,or,fairly


In [None]:
# %%

ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> relatively <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
both~relatively,positive,universal,465,284.01,1.08,0.05,0.01,0.09,0.01,327.16,1472077,50007,5328,180.99,both,relatively


In [None]:
# %%

ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> plain <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
or~plain,positive,existential,3681,2559.88,3.0,0.51,0.01,0.73,0.01,5889.24,1472077,326614,5053,1121.12,or,plain
someone~plain,positive,existential,9,-92.82,-1.05,-0.02,-0.0,0.0,0.0,-143.99,1472077,29662,5053,101.82,someone,plain
everyone~plain,positive,universal,9,-101.96,-1.18,-0.02,-0.0,0.0,0.0,-161.13,1472077,32327,5053,110.96,everyone,plain
everything~plain,positive,universal,18,-117.64,-1.2,-0.02,-0.0,0.0,0.0,-165.73,1472077,39516,5053,135.64,everything,plain
both~plain,positive,universal,5,-166.65,-1.83,-0.03,-0.0,0.0,0.0,-304.15,1472077,50007,5053,171.65,both,plain
always~plain,positive,universal,16,-266.16,-2.36,-0.05,-0.0,0.0,0.0,-455.97,1472077,82200,5053,282.16,always,plain
all~plain,positive,universal,67,-788.67,-3.01,-0.16,-0.0,0.01,0.0,-1378.71,1472077,249279,5053,855.67,all,plain
something~plain,positive,existential,56,-1036.73,-3.63,-0.21,-0.0,0.01,0.0,-1995.43,1472077,318343,5053,1092.73,something,plain


In [None]:
# %%

ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> downright <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
sometimes~downright,positive,existential,1034,793.96,2.13,0.17,0.01,0.22,0.01,1590.56,1472077,74707,4730,240.04,sometimes,downright
some~downright,positive,existential,1279,909.72,1.89,0.19,0.01,0.27,0.01,1570.7,1472077,114929,4730,369.28,some,downright
everything~downright,positive,universal,21,-105.97,-1.01,-0.02,-0.0,0.0,0.0,-139.08,1472077,39516,4730,126.97,everything,downright
everyone~downright,positive,universal,6,-97.87,-1.12,-0.02,-0.0,0.0,0.0,-163.89,1472077,32327,4730,103.87,everyone,downright
both~downright,positive,universal,9,-151.68,-1.73,-0.03,-0.0,0.0,0.0,-256.94,1472077,50007,4730,160.68,both,downright
always~downright,positive,universal,7,-257.12,-2.51,-0.05,-0.0,0.0,0.0,-478.8,1472077,82200,4730,264.12,always,downright
something~downright,positive,existential,132,-890.88,-2.61,-0.19,-0.0,0.03,0.0,-1443.14,1472077,318343,4730,1022.88,something,downright
all~downright,positive,universal,46,-754.97,-3.28,-0.16,-0.0,0.01,0.0,-1386.42,1472077,249279,4730,800.97,all,downright


In [None]:
# %%

ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> somewhat <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
always~somewhat,positive,universal,777,529.02,1.55,0.12,0.01,0.17,0.01,790.13,1472077,82200,4441,247.98,always,somewhat
something~somewhat,positive,existential,313,-647.39,-1.43,-0.15,-0.0,0.07,0.0,-708.2,1472077,318343,4441,960.39,something,somewhat


In [None]:
# %%

ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> maybe <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
or~maybe,positive,existential,2334,1763.12,4.59,0.69,0.01,0.91,0.01,5569.58,1472077,326614,2573,570.88,or,maybe
often~maybe,positive,hedged_universal,3,-158.21,-1.56,-0.06,-0.0,0.0,0.0,-302.97,1472077,92233,2573,161.21,often,maybe
something~maybe,positive,existential,64,-492.42,-2.5,-0.19,-0.0,0.02,0.0,-820.5,1472077,318343,2573,556.42,something,maybe
all~maybe,positive,universal,7,-428.71,-3.42,-0.17,-0.0,0.0,0.0,-881.23,1472077,249279,2573,435.71,all,maybe


In [None]:
# %%

ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> utterly <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1


# %% [markdown]

 ---
## Examples for Items demonstrating *Negative* polarity environment lean overall (Top 10 by $|LRC|>1$)

In [None]:
prone_list = neg_prone[UNIT]
# Restrict to the `l2` values in `prone_list` that occur in the significant rows, then
# order those values by descending `f2`.
prone = (
    sig_trig_abbr.copy()
    .loc[sig_trig_abbr.l2.isin(prone_list), ['f2', 'l2']]
    .drop_duplicates()
    .reset_index(drop=True)
    .set_index('l2')
    .round(1)
    .sort_values(['f2'], ascending=False)
    .index
    .to_list()
)
prone

['too', 'particularly', 'that', 'remotely', 'yet', 'exactly', 'any']

In [None]:
# %%

# Restart at the first entry of the current `prone` list; each call returns the next index,
# so the repeated cells below walk through the list one entry per cell.
ix = 0
ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> too <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
either~too,positive,existential,1110,814.32,1.73,0.01,0.21,0.01,0.29,1514.98,1472077,3886,112009,295.68,either,too
all~too,positive,universal,45382,26414.59,1.7,0.26,0.13,0.41,0.18,38448.8,1472077,249279,112009,18967.41,all,too
everyone~too,positive,universal,1046,-1413.73,-1.03,-0.01,-0.04,0.01,0.03,-1124.19,1472077,32327,112009,2459.73,everyone,too
both~too,positive,universal,1526,-2278.99,-1.16,-0.02,-0.05,0.01,0.03,-1931.71,1472077,50007,112009,3804.99,both,too
everything~too,positive,universal,1040,-1966.74,-1.33,-0.02,-0.05,0.01,0.03,-1867.57,1472077,39516,112009,3006.74,everything,too
someone~too,positive,existential,693,-1563.95,-1.44,-0.02,-0.05,0.01,0.02,-1603.02,1472077,29662,112009,2256.95,someone,too
something~too,positive,existential,2079,-22143.43,-3.7,-0.21,-0.09,0.02,0.01,-41334.74,1472077,318343,112009,24222.43,something,too


In [None]:
# %%

ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> particularly <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
all~particularly,positive,universal,234,-410.67,-1.14,-0.11,-0.0,0.06,0.0,-399.04,1472077,249279,3807,644.67,all,particularly


In [None]:
# %%

ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> that <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
somebody~that,positive,existential,32,29.82,2.59,0.02,0.01,0.03,0.01,113.45,1472077,2682,1195,2.18,somebody,that
someone~that,positive,existential,93,68.92,1.24,0.06,0.0,0.08,0.0,117.79,1472077,29662,1195,24.08,someone,that
something~that,positive,existential,64,-194.42,-1.33,-0.16,-0.0,0.05,0.0,-248.17,1472077,318343,1195,258.42,something,that


In [None]:
# %%

ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> remotely <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
everything~remotely,positive,universal,54,40.71,1.08,0.08,0.0,0.11,0.0,73.59,1472077,39516,495,13.29,everything,remotely


In [None]:
# %%

ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> yet <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
something~yet,positive,existential,292,185.82,1.73,0.38,0.0,0.59,0.0,328.45,1472077,318343,491,106.18,something,yet


In [None]:
# %%

ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> exactly <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
everything~exactly,positive,universal,54,48.01,2.38,0.22,0.0,0.24,0.0,153.09,1472077,39516,223,5.99,everything,exactly


In [None]:
# %%

ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> any <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
or~any,positive,existential,82,57.15,1.68,0.51,0.0,0.73,0.0,131.82,1472077,326614,112,24.85,or,any


In [None]:
# %%

ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

'No 7th entry'

In [None]:
# %%

ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

'No 8th entry'

In [None]:
# %%

ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

'No 9th entry'

In [None]:
# %%

ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

'No 10th entry'

In [None]:
# %%

ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

'No 11th entry'