In [None]:
# %%

import pandas as pd

from source.utils import FREQ_DIR, RESULT_DIR, UCS_DIR, confirm_dir
from source.utils.associate import (BINARY_ASSOC_ARGS, add_extra_am,
                                    associate_ucs, confirm_basic_ucs)
from source.utils.associate import convert_ucs_to_csv as ucs2csv
from source.utils.associate import get_associations_csv as init_am, AM_DF_DIR
from source.utils.associate import manipulate_ucs, seek_readable_ucs, adjust_assoc_columns
pd.set_option('display.float_format', '{:,.2f}'.format)

# %% [markdown]

 set parameters:
 - `UNIT` options:
   - `'Bigr'`
   - `'Adv'`
   - `'Adj'`
 - `PAT_DIR` options:
   - any directory in `results/freq_out/` containing a `ucs_format/` subdir with a `Trig*.tsv` frequency table
   - developed with the following in mind:
     - `POSmirror`
     - `NEGmirror`
     - `ANYmirror` (which has been populated by simple concatenation in the shell)
 UNIT = 'Adv'

In [None]:
# --- Run parameters -------------------------------------------------------
# Exactly one assignment per parameter should be left uncommented; the
# commented-out lines are the alternative settings.

# Which unit the trigger is paired with; selects the `Trig{UNIT}_...tsv` table.
UNIT = 'Bigr' 
# UNIT = 'Adv'
# Subdirectory of FREQ_DIR that holds the `ucs_format/` frequency tables.
# PAT_DIR = 'POSmirror'
# PAT_DIR = 'NEGmirror'
PAT_DIR = 'ANYmirror'
# Minimum frequency; passed below as `min_freq` / `freq_floor` and embedded
# in output names as `_min{FRQ_FLOOR}x`.
# FRQ_FLOOR = 3
FRQ_FLOOR = 10
# FRQ_FLOOR = 20
# FRQ_FLOOR = 50
# FRQ_FLOOR = 100
# Input frequency table for the selected PAT_DIR + UNIT combination.
TRIG_TSV = FREQ_DIR.joinpath(
    f'{PAT_DIR}/ucs_format/Trig{UNIT}_frq-thrMIN-7.35f.tsv')
# Columns kept (when present) for the abbreviated table built later on;
# names are the pre-abbreviation column names.
FOCUS = ['f', 'unexpected_f',
         'conservative_log_ratio',
         'am_p1_given2', 'am_p2_given1',
         'am_p1_given2_simple', 'am_p2_given1_simple',
         'am_log_likelihood',
        #  'mutual_information', 'am_odds_ratio_disc', 't_score',
         'N', 'f1', 'f2', 'E11',
         'l1', 'l2']

In [None]:
# %%

# Polarity class of each trigger word (the `l1` value of a row).
# Triggers missing from both sets receive an empty-string polarity.
# NOTE(review): 'few' appears in TRIGGER_QUANT['hedged_not_exist'] but in
# neither set here -- confirm whether it should be listed as 'negative'.
TRIGGER_POLARITY = {
    'positive': {
        'all', 'always',
        'both',
        'either', 'every', 'everybody', 'everyone', 'everything',
        'many',
        'often', 'or',
        'some', 'somebody', 'someone', 'something', 'somethings', 'sometimes',
    },
    'negative': {
        'barely',
        'hardly',
        'neither', 'never', 'no', 'nobody', 'none', 'nor', 'nothing',
        'rarely',
        'scarcely', 'seldom',
    },
}

In [None]:
# %%

# Quantification type of each trigger word (the `l1` value of a row).
# Triggers missing from every set receive an empty-string type.
TRIGGER_QUANT = {
    'existential': {
        'either',
        'or',
        'some', 'somebody', 'someone', 'something', 'somethings', 'sometimes',
    },
    'universal': {
        'all', 'always',
        'both',
        'every', 'everybody', 'everyone', 'everything',
    },
    'not_exist': {
        'neither', 'never', 'no', 'nobody', 'none', 'nor', 'nothing',
    },
    'hedged_not_exist': {
        'barely',
        'few',
        'hardly',
        'rarely',
        'scarcely', 'seldom',
    },
    'hedged_universal': {
        'many',
        'often',
    },
}

In [None]:
# %%

def invert_set_dict(d: dict):
    """Turn a ``label -> collection of members`` mapping into ``member -> label``.

    Args:
        d: mapping whose values are iterables of hashable members.

    Returns:
        dict keyed by member. A member listed under several labels keeps the
        label that comes last in ``d``'s iteration order.
    """
    label_of = {}
    for label, members in d.items():
        for member in members:
            label_of[member] = label
    return label_of

# %% [markdown]

## 1. Run `seek_readable_ucs()` to generate consistent output path

In [None]:
readable = seek_readable_ucs(min_freq=FRQ_FLOOR,
                             ucs_subdir='trigger_eval',
                             contained_counts_path=TRIG_TSV)
print(readable.relative_to(RESULT_DIR))

    > seeking `trigger_eval/ANYmirror/readable/TrigBigr_frq-thrMIN-7.35f_min10x*` frequency data and initial associations...
ucs/trigger_eval/ANYmirror/readable/TrigBigr_frq-thrMIN-7.35f_min10x.rsort-view_am-only.txt


# %% [markdown]

 Snippet of starting frequency data (`TRIG_TSV`)

In [None]:
! head -5 {TRIG_TSV} | column -t

12233  something  as_simple
7372   something  completely_different
6933   all        too_familiar
6505   all        too_easy
5141   or         more_likely


# %% [markdown]

## 2. Run `confirm_basic_ucs()` (if needed)

In [None]:
if not readable.is_file():
    basic_ucs_path = readable.parent.parent.joinpath(
        readable.name.replace('.rsort-view_am-only.txt', '.ds.gz'))
    print(f'Creating initial UCS table: `{basic_ucs_path.relative_to(RESULT_DIR)}')

    basic_ucs_path = confirm_basic_ucs(
        basic_ucs_path,
        freq_floor=FRQ_FLOOR,
        contained_counts_path=TRIG_TSV)

Creating initial UCS table: `ucs/trigger_eval/ANYmirror/TrigBigr_frq-thrMIN-7.35f_min10x.ds.gz

## Creating initial UCS table...

```
( cat /share/compling/projects/sanpi/results/freq_out/ANYmirror/ucs_format/TrigBigr_frq-thrMIN-7.35f.tsv \ 
  | ucs-make-tables --types --threshold=10 /share/compling/projects/sanpi/results/ucs/trigger_eval/ANYmirror/TrigBigr_frq-thrMIN-7.35f_min10x.ds.gz ) \ 
  && ucs-sort /share/compling/projects/sanpi/results/ucs/trigger_eval/ANYmirror/TrigBigr_frq-thrMIN-7.35f_min10x.ds.gz BY f2- f1- INTO /share/compling/projects/sanpi/results/ucs/trigger_eval/ANYmirror/TrigBigr_frq-thrMIN-7.35f_min10x.ds.gz
== Note ==
    N = total number of tokens/all counts summed
    V = total number of rows/number of unique l1+l2 combinations before filtering to 10+ tokens
+ time to make table → 00:00:02.201
```

Saving initial frequency table in readable .txt format...

```
ucs-print -o /share/compling/projects/sanpi/results/ucs/trigger_eval/ANYmirror/readable/TrigBigr_frq-thrM

# %% [markdown]

 Excerpt of initial UCS table

In [None]:
init_readable = UCS_DIR.joinpath(
    f'trigger_eval/{PAT_DIR}/readable'
).joinpath(f'{TRIG_TSV.name.replace(".tsv","")}_min{FRQ_FLOOR}x.init.txt')
! head -7 {init_readable}

        l1  l2                                f     f2      f1        N  
----------  ----------------------------  -----  -----  ------  -------  
        or  more_important                 1067  23085  326614  1761853  
 something  more_important                 2970  23085  318343  1761853  
       all  more_important                 3987  23085  249279  1761853  
      some  more_important                  321  23085  114929  1761853  
     never  more_important                 3853  23085  109723  1761853  


# %% [markdown]

## 3. Run `associate_ucs()` (if needed)

In [None]:
if not readable.is_file():
    associate_ucs(basic_ucs_path)

transform_ucs_log = f'/share/compling/projects/sanpi/logs/associate/ucs//ucs-{PAT_DIR}_Trig{UNIT}_frq-thrMIN-7-35f_min{FRQ_FLOOR}x*.log'
! head -15 `ls -t1 {transform_ucs_log} | head -1`
! echo '...'
! tail -2 `ls -t1 {transform_ucs_log} | head -1`


Calculating UCS associations...

```
bash /share/compling/projects/sanpi/script/transform_ucs.sh /share/compling/projects/sanpi/results/ucs/trigger_eval/ANYmirror/TrigBigr_frq-thrMIN-7.35f_min10x.ds.gz
> log will be saved to: /share/compling/projects/sanpi/logs/associate/ucs//ucs-ANYmirror_TrigBigr_frq-thrMIN-7-35f_min10x.2024-05-25_2135.log
...
```

+ time elapsed → 00:00:23.61
# Manipulating TrigBigr_frq-thrMIN-7-35f_min10x ucs table
path to this script: /share/compling/projects/sanpi/script/transform_ucs.sh
Sat May 25 21:35:10 EDT 2024
(TMP: /share/compling/projects/sanpi/results/ucs/trigger_eval/ANYmirror/tmp/tmp_ANYmirror-20240525-213510.TrigBigr_frq-thrMIN-7-35f_min10x)
## Initial Contingency Info

DATA SET FILE:  /share/compling/projects/sanpi/results/ucs/trigger_eval/ANYmirror/TrigBigr_frq-thrMIN-7.35f_min10x.ds.gz

# Frequency signatures computed by the ucs-make-tables tool for relational cooccurrences.
# Sample size:  N = 1761853 tokens,  V = 395338 pair types.
# A frequency

# %% [markdown]

### Define dictionary containing relevant vocab sizes
 !!! Warning This is a `#HACK`: \
     Rather than developing a command/code to retrieve the vocab sizes programmatically,
     I simply copied the values given in the log output of `transform_ucs.sh`
     for each `PAT_DIR`+`UNIT` combination

 |      |   ANYmirror |   NEGmirror |   POSmirror |
 |:-----|------------:|------------:|------------:|
 | Bigr |     395,338 |      64,644 |     330,694 |
 | Adv  |      23,125 |       5,004 |      18,121 |
 | Adj  |      83,422 |      21,562 |      61,860 |

In [None]:
VOCABS = {'ANYmirror': {'Adv': 23125, 'Bigr': 395338, 'Adj': 83422},
          'NEGmirror': {'Adv': 5004, 'Bigr': 64644, 'Adj': 21562},
          'POSmirror': {'Adv': 18121, 'Bigr': 330694, 'Adj': 61860}
          }  # HACK
VOCAB = VOCABS[PAT_DIR][UNIT]
pd.DataFrame(VOCABS)

Unnamed: 0,ANYmirror,NEGmirror,POSmirror
Adv,23125,5004,18121
Bigr,395338,64644,330694
Adj,83422,21562,61860


# %% [markdown]

## 4. Run `convert_ucs_to_csv()` (imported as `ucs2csv`) to convert `ucs/[PAT_DIR]/readable/*.txt` to a format that `pandas` can parse as a dataframe

In [None]:
! head -5 {readable}
csv_path = ucs2csv(readable)
print(f'CSV: `{csv_path.relative_to(RESULT_DIR)}`')

        l1  l2                                f           E11  am.log.likelihood  am.odds.ratio.disc    am.p1.given2     am.p2.given1  am.p1.given2.simple  am.p2.given1.simple      f1     f2        N  
----------  ----------------------------  -----  ------------  -----------------  ------------------  --------------  ---------------  -------------------  -------------------  ------  -----  -------  
    hardly  strictly_bluegrass               10     0.0310355        115.5224117        3.8297658232   0.99690210762    1.8288222e-03        1.00000000000        1.8288222e-03    5468     10  1761853  
 everybody  super_heady                      20     0.0904162        216.0126120        3.9566646052   0.99549049200    2.5109856e-03        1.00000000000        2.5109856e-03    7965     20  1761853  
        no  longer_viable                    56     0.2825661        592.7414834        4.3506693418   0.99498580143    6.2992126e-03        1.00000000000        6.2992126e-03    8890     56  

# %% [markdown]

## 5. Load the CSV as a `pandas` dataframe and index it by `l1~l2` key

In [None]:
trig_amdf = pd.read_csv(csv_path).convert_dtypes()
trig_amdf

Unnamed: 0,l1,l2,f,E11,am_log_likelihood,am_odds_ratio_disc,am_p1_given2,am_p2_given1,am_p1_given2_simple,am_p2_given1_simple,f1,f2,N
0,hardly,strictly_bluegrass,10,0.03,115.52,3.83,1.00,0.00,1.00,0.00,5468,10,1761853
1,everybody,super_heady,20,0.09,216.01,3.96,1.00,0.00,1.00,0.00,7965,20,1761853
2,no,longer_viable,56,0.28,592.74,4.35,0.99,0.01,1.00,0.01,8890,56,1761853
3,no,longer_pink,42,0.21,444.49,4.23,0.99,0.00,1.00,0.00,8890,42,1761853
4,no,longer_afraid,18,0.09,190.45,3.86,0.99,0.00,1.00,0.00,8890,18,1761853
...,...,...,...,...,...,...,...,...,...,...,...,...,...
22087,or,very_excited,16,461.78,-876.17,-1.53,-0.18,-0.00,0.01,0.00,326614,2491,1761853
22088,or,too_aware,13,420.44,-809.02,-1.58,-0.18,-0.00,0.01,0.00,326614,2268,1761853
22089,or,too_common,19,915.97,-1836.19,-1.76,-0.18,-0.00,0.00,0.00,326614,4941,1761853
22090,or,very_special,18,898.73,-1806.84,-1.78,-0.18,-0.00,0.00,0.00,326614,4848,1761853


In [None]:
# %%

trig_amdf['key'] = (trig_amdf.l1 + '~' +
                    trig_amdf.l2).astype('string')
trig_amdf = trig_amdf.set_index('key')
trig_amdf

Unnamed: 0_level_0,l1,l2,f,E11,am_log_likelihood,am_odds_ratio_disc,am_p1_given2,am_p2_given1,am_p1_given2_simple,am_p2_given1_simple,f1,f2,N
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1
hardly~strictly_bluegrass,hardly,strictly_bluegrass,10,0.03,115.52,3.83,1.00,0.00,1.00,0.00,5468,10,1761853
everybody~super_heady,everybody,super_heady,20,0.09,216.01,3.96,1.00,0.00,1.00,0.00,7965,20,1761853
no~longer_viable,no,longer_viable,56,0.28,592.74,4.35,0.99,0.01,1.00,0.01,8890,56,1761853
no~longer_pink,no,longer_pink,42,0.21,444.49,4.23,0.99,0.00,1.00,0.00,8890,42,1761853
no~longer_afraid,no,longer_afraid,18,0.09,190.45,3.86,0.99,0.00,1.00,0.00,8890,18,1761853
...,...,...,...,...,...,...,...,...,...,...,...,...,...
or~very_excited,or,very_excited,16,461.78,-876.17,-1.53,-0.18,-0.00,0.01,0.00,326614,2491,1761853
or~too_aware,or,too_aware,13,420.44,-809.02,-1.58,-0.18,-0.00,0.01,0.00,326614,2268,1761853
or~too_common,or,too_common,19,915.97,-1836.19,-1.76,-0.18,-0.00,0.00,0.00,326614,4941,1761853
or~very_special,or,very_special,18,898.73,-1806.84,-1.78,-0.18,-0.00,0.00,0.00,326614,4848,1761853


# %% [markdown]

## 6. Save to `./results/assoc_df/`

In [None]:
# Mirror the UCS-relative path under AM_DF_DIR, dropping the `readable/`
# directory level and the `.rsort-view_am-only` view suffix from the name.
am_relpath = str(csv_path.relative_to(UCS_DIR))
for fragment in ('/readable', '.rsort-view_am-only'):
    am_relpath = am_relpath.replace(fragment, '')
df_csv_path = AM_DF_DIR.joinpath(am_relpath)
df_pkl_path = df_csv_path.with_suffix('.pkl.gz')

# Existing files are never overwritten: remove them by hand to force a refresh.
if not df_csv_path.is_file():
    confirm_dir(df_csv_path.parent)
    trig_amdf.to_csv(df_csv_path)

if not df_pkl_path.is_file():
    trig_amdf.to_pickle(df_pkl_path)

# %% [markdown]

## 7. Add additional AM via `add_extra_am()`

In [None]:
ex_trig_amdf = add_extra_am(df=trig_amdf,
                            verbose=True,
                            vocab=VOCAB,
                            metrics=['t_score', 'mutual_information']
                            ).convert_dtypes()


Preview of Extended Measures (rounded)

| key                       |   t_score |   mutual_information |   deltaP_min |   deltaP_max |   deltaP_max_abs |   deltaP_product |   unexpected_f |   unexpected_ratio |
|:--------------------------|----------:|---------------------:|-------------:|-------------:|-----------------:|-----------------:|---------------:|-------------------:|
| hardly~strictly_bluegrass |      3.15 |                 2.51 |         0.00 |         1.00 |             1.00 |             0.00 |           9.97 |               1.00 |
| everybody~super_heady     |      4.45 |                 2.34 |         0.00 |         1.00 |             1.00 |             0.00 |          19.91 |               1.00 |
| no~longer_viable          |      7.45 |                 2.30 |         0.01 |         0.99 |             0.99 |             0.01 |          55.72 |               0.99 |
| no~longer_pink            |      6.45 |                 2.30 |         0.00 |         0.99 |          

#%% [markdown]

 Add trigger features as columns: polarity and quantification type

In [None]:
def add_feature(triggers: pd.Series,
                group_dict: dict) -> pd.Series:
    """Label each trigger with the name of the group that contains it.

    Args:
        triggers: Series of trigger words.
        group_dict: mapping of ``group name -> collection of trigger words``.

    Returns:
        Series aligned with ``triggers`` holding the group name for each
        trigger, or an empty string for triggers found in no group.
    """
    group_of = invert_set_dict(group_dict)

    def _group_name(trigger):
        # Unlisted triggers are labelled '' rather than raising or yielding NaN.
        return group_of.get(trigger, '')

    return triggers.apply(_group_name)

ex_trig_amdf['polarity'] = add_feature(ex_trig_amdf.l1, TRIGGER_POLARITY)
ex_trig_amdf['quant'] = add_feature(ex_trig_amdf.l1, TRIGGER_QUANT)

# %% [markdown]

 Save extended AM tables to `extra/` subdirectory if not already saved

In [None]:
df_extra_csv = df_csv_path.parent / 'extra' / \
    df_csv_path.name.replace('.csv', '_extra.csv')
print(df_extra_csv)
if not df_extra_csv.is_file():
    confirm_dir(df_extra_csv.parent)
    ex_trig_amdf.to_csv(df_extra_csv)

df_extra_pkl = df_extra_csv.with_suffix('.pkl.gz')
if not df_extra_pkl.is_file():
    ex_trig_amdf.to_pickle(df_extra_pkl)

/share/compling/projects/sanpi/results/assoc_df/trigger_eval/ANYmirror/extra/TrigBigr_frq-thrMIN-7.35f_min10x_extra.csv


In [None]:
# %%

# Keep an untouched copy of the complete extended table.
ex_trig_full = ex_trig_amdf.copy()
# Abbreviated view: the two trigger-feature columns plus whichever FOCUS
# columns exist, passed through `adjust_assoc_columns` and ordered by 'LRC'
# from highest to lowest.
# NOTE(review): presumably `adjust_assoc_columns` renames the columns to the
# short names seen downstream ('LRC', 'dP1', 'G2', ...) -- confirm in
# source.utils.associate.
ex_trig_abbr = adjust_assoc_columns(
    ex_trig_amdf[[c for c in ['polarity', 'quant'] + FOCUS if c in ex_trig_amdf.columns]]).sort_values('LRC', ascending=False)
# Column labels of the abbreviated table.
cols = ex_trig_abbr.columns

# %% [markdown]

 Define lexical items with given lean shown in binary environment evaluation

In [None]:
pos_prone = {
    'Adj': [
        'unrelated',
        'unable',
        'akin',
        'larger',
        'different',
        'familiar',
        'similar',
        'likely', 
        'brief', 
        'unaware'
    ],
    'Adv': [
        'slightly', 
        'definitely',
        'utterly',
        # LRC top
        'pretty', 
        'rather', 
        'plain', 
        'fairly', 
        'somewhat', 
        'otherwise', 
        'downright',
        'relatively', 
        # G2 top
        # 'very', 
        # 'even', 
        # 'just', 
        # dP1 top (and odds ratio disc)
        'plain', 
        'maybe'
    ], 
    'Bigr': [
        # G2 top
        'completely_different', 
        'too_familiar',
        'even_better',
        # dP1 top
        'quite_different', 
        'too_real', 
        'well_aware', 
        # LRC top
        'too_common', 
        'entirely_different'
        ]}
neg_prone = {
    'Bigr': [
        # LRC top
        'quite_sure',
        'really_sure', 
        'too_early', 
        'too_pleased', 
        'too_fancy',
        # dP1 top
        'entirely_sure', 
        'ever_easy', 
        'ever_perfect', 
        'particularly_surprising',
        'particularly_new',
        # G2 top
        'too_late', 
        'more_important',
        'so_easy', 
        'as_good', 
        'too_old'
        ], 
    'Adv': [
        'yet',
        #LRC top
        'ever',
        'any', 
        'longer', 
        'necessarily',
        'that',
        #dP1 top
        'before', 
        'wise',  #? How is this used as an adverb?
        'earthly',
        'remotely',
        'exactly',
        # G2 top
        'particularly', 
        'too',
        # 'inherently'
        ],
    'Adj': [
        # LRC top
        'early', 
        'late', 
        'fancy', 
        'alone', 
        'sure',
        # dP1 top
        'shabby',
        'demoralizing',
        'alone',
        'aggravating',
        'groundbreaking',
        'eventful',
        #G2 top
        'important', 
        'frustrating',
        'evident', 
        'certain'
        ]
    }
def sort_prone_by_f2(prone_list, amdf):
    """Order the listed `l2` items by their `f2` value, highest first.

    Args:
        prone_list: `l2` values of interest.
        amdf: frame with at least `l2` and `f2` columns.

    Returns:
        list of the `l2` values from ``prone_list`` that occur in ``amdf``,
        sorted by descending `f2`. Items absent from ``amdf`` are dropped.
    """
    is_listed = amdf.l2.isin(prone_list)
    # One row per distinct (f2, l2) pair, re-keyed by the l2 item.
    f2_by_item = (
        amdf.loc[is_listed, ['f2', 'l2']]
        .drop_duplicates()
        .reset_index(drop=True)
        .set_index('l2')
        .round(1)
    )
    ranked = f2_by_item.sort_values(['f2'], ascending=False)
    return ranked.index.to_list()
pos_prone[UNIT] = sort_prone_by_f2(pos_prone[UNIT], ex_trig_abbr)
neg_prone[UNIT] = sort_prone_by_f2(neg_prone[UNIT], ex_trig_abbr)
pos_prone[UNIT]

['completely_different',
 'too_familiar',
 'even_better',
 'too_common',
 'entirely_different',
 'quite_different',
 'too_real',
 'well_aware']

# %% [markdown]

## Strongest associations for each polarity by metric

In [None]:
def show_metric_top(amdf: pd.DataFrame,
                    metric: str,
                    k=5, cols=None):
    """Collect the `k` rows with the largest `metric` within each polarity group.

    Args:
        amdf: association table with `polarity`, `l1`, `l2` and `metric` columns.
        metric: name of the column to rank by; shown as the first column.
        k: number of rows to keep per polarity group.
        cols: columns to include, as any iterable of labels (list, tuple,
            pandas Index). It must contain `polarity`, `l1` and `l2`, which
            become the index. ``None``, an empty selection, or the former
            default ``[None]`` selects every column of ``amdf``.

    Returns:
        DataFrame indexed by (`polarity`, `l1`, `l2`), with `metric` first and
        the remaining selected columns in their given order.
    """
    # `not any(cols)` keeps the former `[None]` sentinel working for old callers.
    if cols is None or not any(cols):
        cols = amdf.columns
    # Plain list arithmetic, so list/tuple selections work as well as an Index.
    ordered_cols = [metric] + [col for col in cols if col != metric]

    top_per_polarity = pd.concat(
        [polar_df.nlargest(k, metric)
         for _, polar_df in amdf.groupby('polarity')])
    return (top_per_polarity
            .loc[:, ordered_cols]
            .reset_index(drop=True)
            .set_index(['polarity', 'l1', 'l2']))
def update_prone(exdf, pos_prone, neg_prone, unit=None, n_top=2) -> tuple:
    """Add the leading `l2` items of each polarity to the matching prone list.

    For 'positive' rows the first `n_top` `l2` values of ``exdf`` are appended
    to ``pos_prone[unit]``; for 'negative' rows, to ``neg_prone[unit]``. Items
    already present are not repeated. Polarities absent from ``exdf`` are
    skipped.

    Args:
        exdf: frame whose index has the polarity as its first level and a
            level named `l2` (the layout `show_metric_top` returns).
        pos_prone: dict of ``unit -> list of items``; modified in place.
        neg_prone: dict of ``unit -> list of items``; modified in place.
        unit: key of the lists to extend. Defaults to the module-level `UNIT`.
        n_top: how many leading rows per polarity to consider.

    Returns:
        tuple ``(pos_prone, neg_prone)`` -- the same (mutated) dict objects.
    """
    if unit is None:
        unit = UNIT
    polarity_labels = exdf.index.get_level_values(0)
    l2_labels = exdf.index.get_level_values('l2')

    for polarity, prone in (('positive', pos_prone), ('negative', neg_prone)):
        listed = prone.setdefault(unit, [])
        # Slicing the index keeps a sequence even when a single row matches;
        # squeezing a one-row selection would yield a bare string, and
        # iterating that would append its individual characters.
        for topw in l2_labels[polarity_labels == polarity][:n_top]:
            if topw not in listed:
                listed.append(topw)
    return pos_prone, neg_prone

# %% [markdown]

 Top conservative log ratio $LRC$ values

In [None]:
exdf = show_metric_top(ex_trig_abbr,"LRC")
pos_prone, neg_prone = update_prone(exdf, pos_prone, neg_prone)
exdf

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,LRC,quant,f,unexp_f,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
negative,none,too_pleased,8.8,not_exist,1272,1248.12,0.92,0.04,0.94,0.04,9701.23,1761853,31021,1356,23.88
negative,hardly,more_different,8.66,hedged_not_exist,491,488.69,0.66,0.09,0.66,0.09,4764.11,1761853,5468,744,2.31
negative,nobody,more_surprised,8.16,not_exist,166,165.14,0.69,0.03,0.69,0.03,1580.5,1761853,6311,239,0.86
negative,barely,even_noticeable,8.08,hedged_not_exist,26,25.96,0.46,0.02,0.46,0.02,300.92,1761853,1235,56,0.04
negative,no,earthly_good,7.74,not_exist,73,72.59,0.89,0.01,0.89,0.01,716.17,1761853,8890,82,0.41
positive,all,too_common,7.9,universal,4882,4182.91,0.85,0.02,0.99,0.02,18554.58,1761853,249279,4941,699.09
positive,all,too_familiar,7.65,universal,6933,5934.39,0.84,0.03,0.98,0.03,26063.93,1761853,249279,7058,998.61
positive,everything,all_right,7.45,universal,2166,2108.54,0.82,0.05,0.85,0.05,14379.56,1761853,39516,2562,57.46
positive,all,too_aware,7.11,universal,2229,1908.11,0.84,0.01,0.98,0.01,8352.56,1761853,249279,2268,320.89
positive,everything,humanly_possible,6.62,universal,252,245.36,0.83,0.01,0.85,0.01,1668.6,1761853,39516,296,6.64


# %% [markdown]

 Top $\Delta P(\texttt{trigger}|\texttt{adv})$ values

In [None]:
exdf = show_metric_top(ex_trig_abbr, 'dP1')
pos_prone, neg_prone = update_prone(exdf, pos_prone, neg_prone)
exdf

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,dP1,quant,f,unexp_f,LRC,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
negative,hardly,strictly_bluegrass,1.0,hedged_not_exist,10,9.97,3.04,0.0,1.0,0.0,115.52,1761853,5468,10,0.03
negative,no,longer_viable,0.99,not_exist,56,55.72,5.15,0.01,1.0,0.01,592.74,1761853,8890,56,0.28
negative,no,longer_pink,0.99,not_exist,42,41.79,4.71,0.0,1.0,0.0,444.49,1761853,8890,42,0.21
negative,no,longer_afraid,0.99,not_exist,18,17.91,3.36,0.0,1.0,0.0,190.45,1761853,8890,18,0.09
negative,no,longer_functional,0.99,not_exist,15,14.92,3.05,0.0,1.0,0.0,158.7,1761853,8890,15,0.08
positive,everybody,super_heady,1.0,universal,20,19.91,3.69,0.0,1.0,0.0,216.01,1761853,7965,20,0.09
positive,everything,generally_real,0.98,universal,18,17.6,1.18,0.0,1.0,0.0,136.71,1761853,39516,18,0.4
positive,everything,usually_accurate,0.98,universal,14,13.69,0.76,0.0,1.0,0.0,106.33,1761853,39516,14,0.31
positive,everything,generally_genuine,0.98,universal,11,10.75,0.33,0.0,1.0,0.0,83.55,1761853,39516,11,0.25
positive,everything,usually_correct,0.98,universal,10,9.78,0.16,0.0,1.0,0.0,75.95,1761853,39516,10,0.22


# %% [markdown]

 Top conditional probability $P(\texttt{trigger}|\texttt{adv})$ values

In [None]:
exdf = show_metric_top(ex_trig_abbr, 'dP1_simple')
pos_prone, neg_prone = update_prone(exdf, pos_prone, neg_prone)
exdf

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,dP1_simple,quant,f,unexp_f,LRC,dP1,dP2,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
negative,no,longer_viable,1.0,not_exist,56,55.72,5.15,0.99,0.01,0.01,592.74,1761853,8890,56,0.28
negative,no,longer_pink,1.0,not_exist,42,41.79,4.71,0.99,0.0,0.0,444.49,1761853,8890,42,0.21
negative,no,longer_afraid,1.0,not_exist,18,17.91,3.36,0.99,0.0,0.0,190.45,1761853,8890,18,0.09
negative,never,before_available,1.0,not_exist,175,164.1,3.13,0.94,0.0,0.0,971.92,1761853,109723,175,10.9
negative,no,longer_functional,1.0,not_exist,15,14.92,3.05,0.99,0.0,0.0,158.7,1761853,8890,15,0.08
positive,everybody,super_heady,1.0,universal,20,19.91,3.69,1.0,0.0,0.0,216.01,1761853,7965,20,0.09
positive,many,instantly_bookable,1.0,hedged_universal,31,30.17,1.8,0.97,0.0,0.0,224.53,1761853,47133,31,0.83
positive,or,otherwise_inappropriate,1.0,existential,199,162.11,1.54,0.81,0.0,0.0,670.87,1761853,326614,199,36.89
positive,or,otherwise_objectionable,1.0,existential,193,157.22,1.5,0.81,0.0,0.0,650.64,1761853,326614,193,35.78
positive,all,too_commonplace,1.0,universal,124,106.46,1.31,0.86,0.0,0.0,485.03,1761853,249279,124,17.54


# %% [markdown]

 Top $\Delta P(\texttt{adv}|\texttt{trigger})$ values

In [None]:
exdf = show_metric_top(ex_trig_abbr, 'dP2')
pos_prone, neg_prone = update_prone(exdf, pos_prone, neg_prone)
exdf

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,dP2,quant,f,unexp_f,LRC,dP1,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
negative,nobody,quite_sure,0.1,not_exist,660,649.31,5.96,0.22,0.22,0.1,4366.8,1761853,6311,2984,10.69
negative,never,too_late,0.1,not_exist,10770,9974.22,6.14,0.79,0.84,0.1,49945.41,1761853,109723,12778,795.78
negative,hardly,more_different,0.09,hedged_not_exist,491,488.69,8.66,0.66,0.66,0.09,4764.11,1761853,5468,744,2.31
negative,scarcely,more_different,0.08,hedged_not_exist,67,66.67,6.78,0.09,0.09,0.09,590.05,1761853,785,744,0.33
negative,nothing,more_important,0.06,not_exist,7208,5913.61,2.82,0.26,0.31,0.07,15088.39,1761853,98788,23085,1294.39
positive,somethings,more_likely,0.07,existential,12,11.27,1.77,0.0,0.0,0.08,45.63,1761853,157,8144,0.73
positive,everything,all_right,0.05,universal,2166,2108.54,7.45,0.82,0.85,0.05,14379.56,1761853,39516,2562,57.46
positive,something,as_simple,0.04,existential,12233,9350.33,3.75,0.59,0.77,0.04,26354.21,1761853,318343,15954,2882.67
positive,all,too_familiar,0.03,universal,6933,5934.39,7.65,0.84,0.98,0.03,26063.93,1761853,249279,7058,998.61
positive,someone,so_young,0.03,existential,811,789.99,6.28,0.63,0.65,0.03,5044.83,1761853,29662,1248,21.01


# %% [markdown]

 Top conditional probability $P(\texttt{adv}|\texttt{trigger})$ values

In [None]:
exdf = show_metric_top(ex_trig_abbr, 'dP2_simple')
pos_prone, neg_prone = update_prone(exdf, pos_prone, neg_prone)
exdf

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,dP2_simple,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
negative,nobody,quite_sure,0.1,not_exist,660,649.31,5.96,0.22,0.1,0.22,4366.8,1761853,6311,2984,10.69
negative,never,too_late,0.1,not_exist,10770,9974.22,6.14,0.79,0.1,0.84,49945.41,1761853,109723,12778,795.78
negative,hardly,more_different,0.09,hedged_not_exist,491,488.69,8.66,0.66,0.09,0.66,4764.11,1761853,5468,744,2.31
negative,scarcely,more_different,0.09,hedged_not_exist,67,66.67,6.78,0.09,0.08,0.09,590.05,1761853,785,744,0.33
negative,nothing,more_important,0.07,not_exist,7208,5913.61,2.82,0.26,0.06,0.31,15088.39,1761853,98788,23085,1294.39
positive,somethings,more_likely,0.08,existential,12,11.27,1.77,0.0,0.07,0.0,45.63,1761853,157,8144,0.73
positive,everything,all_right,0.05,universal,2166,2108.54,7.45,0.82,0.05,0.85,14379.56,1761853,39516,2562,57.46
positive,something,as_simple,0.04,existential,12233,9350.33,3.75,0.59,0.04,0.77,26354.21,1761853,318343,15954,2882.67
positive,all,too_familiar,0.03,universal,6933,5934.39,7.65,0.84,0.03,0.98,26063.93,1761853,249279,7058,998.61
positive,someone,so_young,0.03,existential,811,789.99,6.28,0.63,0.03,0.65,5044.83,1761853,29662,1248,21.01


# %% [markdown]

 Top log-likelihood $G^2$ values

In [None]:
exdf = show_metric_top(ex_trig_abbr, 'G2')
pos_prone, neg_prone = update_prone(exdf, pos_prone, neg_prone)
exdf

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,G2,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
negative,never,too_late,49945.41,not_exist,10770,9974.22,6.14,0.79,0.1,0.84,0.1,1761853,109723,12778,795.78
negative,never,too_early,25284.55,not_exist,4890,4568.77,7.59,0.89,0.04,0.95,0.04,1761853,109723,5158,321.23
negative,nothing,more_important,15088.39,not_exist,7208,5913.61,2.82,0.26,0.06,0.31,0.07,1761853,98788,23085,1294.39
negative,none,too_pleased,9701.23,not_exist,1272,1248.12,8.8,0.92,0.04,0.94,0.04,1761853,31021,1356,23.88
negative,never,so_easy,9479.17,not_exist,2501,2272.01,4.71,0.62,0.02,0.68,0.02,1761853,109723,3677,228.99
positive,something,as_simple,26354.21,existential,12233,9350.33,3.75,0.59,0.04,0.77,0.04,1761853,318343,15954,2882.67
positive,all,too_familiar,26063.93,universal,6933,5934.39,7.65,0.84,0.03,0.98,0.03,1761853,249279,7058,998.61
positive,all,too_easy,20628.24,universal,6505,5466.2,5.26,0.75,0.03,0.89,0.03,1761853,249279,7342,1038.8
positive,something,completely_different,19710.6,existential,7372,5862.91,4.81,0.71,0.02,0.88,0.02,1761853,318343,8352,1509.09
positive,all,too_common,18554.58,universal,4882,4182.91,7.9,0.85,0.02,0.99,0.02,1761853,249279,4941,699.09


In [None]:
# %%

sig_trig_abbr = ex_trig_abbr.loc[ex_trig_abbr.LRC.abs() > 1, :]
def show_prone_ex(amdf: pd.DataFrame, prone_list, list_index:int=0, max_rows:int=10):
    """Display the association rows for one entry of `prone_list`.

    The entry at `list_index` is printed as a banner and then used to select
    the rows of `amdf` whose index label ends in ``~<entry>``.

    NOTE: the entry is interpolated into a regular expression *unescaped*, so
    callers may deliberately pass a pattern such as ``r'exactly\\w*'`` instead
    of a literal string.

    Parameters
    ----------
    amdf : pd.DataFrame
        Association table; its index labels are matched against the pattern.
    prone_list : sequence of str
        Candidate strings (or regex fragments) to look up.
    list_index : int, default 0
        Position in `prone_list` of the entry to show.
    max_rows : int, default 10
        Maximum number of matching rows to return (in `amdf`'s existing
        order). Pass ``None`` to return every match.

    Returns
    -------
    tuple
        ``(list_index + 1, rows)`` so the caller can feed the first element
        back in to step through the list. When `list_index` is past the end
        of `prone_list`, ``rows`` is a short message string instead of a
        DataFrame.
    """
    next_index = list_index + 1
    try:
        example = prone_list[list_index]
    except IndexError:
        # Past the end of the list: still advance the cursor, but report it.
        return next_index, f'No {list_index}th entry'

    print(f'>> {example} <<')
    # Anchor on the '~' before the entry and on end-of-label so that only
    # labels whose trailing part is the entry are kept.
    matches = amdf.filter(regex=f'~{example}$', axis=0)
    return next_index, matches.iloc[:max_rows, :]

# %% [markdown]

 ---
 Significant examples for items demonstrating a *positive* polarity environment lean overall (up to 10 rows per item, restricted to $|LRC| > 1$)

In [None]:
# Candidate items collected under the current UNIT in pos_prone; the cells
# below step through this list one entry at a time.
prone = pos_prone[UNIT]
prone

['completely_different',
 'too_familiar',
 'even_better',
 'too_common',
 'entirely_different',
 'quite_different',
 'too_real',
 'well_aware',
 'super_heady',
 'generally_real',
 'instantly_bookable',
 'more_likely',
 'all_right',
 'as_simple']

In [None]:
# %%

# Reset the cursor to the first entry of `prone`, then show that entry's rows.
# show_prone_ex returns the next position, which is stored back into `ix`.
ix = 0
ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> completely_different <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
something~completely_different,positive,existential,7372,5862.91,4.81,0.71,0.02,0.88,0.02,19710.6,1761853,318343,8352,1509.09,something,completely_different
both~completely_different,positive,universal,42,-195.06,-1.26,-0.02,-0.0,0.01,0.0,-250.18,1761853,50007,8352,237.06,both,completely_different
everyone~completely_different,positive,universal,11,-142.24,-1.35,-0.02,-0.0,0.0,0.0,-229.63,1761853,32327,8352,153.24,everyone,completely_different
often~completely_different,positive,hedged_universal,57,-380.23,-1.92,-0.05,-0.0,0.01,0.0,-547.83,1761853,92233,8352,437.23,often,completely_different
many~completely_different,positive,hedged_universal,10,-213.43,-1.92,-0.03,-0.0,0.0,0.0,-371.29,1761853,47133,8352,223.43,many,completely_different
sometimes~completely_different,positive,existential,38,-316.15,-1.94,-0.04,-0.0,0.0,0.0,-476.39,1761853,74707,8352,354.15,sometimes,completely_different
all~completely_different,positive,universal,207,-974.7,-2.12,-0.12,-0.0,0.02,0.0,-1359.54,1761853,249279,8352,1181.7,all,completely_different
or~completely_different,positive,existential,214,-1334.3,-2.55,-0.16,-0.01,0.03,0.0,-2074.41,1761853,326614,8352,1548.3,or,completely_different
always~completely_different,positive,universal,14,-375.67,-2.67,-0.05,-0.0,0.0,0.0,-677.46,1761853,82200,8352,389.67,always,completely_different
some~completely_different,positive,existential,22,-522.82,-2.97,-0.06,-0.0,0.0,0.0,-941.23,1761853,114929,8352,544.82,some,completely_different


In [None]:
# %%

# Show the entry of `prone` at position `ix`. The call advances `ix`, so this
# cell is not idempotent: re-running it moves on to the following entry.
ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> too_familiar <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
all~too_familiar,positive,universal,6933,5934.39,7.65,0.84,0.03,0.98,0.03,26063.93,1761853,249279,7058,998.61,all,too_familiar
many~too_familiar,positive,hedged_universal,15,-173.82,-1.57,-0.02,-0.0,0.0,0.0,-276.67,1761853,47133,7058,188.82,many,too_familiar
never~too_familiar,negative,not_exist,15,-424.55,-2.84,-0.06,-0.0,0.0,0.0,-776.2,1761853,109723,7058,439.55,never,too_familiar
some~too_familiar,positive,existential,11,-449.41,-3.01,-0.06,-0.0,0.0,0.0,-848.49,1761853,114929,7058,460.41,some,too_familiar
something~too_familiar,positive,existential,18,-1257.29,-4.49,-0.18,-0.0,0.0,0.0,-2622.73,1761853,318343,7058,1275.29,something,too_familiar
or~too_familiar,positive,existential,16,-1292.42,-4.59,-0.18,-0.0,0.0,0.0,-2721.11,1761853,326614,7058,1308.42,or,too_familiar


In [None]:
# %%

# Show the entry of `prone` at position `ix`. The call advances `ix`, so this
# cell is not idempotent: re-running it moves on to the following entry.
ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> even_better <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
or~even_better,positive,existential,4352,3220.62,3.22,0.53,0.01,0.71,0.01,8110.68,1761853,326614,6103,1131.38,or,even_better
both~even_better,positive,universal,25,-148.22,-1.18,-0.02,-0.0,0.0,0.0,-203.79,1761853,50007,6103,173.22,both,even_better
some~even_better,positive,existential,94,-304.11,-1.3,-0.05,-0.0,0.02,0.0,-353.65,1761853,114929,6103,398.11,some,even_better
many~even_better,positive,hedged_universal,14,-149.27,-1.38,-0.02,-0.0,0.0,0.0,-233.96,1761853,47133,6103,163.27,many,even_better
often~even_better,positive,hedged_universal,54,-265.49,-1.51,-0.04,-0.0,0.01,0.0,-351.8,1761853,92233,6103,319.49,often,even_better
always~even_better,positive,universal,10,-274.74,-2.3,-0.05,-0.0,0.0,0.0,-496.24,1761853,82200,6103,284.74,always,even_better
all~even_better,positive,universal,59,-804.49,-3.0,-0.13,-0.0,0.01,0.0,-1413.02,1761853,249279,6103,863.49,all,even_better


In [None]:
# %%

# Show the entry of `prone` at position `ix`. The call advances `ix`, so this
# cell is not idempotent: re-running it moves on to the following entry.
ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> too_common <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
all~too_common,positive,universal,4882,4182.91,7.9,0.85,0.02,0.99,0.02,18554.58,1761853,249279,4941,699.09,all,too_common
or~too_common,positive,existential,19,-896.97,-3.99,-0.18,-0.0,0.0,0.0,-1836.19,1761853,326614,4941,915.97,or,too_common
something~too_common,positive,existential,11,-881.77,-4.15,-0.18,-0.0,0.0,0.0,-1849.27,1761853,318343,4941,892.77,something,too_common


In [None]:
# %%

# Show the entry of `prone` at position `ix`. The call advances `ix`, so this
# cell is not idempotent: re-running it moves on to the following entry.
ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> entirely_different <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
something~entirely_different,positive,existential,3115,2517.29,5.58,0.76,0.01,0.94,0.01,9289.5,1761853,318343,3308,597.71,something,entirely_different
often~entirely_different,positive,hedged_universal,15,-158.17,-1.48,-0.05,-0.0,0.0,0.0,-251.1,1761853,92233,3308,173.17,often,entirely_different
or~entirely_different,positive,existential,45,-568.24,-2.81,-0.17,-0.0,0.01,0.0,-1014.8,1761853,326614,3308,613.24,or,entirely_different
all~entirely_different,positive,universal,14,-454.04,-3.08,-0.14,-0.0,0.0,0.0,-879.78,1761853,249279,3308,468.04,all,entirely_different


In [None]:
# %%

# Show the entry of `prone` at position `ix`. The call advances `ix`, so this
# cell is not idempotent: re-running it moves on to the following entry.
ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> quite_different <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
something~quite_different,positive,existential,2268,1697.03,3.2,0.54,0.01,0.72,0.01,4366.68,1761853,318343,3160,570.97,something,quite_different
always~quite_different,positive,universal,18,-129.43,-1.15,-0.04,-0.0,0.01,0.0,-188.85,1761853,82200,3160,147.43,always,quite_different
or~quite_different,positive,existential,34,-551.8,-2.97,-0.17,-0.0,0.01,0.0,-1021.82,1761853,326614,3160,585.8,or,quite_different


In [None]:
# %%

# Show the entry of `prone` at position `ix`. The call advances `ix`, so this
# cell is not idempotent: re-running it moves on to the following entry.
ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> too_real <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
all~too_real,positive,universal,2250,1920.19,6.47,0.82,0.01,0.97,0.01,8138.56,1761853,249279,2331,329.81,all,too_real
or~too_real,positive,existential,22,-410.12,-2.82,-0.18,-0.0,0.01,0.0,-772.67,1761853,326614,2331,432.12,or,too_real


In [None]:
# %%

# Show the entry of `prone` at position `ix`. The call advances `ix`, so this
# cell is not idempotent: re-running it moves on to the following entry.
ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> well_aware <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
everyone~well_aware,positive,universal,391,360.27,3.55,0.22,0.01,0.23,0.01,1357.91,1761853,32327,1675,30.73,everyone,well_aware
all~well_aware,positive,universal,821,584.01,2.14,0.35,0.0,0.49,0.0,1151.78,1761853,249279,1675,236.99,all,well_aware
everybody~well_aware,positive,universal,65,57.43,2.12,0.03,0.01,0.04,0.01,167.05,1761853,7965,1675,7.57,everybody,well_aware
many~well_aware,positive,hedged_universal,145,100.19,1.07,0.06,0.0,0.09,0.0,146.68,1761853,47133,1675,44.81,many,well_aware
or~well_aware,positive,existential,34,-276.51,-2.03,-0.17,-0.0,0.02,0.0,-455.5,1761853,326614,1675,310.51,or,well_aware
something~well_aware,positive,existential,24,-278.65,-2.24,-0.17,-0.0,0.01,0.0,-489.04,1761853,318343,1675,302.65,something,well_aware


In [None]:
# %%

# Show the entry of `prone` at position `ix`. The call advances `ix`, so this
# cell is not idempotent: re-running it moves on to the following entry.
ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> super_heady <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
everybody~super_heady,positive,universal,20,19.91,3.69,1.0,0.0,1.0,0.0,216.01,1761853,7965,20,0.09,everybody,super_heady


In [None]:
# %%

# Show the entry of `prone` at position `ix`. The call advances `ix`, so this
# cell is not idempotent: re-running it moves on to the following entry.
ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> generally_real <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
everything~generally_real,positive,universal,18,17.6,1.18,0.98,0.0,1.0,0.0,136.71,1761853,39516,18,0.4,everything,generally_real


# %% [markdown]

 ---
## Examples for items demonstrating a *negative* polarity environment lean overall (up to 10 rows per item, restricted to $|LRC| > 1$)

In [None]:
# Candidate items collected under the current UNIT in neg_prone.
prone_list = neg_prone[UNIT]
# Keep only the candidates that occur as `l2` in the |LRC| > 1 table, reduce
# them to unique (f2, l2) pairs, and order the names by `f2`, largest first.
prone = (
    sig_trig_abbr.copy()
    .loc[sig_trig_abbr.l2.isin(prone_list), ['f2', 'l2']]
    .drop_duplicates()
    .reset_index(drop=True)
    .set_index('l2')
    .round(1)
    .sort_values(['f2'], ascending=False)
    .index.to_list()
)
prone

['more_important',
 'too_late',
 'as_good',
 'too_early',
 'so_easy',
 'too_old',
 'quite_sure',
 'too_pleased',
 'really_sure',
 'more_different',
 'too_fancy',
 'particularly_new',
 'ever_easy',
 'entirely_sure',
 'ever_perfect',
 'particularly_surprising',
 'longer_viable',
 'longer_pink',
 'strictly_bluegrass']

In [None]:
# %%

# Reset the cursor to the first entry of `prone`, then show that entry's rows.
# show_prone_ex returns the next position, which is stored back into `ix`.
ix = 0
ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> more_important <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
nothing~more_important,negative,not_exist,7208,5913.61,2.82,0.26,0.06,0.31,0.07,15088.39,1761853,98788,23085,1294.39,nothing,more_important
never~more_important,negative,not_exist,3853,2415.33,1.45,0.11,0.02,0.17,0.04,3104.12,1761853,109723,23085,1437.67,never,more_important
nor~more_important,negative,not_exist,37,-166.69,-1.12,-0.01,-0.01,0.0,0.0,-210.2,1761853,15546,23085,203.69,nor,more_important
some~more_important,positive,existential,321,-1184.88,-1.85,-0.05,-0.01,0.01,0.0,-1454.52,1761853,114929,23085,1505.88,some,more_important
or~more_important,positive,existential,1067,-3212.52,-1.97,-0.14,-0.01,0.05,0.0,-4020.1,1761853,326614,23085,4279.52,or,more_important
everything~more_important,positive,universal,61,-456.77,-2.06,-0.02,-0.01,0.0,0.0,-667.25,1761853,39516,23085,517.77,everything,more_important
both~more_important,positive,universal,44,-611.23,-2.7,-0.03,-0.01,0.0,0.0,-1009.05,1761853,50007,23085,655.23,both,more_important
everyone~more_important,positive,universal,15,-408.57,-2.73,-0.02,-0.01,0.0,0.0,-729.55,1761853,32327,23085,423.57,everyone,more_important
many~more_important,positive,hedged_universal,22,-595.57,-3.1,-0.03,-0.01,0.0,0.0,-1067.86,1761853,47133,23085,617.57,many,more_important


In [None]:
# %%

# Show the entry of `prone` at position `ix`. The call advances `ix`, so this
# cell is not idempotent: re-running it moves on to the following entry.
ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> too_late <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
never~too_late,negative,not_exist,10770,9974.22,6.14,0.79,0.1,0.84,0.1,49945.41,1761853,109723,12778,795.78,never,too_late
always~too_late,positive,universal,150,-446.16,-1.37,-0.04,-0.01,0.01,0.0,-497.06,1761853,82200,12778,596.16,always,too_late
everything~too_late,positive,universal,30,-256.59,-1.79,-0.02,-0.01,0.0,0.0,-384.72,1761853,39516,12778,286.59,everything,too_late
or~too_late,positive,existential,588,-1780.8,-1.89,-0.14,-0.01,0.05,0.0,-2223.57,1761853,326614,12778,2368.8,or,too_late
many~too_late,positive,hedged_universal,12,-329.84,-2.5,-0.03,-0.01,0.0,0.0,-590.34,1761853,47133,12778,341.84,many,too_late
all~too_late,positive,universal,240,-1567.92,-2.57,-0.12,-0.01,0.02,0.0,-2392.25,1761853,249279,12778,1807.92,all,too_late
both~too_late,positive,universal,10,-352.68,-2.62,-0.03,-0.01,0.0,0.0,-646.04,1761853,50007,12778,362.68,both,too_late
nothing~too_late,negative,not_exist,18,-698.47,-3.46,-0.06,-0.01,0.0,0.0,-1309.26,1761853,98788,12778,716.47,nothing,too_late
some~too_late,positive,existential,16,-817.53,-3.74,-0.06,-0.01,0.0,0.0,-1569.54,1761853,114929,12778,833.53,some,too_late


In [None]:
# %%

# Show the entry of `prone` at position `ix`. The call advances `ix`, so this
# cell is not idempotent: re-running it moves on to the following entry.
ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> as_good <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
never~as_good,negative,not_exist,1981,1615.37,2.71,0.28,0.02,0.34,0.02,4018.2,1761853,109723,5871,365.63,never,as_good
rarely~as_good,negative,hedged_not_exist,118,103.21,2.27,0.02,0.02,0.02,0.03,287.92,1761853,4439,5871,14.79,rarely,as_good
none~as_good,negative,not_exist,444,340.63,1.79,0.06,0.01,0.08,0.01,637.36,1761853,31021,5871,103.37,none,as_good
neither~as_good,negative,not_exist,92,70.48,1.26,0.01,0.01,0.02,0.01,127.99,1761853,6458,5871,21.52,neither,as_good
all~as_good,positive,universal,274,-556.67,-1.24,-0.1,-0.0,0.05,0.0,-566.34,1761853,249279,5871,830.67,all,as_good
something~as_good,positive,existential,377,-683.81,-1.25,-0.12,-0.0,0.06,0.0,-682.28,1761853,318343,5871,1060.81,something,as_good


In [None]:
# %%

# Show the entry of `prone` at position `ix`. The call advances `ix`, so this
# cell is not idempotent: re-running it moves on to the following entry.
ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> too_early <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
never~too_early,negative,not_exist,4890,4568.77,7.59,0.89,0.04,0.95,0.04,25284.55,1761853,109723,5158,321.23,never,too_early
always~too_early,positive,universal,50,-190.65,-1.16,-0.04,-0.0,0.01,0.0,-231.93,1761853,82200,5158,240.65,always,too_early
sometimes~too_early,positive,existential,24,-194.71,-1.56,-0.04,-0.0,0.0,0.0,-291.47,1761853,74707,5158,218.71,sometimes,too_early
often~too_early,positive,hedged_universal,10,-260.02,-2.23,-0.05,-0.0,0.0,0.0,-468.49,1761853,92233,5158,270.02,often,too_early
or~too_early,positive,existential,99,-857.19,-2.71,-0.17,-0.0,0.02,0.0,-1432.19,1761853,326614,5158,956.19,or,too_early
all~too_early,positive,universal,30,-699.79,-3.31,-0.14,-0.0,0.01,0.0,-1315.56,1761853,249279,5158,729.79,all,too_early


In [None]:
# %%

# Show the entry of `prone` at position `ix`. The call advances `ix`, so this
# cell is not idempotent: re-running it moves on to the following entry.
ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> so_easy <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
never~so_easy,negative,not_exist,2501,2272.01,4.71,0.62,0.02,0.68,0.02,9479.17,1761853,109723,3677,228.99,never,so_easy
often~so_easy,positive,hedged_universal,20,-172.49,-1.5,-0.05,-0.0,0.01,0.0,-263.15,1761853,92233,3677,192.49,often,so_easy
some~so_easy,positive,existential,32,-207.86,-1.53,-0.06,-0.0,0.01,0.0,-299.53,1761853,114929,3677,239.86,some,so_easy
something~so_easy,positive,existential,137,-527.38,-1.8,-0.14,-0.0,0.04,0.0,-710.59,1761853,318343,3677,664.38,something,so_easy
or~so_easy,positive,existential,42,-639.65,-3.03,-0.17,-0.0,0.01,0.0,-1174.53,1761853,326614,3677,681.65,or,so_easy


In [None]:
# %%

# Show the entry of `prone` at position `ix`. The call advances `ix`, so this
# cell is not idempotent: re-running it moves on to the following entry.
ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> too_old <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
never~too_old,negative,not_exist,2218,2013.61,4.67,0.61,0.02,0.68,0.02,8356.35,1761853,109723,3282,204.39,never,too_old
either~too_old,positive,existential,40,32.76,1.18,0.01,0.01,0.01,0.01,71.84,1761853,3886,3282,7.24,either,too_old
always~too_old,positive,universal,16,-137.12,-1.26,-0.04,-0.0,0.0,0.0,-208.13,1761853,82200,3282,153.12,always,too_old
often~too_old,positive,hedged_universal,21,-150.81,-1.3,-0.05,-0.0,0.01,0.0,-220.8,1761853,92233,3282,171.81,often,too_old
all~too_old,positive,universal,96,-368.36,-1.6,-0.11,-0.0,0.03,0.0,-480.89,1761853,249279,3282,464.36,all,too_old


In [None]:
# %%

# Show the entry of `prone` at position `ix`. The call advances `ix`, so this
# cell is not idempotent: re-running it moves on to the following entry.
ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> quite_sure <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
nobody~quite_sure,negative,not_exist,660,649.31,5.96,0.22,0.1,0.22,0.1,4366.8,1761853,6311,2984,10.69,nobody,quite_sure
never~quite_sure,negative,not_exist,2176,1990.17,5.0,0.67,0.02,0.73,0.02,8739.05,1761853,109723,2984,185.83,never,quite_sure


In [None]:
# %%

# Show the entry of `prone` at position `ix`. The call advances `ix`, so this
# cell is not idempotent: re-running it moves on to the following entry.
ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> too_pleased <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
none~too_pleased,negative,not_exist,1272,1248.12,8.8,0.92,0.04,0.94,0.04,9701.23,1761853,31021,1356,23.88,none,too_pleased


In [None]:
# %%

# Show the entry of `prone` at position `ix`. The call advances `ix`, so this
# cell is not idempotent: re-running it moves on to the following entry.
ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> really_sure <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
nobody~really_sure,negative,not_exist,285,281.73,6.4,0.31,0.04,0.31,0.05,2093.12,1761853,6311,914,3.27,nobody,really_sure
never~really_sure,negative,not_exist,559,502.08,4.01,0.55,0.0,0.61,0.01,1930.7,1761853,109723,914,56.92,never,really_sure


In [None]:
# %%

# Show the entry of `prone` at position `ix`. The call advances `ix`, so this
# cell is not idempotent: re-running it moves on to the following entry.
ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> more_different <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
hardly~more_different,negative,hedged_not_exist,491,488.69,8.66,0.66,0.09,0.66,0.09,4764.11,1761853,5468,744,2.31,hardly,more_different
scarcely~more_different,negative,hedged_not_exist,67,66.67,6.78,0.09,0.08,0.09,0.09,590.05,1761853,785,744,0.33,scarcely,more_different


In [None]:
# %%

# Show the entry of `prone` at position `ix`. The call advances `ix`, so this
# cell is not idempotent: re-running it moves on to the following entry.
ix, exdf = show_prone_ex(sig_trig_abbr, prone, ix)
exdf

>> too_fancy <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
nothing~too_fancy,negative,not_exist,521,490.55,6.85,0.9,0.01,0.96,0.01,2823.11,1761853,98788,543,30.45,nothing,too_fancy


In [None]:
# %%

# Ad hoc lookup with a one-element list holding a regex fragment rather than a
# literal item: show_prone_ex embeds it as `~<fragment>$`, so this matches keys
# whose part after '~' starts with "exactly" (or, when UNIT is 'Adj', with "un").
# NOTE: list_index defaults to 0 here, so `ix` is overwritten with 1 and no
# longer tracks the position in `prone`.
ix, exdf = show_prone_ex(sig_trig_abbr, [r'exactly\w*'] if UNIT!='Adj' else [r'un\w+'])
exdf

>> exactly\w* <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
nobody~exactly_sure,negative,not_exist,65,64.47,6.41,0.44,0.01,0.44,0.01,530.42,1761853,6311,148,0.53,nobody,exactly_sure
none~exactly_new,negative,not_exist,18,17.47,3.33,0.58,0.0,0.6,0.0,105.48,1761853,31021,30,0.53,none,exactly_new
never~exactly_clear,negative,not_exist,45,41.76,3.26,0.8,0.0,0.87,0.0,209.68,1761853,109723,52,3.24,never,exactly_clear
neither~exactly_right,negative,not_exist,14,13.51,2.66,0.1,0.0,0.1,0.0,68.01,1761853,6458,135,0.49,neither,exactly_right
none~exactly_alike,negative,not_exist,23,21.49,2.35,0.25,0.0,0.27,0.0,88.19,1761853,31021,86,1.51,none,exactly_alike
everything~exactly_right,positive,universal,35,31.97,2.32,0.24,0.0,0.26,0.0,115.87,1761853,39516,135,3.03,everything,exactly_right
never~exactly_sure,negative,not_exist,67,57.78,2.28,0.39,0.0,0.45,0.0,178.61,1761853,109723,148,9.22,never,exactly_sure
none~exactly_right,negative,not_exist,21,18.62,1.41,0.14,0.0,0.16,0.0,57.02,1761853,31021,135,2.38,none,exactly_right
never~exactly_easy,negative,not_exist,16,14.75,1.32,0.74,0.0,0.8,0.0,69.34,1761853,109723,20,1.25,never,exactly_easy


In [None]:
# Ad hoc regex lookup: show_prone_ex embeds the fragment as `~that\w*$`, i.e.
# keys whose part after '~' starts with "that".
# NOTE: list_index defaults to 0, so `ix` is overwritten with 1 by this call.
ix, exdf = show_prone_ex(sig_trig_abbr, [r'that\w*'])
exdf

>> that\w* <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
rarely~that_straightforward,negative,hedged_not_exist,14,13.88,4.74,0.29,0.0,0.29,0.0,109.81,1761853,4439,48,0.12,rarely,that_straightforward
rarely~that_simple,negative,hedged_not_exist,63,61.67,4.65,0.12,0.01,0.12,0.01,370.87,1761853,4439,529,1.33,rarely,that_simple
nobody~that_stupid,negative,not_exist,18,17.78,4.54,0.29,0.0,0.29,0.0,128.41,1761853,6311,62,0.22,nobody,that_stupid
never~that_easy,negative,not_exist,332,300.86,4.12,0.6,0.0,0.66,0.0,1227.51,1761853,109723,500,31.14,never,that_easy
never~that_great,negative,not_exist,214,192.83,3.76,0.57,0.0,0.63,0.0,756.46,1761853,109723,340,21.17,never,that_great
never~that_popular,negative,not_exist,60,55.64,3.69,0.79,0.0,0.86,0.0,277.04,1761853,109723,70,4.36,never,that_popular
never~that_simple,negative,not_exist,303,270.06,3.61,0.51,0.0,0.57,0.0,990.03,1761853,109723,529,32.94,never,that_simple
never~that_close,negative,not_exist,55,50.83,3.49,0.76,0.0,0.82,0.0,243.96,1761853,109723,67,4.17,never,that_close
never~that_good,negative,not_exist,327,288.7,3.43,0.47,0.0,0.53,0.0,1003.36,1761853,109723,615,38.3,never,that_good
never~that_interested,negative,not_exist,50,45.83,3.16,0.68,0.0,0.75,0.0,203.93,1761853,109723,67,4.17,never,that_interested


In [None]:
# Ad hoc regex lookup: show_prone_ex embeds the fragment as `~immediately\w*$`,
# i.e. keys whose part after '~' starts with "immediately".
# NOTE: list_index defaults to 0, so `ix` is overwritten with 1 by this call.
ix, exdf = show_prone_ex(sig_trig_abbr, [r'immediately\w*'])
exdf

>> immediately\w* <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
nobody~immediately_available,negative,not_exist,58,57.02,5.01,0.21,0.01,0.21,0.01,372.5,1761853,6311,274,0.98,nobody,immediately_available
neither~immediately_available,negative,not_exist,27,26.0,3.23,0.09,0.0,0.1,0.0,128.41,1761853,6458,274,1.0,neither,immediately_available
none~immediately_available,negative,not_exist,51,46.18,2.4,0.17,0.0,0.19,0.0,156.67,1761853,31021,274,4.82,none,immediately_available
nor~immediately_clear,negative,not_exist,10,9.62,2.13,0.22,0.0,0.23,0.0,48.56,1761853,15546,43,0.38,nor,immediately_clear


In [None]:
# Ad hoc regex lookup: show_prone_ex embeds the fragment as `~increasingly\w*$`,
# i.e. keys whose part after '~' starts with "increasingly".
# NOTE: list_index defaults to 0, so `ix` is overwritten with 1 by this call.
ix, exdf = show_prone_ex(sig_trig_abbr, [r'increasingly\w*'])
exdf

>> increasingly\w* <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
many~increasingly_concerned,positive,hedged_universal,18,17.36,2.9,0.72,0.0,0.75,0.0,103.7,1761853,47133,24,0.64,many,increasingly_concerned
many~increasingly_worried,positive,hedged_universal,10,9.55,1.65,0.56,0.0,0.59,0.0,49.77,1761853,47133,17,0.45,many,increasingly_worried


In [None]:
# Ad hoc regex lookup: show_prone_ex embeds the fragment as `~definitely\w*$`,
# i.e. keys whose part after '~' starts with "definitely".
# NOTE: list_index defaults to 0, so `ix` is overwritten with 1 by this call.
ix, exdf = show_prone_ex(sig_trig_abbr, [r'definitely\w*'])
exdf

>> definitely\w* <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
something~definitely_wrong,positive,existential,359,293.23,4.65,0.81,0.0,0.99,0.0,1178.01,1761853,318343,364,65.77,something,definitely_wrong
some~definitely_better,positive,existential,43,38.63,2.59,0.58,0.0,0.64,0.0,150.6,1761853,114929,67,4.37,some,definitely_better
something~definitely_different,positive,existential,34,26.59,1.05,0.65,0.0,0.83,0.0,81.66,1761853,318343,41,7.41,something,definitely_different


In [None]:
# Ad hoc regex lookup: show_prone_ex embeds the fragment as `~before\w*$`,
# i.e. keys whose part after '~' starts with "before".
# NOTE: list_index defaults to 0, so `ix` is overwritten with 1 by this call.
ix, exdf = show_prone_ex(sig_trig_abbr, [r'before\w*'])
exdf

>> before\w* <<


Unnamed: 0_level_0,polarity,quant,f,unexp_f,LRC,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f,l1,l2
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
never~before_available,negative,not_exist,175,164.1,3.13,0.94,0.0,1.0,0.0,971.92,1761853,109723,175,10.9,never,before_available


In [None]:
# Restrict to index labels containing '~very', then rank by 'LRC'.
# NOTE(review): show_metric_top is defined outside this section; the trailing 10
# is presumably the number of rows to keep per polarity -- TODO confirm.
show_metric_top(sig_trig_abbr.filter(like='~very', axis=0), 'LRC', 10)

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,LRC,quant,f,unexp_f,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
negative,nothing,very_remarkable,2.36,not_exist,48,42.51,0.43,0.0,0.49,0.0,146.56,1761853,98788,98,5.49
negative,neither,very_appealing,1.95,not_exist,17,15.87,0.05,0.0,0.06,0.0,61.44,1761853,6458,307,1.13
negative,neither,very_attractive,1.67,not_exist,17,15.64,0.04,0.0,0.05,0.0,55.39,1761853,6458,370,1.36
negative,neither,very_good,1.56,not_exist,130,102.75,0.01,0.02,0.02,0.02,203.84,1761853,6458,7434,27.25
negative,none,very_convincing,1.46,not_exist,19,17.05,0.15,0.0,0.17,0.0,55.16,1761853,31021,111,1.95
negative,none,very_likeable,1.33,not_exist,13,11.91,0.19,0.0,0.21,0.0,43.09,1761853,31021,62,1.09
negative,none,very_surprising,1.26,not_exist,25,21.53,0.11,0.0,0.13,0.0,58.2,1761853,31021,197,3.47
negative,neither,very_likely,1.18,not_exist,17,15.09,0.03,0.0,0.03,0.0,44.69,1761853,6458,520,1.91
negative,never,very_good,1.09,not_exist,1079,616.03,0.08,0.01,0.15,0.01,653.72,1761853,109723,7434,462.97
negative,never,very_nice,-1.17,not_exist,17,-127.05,-0.05,-0.0,0.01,0.0,-188.9,1761853,109723,2313,144.05


In [None]:
# Keep rows whose key contains '~exactly' (l2 begins with "exactly"), metric 'LRC'.
show_metric_top(
    sig_trig_abbr.filter(like='~exactly', axis='index'),
    'LRC',
    10,
)

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,LRC,quant,f,unexp_f,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
negative,nobody,exactly_sure,6.41,not_exist,65,64.47,0.44,0.01,0.44,0.01,530.42,1761853,6311,148,0.53
negative,none,exactly_new,3.33,not_exist,18,17.47,0.58,0.0,0.6,0.0,105.48,1761853,31021,30,0.53
negative,never,exactly_clear,3.26,not_exist,45,41.76,0.8,0.0,0.87,0.0,209.68,1761853,109723,52,3.24
negative,neither,exactly_right,2.66,not_exist,14,13.51,0.1,0.0,0.1,0.0,68.01,1761853,6458,135,0.49
negative,none,exactly_alike,2.35,not_exist,23,21.49,0.25,0.0,0.27,0.0,88.19,1761853,31021,86,1.51
negative,never,exactly_sure,2.28,not_exist,67,57.78,0.39,0.0,0.45,0.0,178.61,1761853,109723,148,9.22
negative,none,exactly_right,1.41,not_exist,21,18.62,0.14,0.0,0.16,0.0,57.02,1761853,31021,135,2.38
negative,never,exactly_easy,1.32,not_exist,16,14.75,0.74,0.0,0.8,0.0,69.34,1761853,109723,20,1.25
positive,everything,exactly_right,2.32,universal,35,31.97,0.24,0.0,0.26,0.0,115.87,1761853,39516,135,3.03


In [None]:
# 'body~' keeps rows whose l1 (the part of the key before '~') ends in "body",
# e.g. "nobody"; metric 'LRC'.
show_metric_top(
    sig_trig_abbr.filter(like='body~', axis='index'),
    'LRC',
    10,
)

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,LRC,quant,f,unexp_f,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
negative,nobody,more_surprised,8.16,not_exist,166,165.14,0.69,0.03,0.69,0.03,1580.5,1761853,6311,239,0.86
negative,nobody,more_disappointed,6.52,not_exist,67,66.48,0.46,0.01,0.46,0.01,554.53,1761853,6311,146,0.52
negative,nobody,more_frustrated,6.48,not_exist,56,55.58,0.48,0.01,0.48,0.01,469.71,1761853,6311,117,0.42
negative,nobody,exactly_sure,6.41,not_exist,65,64.47,0.44,0.01,0.44,0.01,530.42,1761853,6311,148,0.53
negative,nobody,really_sure,6.4,not_exist,285,281.73,0.31,0.04,0.31,0.05,2093.12,1761853,6311,914,3.27
negative,nobody,even_sure,6.01,not_exist,32,31.76,0.48,0.01,0.48,0.01,269.41,1761853,6311,66,0.24
negative,nobody,ever_happy,5.98,not_exist,25,24.84,0.55,0.0,0.56,0.0,220.01,1761853,6311,45,0.16
negative,nobody,quite_sure,5.96,not_exist,660,649.31,0.22,0.1,0.22,0.1,4366.8,1761853,6311,2984,10.69
negative,nobody,seriously_hurt,5.9,not_exist,49,48.53,0.37,0.01,0.37,0.01,379.68,1761853,6311,131,0.47
negative,nobody,more_committed,5.87,not_exist,28,27.79,0.48,0.0,0.48,0.0,235.38,1761853,6311,58,0.21


In [None]:
# Keep rows whose key contains the substring 'terribly' anywhere; metric 'LRC'.
show_metric_top(
    sig_trig_abbr.filter(like='terribly', axis='index'),
    'LRC',
    10,
)

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,LRC,quant,f,unexp_f,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
negative,nothing,terribly_new,4.0,not_exist,64,60.02,0.85,0.0,0.9,0.0,323.91,1761853,98788,71,3.98
negative,none,terribly_surprising,3.67,not_exist,32,30.82,0.46,0.0,0.48,0.0,167.05,1761853,31021,67,1.18
negative,nothing,terribly_exciting,3.3,not_exist,71,64.83,0.59,0.0,0.65,0.0,270.62,1761853,98788,110,6.17
negative,nothing,terribly_original,3.13,not_exist,38,35.42,0.77,0.0,0.83,0.0,177.4,1761853,98788,46,2.58
negative,none,terribly_interesting,2.26,not_exist,19,17.84,0.27,0.0,0.29,0.0,75.95,1761853,31021,66,1.16
negative,nothing,terribly_unusual,1.9,not_exist,20,18.65,0.78,0.0,0.83,0.0,94.08,1761853,98788,24,1.35
negative,never,terribly_interested,1.73,not_exist,24,21.32,0.5,0.0,0.56,0.0,76.68,1761853,109723,43,2.68
negative,never,terribly_good,1.62,not_exist,21,18.76,0.52,0.0,0.58,0.0,69.63,1761853,109723,36,2.24
negative,nothing,terribly_interesting,1.59,not_exist,28,24.3,0.37,0.0,0.42,0.0,75.76,1761853,98788,66,3.7
negative,nothing,terribly_surprising,1.46,not_exist,27,23.24,0.35,0.0,0.4,0.0,69.86,1761853,98788,67,3.76


In [None]:
# Keep rows whose key contains the substring 'definitely'; metric 'LRC'.
show_metric_top(
    sig_trig_abbr.filter(like='definitely', axis='index'),
    'LRC',
    10,
)

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,LRC,quant,f,unexp_f,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
positive,something,definitely_wrong,4.65,existential,359,293.23,0.81,0.0,0.99,0.0,1178.01,1761853,318343,364,65.77
positive,some,definitely_better,2.59,existential,43,38.63,0.58,0.0,0.64,0.0,150.6,1761853,114929,67,4.37
positive,something,definitely_different,1.05,existential,34,26.59,0.65,0.0,0.83,0.0,81.66,1761853,318343,41,7.41


In [None]:
# Keep rows whose key contains the substring 'slightly'; metric 'LRC'.
show_metric_top(
    sig_trig_abbr.filter(like='slightly', axis='index'),
    'LRC',
    10,
)

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,LRC,quant,f,unexp_f,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
positive,or,slightly_higher,3.24,existential,310,240.11,0.64,0.0,0.82,0.0,719.79,1761853,326614,377,69.89
positive,or,slightly_more,3.04,existential,181,141.33,0.66,0.0,0.85,0.0,439.69,1761853,326614,214,39.67
positive,or,slightly_lower,2.8,existential,165,127.55,0.63,0.0,0.82,0.0,379.03,1761853,326614,202,37.45
positive,or,slightly_better,2.26,existential,190,139.58,0.51,0.0,0.7,0.0,341.14,1761853,326614,272,50.42
positive,something,slightly_different,2.25,existential,743,516.24,0.41,0.0,0.59,0.0,1050.59,1761853,318343,1255,226.76
positive,or,slightly_less,2.0,existential,79,60.28,0.6,0.0,0.78,0.0,169.44,1761853,326614,101,18.72
positive,or,slightly_larger,1.79,existential,143,101.1,0.45,0.0,0.63,0.0,218.9,1761853,326614,226,41.9
positive,or,slightly_damp,1.61,existential,49,38.8,0.71,0.0,0.89,0.0,129.72,1761853,326614,55,10.2
positive,or,slightly_wider,1.46,existential,55,44.25,0.76,0.0,0.95,0.0,163.01,1761853,326614,58,10.75
positive,or,slightly_golden,1.4,existential,71,57.47,0.79,0.0,0.97,0.0,221.82,1761853,326614,73,13.53


In [None]:
# Keep rows whose key contains the substring 'highly'; metric 'LRC'.
show_metric_top(
    sig_trig_abbr.filter(like='highly', axis='index'),
    'LRC',
    10,
)

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,LRC,quant,f,unexp_f,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
positive,both,highly_functional,2.53,universal,18,17.09,0.53,0.0,0.56,0.0,85.18,1761853,50007,32,0.91
positive,both,highly_efficient,2.46,universal,20,18.84,0.46,0.0,0.49,0.0,86.88,1761853,50007,41,1.16
positive,often,highly_complex,2.3,hedged_universal,55,48.3,0.38,0.0,0.43,0.0,157.45,1761853,92233,128,6.7
positive,all,highly_qualified,2.24,universal,145,112.32,0.49,0.0,0.63,0.0,288.41,1761853,249279,231,32.68
positive,both,highly_intelligent,2.14,universal,33,29.82,0.27,0.0,0.29,0.0,103.86,1761853,50007,112,3.18
positive,both,highly_contagious,2.11,universal,17,15.92,0.42,0.0,0.45,0.0,70.06,1761853,50007,38,1.08
positive,both,highly_effective,2.07,universal,62,53.88,0.19,0.0,0.22,0.0,155.6,1761853,50007,286,8.12
positive,both,highly_addictive,2.0,universal,19,17.58,0.35,0.0,0.38,0.0,70.74,1761853,50007,50,1.42
positive,both,highly_successful,1.88,universal,35,30.94,0.22,0.0,0.24,0.0,96.42,1761853,50007,143,4.06
positive,many,highly_critical,1.74,hedged_universal,41,35.46,0.17,0.0,0.2,0.0,99.91,1761853,47133,207,5.54


In [None]:
# Keep rows whose key contains the substring 'remotely'; metric 'LRC'.
show_metric_top(
    sig_trig_abbr.filter(like='remotely', axis='index'),
    'LRC',
    10,
)

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,LRC,quant,f,unexp_f,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
negative,none,remotely_true,4.66,not_exist,44,42.84,0.65,0.0,0.67,0.0,272.29,1761853,31021,66,1.16
negative,nothing,remotely_comparable,3.26,not_exist,42,39.36,0.84,0.0,0.89,0.0,210.75,1761853,98788,47,2.64
negative,none,remotely_possible,3.24,not_exist,23,22.12,0.44,0.0,0.46,0.0,117.8,1761853,31021,50,0.88
negative,nothing,remotely_close,3.22,not_exist,139,124.25,0.47,0.0,0.53,0.0,451.7,1761853,98788,263,14.75
negative,nothing,remotely_similar,3.05,not_exist,64,58.06,0.55,0.0,0.6,0.0,231.32,1761853,98788,106,5.94
negative,none,remotely_accurate,2.51,not_exist,11,10.72,0.67,0.0,0.69,0.0,69.17,1761853,31021,16,0.28
negative,nothing,remotely_funny,2.48,not_exist,32,29.2,0.58,0.0,0.64,0.0,121.14,1761853,98788,50,2.8
negative,nothing,remotely_interesting,2.41,not_exist,42,37.57,0.48,0.0,0.53,0.0,137.1,1761853,98788,79,4.43
negative,nothing,remotely_new,1.66,not_exist,17,15.77,0.72,0.0,0.77,0.0,74.96,1761853,98788,22,1.23
negative,none,remotely_close,1.54,not_exist,34,29.37,0.11,0.0,0.13,0.0,80.33,1761853,31021,263,4.63


In [None]:
# Keep rows whose key contains the substring 'absolutely'; metric 'LRC'.
show_metric_top(
    sig_trig_abbr.filter(like='absolutely', axis='index'),
    'LRC',
    10,
)

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,LRC,quant,f,unexp_f,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
negative,nobody,absolutely_sure,2.68,not_exist,13,12.57,0.11,0.0,0.11,0.0,65.12,1761853,6311,119,0.43
negative,never,absolutely_sure,2.23,not_exist,56,48.59,0.41,0.0,0.47,0.0,154.5,1761853,109723,119,7.41
negative,never,absolutely_certain,2.2,not_exist,67,57.41,0.37,0.0,0.44,0.0,172.34,1761853,109723,154,9.59
positive,everything,absolutely_perfect,4.75,universal,120,115.36,0.56,0.0,0.58,0.0,633.99,1761853,39516,207,4.64
positive,everything,absolutely_true,3.6,universal,73,68.87,0.37,0.0,0.4,0.0,312.41,1761853,39516,184,4.13
positive,everything,absolutely_ideal,2.93,universal,16,15.51,0.7,0.0,0.73,0.0,96.01,1761853,39516,22,0.49
positive,everything,absolutely_delicious,2.92,universal,44,41.02,0.31,0.0,0.33,0.0,169.41,1761853,39516,133,2.98
positive,everything,absolutely_free,2.91,universal,84,76.82,0.24,0.0,0.26,0.0,280.41,1761853,39516,320,7.18
positive,everything,absolutely_fine,2.53,universal,23,21.61,0.35,0.0,0.37,0.0,94.69,1761853,39516,62,1.39
positive,something,absolutely_new,2.19,existential,83,64.39,0.63,0.0,0.81,0.0,190.61,1761853,318343,103,18.61


In [None]:
# Keep rows whose key contains the substring 'downright'; metric 'LRC'.
show_metric_top(
    sig_trig_abbr.filter(like='downright', axis='index'),
    'LRC',
    10,
)

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,LRC,quant,f,unexp_f,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
positive,sometimes,downright_scary,2.03,existential,40,35.25,0.31,0.0,0.36,0.0,113.11,1761853,74707,112,4.75
positive,sometimes,downright_difficult,1.97,existential,16,15.11,0.72,0.0,0.76,0.0,78.52,1761853,74707,21,0.89
positive,sometimes,downright_painful,1.72,existential,24,21.41,0.35,0.0,0.39,0.0,73.15,1761853,74707,61,2.59
positive,sometimes,downright_frustrating,1.71,existential,14,13.19,0.69,0.0,0.74,0.0,67.03,1761853,74707,19,0.81
positive,some,downright_awful,1.59,existential,34,28.91,0.37,0.0,0.44,0.0,84.73,1761853,114929,78,5.09
positive,some,downright_ugly,1.54,existential,33,27.98,0.36,0.0,0.43,0.0,80.94,1761853,114929,77,5.02
positive,sometimes,downright_bizarre,1.4,existential,30,25.55,0.24,0.0,0.29,0.0,70.5,1761853,74707,105,4.45
positive,some,downright_dangerous,1.4,existential,51,40.82,0.26,0.0,0.33,0.0,95.44,1761853,114929,156,10.18
positive,some,downright_hilarious,1.36,existential,33,27.46,0.32,0.0,0.39,0.0,73.64,1761853,114929,85,5.54
positive,or,downright_impossible,1.36,existential,57,41.8,0.51,0.0,0.7,0.0,101.54,1761853,326614,82,15.2


In [None]:
# Keep rows whose key contains the substring 'utterly'; metric 'LRC'.
show_metric_top(
    sig_trig_abbr.filter(like='utterly', axis='index'),
    'LRC',
    10,
)

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,LRC,quant,f,unexp_f,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
positive,something,utterly_different,1.89,existential,63,48.91,0.63,0.0,0.81,0.0,145.2,1761853,318343,78,14.09
positive,something,utterly_unique,1.08,existential,37,28.15,0.57,0.0,0.76,0.0,76.85,1761853,318343,49,8.85


In [None]:
# Keep rows whose key contains the substring 'slightly'; metric 'LRC'.
# NOTE(review): this repeats an earlier 'slightly' cell in this notebook with the
# same arguments and the same saved output — candidate for removal.
show_metric_top(
    sig_trig_abbr.filter(like='slightly', axis='index'),
    'LRC',
    10,
)

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,LRC,quant,f,unexp_f,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
positive,or,slightly_higher,3.24,existential,310,240.11,0.64,0.0,0.82,0.0,719.79,1761853,326614,377,69.89
positive,or,slightly_more,3.04,existential,181,141.33,0.66,0.0,0.85,0.0,439.69,1761853,326614,214,39.67
positive,or,slightly_lower,2.8,existential,165,127.55,0.63,0.0,0.82,0.0,379.03,1761853,326614,202,37.45
positive,or,slightly_better,2.26,existential,190,139.58,0.51,0.0,0.7,0.0,341.14,1761853,326614,272,50.42
positive,something,slightly_different,2.25,existential,743,516.24,0.41,0.0,0.59,0.0,1050.59,1761853,318343,1255,226.76
positive,or,slightly_less,2.0,existential,79,60.28,0.6,0.0,0.78,0.0,169.44,1761853,326614,101,18.72
positive,or,slightly_larger,1.79,existential,143,101.1,0.45,0.0,0.63,0.0,218.9,1761853,326614,226,41.9
positive,or,slightly_damp,1.61,existential,49,38.8,0.71,0.0,0.89,0.0,129.72,1761853,326614,55,10.2
positive,or,slightly_wider,1.46,existential,55,44.25,0.76,0.0,0.95,0.0,163.01,1761853,326614,58,10.75
positive,or,slightly_golden,1.4,existential,71,57.47,0.79,0.0,0.97,0.0,221.82,1761853,326614,73,13.53


In [None]:
# Keep rows whose key contains the substring 'extremely'; metric 'LRC'.
show_metric_top(
    sig_trig_abbr.filter(like='extremely', axis='index'),
    'LRC',
    10,
)

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,LRC,quant,f,unexp_f,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
positive,all,extremely_innovative,5.23,universal,379,324.24,0.84,0.0,0.98,0.0,1407.34,1761853,249279,387,54.76
positive,everyone,extremely_friendly,4.78,universal,103,99.5,0.52,0.0,0.54,0.0,563.6,1761853,32327,191,3.5
positive,everyone,extremely_nice,4.54,universal,65,62.85,0.54,0.0,0.56,0.0,361.07,1761853,32327,117,2.15
positive,everyone,extremely_welcoming,3.41,universal,24,23.14,0.49,0.0,0.51,0.0,127.65,1761853,32327,47,0.86
positive,both,extremely_talented,2.87,universal,55,50.63,0.33,0.0,0.36,0.0,196.83,1761853,50007,154,4.37
positive,always,extremely_careful,2.8,universal,39,35.87,0.54,0.0,0.58,0.0,150.69,1761853,82200,67,3.13
positive,many,extremely_scarce,2.68,hedged_universal,17,16.28,0.6,0.0,0.63,0.0,88.07,1761853,47133,27,0.72
positive,everyone,extremely_supportive,2.57,universal,32,29.78,0.25,0.0,0.26,0.0,119.41,1761853,32327,121,2.22
positive,everyone,extremely_excited,2.57,universal,50,45.74,0.2,0.0,0.22,0.0,164.8,1761853,32327,232,4.26
positive,always,extremely_responsive,2.57,universal,25,23.32,0.65,0.0,0.69,0.0,109.99,1761853,82200,36,1.68


In [None]:
# Keep rows whose key contains the substring 'necessarily'; metric 'LRC'.
show_metric_top(
    sig_trig_abbr.filter(like='necessarily', axis='index'),
    'LRC',
    10,
)

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,LRC,quant,f,unexp_f,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
negative,neither,necessarily_true,6.22,not_exist,32,31.79,0.55,0.0,0.55,0.0,279.53,1761853,6458,58,0.21
negative,nothing,necessarily_wrong,5.42,not_exist,194,182.0,0.85,0.0,0.91,0.0,987.67,1761853,98788,214,12.0
negative,neither,necessarily_better,3.95,not_exist,10,9.89,0.34,0.0,0.34,0.0,74.97,1761853,6458,29,0.11
negative,none,necessarily_bad,3.35,not_exist,25,24.05,0.45,0.0,0.46,0.0,128.46,1761853,31021,54,0.95
negative,neither,necessarily_bad,3.35,not_exist,11,10.8,0.2,0.0,0.2,0.0,69.13,1761853,6458,54,0.2
negative,none,necessarily_better,1.95,not_exist,11,10.49,0.36,0.0,0.38,0.0,51.02,1761853,31021,29,0.51
negative,nor,necessarily_desirable,1.85,not_exist,12,11.89,0.99,0.0,1.0,0.0,113.54,1761853,15546,12,0.11
negative,none,necessarily_true,1.2,not_exist,12,10.98,0.19,0.0,0.21,0.0,39.45,1761853,31021,58,1.02


In [None]:
# Keep rows whose key contains the substring 'quite'; metric 'LRC'.
# NOTE(review): 15 is passed as the third argument, yet the saved output lists
# 10 rows — confirm how show_metric_top uses this value.
show_metric_top(
    sig_trig_abbr.filter(like='quite', axis='index'),
    'LRC',
    15,
)

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,LRC,quant,f,unexp_f,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
negative,nobody,quite_sure,5.96,not_exist,660,649.31,0.22,0.1,0.22,0.1,4366.8,1761853,6311,2984,10.69
negative,never,quite_able,5.76,not_exist,319,297.27,0.85,0.0,0.91,0.0,1571.33,1761853,109723,349,21.73
negative,never,quite_sure,5.0,not_exist,2176,1990.17,0.67,0.02,0.73,0.02,8739.05,1761853,109723,2984,185.83
negative,never,quite_clear,4.41,not_exist,399,363.75,0.64,0.0,0.7,0.0,1551.45,1761853,109723,566,35.25
negative,never,quite_enough,4.36,not_exist,150,138.17,0.73,0.0,0.79,0.0,642.61,1761853,109723,190,11.83
negative,neither,quite_ready,4.27,not_exist,28,27.46,0.19,0.0,0.19,0.0,171.52,1761853,6458,148,0.54
negative,never,quite_satisfied,4.15,not_exist,144,132.11,0.69,0.0,0.75,0.0,592.6,1761853,109723,191,11.89
negative,nobody,quite_certain,3.48,not_exist,23,22.34,0.12,0.0,0.12,0.0,121.39,1761853,6311,185,0.66
negative,never,quite_certain,3.44,not_exist,117,105.48,0.57,0.0,0.63,0.0,415.15,1761853,109723,185,11.52
negative,never,quite_right,3.24,not_exist,217,191.16,0.46,0.0,0.52,0.0,656.23,1761853,109723,415,25.84


In [None]:
# Keep rows whose key contains the substring 'terribly'; metric 'LRC'.
# NOTE(review): same filter and metric as an earlier 'terribly' cell, which passes
# 10 instead of 15; the saved outputs of the two cells are identical.
show_metric_top(
    sig_trig_abbr.filter(like='terribly', axis='index'),
    'LRC',
    15,
)

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,LRC,quant,f,unexp_f,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
negative,nothing,terribly_new,4.0,not_exist,64,60.02,0.85,0.0,0.9,0.0,323.91,1761853,98788,71,3.98
negative,none,terribly_surprising,3.67,not_exist,32,30.82,0.46,0.0,0.48,0.0,167.05,1761853,31021,67,1.18
negative,nothing,terribly_exciting,3.3,not_exist,71,64.83,0.59,0.0,0.65,0.0,270.62,1761853,98788,110,6.17
negative,nothing,terribly_original,3.13,not_exist,38,35.42,0.77,0.0,0.83,0.0,177.4,1761853,98788,46,2.58
negative,none,terribly_interesting,2.26,not_exist,19,17.84,0.27,0.0,0.29,0.0,75.95,1761853,31021,66,1.16
negative,nothing,terribly_unusual,1.9,not_exist,20,18.65,0.78,0.0,0.83,0.0,94.08,1761853,98788,24,1.35
negative,never,terribly_interested,1.73,not_exist,24,21.32,0.5,0.0,0.56,0.0,76.68,1761853,109723,43,2.68
negative,never,terribly_good,1.62,not_exist,21,18.76,0.52,0.0,0.58,0.0,69.63,1761853,109723,36,2.24
negative,nothing,terribly_interesting,1.59,not_exist,28,24.3,0.37,0.0,0.42,0.0,75.76,1761853,98788,66,3.7
negative,nothing,terribly_surprising,1.46,not_exist,27,23.24,0.35,0.0,0.4,0.0,69.86,1761853,98788,67,3.76


In [None]:
# Keep rows whose key contains the substring 'dreadfully'; metric 'LRC'.
show_metric_top(
    sig_trig_abbr.filter(like='dreadfully', axis='index'),
    'LRC',
    15,
)

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,LRC,quant,f,unexp_f,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
positive,something,dreadfully_wrong,2.69,existential,97,78.57,0.77,0.0,0.95,0.0,294.04,1761853,318343,102,18.43


In [None]:
# Keep rows whose key contains the substring 'particularly'; metric 'LRC'.
show_metric_top(
    sig_trig_abbr.filter(like='particularly', axis='index'),
    'LRC',
    15,
)

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,LRC,quant,f,unexp_f,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
negative,nothing,particularly_wrong,5.83,not_exist,211,198.78,0.91,0.0,0.97,0.0,1155.16,1761853,98788,218,12.22
negative,nothing,particularly_new,5.2,not_exist,336,313.01,0.76,0.0,0.82,0.0,1558.57,1761853,98788,410,22.99
negative,nothing,particularly_special,4.85,not_exist,318,294.79,0.71,0.0,0.77,0.0,1396.02,1761853,98788,414,23.21
negative,nothing,particularly_unusual,4.7,not_exist,152,141.63,0.77,0.0,0.82,0.0,706.39,1761853,98788,185,10.37
negative,nothing,particularly_remarkable,4.47,not_exist,96,89.78,0.81,0.0,0.86,0.0,467.08,1761853,98788,111,6.22
negative,neither,particularly_effective,4.41,not_exist,24,23.61,0.22,0.0,0.23,0.0,156.51,1761853,6458,106,0.39
negative,none,particularly_surprising,4.33,not_exist,78,75.04,0.45,0.0,0.46,0.0,401.5,1761853,31021,168,2.96
negative,neither,particularly_appealing,3.91,not_exist,16,15.73,0.21,0.0,0.22,0.0,102.68,1761853,6458,74,0.27
negative,neither,particularly_good,3.84,not_exist,52,50.24,0.1,0.01,0.11,0.01,257.56,1761853,6458,480,1.76
negative,none,particularly_likeable,3.61,not_exist,19,18.54,0.71,0.0,0.73,0.0,123.47,1761853,31021,26,0.46


In [None]:
# Keep rows whose key contains the substring 'inherently'; metric 'LRC'.
# NOTE(review): this cell queries ex_trig_abbr, whereas the surrounding cells all
# query sig_trig_abbr — confirm the different frame is intentional.
show_metric_top(
    ex_trig_abbr.filter(like='inherently', axis='index'),
    'LRC',
    15,
)

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,LRC,quant,f,unexp_f,dP1,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
negative,nothing,inherently_wrong,5.74,not_exist,1472,1371.13,0.76,0.01,0.82,0.01,6834.42,1761853,98788,1799,100.87
negative,neither,inherently_better,3.66,not_exist,13,12.78,0.21,0.0,0.22,0.0,83.48,1761853,6458,60,0.22
negative,neither,inherently_good,2.91,not_exist,15,14.53,0.11,0.0,0.12,0.0,76.4,1761853,6458,129,0.47
negative,nothing,inherently_bad,2.65,not_exist,86,75.57,0.41,0.0,0.46,0.0,250.36,1761853,98788,186,10.43
negative,nothing,inherently_evil,2.49,not_exist,51,45.39,0.45,0.0,0.51,0.0,160.96,1761853,98788,100,5.61
negative,none,inherently_bad,2.35,not_exist,38,34.73,0.19,0.0,0.2,0.0,123.95,1761853,31021,186,3.27
negative,nothing,inherently_special,2.25,not_exist,25,22.93,0.62,0.0,0.68,0.0,98.82,1761853,98788,37,2.07
negative,nothing,inherently_good,1.93,not_exist,50,42.77,0.33,0.0,0.39,0.0,124.99,1761853,98788,129,7.23
negative,nothing,inherently_immoral,1.67,not_exist,17,15.65,0.65,0.0,0.71,0.0,69.79,1761853,98788,24,1.35
negative,nothing,inherently_dangerous,1.31,not_exist,29,24.4,0.3,0.0,0.35,0.0,66.68,1761853,98788,82,4.6


In [None]:
# Keep rows whose key contains the substring 'terribly'; this time the metric
# handed to show_metric_top is 'dP1' rather than 'LRC'.
show_metric_top(
    sig_trig_abbr.filter(like='terribly', axis='index'),
    'dP1',
    15,
)

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,dP1,quant,f,unexp_f,LRC,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
negative,nothing,terribly_new,0.85,not_exist,64,60.02,4.0,0.0,0.9,0.0,323.91,1761853,98788,71,3.98
negative,nothing,terribly_unusual,0.78,not_exist,20,18.65,1.9,0.0,0.83,0.0,94.08,1761853,98788,24,1.35
negative,nothing,terribly_original,0.77,not_exist,38,35.42,3.13,0.0,0.83,0.0,177.4,1761853,98788,46,2.58
negative,never,terribly_popular,0.73,not_exist,15,13.82,1.2,0.0,0.79,0.0,64.24,1761853,109723,19,1.18
negative,never,terribly_fond,0.69,not_exist,15,13.75,1.26,0.0,0.75,0.0,61.44,1761853,109723,20,1.25
negative,nothing,terribly_exciting,0.59,not_exist,71,64.83,3.3,0.0,0.65,0.0,270.62,1761853,98788,110,6.17
negative,nothing,terribly_serious,0.53,not_exist,13,11.77,1.04,0.0,0.59,0.0,46.18,1761853,98788,22,1.23
negative,never,terribly_good,0.52,not_exist,21,18.76,1.62,0.0,0.58,0.0,69.63,1761853,109723,36,2.24
negative,nothing,terribly_complicated,0.5,not_exist,14,12.6,1.11,0.0,0.56,0.0,47.65,1761853,98788,25,1.4
negative,never,terribly_interested,0.5,not_exist,24,21.32,1.73,0.0,0.56,0.0,76.68,1761853,109723,43,2.68


In [None]:
# Regex '~un\w+_' keeps keys whose l2 starts with a word beginning "un"
# (keys look like 'l1~l2', with l2 of the form 'word_word'); metric 'dP1'.
# The pattern is a raw string: '\w' is not a valid Python string escape, so a
# non-raw literal emits an invalid-escape warning (SyntaxWarning on Python 3.12+).
show_metric_top(sig_trig_abbr.filter(regex=r'~un\w+_', axis=0), 'dP1', 15)

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,dP1,quant,f,unexp_f,LRC,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
positive,something,uniquely_special,0.7,existential,58,46.07,1.94,0.0,0.88,0.0,152.92,1761853,318343,66,11.93
positive,something,uniquely_american,0.58,existential,38,28.97,1.13,0.0,0.76,0.0,79.71,1761853,318343,50,9.03
positive,many,understandably_concerned,0.41,hedged_universal,15,14.09,2.01,0.0,0.44,0.0,63.01,1761853,47133,34,0.91
positive,all,uniquely_different,0.39,universal,53,38.85,1.13,0.0,0.53,0.0,83.37,1761853,249279,100,14.15
positive,often,unintentionally_hilarious,0.38,hedged_universal,19,16.7,1.28,0.0,0.43,0.0,54.61,1761853,92233,44,2.3


In [None]:
# '_un' keeps rows whose key contains "_un", i.e. the word after the underscore
# in l2 begins with "un" (e.g. "more_unattractive"); metric 'dP1'.
show_metric_top(
    sig_trig_abbr.filter(like='_un', axis='index'),
    'dP1',
    15,
)

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,dP1,quant,f,unexp_f,LRC,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
negative,nothing,more_unattractive,0.89,not_exist,32,30.09,2.09,0.0,0.94,0.0,169.42,1761853,98788,34,1.91
negative,nothing,terribly_unusual,0.78,not_exist,20,18.65,1.9,0.0,0.83,0.0,94.08,1761853,98788,24,1.35
negative,nothing,particularly_unusual,0.77,not_exist,152,141.63,4.7,0.0,0.82,0.0,706.39,1761853,98788,185,10.37
negative,nothing,too_unusual,0.73,not_exist,92,85.44,4.1,0.0,0.79,0.0,411.7,1761853,98788,117,6.56
negative,nothing,more_unsightly,0.67,not_exist,16,14.77,1.56,0.0,0.73,0.0,67.11,1761853,98788,22,1.23
negative,nothing,too_unexpected,0.67,not_exist,13,11.99,1.13,0.0,0.72,0.0,54.22,1761853,98788,18,1.01
negative,nothing,more_unappealing,0.64,not_exist,14,12.88,1.29,0.0,0.7,0.0,56.93,1761853,98788,20,1.12
negative,nothing,more_unjust,0.64,not_exist,23,21.15,2.17,0.0,0.7,0.0,93.21,1761853,98788,33,1.85
negative,nothing,especially_unusual,0.62,not_exist,17,15.6,1.64,0.0,0.68,0.0,67.54,1761853,98788,25,1.4
negative,nothing,particularly_unique,0.61,not_exist,82,75.05,3.48,0.0,0.66,0.0,318.65,1761853,98788,124,6.95


In [None]:
# '_non' keeps rows whose key contains "_non", i.e. the word after the underscore
# in l2 begins with "non" (e.g. "even_nonexistent"); metric 'dP1'.
show_metric_top(
    sig_trig_abbr.filter(like='_non', axis='index'),
    'dP1',
    15,
)

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,dP1,quant,f,unexp_f,LRC,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
positive,or,even_nonexistent,0.81,existential,144,117.31,1.07,0.0,1.0,0.0,485.43,1761853,326614,144,26.69
positive,or,even_non-existent,0.77,existential,201,162.07,3.82,0.0,0.96,0.0,606.99,1761853,326614,210,38.93


In [None]:
# '_in' keeps rows whose key contains "_in", i.e. the word after the underscore
# in l2 begins with "in"; metric 'dP1'.
# NOTE: this is a plain substring match, so it also returns words where "in" is
# not a negating prefix (the saved output includes e.g. "that_interested").
show_metric_top(
    sig_trig_abbr.filter(like='_in', axis='index'),
    'dP1',
    15,
)

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,dP1,quant,f,unexp_f,LRC,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
negative,nothing,more_invigorating,0.79,not_exist,51,47.64,3.61,0.0,0.85,0.0,244.21,1761853,98788,60,3.36
negative,nor,most_intelligent,0.74,not_exist,45,44.47,5.95,0.0,0.75,0.0,358.64,1761853,15546,60,0.53
negative,nothing,more_incorrect,0.71,not_exist,13,12.05,1.08,0.0,0.76,0.0,56.82,1761853,98788,17,0.95
negative,never,that_interested,0.68,not_exist,50,45.83,3.16,0.0,0.75,0.0,203.93,1761853,109723,67,4.17
negative,nothing,too_interesting,0.65,not_exist,71,65.39,3.56,0.0,0.71,0.0,292.08,1761853,98788,100,5.61
negative,never,overly_interested,0.65,not_exist,17,15.51,1.51,0.0,0.71,0.0,66.32,1761853,109723,24,1.49
negative,nothing,more_intoxicating,0.59,not_exist,13,11.88,1.12,0.0,0.65,0.0,49.82,1761853,98788,20,1.12
negative,nothing,particularly_innovative,0.57,not_exist,34,30.97,2.53,0.0,0.63,0.0,127.05,1761853,98788,54,3.03
negative,nothing,more_insulting,0.57,not_exist,35,31.86,2.54,0.0,0.62,0.0,130.02,1761853,98788,56,3.14
negative,none,more_infamous,0.56,not_exist,15,14.54,2.99,0.0,0.58,0.0,86.16,1761853,31021,26,0.46


In [None]:
# Keep rows whose key contains the substring 'remotely'; metric 'dP1'.
show_metric_top(
    sig_trig_abbr.filter(like='remotely', axis='index'),
    'dP1',
    15,
)

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,dP1,quant,f,unexp_f,LRC,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
negative,nothing,remotely_comparable,0.84,not_exist,42,39.36,3.26,0.0,0.89,0.0,210.75,1761853,98788,47,2.64
negative,nothing,remotely_new,0.72,not_exist,17,15.77,1.66,0.0,0.77,0.0,74.96,1761853,98788,22,1.23
negative,none,remotely_accurate,0.67,not_exist,11,10.72,2.51,0.0,0.69,0.0,69.17,1761853,31021,16,0.28
negative,none,remotely_true,0.65,not_exist,44,42.84,4.66,0.0,0.67,0.0,272.29,1761853,31021,66,1.16
negative,nothing,remotely_funny,0.58,not_exist,32,29.2,2.48,0.0,0.64,0.0,121.14,1761853,98788,50,2.8
negative,nothing,remotely_similar,0.55,not_exist,64,58.06,3.05,0.0,0.6,0.0,231.32,1761853,98788,106,5.94
negative,nothing,remotely_interesting,0.48,not_exist,42,37.57,2.41,0.0,0.53,0.0,137.1,1761853,98788,79,4.43
negative,nothing,remotely_close,0.47,not_exist,139,124.25,3.22,0.0,0.53,0.0,451.7,1761853,98788,263,14.75
negative,none,remotely_possible,0.44,not_exist,23,22.12,3.24,0.0,0.46,0.0,117.8,1761853,31021,50,0.88
negative,none,remotely_interesting,0.16,not_exist,14,12.61,1.17,0.0,0.18,0.0,41.61,1761853,31021,79,1.39


In [None]:
# Rows of `sig_trig_abbr` whose index label contains the substring 'quite',
# passed to `show_metric_top` together with the 'dP1' metric.
# `like=` is a plain substring test, so it is not anchored to the start of a label.
# NOTE(review): the trailing 15 is presumably a row cap -- confirm against
# the definition of `show_metric_top`.
show_metric_top(
    sig_trig_abbr.filter(like='quite', axis='index'),
    'dP1',
    15,
)

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,dP1,quant,f,unexp_f,LRC,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
negative,never,quite_able,0.85,not_exist,319,297.27,5.76,0.0,0.91,0.0,1571.33,1761853,109723,349,21.73
negative,never,quite_enough,0.73,not_exist,150,138.17,4.36,0.0,0.79,0.0,642.61,1761853,109723,190,11.83
negative,never,quite_satisfied,0.69,not_exist,144,132.11,4.15,0.0,0.75,0.0,592.6,1761853,109723,191,11.89
negative,never,quite_sure,0.67,not_exist,2176,1990.17,5.0,0.02,0.73,0.02,8739.05,1761853,109723,2984,185.83
negative,never,quite_clear,0.64,not_exist,399,363.75,4.41,0.0,0.7,0.0,1551.45,1761853,109723,566,35.25
negative,never,quite_complete,0.63,not_exist,31,28.2,2.42,0.0,0.69,0.0,118.13,1761853,109723,45,2.8
negative,never,quite_certain,0.57,not_exist,117,105.48,3.44,0.0,0.63,0.0,415.15,1761853,109723,185,11.52
negative,never,quite_free,0.56,not_exist,18,16.19,1.48,0.0,0.62,0.0,62.86,1761853,109723,29,1.81
negative,never,quite_believable,0.47,not_exist,15,13.26,1.01,0.0,0.54,0.0,46.29,1761853,109723,28,1.74
negative,never,quite_right,0.46,not_exist,217,191.16,3.24,0.0,0.52,0.0,656.23,1761853,109723,415,25.84


In [None]:
# Rows of `sig_trig_abbr` whose index label contains the substring 'that_',
# passed to `show_metric_top` together with the 'dP1' metric.
# The trailing underscore narrows the match toward labels such as
# 'that_comfortable'; it is still an unanchored substring test.
# NOTE(review): the trailing 15 is presumably a row cap -- confirm against
# the definition of `show_metric_top`.
show_metric_top(
    sig_trig_abbr.filter(like='that_', axis='index'),
    'dP1',
    15,
)

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,dP1,quant,f,unexp_f,LRC,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
negative,never,that_comfortable,0.85,not_exist,22,20.51,1.31,0.0,0.92,0.0,108.64,1761853,109723,24,1.49
negative,never,that_fond,0.85,not_exist,22,20.51,1.31,0.0,0.92,0.0,108.64,1761853,109723,24,1.49
negative,never,that_nervous,0.81,not_exist,21,19.51,1.65,0.0,0.88,0.0,98.9,1761853,109723,24,1.49
negative,never,that_keen,0.81,not_exist,27,25.07,2.27,0.0,0.87,0.0,126.59,1761853,109723,31,1.93
negative,never,that_popular,0.79,not_exist,60,55.64,3.69,0.0,0.86,0.0,277.04,1761853,109723,70,4.36
negative,never,that_high,0.78,not_exist,38,35.2,2.98,0.0,0.84,0.0,173.0,1761853,109723,45,2.8
negative,never,that_happy,0.76,not_exist,37,34.2,2.92,0.0,0.82,0.0,164.36,1761853,109723,45,2.8
negative,never,that_close,0.76,not_exist,55,50.83,3.49,0.0,0.82,0.0,243.96,1761853,109723,67,4.17
negative,never,that_low,0.7,not_exist,19,17.44,1.73,0.0,0.76,0.0,78.71,1761853,109723,25,1.56
negative,never,that_interested,0.68,not_exist,50,45.83,3.16,0.0,0.75,0.0,203.93,1761853,109723,67,4.17


In [None]:
# Rows of `sig_trig_abbr` whose index label contains the substring 'too_',
# passed to `show_metric_top` together with the 'dP1' metric.
# The trailing underscore narrows the match toward labels such as
# 'too_pleased'; it is still an unanchored substring test.
# NOTE(review): the trailing 15 is presumably a row cap -- confirm against
# the definition of `show_metric_top`.
show_metric_top(
    sig_trig_abbr.filter(like='too_', axis='index'),
    'dP1',
    15,
)

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,dP1,quant,f,unexp_f,LRC,dP2,dP1_simple,dP2_simple,G2,N,f1,f2,exp_f
polarity,l1,l2,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1
negative,none,too_pleased,0.92,not_exist,1272,1248.12,8.8,0.04,0.94,0.04,9701.23,1761853,31021,1356,23.88
negative,nothing,too_fancy,0.9,not_exist,521,490.55,6.85,0.01,0.96,0.01,2823.11,1761853,98788,543,30.45
negative,nothing,too_major,0.9,not_exist,187,176.07,5.66,0.0,0.96,0.0,1012.04,1761853,98788,195,10.93
negative,nothing,too_special,0.89,not_exist,450,423.37,6.56,0.0,0.95,0.0,2401.96,1761853,98788,475,26.63
negative,never,too_early,0.89,not_exist,4890,4568.77,7.59,0.04,0.95,0.04,25284.55,1761853,109723,5158,321.23
negative,never,too_careful,0.88,not_exist,649,606.28,6.66,0.01,0.95,0.01,3323.75,1761853,109723,686,42.72
negative,nothing,too_spectacular,0.88,not_exist,108,101.5,4.82,0.0,0.93,0.0,565.14,1761853,98788,116,6.5
negative,nothing,too_drastic,0.86,not_exist,103,96.72,4.74,0.0,0.92,0.0,532.02,1761853,98788,112,6.28
negative,none,too_flattering,0.84,not_exist,18,17.63,3.27,0.0,0.86,0.0,128.31,1761853,31021,21,0.37
negative,never,too_safe,0.83,not_exist,213,198.12,5.24,0.0,0.89,0.0,1021.95,1761853,109723,239,14.88
