In [2]:
import os

import numpy as np
from sklearn.decomposition import PCA

from utils import load_hidden_representations_from_hdf5, read_templates_from_file

----

In [3]:
# params
log_dir = "/logfiles"       # root directory under which the hidden-representation files are looked up
model = "bigscience-T0_3B"  # author's note on alternatives: bigscience-T0_B or bigscience-T0
module = "encoder"          # the only module supported so far (checked by the assert in the next cell)
task = "cb"                 # other tasks this notebook has pattern lists for: "rte", "wic"

In [4]:
# Guard: stop early with an explicit message when a module other than the
# encoder is configured, instead of a bare AssertionError.
# TODO(mm): support decoder as well
assert module == "encoder", f"unsupported module {module!r}: only 'encoder' is supported"

## Prompts

In [5]:
# Read the prompt templates of the selected task and show them as a table.
df = read_templates_from_file(
    f"/t0-analysis/prompts/{task}.csv"
)
display(df)

Unnamed: 0,name,template,category,includes_targets,targets,shuffle
0,null_pattern,{premise} {hypothesis},neutral,False,none,False
1,null_pattern_reversed,{hypothesis} {premise},neutral,False,none,False
2,gpt_3_true_false_neither,"{premise} Question: {hypothesis} True, False, ...",instructive,True,"True, False, Neither",False
3,gpt_3_yes_no_maybe,"{premise} Question: {hypothesis} Yes, No, or M...",instructive,True,"Yes, No, Maybe",False
4,mnli_crowdsource,{premise} Using only the above description and...,instructive,True,"Correct, Incorrect, Inconclusive",False
5,always_sometimes_never,"Suppose it's true that {premise} Then, is ""{hy...",instructive,True,"Always, Sometimes, Never",False
6,based_on_previous_passage,"{premise} Based on the previous passage, is it...",instructive,True,"Yes, No, Maybe",False
7,infer,"Suppose {premise} Can we infer that ""{hypothes...",instructive,True,"Yes, No, Maybe",False
8,claim,"{premise} Based on that information, is the cl...",instructive,True,"True, False, Inconclusive",False
9,consider,"{premise} Keeping in mind the above text, cons...",instructive,True,"Always, Sometimes, Never",False


## PCA

In [6]:
def unison_shuffled_copies(a, b, rng=None):
    """Return `a` and `b` reordered by one shared random permutation.

    Both inputs are indexed with the same permutation of ``range(len(a))``,
    so element ``i`` of the first result still corresponds to element ``i``
    of the second result.

    Args:
        a: array supporting integer-array indexing (e.g. a numpy array).
        b: array of the same length as `a` along its first axis.
        rng: optional source of randomness. ``None`` (default) keeps the
            original behaviour and draws from numpy's global random state
            (so ``np.random.seed`` still applies). An int seed or a
            ``np.random.Generator`` makes the shuffle reproducible without
            touching global state.

    Returns:
        Tuple ``(a[p], b[p])`` where ``p`` is the drawn permutation.

    Raises:
        AssertionError: if `a` and `b` differ in length.
    """
    # from: https://stackoverflow.com/questions/4601373/better-way-to-shuffle-two-numpy-arrays-in-unison
    assert len(a) == len(b), f"length mismatch: len(a)={len(a)} != len(b)={len(b)}"
    n_items = len(a)
    if rng is None:
        # legacy path: global numpy RNG, identical to the original implementation
        p = np.random.permutation(n_items)
    else:
        # default_rng accepts a seed or passes an existing Generator through
        p = np.random.default_rng(rng).permutation(n_items)
    return a[p], b[p]

In [7]:
# Prompt (template) names to include in the analysis, keyed by task.
# The list for the configured `task` is selected at the bottom of this cell, so
# switching tasks only requires changing `task` instead of commenting and
# uncommenting whole lists here (which could silently get out of sync with `task`).
patterns_by_task = {
    # RTE patterns
    "rte": [
        "null_pattern",
        "null_pattern_reversed",
        "gpt_3_yes_no",
        "gpt_3_yes_no_shuffled",
        "gpt_3_true_false",
        "gpt_3_true_false_shuffled",
        "start_with_the",
        "mnli_crowdsource",
        "based_on_previous_passage",
        "infer",
        "follow",
        "imply",
        "guaranteed",
        "justified",
        "must_be_true",
        "should_assume",
    ],
    # CB patterns
    "cb": [
        "null_pattern",
        "null_pattern_reversed",
        "gpt_3_true_false_neither",
        "gpt_3_yes_no_maybe",
        "mnli_crowdsource",
        "always_sometimes_never",
        "based_on_previous_passage",
        "infer",
        "claim",
        "consider",
        "follow",
        "imply",
        "guaranteed",
        "guaranteed_possible",
        "justified",
        "must_be_true",
        "should_assume",
        "take_the_following",
    ],
    # WIC patterns
    "wic": [
        "gpt_3",
        "gpt_3_yes_no",
        "affirmation",
        "grammar_homework",
        "polysemous",
        "question_context",
        "question_meaning",
        "question_meaning_yes_no",
        "same_sense",
        "similar_sense",
        "similar_sense_yes_no",
    ],
}

# Fail with a clear message rather than a bare KeyError for an unknown task.
if task not in patterns_by_task:
    raise ValueError(
        f"no prompt patterns defined for task {task!r}; "
        f"expected one of {sorted(patterns_by_task)}"
    )

# Copy so later edits to `use_pattern` do not alter the table above.
use_pattern = list(patterns_by_task[task])

In [8]:
# Per-layer PCA over the averaged hidden representations of the selected prompts.
# For each layer: load one representation matrix per prompt in `use_pattern`,
# stack them row-wise, shuffle rows together with their prompt index, and fit
# PCA with 1, 2 and 3 components to report the explained variance ratios.
#
# Narrow the range (e.g. range(0, 10) or range(24, 25)) to inspect fewer layers.
# NOTE(review): 25 presumably covers every stored layer index of the encoder
# for this model — confirm against the files under `log_dir`.
for layer in range(0, 25):
    print('layer=', layer)

    # Keep only the prompts listed in `use_pattern`, in the order they appear in `df`.
    prompt_names = [name for name in df['name'] if name in use_pattern]

    # The spelling "represenations" is part of the on-disk file name (the
    # recorded run loaded these paths successfully) — do not correct it here.
    file_names = [
        f"{task}/{model}/{module}/{name}/hidden_represenations_layer{layer}_avg.hdf5"
        for name in prompt_names
    ]

    # Previously an empty selection only surfaced later as a TypeError on len(None).
    if not file_names:
        raise ValueError(
            f"none of the prompts in use_pattern were found in the templates for task {task!r}"
        )

    # load hidden representations from hdf5 file
    per_prompt_representations = []
    classes = []
    n_sequences = 0

    for idx, file_name in enumerate(file_names):
        hidden_representations = load_hidden_representations_from_hdf5(os.path.join(log_dir, file_name))
        n_sequences = hidden_representations.shape[0]

        per_prompt_representations.append(hidden_representations)
        classes += n_sequences * [idx]  # assign representations to classes (class = prompt index)

    # Concatenate once at the end instead of re-copying the growing matrix per prompt.
    representations = np.concatenate(per_prompt_representations, axis=0)
    classes = np.asarray(classes)

    # shuffle representations and classes
    X, y = unison_shuffled_copies(representations, classes)
    print(X.shape, y.shape)

    # perform PCA on hidden representations
    print('PCA for prompts:', prompt_names)

    # NOTE(review): PCA is created without `random_state`; if scikit-learn picks
    # a randomized solver for this input size the ratios may differ slightly
    # between runs — consider fixing `random_state` if exact reproducibility matters.
    for n_components in range(1, 4):
        pca = PCA(n_components=n_components)
        pca.fit(X)

        # variance explained by each of the principal components
        print(f"model:{model}; module:{module}; layer:{layer}; n_components: {n_components}; variance explained: {pca.explained_variance_ratio_}")
        # total variance explained by the first `n_components` components
        print(np.sum(pca.explained_variance_ratio_))
    print('\n')


layer= 0


Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4149.69it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4735.70it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5336.02it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5999.52it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5600.81it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3888.37it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5652.84it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5502.40it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3978.00it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5370.18it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5860.01it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5459.68it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5591.74it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4253.78it/s]
Reading embeddings: 

(1008, 2048) (1008,)
PCA for prompts: ['null_pattern', 'null_pattern_reversed', 'gpt_3_true_false_neither', 'gpt_3_yes_no_maybe', 'mnli_crowdsource', 'always_sometimes_never', 'based_on_previous_passage', 'infer', 'claim', 'consider', 'follow', 'imply', 'guaranteed', 'guaranteed_possible', 'justified', 'must_be_true', 'should_assume', 'take_the_following']
model:bigscience-T0_3B; module:encoder; layer:0; n_components: 1; variance explained: [0.9334196]
0.9334196
model:bigscience-T0_3B; module:encoder; layer:0; n_components: 2; variance explained: [0.9334196  0.01033202]
0.94375163
model:bigscience-T0_3B; module:encoder; layer:0; n_components: 3; variance explained: [0.93341976 0.01033203 0.00871127]
0.9524631


layer= 1


Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 2679.21it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3192.92it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4117.47it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4724.93it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4048.14it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4261.42it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4518.07it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3895.40it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5110.44it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5324.17it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5600.54it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4013.28it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3999.54it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5883.50it/s]
Reading embeddings: 

(1008, 2048) (1008,)
PCA for prompts: ['null_pattern', 'null_pattern_reversed', 'gpt_3_true_false_neither', 'gpt_3_yes_no_maybe', 'mnli_crowdsource', 'always_sometimes_never', 'based_on_previous_passage', 'infer', 'claim', 'consider', 'follow', 'imply', 'guaranteed', 'guaranteed_possible', 'justified', 'must_be_true', 'should_assume', 'take_the_following']
model:bigscience-T0_3B; module:encoder; layer:1; n_components: 1; variance explained: [0.26871872]
0.26871872
model:bigscience-T0_3B; module:encoder; layer:1; n_components: 2; variance explained: [0.26871872 0.20745684]
0.47617555
model:bigscience-T0_3B; module:encoder; layer:1; n_components: 3; variance explained: [0.26871875 0.20745681 0.0925732 ]
0.5687487


layer= 2


Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4362.09it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4222.66it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4231.94it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3922.59it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5006.74it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5514.03it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5715.84it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3959.56it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3885.09it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5638.05it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5778.27it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5645.23it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5568.54it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5532.73it/s]
Reading embeddings: 

(1008, 2048) (1008,)
PCA for prompts: ['null_pattern', 'null_pattern_reversed', 'gpt_3_true_false_neither', 'gpt_3_yes_no_maybe', 'mnli_crowdsource', 'always_sometimes_never', 'based_on_previous_passage', 'infer', 'claim', 'consider', 'follow', 'imply', 'guaranteed', 'guaranteed_possible', 'justified', 'must_be_true', 'should_assume', 'take_the_following']
model:bigscience-T0_3B; module:encoder; layer:2; n_components: 1; variance explained: [0.98610866]
0.98610866
model:bigscience-T0_3B; module:encoder; layer:2; n_components: 2; variance explained: [0.98610866 0.01023624]
0.9963449
model:bigscience-T0_3B; module:encoder; layer:2; n_components: 3; variance explained: [9.8610866e-01 1.0236240e-02 7.4426486e-04]
0.9970892


layer= 3


Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4521.81it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4317.75it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4514.08it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3823.68it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4511.04it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4564.43it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4277.25it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5686.23it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3919.71it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5437.44it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5174.27it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5779.27it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5369.81it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5123.93it/s]
Reading embeddings: 

(1008, 2048) (1008,)
PCA for prompts: ['null_pattern', 'null_pattern_reversed', 'gpt_3_true_false_neither', 'gpt_3_yes_no_maybe', 'mnli_crowdsource', 'always_sometimes_never', 'based_on_previous_passage', 'infer', 'claim', 'consider', 'follow', 'imply', 'guaranteed', 'guaranteed_possible', 'justified', 'must_be_true', 'should_assume', 'take_the_following']
model:bigscience-T0_3B; module:encoder; layer:3; n_components: 1; variance explained: [0.989444]
0.989444
model:bigscience-T0_3B; module:encoder; layer:3; n_components: 2; variance explained: [0.98944426 0.0071625 ]
0.99660677
model:bigscience-T0_3B; module:encoder; layer:3; n_components: 3; variance explained: [9.894440e-01 7.162503e-03 7.869031e-04]
0.9973934


layer= 4


Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4454.66it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3668.87it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3636.49it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4061.72it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3905.18it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4018.36it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3907.58it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5351.95it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5150.79it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4032.43it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5605.35it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5601.61it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5449.93it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5105.89it/s]
Reading embeddings: 

(1008, 2048) (1008,)
PCA for prompts: ['null_pattern', 'null_pattern_reversed', 'gpt_3_true_false_neither', 'gpt_3_yes_no_maybe', 'mnli_crowdsource', 'always_sometimes_never', 'based_on_previous_passage', 'infer', 'claim', 'consider', 'follow', 'imply', 'guaranteed', 'guaranteed_possible', 'justified', 'must_be_true', 'should_assume', 'take_the_following']
model:bigscience-T0_3B; module:encoder; layer:4; n_components: 1; variance explained: [0.9903445]
0.9903445
model:bigscience-T0_3B; module:encoder; layer:4; n_components: 2; variance explained: [0.9903445  0.00600389]
0.99634844
model:bigscience-T0_3B; module:encoder; layer:4; n_components: 3; variance explained: [9.9034470e-01 6.0038874e-03 7.6471985e-04]
0.99711335


layer= 5


Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3033.03it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3161.08it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3495.41it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3571.25it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5153.39it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5758.72it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5681.41it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5698.37it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5416.62it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5608.70it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5589.74it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5584.56it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5693.12it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5301.70it/s]
Reading embeddings: 

(1008, 2048) (1008,)
PCA for prompts: ['null_pattern', 'null_pattern_reversed', 'gpt_3_true_false_neither', 'gpt_3_yes_no_maybe', 'mnli_crowdsource', 'always_sometimes_never', 'based_on_previous_passage', 'infer', 'claim', 'consider', 'follow', 'imply', 'guaranteed', 'guaranteed_possible', 'justified', 'must_be_true', 'should_assume', 'take_the_following']
model:bigscience-T0_3B; module:encoder; layer:5; n_components: 1; variance explained: [0.9908108]
0.9908108
model:bigscience-T0_3B; module:encoder; layer:5; n_components: 2; variance explained: [0.9908108  0.00527297]
0.9960838
model:bigscience-T0_3B; module:encoder; layer:5; n_components: 3; variance explained: [9.908105e-01 5.272970e-03 8.895355e-04]
0.99697304


layer= 6


Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3595.96it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3709.84it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3368.24it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4855.72it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5142.22it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5378.91it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5768.91it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5222.25it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4882.17it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4305.32it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5378.91it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5293.81it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5557.21it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5619.97it/s]
Reading embeddings: 

(1008, 2048) (1008,)
PCA for prompts: ['null_pattern', 'null_pattern_reversed', 'gpt_3_true_false_neither', 'gpt_3_yes_no_maybe', 'mnli_crowdsource', 'always_sometimes_never', 'based_on_previous_passage', 'infer', 'claim', 'consider', 'follow', 'imply', 'guaranteed', 'guaranteed_possible', 'justified', 'must_be_true', 'should_assume', 'take_the_following']
model:bigscience-T0_3B; module:encoder; layer:6; n_components: 1; variance explained: [0.99958944]
0.99958944
model:bigscience-T0_3B; module:encoder; layer:6; n_components: 2; variance explained: [9.995895e-01 2.734291e-04]
0.9998629
model:bigscience-T0_3B; module:encoder; layer:6; n_components: 3; variance explained: [9.9958950e-01 2.7342880e-04 3.0254956e-05]
0.9998932


layer= 7


Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4583.67it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4068.40it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4350.21it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3731.59it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5050.23it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5485.44it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5620.37it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5505.11it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5801.39it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5797.67it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5663.60it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5744.36it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5666.61it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5684.85it/s]
Reading embeddings: 

(1008, 2048) (1008,)
PCA for prompts: ['null_pattern', 'null_pattern_reversed', 'gpt_3_true_false_neither', 'gpt_3_yes_no_maybe', 'mnli_crowdsource', 'always_sometimes_never', 'based_on_previous_passage', 'infer', 'claim', 'consider', 'follow', 'imply', 'guaranteed', 'guaranteed_possible', 'justified', 'must_be_true', 'should_assume', 'take_the_following']
model:bigscience-T0_3B; module:encoder; layer:7; n_components: 1; variance explained: [0.99956113]
0.99956113
model:bigscience-T0_3B; module:encoder; layer:7; n_components: 2; variance explained: [9.9956113e-01 2.7366533e-04]
0.9998348
model:bigscience-T0_3B; module:encoder; layer:7; n_components: 3; variance explained: [9.9956113e-01 2.7366541e-04 3.6883859e-05]
0.9998717


layer= 8


Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4446.82it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4284.98it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4551.52it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 2740.03it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5280.72it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5861.33it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5823.69it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5072.15it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5531.56it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5870.70it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5867.48it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5671.81it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5553.27it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4047.79it/s]
Reading embeddings: 

(1008, 2048) (1008,)
PCA for prompts: ['null_pattern', 'null_pattern_reversed', 'gpt_3_true_false_neither', 'gpt_3_yes_no_maybe', 'mnli_crowdsource', 'always_sometimes_never', 'based_on_previous_passage', 'infer', 'claim', 'consider', 'follow', 'imply', 'guaranteed', 'guaranteed_possible', 'justified', 'must_be_true', 'should_assume', 'take_the_following']
model:bigscience-T0_3B; module:encoder; layer:8; n_components: 1; variance explained: [0.99953395]
0.99953395
model:bigscience-T0_3B; module:encoder; layer:8; n_components: 2; variance explained: [9.9953395e-01 2.5839242e-04]
0.99979234
model:bigscience-T0_3B; module:encoder; layer:8; n_components: 3; variance explained: [9.9953395e-01 2.5839263e-04 5.1555540e-05]
0.9998439


layer= 9


Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 2372.15it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 2208.40it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4237.74it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5712.64it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5176.33it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5310.81it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5181.01it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5466.29it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5714.87it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4242.10it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5553.79it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5381.01it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5447.53it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5437.56it/s]
Reading embeddings: 

(1008, 2048) (1008,)
PCA for prompts: ['null_pattern', 'null_pattern_reversed', 'gpt_3_true_false_neither', 'gpt_3_yes_no_maybe', 'mnli_crowdsource', 'always_sometimes_never', 'based_on_previous_passage', 'infer', 'claim', 'consider', 'follow', 'imply', 'guaranteed', 'guaranteed_possible', 'justified', 'must_be_true', 'should_assume', 'take_the_following']
model:bigscience-T0_3B; module:encoder; layer:9; n_components: 1; variance explained: [0.999481]
0.999481
model:bigscience-T0_3B; module:encoder; layer:9; n_components: 2; variance explained: [9.9948102e-01 2.5692146e-04]
0.9997379
model:bigscience-T0_3B; module:encoder; layer:9; n_components: 3; variance explained: [9.9948102e-01 2.5692143e-04 6.2848827e-05]
0.99980074


layer= 10


Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5043.72it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4784.21it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3951.50it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3465.86it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3744.50it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4139.68it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5716.12it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5521.93it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5039.18it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4978.51it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5118.13it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4925.58it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5189.59it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5675.65it/s]
Reading embeddings: 

(1008, 2048) (1008,)
PCA for prompts: ['null_pattern', 'null_pattern_reversed', 'gpt_3_true_false_neither', 'gpt_3_yes_no_maybe', 'mnli_crowdsource', 'always_sometimes_never', 'based_on_previous_passage', 'infer', 'claim', 'consider', 'follow', 'imply', 'guaranteed', 'guaranteed_possible', 'justified', 'must_be_true', 'should_assume', 'take_the_following']
model:bigscience-T0_3B; module:encoder; layer:10; n_components: 1; variance explained: [0.99942017]
0.99942017
model:bigscience-T0_3B; module:encoder; layer:10; n_components: 2; variance explained: [9.9942034e-01 2.5001785e-04]
0.9996704
model:bigscience-T0_3B; module:encoder; layer:10; n_components: 3; variance explained: [9.9942034e-01 2.5001785e-04 7.2810362e-05]
0.9997432


layer= 11


Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3618.34it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4629.38it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3748.50it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3293.76it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5367.48it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5548.68it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5803.69it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4361.44it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3992.00it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5336.99it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5366.50it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5372.27it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5380.76it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5683.06it/s]
Reading embeddings: 

(1008, 2048) (1008,)
PCA for prompts: ['null_pattern', 'null_pattern_reversed', 'gpt_3_true_false_neither', 'gpt_3_yes_no_maybe', 'mnli_crowdsource', 'always_sometimes_never', 'based_on_previous_passage', 'infer', 'claim', 'consider', 'follow', 'imply', 'guaranteed', 'guaranteed_possible', 'justified', 'must_be_true', 'should_assume', 'take_the_following']
model:bigscience-T0_3B; module:encoder; layer:11; n_components: 1; variance explained: [0.99931085]
0.99931085
model:bigscience-T0_3B; module:encoder; layer:11; n_components: 2; variance explained: [9.9931085e-01 2.3939855e-04]
0.9995502
model:bigscience-T0_3B; module:encoder; layer:11; n_components: 3; variance explained: [9.9931085e-01 2.3939875e-04 9.5453048e-05]
0.99964565


layer= 12


Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3958.09it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3706.97it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3460.85it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3412.08it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4049.04it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5653.79it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5314.29it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5743.51it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5714.03it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5744.36it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5597.60it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5333.48it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5226.43it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5204.54it/s]
Reading embeddings: 

(1008, 2048) (1008,)
PCA for prompts: ['null_pattern', 'null_pattern_reversed', 'gpt_3_true_false_neither', 'gpt_3_yes_no_maybe', 'mnli_crowdsource', 'always_sometimes_never', 'based_on_previous_passage', 'infer', 'claim', 'consider', 'follow', 'imply', 'guaranteed', 'guaranteed_possible', 'justified', 'must_be_true', 'should_assume', 'take_the_following']
model:bigscience-T0_3B; module:encoder; layer:12; n_components: 1; variance explained: [0.9991451]
0.9991451
model:bigscience-T0_3B; module:encoder; layer:12; n_components: 2; variance explained: [9.991451e-01 2.594658e-04]
0.99940455
model:bigscience-T0_3B; module:encoder; layer:12; n_components: 3; variance explained: [9.99145210e-01 2.59465858e-04 1.19264565e-04]
0.99952394


layer= 13


Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4386.36it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3956.69it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4089.80it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4541.22it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5186.50it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5623.47it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5381.75it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5452.59it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5046.43it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5527.39it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5584.56it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5727.97it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5830.34it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5595.60it/s]
Reading embeddings: 

(1008, 2048) (1008,)
PCA for prompts: ['null_pattern', 'null_pattern_reversed', 'gpt_3_true_false_neither', 'gpt_3_yes_no_maybe', 'mnli_crowdsource', 'always_sometimes_never', 'based_on_previous_passage', 'infer', 'claim', 'consider', 'follow', 'imply', 'guaranteed', 'guaranteed_possible', 'justified', 'must_be_true', 'should_assume', 'take_the_following']
model:bigscience-T0_3B; module:encoder; layer:13; n_components: 1; variance explained: [0.99882245]
0.99882245
model:bigscience-T0_3B; module:encoder; layer:13; n_components: 2; variance explained: [9.9882233e-01 2.8408118e-04]
0.9991064
model:bigscience-T0_3B; module:encoder; layer:13; n_components: 3; variance explained: [9.9882233e-01 2.8408109e-04 1.6866392e-04]
0.9992751


layer= 14


Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3042.93it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3913.90it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3529.34it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3635.54it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5602.41it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3869.09it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4147.35it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5815.04it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5945.30it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4763.74it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3859.94it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5028.82it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5227.59it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5681.83it/s]
Reading embeddings: 

(1008, 2048) (1008,)
PCA for prompts: ['null_pattern', 'null_pattern_reversed', 'gpt_3_true_false_neither', 'gpt_3_yes_no_maybe', 'mnli_crowdsource', 'always_sometimes_never', 'based_on_previous_passage', 'infer', 'claim', 'consider', 'follow', 'imply', 'guaranteed', 'guaranteed_possible', 'justified', 'must_be_true', 'should_assume', 'take_the_following']
model:bigscience-T0_3B; module:encoder; layer:14; n_components: 1; variance explained: [0.99853164]
0.99853164
model:bigscience-T0_3B; module:encoder; layer:14; n_components: 2; variance explained: [9.9853164e-01 3.0207561e-04]
0.9988337
model:bigscience-T0_3B; module:encoder; layer:14; n_components: 3; variance explained: [9.9853164e-01 3.0207550e-04 2.0686837e-04]
0.9990406


layer= 15


Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4294.77it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4618.19it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3666.06it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4572.34it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4663.02it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5902.57it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3900.84it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4160.06it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5554.19it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5282.86it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4651.02it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4000.29it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4073.83it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5803.83it/s]
Reading embeddings: 

(1008, 2048) (1008,)
PCA for prompts: ['null_pattern', 'null_pattern_reversed', 'gpt_3_true_false_neither', 'gpt_3_yes_no_maybe', 'mnli_crowdsource', 'always_sometimes_never', 'based_on_previous_passage', 'infer', 'claim', 'consider', 'follow', 'imply', 'guaranteed', 'guaranteed_possible', 'justified', 'must_be_true', 'should_assume', 'take_the_following']
model:bigscience-T0_3B; module:encoder; layer:15; n_components: 1; variance explained: [0.9981304]
0.9981304
model:bigscience-T0_3B; module:encoder; layer:15; n_components: 2; variance explained: [9.981304e-01 3.367109e-04]
0.9984671
model:bigscience-T0_3B; module:encoder; layer:15; n_components: 3; variance explained: [9.9813038e-01 3.3671106e-04 2.5545881e-04]
0.99872255


layer= 16


Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3754.19it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3542.33it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3729.10it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3436.95it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5798.10it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5618.63it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5418.00it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5497.38it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5718.48it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5546.84it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5399.69it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5176.90it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5158.03it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5574.36it/s]
Reading embeddings: 

(1008, 2048) (1008,)
PCA for prompts: ['null_pattern', 'null_pattern_reversed', 'gpt_3_true_false_neither', 'gpt_3_yes_no_maybe', 'mnli_crowdsource', 'always_sometimes_never', 'based_on_previous_passage', 'infer', 'claim', 'consider', 'follow', 'imply', 'guaranteed', 'guaranteed_possible', 'justified', 'must_be_true', 'should_assume', 'take_the_following']
model:bigscience-T0_3B; module:encoder; layer:16; n_components: 1; variance explained: [0.99744004]
0.99744004
model:bigscience-T0_3B; module:encoder; layer:16; n_components: 2; variance explained: [9.9743998e-01 4.2179722e-04]
0.9978618
model:bigscience-T0_3B; module:encoder; layer:16; n_components: 3; variance explained: [9.9743998e-01 4.2179698e-04 3.2345337e-04]
0.9981853


layer= 17


Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4567.00it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3487.47it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 2734.26it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5628.18it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5614.33it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5585.22it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5131.66it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5472.53it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5468.33it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5673.73it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5626.03it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5520.38it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5704.73it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5724.34it/s]
Reading embeddings: 

(1008, 2048) (1008,)
PCA for prompts: ['null_pattern', 'null_pattern_reversed', 'gpt_3_true_false_neither', 'gpt_3_yes_no_maybe', 'mnli_crowdsource', 'always_sometimes_never', 'based_on_previous_passage', 'infer', 'claim', 'consider', 'follow', 'imply', 'guaranteed', 'guaranteed_possible', 'justified', 'must_be_true', 'should_assume', 'take_the_following']
model:bigscience-T0_3B; module:encoder; layer:17; n_components: 1; variance explained: [0.9962167]
0.9962167
model:bigscience-T0_3B; module:encoder; layer:17; n_components: 2; variance explained: [9.962167e-01 6.133424e-04]
0.99683005
model:bigscience-T0_3B; module:encoder; layer:17; n_components: 3; variance explained: [9.9621683e-01 6.1334210e-04 4.2240438e-04]
0.9972526


layer= 18


Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 2692.63it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4428.38it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 2741.41it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5332.02it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5483.77it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5619.57it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5757.03it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5571.45it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5028.93it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3959.63it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4747.95it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3976.86it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5590.94it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5667.84it/s]
Reading embeddings: 

(1008, 2048) (1008,)
PCA for prompts: ['null_pattern', 'null_pattern_reversed', 'gpt_3_true_false_neither', 'gpt_3_yes_no_maybe', 'mnli_crowdsource', 'always_sometimes_never', 'based_on_previous_passage', 'infer', 'claim', 'consider', 'follow', 'imply', 'guaranteed', 'guaranteed_possible', 'justified', 'must_be_true', 'should_assume', 'take_the_following']
model:bigscience-T0_3B; module:encoder; layer:18; n_components: 1; variance explained: [0.9946185]
0.9946185
model:bigscience-T0_3B; module:encoder; layer:18; n_components: 2; variance explained: [9.946185e-01 8.848367e-04]
0.9955033
model:bigscience-T0_3B; module:encoder; layer:18; n_components: 3; variance explained: [9.9461848e-01 8.8483683e-04 5.4812612e-04]
0.99605143


layer= 19


Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4544.65it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4156.89it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4615.47it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4731.02it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4769.55it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5548.55it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5750.12it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5478.53it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5606.69it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5601.47it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5658.15it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5679.90it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5671.95it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4619.37it/s]
Reading embeddings: 

(1008, 2048) (1008,)
PCA for prompts: ['null_pattern', 'null_pattern_reversed', 'gpt_3_true_false_neither', 'gpt_3_yes_no_maybe', 'mnli_crowdsource', 'always_sometimes_never', 'based_on_previous_passage', 'infer', 'claim', 'consider', 'follow', 'imply', 'guaranteed', 'guaranteed_possible', 'justified', 'must_be_true', 'should_assume', 'take_the_following']
model:bigscience-T0_3B; module:encoder; layer:19; n_components: 1; variance explained: [0.9925578]
0.9925578
model:bigscience-T0_3B; module:encoder; layer:19; n_components: 2; variance explained: [0.99255764 0.00122527]
0.99378294
model:bigscience-T0_3B; module:encoder; layer:19; n_components: 3; variance explained: [9.9255782e-01 1.2252664e-03 7.5072056e-04]
0.99453384


layer= 20


Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4702.04it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3886.06it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 1857.06it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5412.63it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5601.74it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5887.48it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5785.10it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5956.16it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5522.71it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5372.88it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5356.71it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5849.36it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5579.12it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5524.14it/s]
Reading embeddings: 

(1008, 2048) (1008,)
PCA for prompts: ['null_pattern', 'null_pattern_reversed', 'gpt_3_true_false_neither', 'gpt_3_yes_no_maybe', 'mnli_crowdsource', 'always_sometimes_never', 'based_on_previous_passage', 'infer', 'claim', 'consider', 'follow', 'imply', 'guaranteed', 'guaranteed_possible', 'justified', 'must_be_true', 'should_assume', 'take_the_following']
model:bigscience-T0_3B; module:encoder; layer:20; n_components: 1; variance explained: [0.9898807]
0.9898807
model:bigscience-T0_3B; module:encoder; layer:20; n_components: 2; variance explained: [0.9898807  0.00161116]
0.99149185
model:bigscience-T0_3B; module:encoder; layer:20; n_components: 3; variance explained: [9.898807e-01 1.611156e-03 9.720530e-04]
0.9924639


layer= 21


Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4421.96it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3804.60it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4662.84it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4711.28it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4780.42it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5427.64it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5775.57it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5542.13it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5787.53it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5492.62it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5779.13it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5919.98it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5951.48it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5916.10it/s]
Reading embeddings: 

(1008, 2048) (1008,)
PCA for prompts: ['null_pattern', 'null_pattern_reversed', 'gpt_3_true_false_neither', 'gpt_3_yes_no_maybe', 'mnli_crowdsource', 'always_sometimes_never', 'based_on_previous_passage', 'infer', 'claim', 'consider', 'follow', 'imply', 'guaranteed', 'guaranteed_possible', 'justified', 'must_be_true', 'should_assume', 'take_the_following']
model:bigscience-T0_3B; module:encoder; layer:21; n_components: 1; variance explained: [0.98656076]
0.98656076
model:bigscience-T0_3B; module:encoder; layer:21; n_components: 2; variance explained: [0.98656076 0.00206176]
0.98862255
model:bigscience-T0_3B; module:encoder; layer:21; n_components: 3; variance explained: [0.9865608  0.00206176 0.00127418]
0.9898968


layer= 22


Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 2771.56it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3797.16it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 2573.42it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5514.29it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5643.06it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5437.94it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5754.91it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5226.55it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5724.34it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5781.54it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5700.30it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5846.59it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5254.61it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4675.18it/s]
Reading embeddings: 

(1008, 2048) (1008,)
PCA for prompts: ['null_pattern', 'null_pattern_reversed', 'gpt_3_true_false_neither', 'gpt_3_yes_no_maybe', 'mnli_crowdsource', 'always_sometimes_never', 'based_on_previous_passage', 'infer', 'claim', 'consider', 'follow', 'imply', 'guaranteed', 'guaranteed_possible', 'justified', 'must_be_true', 'should_assume', 'take_the_following']
model:bigscience-T0_3B; module:encoder; layer:22; n_components: 1; variance explained: [0.9805164]
0.9805164
model:bigscience-T0_3B; module:encoder; layer:22; n_components: 2; variance explained: [0.9805164  0.00273535]
0.98325175
model:bigscience-T0_3B; module:encoder; layer:22; n_components: 3; variance explained: [0.98051655 0.00273535 0.0016682 ]
0.98492014


layer= 23


Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4459.06it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4429.63it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 2663.05it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4559.91it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5677.98it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 3913.90it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5601.34it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5444.12it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5738.18it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5683.75it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5526.35it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5635.34it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5510.15it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4605.15it/s]
Reading embeddings: 

(1008, 2048) (1008,)
PCA for prompts: ['null_pattern', 'null_pattern_reversed', 'gpt_3_true_false_neither', 'gpt_3_yes_no_maybe', 'mnli_crowdsource', 'always_sometimes_never', 'based_on_previous_passage', 'infer', 'claim', 'consider', 'follow', 'imply', 'guaranteed', 'guaranteed_possible', 'justified', 'must_be_true', 'should_assume', 'take_the_following']
model:bigscience-T0_3B; module:encoder; layer:23; n_components: 1; variance explained: [0.97186935]
0.97186935
model:bigscience-T0_3B; module:encoder; layer:23; n_components: 2; variance explained: [0.97186935 0.00372159]
0.97559094
model:bigscience-T0_3B; module:encoder; layer:23; n_components: 3; variance explained: [0.97186935 0.00372159 0.00223501]
0.97782594


layer= 24


Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4439.68it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4676.20it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 4667.00it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 2897.80it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5116.12it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5401.55it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5365.89it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5500.34it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5589.34it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5727.97it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5435.17it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5872.32it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 6002.74it/s]
Reading embeddings: 100%|██████████| 56/56 [00:00<00:00, 5993.39it/s]
Reading embeddings: 

(1008, 2048) (1008,)
PCA for prompts: ['null_pattern', 'null_pattern_reversed', 'gpt_3_true_false_neither', 'gpt_3_yes_no_maybe', 'mnli_crowdsource', 'always_sometimes_never', 'based_on_previous_passage', 'infer', 'claim', 'consider', 'follow', 'imply', 'guaranteed', 'guaranteed_possible', 'justified', 'must_be_true', 'should_assume', 'take_the_following']
model:bigscience-T0_3B; module:encoder; layer:24; n_components: 1; variance explained: [0.10334048]
0.103340484
model:bigscience-T0_3B; module:encoder; layer:24; n_components: 2; variance explained: [0.10334042 0.08637156]
0.18971199
model:bigscience-T0_3B; module:encoder; layer:24; n_components: 3; variance explained: [0.10334035 0.08637142 0.06249465]
0.25220644


