In [2]:
import pandas as pd

import shap
import torch
from transformers import pipeline, BertTokenizerFast

# Load Data

In [3]:
# Relative directory from which the test CSV is read. The trailing slash is
# required because the file name is appended directly to this string.
data_path = "../../data/fine-tuning/"

In [4]:
# Load the test CSV into a DataFrame and display it. The rendered output
# shows the columns `source`, `text` and `label`.
test_csv = f"{data_path}moravian_deu_test.csv"
test_df = pd.read_csv(test_csv)
test_df

Unnamed: 0,source,text,label
0,23,17 waren wir in Manakory,neutral
1,33,"ich grigte auch erlaubniß,",positive
2,11,"Wie mir dabey gewesen, deß waren alle meine Gl...",positive
3,26,In der Stunde machte sich der Heiland mir beka...,positive
4,27,"1744, am vierten Januar, wurde ich nebst meine...",neutral
...,...,...,...
437,9,Die lezte Zeit kränckelte er.,negative
438,38,Ich sahe sie oft auf ihrem Angesicht liegen un...,positive
439,13,Ich bat den Heiland mein Herz mit seinem Blute...,positive
440,34,nie hört’ man dich klagen;,positive


# Init Model and Tokenizer

In [5]:
# Device index handed to the pipeline: the current CUDA device when one is
# available, otherwise -1 (the value used here for the no-GPU case).
# The former bare `torch.device("cuda")` statement was dropped: it only built
# a device object and discarded it, so it never influenced device selection.
gpu = torch.cuda.current_device() if torch.cuda.is_available() else -1

# Fine-tuned checkpoint directory; the classifier and the tokenizer are both
# loaded from it so that they stay in sync.
model_path = "../../models/fine-tuned/gbert-base-moravian-sentiment"
# top_k=None asks the pipeline for the scores of all labels instead of only
# the best one; the SHAP values computed later have one column per label.
model = pipeline("text-classification", model=model_path, device=gpu, top_k=None)
tokenizer = BertTokenizerFast.from_pretrained(model_path)

Xformers is not installed correctly. If you want to use memory_efficient_attention to accelerate training use the following command to install Xformers
pip install xformers.


# Init shap Explainer

In [6]:
# Build a SHAP explainer around the classification pipeline, passing the
# tokenizer as the second argument. The progress output of the analysis cell
# shows that this resolves to a PartitionExplainer.
explainer = shap.Explainer(model, tokenizer)

# Analyze Data

In [7]:
# Explain every sentence of the test set in one call. This is the expensive
# step of the notebook (the recorded run took roughly 35 minutes).
test_texts = test_df["text"].tolist()
test_shap_values = explainer(test_texts)
test_shap_values

You seem to be using the pipelines sequentially on GPU. In order to maximize efficiency please use a dataset
You seem to be using the pipelines sequentially on GPU. In order to maximize efficiency please use a dataset


  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:   1%|          | 3/442 [00:00<?, ?it/s]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:   1%|          | 5/442 [00:25<36:14,  4.98s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:   1%|▏         | 6/442 [00:30<37:05,  5.10s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:   2%|▏         | 8/442 [00:40<36:32,  5.05s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:   3%|▎         | 12/442 [00:56<29:19,  4.09s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:   3%|▎         | 14/442 [01:08<34:05,  4.78s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:   4%|▎         | 16/442 [01:18<35:16,  4.97s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:   4%|▍         | 17/442 [01:24<37:28,  5.29s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:   4%|▍         | 19/442 [01:33<33:46,  4.79s/it]

  0%|          | 0/462 [00:00<?, ?it/s]

PartitionExplainer explainer:   6%|▌         | 25/442 [02:01<32:05,  4.62s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:   6%|▌         | 27/442 [02:12<33:45,  4.88s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:   7%|▋         | 30/442 [02:27<33:31,  4.88s/it]

  0%|          | 0/342 [00:00<?, ?it/s]

PartitionExplainer explainer:   7%|▋         | 33/442 [02:41<31:52,  4.68s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:   8%|▊         | 35/442 [02:51<33:06,  4.88s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:   9%|▊         | 38/442 [03:06<33:21,  4.95s/it]

  0%|          | 0/306 [00:00<?, ?it/s]

PartitionExplainer explainer:  10%|▉         | 42/442 [03:18<23:03,  3.46s/it]

  0%|          | 0/306 [00:00<?, ?it/s]

PartitionExplainer explainer:  10%|▉         | 44/442 [03:28<28:14,  4.26s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  10%|█         | 45/442 [03:34<30:39,  4.63s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  10%|█         | 46/442 [03:39<31:40,  4.80s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  11%|█         | 48/442 [03:50<33:06,  5.04s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  11%|█         | 49/442 [04:03<50:29,  7.71s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  11%|█▏        | 50/442 [04:12<51:14,  7.84s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  12%|█▏        | 51/442 [04:22<55:07,  8.46s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  12%|█▏        | 52/442 [04:31<56:32,  8.70s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  12%|█▏        | 53/442 [04:38<54:28,  8.40s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  12%|█▏        | 54/442 [04:47<55:07,  8.52s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  12%|█▏        | 55/442 [04:57<57:19,  8.89s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  13%|█▎        | 56/442 [05:05<55:12,  8.58s/it]

  0%|          | 0/240 [00:00<?, ?it/s]

PartitionExplainer explainer:  13%|█▎        | 59/442 [05:19<37:00,  5.80s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  14%|█▍        | 62/442 [05:34<33:38,  5.31s/it]

  0%|          | 0/420 [00:00<?, ?it/s]

PartitionExplainer explainer:  15%|█▍        | 65/442 [05:46<26:08,  4.16s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  15%|█▌        | 67/442 [05:56<28:35,  4.58s/it]

  0%|          | 0/420 [00:00<?, ?it/s]

PartitionExplainer explainer:  16%|█▌        | 70/442 [06:08<26:15,  4.24s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  17%|█▋        | 73/442 [06:22<28:13,  4.59s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  17%|█▋        | 75/442 [06:32<28:53,  4.72s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  17%|█▋        | 76/442 [06:38<29:44,  4.88s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  17%|█▋        | 77/442 [06:43<31:06,  5.11s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  18%|█▊        | 78/442 [06:49<31:38,  5.22s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  18%|█▊        | 80/442 [06:59<31:38,  5.24s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  18%|█▊        | 81/442 [07:05<31:16,  5.20s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  19%|█▉        | 83/442 [07:15<30:47,  5.15s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  19%|█▉        | 86/442 [07:29<27:38,  4.66s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  20%|█▉        | 88/442 [07:39<28:47,  4.88s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  21%|██        | 91/442 [07:54<28:50,  4.93s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  21%|██        | 93/442 [08:05<29:16,  5.03s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  22%|██▏       | 96/442 [08:20<28:47,  4.99s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  22%|██▏       | 98/442 [08:31<29:33,  5.15s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  24%|██▍       | 105/442 [08:59<22:54,  4.08s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  24%|██▍       | 107/442 [09:10<25:52,  4.63s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  25%|██▍       | 110/442 [09:25<26:50,  4.85s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  25%|██▌       | 112/442 [09:36<28:00,  5.09s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  26%|██▌       | 113/442 [09:42<28:48,  5.25s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  26%|██▌       | 114/442 [09:48<29:52,  5.47s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  26%|██▋       | 117/442 [10:03<27:57,  5.16s/it]

  0%|          | 0/306 [00:00<?, ?it/s]

PartitionExplainer explainer:  27%|██▋       | 119/442 [10:13<27:31,  5.11s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  27%|██▋       | 120/442 [10:19<28:00,  5.22s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  28%|██▊       | 122/442 [10:29<27:12,  5.10s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  29%|██▉       | 128/442 [10:52<17:36,  3.36s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  29%|██▉       | 129/442 [10:57<20:26,  3.92s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  30%|███       | 134/442 [11:21<23:46,  4.63s/it]

  0%|          | 0/420 [00:00<?, ?it/s]

PartitionExplainer explainer:  31%|███       | 136/442 [11:31<24:49,  4.87s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  31%|███▏      | 139/442 [11:46<24:06,  4.77s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  32%|███▏      | 142/442 [12:00<22:39,  4.53s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  33%|███▎      | 144/442 [12:10<23:34,  4.75s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  33%|███▎      | 148/442 [12:28<21:12,  4.33s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  34%|███▍      | 151/442 [12:39<19:20,  3.99s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  35%|███▍      | 154/442 [12:52<18:40,  3.89s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  35%|███▌      | 156/442 [13:03<21:32,  4.52s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  36%|███▌      | 159/442 [13:18<22:43,  4.82s/it]

  0%|          | 0/380 [00:00<?, ?it/s]

PartitionExplainer explainer:  36%|███▋      | 161/442 [13:28<23:12,  4.96s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  37%|███▋      | 164/442 [13:44<22:58,  4.96s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  38%|███▊      | 166/442 [13:54<23:22,  5.08s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  38%|███▊      | 167/442 [14:00<24:03,  5.25s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  38%|███▊      | 169/442 [14:10<23:47,  5.23s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  39%|███▊      | 171/442 [14:21<23:44,  5.26s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  39%|███▉      | 173/442 [14:32<23:25,  5.22s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  39%|███▉      | 174/442 [14:37<23:09,  5.19s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  40%|███▉      | 176/442 [14:47<22:39,  5.11s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  40%|████      | 179/442 [15:02<22:16,  5.08s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  41%|████      | 181/442 [15:12<21:55,  5.04s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  42%|████▏     | 187/442 [15:38<16:51,  3.97s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  43%|████▎     | 189/442 [15:49<20:29,  4.86s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  43%|████▎     | 190/442 [15:54<20:45,  4.94s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  44%|████▍     | 194/442 [16:06<14:18,  3.46s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  45%|████▍     | 197/442 [16:18<15:09,  3.71s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  45%|████▌     | 199/442 [16:29<17:49,  4.40s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  45%|████▌     | 200/442 [16:34<18:51,  4.68s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  46%|████▌     | 202/442 [16:44<19:18,  4.83s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  46%|████▌     | 204/442 [16:55<20:04,  5.06s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  46%|████▋     | 205/442 [17:00<20:34,  5.21s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  47%|████▋     | 207/442 [17:10<19:49,  5.06s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  48%|████▊     | 210/442 [17:25<18:54,  4.89s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  48%|████▊     | 213/442 [17:36<15:52,  4.16s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  49%|████▉     | 217/442 [17:51<12:51,  3.43s/it]

  0%|          | 0/306 [00:00<?, ?it/s]

PartitionExplainer explainer:  50%|████▉     | 219/442 [18:01<15:28,  4.16s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  50%|█████     | 221/442 [18:12<17:28,  4.74s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  50%|█████     | 222/442 [18:17<18:02,  4.92s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  51%|█████     | 224/442 [18:27<17:47,  4.89s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  51%|█████▏    | 227/442 [18:38<14:41,  4.10s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  52%|█████▏    | 231/442 [18:54<14:33,  4.14s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  53%|█████▎    | 233/442 [19:05<16:02,  4.61s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  53%|█████▎    | 236/442 [19:20<16:28,  4.80s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  54%|█████▍    | 238/442 [19:30<16:38,  4.90s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  55%|█████▍    | 241/442 [19:45<16:28,  4.92s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  55%|█████▍    | 243/442 [19:55<16:41,  5.03s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  57%|█████▋    | 250/442 [20:24<13:12,  4.13s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  57%|█████▋    | 251/442 [20:30<14:20,  4.51s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  57%|█████▋    | 252/442 [20:35<14:56,  4.72s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  58%|█████▊    | 256/442 [20:49<10:38,  3.43s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  58%|█████▊    | 258/442 [20:59<13:00,  4.24s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  59%|█████▉    | 261/442 [21:14<14:00,  4.64s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  60%|█████▉    | 263/442 [21:25<14:29,  4.86s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  60%|█████▉    | 264/442 [21:30<14:54,  5.03s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  61%|██████    | 269/442 [21:52<12:57,  4.50s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  61%|██████▏   | 271/442 [22:03<13:41,  4.80s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  62%|██████▏   | 272/442 [22:08<14:04,  4.97s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  62%|██████▏   | 275/442 [22:21<12:18,  4.42s/it]

  0%|          | 0/342 [00:00<?, ?it/s]

PartitionExplainer explainer:  63%|██████▎   | 277/442 [22:30<12:46,  4.65s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  64%|██████▍   | 283/442 [22:56<10:02,  3.79s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  65%|██████▍   | 286/442 [23:09<10:37,  4.09s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  66%|██████▌   | 292/442 [23:32<09:54,  3.96s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  66%|██████▋   | 293/442 [23:37<10:51,  4.37s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  67%|██████▋   | 296/442 [23:48<08:39,  3.56s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  68%|██████▊   | 299/442 [24:00<08:13,  3.45s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  68%|██████▊   | 301/442 [24:11<10:10,  4.33s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  69%|██████▉   | 304/442 [24:23<09:43,  4.23s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  70%|██████▉   | 308/442 [24:41<09:52,  4.42s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  70%|███████   | 310/442 [24:52<10:38,  4.84s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  71%|███████   | 313/442 [25:07<10:38,  4.95s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  71%|███████▏  | 315/442 [25:18<10:44,  5.08s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  72%|███████▏  | 318/442 [25:33<10:22,  5.02s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  72%|███████▏  | 320/442 [25:43<10:21,  5.10s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  73%|███████▎  | 323/442 [25:59<10:02,  5.06s/it]

  0%|          | 0/462 [00:00<?, ?it/s]

PartitionExplainer explainer:  74%|███████▍  | 327/442 [26:12<06:12,  3.24s/it]

  0%|          | 0/420 [00:00<?, ?it/s]

PartitionExplainer explainer:  74%|███████▍  | 329/442 [26:23<07:48,  4.14s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  75%|███████▌  | 332/442 [26:38<08:33,  4.66s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  76%|███████▌  | 334/442 [26:48<08:47,  4.88s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  77%|███████▋  | 342/442 [27:18<05:50,  3.51s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  78%|███████▊  | 344/442 [27:29<07:11,  4.40s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  78%|███████▊  | 346/442 [27:39<07:34,  4.73s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  79%|███████▉  | 349/442 [27:53<07:06,  4.58s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  80%|███████▉  | 352/442 [28:09<07:21,  4.91s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  80%|████████  | 355/442 [28:22<06:13,  4.29s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  81%|████████  | 357/442 [28:32<06:41,  4.72s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  81%|████████▏ | 360/442 [28:43<04:58,  3.65s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  82%|████████▏ | 364/442 [29:00<05:05,  3.92s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  83%|████████▎ | 366/442 [29:10<05:41,  4.49s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  84%|████████▎ | 370/442 [29:25<04:39,  3.88s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  84%|████████▍ | 373/442 [29:37<04:33,  3.97s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  85%|████████▍ | 375/442 [29:49<05:25,  4.85s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  86%|████████▌ | 378/442 [30:04<05:17,  4.96s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  86%|████████▌ | 380/442 [30:14<05:09,  5.00s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  87%|████████▋ | 383/442 [30:29<04:32,  4.63s/it]

  0%|          | 0/342 [00:00<?, ?it/s]

PartitionExplainer explainer:  87%|████████▋ | 386/442 [30:44<04:27,  4.78s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  88%|████████▊ | 388/442 [30:55<04:32,  5.05s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  90%|████████▉ | 397/442 [31:34<03:17,  4.39s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  90%|█████████ | 399/442 [31:45<03:26,  4.81s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  91%|█████████ | 402/442 [32:00<03:17,  4.93s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  91%|█████████▏| 404/442 [32:10<03:10,  5.01s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  92%|█████████▏| 406/442 [32:17<02:22,  3.96s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  92%|█████████▏| 408/442 [32:24<01:57,  3.45s/it]

  0%|          | 0/462 [00:00<?, ?it/s]

PartitionExplainer explainer:  93%|█████████▎| 410/442 [32:32<01:58,  3.69s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  93%|█████████▎| 411/442 [32:39<02:20,  4.54s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  93%|█████████▎| 412/442 [32:44<02:23,  4.78s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  93%|█████████▎| 413/442 [32:49<02:23,  4.93s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  94%|█████████▍| 416/442 [33:03<01:56,  4.49s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  95%|█████████▍| 418/442 [33:13<01:54,  4.79s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  95%|█████████▌| 420/442 [33:20<01:23,  3.78s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  95%|█████████▌| 422/442 [33:29<01:23,  4.15s/it]

  0%|          | 0/462 [00:00<?, ?it/s]

PartitionExplainer explainer:  97%|█████████▋| 427/442 [33:53<01:08,  4.57s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  98%|█████████▊| 431/442 [34:07<00:38,  3.52s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  98%|█████████▊| 434/442 [34:22<00:35,  4.43s/it]

  0%|          | 0/462 [00:00<?, ?it/s]

PartitionExplainer explainer:  99%|█████████▊| 436/442 [34:32<00:28,  4.82s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer:  99%|█████████▉| 439/442 [34:45<00:12,  4.11s/it]

  0%|          | 0/498 [00:00<?, ?it/s]

PartitionExplainer explainer: 443it [35:01,  4.78s/it]


.values =
array([array([[ 0.00000000e+00,  0.00000000e+00,  0.00000000e+00],
              [-5.42174070e-03,  1.86360031e-02, -1.32142670e-02],
              [-5.74924254e-03,  1.77844167e-02, -1.20351558e-02],
              [-2.02578062e-03,  1.94443762e-03,  8.13530896e-05],
              [-3.75381812e-03,  1.03080571e-02, -6.55425194e-03],
              [-4.19489065e-03,  1.33005530e-02, -9.10567864e-03],
              [-7.74953989e-03,  2.21865773e-02, -1.44370301e-02],
              [-1.31878284e-03,  5.94078004e-03, -4.62198191e-03],
              [ 0.00000000e+00,  0.00000000e+00,  0.00000000e+00]]),
       array([[ 0.00000000e+00,  0.00000000e+00,  0.00000000e+00],
              [-2.28482210e-02, -7.67068280e-02,  9.95550677e-02],
              [-1.84809345e-03, -5.98378738e-02,  6.16859701e-02],
              [-7.27348575e-03, -2.73017485e-02,  3.45752379e-02],
              [-9.67608581e-03, -3.90091220e-02,  4.86852145e-02],
              [ 6.84127482e-03, -4.13784922e-01,  

# Build and Store DataFrame

In [8]:
# Flatten the explanation into one record per (text, token):
# [text_id, token, <one SHAP value per output column>].
data = []
for text_id, (tokens, token_values) in enumerate(
    zip(test_shap_values.data, test_shap_values.values)
):
    last_pos = len(tokens) - 1
    for pos, raw_token in enumerate(tokens):
        # The first and last positions of every instance are relabelled with
        # the special-token names. NOTE(review): presumably the raw entries at
        # these positions are blank placeholders -- confirm against the masker.
        if pos == 0:
            token_label = "[CLS]"
        elif pos == last_pos:
            token_label = "[SEP]"
        else:
            token_label = raw_token
        data.append([text_id, token_label, *token_values[pos]])

# NOTE(review): the column names assume the model's outputs are ordered
# negative, neutral, positive -- verify against the model's label mapping.
shap_columns = ["text_id", "token", "shap_neg", "shap_neut", "shap_pos"]
shap_df = pd.DataFrame(data, columns=shap_columns)
shap_df

Unnamed: 0,text_id,token,shap_neg,shap_neut,shap_pos
0,0,[CLS],0.000000,0.000000,0.000000
1,0,17,-0.005422,0.018636,-0.013214
2,0,waren,-0.005749,0.017784,-0.012035
3,0,wir,-0.002026,0.001944,0.000081
4,0,in,-0.003754,0.010308,-0.006554
...,...,...,...,...,...
16418,441,Liebe,-0.020607,-0.363338,0.383945
16419,441,zu,0.004014,-0.026877,0.022863
16420,441,begegnen,-0.007661,-0.043362,0.051023
16421,441,.,0.000910,-0.046910,0.046001


In [9]:
# Persist the token-level SHAP table; index=False keeps the DataFrame's row
# index out of the CSV.
# NOTE(review): the target directory is assumed to exist already -- confirm.
shap_df.to_csv("../../data/shap/gbert_test_shap-values.csv", index=False)