In [1]:
'''
Code source (with some changes):
https://levelup.gitconnected.com/huggingface-transformers-interpretability-with-captum-28e4ff4df234
https://gist.githubusercontent.com/theDestI/fe9ea0d89386cf00a12e60dd346f2109/raw/15c992f43ddecb0f0f857cea9f61cd22d59393ab/explain.py
'''

import torch
import pandas as pd

from torch import tensor 
import transformers
from transformers.pipelines import TextClassificationPipeline
from transformers import AutoTokenizer
from transformers import AutoModelForSequenceClassification
from captum.attr import LayerIntegratedGradients, TokenReferenceBase, visualization

import matplotlib.pyplot as plt

import argparse 
import jsonlines
import os 

  from .autonotebook import tqdm as notebook_tqdm


In [7]:
class ExplainableTransformerPipeline():
    """Wrapper for Captum framework usage with Huggingface Pipeline.

    Holds a text-classification pipeline and computes token-level
    attributions for its model with Layer Integrated Gradients over the
    embedding layer, then renders them with Captum's text visualization.
    """

    def __init__(self, name: str, pipeline: "TextClassificationPipeline", device: str):
        """
            Store the pipeline to explain and the device tensors are created on.

            Args:
                name: identifier for this wrapper (stored, not otherwise used here).
                pipeline: Huggingface text-classification pipeline (model + tokenizer).
                device: device passed to ``torch.tensor`` when building inputs/baselines.
        """
        self.__name = name
        self.__pipeline = pipeline
        self.__device = device
        # Human-readable names for class indices; only two classes are mapped.
        self.indToLabel = ["Negative", "Positive"]
        self.labelToInd = {
            "Negative": 0,
            "Positive": 1,
        }

    def forward_func(self, inputs: torch.Tensor, position = 0):
        """
            Wrapper around prediction method of pipeline.

            Calls the pipeline's model on ``inputs`` with an all-ones attention
            mask and returns element ``position`` of the model output
            (element 0 is used as the logits by ``explain``).
        """
        pred = self.__pipeline.model(inputs,
                       attention_mask=torch.ones_like(inputs))
        return pred[position]

    def visualize(self,
            inputs: list,
            attributes: torch.Tensor,
            outfile_path: str,
            pred,
            label,
            delta,
            attr_class_idx = None,
        ):
        """
            Visualization method.
            Takes the list of input tokens and the corresponding attributions
            and renders them with Captum's text visualization.

            Args:
                inputs: tokens shown in the "Word Importance" column.
                attributes: attribution tensor; summed over its last dimension
                    to obtain one score per token.
                outfile_path: accepted for interface compatibility but
                    currently unused -- nothing is written to disk.
                pred: model output used for the displayed class and probability.
                label: index of the true class (looked up in ``indToLabel``).
                delta: convergence delta returned by ``lig.attribute``.
                attr_class_idx: index of the class the attributions were
                    computed for. Defaults to the argmax of ``pred`` when omitted.
        """
        # Detach and move to CPU so .numpy() works regardless of the device
        # the attributions were computed on.
        attributes = attributes.detach().cpu()
        pred = pred.detach().cpu()
        delta = delta.detach().cpu()

        attr_sum = attributes.sum(-1)

        # Normalize to unit L2 norm; skip when the norm is zero to avoid NaNs.
        norm = torch.norm(attr_sum)
        attr = attr_sum / norm if norm > 0 else attr_sum

        pred_idx = pred.argmax().item()
        if attr_class_idx is None:
            attr_class_idx = pred_idx

        vis_data_record = visualization.VisualizationDataRecord(
            word_attributions=attr.numpy()[0],
            # Explicit dim: implicit-dim Softmax is deprecated and emits a warning.
            pred_prob=torch.softmax(pred, dim=-1).max().item(),
            pred_class=self.indToLabel[pred_idx],
            true_class=self.indToLabel[label],
            attr_class=self.indToLabel[attr_class_idx],
            attr_score=attributes.sum().item(),
            raw_input_ids=inputs,
            convergence_score=delta.numpy()[0]
        )

        _ = visualization.visualize_text([vis_data_record])

    def explain(self, text: str, label: int, outfile_path: str):
        """
            Main entry method. Passes text through series of transformations and through the model.
            Calls visualization method.

            Args:
                text: raw input text to classify and explain.
                label: index of the true class, forwarded to ``visualize``.
                outfile_path: forwarded to ``visualize`` (currently unused there).
        """
        prediction = self.__pipeline.predict(text)
        inputs = self.generate_inputs(text)
        baseline = self.generate_baseline(sequence_len = inputs.shape[1])

        # Only the values of this forward pass are displayed; no gradients needed.
        with torch.no_grad():
            preds = self.forward_func(inputs)

        # base_model resolves to the backbone (e.g. `.deberta`) via the model's
        # base_model_prefix, so the embedding layer is found for other
        # architectures as well.
        embeddings = self.__pipeline.model.base_model.embeddings
        lig = LayerIntegratedGradients(self.forward_func, embeddings)

        # Attributions are computed for the class the pipeline predicted.
        target = self.__pipeline.model.config.label2id[prediction[0]['label']]

        attributes, delta = lig.attribute(inputs=inputs,
                                  baselines=baseline,
                                  target = target,
                                  return_convergence_delta = True)

        self.visualize(
            self.tokenize_inputs(text),
            attributes.cpu(),
            outfile_path,
            preds.cpu(),
            label,
            delta.cpu(),
            target,
        )

    def tokenize_inputs(self, text: str) -> list:
        """
            Return the tokenizer's token strings for ``text``.
        """
        return self.__pipeline.tokenizer.tokenize(text)

    def generate_inputs(self, text: str) -> torch.Tensor:
        """
            Convenience method for generation of input ids as a tensor with a
            leading batch dimension of size 1.

            NOTE(review): ids are encoded without special tokens, while
            ``generate_baseline`` places CLS/SEP ids at its first/last
            position -- confirm this asymmetry is intended.
        """
        ids = self.__pipeline.tokenizer.encode(text, add_special_tokens=False)
        return torch.tensor(ids, dtype=torch.long, device = self.__device).unsqueeze(0)

    def generate_baseline(self, sequence_len: int) -> torch.Tensor:
        """
            Convenience method for generation of the baseline ids as a tensor
            with a leading batch dimension of size 1.

            The baseline is CLS, then PAD ids, then SEP, ``sequence_len`` long.
            For sequences shorter than two tokens there is no room for both
            CLS and SEP, so an all-PAD baseline of the requested length is
            returned to keep its shape equal to the inputs.
        """
        tokenizer = self.__pipeline.tokenizer
        if sequence_len < 2:
            ids = [tokenizer.pad_token_id] * max(sequence_len, 0)
        else:
            ids = (
                [tokenizer.cls_token_id]
                + [tokenizer.pad_token_id] * (sequence_len - 2)
                + [tokenizer.sep_token_id]
            )
        return torch.tensor(ids, dtype=torch.long, device = self.__device).unsqueeze(0)

In [3]:
def main(args):
    """Explain every record of the analysis file with the configured model.

    Reads ``args.model_checkpoint``, ``args.num_labels``,
    ``args.a1_analysis_file`` and ``args.output_dir``. Each record of the
    JSON-lines file must provide a "review" text and a "label"; both are
    passed to ``ExplainableTransformerPipeline.explain`` together with a
    per-example path under the output directory.
    """
    checkpoint = args.model_checkpoint
    tokenizer = AutoTokenizer.from_pretrained(checkpoint)
    model = AutoModelForSequenceClassification.from_pretrained(
        checkpoint, num_labels=args.num_labels
    )

    # Prefer the GPU when one is available.
    device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')

    clf = transformers.pipeline(
        "text-classification",
        model=model,
        tokenizer=tokenizer,
        device=device,
    )
    exp_model = ExplainableTransformerPipeline(checkpoint, clf, device)

    with jsonlines.open(args.a1_analysis_file, 'r') as reader:
        for idx, obj in enumerate(reader):
            # Progress is reported 1-based; output paths are numbered from 0.
            print("Explaining {}".format(idx + 1))
            example_path = os.path.join(args.output_dir, f'example_{idx}')
            exp_model.explain(obj["review"], obj["label"], example_path)
    

In [8]:
if __name__ == '__main__':
    class Args:
        """Plain settings object used in place of an argparse namespace."""

        def __init__(self):
            settings = {
                # Directory where attribution figures will be saved
                # (not read by main()).
                "analsis_dir": "out",
                # Model checkpoint to load.
                "model_checkpoint": 'microsoft/deberta-v3-base',
                # Path to the a1 analysis file (JSON lines).
                "a1_analysis_file": 'out/a1_analysis_data.jsonl',
                # Number of labels for the task.
                "num_labels": 2,
                # Directory used to build the per-example output paths.
                "output_dir": 'out',
            }
            for field, value in settings.items():
                setattr(self, field, value)

    args = Args()
    main(args)

Special tokens have been added in the vocabulary, make sure the associated word embeddings are fine-tuned or trained.
Special tokens have been added in the vocabulary, make sure the associated word embeddings are fine-tuned or trained.
Some weights of DebertaV2ForSequenceClassification were not initialized from the model checkpoint at microsoft/deberta-v3-base and are newly initialized: ['classifier.bias', 'pooler.dense.bias', 'pooler.dense.weight', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Explaining 1


  pred_prob=torch.nn.Softmax()(pred).max().item(),


True Label,Predicted Label,Attribution Label,Attribution Score,Word Importance
Negative,Negative (0.51),Negative,0.13,"▁This ▁show ▁is ▁awesome ▁and ▁we ▁have ▁been ▁enjoying ▁it ▁thoroughly . ▁Set ▁in ▁Alaska , ▁I ▁don ' t ▁agree ▁with ▁the ▁homosexual ▁content ▁on ▁tonight ' s ▁show . ▁I ▁feel ▁that ▁you ▁are ▁pushing ▁too ▁hard ▁to ▁bring ▁New ▁York ▁to ▁Alaska . ▁Its ▁one ▁thing ▁to ▁have ▁a ▁New ▁Yorker ▁struggling ▁in ▁the ▁Alaska ▁wild , ▁but ▁to ▁try ▁to ▁turn ▁the ▁Alaska ▁town ▁into ▁New ▁York ? ▁This ▁is ▁a ▁nice ▁show ▁about ▁dainty ▁women ▁and ▁true ▁Alaska ▁Men ▁and ▁to ▁bring ▁a ▁same ▁sex ▁couple ▁into ▁the ▁mix ▁is ▁throwing ▁the ▁balance ▁way ▁off . ▁Alaska ▁should ▁be ▁Port rayed ▁as ▁a ▁man ▁and ▁New ▁York ▁as ▁the ▁woman . ▁I ▁think ▁the ▁first ▁9 ▁shows ▁have ▁the ▁perfect ▁balance ▁with ▁what ▁you ▁all ▁are ▁doing . ▁Can ' t ▁we ▁have ▁a ▁nice ▁show ▁without ▁the ▁imbalance ▁of ▁nature ."
,,,,


Explaining 2


True Label,Predicted Label,Attribution Label,Attribution Score,Word Importance
Negative,Negative (0.55),Negative,1.99,"▁The ▁movie ▁was ▁a ▁pleasure ▁to ▁watch ▁if ▁you ▁are ▁a ▁fan ▁of ▁the ▁Stooges . ▁The ▁story ▁is ▁told ▁from ▁the ▁point ▁of ▁view ▁of ▁Moe ▁Howard ▁and ▁his ▁relationships ▁with ▁his ▁brothers ▁She mp ▁and ▁Jerome ▁( Cur ly ) ▁Howard , ▁also ▁the ▁life ▁long ▁friendship ▁with ▁Larry ▁Fine . ▁The ▁movie ▁deals ▁mostly ▁with ▁the ▁off ▁camera ▁high ▁points ▁and ▁pit ▁falls ▁of ▁the ▁Stooges ▁multi ▁decade ▁career . ▁The ▁casting ▁director ▁and ▁makeup ▁artist ▁did ▁a ▁fair ▁job ▁of ▁finding ▁actors ▁who ▁resembled ▁the ▁famous ▁ensemble . ▁The ▁actor ▁who ▁plays ▁"" Cur ly "" ▁Howard ▁did ▁a ▁fine ▁job ▁of ▁portraying ▁the ▁on ▁camera ▁antics ▁of ▁the ▁most ▁beloved ▁Sto oge . ▁A ▁must ▁see ▁for ▁any ▁fan ▁of ▁Three ▁Stooges ▁shorts ."
,,,,


Explaining 3


True Label,Predicted Label,Attribution Label,Attribution Score,Word Importance
Negative,Negative (0.61),Negative,0.21,"▁After ▁seeing ▁Forever ▁Hollywood , ▁it ▁would ▁be ▁natural ▁to ▁want ▁to ▁see ▁a ▁John ▁Waters ▁film . ▁At ▁least , ▁one ▁get ▁to ▁say ▁that ▁they ▁have ▁joined ▁the ▁legions ▁of ▁cinema ▁co gno s cent i ▁who ▁have ▁experienced ▁the ▁unique ▁cinematic ▁styling s ▁of ▁perhaps ▁the ▁best ▁known ▁non - mainstream ▁director . ▁It ' s ▁worth ▁the ▁effort , ▁and ▁PF ▁is ▁a ▁lot ▁better ▁than ▁Eraser head , and ▁there ▁is ▁a ▁certain ▁camp iness ▁about ▁his ▁films ▁which ▁his ▁followers ▁find ▁addicting ."
,,,,


Explaining 4


True Label,Predicted Label,Attribution Label,Attribution Score,Word Importance
Positive,Negative (0.53),Negative,0.43,"▁Man , ▁I ▁can ' t ▁believe ▁the ▁largely ▁harsh ▁and ▁negative ▁comments ▁for ▁this ▁movie . ▁Okay , ▁it ▁sure ▁a in ' t ▁no ▁sophisticated ▁work ▁of ▁cinematic ▁art . ▁But ▁it ▁is ▁a ▁good ▁deal ▁of ▁entertaining ly ▁tacky ▁fun . ▁For ▁starters , ▁the ▁titular ▁pumpkin - headed ▁supernatural ▁killer ▁dude ▁has ▁to ▁be ▁one ▁of ▁the ▁single ▁most ▁laughably ▁silly ▁and ▁un scary ▁things ▁to ▁ever ▁stumble ▁in ▁front ▁of ▁a ▁camera ; ▁he ▁looks ▁like ▁something ▁you ▁would ▁see ▁in ▁a ▁fourth - rate ▁carnival ▁spook house . ▁Secondly , ▁the ▁moderate ▁go re ▁is ▁ridiculously ▁fake ▁and ▁unconvincing , ▁with ▁the ▁definite ▁highlight ▁occurring ▁when ▁this ▁annoying ▁uptight ▁ultra - conservative ▁woman ▁gets ▁electrocuted ▁by ▁a ▁toaster . ▁Then ▁there ' s ▁the ▁always ▁welcome ▁presence ▁of ▁the ▁ever - lovely ▁Linnea ▁Quigley , ▁who ' s ▁memorably ▁introduced ▁taking ▁a ▁nice , ▁long , ▁utterly ▁gratuitous ▁shower ▁that ▁goes ▁on ▁for ▁two ▁minutes . ▁Amazingly , ▁we ▁also ▁have ▁appearances ▁by ▁deceased ▁sch lock ▁picture ▁legends ▁John ▁Carr adine ▁as ▁an ▁evil ▁warlock ▁and ▁Cameron ▁Mitchell ▁as ▁a ▁horror ▁TV ▁show ▁host . ▁Moreover , ▁scream ▁queens ▁Brink e ▁Stevens ▁and ▁Dawn ▁Wild smith ▁have ▁fleeting ▁cameos . ▁Lead ▁child ▁actor ▁Ryan ▁Lat shaw ▁projects ▁all ▁the ▁charm ▁and ▁acting ▁ability ▁of ▁a ▁moldy ▁old ▁tree ▁stump . ▁Pretty ▁brunette ▁Rachel ▁Carter ▁pops ▁her ▁top ▁and ▁bare s ▁her ▁cute ▁little ▁breasts . ▁The ▁crud dy ▁special ▁effects ▁are ▁decidedly ▁less ▁than ▁special . ▁The ▁score ▁is ▁suitably ▁overwrought . ▁Yet ▁this ▁film ▁overall ▁has ▁a ▁certain ▁endearing ly ▁hokey ▁appeal ▁to ▁it ▁which ▁in ▁turn ▁makes ▁this ▁honey ▁a ▁real ▁d elect ably ▁cheesy ▁hoot ▁to ▁watch ."
,,,,


Explaining 5


True Label,Predicted Label,Attribution Label,Attribution Score,Word Importance
Positive,Negative (0.54),Negative,-3.17,"▁U zu maki ▁succeeds ▁as ▁at ▁plunging ▁you ▁into ▁a ▁bizarre ▁surreal ity ▁where ▁U zu maki ▁shapes ▁haunt ▁and ▁curse ▁a ▁town . ▁It ▁fails ▁at ▁being ▁a ▁competent ▁horror ▁movie . ▁While ▁the ▁film ▁is ▁sure ▁to ▁draw ▁attention ▁mainly ▁to ▁it ' s ▁bizarre ▁plot ▁line ▁and ▁a ▁few ▁interesting ▁visual ▁treats , ▁it ' s ▁going ▁to ▁come ▁off ▁better ▁as ▁a ▁dark ▁comedy ▁than ▁a ▁horror ▁film . ▁It ' s ▁definitely ▁a ▁film ▁you ▁should ▁see ▁if ▁your ▁into ▁the ▁kind ▁of ▁stuff - ▁but ▁if ▁your ▁looking ▁for ▁a ▁scare ▁or ▁even ▁a ▁small ▁chill , ▁you ' ll ▁want ▁to ▁look ▁elsewhere . ▁U zu maki ▁doesn ' t ▁really ▁have ▁much ▁else ▁up ▁it ' s ▁sleeve ▁but ▁a ▁great ▁chain ▁of ▁odd ▁events . < br ▁/ > < br ▁/ > a"
,,,,


Explaining 6


True Label,Predicted Label,Attribution Label,Attribution Score,Word Importance
Negative,Negative (0.59),Negative,0.42,"▁Rabbit ▁Fever ▁is ▁one ▁of ▁those ▁film ▁oddities . ▁It ' s ▁an ▁enjoyable ▁90 ▁minutes , ▁demands ▁little ▁of ▁the ▁viewer , ▁and ▁delivers ▁as ▁much , ▁and ▁on ▁any ▁terrestrial ▁television ▁channel ▁even ▁in ▁a ▁prime ▁time ▁slot ▁I ▁think ▁that ▁Rabbit ▁Fever ▁would ▁be ▁rather ▁well ▁received . ▁Which ▁makes ▁me ▁wonder ▁why ▁it ▁has ▁been ▁pushed ▁into ▁cinemas . < br ▁/ > < br ▁/ > The ▁movie ▁is ▁filmed ▁in ▁the ▁style ▁of ▁a ▁television ▁documentary , ▁and ▁introduces ▁us ▁to ▁6 ▁women ▁who ▁have ▁am ▁addictive ▁relationship ▁with ▁the ▁Rabbit ▁Vib rator . ▁The ▁film ▁is ▁primarily ▁focused ▁on ▁investigating ▁a ▁supposed ▁addictive ▁quality ▁to ▁the ▁famous ▁sex ▁aid ▁product . ▁The ▁narrative ▁is ▁100 % ▁tongue ▁in ▁cheek ▁throughout . < br ▁/ > < br ▁/ > The ▁storyline ▁is ▁strong , ▁an ▁introduction ▁to ▁some ▁well ▁rounded ▁and ▁likable ▁characters , ▁some ▁enjoyable ▁back - story , ▁peripheral ▁characters ▁and ▁situations ▁develops ▁into ▁an ▁engaging ▁story , ▁and ▁pleasing ▁conclusions . ▁Sadly ▁there ' s ▁nothing ▁that ▁feels ▁clever ▁or ▁new . ▁< br ▁/ > < br ▁/ > Rabbit ▁Fever ▁has ▁some ▁sharp ▁moments , ▁a ▁few ▁switches ▁that ▁hint ▁at ▁what ▁the ▁writers ▁are ▁capable ▁of , ▁and ▁all ▁credit ▁to ▁them ▁it ' s ▁not ▁just ▁90 ▁minutes ▁of ▁knob ▁gags ▁and ▁innuendo , ▁I ▁could ▁probably ▁watch ▁it ▁with ▁my ▁mother . ▁But ▁there ' s ▁a ▁laziness ▁about ▁some ▁of ▁the ▁scenes ▁that ▁holds ▁it ▁back , ▁those ▁moments ▁went ▁you ▁are ▁up ▁for ▁it , ▁when ▁you ▁want ▁it ▁to ▁be ▁outrageous , ▁and ▁all ▁you ▁get ▁is ▁a ▁dollop ▁of ▁sit - com . < br ▁/ > < br ▁/ > I ▁chuckled , ▁I ▁left ▁the ▁theatre ▁feeling ▁empathy ▁for ▁the ▁characters , ▁but ▁I ▁also ▁left ▁with ▁the ▁bitter ▁thought ▁that ▁someone ▁had ▁taken ▁a ▁90 ▁minute ▁reel ▁of ▁made ▁for ▁TV , ▁light ▁entertainment ▁and ▁tried ▁to ▁put ▁it ▁into ▁national ▁cinema . 
▁< br ▁/ > < br ▁/ > I ▁think ▁Rabbit ▁Fever ▁achieves ▁some ▁of ▁what ▁it ▁set ▁out ▁to ▁do , ▁it ' s ▁a ▁quirky ▁subject , ▁a ▁rounded ▁storyline , ▁a ▁well ▁presented ▁cast ▁and ▁a ▁good ▁diversion ▁for ▁90 ▁minutes . ▁But ▁there ' s ▁nothing ▁in ▁this ▁that ▁can ▁justify ▁the ▁extravagance ▁of ▁a ▁movie ▁theatre ▁environment . ▁Quite ▁the ▁opposite ▁- ▁a ▁few ▁commercial ▁breaks ▁would ▁have ▁given ▁the ▁viewer ▁chance ▁to ▁grab ▁a ▁breath ▁of ▁life ▁that ▁Rabbit ▁Fever ▁seems ▁to ▁lack ."
,,,,


Explaining 7


: 