Connected to venv (Python 3.11.5)

In [None]:
import os
import json
import torch
import torch.nn as nn
import torch.nn.functional as F
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
from typing import Dict, List, Tuple, Optional, Any
import joblib
from sklearn.preprocessing import LabelEncoder
from sklearn.metrics.pairwise import cosine_similarity
import nltk
from nltk.corpus import wordnet
import random
import warnings
from itertools import combinations
warnings.filterwarnings("ignore")

# HuggingFace imports
from transformers import AutoTokenizer, AutoConfig, AutoModel
from datasets import load_dataset

# Captum imports for Integrated Gradients
from captum.attr import IntegratedGradients, visualization as viz
from captum.attr import TokenReferenceBase, configure_interpretable_embedding_layer, remove_interpretable_embedding_layer

# Set seed for determinism
def set_seed(s=42):
    """Seed Python's `random`, NumPy and PyTorch, and put cuDNN in deterministic mode.

    Args:
        s: Integer seed applied to every random number generator touched here.
    """
    # CPU-side generators all take the seed as their single positional argument.
    for seeder in (random.seed, np.random.seed, torch.manual_seed):
        seeder(s)

    # CUDA generators only exist when a GPU is visible.
    if torch.cuda.is_available():
        torch.cuda.manual_seed_all(s)

    cudnn = torch.backends.cudnn
    cudnn.deterministic = True
    cudnn.benchmark = False


set_seed(42)

Connected to .venv (Python 3.12.7)

In [None]:
import os
import json
import torch
import torch.nn as nn
import torch.nn.functional as F
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
from typing import Dict, List, Tuple, Optional, Any
import joblib
from sklearn.preprocessing import LabelEncoder
from sklearn.metrics.pairwise import cosine_similarity
import nltk
from nltk.corpus import wordnet
import random
import warnings
from itertools import combinations
warnings.filterwarnings("ignore")

# HuggingFace imports
from transformers import AutoTokenizer, AutoConfig, AutoModel
from datasets import load_dataset

# Captum imports for Integrated Gradients
from captum.attr import IntegratedGradients, visualization as viz
from captum.attr import TokenReferenceBase, configure_interpretable_embedding_layer, remove_interpretable_embedding_layer

# Set seed for determinism
def set_seed(s=42):
    """Make runs repeatable by seeding every random number generator used in the notebook.

    Args:
        s: Seed value handed to `random`, NumPy and PyTorch (CPU and, if present, CUDA).
    """
    torch.manual_seed(s)
    np.random.seed(s)
    random.seed(s)

    cuda_present = torch.cuda.is_available()
    if cuda_present:
        torch.cuda.manual_seed_all(s)

    # Disable cuDNN autotuning and request deterministic kernels.
    torch.backends.cudnn.benchmark = False
    torch.backends.cudnn.deterministic = True


set_seed(42)

In [None]:
# Pick the compute device once: CUDA when a GPU is visible, otherwise the CPU.
_device_name = 'cpu'
if torch.cuda.is_available():
    _device_name = 'cuda'
device = torch.device(_device_name)
print(f"üîß Using device: {device}")


# ## Model Architecture

üîß Using device: cuda


In [None]:
class BERTweetSingleTaskTransformer(nn.Module):
    """BERTweet encoder followed by an MLP head for single-task classification.

    The head is three linear layers (hidden -> hidden -> hidden // 2 ->
    num_classes) with GELU and dropout in between. The last-layer hidden state
    at sequence position 0 is used as the sentence representation.
    """

    def __init__(
        self,
        model_name: str = "vinai/bertweet-base",
        num_classes: int = 3,
        hidden_dropout_prob: float = 0.1,
        attention_dropout_prob: float = 0.1,
        classifier_dropout: float = 0.1
    ):
        """Build the encoder and the classification head.

        Args:
            model_name: Model id or path handed to ``AutoConfig`` / ``AutoModel``.
            num_classes: Size of the output logits vector.
            hidden_dropout_prob: Written to ``config.hidden_dropout_prob``.
            attention_dropout_prob: Written to ``config.attention_probs_dropout_prob``.
            classifier_dropout: Dropout probability used inside the head.
        """
        super(BERTweetSingleTaskTransformer, self).__init__()

        self.model_name = model_name
        self.num_classes = num_classes

        # Load BERTweet configuration and override its dropout settings
        config = AutoConfig.from_pretrained(model_name)
        config.hidden_dropout_prob = hidden_dropout_prob
        config.attention_probs_dropout_prob = attention_dropout_prob

        # BERTweet encoder
        self.encoder = AutoModel.from_pretrained(model_name, config=config)

        hidden_size = self.encoder.config.hidden_size

        # Classification head optimized for BERTweet
        self.classifier = nn.Sequential(
            nn.Linear(hidden_size, hidden_size),
            nn.GELU(),
            nn.Dropout(classifier_dropout),
            nn.Linear(hidden_size, hidden_size // 2),
            nn.GELU(),
            nn.Dropout(classifier_dropout),
            nn.Linear(hidden_size // 2, num_classes)
        )

        self._init_weights()

    def _init_weights(self):
        """Initialize classification head weights (Xavier-uniform weights, zero biases)."""
        for layer in self.classifier:
            if isinstance(layer, nn.Linear):
                nn.init.xavier_uniform_(layer.weight)
                nn.init.zeros_(layer.bias)

    def forward(self, input_ids, attention_mask):
        """Run the encoder and the head.

        Args:
            input_ids: Token id tensor; cast to ``long`` before being passed on.
            attention_mask: Mask tensor forwarded unchanged to the encoder.

        Returns:
            ``{'logits': tensor}`` with the head's output.
        """
        encoder_outputs = self.encoder(
            input_ids=input_ids.long(),
            attention_mask=attention_mask,
            return_dict=True
        )

        # Hidden state of the first sequence position serves as the pooled vector.
        pooled_output = encoder_outputs.last_hidden_state[:, 0, :]
        logits = self.classifier(pooled_output)

        return {'logits': logits}

    @classmethod
    def from_pretrained(cls, model_path: str, **kwargs):
        """Rebuild a model from a directory holding ``config.json`` and ``pytorch_model.bin``.

        Args:
            model_path: Directory containing the two files above. ``config.json``
                must provide ``model_name`` and ``num_classes``.
            **kwargs: Extra keyword arguments forwarded to the constructor.

        Returns:
            The model with the checkpoint weights loaded (non-strict). Any keys
            that could not be matched are reported on stdout instead of being
            silently ignored.
        """
        # Load saved config
        config_path = os.path.join(model_path, "config.json")
        with open(config_path, 'r') as f:
            config = json.load(f)

        # Initialize model architecture
        model = cls(
            model_name=config["model_name"],
            num_classes=config["num_classes"],
            **kwargs
        )

        # NOTE(security): torch.load unpickles the file; only load checkpoints
        # from a trusted source.
        model_file = os.path.join(model_path, "pytorch_model.bin")
        state_dict = torch.load(model_file, map_location='cpu')

        # Map a leading "bertweet." onto this class's "encoder." attribute.
        # Only the prefix is rewritten; later occurrences in the key are kept.
        old_prefix, new_prefix = "bertweet.", "encoder."
        renamed_state_dict = {
            (new_prefix + key[len(old_prefix):]) if key.startswith(old_prefix) else key: value
            for key, value in state_dict.items()
        }

        load_result = model.load_state_dict(renamed_state_dict, strict=False)

        # strict=False never raises on a mismatch, so surface it explicitly:
        # missing keys keep their freshly initialized values.
        if load_result.missing_keys:
            print(f"WARNING: {len(load_result.missing_keys)} parameter(s) missing from checkpoint, "
                  f"e.g. {load_result.missing_keys[:5]}")
        if load_result.unexpected_keys:
            print(f"WARNING: {len(load_result.unexpected_keys)} checkpoint key(s) not used by the model, "
                  f"e.g. {load_result.unexpected_keys[:5]}")

        return model

In [None]:
class BERTweetMultiTaskTransformer(nn.Module):
    """Shared BERTweet encoder with separate sentiment and emotion heads.

    Each head receives the concatenation of the last-layer hidden state at
    sequence position 0 and the encoder's ``pooler_output`` (so its input
    width is ``2 * hidden_size``).
    """

    def __init__(
        self,
        model_name: str = "vinai/bertweet-base",
        sentiment_num_classes: int = 3,
        emotion_num_classes: int = 6,
        hidden_dropout_prob: float = 0.1,
        attention_dropout_prob: float = 0.1,
        classifier_dropout: float = 0.1
    ):
        """Build the shared encoder and both task heads.

        Args:
            model_name: Model id or path handed to ``AutoConfig`` / ``AutoModel``.
            sentiment_num_classes: Output width of the sentiment head.
            emotion_num_classes: Output width of the emotion head.
            hidden_dropout_prob: Written to ``config.hidden_dropout_prob``.
            attention_dropout_prob: Written to ``config.attention_probs_dropout_prob``.
            classifier_dropout: Dropout probability used inside both heads.
        """
        super(BERTweetMultiTaskTransformer, self).__init__()

        self.model_name = model_name
        self.sentiment_num_classes = sentiment_num_classes
        self.emotion_num_classes = emotion_num_classes

        config = AutoConfig.from_pretrained(model_name)
        config.hidden_dropout_prob = hidden_dropout_prob
        config.attention_probs_dropout_prob = attention_dropout_prob

        # Shared BERTweet encoder
        self.shared_encoder = AutoModel.from_pretrained(model_name, config=config)

        hidden_size = self.shared_encoder.config.hidden_size

        # Sentiment classification head
        self.sentiment_classifier = nn.Sequential(
            nn.Linear(hidden_size * 2, hidden_size),
            nn.ReLU(),
            nn.Dropout(classifier_dropout),
            nn.Linear(hidden_size, sentiment_num_classes)
        )

        # Emotion classification head
        self.emotion_classifier = nn.Sequential(
            nn.Linear(hidden_size * 2, hidden_size),
            nn.ReLU(),
            nn.Dropout(classifier_dropout),
            nn.Linear(hidden_size, emotion_num_classes)
        )

        self._init_weights()

    def _init_weights(self):
        """Xavier-initialize the linear layers of both heads and zero their biases."""
        for classifier in [self.sentiment_classifier, self.emotion_classifier]:
            for layer in classifier:
                if isinstance(layer, nn.Linear):
                    nn.init.xavier_uniform_(layer.weight)
                    nn.init.zeros_(layer.bias)

    def forward(self, input_ids, attention_mask):
        """Encode the batch once and score it with both heads.

        Args:
            input_ids: Token id tensor; cast to ``long`` (as the single-task
                model does) before being passed to the encoder.
            attention_mask: Mask tensor forwarded unchanged to the encoder.

        Returns:
            ``{'sentiment_logits': tensor, 'emotion_logits': tensor}``.
        """
        # Shared encoder
        encoder_outputs = self.shared_encoder(
            input_ids=input_ids.long(),
            attention_mask=attention_mask,
            return_dict=True
        )

        cls_output = encoder_outputs.last_hidden_state[:, 0, :]     # [batch, hidden]
        pooled_output = encoder_outputs.pooler_output               # [batch, hidden]

        combined = torch.cat((cls_output, pooled_output), dim=1)    # [batch, 2 * hidden]

        # Task-specific predictions
        sentiment_logits = self.sentiment_classifier(combined)
        emotion_logits = self.emotion_classifier(combined)

        return {
            'sentiment_logits': sentiment_logits,
            'emotion_logits': emotion_logits
        }

    @classmethod
    def from_pretrained(cls, model_path: str, **kwargs):
        """Rebuild a model from a directory holding ``config.json`` and ``pytorch_model.bin``.

        Args:
            model_path: Directory containing the two files above. ``config.json``
                must provide ``model_name``, ``sentiment_num_classes`` and
                ``emotion_num_classes``.
            **kwargs: Extra keyword arguments forwarded to the constructor.

        Returns:
            The model with the checkpoint weights loaded (non-strict). Any keys
            that could not be matched are reported on stdout instead of being
            silently ignored.
        """
        # Load saved config
        config_path = os.path.join(model_path, "config.json")
        with open(config_path, 'r') as f:
            config = json.load(f)

        # Initialize model with architecture info
        model = cls(
            model_name=config["model_name"],
            sentiment_num_classes=config["sentiment_num_classes"],
            emotion_num_classes=config["emotion_num_classes"],
            **kwargs
        )

        # NOTE(security): torch.load unpickles the file; only load checkpoints
        # from a trusted source.
        model_file = os.path.join(model_path, "pytorch_model.bin")
        state_dict = torch.load(model_file, map_location='cpu')

        # Map a leading "bertweet." onto THIS class's encoder attribute, which
        # is "shared_encoder" (not "encoder"). Renaming to "encoder." would make
        # every encoder key unexpected and, with strict=False, silently dropped.
        old_prefix, new_prefix = "bertweet.", "shared_encoder."
        renamed_state_dict = {
            (new_prefix + key[len(old_prefix):]) if key.startswith(old_prefix) else key: value
            for key, value in state_dict.items()
        }

        load_result = model.load_state_dict(renamed_state_dict, strict=False)

        # strict=False never raises on a mismatch, so surface it explicitly:
        # missing keys keep their freshly initialized values.
        if load_result.missing_keys:
            print(f"WARNING: {len(load_result.missing_keys)} parameter(s) missing from checkpoint, "
                  f"e.g. {load_result.missing_keys[:5]}")
        if load_result.unexpected_keys:
            print(f"WARNING: {len(load_result.unexpected_keys)} checkpoint key(s) not used by the model, "
                  f"e.g. {load_result.unexpected_keys[:5]}")

        return model



# ## Model Loading

In [None]:
def load_single_task_models_by_seeds(base_dir: str, seeds=(42, 43, 44, 45, 46)):
    """Load one single-task checkpoint per seed from ``base_dir``.

    Each seed ``s`` is read from ``<base_dir>/bertweet_sentiment_seed_<s>``,
    which must hold the model files, the tokenizer files and
    ``sentiment_encoder.pkl``.

    Args:
        base_dir: Directory containing the per-seed checkpoint folders.
        seeds: Iterable of seed values to load.

    Returns:
        A list of dicts with keys ``model`` (moved to ``device``, eval mode),
        ``tokenizer``, ``sentiment_encoder``, ``type`` and ``seed``.
    """
    loaded = []
    for seed in seeds:
        checkpoint_dir = os.path.join(base_dir, f"bertweet_sentiment_seed_{seed}")
        print(f"üì• Loading single-task model (seed {seed}) from {checkpoint_dir}")

        network = BERTweetSingleTaskTransformer.from_pretrained(checkpoint_dir)

        tokenizer = AutoTokenizer.from_pretrained(checkpoint_dir)
        # Fall back to the EOS token when the tokenizer defines no pad token.
        if tokenizer.pad_token is None:
            tokenizer.pad_token = tokenizer.eos_token

        label_encoder = joblib.load(os.path.join(checkpoint_dir, 'sentiment_encoder.pkl'))

        loaded.append({
            'model': network.to(device).eval(),
            'tokenizer': tokenizer,
            'sentiment_encoder': label_encoder,
            'type': f'single_task_seed_{seed}',
            'seed': seed,
        })

    print(f"‚úÖ Loaded {len(loaded)} single-task models across seeds")
    return loaded

In [None]:
def load_test_examples(data_path: str = "data/cleaned_reddit_posts.csv", num_examples: int = 10) -> List[str]:
    """Return up to ``num_examples`` usable texts from a CSV or JSON file.

    A text is usable when it is a string whose stripped form is longer than
    10 characters and has at least 5 whitespace-separated words. Rows are
    scanned in file order until enough usable texts are found, so unusable
    rows near the top no longer reduce the number of examples returned.

    Args:
        data_path: Path ending in ``.csv`` (read with pandas, column
            ``text_content``); anything else is parsed as a JSON list of
            objects with a ``text`` key.
        num_examples: Maximum number of texts to return.

    Returns:
        The stripped usable texts, at most ``num_examples`` of them.
    """
    print(f"üìä Loading {num_examples} test examples from {data_path}")

    if data_path.endswith('.csv'):
        df = pd.read_csv(data_path)
        candidates = df['text_content'].tolist()
    else:
        # Handle JSON files if needed
        with open(data_path, 'r', encoding='utf-8') as f:
            data = json.load(f)
        candidates = [item['text'] for item in data]

    # Clean and filter texts, stopping as soon as enough have been collected.
    cleaned_texts = []
    for text in candidates:
        if len(cleaned_texts) >= num_examples:
            break
        if not isinstance(text, str):
            continue  # e.g. NaN from an empty CSV cell
        cleaned_text = text.strip()
        if len(cleaned_text) > 10 and len(cleaned_text.split()) >= 5:  # At least 5 words
            cleaned_texts.append(cleaned_text)

    print(f"‚úÖ Loaded {len(cleaned_texts)} valid test examples")
    return cleaned_texts


# ## IG Generation

In [None]:
def load_test_examples(data_path: str = "data/cleaned_reddit_posts.csv", num_examples: int = 10) -> List[str]:
    """Return up to ``num_examples`` usable texts from a CSV or JSON file.

    A text is usable when it is a string whose stripped form is longer than
    10 characters and has at least 5 whitespace-separated words. Rows are
    scanned in file order until enough usable texts are found, so unusable
    rows near the top no longer reduce the number of examples returned.

    Args:
        data_path: Path ending in ``.csv`` (read with pandas, column
            ``text_content``); anything else is parsed as a JSON list of
            objects with a ``text`` key.
        num_examples: Maximum number of texts to return.

    Returns:
        The stripped usable texts, at most ``num_examples`` of them.
    """
    print(f"üìä Loading {num_examples} test examples from {data_path}")

    if data_path.endswith('.csv'):
        df = pd.read_csv(data_path)
        candidates = df['text_content'].tolist()
    else:
        # Handle JSON files if needed
        with open(data_path, 'r', encoding='utf-8') as f:
            data = json.load(f)
        candidates = [item['text'] for item in data]

    # Clean and filter texts, stopping as soon as enough have been collected.
    cleaned_texts = []
    for text in candidates:
        if len(cleaned_texts) >= num_examples:
            break
        if not isinstance(text, str):
            continue  # e.g. NaN from an empty CSV cell
        cleaned_text = text.strip()
        if len(cleaned_text) > 10 and len(cleaned_text.split()) >= 5:  # At least 5 words
            cleaned_texts.append(cleaned_text)

    print(f"‚úÖ Loaded {len(cleaned_texts)} valid test examples")
    return cleaned_texts


# ## IG Generation

In [None]:
class BERTweetIntegratedGradients:
    """Token-level attribution for the BERTweet classifiers defined in this notebook.

    Attributions are computed in embedding space: token ids are turned into
    word embeddings, the model is run from ``inputs_embeds``, and Captum's
    Integrated Gradients is applied against an all-zeros embedding baseline.
    If IG raises, a plain input-gradient is used; if that also raises, random
    scores are returned for debugging. The method actually used is recorded in
    the result under ``attribution_method`` so callers can tell them apart.
    """

    # Token strings removed from the "clean" token / score lists.
    _SPECIAL_TOKENS = ('<s>', '</s>', '<pad>', '[PAD]', '[CLS]', '[SEP]')

    def __init__(self):
        # NOTE(review): this attribute is not read anywhere in the class (the
        # IG baseline is a zero embedding tensor, not a token id). Whether id 0
        # is really the pad token depends on the tokenizer's vocabulary - confirm.
        self.baseline_token_id = 0  # [PAD] token

    def _create_forward_function(self, model, task='sentiment'):
        """Return ``forward_fn(embeddings, attention_mask=None) -> logits`` for ``model``.

        Multitask models (those with a ``shared_encoder`` attribute) are routed
        to the emotion head when ``task == 'emotion'`` and to the sentiment head
        otherwise; single-task models use ``model.encoder`` / ``model.classifier``.
        """
        def forward_fn(embeddings, attention_mask=None):
            model.eval()
            if hasattr(model, 'shared_encoder'):  # multitask
                enc = model.shared_encoder(inputs_embeds=embeddings, attention_mask=attention_mask, return_dict=True)
                cls_out = enc.last_hidden_state[:, 0, :]
                pooled = enc.pooler_output
                combined = torch.cat((cls_out, pooled), dim=1)
                if task == 'emotion':
                    return model.emotion_classifier(combined)
                return model.sentiment_classifier(combined)
            else:  # single-task
                enc = model.encoder(inputs_embeds=embeddings, attention_mask=attention_mask, return_dict=True)
                pooled = enc.last_hidden_state[:, 0, :]
                return model.classifier(pooled)
        return forward_fn

    def _get_embedding_layer(self, model):
        """Return the word-embedding module of the model's encoder."""
        if hasattr(model, 'shared_encoder'):  # Multitask model
            return model.shared_encoder.embeddings.word_embeddings
        else:  # Single task model
            return model.encoder.embeddings.word_embeddings

    def _compute_attributions(self, model, forward_fn, input_embeddings, attention_mask, target_class, n_steps):
        """Compute per-dimension attributions, falling back when a method fails.

        Returns:
            ``(attributions, convergence_delta, method)`` where ``method`` is
            ``'integrated_gradients'``, ``'simple_gradient'`` or ``'random'``.
        """
        # Try Integrated Gradients with embeddings
        try:
            print("üîÑ Computing Integrated Gradients with embeddings...")

            # Captum only varies the embeddings; the mask is closed over.
            def embedding_forward_fn(embeddings):
                return forward_fn(embeddings, attention_mask)

            ig = IntegratedGradients(embedding_forward_fn)
            attributions, convergence_delta = ig.attribute(
                inputs=input_embeddings,
                baselines=torch.zeros_like(input_embeddings),
                target=target_class,
                n_steps=n_steps,
                return_convergence_delta=True,
                internal_batch_size=16
            )

            print("‚úÖ Integrated Gradients computation succeeded!")
            return attributions, convergence_delta, 'integrated_gradients'

        except Exception as e:
            print(f"‚ùå Integrated Gradients failed: {e}")

        # Fallback: Simple gradient method
        try:
            print("üîÑ Fallback: Simple gradient method...")

            # Enable gradients for a detached copy of the input embeddings
            input_embeddings_grad = input_embeddings.clone().detach().requires_grad_(True)

            logits = forward_fn(input_embeddings_grad, attention_mask)
            target_logit = logits[0, target_class]

            model.zero_grad()
            target_logit.backward()

            print("‚úÖ Simple gradient method succeeded!")
            return input_embeddings_grad.grad, torch.tensor(0.0), 'simple_gradient'

        except Exception as e2:
            print(f"‚ùå All methods failed: {e2}")
            print("üîÑ Using random attributions for debugging...")

            # Random fallback: carries no information about the model.
            return torch.randn_like(input_embeddings), torch.tensor(0.0), 'random'

    def generate_attributions(
        self,
        text: str,
        model_dict: Dict,
        max_length: int = 128,
        n_steps: int = 200,
        force_target_class: Optional[int] = None,
        force_tokenizer: Optional[Any] = None
    ) -> Optional[Dict[str, Any]]:
        """Attribute the model's output for one class to the tokens of ``text``.

        Args:
            text: Input string (a single example).
            model_dict: Dict with at least ``model``, ``tokenizer`` and ``type``.
            max_length: Truncation length passed to the tokenizer.
            n_steps: Number of IG integration steps. The default is 200, the
                value that was previously hard-coded, so callers that do not
                pass it get unchanged results; an explicit value is now honoured.
            force_target_class: Class index to explain; when ``None`` the
                model's own argmax prediction is used.
            force_tokenizer: Tokenizer to use instead of ``model_dict['tokenizer']``.

        Returns:
            A dict with ``text``, ``tokens`` / ``attribution_scores`` (special
            tokens removed), ``raw_tokens`` / ``raw_scores`` (all positions),
            ``predicted_class``, ``confidence``, ``convergence_delta``,
            ``model_type`` and ``attribution_method``; or ``None`` when
            post-processing the attributions fails.
        """
        model = model_dict['model']
        tokenizer = model_dict['tokenizer']

        print(f"üîç Generating IG attributions for {model_dict['type']} model...")

        # Ensure model is in eval mode
        model.eval()

        # Use forced tokenizer if provided, otherwise use model's tokenizer
        active_tokenizer = force_tokenizer if force_tokenizer is not None else tokenizer

        # Tokenize input
        inputs = active_tokenizer(
            text,
            return_tensors="pt",
            truncation=True,
            padding=True,
            max_length=max_length
        )

        input_ids = inputs['input_ids'].to(device)
        attention_mask = inputs['attention_mask'].to(device)

        # Convert input_ids to embeddings
        embedding_layer = self._get_embedding_layer(model)
        input_embeddings = embedding_layer(input_ids)

        # Decide which class to explain. The sentiment head is always used here.
        forward_fn = self._create_forward_function(model, 'sentiment')
        with torch.no_grad():
            temp_outputs = forward_fn(input_embeddings, attention_mask)
            predictions = F.softmax(temp_outputs, dim=-1)

            # Use forced target class if provided, otherwise use model's prediction
            if force_target_class is not None:
                predicted_class = force_target_class
                confidence = predictions[0, predicted_class].item()
                print(f"üéØ Using forced target class: {predicted_class}, Confidence: {confidence:.3f}")
            else:
                predicted_class = torch.argmax(predictions, dim=-1).item()
                confidence = predictions.max().item()
                print(f"üéØ Predicted class: {predicted_class}, Confidence: {confidence:.3f}")

            print(f"üîí Target class locked: {predicted_class} for stability analysis")

        attributions, convergence_delta, method = self._compute_attributions(
            model, forward_fn, input_embeddings, attention_mask, predicted_class, n_steps
        )

        # Process the attribution results
        try:
            # Get tokens using the active tokenizer
            tokens = active_tokenizer.convert_ids_to_tokens(input_ids[0])

            # Sum attribution scores across embedding dimensions
            if attributions.dim() == 3:
                attribution_scores = attributions.sum(dim=-1).squeeze().cpu().detach().numpy()
            else:
                attribution_scores = attributions.squeeze().cpu().detach().numpy()

            # A one-token sequence squeezes to a scalar; restore the 1-D shape.
            attribution_scores = np.atleast_1d(attribution_scores)

            # Align scores with tokens
            if len(attribution_scores) != len(tokens):
                print(f"‚ö†Ô∏è Score length ({len(attribution_scores)}) != token length ({len(tokens)})")
                if len(attribution_scores) < len(tokens):
                    # Pad with zeros
                    padded_scores = np.zeros(len(tokens))
                    padded_scores[:len(attribution_scores)] = attribution_scores
                    attribution_scores = padded_scores
                else:
                    # Truncate
                    attribution_scores = attribution_scores[:len(tokens)]

            # Clean tokens (remove special tokens for visualization)
            clean_tokens = []
            clean_scores = []
            for token, score in zip(tokens, attribution_scores):
                if token not in self._SPECIAL_TOKENS:
                    clean_tokens.append(token)
                    clean_scores.append(float(score))

            if len(clean_tokens) == 0:
                print("‚ö†Ô∏è No clean tokens found, using all tokens")
                clean_tokens = [str(token) for token in tokens]
                clean_scores = [float(score) for score in attribution_scores]

            result = {
                'text': text,
                'tokens': clean_tokens,
                'attribution_scores': clean_scores,
                'predicted_class': predicted_class,
                'confidence': confidence,
                'convergence_delta': float(convergence_delta.item()) if hasattr(convergence_delta, 'item') else 0.0,
                'model_type': model_dict['type'],
                'raw_tokens': [str(token) for token in tokens],
                'raw_scores': [float(score) for score in attribution_scores],
                # Lets callers discard 'random' (or 'simple_gradient') results.
                'attribution_method': method
            }

            print(f"‚úÖ Generated attributions for {len(clean_tokens)} tokens")
            return result

        except Exception as e:
            print(f"‚ùå Error processing attribution results: {e}")
            import traceback
            traceback.print_exc()
            return None

In [None]:
def generate_single_task_explanations(texts: List[str], ref_model_dict: Dict) -> List[Dict]:
    """Run the IG explainer over every text with one reference model.

    Args:
        texts: Input strings to explain.
        ref_model_dict: Model dict passed to ``generate_attributions`` for each text.

    Returns:
        The truthy attribution results, in input order; texts whose
        explanation came back falsy are left out.
    """
    explainer = BERTweetIntegratedGradients()
    explanations = []

    for position, sample in enumerate(texts, start=1):
        print(f"\nüìù Processing text {position}/{len(texts)}")
        attribution = explainer.generate_attributions(sample, ref_model_dict)
        if not attribution:
            continue
        explanations.append(attribution)

    print(f"‚úÖ Generated explanations for {len(explanations)} examples (single-task, seed {ref_model_dict.get('seed')})")
    return explanations


# ## Eval Metrics

In [None]:
def generate_single_task_explanations(texts: List[str], ref_model_dict: Dict) -> List[Dict]:
    """Explain each text with a single reference model and collect the results.

    Args:
        texts: Input strings to explain.
        ref_model_dict: Model dict handed to ``generate_attributions`` unchanged.

    Returns:
        A list of the attribution results that were truthy, in input order.
    """
    explainer = BERTweetIntegratedGradients()
    collected = []
    index = 0
    while index < len(texts):
        print(f"\nüìù Processing text {index + 1}/{len(texts)}")
        outcome = explainer.generate_attributions(texts[index], ref_model_dict)
        # Falsy outcomes (e.g. None) are skipped rather than stored.
        if outcome:
            collected.append(outcome)
        index += 1
    print(f"‚úÖ Generated explanations for {len(collected)} examples (single-task, seed {ref_model_dict.get('seed')})")
    return collected


# ## Eval Metrics

In [None]:
def evaluate_faithfulness(
    text: str,
    model_dict: Dict,
    attribution_result: Dict,
    top_k_ratios: List[float] = [0.1, 0.2, 0.3, 0.5]
) -> Dict[str, float]:
    """Measure how much the target-class probability drops when top-attributed tokens are masked.

    For every ratio, the positions with the largest positive attribution
    (absolute values when nothing is positive) are overwritten with the
    tokenizer's mask token id (pad token id when no mask token exists) and the
    model is re-run on the modified ids.

    Args:
        text: The input string that was explained.
        model_dict: Dict with ``model`` and ``tokenizer``.
        attribution_result: Result dict providing ``predicted_class``,
            ``raw_tokens`` and ``raw_scores``.
        top_k_ratios: Fractions of token positions to mask. Read only; never mutated.

    Returns:
        ``{'faithfulness_top_<ratio>': original_prob - masked_prob}`` per ratio;
        a ratio whose evaluation raises is recorded as ``0.0``.
    """
    print("üìä Evaluating faithfulness...")

    model = model_dict['model']
    tokenizer = model_dict['tokenizer']

    # Get original prediction
    inputs = tokenizer(text, return_tensors="pt", truncation=True, padding=True, max_length=128)
    input_ids = inputs['input_ids'].to(device)
    attention_mask = inputs['attention_mask'].to(device)

    # Multitask models expose the sentiment head under a different key.
    logits_key = 'sentiment_logits' if hasattr(model, 'shared_encoder') else 'logits'

    def _class_probabilities(ids):
        """Softmax probabilities of the model for the given token ids."""
        with torch.no_grad():
            outputs = model(input_ids=ids, attention_mask=attention_mask)
            return F.softmax(outputs[logits_key], dim=-1)

    original_probs = _class_probabilities(input_ids)

    # Get the reference class from attribution result (should be the same across seeds)
    reference_class = attribution_result['predicted_class']
    original_confidence = original_probs[0, reference_class].item()

    print(f"üîí Faithfulness: measuring confidence for class {reference_class}")
    print(f"üìä Original confidence: {original_confidence:.4f}")

    faithfulness_scores = {}

    # Get attribution scores and tokens
    # NOTE(review): raw_tokens / raw_scores cover every position, so special
    # tokens can be selected for masking - confirm that this is intended.
    tokens = attribution_result['raw_tokens']
    scores = attribution_result['raw_scores']

    # Use MASK token if available, fallback to PAD token. Compare against None
    # explicitly: a token id of 0 is valid and must not trigger the fallback.
    mask_id = getattr(tokenizer, "mask_token_id", None)
    if mask_id is None:
        mask_id = tokenizer.pad_token_id

    # The ranking does not depend on the ratio, so it is computed once.
    # Keep only positive contributions to the locked target class ...
    pos_scores = np.array(scores).copy()
    pos_scores[pos_scores < 0] = 0.0
    # ... unless there are none, in which case rank by magnitude instead.
    if np.all(pos_scores == 0):
        pos_scores = np.abs(np.array(scores))
    ranked_indices = np.argsort(pos_scores)

    for ratio in top_k_ratios:
        try:
            # Calculate how many tokens to remove (always at least one)
            num_tokens_to_remove = max(1, int(len(tokens) * ratio))

            # Get indices of top-k most important tokens
            top_indices = ranked_indices[-num_tokens_to_remove:]

            # Create modified input by masking top tokens with MASK token
            modified_input_ids = input_ids.clone()
            for idx in top_indices:
                if idx < modified_input_ids.shape[1]:
                    modified_input_ids[0, idx] = mask_id

            # Always measure the SAME class probability (reference class)
            modified_probs = _class_probabilities(modified_input_ids)
            modified_confidence = modified_probs[0, reference_class].item()

            # Calculate faithfulness as confidence drop for the SAME class
            confidence_drop = original_confidence - modified_confidence
            faithfulness_scores[f'faithfulness_top_{ratio}'] = confidence_drop

            print(f"üìä Ratio {ratio}: {num_tokens_to_remove} tokens masked, confidence: {modified_confidence:.4f} ‚Üí {confidence_drop:.4f}")

        except Exception as e:
            print(f"‚ö†Ô∏è Error in faithfulness evaluation for ratio {ratio}: {e}")
            faithfulness_scores[f'faithfulness_top_{ratio}'] = 0.0

    return faithfulness_scores

In [None]:
def evaluate_stability(
    text: str,
    model_dict: Dict,
    attribution_result: Dict,
    num_perturbations: int = 5
) -> Dict[str, float]:
    """Compare the original attribution scores with those of perturbed versions of ``text``.

    Each perturbed text is explained for the SAME target class as the original
    attribution (when ``attribution_result`` carries ``predicted_class``), so
    the compared score vectors refer to one class. Vectors are aligned by
    truncating both to their common prefix length.

    Args:
        text: Original input string.
        model_dict: Model dict passed to ``generate_attributions``.
        attribution_result: Result dict providing ``attribution_scores`` and,
            optionally, ``predicted_class``.
        num_perturbations: Number of perturbed texts to generate.

    Returns:
        ``stability_cosine`` and ``stability_correlation`` (means over valid
        perturbations, ``0.0`` when none) and ``num_valid_perturbations``.
        All three keys are present on every return path.
    """
    print("üìä Evaluating stability...")

    ig_explainer = BERTweetIntegratedGradients()
    original_scores = np.array(attribution_result['attribution_scores'])
    # None keeps generate_attributions' own behaviour (use the model's prediction).
    target_class = attribution_result.get('predicted_class')

    perturbed_scores = []

    for i in range(num_perturbations):
        try:
            # Create perturbed text
            # NOTE(review): create_text_perturbation is defined outside this
            # block; presumably it returns a modified copy of the text.
            perturbed_text = create_text_perturbation(text)

            # Generate attributions for perturbed text, locked to the original class
            perturbed_result = ig_explainer.generate_attributions(
                perturbed_text, model_dict, force_target_class=target_class
            )

            if perturbed_result and len(perturbed_result['attribution_scores']) > 0:
                # Truncate to the length shared with the original scores
                perturbed_score = np.array(perturbed_result['attribution_scores'])
                min_len = min(len(original_scores), len(perturbed_score))

                if min_len > 0:
                    perturbed_scores.append(perturbed_score[:min_len])

        except Exception as e:
            print(f"‚ö†Ô∏è Error generating perturbation {i}: {e}")
            continue

    if not perturbed_scores:
        return {
            'stability_cosine': 0.0,
            'stability_correlation': 0.0,
            'num_valid_perturbations': 0
        }

    # Calculate stability metrics
    cosine_similarities = []
    correlations = []

    for pert_scores in perturbed_scores:
        min_len = min(len(original_scores), len(pert_scores))
        if min_len > 1:
            orig_aligned = original_scores[:min_len]
            pert_aligned = pert_scores[:min_len]

            # Cosine similarity (undefined for a zero vector, so skip those)
            if np.linalg.norm(orig_aligned) > 0 and np.linalg.norm(pert_aligned) > 0:
                cos_sim = cosine_similarity([orig_aligned], [pert_aligned])[0, 0]
                cosine_similarities.append(cos_sim)

            # Correlation (undefined for a constant vector, so skip those)
            if len(set(orig_aligned)) > 1 and len(set(pert_aligned)) > 1:
                corr = np.corrcoef(orig_aligned, pert_aligned)[0, 1]
                if not np.isnan(corr):
                    correlations.append(corr)

    # Average stability scores, returned as plain Python floats
    avg_cosine = float(np.mean(cosine_similarities)) if cosine_similarities else 0.0
    avg_correlation = float(np.mean(correlations)) if correlations else 0.0

    return {
        'stability_cosine': avg_cosine,
        'stability_correlation': avg_correlation,
        'num_valid_perturbations': len(perturbed_scores)
    }


def _standardize(v: np.ndarray) -> np.ndarray:
    """Standardize vector to remove scale/offset differences across seeds"""
    v = v.astype(np.float32)
    mu, sd = v.mean(), v.std()
    return (v - mu) / (sd + 1e-8)

def evaluate_stability_across_seeds(text: str, seed_model_dicts: List[Dict], ig_explainer=None):
    """Evaluate stability across different seed models for the same text.

    The first model supplies the reference target class and tokenizer; every
    other model is explained for that same class with that same tokenizer.
    Score vectors are then compared pairwise on their common prefix after
    standardization.

    Args:
        text: Input string to explain.
        seed_model_dicts: Model dicts (each with ``seed`` and ``tokenizer``);
            an empty list yields the all-zero result instead of raising.
        ig_explainer: Explainer exposing ``generate_attributions``; a
            ``BERTweetIntegratedGradients`` is created when omitted.

    Returns:
        ``stability_cosine`` and ``stability_correlation`` (means over usable
        pairs, ``0.0`` when none) and ``num_seed_pairs`` (pairs that produced
        a cosine value).
    """
    print("üìä Evaluating stability across seeds...")

    empty_result = {'stability_cosine': 0.0, 'stability_correlation': 0.0, 'num_seed_pairs': 0}

    # Nothing to compare (and no reference model to index) without models.
    if not seed_model_dicts:
        return empty_result

    if ig_explainer is None:
        ig_explainer = BERTweetIntegratedGradients()

    # 1) Get reference attribution + class with the first seed
    ref_md = seed_model_dicts[0]
    ref = ig_explainer.generate_attributions(text, ref_md)
    if not ref:
        return empty_result

    ref_class = int(ref['predicted_class'])
    ref_scores = np.array(ref['attribution_scores'])

    # Store reference tokenization for consistency
    ref_tokenizer = ref_md['tokenizer']

    print(f"üîí Reference class: {ref_class}, using tokenizer from seed {ref_md['seed']}")

    # 2) For all seeds, recompute IG FOR THE SAME TARGET CLASS
    seed_attr = [(ref_md['seed'], ref_scores)]
    for md in seed_model_dicts[1:]:
        res = ig_explainer.generate_attributions(
            text, md,
            force_target_class=ref_class,
            force_tokenizer=ref_tokenizer
        )
        if res and len(res['attribution_scores']) > 0:
            seed_attr.append((md['seed'], np.array(res['attribution_scores'])))
            print(f"‚úÖ Seed {md['seed']}: computed IG for target class {ref_class}")
        else:
            print(f"‚ùå Seed {md['seed']}: failed to compute IG")

    if len(seed_attr) < 2:
        return empty_result

    # 3) Pairwise similarities on same-length prefix
    cos_sims, cors = [], []
    for (_, scores_a), (_, scores_b) in combinations(seed_attr, 2):
        common_len = min(len(scores_a), len(scores_b))
        if common_len <= 1:
            continue

        # Standardize vectors before computing similarity. Both become
        # zero-mean, so cosine and Pearson are expected to be nearly equal.
        vec_a = _standardize(scores_a[:common_len])
        vec_b = _standardize(scores_b[:common_len])

        # Cosine similarity
        norm_a, norm_b = np.linalg.norm(vec_a), np.linalg.norm(vec_b)
        if norm_a > 0 and norm_b > 0:
            cos_sims.append((vec_a @ vec_b) / (norm_a * norm_b))

        # Pearson correlation
        if vec_a.std() > 0 and vec_b.std() > 0:
            cors.append(np.corrcoef(vec_a, vec_b)[0, 1])

    return {
        'stability_cosine': float(np.mean(cos_sims)) if cos_sims else 0.0,
        'stability_correlation': float(np.mean(cors)) if cors else 0.0,
        'num_seed_pairs': len(cos_sims)
    }

In [None]:
def evaluate_stability(
    text: str,
    model_dict: Dict,
    attribution_result: Dict,
    num_perturbations: int = 5
) -> Dict[str, float]:
    """Measure how stable attributions are under small perturbations of the text.

    The text is perturbed ``num_perturbations`` times with
    ``create_text_perturbation``. Attributions are regenerated for each
    perturbed text and compared with the original attribution vector on their
    common-length prefix.

    Args:
        text: Original input text.
        model_dict: Model bundle, passed unchanged to ``generate_attributions``.
        attribution_result: Attribution result for the original text; only its
            ``'attribution_scores'`` entry is read here.
        num_perturbations: Number of perturbed variants to attempt.

    Returns:
        Dict with ``'stability_cosine'`` and ``'stability_correlation'`` (means
        over the perturbations for which each metric is defined, 0.0 if none)
        and ``'num_valid_perturbations'``. The same three keys are present on
        every return path so the result can be merged into tabular rows.
    """
    print("üìä Evaluating stability...")

    ig_explainer = BERTweetIntegratedGradients()
    original_scores = np.array(attribution_result['attribution_scores'])

    # NOTE(review): the perturbed text is explained for whatever class the
    # explainer picks by default, not necessarily the class of the original
    # prediction - confirm this is intended.
    perturbed_scores = []
    for i in range(num_perturbations):
        try:
            perturbed_text = create_text_perturbation(text)
            perturbed_result = ig_explainer.generate_attributions(perturbed_text, model_dict)

            if perturbed_result and len(perturbed_result['attribution_scores']) > 0:
                perturbed_score = np.array(perturbed_result['attribution_scores'])
                # Vectors are aligned by truncating to the shared prefix length
                min_len = min(len(original_scores), len(perturbed_score))
                if min_len > 0:
                    perturbed_scores.append(perturbed_score[:min_len])

        except Exception as e:
            # Best effort: one failed perturbation must not abort the evaluation
            print(f"‚ö†Ô∏è Error generating perturbation {i}: {e}")
            continue

    if not perturbed_scores:
        return {
            'stability_cosine': 0.0,
            'stability_correlation': 0.0,
            'num_valid_perturbations': 0
        }

    cosine_similarities = []
    correlations = []

    for pert_aligned in perturbed_scores:
        # Each stored vector was already truncated to at most len(original_scores)
        min_len = len(pert_aligned)
        if min_len <= 1:
            continue
        orig_aligned = original_scores[:min_len]

        # Cosine similarity is undefined for all-zero vectors
        if np.linalg.norm(orig_aligned) > 0 and np.linalg.norm(pert_aligned) > 0:
            cosine_similarities.append(cosine_similarity([orig_aligned], [pert_aligned])[0, 0])

        # Pearson correlation needs some variation in both vectors
        if len(set(orig_aligned)) > 1 and len(set(pert_aligned)) > 1:
            corr = np.corrcoef(orig_aligned, pert_aligned)[0, 1]
            if not np.isnan(corr):
                correlations.append(corr)

    return {
        'stability_cosine': float(np.mean(cosine_similarities)) if cosine_similarities else 0.0,
        'stability_correlation': float(np.mean(correlations)) if correlations else 0.0,
        'num_valid_perturbations': len(perturbed_scores)
    }


def _standardize(v: np.ndarray) -> np.ndarray:
    """Standardize vector to remove scale/offset differences across seeds"""
    v = v.astype(np.float32)
    mu, sd = v.mean(), v.std()
    return (v - mu) / (sd + 1e-8)

def evaluate_stability_across_seeds(text: str, seed_model_dicts: List[Dict], ig_explainer=None):
    """Evaluate stability across different seed models for the same text.

    The first entry of ``seed_model_dicts`` is the reference: its predicted
    class and its tokenizer are forced onto every other seed so that all
    attribution vectors explain the same class over the same tokenization.

    Args:
        text: Input text to explain.
        seed_model_dicts: Model bundles, one per seed. Each is read for its
            ``'seed'`` entry; the first one is also read for ``'tokenizer'``.
        ig_explainer: Explainer exposing ``generate_attributions``; a
            ``BERTweetIntegratedGradients`` is created when omitted.

    Returns:
        Dict with ``'stability_cosine'``, ``'stability_correlation'`` (means
        over seed pairs) and ``'num_seed_pairs'``. All three are zero when
        fewer than two attribution vectors are available, including when
        ``seed_model_dicts`` is empty.
    """
    print("üìä Evaluating stability across seeds...")
    if ig_explainer is None:
        ig_explainer = BERTweetIntegratedGradients()

    empty_result = {'stability_cosine': 0.0, 'stability_correlation': 0.0, 'num_seed_pairs': 0}

    # Without any model there is no reference seed to index
    if not seed_model_dicts:
        return empty_result

    # 1) Get reference attribution + class with the first seed
    ref_md = seed_model_dicts[0]
    ref = ig_explainer.generate_attributions(text, ref_md)
    if not ref:
        return empty_result

    ref_class = int(ref['predicted_class'])
    ref_scores = np.array(ref['attribution_scores'])

    # Store reference tokenization for consistency
    ref_tokenizer = ref_md['tokenizer']

    print(f"üîí Reference class: {ref_class}, using tokenizer from seed {ref_md['seed']}")

    # 2) For all remaining seeds, recompute IG FOR THE SAME TARGET CLASS
    seed_attr = [(ref_md['seed'], ref_scores)]
    for md in seed_model_dicts[1:]:
        res = ig_explainer.generate_attributions(
            text, md,
            force_target_class=ref_class,
            force_tokenizer=ref_tokenizer
        )
        if res and len(res['attribution_scores']) > 0:
            seed_attr.append((md['seed'], np.array(res['attribution_scores'])))
            print(f"‚úÖ Seed {md['seed']}: computed IG for target class {ref_class}")
        else:
            print(f"‚ùå Seed {md['seed']}: failed to compute IG")

    if len(seed_attr) < 2:
        return empty_result

    # 3) Pairwise similarities on same-length prefix
    cos_sims, cors = [], []
    for (_, a), (_, b) in combinations(seed_attr, 2):
        common_len = min(len(a), len(b))
        if common_len <= 1:
            continue
        # Standardize vectors before computing similarity
        A = _standardize(a[:common_len])
        B = _standardize(b[:common_len])
        # Cosine similarity (skipped when a vector standardizes to all zeros)
        na, nb = np.linalg.norm(A), np.linalg.norm(B)
        if na > 0 and nb > 0:
            cos_sims.append((A @ B) / (na * nb))
        # Pearson correlation; a NaN would poison the mean, so drop it
        if A.std() > 0 and B.std() > 0:
            corr = np.corrcoef(A, B)[0, 1]
            if not np.isnan(corr):
                cors.append(corr)

    return {
        'stability_cosine': float(np.mean(cos_sims)) if cos_sims else 0.0,
        'stability_correlation': float(np.mean(cors)) if cors else 0.0,
        'num_seed_pairs': len(cos_sims)
    }

In [None]:
def create_text_perturbation(text: str) -> str:
    """Return a lightly perturbed variant of ``text``.

    One of three perturbations is picked at random:

    * ``'synonym'``: replace one randomly chosen word with a WordNet synonym
      (the text is returned re-joined but otherwise unchanged if none is found).
    * ``'punctuation'``: append a final ``'.'`` or strip trailing punctuation.
    * ``'order'``: swap two adjacent words.

    Texts with fewer than two whitespace-separated words are returned as is.
    Randomness comes from the global ``random`` module state.
    """
    words = text.split()

    if len(words) < 2:
        return text

    perturbation_type = random.choice(['synonym', 'punctuation', 'order'])

    if perturbation_type == 'synonym':
        # Replace one word with a synonym
        word_idx = random.randint(0, len(words) - 1)
        original_word = words[word_idx].lower().strip('.,!?;')

        synonyms = []
        try:
            for syn in wordnet.synsets(original_word):
                for lemma in syn.lemmas():
                    # Multi-word lemmas contain '_' and are skipped
                    if lemma.name() != original_word and '_' not in lemma.name():
                        synonyms.append(lemma.name())
        except Exception:
            # Best effort: a failed lookup leaves the word as it is.
            # Unlike a bare `except`, this lets KeyboardInterrupt/SystemExit through.
            synonyms = []

        if synonyms:
            words[word_idx] = random.choice(synonyms)

    elif perturbation_type == 'punctuation':
        # Add/remove punctuation
        if random.choice([True, False]) and not text.endswith('.'):
            return text + '.'
        return text.rstrip('.,!?;')

    elif perturbation_type == 'order':
        # Swap two adjacent words. len(words) >= 2 is guaranteed by the early
        # return above, so two-word texts are swapped as well.
        idx = random.randint(0, len(words) - 2)
        words[idx], words[idx + 1] = words[idx + 1], words[idx]

    return ' '.join(words)

In [None]:
def evaluate_fairness(attribution_result: Dict) -> Dict[str, float]:
    """Compute simple fairness indicators from one attribution result.

    Tokens are bucketed into emotion words, demographic ("bias") words and
    everything else, using the fixed word lists below, and the mean absolute
    attribution of each bucket is compared with the "other" bucket.

    Args:
        attribution_result: Dict providing ``'tokens'`` and
            ``'attribution_scores'`` (parallel sequences).

    Returns:
        Dict with:
            ``'emotion_bias_ratio'``: mean |attribution| of emotion words over
                that of other tokens (0.0 if either bucket is empty).
            ``'demographic_bias_ratio'``: the same ratio for demographic words.
            ``'attribution_concentration'``: Gini-style concentration of the
                absolute attributions (0.0 for fewer than two scores or when
                every attribution is zero).
    """
    print("üìä Evaluating fairness...")

    # Sensitive word categories (sets: only membership is tested)
    emotion_words = {'happy', 'sad', 'angry', 'excited', 'disappointed', 'frustrated',
                     'joy', 'fear', 'love', 'hate', 'good', 'bad', 'terrible', 'amazing'}

    bias_words = {'he', 'she', 'his', 'her', 'him', 'man', 'woman', 'male', 'female',
                  'guy', 'girl', 'boy', 'dude', 'lady'}

    # U+2581 is the word-boundary marker some subword tokenizers prepend to
    # tokens. It is written as an escape so the literal cannot be corrupted by
    # an encoding round-trip of the notebook.
    tokens = [token.lower().strip('\u2581') for token in attribution_result['tokens']]
    scores = attribution_result['attribution_scores']

    emotion_attributions = []
    bias_attributions = []
    other_attributions = []

    for token, score in zip(tokens, scores):
        clean_token = token.strip('.,!?;')
        magnitude = abs(score)

        if clean_token in emotion_words:
            emotion_attributions.append(magnitude)
        elif clean_token in bias_words:
            bias_attributions.append(magnitude)
        else:
            other_attributions.append(magnitude)

    fairness_metrics = {}

    # Mean of the reference bucket; the epsilon below avoids dividing by zero
    other_mean = np.mean(other_attributions) if other_attributions else None

    # Emotion word focus
    if emotion_attributions and other_mean is not None:
        fairness_metrics['emotion_bias_ratio'] = float(
            np.mean(emotion_attributions) / (other_mean + 1e-8))
    else:
        fairness_metrics['emotion_bias_ratio'] = 0.0

    # Gender/demographic bias
    if bias_attributions and other_mean is not None:
        fairness_metrics['demographic_bias_ratio'] = float(
            np.mean(bias_attributions) / (other_mean + 1e-8))
    else:
        fairness_metrics['demographic_bias_ratio'] = 0.0

    # Attribution concentration (Gini coefficient approximation)
    concentration = 0.0
    if len(scores) > 1:
        sorted_scores = np.sort(np.abs(scores))
        n = len(sorted_scores)
        total = np.sum(sorted_scores)
        # All-zero attributions would give 0/0 = NaN; report no concentration
        if total > 0:
            weighted = np.sum(np.arange(1, n + 1) * sorted_scores)
            concentration = float((2 * weighted) / (n * total) - (n + 1) / n)
    fairness_metrics['attribution_concentration'] = concentration

    return fairness_metrics

In [None]:
def evaluate_single_task_explanations_across_seeds(explanations: List[Dict], seed_model_dicts: List[Dict]) -> List[Dict]:
    """Score each single-task explanation and return one flat record per text.

    Faithfulness is evaluated against the reference model (the first entry of
    ``seed_model_dicts``), fairness on the explanation itself, and stability
    across all seed models. Each record holds the text, prediction metadata
    and the merged metric dicts.
    """
    print("üî¨ Evaluating single-task explanations across seeds...")
    reference_model = seed_model_dicts[0]  # first seed acts as the reference

    def _build_row(explanation: Dict) -> Dict:
        """Run the three evaluations for one explanation and merge the results."""
        sample_text = explanation['text']
        faithfulness = evaluate_faithfulness(sample_text, reference_model, explanation)
        stability = evaluate_stability_across_seeds(sample_text, seed_model_dicts)
        fairness = evaluate_fairness(explanation)

        row = {
            'text': sample_text,
            'predicted_class': explanation['predicted_class'],
            'confidence': explanation['confidence'],
            'convergence_delta': explanation['convergence_delta'],
        }
        # Later metric dicts overwrite earlier keys, as with ** unpacking
        for metrics in (faithfulness, stability, fairness):
            row.update(metrics)
        return row

    return [_build_row(explanation) for explanation in explanations]


# ## Visualisation

In [None]:
def visualize_attributions(attribution_result: Dict, save_path: Optional[str] = None):
    """
    Enhanced attribution visualization with multiple plot types.

    Draws a 2x2 figure:
      1. per-token bars (absolute normalized score, coloured by signed score),
      2. signed attributions sorted by magnitude,
      3. cumulative share of absolute attribution,
      4. absolute attribution versus importance rank.

    Args:
        attribution_result: Dict providing 'tokens', 'attribution_scores',
            'model_type', 'predicted_class' and 'confidence'.
        save_path: If given, the figure is also saved to this path at 300 dpi.

    Returns:
        None. Nothing is drawn when there are no tokens or scores.
    """
    tokens = attribution_result['tokens']
    scores = attribution_result['attribution_scores']

    # min()/max() and zip(*pairs) below cannot handle empty input
    if len(tokens) == 0 or len(scores) == 0:
        print("No attribution scores to visualize")
        return

    model_type = attribution_result['model_type']

    # Create figure with subplots
    fig, ((ax1, ax2), (ax3, ax4)) = plt.subplots(2, 2, figsize=(20, 12))

    # Plot 1: Original bar plot
    abs_max = max(abs(min(scores)), abs(max(scores)))
    normalized_scores = [score / abs_max for score in scores] if abs_max > 0 else scores
    # Map the signed range [-1, 1] onto the colormap's [0, 1] domain
    colors = plt.cm.RdYlBu_r([(score + 1) / 2 for score in normalized_scores])

    ax1.bar(range(len(tokens)), [abs(score) for score in normalized_scores],
            color=colors, alpha=0.8)

    ax1.set_xticks(range(len(tokens)))
    ax1.set_xticklabels(tokens, rotation=45, ha='right')
    ax1.set_ylabel('Attribution Score (Absolute)')
    ax1.set_title(f'Token Attributions - {model_type.replace("_", " ").title()}\n'
                f'Class: {attribution_result["predicted_class"]} (Conf: {attribution_result["confidence"]:.3f})')

    # Add color bar
    sm = plt.cm.ScalarMappable(cmap=plt.cm.RdYlBu_r,
                              norm=plt.Normalize(vmin=-abs_max, vmax=abs_max))
    sm.set_array([])
    cbar = plt.colorbar(sm, ax=ax1)
    cbar.set_label('Attribution Score')

    # Plot 2: Sorted attribution scores
    token_score_pairs = sorted(zip(tokens, scores), key=lambda x: abs(x[1]), reverse=True)
    sorted_tokens, sorted_scores = zip(*token_score_pairs)
    positions = range(len(sorted_tokens))
    abs_sorted_scores = [abs(score) for score in sorted_scores]

    colors_sorted = ['red' if score < 0 else 'green' for score in sorted_scores]
    ax2.bar(positions, sorted_scores, color=colors_sorted, alpha=0.7)
    ax2.set_xticks(positions)
    ax2.set_xticklabels(sorted_tokens, rotation=45, ha='right')
    ax2.set_ylabel('Attribution Score')
    ax2.set_title('Sorted Token Attributions')
    ax2.grid(True, alpha=0.3)
    ax2.axhline(y=0, color='black', linestyle='-', alpha=0.5)

    # Plot 3: Cumulative attribution
    cumulative_scores = np.cumsum(abs_sorted_scores)
    total_attribution = cumulative_scores[-1]
    cumulative_percentage = cumulative_scores / total_attribution * 100 if total_attribution > 0 else cumulative_scores

    ax3.plot(positions, cumulative_percentage, 'b-o', linewidth=2, markersize=4)
    ax3.fill_between(positions, cumulative_percentage, alpha=0.3, color='blue')
    ax3.set_xticks(positions)
    ax3.set_xticklabels(sorted_tokens, rotation=45, ha='right')
    ax3.set_ylabel('Cumulative Attribution (%)')
    ax3.set_title('Cumulative Attribution Impact')
    ax3.grid(True, alpha=0.3)
    ax3.axhline(y=50, color='red', linestyle='--', alpha=0.7, label='50% threshold')
    ax3.axhline(y=80, color='orange', linestyle='--', alpha=0.7, label='80% threshold')
    ax3.legend()

    # Plot 4: Token importance ranking
    importance_ranks = [i + 1 for i in positions]
    ax4.scatter(importance_ranks, abs_sorted_scores,
               c=abs_sorted_scores, cmap='viridis', s=100, alpha=0.7)
    ax4.set_xlabel('Importance Rank')
    ax4.set_ylabel('Absolute Attribution Score')
    ax4.set_title('Token Importance Ranking')
    ax4.grid(True, alpha=0.3)

    plt.tight_layout()

    if save_path:
        plt.savefig(save_path, dpi=300, bbox_inches='tight')
        print(f"üíæ Saved enhanced visualization to {save_path}")

    plt.show()
    # Release the figure: this function is called once per example, and
    # unclosed figures accumulate in memory on non-inline backends.
    plt.close(fig)


def generate_comprehensive_visualizations(attribution_result: Dict, save_dir: str = "explainability_results"):
    """
    Generate all visualization types for a given attribution result.

    Creates ``save_dir`` if needed, then renders the token heatmap, the
    attribution distribution and the multi-panel attribution figure, each
    saved under a file name derived from the first 30 characters of the text.

    Args:
        attribution_result: Attribution result, forwarded to the three plotting
            functions; its optional 'text' entry is used for the file names.
        save_dir: Directory the figures are written to.

    Returns:
        Dict mapping 'heatmap', 'distribution' and 'attributions' to the file
        paths passed to the plotting functions.
    """
    os.makedirs(save_dir, exist_ok=True)

    # Build a file-system-safe stem: anything other than letters, digits, '-'
    # and '_' (spaces, '/', ':', '?', newlines, ...) becomes '_'. Raw text could
    # otherwise point into a non-existent sub-directory or be an invalid name.
    snippet = attribution_result.get('text', 'unknown')[:30]
    safe_snippet = ''.join(ch if (ch.isalnum() or ch in '-_') else '_' for ch in snippet)
    base_filename = f"example_{safe_snippet}"

    # 1. Token heatmap
    heatmap_path = os.path.join(save_dir, f"{base_filename}_heatmap.png")
    visualize_token_heatmap(attribution_result, heatmap_path)

    # 2. Attribution distribution
    dist_path = os.path.join(save_dir, f"{base_filename}_distribution.png")
    visualize_attribution_distribution(attribution_result, dist_path)

    # 3. Enhanced attributions (original function)
    attr_path = os.path.join(save_dir, f"{base_filename}_attributions.png")
    visualize_attributions(attribution_result, attr_path)

    print(f"‚úÖ Generated comprehensive visualizations for: {base_filename}")
    return {
        'heatmap': heatmap_path,
        'distribution': dist_path,
        'attributions': attr_path
    }


def visualize_token_heatmap(attribution_result: Dict, save_path: Optional[str] = None):
    """
    1. Token Attribute Heatmap
    Display the tokens in reading order, each highlighted by importance.
    Color code from red (negative influence) to green (positive influence).

    Args:
        attribution_result: Dict providing 'tokens', 'attribution_scores',
            'model_type', 'predicted_class' and 'confidence'.
        save_path: If given, the figure is also saved to this path at 300 dpi.

    Returns:
        None. Nothing is drawn when there are no tokens or scores.
    """
    tokens = attribution_result['tokens']
    scores = attribution_result['attribution_scores']

    # min()/max() below cannot handle empty input
    if len(tokens) == 0 or len(scores) == 0:
        print("No attribution scores to visualize")
        return

    model_type = attribution_result['model_type']

    # Create figure with larger size for better readability
    fig, ax = plt.subplots(figsize=(16, 6))

    # Normalize scores for color mapping (-1 to 1)
    abs_max = max(abs(min(scores)), abs(max(scores)))
    if abs_max > 0:
        normalized_scores = [score / abs_max for score in scores]
    else:
        normalized_scores = scores

    # Create color map: red (negative) to white (neutral) to green (positive).
    # The 0.3 offset keeps weak attributions visibly tinted.
    colors = []
    for score in normalized_scores:
        if score > 0:  # Positive influence - green
            colors.append(plt.cm.Greens(0.3 + 0.7 * score))
        elif score < 0:  # Negative influence - red
            colors.append(plt.cm.Reds(0.3 + 0.7 * abs(score)))
        else:  # Neutral - white
            colors.append('white')

    # Layout cursor in axes data coordinates; tokens flow left to right and
    # wrap to a new row once max_width is exceeded.
    y_pos = 0.5
    x_pos = 0.05
    max_width = 0.9

    for token, score, color in zip(tokens, scores, colors):
        # Skip special tokens for cleaner display
        if token in ['<s>', '</s>', '<pad>', '[PAD]', '[CLS]', '[SEP]']:
            continue

        # Calculate token width based on character count
        token_width = len(token) * 0.01

        # Check if we need to wrap to next line
        if x_pos + token_width > max_width:
            x_pos = 0.05
            y_pos -= 0.15

        # Add token with background color
        rect = plt.Rectangle((x_pos, y_pos - 0.05), token_width, 0.1,
                           facecolor=color, edgecolor='black', linewidth=0.5, alpha=0.8)
        ax.add_patch(rect)

        # Add token text
        ax.text(x_pos + token_width/2, y_pos, token,
               ha='center', va='center', fontsize=10, fontweight='bold')

        # Add attribution score above token (raw, un-normalized value)
        ax.text(x_pos + token_width/2, y_pos + 0.08, f'{score:.3f}',
               ha='center', va='center', fontsize=8, color='darkblue')

        x_pos += token_width + 0.02

    # Set plot properties; the lower limit follows the last row that was used
    ax.set_xlim(0, 1)
    ax.set_ylim(y_pos - 0.2, 0.7)
    ax.axis('off')

    # Add title and legend
    ax.text(0.5, 0.9, f'Token Attribution Heatmap - {model_type.replace("_", " ").title()}',
           ha='center', va='center', fontsize=14, fontweight='bold')
    ax.text(0.5, 0.85, f'Class: {attribution_result["predicted_class"]} (Confidence: {attribution_result["confidence"]:.3f})',
           ha='center', va='center', fontsize=12)

    # Add color legend
    legend_elements = [
        plt.Rectangle((0, 0), 1, 1, facecolor=plt.cm.Reds(0.8), label='Negative Influence'),
        plt.Rectangle((0, 0), 1, 1, facecolor=plt.cm.Greens(0.8), label='Positive Influence'),
        plt.Rectangle((0, 0), 1, 1, facecolor='white', edgecolor='black', label='Neutral')
    ]
    ax.legend(handles=legend_elements, loc='upper right', bbox_to_anchor=(0.98, 0.98))

    plt.tight_layout()

    if save_path:
        plt.savefig(save_path, dpi=300, bbox_inches='tight')
        print(f"üíæ Saved token heatmap to {save_path}")

    plt.show()
    # Release the figure so repeated calls do not accumulate open figures
    plt.close(fig)


def visualize_attribution_distribution(attribution_result: Dict, save_path: Optional[str] = None):
    """
    2. Attribution Distribution Plot
    Bar plot showing token influence magnitude and ranking, plus the
    cumulative share of absolute attribution.

    Args:
        attribution_result: Dict providing 'tokens', 'attribution_scores' and
            'model_type'.
        save_path: If given, the figure is also saved to this path at 300 dpi.

    Returns:
        None. Nothing is drawn when there are no tokens or scores.
    """
    tokens = attribution_result['tokens']
    scores = attribution_result['attribution_scores']

    # zip(*pairs) below cannot be unpacked for empty input
    if len(tokens) == 0 or len(scores) == 0:
        print("No attribution scores to visualize")
        return

    model_type = attribution_result['model_type']

    # Create figure
    fig, (ax1, ax2) = plt.subplots(2, 1, figsize=(16, 10))

    # Sort tokens by absolute attribution score
    token_score_pairs = sorted(zip(tokens, scores), key=lambda x: abs(x[1]), reverse=True)
    sorted_tokens, sorted_scores = zip(*token_score_pairs)
    positions = range(len(sorted_tokens))

    # Plot 1: Bar plot with color coding
    colors = ['red' if score < 0 else 'green' for score in sorted_scores]
    bars = ax1.bar(positions, sorted_scores, color=colors, alpha=0.7)

    # Customize first subplot
    ax1.set_xticks(positions)
    ax1.set_xticklabels(sorted_tokens, rotation=45, ha='right')
    ax1.set_ylabel('Attribution Score')
    ax1.set_title(f'Token Attribution Distribution - {model_type.replace("_", " ").title()}')
    ax1.grid(True, alpha=0.3)
    ax1.axhline(y=0, color='black', linestyle='-', alpha=0.5)

    # Add value labels on bars: above positive bars, below negative ones
    for bar, score in zip(bars, sorted_scores):
        height = bar.get_height()
        ax1.text(bar.get_x() + bar.get_width()/2., height + (0.01 if height >= 0 else -0.01),
                f'{score:.3f}', ha='center', va='bottom' if height >= 0 else 'top', fontsize=8)

    # Plot 2: Cumulative attribution plot
    cumulative_scores = np.cumsum([abs(score) for score in sorted_scores])
    total_attribution = cumulative_scores[-1]
    cumulative_percentage = cumulative_scores / total_attribution * 100 if total_attribution > 0 else cumulative_scores

    ax2.plot(positions, cumulative_percentage, 'b-o', linewidth=2, markersize=4)
    ax2.fill_between(positions, cumulative_percentage, alpha=0.3, color='blue')

    # Customize second subplot
    ax2.set_xticks(positions)
    ax2.set_xticklabels(sorted_tokens, rotation=45, ha='right')
    ax2.set_ylabel('Cumulative Attribution (%)')
    ax2.set_title('Cumulative Attribution Impact')
    ax2.grid(True, alpha=0.3)
    ax2.axhline(y=50, color='red', linestyle='--', alpha=0.7, label='50% threshold')
    ax2.axhline(y=80, color='orange', linestyle='--', alpha=0.7, label='80% threshold')
    ax2.legend()

    plt.tight_layout()

    if save_path:
        plt.savefig(save_path, dpi=300, bbox_inches='tight')
        print(f"üíæ Saved attribution distribution to {save_path}")

    plt.show()
    # Release the figure so repeated calls do not accumulate open figures
    plt.close(fig)


def visualize_faithfulness_curves(faithfulness_results: List[Dict], save_path: Optional[str] = None):
    """
    3. Faithfulness Curves Plot
    Plot faithfulness for different k values across multiple examples.

    Left panel: one curve per example plus the average curve. Right panel: box
    plot of the scores per top-k ratio.

    Args:
        faithfulness_results: One dict per example; scores are read from the
            keys 'faithfulness_top_<ratio>' (missing keys count as 0.0).
        save_path: If given, the figure is also saved to this path at 300 dpi.

    Returns:
        None.
    """
    if not faithfulness_results:
        print("‚ö†Ô∏è No faithfulness results to visualize")
        return

    k_ratios = [0.1, 0.2, 0.3, 0.5]  # Standard ratios

    # Scores per example (rows) and per ratio (columns), read once and reused
    per_example = [
        [result.get(f'faithfulness_top_{ratio}', 0.0) for ratio in k_ratios]
        for result in faithfulness_results
    ]
    per_ratio = [list(column) for column in zip(*per_example)]

    # Create figure
    fig, (ax1, ax2) = plt.subplots(1, 2, figsize=(16, 6))

    # Plot 1: Individual curves for each example
    for i, scores in enumerate(per_example):
        ax1.plot(k_ratios, scores, 'o-', alpha=0.7, linewidth=2, markersize=6,
                label=f'Example {i+1}' if i < 5 else None)  # Limit legend to first 5

    # Add average curve
    avg_scores = [np.mean(column) for column in per_ratio]
    ax1.plot(k_ratios, avg_scores, 'k-o', linewidth=3, markersize=8,
            label='Average', alpha=0.9)

    # Customize first subplot
    ax1.set_xlabel('Top-k Ratio')
    ax1.set_ylabel('Faithfulness Score (ŒîConfidence)')
    ax1.set_title('Faithfulness Curves by Example')
    ax1.grid(True, alpha=0.3)
    ax1.legend(bbox_to_anchor=(1.05, 1), loc='upper left')
    ax1.axhline(y=0, color='red', linestyle='--', alpha=0.7)

    # Plot 2: Box plot showing distribution across examples.
    # Tick labels are set separately because the `labels` keyword of boxplot
    # is deprecated in recent Matplotlib releases. ':g' avoids float noise
    # such as 0.3 * 100 == 30.000000000000004 in the labels.
    bp = ax2.boxplot(per_ratio, patch_artist=True)
    ax2.set_xticklabels([f'{ratio * 100:g}%' for ratio in k_ratios])

    # Color the boxes
    colors = ['lightblue', 'lightgreen', 'lightyellow', 'lightcoral']
    for patch, color in zip(bp['boxes'], colors):
        patch.set_facecolor(color)

    # Customize second subplot
    ax2.set_xlabel('Top-k Ratio')
    ax2.set_ylabel('Faithfulness Score Distribution')
    ax2.set_title('Faithfulness Score Distribution by k')
    ax2.grid(True, alpha=0.3)
    ax2.axhline(y=0, color='red', linestyle='--', alpha=0.7)

    plt.tight_layout()

    if save_path:
        plt.savefig(save_path, dpi=300, bbox_inches='tight')
        print(f"üíæ Saved faithfulness curves to {save_path}")

    plt.show()
    # Release the figure so repeated calls do not accumulate open figures
    plt.close(fig)


def visualize_stability_heatmap(seed_model_dicts: List[Dict], text: str, save_path: Optional[str] = None):
    """
    4. Stability Visualization
    Heatmap showing pairwise cosine similarity of attribution vectors across seeds.

    The first seed is the reference: its predicted class and tokenizer are
    forced onto the other seeds. Vectors are standardized (zero mean, unit
    std) on their common-length prefix before the cosine is taken.

    Args:
        seed_model_dicts: Model bundles, one per seed; each is read for 'seed',
            the first one also for 'tokenizer'.
        text: Input text to explain.
        save_path: If given, the figure is also saved to this path at 300 dpi.

    Returns:
        Dict with 'mean_similarity' and 'std_similarity' (over off-diagonal
        entries), 'similarity_matrix' and 'seeds'; or None when fewer than two
        seeds are given or fewer than two attributions could be computed.
    """
    print("üìä Generating stability heatmap...")

    if len(seed_model_dicts) < 2:
        print("‚ö†Ô∏è Need at least 2 seed models for stability analysis")
        return

    # Get reference model (first seed)
    ref_md = seed_model_dicts[0]
    ig_explainer = BERTweetIntegratedGradients()

    # Generate reference attribution
    ref_result = ig_explainer.generate_attributions(text, ref_md)
    if not ref_result:
        print("‚ùå Failed to generate reference attribution")
        return

    ref_class = int(ref_result['predicted_class'])
    ref_tokenizer = ref_md['tokenizer']

    print(f"üîí Reference class: {ref_class}, using tokenizer from seed {ref_md['seed']}")

    # Generate attributions for all seeds. The reference result is reused for
    # the first seed (it already explains ref_class with ref_tokenizer), which
    # saves one Integrated Gradients run.
    seed_attributions = {}
    for position, md in enumerate(seed_model_dicts):
        seed = md['seed']
        if position == 0:
            result = ref_result
        else:
            result = ig_explainer.generate_attributions(
                text, md,
                force_target_class=ref_class,
                force_tokenizer=ref_tokenizer
            )
        if result and len(result['attribution_scores']) > 0:
            seed_attributions[seed] = np.array(result['attribution_scores'])
            print(f"‚úÖ Seed {seed}: computed IG for target class {ref_class}")
        else:
            print(f"‚ùå Seed {seed}: failed to compute IG")

    if len(seed_attributions) < 2:
        print("‚ö†Ô∏è Insufficient attributions for stability analysis")
        return

    # Compute pairwise cosine similarities. The matrix is symmetric with a unit
    # diagonal, so each pair is computed once and mirrored.
    seeds = list(seed_attributions.keys())
    n_seeds = len(seeds)
    similarity_matrix = np.eye(n_seeds)

    for i in range(n_seeds):
        for j in range(i + 1, n_seeds):
            vec1 = seed_attributions[seeds[i]]
            vec2 = seed_attributions[seeds[j]]

            similarity = 0.0
            common_len = min(len(vec1), len(vec2))
            if common_len > 1:
                # Standardize vectors before computing similarity
                A = vec1[:common_len]
                B = vec2[:common_len]
                A = (A - A.mean()) / (A.std() + 1e-8)
                B = (B - B.mean()) / (B.std() + 1e-8)

                na, nb = np.linalg.norm(A), np.linalg.norm(B)
                if na > 0 and nb > 0:
                    similarity = (A @ B) / (na * nb)

            similarity_matrix[i, j] = similarity
            similarity_matrix[j, i] = similarity

    # Create heatmap
    fig, (ax1, ax2) = plt.subplots(1, 2, figsize=(16, 6))

    # Plot 1: Similarity heatmap
    im1 = ax1.imshow(similarity_matrix, cmap='RdYlBu_r', vmin=-1, vmax=1, aspect='auto')

    # Add text annotations (white on the saturated ends of the colormap)
    for i in range(n_seeds):
        for j in range(n_seeds):
            text_val = f'{similarity_matrix[i, j]:.3f}'
            ax1.text(j, i, text_val, ha='center', va='center',
                    color='black' if abs(similarity_matrix[i, j]) < 0.7 else 'white',
                    fontweight='bold')

    # Customize heatmap
    seed_labels = [f'Seed {s}' for s in seeds]
    ax1.set_xticks(range(n_seeds))
    ax1.set_yticks(range(n_seeds))
    ax1.set_xticklabels(seed_labels)
    ax1.set_yticklabels(seed_labels)
    ax1.set_title(f'Stability Heatmap: Pairwise Cosine Similarity\nTarget Class: {ref_class}')

    # Add colorbar
    cbar1 = plt.colorbar(im1, ax=ax1)
    cbar1.set_label('Cosine Similarity')

    # Plot 2: Stability summary statistics
    # Calculate mean similarity excluding self-similarity
    mask = ~np.eye(n_seeds, dtype=bool)
    mean_similarity = similarity_matrix[mask].mean()
    std_similarity = similarity_matrix[mask].std()

    # Mean similarity of each seed with every other seed
    mean_similarities = [
        np.delete(similarity_matrix[i, :], i).mean()  # drop self-similarity
        for i in range(n_seeds)
    ]

    bars = ax2.bar(range(n_seeds), mean_similarities, color='skyblue', alpha=0.7)
    ax2.set_xticks(range(n_seeds))
    ax2.set_xticklabels(seed_labels)
    ax2.set_ylabel('Mean Similarity with Other Seeds')
    ax2.set_title(f'Stability Summary\nMean: {mean_similarity:.3f}, Std: {std_similarity:.3f}')
    ax2.grid(True, alpha=0.3)
    ax2.axhline(y=0.5, color='red', linestyle='--', alpha=0.7, label='Stability Threshold')
    ax2.legend()

    # Add value labels on bars
    for bar, sim in zip(bars, mean_similarities):
        height = bar.get_height()
        ax2.text(bar.get_x() + bar.get_width()/2., height + 0.01,
                f'{sim:.3f}', ha='center', va='bottom', fontsize=10)

    plt.tight_layout()

    if save_path:
        plt.savefig(save_path, dpi=300, bbox_inches='tight')
        print(f"üíæ Saved stability heatmap to {save_path}")

    plt.show()
    # Release the figure so repeated calls do not accumulate open figures
    plt.close(fig)

    # Return stability metrics
    return {
        'mean_similarity': mean_similarity,
        'std_similarity': std_similarity,
        'similarity_matrix': similarity_matrix,
        'seeds': seeds
    }


def plot_evaluation_comparison(evaluation_results: Dict, save_path: Optional[str] = None):
    """
    Generate comparison plots for different evaluation metrics across models.

    Draws one box plot per metric comparing the 'single_task' and 'multitask'
    result lists (whichever are present). Only the first four metrics of the
    list below, i.e. the faithfulness metrics, are drawn on the 2x2 grid.

    Args:
        evaluation_results: Dict optionally holding 'single_task' and
            'multitask' lists of per-example metric dicts; missing metrics
            count as 0.0.
        save_path: If given, the figure is also saved to this path at 300 dpi.

    Returns:
        None.
    """
    if not evaluation_results:
        print("‚ö†Ô∏è No evaluation results to plot")
        return

    # Extract metrics for comparison
    metrics = ['faithfulness_top_0.1', 'faithfulness_top_0.2', 'faithfulness_top_0.3', 'faithfulness_top_0.5',
               'stability_cosine', 'stability_correlation', 'demographic_bias_ratio', 'attribution_concentration']

    # (result key, display label) for each model family, in plotting order
    model_groups = [('single_task', 'Single-Task'), ('multitask', 'Multi-Task')]

    # Create figure with subplots
    fig, axes = plt.subplots(2, 2, figsize=(20, 16))
    axes = axes.flatten()

    for ax, metric in zip(axes, metrics[:4]):  # Plot first 4 metrics
        # Collect the non-empty groups for this metric
        data_to_plot = []
        labels = []
        for key, label in model_groups:
            if key not in evaluation_results:
                continue
            values = [result.get(metric, 0.0) for result in evaluation_results[key]]
            if values:
                data_to_plot.append(values)
                labels.append(label)

        if not data_to_plot:
            continue

        # Tick labels are set separately because the `labels` keyword of
        # boxplot is deprecated in recent Matplotlib releases.
        bp = ax.boxplot(data_to_plot, patch_artist=True)
        ax.set_xticklabels(labels)

        # Color the boxes
        colors = ['lightblue', 'lightgreen']
        for patch, color in zip(bp['boxes'], colors):
            patch.set_facecolor(color)

        ax.set_title(f'{metric.replace("_", " ").title()}')
        ax.set_ylabel('Score')
        ax.grid(True, alpha=0.3)

        # Add mean values as text (boxes sit at x = 1, 2, ...)
        for j, data in enumerate(data_to_plot):
            mean_val = np.mean(data)
            ax.text(j+1, mean_val, f'Œº={mean_val:.3f}',
                   ha='center', va='bottom', fontweight='bold')

    plt.tight_layout()

    if save_path:
        plt.savefig(save_path, dpi=300, bbox_inches='tight')
        print(f"üíæ Saved evaluation comparison to {save_path}")

    plt.show()
    # Release the figure so repeated calls do not accumulate open figures
    plt.close(fig)

In [None]:
def save_eval_csv(rows: List[Dict], path: str):
    """Save evaluation results to CSV.

    Builds a DataFrame from ``rows``, writes it to ``path`` without the index
    column, prints a one-line confirmation and returns the frame.

    Args:
        rows: Row records; each dict becomes one CSV row.
        path: Destination CSV file. Parent directories that do not exist yet
            are created before writing.

    Returns:
        The ``pd.DataFrame`` that was written to disk.
    """
    df = pd.DataFrame(rows)

    # ``to_csv`` does not create folders; make sure the target directory
    # exists so writing to a fresh output location does not raise OSError.
    parent_dir = os.path.dirname(path)
    if parent_dir:
        os.makedirs(parent_dir, exist_ok=True)

    df.to_csv(path, index=False)
    print(f"üíæ Saved {len(df)} rows to {path}")
    return df

In [None]:
def run_complete_analysis(
    num_examples: int = 8,
    data_path: str = "data/cleaned_reddit_posts.csv",
    save_visualizations: bool = True,
    save_dir: str = "explainability_results"
):
    """Run the explainability pipeline for the single-task and multitask models.

    The pipeline loads both models, loads test texts, generates explanations,
    evaluates them, optionally writes visualizations and a text report to
    ``save_dir``, and prints the report.

    Args:
        num_examples: Number of test examples requested from ``data_path``.
        data_path: CSV file passed to ``load_test_examples``.
        save_visualizations: When True, ``save_dir`` is created and the
            per-example visualizations, faithfulness curves, comparison plot
            and ``analysis_report.txt`` are written into it.
        save_dir: Output directory used when ``save_visualizations`` is True.

    Returns:
        Dict with keys ``'explanations'``, ``'evaluation_results'``,
        ``'report'`` and ``'models'`` (the latter holding the ``'single_task'``
        and ``'multitask'`` model dicts).
    """
    print("Starting Complete Explainability Analysis")
    print("=" * 80)
    
    # Create save directory
    if save_visualizations:
        os.makedirs(save_dir, exist_ok=True)
    
    # Step 1: Load models
    print("\n1Ô∏è‚É£ Loading Models...")
    single_task_dict, multitask_dict = load_bertweet_models()
    
    # Step 2: Load test examples
    print("\n2Ô∏è‚É£ Loading Test Examples...")
    test_texts = load_test_examples(data_path, num_examples)
    
    # Step 3: Generate explanations
    print("\n3Ô∏è‚É£ Generating Explanations...")
    explanations = generate_all_explanations(test_texts, single_task_dict, multitask_dict)
    
    # Step 4: Evaluate explanations
    print("\n4Ô∏è‚É£ Evaluating Explanations...")
    evaluation_results = evaluate_all_explanations(explanations)
    
    # Step 5: Generate visualizations
    if save_visualizations:
        print("\n5Ô∏è‚É£ Generating Visualizations...")
        
        # Generate comprehensive visualizations for first few examples
        for i in range(min(3, len(explanations['single_task']))):
            print(f"\nüìä Generating visualizations for example {i+1}...")
            
            # Single-task comprehensive visualizations
            single_task_result = explanations['single_task'][i]
            single_task_dir = os.path.join(save_dir, f"single_task_example_{i+1}")
            generate_comprehensive_visualizations(single_task_result, single_task_dir)
            
            # Multitask comprehensive visualizations
            # NOTE(review): assumes 'multitask' has at least as many entries as
            # 'single_task' — confirm against generate_all_explanations.
            multitask_result = explanations['multitask'][i]
            multitask_dir = os.path.join(save_dir, f"multitask_example_{i+1}")
            generate_comprehensive_visualizations(multitask_result, multitask_dir)
        
        # Generate faithfulness curves if we have multiple examples
        if len(explanations['single_task']) > 1:
            faithfulness_path = os.path.join(save_dir, "faithfulness_curves.png")
            visualize_faithfulness_curves(explanations['single_task'], faithfulness_path)
        
        # Comparison plot
        comparison_path = os.path.join(save_dir, "model_comparison.png")
        plot_evaluation_comparison(evaluation_results, comparison_path)
    
    # Step 6: Generate summary report
    print("\n6Ô∏è‚É£ Generating Summary Report...")
    report = generate_summary_report(evaluation_results)
    
    if save_visualizations:
        report_path = os.path.join(save_dir, "analysis_report.txt")
        # Write as UTF-8 explicitly: the report may contain non-ASCII symbols
        # (this pipeline's own messages do), and the platform default encoding
        # (e.g. cp1252 on Windows) would raise UnicodeEncodeError on them.
        with open(report_path, 'w', encoding='utf-8') as f:
            f.write(report)
        print(f"üíæ Saved report to {report_path}")
    
    print(report)
    print("\nüéâ Analysis Complete!")
    
    return {
        'explanations': explanations,
        'evaluation_results': evaluation_results,
        'report': report,
        'models': {'single_task': single_task_dict, 'multitask': multitask_dict}
    }

def run_ig_analysis_single_task_across_seeds(
    base_dir="./bertweet_trained_models_seeds",
    seeds=(42,123,456,789,999),
    data_path="data/cleaned_reddit_posts.csv",
    num_examples=100,
    save_dir="explainability_results_single_task"
):
    """Run the Integrated Gradients analysis for single-task models across seeds.

    Loads one model per seed, generates explanations with the first loaded
    model, evaluates those explanations against all seed models, writes
    stability plots, the per-row metrics CSV, faithfulness curves and a
    mean/std summary CSV into ``save_dir``.

    Args:
        base_dir: Directory handed to ``load_single_task_models_by_seeds``.
        seeds: Seeds whose models are loaded.
        data_path: CSV file passed to ``load_test_examples``.
        num_examples: Number of test examples requested.
        save_dir: Output directory (created if missing).

    Returns:
        Dict with ``'rows'`` (the evaluation rows) and ``'summary'`` (a
        DataFrame of mean/std per metric column that is present in the rows).
    """
    print("Starting Single-Task BERTweet IG Analysis Across Seeds")
    print("=" * 80)
    
    os.makedirs(save_dir, exist_ok=True)
    
    # Step 1: Load models across seeds
    print("\n1Ô∏è‚É£ Loading Single-Task Models Across Seeds...")
    seed_models = load_single_task_models_by_seeds(base_dir, seeds)
    # Reference model: the first loaded one (seed 42 with the default seeds,
    # presumably in the order of `seeds` — verify against the loader).
    ref_model = seed_models[0]
    
    # Step 2: Load test examples
    print("\n2Ô∏è‚É£ Loading Test Examples...")
    texts = load_test_examples(data_path, num_examples)
    
    # Step 3: Generate explanations using reference model
    print("\n3Ô∏è‚É£ Generating Explanations (Reference Seed)...")
    explanations = generate_single_task_explanations(texts, ref_model)
    
    # Step 4: Evaluate explanations across seeds
    print("\n4Ô∏è‚É£ Evaluating Explanations Across Seeds...")
    rows = evaluate_single_task_explanations_across_seeds(explanations, seed_models)
    
    # Step 5: Generate stability visualizations
    print("\n5Ô∏è‚É£ Generating Stability Visualizations...")
    
    # Generate stability heatmaps for the first few examples; the range is
    # empty when there are no texts, so no separate emptiness check is needed.
    for i in range(min(3, len(texts))):
        text = texts[i]
        print(f"\nüìä Generating stability visualization for example {i+1}...")
        
        stability_path = os.path.join(save_dir, f"stability_example_{i+1}.png")
        stability_metrics = visualize_stability_heatmap(seed_models, text, stability_path)
        
        if stability_metrics:
            print(f"‚úÖ Stability metrics for example {i+1}: Mean={stability_metrics['mean_similarity']:.3f}, Std={stability_metrics['std_similarity']:.3f}")
    
    # Step 6: Save results
    print("\n6Ô∏è‚É£ Saving Results...")
    save_eval_csv(rows, os.path.join(save_dir, "xai_metrics_single_task_across_seeds.csv"))
    
    # Step 7: Generate faithfulness curves
    print("\n7Ô∏è‚É£ Generating Faithfulness Curves...")
    
    if len(rows) > 1:
        faithfulness_path = os.path.join(save_dir, "faithfulness_curves_single_task.png")
        # NOTE(review): the evaluation rows are passed here, whereas
        # run_complete_analysis passes explanation results to the same
        # function — confirm it accepts both shapes.
        visualize_faithfulness_curves(rows, faithfulness_path)
    
    # Step 8: Generate summary
    print("\n8Ô∏è‚É£ Generating Summary...")
    df = pd.DataFrame(rows)
    metric_columns = [
        'faithfulness_top_0.1',
        'faithfulness_top_0.2',
        'faithfulness_top_0.3',
        'faithfulness_top_0.5',
        'stability_cosine',
        'stability_correlation',
        'demographic_bias_ratio',
        'attribution_concentration',
    ]
    # Aggregate only the metrics that are actually present: asking ``agg`` for
    # a missing column raises KeyError (e.g. when `rows` is empty), which would
    # discard the whole run's return value at the very last step.
    present_columns = [column for column in metric_columns if column in df.columns]
    missing_columns = [column for column in metric_columns if column not in df.columns]
    if missing_columns:
        print(f"Warning: metrics missing from results, skipped in summary: {missing_columns}")
    if present_columns:
        summary = df.agg({column: ['mean', 'std'] for column in present_columns})
    else:
        summary = pd.DataFrame(index=['mean', 'std'])
    summary.to_csv(os.path.join(save_dir, "xai_metrics_summary.csv"))
    print("\nüìä Summary Statistics:")
    print(summary)
    
    print("\nüéâ Single-Task Analysis Complete!")
    return {'rows': rows, 'summary': summary}


# Entry point: run the single-task, multi-seed IG analysis when this code is
# executed directly (every argument is spelled out explicitly).
if __name__ == "__main__":
    run_ig_analysis_single_task_across_seeds(
        data_path="data/cleaned_reddit_posts.csv",
        num_examples=100,
        seeds=(42, 123, 456, 789, 999),
        base_dir="./bertweet_trained_models_seeds",
        save_dir="explainability_results_single_task",
    )

Starting Single-Task BERTweet IG Analysis Across Seeds

1Ô∏è‚É£ Loading Single-Task Models Across Seeds...
üì• Loading single-task model (seed 42) from ./bertweet_trained_models_seeds\bertweet_sentiment_seed_42
üì• Loading single-task model (seed 123) from ./bertweet_trained_models_seeds\bertweet_sentiment_seed_123
üì• Loading single-task model (seed 456) from ./bertweet_trained_models_seeds\bertweet_sentiment_seed_456
üì• Loading single-task model (seed 789) from ./bertweet_trained_models_seeds\bertweet_sentiment_seed_789
üì• Loading single-task model (seed 999) from ./bertweet_trained_models_seeds\bertweet_sentiment_seed_999
‚úÖ Loaded 5 single-task models across seeds

2Ô∏è‚É£ Loading Test Examples...
üìä Loading 100 test examples from data/cleaned_reddit_posts.csv
‚úÖ Loaded 94 valid test examples

3Ô∏è‚É£ Generating Explanations (Reference Seed)...

üìù Processing text 1/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence:

In [None]:
print("Starting Single-Task BERTweet IG Analysis Across Seeds
================================================================================

1Ô∏è‚É£ Loading Single-Task Models Across Seeds...
üì• Loading single-task model (seed 42) from ./bertweet_trained_models_seeds\bertweet_sentiment_seed_42
üì• Loading single-task model (seed 123) from ./bertweet_trained_models_seeds\bertweet_sentiment_seed_123
üì• Loading single-task model (seed 456) from ./bertweet_trained_models_seeds\bertweet_sentiment_seed_456
üì• Loading single-task model (seed 789) from ./bertweet_trained_models_seeds\bertweet_sentiment_seed_789
üì• Loading single-task model (seed 999) from ./bertweet_trained_models_seeds\bertweet_sentiment_seed_999
‚úÖ Loaded 5 single-task models across seeds

2Ô∏è‚É£ Loading Test Examples...
üìä Loading 100 test examples from data/cleaned_reddit_posts.csv
‚úÖ Loaded 94 valid test examples

3Ô∏è‚É£ Generating Explanations (Reference Seed)...

üìù Processing text 1/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.368
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 50 tokens

üìù Processing text 2/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.353
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 20 tokens

üìù Processing text 3/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.376
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 38 tokens

üìù Processing text 4/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.369
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 16 tokens

üìù Processing text 5/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.364
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 10 tokens

üìù Processing text 6/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.383
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 56 tokens

üìù Processing text 7/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.366
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 19 tokens

üìù Processing text 8/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.357
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 61 tokens

üìù Processing text 9/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.382
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 98 tokens

üìù Processing text 10/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.376
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 73 tokens

üìù Processing text 11/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.364
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens

üìù Processing text 12/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.368
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 31 tokens

üìù Processing text 13/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.363
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 55 tokens

üìù Processing text 14/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.378
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 71 tokens

üìù Processing text 15/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.361
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens

üìù Processing text 16/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.366
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens

üìù Processing text 17/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.380
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 26 tokens

üìù Processing text 18/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.353
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 96 tokens

üìù Processing text 19/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.378
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens

üìù Processing text 20/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.362
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 5 tokens

üìù Processing text 21/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.363
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 14 tokens

üìù Processing text 22/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.372
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 15 tokens

üìù Processing text 23/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.367
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 28 tokens

üìù Processing text 24/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.361
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens

üìù Processing text 25/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.363
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens

üìù Processing text 26/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.373
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 60 tokens

üìù Processing text 27/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.362
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens

üìù Processing text 28/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.395
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 35 tokens

üìù Processing text 29/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.372
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 22 tokens

üìù Processing text 30/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.359
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens

üìù Processing text 31/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.361
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 36 tokens

üìù Processing text 32/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.378
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 26 tokens

üìù Processing text 33/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.350
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 11 tokens

üìù Processing text 34/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.360
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens

üìù Processing text 35/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.371
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 34 tokens

üìù Processing text 36/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.369
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 12 tokens

üìù Processing text 37/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.362
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 22 tokens

üìù Processing text 38/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.372
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 10 tokens

üìù Processing text 39/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.366
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 93 tokens

üìù Processing text 40/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.371
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 42 tokens

üìù Processing text 41/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.360
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 69 tokens

üìù Processing text 42/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.365
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 21 tokens

üìù Processing text 43/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.374
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 114 tokens

üìù Processing text 44/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.360
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens

üìù Processing text 45/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.377
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 101 tokens

üìù Processing text 46/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.368
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 45 tokens

üìù Processing text 47/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.353
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 12 tokens

üìù Processing text 48/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.359
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 34 tokens

üìù Processing text 49/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.386
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens

üìù Processing text 50/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.358
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 7 tokens

üìù Processing text 51/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.359
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 17 tokens

üìù Processing text 52/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.372
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 16 tokens

üìù Processing text 53/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.362
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens

üìù Processing text 54/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.364
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens

üìù Processing text 55/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.372
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 29 tokens

üìù Processing text 56/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.343
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 11 tokens

üìù Processing text 57/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.366
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 27 tokens

üìù Processing text 58/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.367
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 15 tokens

üìù Processing text 59/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.342
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 16 tokens

üìù Processing text 60/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.394
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens

üìù Processing text 61/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.369
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 33 tokens

üìù Processing text 62/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.381
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 11 tokens

üìù Processing text 63/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.355
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 14 tokens

üìù Processing text 64/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.365
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 81 tokens

üìù Processing text 65/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.375
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 20 tokens

üìù Processing text 66/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.381
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 26 tokens

üìù Processing text 67/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.366
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 97 tokens

üìù Processing text 68/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.383
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 53 tokens

üìù Processing text 69/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.366
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 77 tokens

üìù Processing text 70/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.368
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 13 tokens

üìù Processing text 71/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.366
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 76 tokens

üìù Processing text 72/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.360
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 32 tokens

üìù Processing text 73/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.378
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 13 tokens

üìù Processing text 74/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.366
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens

üìù Processing text 75/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.359
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 17 tokens

üìù Processing text 76/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.363
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 10 tokens

üìù Processing text 77/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.364
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens

üìù Processing text 78/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.348
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 6 tokens

üìù Processing text 79/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.337
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 5 tokens

üìù Processing text 80/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.377
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 7 tokens

üìù Processing text 81/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.337
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 18 tokens

üìù Processing text 82/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.379
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 34 tokens

üìù Processing text 83/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.370
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 41 tokens

üìù Processing text 84/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.368
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 11 tokens

üìù Processing text 85/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.366
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 40 tokens

üìù Processing text 86/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.356
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 12 tokens

üìù Processing text 87/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.384
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 19 tokens

üìù Processing text 88/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.373
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 17 tokens

üìù Processing text 89/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.386
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 61 tokens

üìù Processing text 90/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.377
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 7 tokens

üìù Processing text 91/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.368
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 42 tokens

üìù Processing text 92/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.366
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 38 tokens

üìù Processing text 93/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.356
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 119 tokens

üìù Processing text 94/94
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.357
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Generated explanations for 94 examples (single-task, seed 42)

4Ô∏è‚É£ Evaluating Explanations Across Seeds...
üî¨ Evaluating single-task explanations across seeds...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3685
üìä Ratio 0.1: 5 tokens masked, confidence: 0.3642 ‚Üí 0.0043
üìä Ratio 0.2: 10 tokens masked, confidence: 0.3662 ‚Üí 0.0023
üìä Ratio 0.3: 15 tokens masked, confidence: 0.3657 ‚Üí 0.0028
üìä Ratio 0.5: 26 tokens masked, confidence: 0.3537 ‚Üí 0.0148
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.368
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 50 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.269
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 50 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.359
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 50 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.327
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 50 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 50 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3530
üìä Ratio 0.1: 2 tokens masked, confidence: 0.3629 ‚Üí -0.0100
üìä Ratio 0.2: 4 tokens masked, confidence: 0.3580 ‚Üí -0.0051
üìä Ratio 0.3: 6 tokens masked, confidence: 0.3519 ‚Üí 0.0011
üìä Ratio 0.5: 11 tokens masked, confidence: 0.3479 ‚Üí 0.0050
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.353
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 20 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.316
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 20 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.375
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 20 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.320
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 20 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 20 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3755
üìä Ratio 0.1: 4 tokens masked, confidence: 0.3670 ‚Üí 0.0085
üìä Ratio 0.2: 8 tokens masked, confidence: 0.3590 ‚Üí 0.0166
üìä Ratio 0.3: 12 tokens masked, confidence: 0.3588 ‚Üí 0.0167
üìä Ratio 0.5: 20 tokens masked, confidence: 0.3628 ‚Üí 0.0128
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.376
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 38 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.360
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 38 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.387
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 38 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.359
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 38 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 38 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3693
üìä Ratio 0.1: 1 tokens masked, confidence: 0.3653 ‚Üí 0.0041
üìä Ratio 0.2: 3 tokens masked, confidence: 0.3615 ‚Üí 0.0079
üìä Ratio 0.3: 5 tokens masked, confidence: 0.3740 ‚Üí -0.0047
üìä Ratio 0.5: 9 tokens masked, confidence: 0.3614 ‚Üí 0.0079
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.369
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 16 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.370
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 16 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.352
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 16 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.326
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 16 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 16 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3640
üìä Ratio 0.1: 1 tokens masked, confidence: 0.3653 ‚Üí -0.0013
üìä Ratio 0.2: 2 tokens masked, confidence: 0.3681 ‚Üí -0.0041
üìä Ratio 0.3: 3 tokens masked, confidence: 0.3696 ‚Üí -0.0056
üìä Ratio 0.5: 6 tokens masked, confidence: 0.3654 ‚Üí -0.0014
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.364
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 10 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.294
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 10 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.373
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 10 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.292
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 10 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 10 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3827
üìä Ratio 0.1: 5 tokens masked, confidence: 0.3879 ‚Üí -0.0052
üìä Ratio 0.2: 11 tokens masked, confidence: 0.3673 ‚Üí 0.0153
üìä Ratio 0.3: 17 tokens masked, confidence: 0.3754 ‚Üí 0.0073
üìä Ratio 0.5: 29 tokens masked, confidence: 0.3740 ‚Üí 0.0086
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.383
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 56 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.346
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 56 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.343
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 56 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.360
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 56 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 56 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3660
üìä Ratio 0.1: 2 tokens masked, confidence: 0.3505 ‚Üí 0.0155
üìä Ratio 0.2: 4 tokens masked, confidence: 0.3640 ‚Üí 0.0020
üìä Ratio 0.3: 6 tokens masked, confidence: 0.3672 ‚Üí -0.0012
üìä Ratio 0.5: 10 tokens masked, confidence: 0.3773 ‚Üí -0.0113
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.366
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 19 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.365
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 19 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.374
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 19 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.354
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 19 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 19 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3574
üìä Ratio 0.1: 6 tokens masked, confidence: 0.3558 ‚Üí 0.0016
üìä Ratio 0.2: 12 tokens masked, confidence: 0.3575 ‚Üí -0.0001
üìä Ratio 0.3: 18 tokens masked, confidence: 0.3626 ‚Üí -0.0052
üìä Ratio 0.5: 31 tokens masked, confidence: 0.3535 ‚Üí 0.0039
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.357
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 61 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.257
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 61 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.362
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 61 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.300
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 61 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 61 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3817
üìä Ratio 0.1: 10 tokens masked, confidence: 0.3671 ‚Üí 0.0147
üìä Ratio 0.2: 20 tokens masked, confidence: 0.3635 ‚Üí 0.0182
üìä Ratio 0.3: 30 tokens masked, confidence: 0.3701 ‚Üí 0.0117
üìä Ratio 0.5: 50 tokens masked, confidence: 0.3664 ‚Üí 0.0154
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.382
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 98 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.356
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 98 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.372
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 98 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.316
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 98 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.322
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 98 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3755
üìä Ratio 0.1: 7 tokens masked, confidence: 0.3545 ‚Üí 0.0210
üìä Ratio 0.2: 15 tokens masked, confidence: 0.3564 ‚Üí 0.0191
üìä Ratio 0.3: 22 tokens masked, confidence: 0.3652 ‚Üí 0.0103
üìä Ratio 0.5: 37 tokens masked, confidence: 0.3642 ‚Üí 0.0114
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.376
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 73 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.341
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 73 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.365
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 73 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.319
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 73 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 73 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3640
üìä Ratio 0.1: 12 tokens masked, confidence: 0.3547 ‚Üí 0.0092
üìä Ratio 0.2: 25 tokens masked, confidence: 0.3645 ‚Üí -0.0005
üìä Ratio 0.3: 38 tokens masked, confidence: 0.3665 ‚Üí -0.0025
üìä Ratio 0.5: 64 tokens masked, confidence: 0.3723 ‚Üí -0.0084
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.364
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.348
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.337
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.331
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.322
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3681
üìä Ratio 0.1: 3 tokens masked, confidence: 0.3598 ‚Üí 0.0083
üìä Ratio 0.2: 6 tokens masked, confidence: 0.3555 ‚Üí 0.0126
üìä Ratio 0.3: 9 tokens masked, confidence: 0.3546 ‚Üí 0.0135
üìä Ratio 0.5: 16 tokens masked, confidence: 0.3623 ‚Üí 0.0058
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.368
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 31 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.381
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 31 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.363
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 31 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.331
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 31 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 31 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3633
üìä Ratio 0.1: 5 tokens masked, confidence: 0.3565 ‚Üí 0.0067
üìä Ratio 0.2: 11 tokens masked, confidence: 0.3519 ‚Üí 0.0114
üìä Ratio 0.3: 17 tokens masked, confidence: 0.3517 ‚Üí 0.0116
üìä Ratio 0.5: 28 tokens masked, confidence: 0.3750 ‚Üí -0.0117
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.363
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 55 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.291
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 55 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.368
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 55 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.330
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 55 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 55 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3779
üìä Ratio 0.1: 7 tokens masked, confidence: 0.3682 ‚Üí 0.0096
üìä Ratio 0.2: 14 tokens masked, confidence: 0.3698 ‚Üí 0.0081
üìä Ratio 0.3: 21 tokens masked, confidence: 0.3686 ‚Üí 0.0092
üìä Ratio 0.5: 36 tokens masked, confidence: 0.3618 ‚Üí 0.0160
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.378
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 71 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.367
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 71 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.359
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 71 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.320
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 71 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 71 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3609
üìä Ratio 0.1: 12 tokens masked, confidence: 0.3585 ‚Üí 0.0024
üìä Ratio 0.2: 25 tokens masked, confidence: 0.3525 ‚Üí 0.0084
üìä Ratio 0.3: 38 tokens masked, confidence: 0.3581 ‚Üí 0.0028
üìä Ratio 0.5: 64 tokens masked, confidence: 0.3524 ‚Üí 0.0085
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.361
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.299
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.355
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.329
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.316
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3664
üìä Ratio 0.1: 2 tokens masked, confidence: 0.3687 ‚Üí -0.0023
üìä Ratio 0.2: 5 tokens masked, confidence: 0.3806 ‚Üí -0.0142
üìä Ratio 0.3: 7 tokens masked, confidence: 0.3812 ‚Üí -0.0148
üìä Ratio 0.5: 13 tokens masked, confidence: 0.3777 ‚Üí -0.0114
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.366
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.278
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.359
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.290
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3796
üìä Ratio 0.1: 2 tokens masked, confidence: 0.3776 ‚Üí 0.0020
üìä Ratio 0.2: 5 tokens masked, confidence: 0.3754 ‚Üí 0.0042
üìä Ratio 0.3: 8 tokens masked, confidence: 0.3745 ‚Üí 0.0051
üìä Ratio 0.5: 14 tokens masked, confidence: 0.3607 ‚Üí 0.0189
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.380
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 26 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.370
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 26 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.370
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 26 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.309
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 26 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 26 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3534
üìä Ratio 0.1: 9 tokens masked, confidence: 0.3559 ‚Üí -0.0025
üìä Ratio 0.2: 19 tokens masked, confidence: 0.3561 ‚Üí -0.0027
üìä Ratio 0.3: 29 tokens masked, confidence: 0.3648 ‚Üí -0.0114
üìä Ratio 0.5: 49 tokens masked, confidence: 0.3515 ‚Üí 0.0019
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.353
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 96 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.273
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 96 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.354
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 96 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.315
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 96 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 96 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3784
üìä Ratio 0.1: 2 tokens masked, confidence: 0.3695 ‚Üí 0.0089
üìä Ratio 0.2: 5 tokens masked, confidence: 0.3737 ‚Üí 0.0047
üìä Ratio 0.3: 7 tokens masked, confidence: 0.3705 ‚Üí 0.0079
üìä Ratio 0.5: 13 tokens masked, confidence: 0.3921 ‚Üí -0.0137
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.378
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.280
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.353
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.314
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3618
üìä Ratio 0.1: 1 tokens masked, confidence: 0.3518 ‚Üí 0.0100
üìä Ratio 0.2: 1 tokens masked, confidence: 0.3518 ‚Üí 0.0100
üìä Ratio 0.3: 2 tokens masked, confidence: 0.3622 ‚Üí -0.0004
üìä Ratio 0.5: 3 tokens masked, confidence: 0.3602 ‚Üí 0.0016
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.362
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 5 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.350
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 5 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.374
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 5 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.326
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 5 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 5 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3630
üìä Ratio 0.1: 1 tokens masked, confidence: 0.3705 ‚Üí -0.0075
üìä Ratio 0.2: 3 tokens masked, confidence: 0.3769 ‚Üí -0.0139
üìä Ratio 0.3: 4 tokens masked, confidence: 0.3762 ‚Üí -0.0133
üìä Ratio 0.5: 8 tokens masked, confidence: 0.3866 ‚Üí -0.0236
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.363
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 14 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.392
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 14 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.361
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 14 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.320
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 14 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 14 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3717
üìä Ratio 0.1: 1 tokens masked, confidence: 0.3699 ‚Üí 0.0018
üìä Ratio 0.2: 3 tokens masked, confidence: 0.3704 ‚Üí 0.0013
üìä Ratio 0.3: 5 tokens masked, confidence: 0.3607 ‚Üí 0.0110
üìä Ratio 0.5: 8 tokens masked, confidence: 0.3647 ‚Üí 0.0070
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.372
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 15 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.260
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 15 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.359
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 15 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.280
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 15 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 15 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3665
üìä Ratio 0.1: 3 tokens masked, confidence: 0.3627 ‚Üí 0.0039
üìä Ratio 0.2: 6 tokens masked, confidence: 0.3620 ‚Üí 0.0046
üìä Ratio 0.3: 9 tokens masked, confidence: 0.3617 ‚Üí 0.0049
üìä Ratio 0.5: 15 tokens masked, confidence: 0.3755 ‚Üí -0.0090
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.367
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 28 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.250
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 28 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.358
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 28 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.289
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 28 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 28 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3614
üìä Ratio 0.1: 12 tokens masked, confidence: 0.3586 ‚Üí 0.0029
üìä Ratio 0.2: 25 tokens masked, confidence: 0.3547 ‚Üí 0.0067
üìä Ratio 0.3: 38 tokens masked, confidence: 0.3509 ‚Üí 0.0105
üìä Ratio 0.5: 64 tokens masked, confidence: 0.3506 ‚Üí 0.0108
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.361
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.308
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.346
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.357
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.316
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3630
üìä Ratio 0.1: 12 tokens masked, confidence: 0.3621 ‚Üí 0.0009
üìä Ratio 0.2: 25 tokens masked, confidence: 0.3620 ‚Üí 0.0010
üìä Ratio 0.3: 38 tokens masked, confidence: 0.3641 ‚Üí -0.0011
üìä Ratio 0.5: 64 tokens masked, confidence: 0.3630 ‚Üí -0.0000
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.363
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.367
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.345
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.319
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.320
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3731
üìä Ratio 0.1: 6 tokens masked, confidence: 0.3735 ‚Üí -0.0004
üìä Ratio 0.2: 12 tokens masked, confidence: 0.3673 ‚Üí 0.0058
üìä Ratio 0.3: 18 tokens masked, confidence: 0.3660 ‚Üí 0.0071
üìä Ratio 0.5: 31 tokens masked, confidence: 0.3841 ‚Üí -0.0110
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.373
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 60 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.379
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 60 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.355
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 60 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.324
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 60 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 60 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3618
üìä Ratio 0.1: 12 tokens masked, confidence: 0.3610 ‚Üí 0.0007
üìä Ratio 0.2: 25 tokens masked, confidence: 0.3609 ‚Üí 0.0009
üìä Ratio 0.3: 38 tokens masked, confidence: 0.3589 ‚Üí 0.0029
üìä Ratio 0.5: 64 tokens masked, confidence: 0.3520 ‚Üí 0.0098
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.362
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.314
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.340
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.367
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.319
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3954
üìä Ratio 0.1: 3 tokens masked, confidence: 0.3931 ‚Üí 0.0023
üìä Ratio 0.2: 7 tokens masked, confidence: 0.3924 ‚Üí 0.0030
üìä Ratio 0.3: 11 tokens masked, confidence: 0.3828 ‚Üí 0.0126
üìä Ratio 0.5: 18 tokens masked, confidence: 0.3790 ‚Üí 0.0165
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.395
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 35 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.337
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 35 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.371
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 35 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.323
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 35 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 35 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3716
üìä Ratio 0.1: 2 tokens masked, confidence: 0.3582 ‚Üí 0.0133
üìä Ratio 0.2: 4 tokens masked, confidence: 0.3559 ‚Üí 0.0157
üìä Ratio 0.3: 7 tokens masked, confidence: 0.3643 ‚Üí 0.0073
üìä Ratio 0.5: 12 tokens masked, confidence: 0.3722 ‚Üí -0.0006
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.372
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 22 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.306
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 22 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.375
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 22 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.303
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 22 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 22 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3594
üìä Ratio 0.1: 12 tokens masked, confidence: 0.3582 ‚Üí 0.0012
üìä Ratio 0.2: 25 tokens masked, confidence: 0.3638 ‚Üí -0.0044
üìä Ratio 0.3: 38 tokens masked, confidence: 0.3624 ‚Üí -0.0030
üìä Ratio 0.5: 64 tokens masked, confidence: 0.3539 ‚Üí 0.0055
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.359
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.293
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.351
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.331
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.319
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3609
üìä Ratio 0.1: 3 tokens masked, confidence: 0.3605 ‚Üí 0.0004
üìä Ratio 0.2: 7 tokens masked, confidence: 0.3515 ‚Üí 0.0094
üìä Ratio 0.3: 11 tokens masked, confidence: 0.3481 ‚Üí 0.0128
üìä Ratio 0.5: 19 tokens masked, confidence: 0.3525 ‚Üí 0.0084
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.361
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 36 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.305
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 36 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.342
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 36 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.309
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 36 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 36 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3781
üìä Ratio 0.1: 2 tokens masked, confidence: 0.3580 ‚Üí 0.0201
üìä Ratio 0.2: 5 tokens masked, confidence: 0.3577 ‚Üí 0.0204
üìä Ratio 0.3: 8 tokens masked, confidence: 0.3621 ‚Üí 0.0160
üìä Ratio 0.5: 14 tokens masked, confidence: 0.3715 ‚Üí 0.0066
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.378
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 26 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.380
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 26 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.384
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 26 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.322
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 26 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 26 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3503
üìä Ratio 0.1: 1 tokens masked, confidence: 0.3476 ‚Üí 0.0027
üìä Ratio 0.2: 2 tokens masked, confidence: 0.3459 ‚Üí 0.0044
üìä Ratio 0.3: 3 tokens masked, confidence: 0.3511 ‚Üí -0.0008
üìä Ratio 0.5: 6 tokens masked, confidence: 0.3362 ‚Üí 0.0141
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.350
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 11 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.394
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 11 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.365
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 11 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.342
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 11 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 11 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3596
üìä Ratio 0.1: 12 tokens masked, confidence: 0.3633 ‚Üí -0.0037
üìä Ratio 0.2: 25 tokens masked, confidence: 0.3607 ‚Üí -0.0010
üìä Ratio 0.3: 38 tokens masked, confidence: 0.3634 ‚Üí -0.0038
üìä Ratio 0.5: 64 tokens masked, confidence: 0.3565 ‚Üí 0.0031
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.360
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.289
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.344
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.361
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.323
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3708
üìä Ratio 0.1: 3 tokens masked, confidence: 0.3707 ‚Üí 0.0001
üìä Ratio 0.2: 7 tokens masked, confidence: 0.3721 ‚Üí -0.0012
üìä Ratio 0.3: 10 tokens masked, confidence: 0.3673 ‚Üí 0.0036
üìä Ratio 0.5: 18 tokens masked, confidence: 0.3619 ‚Üí 0.0090
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.371
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 34 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.256
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 34 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.360
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 34 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.279
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 34 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 34 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3688
üìä Ratio 0.1: 1 tokens masked, confidence: 0.3736 ‚Üí -0.0048
üìä Ratio 0.2: 2 tokens masked, confidence: 0.3757 ‚Üí -0.0069
üìä Ratio 0.3: 4 tokens masked, confidence: 0.3526 ‚Üí 0.0162
üìä Ratio 0.5: 7 tokens masked, confidence: 0.3349 ‚Üí 0.0339
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.369
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 12 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.301
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 12 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.355
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 12 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.325
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 12 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 12 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3624
üìä Ratio 0.1: 2 tokens masked, confidence: 0.3647 ‚Üí -0.0023
üìä Ratio 0.2: 4 tokens masked, confidence: 0.3568 ‚Üí 0.0056
üìä Ratio 0.3: 7 tokens masked, confidence: 0.3617 ‚Üí 0.0007
üìä Ratio 0.5: 12 tokens masked, confidence: 0.3720 ‚Üí -0.0096
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.362
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 22 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.268
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 22 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.346
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 22 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.281
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 22 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 22 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3715
üìä Ratio 0.1: 1 tokens masked, confidence: 0.3592 ‚Üí 0.0123
üìä Ratio 0.2: 2 tokens masked, confidence: 0.3598 ‚Üí 0.0117
üìä Ratio 0.3: 3 tokens masked, confidence: 0.3490 ‚Üí 0.0225
üìä Ratio 0.5: 6 tokens masked, confidence: 0.3444 ‚Üí 0.0271
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.372
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 10 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.352
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 10 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.395
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 10 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.330
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 10 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 10 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3660
üìä Ratio 0.1: 9 tokens masked, confidence: 0.3719 ‚Üí -0.0059
üìä Ratio 0.2: 19 tokens masked, confidence: 0.3671 ‚Üí -0.0011
üìä Ratio 0.3: 28 tokens masked, confidence: 0.3720 ‚Üí -0.0061
üìä Ratio 0.5: 47 tokens masked, confidence: 0.3766 ‚Üí -0.0106
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.366
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 93 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.335
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 93 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.352
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 93 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.343
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 93 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 93 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3710
üìä Ratio 0.1: 4 tokens masked, confidence: 0.3649 ‚Üí 0.0062
üìä Ratio 0.2: 8 tokens masked, confidence: 0.3600 ‚Üí 0.0111
üìä Ratio 0.3: 13 tokens masked, confidence: 0.3661 ‚Üí 0.0049
üìä Ratio 0.5: 22 tokens masked, confidence: 0.3537 ‚Üí 0.0174
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.371
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 42 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.301
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 42 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.369
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 42 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.329
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 42 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 42 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3601
üìä Ratio 0.1: 7 tokens masked, confidence: 0.3610 ‚Üí -0.0009
üìä Ratio 0.2: 14 tokens masked, confidence: 0.3586 ‚Üí 0.0015
üìä Ratio 0.3: 21 tokens masked, confidence: 0.3575 ‚Üí 0.0026
üìä Ratio 0.5: 35 tokens masked, confidence: 0.3709 ‚Üí -0.0108
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.360
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 69 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.258
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 69 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.375
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 69 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.289
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 69 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 69 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3651
üìä Ratio 0.1: 2 tokens masked, confidence: 0.3569 ‚Üí 0.0082
üìä Ratio 0.2: 4 tokens masked, confidence: 0.3659 ‚Üí -0.0008
üìä Ratio 0.3: 6 tokens masked, confidence: 0.3650 ‚Üí 0.0001
üìä Ratio 0.5: 11 tokens masked, confidence: 0.3576 ‚Üí 0.0075
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.365
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 21 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.343
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 21 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.366
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 21 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.339
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 21 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 21 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3742
üìä Ratio 0.1: 11 tokens masked, confidence: 0.3721 ‚Üí 0.0021
üìä Ratio 0.2: 23 tokens masked, confidence: 0.3634 ‚Üí 0.0108
üìä Ratio 0.3: 34 tokens masked, confidence: 0.3639 ‚Üí 0.0103
üìä Ratio 0.5: 58 tokens masked, confidence: 0.3598 ‚Üí 0.0144
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.374
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 114 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.329
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 114 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.379
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 114 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.331
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 114 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 114 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3596
üìä Ratio 0.1: 12 tokens masked, confidence: 0.3558 ‚Üí 0.0038
üìä Ratio 0.2: 25 tokens masked, confidence: 0.3566 ‚Üí 0.0030
üìä Ratio 0.3: 38 tokens masked, confidence: 0.3581 ‚Üí 0.0015
üìä Ratio 0.5: 64 tokens masked, confidence: 0.3575 ‚Üí 0.0021
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.360
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.348
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.368
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.323
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.316
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3770
üìä Ratio 0.1: 10 tokens masked, confidence: 0.3682 ‚Üí 0.0088
üìä Ratio 0.2: 20 tokens masked, confidence: 0.3712 ‚Üí 0.0057
üìä Ratio 0.3: 30 tokens masked, confidence: 0.3720 ‚Üí 0.0050
üìä Ratio 0.5: 51 tokens masked, confidence: 0.3641 ‚Üí 0.0129
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.377
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 101 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.344
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 101 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.340
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 101 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.318
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 101 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 101 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3684
üìä Ratio 0.1: 4 tokens masked, confidence: 0.3566 ‚Üí 0.0118
üìä Ratio 0.2: 9 tokens masked, confidence: 0.3638 ‚Üí 0.0046
üìä Ratio 0.3: 14 tokens masked, confidence: 0.3649 ‚Üí 0.0034
üìä Ratio 0.5: 23 tokens masked, confidence: 0.3538 ‚Üí 0.0146
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.368
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 45 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.356
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 45 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.375
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 45 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.332
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 45 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 45 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3529
üìä Ratio 0.1: 1 tokens masked, confidence: 0.3549 ‚Üí -0.0020
üìä Ratio 0.2: 2 tokens masked, confidence: 0.3597 ‚Üí -0.0067
üìä Ratio 0.3: 4 tokens masked, confidence: 0.3580 ‚Üí -0.0051
üìä Ratio 0.5: 7 tokens masked, confidence: 0.3553 ‚Üí -0.0024
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.353
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 12 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.379
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 12 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.368
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 12 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.351
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 12 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 12 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3587
üìä Ratio 0.1: 3 tokens masked, confidence: 0.3592 ‚Üí -0.0005
üìä Ratio 0.2: 7 tokens masked, confidence: 0.3607 ‚Üí -0.0020
üìä Ratio 0.3: 10 tokens masked, confidence: 0.3612 ‚Üí -0.0025
üìä Ratio 0.5: 18 tokens masked, confidence: 0.3683 ‚Üí -0.0095
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.359
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 34 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.264
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 34 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.363
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 34 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.295
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 34 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 34 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3860
üìä Ratio 0.1: 2 tokens masked, confidence: 0.3703 ‚Üí 0.0157
üìä Ratio 0.2: 5 tokens masked, confidence: 0.3598 ‚Üí 0.0262
üìä Ratio 0.3: 7 tokens masked, confidence: 0.3511 ‚Üí 0.0349
üìä Ratio 0.5: 13 tokens masked, confidence: 0.3545 ‚Üí 0.0314
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.386
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.366
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.357
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.345
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3578
üìä Ratio 0.1: 1 tokens masked, confidence: 0.3553 ‚Üí 0.0024
üìä Ratio 0.2: 1 tokens masked, confidence: 0.3553 ‚Üí 0.0024
üìä Ratio 0.3: 2 tokens masked, confidence: 0.3598 ‚Üí -0.0020
üìä Ratio 0.5: 4 tokens masked, confidence: 0.3822 ‚Üí -0.0245
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.358
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 7 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.357
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 7 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.381
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 7 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.343
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 7 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 7 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3591
üìä Ratio 0.1: 1 tokens masked, confidence: 0.3604 ‚Üí -0.0013
üìä Ratio 0.2: 3 tokens masked, confidence: 0.3470 ‚Üí 0.0122
üìä Ratio 0.3: 5 tokens masked, confidence: 0.3471 ‚Üí 0.0121
üìä Ratio 0.5: 9 tokens masked, confidence: 0.3600 ‚Üí -0.0008
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.359
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 17 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.360
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 17 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.382
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 17 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.369
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 17 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 17 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3725
üìä Ratio 0.1: 1 tokens masked, confidence: 0.3536 ‚Üí 0.0188
üìä Ratio 0.2: 3 tokens masked, confidence: 0.3352 ‚Üí 0.0372
üìä Ratio 0.3: 5 tokens masked, confidence: 0.3196 ‚Üí 0.0529
üìä Ratio 0.5: 9 tokens masked, confidence: 0.3176 ‚Üí 0.0549
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.372
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 16 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.280
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 16 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.349
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 16 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.316
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 16 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 16 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3624
üìä Ratio 0.1: 2 tokens masked, confidence: 0.3591 ‚Üí 0.0033
üìä Ratio 0.2: 5 tokens masked, confidence: 0.3496 ‚Üí 0.0128
üìä Ratio 0.3: 7 tokens masked, confidence: 0.3465 ‚Üí 0.0159
üìä Ratio 0.5: 13 tokens masked, confidence: 0.3656 ‚Üí -0.0032
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.362
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.287
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.378
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.342
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3643
üìä Ratio 0.1: 2 tokens masked, confidence: 0.3605 ‚Üí 0.0037
üìä Ratio 0.2: 5 tokens masked, confidence: 0.3614 ‚Üí 0.0029
üìä Ratio 0.3: 7 tokens masked, confidence: 0.3657 ‚Üí -0.0014
üìä Ratio 0.5: 13 tokens masked, confidence: 0.3655 ‚Üí -0.0012
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.364
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.398
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.352
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.314
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3717
üìä Ratio 0.1: 3 tokens masked, confidence: 0.3667 ‚Üí 0.0050
üìä Ratio 0.2: 6 tokens masked, confidence: 0.3551 ‚Üí 0.0167
üìä Ratio 0.3: 9 tokens masked, confidence: 0.3605 ‚Üí 0.0112
üìä Ratio 0.5: 15 tokens masked, confidence: 0.3659 ‚Üí 0.0059
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.372
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 29 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.390
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 29 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.367
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 29 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.303
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 29 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 29 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3425
üìä Ratio 0.1: 1 tokens masked, confidence: 0.3585 ‚Üí -0.0160
üìä Ratio 0.2: 2 tokens masked, confidence: 0.3460 ‚Üí -0.0034
üìä Ratio 0.3: 3 tokens masked, confidence: 0.3410 ‚Üí 0.0015
üìä Ratio 0.5: 6 tokens masked, confidence: 0.3258 ‚Üí 0.0167
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.343
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 11 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.298
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 11 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.375
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 11 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.361
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 11 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 11 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3656
üìä Ratio 0.1: 2 tokens masked, confidence: 0.3742 ‚Üí -0.0086
üìä Ratio 0.2: 5 tokens masked, confidence: 0.3698 ‚Üí -0.0042
üìä Ratio 0.3: 8 tokens masked, confidence: 0.3591 ‚Üí 0.0065
üìä Ratio 0.5: 14 tokens masked, confidence: 0.3709 ‚Üí -0.0053
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.366
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 27 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.368
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 27 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.369
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 27 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.316
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 27 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 27 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3665
üìä Ratio 0.1: 1 tokens masked, confidence: 0.3592 ‚Üí 0.0073
üìä Ratio 0.2: 3 tokens masked, confidence: 0.3487 ‚Üí 0.0178
üìä Ratio 0.3: 5 tokens masked, confidence: 0.3367 ‚Üí 0.0298
üìä Ratio 0.5: 8 tokens masked, confidence: 0.3514 ‚Üí 0.0152
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.367
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 15 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.359
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 15 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.385
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 15 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.331
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 15 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 15 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3419
üìä Ratio 0.1: 1 tokens masked, confidence: 0.3386 ‚Üí 0.0033
üìä Ratio 0.2: 3 tokens masked, confidence: 0.3309 ‚Üí 0.0110
üìä Ratio 0.3: 5 tokens masked, confidence: 0.3317 ‚Üí 0.0103
üìä Ratio 0.5: 9 tokens masked, confidence: 0.3246 ‚Üí 0.0173
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.342
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 16 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.277
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 16 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.376
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 16 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.353
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 16 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 16 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3942
üìä Ratio 0.1: 2 tokens masked, confidence: 0.3781 ‚Üí 0.0161
üìä Ratio 0.2: 5 tokens masked, confidence: 0.3783 ‚Üí 0.0159
üìä Ratio 0.3: 7 tokens masked, confidence: 0.3663 ‚Üí 0.0279
üìä Ratio 0.5: 13 tokens masked, confidence: 0.3555 ‚Üí 0.0388
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.394
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.314
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.379
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.362
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 24 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3694
üìä Ratio 0.1: 3 tokens masked, confidence: 0.3499 ‚Üí 0.0195
üìä Ratio 0.2: 7 tokens masked, confidence: 0.3497 ‚Üí 0.0197
üìä Ratio 0.3: 10 tokens masked, confidence: 0.3560 ‚Üí 0.0134
üìä Ratio 0.5: 17 tokens masked, confidence: 0.3598 ‚Üí 0.0095
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.369
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 33 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.323
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 33 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.352
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 33 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.328
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 33 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 33 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3815
üìä Ratio 0.1: 1 tokens masked, confidence: 0.3633 ‚Üí 0.0182
üìä Ratio 0.2: 2 tokens masked, confidence: 0.4001 ‚Üí -0.0186
üìä Ratio 0.3: 3 tokens masked, confidence: 0.3900 ‚Üí -0.0085
üìä Ratio 0.5: 6 tokens masked, confidence: 0.3755 ‚Üí 0.0060
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.381
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 11 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.323
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 11 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.376
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 11 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.345
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 11 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 11 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3548
üìä Ratio 0.1: 1 tokens masked, confidence: 0.3539 ‚Üí 0.0008
üìä Ratio 0.2: 3 tokens masked, confidence: 0.3479 ‚Üí 0.0069
üìä Ratio 0.3: 4 tokens masked, confidence: 0.3414 ‚Üí 0.0133
üìä Ratio 0.5: 8 tokens masked, confidence: 0.3525 ‚Üí 0.0022
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.355
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 14 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.286
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 14 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.351
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 14 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.296
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 14 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 14 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3654
üìä Ratio 0.1: 8 tokens masked, confidence: 0.3671 ‚Üí -0.0017
üìä Ratio 0.2: 16 tokens masked, confidence: 0.3649 ‚Üí 0.0005
üìä Ratio 0.3: 24 tokens masked, confidence: 0.3593 ‚Üí 0.0061
üìä Ratio 0.5: 41 tokens masked, confidence: 0.3569 ‚Üí 0.0085
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.365
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 81 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.300
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 81 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.345
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 81 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.322
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 81 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 81 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3749
üìä Ratio 0.1: 2 tokens masked, confidence: 0.3700 ‚Üí 0.0049
üìä Ratio 0.2: 4 tokens masked, confidence: 0.3832 ‚Üí -0.0083
üìä Ratio 0.3: 6 tokens masked, confidence: 0.3805 ‚Üí -0.0057
üìä Ratio 0.5: 11 tokens masked, confidence: 0.3652 ‚Üí 0.0097
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.375
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 20 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.341
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 20 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.393
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 20 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.318
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 20 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 20 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3813
üìä Ratio 0.1: 2 tokens masked, confidence: 0.3756 ‚Üí 0.0057
üìä Ratio 0.2: 5 tokens masked, confidence: 0.3787 ‚Üí 0.0027
üìä Ratio 0.3: 8 tokens masked, confidence: 0.3677 ‚Üí 0.0136
üìä Ratio 0.5: 14 tokens masked, confidence: 0.3744 ‚Üí 0.0070
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.381
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 26 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.266
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 26 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.361
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 26 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.297
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 26 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 26 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3659
üìä Ratio 0.1: 9 tokens masked, confidence: 0.3599 ‚Üí 0.0060
üìä Ratio 0.2: 19 tokens masked, confidence: 0.3567 ‚Üí 0.0092
üìä Ratio 0.3: 29 tokens masked, confidence: 0.3610 ‚Üí 0.0049
üìä Ratio 0.5: 49 tokens masked, confidence: 0.3608 ‚Üí 0.0051
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.366
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 97 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.303
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 97 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.358
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 97 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.325
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 97 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.312
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 97 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3826
üìä Ratio 0.1: 5 tokens masked, confidence: 0.3751 ‚Üí 0.0075
üìä Ratio 0.2: 11 tokens masked, confidence: 0.3690 ‚Üí 0.0136
üìä Ratio 0.3: 16 tokens masked, confidence: 0.3752 ‚Üí 0.0074
üìä Ratio 0.5: 27 tokens masked, confidence: 0.3696 ‚Üí 0.0129
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.383
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 53 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.302
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 53 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.336
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 53 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.333
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 53 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 53 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3657
üìä Ratio 0.1: 7 tokens masked, confidence: 0.3540 ‚Üí 0.0117
üìä Ratio 0.2: 15 tokens masked, confidence: 0.3580 ‚Üí 0.0077
üìä Ratio 0.3: 23 tokens masked, confidence: 0.3546 ‚Üí 0.0111
üìä Ratio 0.5: 39 tokens masked, confidence: 0.3490 ‚Üí 0.0167
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.366
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 77 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.364
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 77 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.348
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 77 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.317
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 77 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 77 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3675
üìä Ratio 0.1: 1 tokens masked, confidence: 0.3713 ‚Üí -0.0037
üìä Ratio 0.2: 3 tokens masked, confidence: 0.3680 ‚Üí -0.0005
üìä Ratio 0.3: 4 tokens masked, confidence: 0.3629 ‚Üí 0.0046
üìä Ratio 0.5: 7 tokens masked, confidence: 0.3659 ‚Üí 0.0016
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.368
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 13 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.256
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 13 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.357
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 13 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.274
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 13 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 13 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3659
üìä Ratio 0.1: 7 tokens masked, confidence: 0.3596 ‚Üí 0.0063
üìä Ratio 0.2: 15 tokens masked, confidence: 0.3572 ‚Üí 0.0087
üìä Ratio 0.3: 23 tokens masked, confidence: 0.3629 ‚Üí 0.0030
üìä Ratio 0.5: 39 tokens masked, confidence: 0.3616 ‚Üí 0.0043
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.366
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 76 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.359
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 76 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.369
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 76 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 76 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 76 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3603
üìä Ratio 0.1: 3 tokens masked, confidence: 0.3595 ‚Üí 0.0008
üìä Ratio 0.2: 6 tokens masked, confidence: 0.3610 ‚Üí -0.0007
üìä Ratio 0.3: 10 tokens masked, confidence: 0.3618 ‚Üí -0.0015
üìä Ratio 0.5: 17 tokens masked, confidence: 0.3711 ‚Üí -0.0108
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.360
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 32 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.404
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 32 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.345
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 32 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.316
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 32 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 32 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3783
üìä Ratio 0.1: 1 tokens masked, confidence: 0.3876 ‚Üí -0.0093
üìä Ratio 0.2: 3 tokens masked, confidence: 0.3881 ‚Üí -0.0098
üìä Ratio 0.3: 4 tokens masked, confidence: 0.3840 ‚Üí -0.0057
üìä Ratio 0.5: 7 tokens masked, confidence: 0.3889 ‚Üí -0.0106
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.378
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 13 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.322
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 13 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.359
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 13 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.309
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 13 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 13 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3661
üìä Ratio 0.1: 12 tokens masked, confidence: 0.3688 ‚Üí -0.0026
üìä Ratio 0.2: 25 tokens masked, confidence: 0.3746 ‚Üí -0.0085
üìä Ratio 0.3: 38 tokens masked, confidence: 0.3696 ‚Üí -0.0034
üìä Ratio 0.5: 64 tokens masked, confidence: 0.3613 ‚Üí 0.0049
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.366
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.286
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.350
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.330
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.312
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3586
üìä Ratio 0.1: 1 tokens masked, confidence: 0.3600 ‚Üí -0.0014
üìä Ratio 0.2: 3 tokens masked, confidence: 0.3566 ‚Üí 0.0020
üìä Ratio 0.3: 5 tokens masked, confidence: 0.3511 ‚Üí 0.0075
üìä Ratio 0.5: 9 tokens masked, confidence: 0.3479 ‚Üí 0.0107
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.359
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 17 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.322
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 17 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.374
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 17 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.336
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 17 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 17 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3634
üìä Ratio 0.1: 1 tokens masked, confidence: 0.3634 ‚Üí -0.0001
üìä Ratio 0.2: 2 tokens masked, confidence: 0.3554 ‚Üí 0.0080
üìä Ratio 0.3: 3 tokens masked, confidence: 0.3531 ‚Üí 0.0103
üìä Ratio 0.5: 6 tokens masked, confidence: 0.3873 ‚Üí -0.0239
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.363
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 10 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.299
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 10 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.401
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 10 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.285
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 10 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 10 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3640
üìä Ratio 0.1: 12 tokens masked, confidence: 0.3627 ‚Üí 0.0012
üìä Ratio 0.2: 25 tokens masked, confidence: 0.3674 ‚Üí -0.0034
üìä Ratio 0.3: 38 tokens masked, confidence: 0.3659 ‚Üí -0.0019
üìä Ratio 0.5: 64 tokens masked, confidence: 0.3624 ‚Üí 0.0015
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.364
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.272
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.347
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.312
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.315
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3483
üìä Ratio 0.1: 1 tokens masked, confidence: 0.3505 ‚Üí -0.0022
üìä Ratio 0.2: 1 tokens masked, confidence: 0.3505 ‚Üí -0.0022
üìä Ratio 0.3: 2 tokens masked, confidence: 0.3486 ‚Üí -0.0003
üìä Ratio 0.5: 4 tokens masked, confidence: 0.3472 ‚Üí 0.0011
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.348
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 6 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.459
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 6 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.348
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 6 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.339
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 6 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 6 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3374
üìä Ratio 0.1: 1 tokens masked, confidence: 0.3292 ‚Üí 0.0082
üìä Ratio 0.2: 1 tokens masked, confidence: 0.3292 ‚Üí 0.0082
üìä Ratio 0.3: 2 tokens masked, confidence: 0.3284 ‚Üí 0.0091
üìä Ratio 0.5: 3 tokens masked, confidence: 0.3626 ‚Üí -0.0252
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.337
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 5 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.429
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 5 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.346
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 5 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.333
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 5 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 5 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3773
üìä Ratio 0.1: 1 tokens masked, confidence: 0.3446 ‚Üí 0.0327
üìä Ratio 0.2: 1 tokens masked, confidence: 0.3446 ‚Üí 0.0327
üìä Ratio 0.3: 2 tokens masked, confidence: 0.3464 ‚Üí 0.0309
üìä Ratio 0.5: 4 tokens masked, confidence: 0.3394 ‚Üí 0.0379
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.377
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 7 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.363
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 7 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.364
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 7 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.292
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 7 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 7 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3374
üìä Ratio 0.1: 2 tokens masked, confidence: 0.3255 ‚Üí 0.0119
üìä Ratio 0.2: 4 tokens masked, confidence: 0.3643 ‚Üí -0.0269
üìä Ratio 0.3: 6 tokens masked, confidence: 0.3575 ‚Üí -0.0200
üìä Ratio 0.5: 10 tokens masked, confidence: 0.3821 ‚Üí -0.0447
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.337
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 18 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.457
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 18 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.371
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 18 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.367
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 18 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 18 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3791
üìä Ratio 0.1: 3 tokens masked, confidence: 0.3685 ‚Üí 0.0106
üìä Ratio 0.2: 7 tokens masked, confidence: 0.3749 ‚Üí 0.0042
üìä Ratio 0.3: 10 tokens masked, confidence: 0.3712 ‚Üí 0.0079
üìä Ratio 0.5: 18 tokens masked, confidence: 0.3692 ‚Üí 0.0099
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.379
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 34 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.309
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 34 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.357
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 34 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.336
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 34 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 34 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3695
üìä Ratio 0.1: 4 tokens masked, confidence: 0.3653 ‚Üí 0.0042
üìä Ratio 0.2: 8 tokens masked, confidence: 0.3631 ‚Üí 0.0065
üìä Ratio 0.3: 12 tokens masked, confidence: 0.3655 ‚Üí 0.0041
üìä Ratio 0.5: 21 tokens masked, confidence: 0.3675 ‚Üí 0.0020
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.370
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 41 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.283
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 41 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.358
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 41 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.301
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 41 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 41 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3683
üìä Ratio 0.1: 1 tokens masked, confidence: 0.3754 ‚Üí -0.0071
üìä Ratio 0.2: 2 tokens masked, confidence: 0.3661 ‚Üí 0.0022
üìä Ratio 0.3: 3 tokens masked, confidence: 0.3590 ‚Üí 0.0093
üìä Ratio 0.5: 6 tokens masked, confidence: 0.3655 ‚Üí 0.0028
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.368
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 11 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.349
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 11 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.375
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 11 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.354
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 11 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 11 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3663
üìä Ratio 0.1: 4 tokens masked, confidence: 0.3551 ‚Üí 0.0113
üìä Ratio 0.2: 8 tokens masked, confidence: 0.3518 ‚Üí 0.0145
üìä Ratio 0.3: 12 tokens masked, confidence: 0.3537 ‚Üí 0.0127
üìä Ratio 0.5: 21 tokens masked, confidence: 0.3550 ‚Üí 0.0113
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.366
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 40 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.370
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 40 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.333
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 40 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.327
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 40 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 40 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3560
üìä Ratio 0.1: 1 tokens masked, confidence: 0.3547 ‚Üí 0.0013
üìä Ratio 0.2: 2 tokens masked, confidence: 0.3601 ‚Üí -0.0042
üìä Ratio 0.3: 4 tokens masked, confidence: 0.3584 ‚Üí -0.0024
üìä Ratio 0.5: 7 tokens masked, confidence: 0.3629 ‚Üí -0.0069
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.356
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 12 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.306
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 12 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.354
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 12 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.284
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 12 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 12 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3844
üìä Ratio 0.1: 2 tokens masked, confidence: 0.3817 ‚Üí 0.0026
üìä Ratio 0.2: 4 tokens masked, confidence: 0.3852 ‚Üí -0.0009
üìä Ratio 0.3: 6 tokens masked, confidence: 0.3808 ‚Üí 0.0036
üìä Ratio 0.5: 10 tokens masked, confidence: 0.3867 ‚Üí -0.0024
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.384
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 19 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.290
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 19 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.393
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 19 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.334
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 19 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 19 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3731
üìä Ratio 0.1: 1 tokens masked, confidence: 0.3734 ‚Üí -0.0002
üìä Ratio 0.2: 3 tokens masked, confidence: 0.3732 ‚Üí -0.0000
üìä Ratio 0.3: 5 tokens masked, confidence: 0.3783 ‚Üí -0.0052
üìä Ratio 0.5: 9 tokens masked, confidence: 0.3753 ‚Üí -0.0021
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.373
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 17 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.323
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 17 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.349
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 17 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.313
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 17 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 17 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 1
üìä Original confidence: 0.3857
üìä Ratio 0.1: 6 tokens masked, confidence: 0.3743 ‚Üí 0.0114
üìä Ratio 0.2: 12 tokens masked, confidence: 0.3742 ‚Üí 0.0115
üìä Ratio 0.3: 18 tokens masked, confidence: 0.3654 ‚Üí 0.0203
üìä Ratio 0.5: 31 tokens masked, confidence: 0.3586 ‚Üí 0.0271
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 1, Confidence: 0.386
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 61 tokens
üîí Reference class: 1, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 1, Confidence: 0.370
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 61 tokens
‚úÖ Seed 123: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 1, Confidence: 0.365
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 61 tokens
‚úÖ Seed 456: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 1, Confidence: 0.325
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 61 tokens
‚úÖ Seed 789: computed IG for target class 1
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 1, Confidence: 0.321
üîí Target class locked: 1 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 61 tokens
‚úÖ Seed 999: computed IG for target class 1
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3766
üìä Ratio 0.1: 1 tokens masked, confidence: 0.3759 ‚Üí 0.0007
üìä Ratio 0.2: 1 tokens masked, confidence: 0.3759 ‚Üí 0.0007
üìä Ratio 0.3: 2 tokens masked, confidence: 0.3842 ‚Üí -0.0076
üìä Ratio 0.5: 4 tokens masked, confidence: 0.3685 ‚Üí 0.0080
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.377
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 7 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.294
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 7 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.375
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 7 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.268
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 7 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 7 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3685
üìä Ratio 0.1: 4 tokens masked, confidence: 0.3591 ‚Üí 0.0094
üìä Ratio 0.2: 8 tokens masked, confidence: 0.3584 ‚Üí 0.0100
üìä Ratio 0.3: 13 tokens masked, confidence: 0.3570 ‚Üí 0.0115
üìä Ratio 0.5: 22 tokens masked, confidence: 0.3480 ‚Üí 0.0205
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.368
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 42 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.256
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 42 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.359
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 42 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.285
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 42 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 42 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3658
üìä Ratio 0.1: 4 tokens masked, confidence: 0.3415 ‚Üí 0.0244
üìä Ratio 0.2: 8 tokens masked, confidence: 0.3513 ‚Üí 0.0145
üìä Ratio 0.3: 12 tokens masked, confidence: 0.3567 ‚Üí 0.0091
üìä Ratio 0.5: 20 tokens masked, confidence: 0.3673 ‚Üí -0.0014
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.366
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 38 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.303
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 38 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.383
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 38 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.343
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 38 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 38 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3563
üìä Ratio 0.1: 12 tokens masked, confidence: 0.3542 ‚Üí 0.0021
üìä Ratio 0.2: 24 tokens masked, confidence: 0.3553 ‚Üí 0.0010
üìä Ratio 0.3: 36 tokens masked, confidence: 0.3622 ‚Üí -0.0060
üìä Ratio 0.5: 60 tokens masked, confidence: 0.3469 ‚Üí 0.0094
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.356
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 119 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.269
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 119 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.349
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 119 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.336
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 119 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.321
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 119 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...
üìä Evaluating faithfulness...
üîí Faithfulness: measuring confidence for class 0
üìä Original confidence: 0.3566
üìä Ratio 0.1: 12 tokens masked, confidence: 0.3515 ‚Üí 0.0051
üìä Ratio 0.2: 25 tokens masked, confidence: 0.3536 ‚Üí 0.0030
üìä Ratio 0.3: 38 tokens masked, confidence: 0.3546 ‚Üí 0.0020
üìä Ratio 0.5: 64 tokens masked, confidence: 0.3583 ‚Üí -0.0017
üìä Evaluating stability across seeds...
üîç Generating IG attributions for single_task_seed_42 model...
üéØ Predicted class: 0, Confidence: 0.357
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
üîí Reference class: 0, using tokenizer from seed 42
üîç Generating IG attributions for single_task_seed_123 model...
üéØ Using forced target class: 0, Confidence: 0.281
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 123: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_456 model...
üéØ Using forced target class: 0, Confidence: 0.358
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 456: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_789 model...
üéØ Using forced target class: 0, Confidence: 0.322
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 789: computed IG for target class 0
üîç Generating IG attributions for single_task_seed_999 model...
üéØ Using forced target class: 0, Confidence: 0.318
üîí Target class locked: 0 for stability analysis
üîÑ Computing Integrated Gradients with embeddings...
‚úÖ Integrated Gradients computation succeeded!
‚úÖ Generated attributions for 126 tokens
‚úÖ Seed 999: computed IG for target class 0
üìä Evaluating fairness...

5Ô∏è‚É£ Saving Results...
üíæ Saved 94 rows to explainability_results_single_task\xai_metrics_single_task_across_seeds.csv

6Ô∏è‚É£ Generating Summary...

üìä Summary Statistics:
      faithfulness_top_0.1  faithfulness_top_0.2  faithfulness_top_0.3  \
mean              0.004477              0.004836              0.005542   
std               0.007962              0.009882              0.010792   

      faithfulness_top_0.5  stability_cosine  stability_correlation  \
mean              0.004829          0.011367               0.011367   
std               0.014492          0.110762               0.110762   

      demographic_bias_ratio  attribution_concentration  
mean                0.004398                   0.461231  
std                 0.028842                   0.069159  

üéâ Single-Task Analysis Complete!")