In [1]:
from llama_lime.explainer import Explainer
from sklearn.ensemble import RandomForestClassifier
from sklearn.datasets import load_iris
import shap
import numpy as np

IProgress not found. Please update jupyter and ipywidgets. See https://ipywidgets.readthedocs.io/en/stable/user_install.html


In [2]:
random_forest = RandomForestClassifier()
# For simplicity, we'll just fit the model on some dummy data
iris = load_iris()
# make up new names so maybe it won't know this is a famous dataset?
feature_names = ["length of table", "width of table", "length of dresser", "width of dresser"]
X, y = iris.data, iris.target
random_forest.fit(X, y)

In [3]:
# Create an explainer
explainer = Explainer(
    random_forest,
    features=X,
    feature_names=feature_names,
    output=y,
    class_names=["living room", "bedroom", "dining room"],
    target_audience="a business person with a solid understanding of basic statistics"
)

In [4]:
explainer.add_permutation_importance()

In [5]:
explainer.add_feature_importances()

In [6]:
explainer.add_class_importances()
explainer.add_instance_importances()
explainer.add_feature_class_interactions()

In [7]:
explainer.add_lime_instances(X[10:30])

In [8]:
explainer.explain(
    "is there anything interesting from the LIME results, and do it in one sentence"
)

The LIME results indicate that the width and length of the dresser have the most significant impact on the model's predictions, while the width and length of the table have a relatively smaller influence.


In [9]:
# Use the explainer to generate explanations
# explanations = explainer.explain(X)
explanations = explainer.explain()

Based on the analysis of the model, we have identified the following key findings:

1. Feature Importance:
   - The length of the dresser has the highest permutation importance, with a mean of 0.236 and a standard deviation of 0.022. This indicates that changes in the length of the dresser have the most significant impact on the model's predictions.
   - The width of the dresser is the second most important feature, with a mean permutation importance of 0.179 and a standard deviation of 0.020.
   - The length and width of the table have lower permutation importances, with means of 0.016 and 0.013 respectively. These features have less influence on the model's predictions compared to the dresser dimensions.

2. Class Importance:
   - The living room class has an importance of 0.329, indicating that it is influenced by the features to a moderate
