# Evaluation Metrics and Results

This notebook evaluates the performance of the healthcare medical coding assistant. We load the evaluation dataset, compute accuracy together with support-weighted precision, recall, and F1 score, and visualize the results as a bar chart.

In [1]:
import pandas as pd
import matplotlib.pyplot as plt
from sklearn.metrics import accuracy_score, precision_score, recall_score, f1_score

# Read the tab-separated evaluation set from the processed-data folder,
# then show its first rows as the cell output.
evaluation_data = pd.read_csv(
    filepath_or_buffer='../data/processed/evaluation.tsv',
    sep='\t',
)
evaluation_data.head()

In [2]:
# The evaluation frame must provide the gold codes in 'true_labels' and the
# assistant's output in 'predicted_labels'. Check this up front so a schema
# mismatch produces a readable message instead of a bare KeyError.
required_columns = ['true_labels', 'predicted_labels']
missing_columns = [col for col in required_columns if col not in evaluation_data.columns]
if missing_columns:
    raise KeyError(
        f"evaluation_data is missing required column(s): {missing_columns}; "
        f"found columns: {list(evaluation_data.columns)}"
    )

# Rows with a missing label cannot be scored. Report them explicitly rather
# than letting scikit-learn fail on NaN / mixed-type input further down.
rows_with_missing_labels = int(evaluation_data[required_columns].isna().any(axis=1).sum())
if rows_with_missing_labels:
    raise ValueError(
        f"{rows_with_missing_labels} row(s) in evaluation_data have a missing "
        "true or predicted label; clean or fill them before computing metrics."
    )

true_labels = evaluation_data['true_labels']
predicted_labels = evaluation_data['predicted_labels']

# Calculate evaluation metrics.
# average='weighted' computes each metric per label and averages the per-label
# scores weighted by the number of true instances of that label.
# zero_division=0 scores a label with an undefined metric (e.g. a code that is
# never predicted) as 0. This is the same value the default produces, but
# without emitting UndefinedMetricWarning (requires scikit-learn >= 0.22).
accuracy = accuracy_score(true_labels, predicted_labels)
precision = precision_score(true_labels, predicted_labels, average='weighted', zero_division=0)
recall = recall_score(true_labels, predicted_labels, average='weighted', zero_division=0)
f1 = f1_score(true_labels, predicted_labels, average='weighted', zero_division=0)

# Display the metrics as a one-row table (one column per metric).
metrics = {'Accuracy': accuracy, 'Precision': precision, 'Recall': recall, 'F1 Score': f1}
metrics_df = pd.DataFrame(metrics, index=[0])
metrics_df

In [3]:
# Visualize the metrics as one labeled bar per metric.
# metrics_df holds a single row whose columns are the metric names. Plotting
# the frame directly draws all four bars over one tick labeled "0", and with
# the legend hidden the bars cannot be told apart. Plotting the row as a
# Series puts the metric names on the x-axis instead.
fig, ax = plt.subplots(figsize=(10, 6))
metrics_df.iloc[0].plot(kind='bar', ax=ax, rot=0)
ax.set_title('Evaluation Metrics')
ax.set_ylabel('Score')
ax.set_ylim(0, 1)  # all four metrics are bounded to [0, 1]
ax.grid(axis='y')
plt.show()