☆ 问题描述
如何计算并用 matplotlib 绘制训练集、验证集和测试集上的混淆矩阵？
★ 解决方案
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
from sklearn.metrics import confusion_matrix
from sklearn.metrics import ConfusionMatrixDisplay
from sklearn.model_selection import train_test_split
# Assume the ground-truth labels and the model's predictions are already
# available for the training, validation and test sets. Each pair below is
# (actual labels, predicted labels) for one split.
train_actual_labels, train_predicted_labels = (
    np.array([1, 0, 1, 1, 0, 1, 0, 0, 1, 0]),
    np.array([1, 0, 1, 0, 0, 1, 1, 0, 1, 1]),
)
val_actual_labels, val_predicted_labels = (
    np.array([0, 1, 1, 0, 1, 0, 1, 0, 1, 0]),
    np.array([1, 1, 1, 0, 0, 1, 0, 0, 1, 1]),
)
test_actual_labels, test_predicted_labels = (
    np.array([1, 0, 0, 1, 1, 0, 0, 1, 1, 0]),
    np.array([1, 0, 1, 1, 0, 0, 0, 1, 1, 1]),
)
# Compute one confusion matrix per data split.
# `labels` is pinned so every matrix is 2x2 with rows/columns ordered [0, 1].
# Without it scikit-learn infers the classes from the data, so a split that
# contains only one class would yield a smaller matrix that no longer lines up
# with the two class names used for the plot tick labels.
class_labels = [0, 1]
train_cm = confusion_matrix(
    train_actual_labels, train_predicted_labels, labels=class_labels
)
val_cm = confusion_matrix(
    val_actual_labels, val_predicted_labels, labels=class_labels
)
test_cm = confusion_matrix(
    test_actual_labels, test_predicted_labels, labels=class_labels
)
# Print the raw matrices (rows: actual class, columns: predicted class).
print("Training Set Confusion Matrix:")
print(train_cm)
print("\nValidation Set Confusion Matrix:")
print(val_cm)
print("\nTest Set Confusion Matrix:")
print(test_cm)
# Visualize the three confusion matrices side by side as annotated heatmaps.
class_names = ['Negative', 'Positive']
plt.figure(figsize=(12, 4))
# One panel per data split, left to right: training, validation, test.
panels = (
    ('Training Set Confusion Matrix', train_cm),
    ('Validation Set Confusion Matrix', val_cm),
    ('Test Set Confusion Matrix', test_cm),
)
for position, (panel_title, matrix) in enumerate(panels, start=1):
    plt.subplot(1, 3, position)
    # annot=True with fmt='d' writes each cell's count as an integer.
    sns.heatmap(
        matrix,
        annot=True,
        fmt='d',
        cmap='Blues',
        xticklabels=class_names,
        yticklabels=class_names,
    )
    plt.title(panel_title)
    plt.xlabel('Predicted')
    plt.ylabel('Actual')
plt.tight_layout()
plt.show()