from IPython.display import display, Image
import warnings
# NOTE(review): no category or module filter is given, so this silences every
# warning for the rest of the session, including deprecation notices emitted
# by the libraries used below.
warnings.filterwarnings(action='ignore')


import pandas as pd
import numpy as np
from sklearn.model_selection import train_test_split
import matplotlib.pyplot as plt
import seaborn as sns


# Machine-learning workflow overview (static illustration shipped with the notebook).
workflow_figure = Image(filename='img/model_validation_pixel01.png')
display(workflow_figure)


from sklearn.datasets import load_digits

# Load scikit-learn's bundled digits dataset and inspect its basic structure:
# feature-matrix shape, available keys, the raw label vector and the distinct labels.
digits = load_digits()
print(digits.data.shape)
print(digits.keys(), digits.target)
print(np.unique(digits.target))

# Class distribution of the labels. The vector is passed by keyword because
# seaborn's countplot does not take the plotted variable positionally: older
# releases only emit a FutureWarning (invisible when warnings are suppressed),
# newer ones bind the first positional argument to `data`.
sns.countplot(x=digits.target)

(1797, 64)
dict_keys(['data', 'target', 'frame', 'feature_names', 'target_names', 'images', 'DESCR']) [0 1 2 ... 8 9 8]
[0 1 2 3 4 5 6 7 8 9]

<AxesSubplot:ylabel='count'>


# Recast the multi-class labels as a binary task: True only where the label is 9.
X, y = digits.data, (digits.target == 9)   # X: input features, y: boolean target

# Hold out a test set; the fixed random_state keeps the split reproducible.
split_parts = train_test_split(X, y, random_state=0)
X_train, X_test, y_train, y_test = split_parts


# Compare the class balance of the training and test targets side by side.
plt.figure(figsize=(15, 6))

plt.subplot(1, 2, 1)
# Class counts in y_train. The vector is passed as `x=` because seaborn's
# countplot does not accept the plotted variable positionally (older releases
# warn, newer ones treat the first positional argument as `data`).
sns.countplot(x=y_train)
plt.title("train")

plt.subplot(1, 2, 2)
# Class counts in y_test.
sns.countplot(x=y_test)
plt.title("test")

Text(0.5, 1.0, 'test')


from sklearn.dummy import DummyClassifier

# Baseline 1: always predict the most frequent class seen during training.
dummy_model = DummyClassifier(strategy='most_frequent')
dummy_model.fit(X_train, y_train)
pred_most_frequent = dummy_model.predict(X_test)

# Show which labels the baseline ever outputs and its accuracy on the test set.
print(f"예측된 레이블의 고유값: {np.unique(pred_most_frequent)}")
print(f"테스트 평가 정확도 : {dummy_model.score(X_test, y_test):.2f}")

예측된 레이블의 고유값: [False]
테스트 평가 정확도 : 0.90


# Baseline 2: guess labels at random, following the training class distribution.
# random_state is fixed so the predictions are reproducible from run to run.
dummy = DummyClassifier(strategy='stratified', random_state=0).fit(X_train, y_train)
pred_dummy = dummy.predict(X_test)

print("예측된 레이블의 고유값: {}".format(np.unique(pred_dummy)))
# Score the stored predictions themselves. dummy.score() would call predict()
# again, and for an unseeded stratified strategy that is a fresh random draw,
# so the printed accuracy could disagree with every metric computed later
# from pred_dummy (confusion matrix, f1, classification report).
print("테스트 평가 정확도 : {:.2f}".format(np.mean(pred_dummy == y_test)))

예측된 레이블의 고유값: [False  True]
테스트 평가 정확도 : 0.81


from sklearn.tree import DecisionTreeClassifier

# A deliberately shallow decision tree (at most two levels of splits).
tree = DecisionTreeClassifier(max_depth=2)
tree.fit(X_train, y_train)
pred_tree = tree.predict(X_test)

# Plain accuracy on the held-out test set.
print(f"테스트 평가 정확도: {tree.score(X_test, y_test):.2f}")

테스트 평가 정확도: 0.92


from sklearn.linear_model import LogisticRegression

# Logistic regression; C is the inverse regularization strength, so 0.1
# regularizes more strongly than the default of 1.0.
logreg = LogisticRegression(C=0.1)
logreg.fit(X_train, y_train)
pred_logreg = logreg.predict(X_test)

# Plain accuracy on the held-out test set.
print(f"logreg 점수: {logreg.score(X_test, y_test):.2f}")

logreg 점수: 0.98


import mglearn


# Render mglearn's built-in figure for a binary confusion matrix.
# NOTE(review): presumably a static teaching diagram that does not use the
# models fitted above (it takes no arguments) - confirm against mglearn.
mglearn.plots.plot_binary_confusion_matrix()


from sklearn.metrics import confusion_matrix

# Confusion matrix of the logistic-regression predictions on the test set
# (rows: true class, columns: predicted class).
confusion = confusion_matrix(y_test, pred_logreg)
print(f"오차 행렬:\n{confusion}")

오차 행렬:
[[402   1]
 [  6  41]]


# Render mglearn's built-in confusion-matrix illustration.
# NOTE(review): presumably an explanatory figure independent of the variables
# in this notebook (it takes no arguments) - confirm against mglearn.
mglearn.plots.plot_confusion_matrix_illustration()


# Print the test-set confusion matrix of every model, one after another.
# Each heading is kept exactly as it should appear in the output, including
# the leading newline that separates consecutive sections.
headed_predictions = [
    ("빈도 기반 더미 모델:", pred_most_frequent),
    ("\n무작위 더미 모델:", pred_dummy),
    ("\n결정 트리:", pred_tree),
    ("\n로지스틱 회귀", pred_logreg),
]
for heading, predictions in headed_predictions:
    print(heading)
    print(confusion_matrix(y_test, predictions))

빈도 기반 더미 모델:
[[403   0]
 [ 47   0]]

무작위 더미 모델:
[[368  35]
 [ 43   4]]

결정 트리:
[[390  13]
 [ 24  23]]

로지스틱 회귀
[[402   1]
 [  6  41]]


# Confusion matrix reference figure (static illustration shipped with the notebook).
confusion_figure = Image(filename='img/model_validation01.png')
display(confusion_figure)


from sklearn.metrics import f1_score

# Most-frequent baseline. It never predicts the positive class, so precision
# is undefined; zero_division=0 states the resulting 0.0 explicitly instead of
# relying on a warning that is suppressed elsewhere. The label now names the
# most-frequent model (it previously repeated the random-dummy label).
print("빈도 기반 더미 모델의 f1 score: {:.2f}".format(
    f1_score(y_test, pred_most_frequent, zero_division=0)))

# Stratified (random) dummy baseline.
print("무작위 더미 모델의 f1 score: {:.2f}".format(f1_score(y_test, pred_dummy)))

# Decision tree.
print("트리 모델의 f1 score: {:.2f}".format(f1_score(y_test, pred_tree)))

# Logistic regression.
print("로지스틱 회귀 모델의 f1 score: {:.2f}".format(f1_score(y_test, pred_logreg)))

무작위 더미 모델의 f1 score: 0.00
무작위 더미 모델의 f1 score: 0.09
트리 모델의 f1 score: 0.55
로지스틱 회귀 모델의 f1 score: 0.92


from sklearn.metrics import classification_report

# Per-class precision / recall / f1 for the most-frequent baseline.
# This model never predicts the positive class, so its precision is undefined;
# zero_division=0 reports it as 0.0 explicitly rather than depending on the
# UndefinedMetricWarning being silenced.
print(classification_report(y_test, pred_most_frequent,
                            target_names=["not 9", "is 9"],
                            zero_division=0))

              precision    recall  f1-score   support

       not 9       0.90      1.00      0.94       403
        is 9       0.00      0.00      0.00        47

    accuracy                           0.90       450
   macro avg       0.45      0.50      0.47       450
weighted avg       0.80      0.90      0.85       450


# Per-class precision / recall / f1 for the stratified (random) dummy baseline.
dummy_report = classification_report(
    y_test, pred_dummy, target_names=["not 9", "is 9"]
)
print(dummy_report)

              precision    recall  f1-score   support

       not 9       0.90      0.91      0.90       403
        is 9       0.10      0.09      0.09        47

    accuracy                           0.83       450
   macro avg       0.50      0.50      0.50       450
weighted avg       0.81      0.83      0.82       450


# Per-class precision / recall / f1 for the decision tree.
tree_report = classification_report(
    y_test, pred_tree, target_names=["not 9", "is 9"]
)
print(tree_report)

              precision    recall  f1-score   support

       not 9       0.94      0.97      0.95       403
        is 9       0.64      0.49      0.55        47

    accuracy                           0.92       450
   macro avg       0.79      0.73      0.75       450
weighted avg       0.91      0.92      0.91       450


# Per-class precision / recall / f1 for the logistic regression model.
logreg_report = classification_report(
    y_test, pred_logreg, target_names=["not 9", "is 9"]
)
print(logreg_report)

              precision    recall  f1-score   support

       not 9       0.99      1.00      0.99       403
        is 9       0.98      0.87      0.92        47

    accuracy                           0.98       450
   macro avg       0.98      0.93      0.96       450
weighted avg       0.98      0.98      0.98       450

평가 지표 및 측정

1.1.1 이진 분류의 평가지표

1.1.2 임계값과 평가지표

1.1.3 평가지표 - ROC 커브, AUC

1.1.4 다중 분류의 평가지표

학습 내용

목차

01. 데이터 준비 및 라이브러리 임포트

데이터 셋

Target 값을 이진값으로 만들기

데이터 셋의 Target(타깃)을 9:1의 비율로 나누기

02. 다양한 모델의 평가 수행

02-01 기본 모델 DummyClassifier

02-02 DummyClassifier를 이용한 예측

02-03 실제 모델 - DecisionTreeClassifier

02-04 LogisticRegression(로지스틱 회귀) 모델

한 가지 클래스만 예측하는 기본 모델도 약 90%의 정확도를 갖는다.

정확도 대신에 사용할 지표가 무엇이 있을까?

03 오차행렬(confusion matrix)을 이용하기

confusion_matrix 를 이용한 오차(혼동) 행렬 구하기

3-1 각각의 예측값에 대한 오차행렬을 확인해보기

3-2 분류의 다양한 평가지표를 살펴보기

Classification(분류)의 평가지표를 살펴보자.

정확도(accuracy) : 정확하게 예측한 수 / 전체 예측 수

정밀도(precision) : 양성(Positive)으로 예측한 것 전체(TP+FP) 중에 실제로 양성인 것(TP)의 비율

민감도(sensitivity), 재현율(recall, TPRate), 진짜 양성 비율(TPR)

특이도

FPRate

다양한 분류 측정 방법

04. f1-score를 확인해보기

F-score

각각의 모델 예측값을 f1-score로 평가

f1-score를 요약해서 보여주기

DummyClassifier 모델

의사결정트리

로지스틱 회귀