如何使用 Python pandas 交叉表创建混淆矩阵统计信息

2024-05-22 01:15:27 发布

您现在位置:Python中文网/ 问答频道 /正文

下面是我的 Python 脚本,它生成以下混淆矩阵:

enter image description here

#!/usr/bin/python -tt

from __future__ import division
import csv
import os
import pandas as pd


#----------------------------------------------------------------------------
def get_tcp_variant(filepath):
    """Classify the TCP congestion-control variant recorded in a cwnd trace.

    The CSV at *filepath* is read row by row and the first column of each
    row is parsed as an integer congestion-window sample.  Whenever a sample
    is smaller than the one before it, the ratio ``sample / previous``
    (rounded to two decimals) is recorded as a beta value.  The mean of the
    recorded ratios is then mapped onto a variant name.

    Args:
        filepath: Path of the CSV trace file.

    Returns:
        "Cubic", "Reno" or "BIC" when the mean beta falls in the matching
        range; otherwise the string "None".  "None" is also returned when
        the trace contains no decrease at all (including an empty file), as
        there is then no beta value to average.

    Raises:
        ValueError: If a first-column value cannot be parsed as an integer.
    """
    def tcp_congestion_variant(beta):
        """Map a mean beta value onto a variant name, or "None"."""
        print('predict({}; abs({})'.format(beta, abs(beta)))
        # NOTE(review): a beta of exactly 0.61 matches none of the ranges
        # below and therefore yields "None" -- confirm whether that gap
        # between the Reno and Cubic ranges is intended.
        if 0.61 < beta <= 0.75:
            return "Cubic"
        if 0.45 <= beta < 0.61:
            return "Reno"
        if 0.75 < beta <= 0.99:
            return "BIC"
        return "None"

    beta_values = []
    previous = 0
    with open(filepath, "r") as csvfile:
        for row in csv.reader(csvfile):
            # csv.reader yields an empty list for a blank line; skip it
            # instead of failing on it.
            if not row:
                continue
            # Only the first column is used; any further columns are ignored.
            value = int(row[0])
            if value < previous:
                # The window shrank: record the multiplicative decrease.
                beta_values.append(round(value / previous, 2))
            previous = value

    # Without any decrease there is nothing to average (and the division
    # below would fail), so report the trace as unclassifiable.
    if not beta_values:
        return "None"

    return tcp_congestion_variant(sum(beta_values) / len(beta_values))

# Banner announcing the confusion-matrix report.
_RULE = "*********************************************"
print("\n".join((_RULE, "Confusion matrix ", _RULE)))

# Label lists filled once per trace file, and the directory that is scanned.
matrix = dict(actual=[], predict=[])
path = './csv_files'

#----------------------------------------------------------------------------
def get_variant_predict(filename):
    if 'cubic' in filename:
        return 'Cubic'
    if 'reno' in filename:
        return "Reno"
    if 'bic' in filename:
        return "BIC"
    else:
        return filename [0]
#----------------------------------------------------------------------------

# Collect one label pair per directory entry: the label taken from the file
# name goes into 'predict', the label computed from the trace contents goes
# into 'actual'.
for filename in os.listdir(path):
    name_label = get_variant_predict(filename)
    matrix['predict'].append(name_label)
    trace_label = get_tcp_variant(os.path.join(path, filename))
    matrix['actual'].append(trace_label)

# Cross-tabulate the two label columns; rows are 'Actual', columns are
# '    Predicted'.
actual_labels = pd.Series(matrix['actual'], name='Actual')
predicted_labels = pd.Series(matrix['predict'], name='    Predicted')
data_frame = pd.crosstab(actual_labels, predicted_labels)

print(" ")

print(data_frame)

如何为 Python pandas 交叉表添加混淆矩阵统计信息(例如 accuracy)?如果手动计算,accuracy 将是 (4+24+21)/(4+24+4+1+1+21),但我想自动生成这些统计数据。


Tags: in, import, cwnd, get, return, if, value, filename