参考文献:利用 ChiMerge 分析鸢尾花数据集(基本思想 / 实战 / 函数说明 / 程序运行结果 / 参考文献)- 码农教程
Python 代码实现:
# coding=utf-8
import time
from time import ctime


def read(file):
    """Read a comma-separated text file into a list of rows.

    Args:
        file: Path of the file to read; it is opened in text mode.

    Returns:
        A list with one entry per line of the file, each entry being the
        list of comma-separated string fields on that line, e.g.
        [['5.1', '3.5', '1.4', '0.2', 'Iris-setosa'],
         ['4.9', '3.0', '1.4', '0.2', 'Iris-setosa']].
        Only the trailing newline is stripped, so a blank line yields [''].
    """
    # The context manager closes the file even if reading or decoding raises,
    # which the previous explicit open()/close() pair did not guarantee.
    with open(file, mode="r") as fo:
        return [line.removesuffix('\n').split(',') for line in fo]


# NOTE(review): the definition of collect(instance, i) starts here, but the
# source text is cut off in the middle of its body. The visible part is kept
# below as a comment so nothing is lost; restore the full function from the
# original article before using it.
#
# Input:
#   parameter 1: list data, e.g.
#       [['5.1', '3.5', '1.4', '0.2', 'Iris-setosa'],
#        ['4.9', '3.0', '1.4', '0.2', 'Iris-setosa']]
#   parameter 2: attribute (column) index
# Output: each attribute value with the counts of the three iris classes,
#   e.g. [('4.3', [1, 0, 0]), ('4.4', [3, 0, 0]), ...], i.e.
#   (column value, [Setosa count, Versicolour count, Virginica count])
#
# def collect(instance, i):
#     # reshape into [['5.1', 'Iris-setosa'], ['4.9', 'Iris-setosa'], ...]
#     arr = []
#     for e i        <- source ends here