import numpy
from os import listdir
import jieba
import operator
from gensim import corpora,models,similarities
from numpy import *
#贝叶斯算法的实现
class Bayes:
def __init__(self):
self.length=-1
self.labelcount=dict()
self.vectorcount=dict()#key:value,{label:vect}
def fit(self,dataSet,labels):
if(len(dataSet)!=len(labels)):
raise ValueError("您输入的类别与我们的数据集个数不匹配")
self.length=len(dataSet[0])
labelsnum=len(labels)#数据记录数量,类别总数量
norelabel=set(labels)#不重复类别数组
for item in norelabel:
thislabel=item
#当前类别占总类别的比例,当前类别的概率
self.labelcount[thislabel]&#