词云
# Tally how many times each language name appears in `results`.
results = ['python', 'java', 'python', 'flask', 'django', 'flask']
result_dic = {}
for item_str in results:
    # dict.get supplies 0 for a name seen for the first time, so no
    # separate "not in" branch is needed.
    result_dic[item_str] = result_dic.get(item_str, 0) + 1
python里的运行结果
import pandas as pd
from pyecharts import WordCloud
# Render a word cloud of the language names and their counts
# to yuyancloud.html.
results = ['python', 'java', 'python', 'flask', 'django', 'flask']
result = pd.Series(results)
# Count once, then read both the distinct names and their counts
# from the same value_counts() result.
counts = result.value_counts()
yuyan = counts.index
nums = counts.values
wd = WordCloud(width=1300, height=620)
wd.add("", yuyan, nums, word_size_range=(20, 100))
wd.render('yuyancloud.html')
柱状图
# Two parallel sample lists: position i of `a` pairs with position i of `b`.
a = [1, 2, 3, 4, 5, 6]
b = [0.13, 0.78, 0.6, 0.92, 0.66, 0.33]
# zip() returns a zip object (an iterator), not a list of pairs.
zip(a, b)
Out[4]: <zip at 0x196647ce948>
# Iterating the zip object yields one (a_value, b_value) tuple per position.
for i in zip(a, b):
    print(i)
(1, 0.13)
(2, 0.78)
(3, 0.6)
(4, 0.92)
(5, 0.66)
(6, 0.33)
# Index-based equivalent of iterating zip(a, b): fetch both elements by
# position. The bound is derived from the list lengths rather than a
# hard-coded 6, and stops at the shorter list just as zip() does.
for i in range(min(len(a), len(b))):
    a_i = a[i]
    b_i = b[i]
    print(a_i, b_i)
1 0.13
2 0.78
3 0.6
4 0.92
5 0.66
6 0.33
# Materialise the zipped pairs as a list of tuples.
list(zip(a, b))
Out[7]: [(1, 0.13), (2, 0.78), (3, 0.6), (4, 0.92), (5, 0.66), (6, 0.33)]
import numpy as np
# Convert both lists to NumPy arrays and multiply them element by element.
a_array = np.array(a)
b_array = np.array(b)
result = np.multiply(a_array, b_array)
result
Out[16]: array([0.13, 1.56, 1.8 , 3.68, 3.3 , 1.98])
# Largest value among the element-wise products held in `result`.
result.max()
Out[17]: 3.68
# Position (0-based index) of the largest value in `result`.
result.argmax()
Out[19]: 3
# Element of `a` at index 3, the index argmax() reported in this session.
a[3]
Out[20]: 4
# Element of `b` at index 3, the index argmax() reported in this session.
b[3]
Out[22]: 0.92
# Hand-written search for the largest a[i] * b[i] product.
# The running maximum is named `max_product` so the builtin max() is not
# shadowed for the rest of the session.
# NOTE: the running maximum starts at 0, so the answer is only the true
# maximum when at least one product is positive.
max_product = 0
for i in range(min(len(a), len(b))):
    r = a[i] * b[i]
    if r > max_product:
        max_product = r
max_product
Out[25]: 3.68
jieba分词
import jieba
# Segment the sentence with jieba and print each resulting piece on its own line.
r = jieba.cut('孤舟蓑笠翁,独钓寒江雪')
for i in r:
    print(i)
孤舟
蓑笠
翁
,
独钓
寒江雪
# Segment the sentence with jieba and collect the pieces into a list
# instead of printing them.
r = jieba.cut('孤舟蓑笠翁,独钓寒江雪')
result = list(r)
result
Out[39]: ['孤舟', '蓑笠', '翁', ',', '独钓', '寒江雪']
计数value_counts
import pandas as pd
# Count occurrences of each distinct value by wrapping the list in a
# pandas Series and calling value_counts().
results = ['python', 'java', 'python', 'flask', 'django', 'flask']
result = pd.Series(data=results)
result.value_counts()
Out[49]:
python 2
flask 2
django 1
java 1
dtype: int64