密码统计分析

最新推荐文章于 2020-10-13 15:06:28 发布

原创 · 最新推荐文章于 2020-10-13 15:06:28 发布 · 466 阅读

0 ·

CC 4.0 BY-SA版权

❥Cryptography 专栏收录该内容

7 篇文章

订阅专栏

# Function
def do_something_with(l, dou):
    """Count single letters and adjacent letter pairs of ``l`` into ``a``.

    ``l`` is lower-cased and every non-alphabetic character is dropped
    before counting, so a pair may join two letters that were separated by
    spaces or punctuation in the original text.

    Args:
        l: Text to analyse.
        dou: Two-character sliding window used to build the pairs. A space
            in its first position means no full pair is available yet.
            Only the local copy is advanced; the caller's value is not
            changed.

    Returns:
        None. Counts are accumulated in the module-level mapping ``a``.
    """
    letters = (ch for ch in l.lower() if ch.isalpha())
    for ch in letters:
        # Single-letter tally.
        a[ch] = a.get(ch, 0) + 1

        # Slide the window: drop the oldest character, append the new one.
        dou = dou[1] + ch
        if dou[0] == ' ':
            # The window does not hold two letters yet, nothing to count.
            continue
        a[dou] = a.get(dou, 0) + 1

# Shared tally filled in by do_something_with(): letter / letter pair -> count.
a = {}
# Blank two-character window handed to every call as its starting state.
dou = '  '
# The with-block closes the file even if counting raises part-way through.
with open('statistics.txt', 'r') as file_object:
    for line in file_object:
        do_something_with(line, dou)
print(a)
len(a)

import pandas as pd
# One row per dict entry: column 0 holds the letter / letter pair,
# column 1 holds its count.
df = pd.DataFrame(list(a.items()))
# Order the rows by count, highest first. Current pandas no longer accepts a
# ``by`` argument on sort_index(); sorting by column values is done with
# sort_values(). The sorted frame is not assigned, so ``df`` itself keeps its
# original row order.
df.sort_values(by=1, ascending=False)

#output
  	0 	1
12 	e 	118461
26 	t 	79827
1 	a 	74240
24 	o 	71682
45 	i 	66301
6 	n 	64598
30 	s 	59412
3 	r 	56109
34 	h 	55006
8 	d 	44194


... 	... 	...


603 	éo 	1
639 	èt 	1
610 	ès 	1
625 	jy 	1
337 	xv 	1
630 	mê 	1
631 	êm 	1
336 	sx 	1
638 	lè 	1
662 	cj 	1
663 rows × 2 columns

import matplotlib.pyplot as plt
# Draw df twice: first as a horizontal bar chart, then as a line chart.
df.plot(kind='barh', figsize=(10, 6)) 
df.plot(kind='line') 
# NOTE(review): pyplot's xlabel/ylabel/title act on the current axes, which
# here is presumably the line chart created last - confirm that the bar chart
# is meant to stay unlabeled.
plt.xlabel('number') 
# ^ sets the x-axis label
plt.ylabel('alpher') 
# ^ sets the y-axis label
plt.title("statistics") 
# ^ sets the plot title
plt.show()