CODE:
#!/usr/bin/python
# -*- coding: utf-8 -*-
'''
Created on 2014-7-8
@author: guaguastd
@name: plot_frequencies_words.py
'''
if __name__ == '__main__':
    # Interactive driver (Python 2): repeatedly prompt for a Twitter search
    # query, collect the words of the matching tweets, and plot how often
    # each distinct word occurs, ordered from most to least frequent.
    # Typing "exit" at the prompt ends the session.

    from collections import Counter

    # Project-local helpers; their behaviour is defined in sibling modules
    # that are not visible from this file.
    from search import search_for_tweet
    from visualize import visualize_for_frequencies
    # Login helper, see http://blog.youkuaiyun.com/guaguastd/article/details/31706155
    from login import twitter_login

    # Obtain the Twitter API handle once; it is reused for every query below.
    twitter_api = twitter_login()

    from tweet import extract_tweet_entities

    while True:
        query = raw_input('\nInput the query (eg. #MentionSomeoneImportantForYou, exit to quit): ')
        if query == 'exit':
            print('Successfully exit!')
            break

        statuses = search_for_tweet(twitter_api, query)

        # Only `words` is used here; the other three values are unpacked
        # because extract_tweet_entities returns a 4-tuple.
        status_texts, screen_names, hashtags, words = extract_tweet_entities(statuses)

        # Count occurrences per distinct word, then keep just the counts in
        # descending order so that list position corresponds to word rank.
        word_counts = sorted(Counter(words).values(), reverse=True)
        visualize_for_frequencies(word_counts, "Word Rank", "Freq")
RESULT:
Input the query (eg. #MentionSomeoneImportantForYou, exit to quit): #MentionSomeoneImportantForYou
Length of statuses 100
Length of statuses 196
原文:http://blog.youkuaiyun.com/guaguastd/article/details/37554913
此博客展示了用 Python 实现单词频率可视化的代码。通过导入相关模块，获取 Twitter API，输入查询词搜索推文，提取推文实体，统计单词频率，最后对单词频率进行可视化展示。
8881

被折叠的 条评论
为什么被折叠?



