import struct
import urllib
import re
# Fetch the Baidu home page, collect every character in the U+2E80..U+FFFF
# range (CJK and neighbouring blocks) and write them, GBK-encoded, to
# "meun.txt".
webmutong = urllib.urlopen("http://www.baidu.com/")
try:
    raw_html = webmutong.read()
finally:
    # Release the connection even if read() fails.
    webmutong.close()

# NOTE(review): the page is assumed to be GB2312-encoded; if the server sends
# another charset this decode raises UnicodeDecodeError -- confirm.
html = raw_html.decode("gb2312")

# The pattern must use backslash escapes: the previous '/u2e80-/uffff' form was
# a class of literal characters containing the reversed range '0-/', which
# makes the re module reject the pattern instead of matching CJK characters.
lstChinese = re.findall(u'[\u2e80-\uffff]', html)

# Join once instead of growing the string one character at a time.
sChinese = u"".join(lstChinese)

# 'with' guarantees the file is closed even if encoding or writing fails.
with open("meun.txt", 'wb') as f:
    f.write(sChinese.encode("gbk"))