string 字符串(即不能修改的字符list)
字符串是一个整体。如果你想直接修改字符串的某一部分,是不可能的。但我们能够读出字符串的某一部分。
子字符串的提取
str[:6]
字符串包含判断操作符:in,not in
"He" in str
"she" not in str
替换
s = s.replace(c,'')
去掉空格和首末尾的字符
s.strip().lstrip().rstrip(',')
将字符串前n个字符替换为指定的字符
指定字符 = ""  #填入用来替换的字符,例如 "*"
n = 3
sstr1 = n * 指定字符 + sstr1[n:]
string模块
S.find(substring, [start [,end]]) #可指范围查找子串,返回索引值,否则返回-1
S.rfind(substring,[start [,end]]) #反向查找
S.index(substring,[start [,end]]) #同find,只是找不到产生ValueError异常
S.rindex(substring,[start [,end]])#同上反向查找
S.count(substring,[start [,end]]) #返回找到子串的个数
string.lowercase #string模块中的常量(包含所有小写字母),不是字符串方法;转小写请用S.lower()
S.capitalize() #首字母大写
S.lower() #转小写
S.upper() #转大写
S.swapcase() #大小写互换
S.split(' ') #将string转list,以空格切分
' '.join(list) #将list转string,以空格连接
处理字符串的内置函数
len(str) #串长度
cmp("my friend", str) #字符串比较。第一个大,返回1
max('abcxyz') #寻找字符串中最大的字符
min('abcxyz') #寻找字符串中最小的字符
string的转换
float(str) #变成浮点数,float("1e-1") 结果为0.1
int(str) #变成整型, int("12") 结果为12
int(str,base) #将str按base进制解析为整型数,int("11",2) 结果为3
long(str) #变成长整型,
long(str,base) #变成base进制长整型,
字符串的格式化
str_format % (参数列表) #参数列表是以tuple的形式定义的,即运行中不可改变,例如 "%s's height is %dcm" % ("My brother", 180)
json数据交换语言
建立于两种结构
1“名称/值”对的集合(A collection of name/value pairs)
对象(object),纪录(record),结构(struct),字典(dictionary),哈希表(hash table),有键列表(keyed list),关联数组(associative array)
2值的有序列表(An ordered list of values)
数组(array)
简单数据类型的encoding和decoding:
1用json.dumps()去encode编码返回了一个str对象,
2对这个str进行decode解码使用json.loads()
json.dumps 参数可供选择,
1.sort_keys对dict对象按key进行排序,有利于观察比较
json.dumps(data1, sort_keys=True)
2.indent增加缩进 数据存储的格式更优雅
json.dumps(data1, sort_keys=True, indent=4)
3.separators对数据进行压缩
json主要是作为数据通信的格式存在的,去掉多余的空格可以减小传输的数据量
参数传递的是一个元组,包含用于分隔各个对象的字符串
json.dumps(data, separators=(',', ':'))
4.skipkeys 默认为False。dumps方法存储dict对象时,key必须是str等基本类型(str、int、float、bool、None),如果出现了其他类型(例如tuple)的话,那么会产生TypeError异常;如果开启该参数,设为True的话,则会比较优雅地过渡(直接跳过这些key)
json.dumps(data, skipkeys=True)
data = {'b': 789, 'c': 456, (1, 2): 123}
json.dumps(data, skipkeys=True)
输出:
{"c": 456, "b": 789}
下面这个例子是研究微博关注的。我现在是想把三十多页都集合到一个字典,然后调用key的value,最终分析对比我关注的人和其他人关注的人的重叠。有想法、愿意教我的,希望能留言~谢谢~
# -*- coding: utf-8 -*-
import urllib2
url = 'http://m.weibo.cn/p/1005051854260585/detailJson?containerid=1005051854260585_-_FOLLOWERS&page=1'
req = urllib2.Request(url)
req.add_header('User-agent', 'Mozilla/5.0')
data = urllib2.urlopen(req).read()
#print data
print type(data)
import json
ddata = json.loads(data)#json建立于“key/value”的集合也就是列表或字典
#print ddata
print type(ddata)
datareligne = json.dumps(ddata,sort_keys=True,indent=4)
print datareligne
print type(datareligne)
输出
<type 'str'> <type 'dict'> { "card_type_name": "\u5173\u6ce8", "count": 486, "maxPage": 31, "msg": "", "ok": 1, "title": "\u5173\u6ce8", "type": "pageuserlist", "userInfo": { "basicinfo": { "description": "", "error": "parameter (uid)'s value invalid,expect (long[1~9223372036854775807]), but get (0), see doc for more info.", "error_code": 10017, "request": "/2/account/profile/basic.json" }, "closeRelation": null, "err": null, "errno": null, "rank": null, "relation": -1, "sendMsg": 0, "weihao": "" }, "users": [ { "created_at": "\u4eca\u5929 11:29", "desc1": "\u516c\u53f8\u5c01\u4e86\u4e00\u5927\u7247\u7f51\u7ad9\uff0c\u6ca1\u60f3\u5230\u94c1\u8840\u793e\u533a\u5c45\u7136\u8fd8\u80fd\u4e0a\uff0c\u5947\u8ff9\u3002 \u6211\u5728\u8fd9\u91cc:http://t.cn/z8Afeh3", "desc2": "\u4eca\u5929 11:29", "fansNum": 1961, "gender": "m", "h5icon": { "main": "http://u1.sinaimg.cn/upload/2013/02/22/v_yellow_2x.png", "other": [] }, "icon": [ "http://u1.sinaimg.cn/upload/2013/01/23/v_yellow_2x.png" ], "id": 1656303911, "ismember": 0, "mbtype": 0, "profile_image_url": "http://tp4.sinaimg.cn/1656303911/50/40026529101/1", "profile_url": "pandor", "remark": "", "screen_name": "\u5047\u88c5\u5728\u7f16\u7a0b", "text": "\u516c\u53f8\u5c01\u4e86\u4e00\u5927\u7247\u7f51\u7ad9\uff0c\u6ca1\u60f3\u5230\u94c1\u8840\u793e\u533a\u5c45\u7136\u8fd8\u80fd\u4e0a\uff0c\u5947\u8ff9\u3002 \u6211\u5728\u8fd9\u91cc:http://t.cn/z8Afeh3", "valid": 0, "verified": true, "verified_type": 0, "vipInfo": { "valid": 0 } }, { "created_at": "09-10 09:25", "desc1": "\u4ec0\u4e48\u9985\u5440\uff1f", "desc2": "09-10 09:25", "fansNum": 1649, "gender": "f", "h5icon": { "main": "http://u1.sinaimg.cn/upload/2013/02/22/star_square_2x.png", "other": [] }, "icon": [ "http://u1.sinaimg.cn/upload/2013/01/23/star_square_2x.png" ], "id": 1793380877, "ismember": 0, "mbtype": 0, "profile_image_url": "http://tp2.sinaimg.cn/1793380877/50/40021664562/0", "profile_url": "juliewho", "remark": "", "screen_name": "\u6731\u5927\u529b", "text": 
"\u4ec0\u4e48\u9985\u5440\uff1f", "valid": 0, "verified": false, "verified_type": 220, "vipInfo": { "valid": 0 } }, { "created_at": "1\u5206\u949f\u524d", "desc1": "\u9c7c\u53f0:\u201c\u4f60\u7528\u7535\uff0c\u6211\u7528\u5fc3\u201d\u5b89\u5168\u670d\u52a1\u9001\u4e0a\u95e8 \u5207\u5b9e\u63d0\u9ad8...http://t.cn/z8oJmdh", "desc2": "1\u5206\u949f\u524d", "fansNum": 7403, "gender": "f", "h5icon": { "main": 0, "other": [] }, "icon": [], "id": 2236077040, "ismember": 0, "mbtype": 0, "profile_image_url": "http://tp1.sinaimg.cn/2236077040/50/5616889140/0", "profile_url": "infosecsupergirl", "remark": "", "screen_name": "\u975e\u8457\u540d\u5973\u9ed1\u5ba2", "text": "\u9c7c\u53f0:\u201c\u4f60\u7528\u7535\uff0c\u6211\u7528\u5fc3\u201d\u5b89\u5168\u670d\u52a1\u9001\u4e0a\u95e8 \u5207\u5b9e\u63d0\u9ad8...http://t.cn/z8oJmdh", "valid": 0, "verified": false, "verified_type": -1, "vipInfo": { "valid": 0 } }, { "created_at": "40\u5206\u949f\u524d", "desc1": "\u548c\u53f0\u6e7e\u4e00\u4f01\u4e1a\u7684\u8001\u677f\u5fae\u4fe1\uff0c\u6211\u53eb\u4eba\u5bb6\u300c\u963f\u5fb7\u300d\u3002\u6700\u540e\u6211\u8bf4\u300c\u597d\uff0c\u8c22\u8c22\u963f\u5fb7\u300d\u3002\u7ed3\u679c\u624b\u4e00\u5feb\uff0c\u53d1\u6210\u4e86\u300c\u597d\uff0c\u8c22\u8c22\u963f\u300d\u3002#\u53f0\u5317\u548c\u4e1c\u5317\u53ea\u662f\u90a3\u4e00\u4e2a\u5b57\u7684\u8ddd\u79bb# [\u6c57]", "desc2": "40\u5206\u949f\u524d", "fansNum": 1404, "gender": "m", "h5icon": { "main": 0, "other": [ "http://u1.sinaimg.cn/upload/2013/01/23/crown_2x.png" ] }, "icon": [ "http://u1.sinaimg.cn/upload/2013/01/23/crown_2x.png" ], "id": 1623611801, "ismember": 1, "mbtype": 12, "profile_image_url": "http://tp2.sinaimg.cn/1623611801/50/5651714023/1", "profile_url": "andypanda", "remark": "", "screen_name": "AndyPan\u7ae5\u978b", "text": 
"\u548c\u53f0\u6e7e\u4e00\u4f01\u4e1a\u7684\u8001\u677f\u5fae\u4fe1\uff0c\u6211\u53eb\u4eba\u5bb6\u300c\u963f\u5fb7\u300d\u3002\u6700\u540e\u6211\u8bf4\u300c\u597d\uff0c\u8c22\u8c22\u963f\u5fb7\u300d\u3002\u7ed3\u679c\u624b\u4e00\u5feb\uff0c\u53d1\u6210\u4e86\u300c\u597d\uff0c\u8c22\u8c22\u963f\u300d\u3002#\u53f0\u5317\u548c\u4e1c\u5317\u53ea\u662f\u90a3\u4e00\u4e2a\u5b57\u7684\u8ddd\u79bb# [\u6c57]", "valid": 1, "verified": false, "verified_type": -1, "vipInfo": { "valid": 1 } }, { "created_at": "\u4eca\u5929 11:34", "desc1": "9\u6708\u6570\u636e\u5e93\u6d41\u884c\u5ea6\u6392\u884c\u699c", "desc2": "\u4eca\u5929 11:34", "fansNum": "62\u4e07", "gender": "m", "h5icon": { "main": 0, "other": [ "http://u1.sinaimg.cn/upload/2013/01/23/crown_2x.png" ] }, "icon": [ "http://u1.sinaimg.cn/upload/2013/01/23/crown_2x.png" ], "id": 1784501333, "ismember": 1, "mbtype": 12, "profile_image_url": "http://tp2.sinaimg.cn/1784501333/50/5651634056/1", "profile_url": "betterdata", "remark": "", "screen_name": "\u6570\u636e\u6316\u6398\u4e0e\u6570\u636e\u5206\u6790", "text": "9\u6708\u6570\u636e\u5e93\u6d41\u884c\u5ea6\u6392\u884c\u699c", "valid": 1, "verified": false, "verified_type": -1, "vipInfo": { "valid": 1 } }, { "created_at": "2\u5206\u949f\u524d", "desc1": "\u3010\u81ea\u6211\u5ba1\u67e5\u548c\u4e25\u5389\u60e9\u7f5a\u6784\u5efa\u6709\u6548\u7684\u5ba1\u67e5\u4f53\u5236\u3011\u8bb0\u8005Mitch Moxley\u521a\u5230\u5317\u4eac\u8fdb\u5165\u5b98\u65b9\u82f1\u6587\u62a5\u7eb8\u300a\u4e2d\u56fd\u65e5\u62a5\u300b\u5de5\u4f5c\u65f6\uff0c\u4ee5\u4e3a\u4f1a\u6709\u4e00\u6bb5\u95f4\u8c0d\u7535\u5f71\u822c\u523a\u6fc0\u7684\u7ecf\u5386\uff0c\u5171\u4ea7\u4e3b\u4e49\u95f4\u8c0d\u8d8a\u8fc7\u80a9\u8180\u5077\u7aa5\uff0c\u8fc7\u6ee4\u7535\u5b50\u90ae\u4ef6\uff0c\u76d1\u542c\u7535\u8bdd\uff0c\u6df1\u591c\u906d\u7a7f\u6bdb\u5f0f\u670d\u88c5\u7684\u4eba\u7684\u5a01\u80c1\u3002...http://t.cn/z89ra5o", "desc2": "2\u5206\u949f\u524d", "fansNum": 13887, "gender": "m", "h5icon": { "main": 
"http://u1.sinaimg.cn/upload/2013/02/22/v_blue_2x.png", "other": [] }, "icon": [ "http://u1.sinaimg.cn/upload/2013/01/23/v_blue_2x.png" ], "id": 1686235170, "ismember": 0, "mbtype": 0, "profile_image_url": "http://tp3.sinaimg.cn/1686235170/50/1265076471/1", "profile_url": "solidot", "remark": "", "screen_name": "Solidot", "text": "\u3010\u81ea\u6211\u5ba1\u67e5\u548c\u4e25\u5389\u60e9\u7f5a\u6784\u5efa\u6709\u6548\u7684\u5ba1\u67e5\u4f53\u5236\u3011\u8bb0\u8005Mitch Moxley\u521a\u5230\u5317\u4eac\u8fdb\u5165\u5b98\u65b9\u82f1\u6587\u62a5\u7eb8\u300a\u4e2d\u56fd\u65e5\u62a5\u300b\u5de5\u4f5c\u65f6\uff0c\u4ee5\u4e3a\u4f1a\u6709\u4e00\u6bb5\u95f4\u8c0d\u7535\u5f71\u822c\u523a\u6fc0\u7684\u7ecf\u5386\uff0c\u5171\u4ea7\u4e3b\u4e49\u95f4\u8c0d\u8d8a\u8fc7\u80a9\u8180\u5077\u7aa5\uff0c\u8fc7\u6ee4\u7535\u5b50\u90ae\u4ef6\uff0c\u76d1\u542c\u7535\u8bdd\uff0c\u6df1\u591c\u906d\u7a7f\u6bdb\u5f0f\u670d\u88c5\u7684\u4eba\u7684\u5a01\u80c1\u3002...http://t.cn/z89ra5o", "valid": 0, "verified": true, "verified_type": 5, "vipInfo": { "valid": 0 } }, { "created_at": "27\u5206\u949f\u524d", "desc1": "\u4e0a\u5348\u90e8\u5206\u7b80\u8baf\u66f4\u65b0\uff1a\u300aiWork\u3001iMovie\u3001iPhoto \u5c06\u5168\u90e8\u514d\u8d39\u300b\u300a\u56fd\u65b0\u529e\u8521\u540d\u7167\u4f1a\u89c1Facebook COO\u6851\u5fb7\u4f2f\u683c\u4e00\u884c\u300b\u300a\u4e3aSpaceX\u706b\u7bad\u63a8\u51fa\u7684\u7c7b\u4f3c\u94a2\u94c1\u4fa0\u7684\u79d1\u6280\u53ca\u8bbe\u8ba1\u6280\u672f\u300b\u300a\u5df4\u58eb\u4e4b\u65c5\uff0c\u6539\u88c5\u5df4\u58eb\u6210\u79fb\u52a8\u7684\u5bb6\uff08\u7fa1\u6155\u6b7b\u4e86\uff01\uff09\u300b\u300aJava 8 Optional\u7c7b\u6df1\u5ea6\u89e3\u6790\uff08\u82f1\u6587\uff09\u300b-> http://t.cn/h4QZB0 \uff08\u652f\u6301\u624b\u673a\u9605\u8bfb\uff0c\u6b22\u8fce\u6295\u9012\uff09", "desc2": "27\u5206\u949f\u524d", "fansNum": "10\u4e07", "gender": "m", "h5icon": { "main": "http://u1.sinaimg.cn/upload/2013/02/22/v_blue_2x.png", "other": [] }, "icon": [ 
"http://u1.sinaimg.cn/upload/2013/01/23/v_blue_2x.png" ], "id": 1670481425, "ismember": 0, "mbtype": 0, "profile_image_url": "http://tp2.sinaimg.cn/1670481425/50/1286328769/1", "profile_url": "jobbole", "remark": "", "screen_name": "\u4f2f\u4e50\u5728\u7ebf\u5b98\u65b9\u5fae\u535a", "text": "\u4e0a\u5348\u90e8\u5206\u7b80\u8baf\u66f4\u65b0\uff1a\u300aiWork\u3001iMovie\u3001iPhoto \u5c06\u5168\u90e8\u514d\u8d39\u300b\u300a\u56fd\u65b0\u529e\u8521\u540d\u7167\u4f1a\u89c1Facebook COO\u6851\u5fb7\u4f2f\u683c\u4e00\u884c\u300b\u300a\u4e3aSpaceX\u706b\u7bad\u63a8\u51fa\u7684\u7c7b\u4f3c\u94a2\u94c1\u4fa0\u7684\u79d1\u6280\u53ca\u8bbe\u8ba1\u6280\u672f\u300b\u300a\u5df4\u58eb\u4e4b\u65c5\uff0c\u6539\u88c5\u5df4\u58eb\u6210\u79fb\u52a8\u7684\u5bb6\uff08\u7fa1\u6155\u6b7b\u4e86\uff01\uff09\u300b\u300aJava 8 Optional\u7c7b\u6df1\u5ea6\u89e3\u6790\uff08\u82f1\u6587\uff09\u300b-> http://t.cn/h4QZB0 \uff08\u652f\u6301\u624b\u673a\u9605\u8bfb\uff0c\u6b22\u8fce\u6295\u9012\uff09", "valid": 0, "verified": true, "verified_type": 5, "vipInfo": { "valid": 0 } }, { "created_at": "24\u5206\u949f\u524d", "desc1": "\u3010\u4e3aPHP\u5f00\u53d1\u8005\u51c6\u5907\u768412\u4e2a\u8c03\u8bd5\u5de5\u5177\u3011PHP\u662f\u5728\u5b9e\u8df5\u4e2d\u53d1\u5c55\u8fc5\u901f\u5e76\u88ab\u6700\u591a\u4f7f\u7528\u7684\u811a\u672c\u8bed\u8a00\u3002\u4e3a\u6784\u5efa\u6781\u5177\u521b\u65b0\u4e50\u8da3\u7684Web\u5e94\u7528\uff0cPHP\u5f00\u53d1\u4eba\u5458\u6301\u7eed\u641c\u5bfb\u7740\u6709\u7528\u7684\u5de5\u5177\u3002\u5728\u8fd9\u7bc7\u6587\u7ae0\u4e2d\u6536\u96c6\u4e86\u5f00\u53d1\u4eba\u5458\u768412\u4e2aPHP\u8c03\u8bd5\u5de5\u5177\uff0c\u5b83\u4eec\u5c06\u6709\u52a9\u4e8e\u5f00\u53d1\u4eba\u5458\u8f7b\u677e\u627e\u51fa\u5e76\u8c03\u8bd5\u5e94\u7528\u7a0b\u5e8f\u53ca\u811a\u672c\u4e2d\u7684\u9519\u8bef\u3002\u5168\u6587=>http://t.cn/z891std", "desc2": "24\u5206\u949f\u524d", "fansNum": 32511, "gender": "m", "h5icon": { "main": "http://u1.sinaimg.cn/upload/2013/02/22/v_blue_2x.png", "other": [] }, 
"icon": [ "http://u1.sinaimg.cn/upload/2013/01/23/v_blue_2x.png" ], "id": 2857596964, "ismember": 1, "mbtype": 2, "profile_image_url": "http://tp1.sinaimg.cn/2857596964/50/40014857714/1", "profile_url": "209091423", "remark": "", "screen_name": "WEB\u5f00\u53d1\u8005", "text": "\u3010\u4e3aPHP\u5f00\u53d1\u8005\u51c6\u5907\u768412\u4e2a\u8c03\u8bd5\u5de5\u5177\u3011PHP\u662f\u5728\u5b9e\u8df5\u4e2d\u53d1\u5c55\u8fc5\u901f\u5e76\u88ab\u6700\u591a\u4f7f\u7528\u7684\u811a\u672c\u8bed\u8a00\u3002\u4e3a\u6784\u5efa\u6781\u5177\u521b\u65b0\u4e50\u8da3\u7684Web\u5e94\u7528\uff0cPHP\u5f00\u53d1\u4eba\u5458\u6301\u7eed\u641c\u5bfb\u7740\u6709\u7528\u7684\u5de5\u5177\u3002\u5728\u8fd9\u7bc7\u6587\u7ae0\u4e2d\u6536\u96c6\u4e86\u5f00\u53d1\u4eba\u5458\u768412\u4e2aPHP\u8c03\u8bd5\u5de5\u5177\uff0c\u5b83\u4eec\u5c06\u6709\u52a9\u4e8e\u5f00\u53d1\u4eba\u5458\u8f7b\u677e\u627e\u51fa\u5e76\u8c03\u8bd5\u5e94\u7528\u7a0b\u5e8f\u53ca\u811a\u672c\u4e2d\u7684\u9519\u8bef\u3002\u5168\u6587=>http://t.cn/z891std", "valid": 0, "verified": true, "verified_type": 5, "vipInfo": { "valid": 0 } }, { "created_at": "09-08 18:08", "desc1": "\u4eca\u5929\u542c\u5230\u4e00\u4e2aMoco\u7684\u65b0\u7528\u6cd5\uff0c\u7528\u6765\u7834\u89e3\u6e38\u620f\uff0c\u6211\u90fd\u60ca\u5446\u4e86\u3002\u7528HTTP\u65b9\u5f0f\u9a8c\u8bc1\u7684\u6e38\u620f\uff0c\u4f60\u4eec\u90fd\u5c0f\u5fc3\u70b9\uff01", "desc2": "09-08 18:08", "fansNum": 1370, "gender": "m", "h5icon": { "main": 0, "other": [] }, "icon": [], "id": 2192241300, "ismember": 0, "mbtype": 0, "profile_image_url": "http://tp1.sinaimg.cn/2192241300/50/5625742561/1", "profile_url": "dreamhead", "remark": "", "screen_name": "dreamhead", "text": "\u4eca\u5929\u542c\u5230\u4e00\u4e2aMoco\u7684\u65b0\u7528\u6cd5\uff0c\u7528\u6765\u7834\u89e3\u6e38\u620f\uff0c\u6211\u90fd\u60ca\u5446\u4e86\u3002\u7528HTTP\u65b9\u5f0f\u9a8c\u8bc1\u7684\u6e38\u620f\uff0c\u4f60\u4eec\u90fd\u5c0f\u5fc3\u70b9\uff01", "valid": 0, "verified": false, "verified_type": -1, "vipInfo": { 
"valid": 0 } }, { "created_at": "09-04 14:39", "desc1": "[\u9f13\u638c]", "desc2": "09-04 14:39", "fansNum": 64172, "gender": "m", "h5icon": { "main": "http://u1.sinaimg.cn/upload/2013/02/22/v_blue_2x.png", "other": [] }, "icon": [ "http://u1.sinaimg.cn/upload/2013/01/23/v_blue_2x.png" ], "id": 1689230501, "ismember": 0, "mbtype": 0, "profile_image_url": "http://tp2.sinaimg.cn/1689230501/50/5664244979/1", "profile_url": "mckinseyquarterlycn", "remark": "", "screen_name": "\u9ea6\u80af\u9521\u5b63\u520a", "text": "[\u9f13\u638c]", "valid": 0, "verified": true, "verified_type": 3, "vipInfo": { "valid": 0 } } ] } <type 'str'> [Finished in 0.9s]
0918string的操作和json的初步了解~
最新推荐文章于 2021-12-15 16:08:08 发布