jsonpath
jsonpath 用于处理爬虫爬取的 JSON 结构化数据,可以通过路径表达式从中提取所需的字段。
from jsonpath import jsonpath
# Fetch Lagou's city list as JSON and save every city name to a text file.
import json

import jsonpath
import requests

# Endpoint that returns the Lagou city search labels as a JSON string.
url = 'http://www.lagou.com/lbs/getAllCitySearchLabels.json'
headers = {"User-Agent": "Mozilla/5.0 (compatible; MSIE 9.0; Windows NT 6.1; Trident/5.0)"}

# A timeout keeps the script from hanging forever on an unresponsive server.
response = requests.get(url, headers=headers, timeout=10)
# Fail loudly on an HTTP error instead of trying to parse an error page as JSON.
response.raise_for_status()
html_str = response.content.decode()

# Convert the JSON-formatted string into Python objects.
jsonobj = json.loads(html_str)

# Starting from the root node, collect the value of every key called "name".
citylist = jsonpath.jsonpath(jsonobj, '$..name')
# jsonpath() returns False (not an empty list) when nothing matches; normalize
# it so the output file always holds a JSON array.
if citylist is False:
    citylist = []

# Write the result to a file. The encoding is explicit because
# ensure_ascii=False emits raw non-ASCII characters, which would fail or be
# garbled under a non-UTF-8 platform default encoding.
with open('city_name.txt', 'w', encoding='utf-8') as f:
    content = json.dumps(citylist, ensure_ascii=False)
    f.write(content)


来源:博客园
作者:艺术就是π大星
链接:https://www.cnblogs.com/0916m/p/11484357.html
