Python 抓取京东、百度的数据

来源:互联网 发布:统计师的python日记 编辑:程序博客网 时间:2024/06/08 18:52
# -*- coding: utf-8 -*-
# Fetch search-result pages from JD.com and Baidu with PyQuery and print one
# JSON object per matched result element.  The syntax used here is valid on
# both Python 2 and Python 3.
import json

from pyquery import PyQuery

try:
    from urllib.parse import quote  # Python 3
except ImportError:
    from urllib import quote  # Python 2

JD_SEARCH_URL = 'https://search.jd.com/Search?keyword='
BAIDU_SEARCH_URL = 'http://www.baidu.com/s?wd='


def _quote_keyword(keyword):
    """Return *keyword* percent-encoded for use in a URL query string."""
    # Text is encoded to UTF-8 bytes before quoting because Python 2's
    # quote() cannot handle non-ASCII unicode objects; byte strings are
    # passed through unchanged.
    if not isinstance(keyword, bytes):
        keyword = keyword.encode('utf-8')
    return quote(keyword)


def _print_record(record):
    """Print *record* as one line of JSON, keeping non-ASCII text readable."""
    text = json.dumps(record, ensure_ascii=False)
    # On Python 2 the dump can be a unicode object; encode it explicitly so
    # printing does not depend on the interpreter-wide default encoding.
    if not isinstance(text, str):
        text = text.encode('utf-8')
    print(text)


def get_jd(keyword):
    """Fetch the JD.com search page for *keyword* and print each hit.

    One record is printed for every element matching ``.gl-i-wrap``
    (presumably one product card each -- confirm against the current JD
    markup).  Each record has the keys ``price`` (text of ``.p-price``),
    ``name`` (text of ``.p-name``) and ``href`` (the ``href`` attribute of
    the first ``a`` inside ``.p-name``, or ``None`` when there is none).

    Args:
        keyword: search term, as text or UTF-8 encoded bytes.
    """
    doc = PyQuery(JD_SEARCH_URL + _quote_keyword(keyword))
    for element in doc('.gl-i-wrap'):
        item = PyQuery(element)
        name_node = item('.p-name')
        _print_record({
            'price': item('.p-price').text(),
            'name': name_node.text(),
            'href': name_node('a').attr('href'),
        })


def get_baidu(keyword):
    """Fetch the Baidu search page for *keyword* and print each hit.

    For every element matching ``.result`` the JSON stored in the
    ``data-tools`` attribute of its ``.c-tools`` descendant is decoded, the
    text of ``.c-abstract`` is added under the key ``text``, and the record
    is printed.  A result without a ``data-tools`` attribute yields a record
    that contains only ``text`` instead of aborting the whole run.

    Args:
        keyword: search term, as text or UTF-8 encoded bytes.

    Raises:
        ValueError: if a ``data-tools`` attribute is present but is not
            valid JSON.
    """
    doc = PyQuery(BAIDU_SEARCH_URL + _quote_keyword(keyword))
    for element in doc('.result'):
        item = PyQuery(element)
        raw_tools = item('div')('.c-tools').attr('data-tools')
        # attr() returns None when the attribute is absent, and json.loads
        # rejects None, so fall back to an empty record in that case.
        record = json.loads(raw_tools) if raw_tools else {}
        record['text'] = item('.c-abstract').text()
        _print_record(record)


keyword = 'iphone'
get_jd(keyword)
get_baidu(keyword)