Python 下载或者直接读取 CSV 文件

来源:互联网 发布:手机端淘宝详情页高度 编辑:程序博客网 时间:2024/06/05 02:01
#! /usr/bin/python2
# coding=utf-8
#
# Download a text/CSV resource over HTTP and print its first three lines.
#
# The script performs a plain GET on `url`, reads the whole response body
# into memory, splits it on newlines and prints at most three rows.
# Two earlier experiments (download to disk + csv.reader, and splitting every
# row into comma-separated fields) are kept at the bottom as commented-out
# reference code; they are never executed.
import urllib2
import csv
from contextlib import closing

# Other data sources that were tried:
# url = 'http://quotes.money.163.com/service/chddata.html?code=1000002'
# url = 'http://table.finance.yahoo.com/table.csv?s=000002.sz'
url = 'http://hq.sinajs.cn/?list=sh600127'
# print url

# Browser-like request headers. They are currently NOT sent: the active
# Request below is built without them.
# NOTE(review): if these are ever enabled, 'Accept-Encoding: gzip' may yield a
# compressed body that this script does not decompress - confirm before use.
req_header = {
    'User-Agent': ('Mozilla/5.0 (Windows NT 6.1) AppleWebKit/537.11 '
                   '(KHTML, like Gecko) Chrome/23.0.1271.64 Safari/537.11'),
    'Accept': 'text/html;q=0.9,*/*;q=0.8',
    'Accept-Charset': 'ISO-8859-1,utf-8;q=0.7,*;q=0.3',
    'Accept-Encoding': 'gzip',
    'Connection': 'close',
    # Note: if the fetch still fails, this can be set to the host of the
    # site being scraped.
    'Referer': None,
}
# Timeout intended for urlopen(); unused by the active call below.
req_timeout = 500

# Variant that sends the headers above:
# req = urllib2.Request(url, None, req_header)
req = urllib2.Request(url)
# print req

# If no proxy is required, set_proxy() does not need to be called. It is here
# because the author's company network needed a proxy to reach the internet.
# req.set_proxy('proxy.XXX.com:911', 'http')

# closing() guarantees the response is closed even if read() raises; the
# original closed it manually, which leaked the connection on error.
# Variant with a timeout: urllib2.urlopen(req, None, req_timeout)
with closing(urllib2.urlopen(req)) as response:
    content = response.read()
    # Variant that decodes the body:
    # content = response.read().decode('GB18030')

# Print only the first three lines of the response (nothing is skipped).
# print(row) with a single argument prints exactly what `print row` does on
# Python 2, and also parses on Python 3.
rows = content.split('\n')
for row in rows[:3]:
    print(row)

# ---------------------------------------------------------------------------
# Reference only (not executed): download the file to disk, then read it back
# with the csv module.
#
# import urllib
# import csv
# # download the file
# url = 'http://table.finance.yahoo.com/table.csv?s=000002.sz'
# urllib.urlretrieve(url, "1000002.csv")
# # read it back from disk
# reader = csv.reader(file('1000002.csv','rb'))
# for line in reader:
#     print line,line[0],line[1]
#     if reader.line_num == 3:
#         break
#
# ---------------------------------------------------------------------------
# Reference only (not executed): split every row of the in-memory content
# into its comma-separated fields.
#
# #str = content.decode('gbk', 'ignore')
# #data = csv.reader(content)
# rows = content.split('\n')
# for row in rows:
#     split_row = row.split(",")
#     #split_row[1] = int(split_row[1])
#     full_data = []
#     for row_s in split_row:
#         full_data.append(row_s)
#     print full_data
# #data = str.split('"')[1].split(',')
# #for i in str.split(','):
# #    print i

0 0
原创粉丝点击