Python 学习笔记

来源:互联网 发布:淘宝店铺降权处置 编辑:程序博客网 时间:2024/06/06 09:31

新手刚接触 Python,做了下面的例子。这个例子的功能是下载指定网页上的图片:


# Image scraper: fetch one web page, collect every "http:" image link found
# in its HTML and save each image into a local directory under a sequential
# file name.
import http.client
import os
import re
import threading
import urllib.request
from time import sleep, ctime
from html import parser

# Page whose image links are harvested.
PAGE_URL = "http://sc.chinaz.com/tupian/taikongtupian_3.html"
# Default destination directory. A normal (non-raw) string, so each "\\" is a
# single backslash in the resulting path.
DST_DIR = "G:\\image\\"
# Saved files are numbered START_INDEX + 1, START_INDEX + 2, ...
START_INDEX = 150
# Group 1 is the whole link, group 2 is the extension that terminated it.
IMAGE_LINK_RE = re.compile(r'(http:[^\s]*?(jpg|png|gif|JPG|PNG|GIF))')

# Failures that downjpg() reports instead of raising: network/file errors,
# malformed URLs and broken HTTP responses.
_DOWNLOAD_ERRORS = (OSError, ValueError, http.client.HTTPException)


def extract_image_links(html_text):
    """Return every image link found in *html_text*.

    Each item is a ``(url, extension)`` tuple, in document order. Only links
    starting with ``http:`` and reaching one of the extensions listed in
    ``IMAGE_LINK_RE`` without intervening whitespace are matched.
    """
    return IMAGE_LINK_RE.findall(html_text)


def _read_url(url):
    """Return the raw bytes served at *url*, closing the response afterwards."""
    with urllib.request.urlopen(url) as response:
        return response.read()


def _target_path(dst_dir, name):
    """Return the path of *name* inside *dst_dir* (``DST_DIR`` when None)."""
    return os.path.join(DST_DIR if dst_dir is None else dst_dir, name)


def _write_file(path, data):
    """Write *data* to *path*, creating the parent directory if needed."""
    directory = os.path.dirname(path)
    if directory:
        os.makedirs(directory, exist_ok=True)
    with open(path, "wb") as out:
        out.write(data)


def _decode_page(raw, charset):
    """Decode page bytes with *charset*, falling back to UTF-8.

    Undecodable bytes are replaced rather than raising: the links of interest
    are plain ASCII, so a few damaged characters elsewhere do not matter.
    """
    try:
        return raw.decode(charset or "utf-8", errors="replace")
    except LookupError:
        # The server announced a codec name Python does not know.
        return raw.decode("utf-8", errors="replace")


def downjpg(filepath, FileName="default.jpg", dst_dir=None):
    """Best-effort download of *filepath* into ``dst_dir/FileName``.

    Args:
        filepath: URL of the file to download.
        FileName: Name of the file to create inside the destination.
        dst_dir: Destination directory; ``DST_DIR`` when omitted.

    Returns:
        None. Download and write failures are printed, never raised, so a
        single bad link does not stop the caller.
    """
    print(str(filepath))
    try:
        jpg = _read_url(filepath)
    except _DOWNLOAD_ERRORS as exc:
        print("error: " + str(exc) + "\n")
        return
    print("访问网络文件"+"\n")
    path = _target_path(dst_dir, FileName)
    print("保存文件"+path+"\n")
    try:
        _write_file(path, jpg)
    except OSError as exc:
        print("error: " + str(exc) + "\n")


def upload(url, name, dst_dir=None):
    """Download *url* and save it as ``dst_dir/name``.

    Despite its name this function only downloads. Unlike ``downjpg`` it lets
    errors from ``urlopen`` / ``open`` propagate to the caller.

    Args:
        url: URL of the file to download.
        name: Name of the file to create inside the destination.
        dst_dir: Destination directory; ``DST_DIR`` when omitted.
    """
    path = _target_path(dst_dir, name)
    # Fetch first so a failed download never leaves an empty file behind.
    data = _read_url(url)
    print(url)
    _write_file(path, data)
    print(path)
    # Report the size only; dumping the binary payload floods the console.
    print(str(len(data)) + " bytes")


def main():
    """Fetch ``PAGE_URL`` and download every image it links to."""
    with urllib.request.urlopen(PAGE_URL) as website:
        charset = website.headers.get_content_charset()
        html_text = _decode_page(website.read(), charset)

    links = extract_image_links(html_text)
    print(links)
    print ("网页抓取成功,开始下载图片:")

    for index, (url, extension) in enumerate(links, start=START_INDEX + 1):
        # Keep the real extension so a png/gif is not mislabelled as .jpg.
        upload(url, str(index) + "." + extension.lower())


if __name__ == "__main__":
    main()


0 0
原创粉丝点击