利用 urllib 和 Beautiful Soup 下载网页图片

来源:互联网 发布:上海行知小学招生简章 编辑:程序博客网 时间:2024/05/11 04:55

以百度贴吧为例

from urllib import request

import re
from bs4 import BeautifulSoup
import urllib

# Fetch one Baidu Tieba thread page, collect the <img> URLs whose src
# contains 'forum', and save each one to disk as <index>.jpg.

# Page to scrape.
PAGE_URL = r'http://tieba.baidu.com/p/4380912114?pn=1'
# Destination template; %s is replaced by the running image index.
# NOTE(review): the target directory must already exist -- urlretrieve
# does not create it.
SAVE_PATH = r'C:\Users\asus\Desktop\新建文件夹\%s.jpg'

# Index used for the next saved file; advanced only after a successful
# download so the saved files are numbered without gaps.
i = 0

# Read the page body and release the HTTP connection right away.
with request.urlopen(PAGE_URL) as response:
    html = response.read()

soup = BeautifulSoup(html, "html.parser")
img_ = soup.find_all(name='img')

# An <img> tag without a src attribute yields None from .get(); skip those
# instead of failing on the substring test.
img_sources = (tag.get('src') for tag in img_)
img_list = [src for src in img_sources if src and 'forum' in src]

for each_img_url in img_list:
    try:
        request.urlretrieve(each_img_url, SAVE_PATH % i)
    except Exception as err:
        # Best-effort per image: report the failure and move on to the next
        # URL. Unlike a bare `except`, this still lets Ctrl-C / SystemExit
        # stop the script.
        print('failed to download %s: %s' % (each_img_url, err))
    else:
        i += 1
        print(each_img_url)
0 0
原创粉丝点击