- # -*- coding: utf-8 -*-
- #---------------------------------------
- # 程序:暴走漫画的GIF趣图爬虫
- # 语言:Python 3.3
- # 说明:能自定义下载页数,默认全部下载,未加多线程功能
- #---------------------------------------
- import urllib.request
- import bs4,os
- page_sum = 1 #设置下载页数
- path = os.getcwd()
- path = os.path.join(path,'暴走GIF')
- if not os.path.exists(path):
- os.mkdir(path) #创建文件夹
- url = "http://baozoumanhua.com/gif/month/page/" #url地址
- headers = { #伪装浏览器
- 'User-Agent':'Mozilla/5.0 (Windows NT 6.1; WOW64) ApplewebKit/537.36 (Khtml, like Gecko)'
- ' Chrome/32.0.1700.76 Safari/537.36'
- }
- for count in range(page_sum):
- req = urllib.request.Request(
- url = url+str(count+1),
- headers = headers
- )
- print(req.full_url)
- content = urllib.request.urlopen(req).read()
- soup = bs4.BeautifulSoup(content) # BeautifulSoup
- img_content = soup.findAll('img',attrs={'style':'width:460px'})
- url_list = [img['src'] for img in img_content] #列表推导 url
- title_list = [img['alt'] for img in img_content] #图片名称
- for i in range(url_list.__len__()) :
- imgurl = url_list[i]
- filename = path + os.sep +title_list[i] + ".gif"
- print(filename+":"+imgurl) #打印下载信息
- urllib.request.urlretrieve(imgurl,filename) #下载图片
- #该片段来自于http://www.codesnippet.cn/detail/250220148792.html
来源: http://www.codesnippet.cn/detail/250220148792.html