20 行 Python 代码抓取网页中所有 JPG 图片
时间:2014-10-11 23:57:32
收藏:0
阅读:211
#!/usr/bin/python
"""Download every JPG image referenced by a web page.

The page is fetched with ``getHtml``; ``getImg`` then scans the markup for
``src="....jpg" width`` attributes and saves each match into the current
working directory as ``0.jpg``, ``1.jpg``, ... in order of appearance.
"""
import contextlib
import re
import urllib

try:  # Python 3 moved these helpers into urllib.request
    from urllib.request import urlopen, urlretrieve
except ImportError:  # Python 2 keeps them directly on urllib
    urlopen = urllib.urlopen
    urlretrieve = urllib.urlretrieve

# Captures the URL of an <img>-style ``src`` attribute that ends in ".jpg"
# and is immediately followed by a ``width`` attribute.  ``[^"]*`` keeps the
# capture inside a single quoted value, so it cannot start at an earlier,
# unrelated ``src="`` and swallow markup up to a later ".jpg".
JPG_SRC_RE = re.compile(r'src="([^"]*\.jpg)" width')


def getHtml(url):
    """Fetch *url* and return the raw response body.

    The connection is closed before returning, even if reading fails.
    """
    # contextlib.closing works on both Python 2 and 3 response objects.
    with contextlib.closing(urlopen(url)) as page:
        return page.read()


def getImg(html):
    """Download every JPG referenced in *html* to the working directory.

    *html* may be text or the raw bytes returned by ``getHtml``.  Images are
    written as ``<index>.jpg`` where the index is the zero-based position of
    the match in the page.  A failing download propagates its exception and
    stops the loop, as before.

    Returns the list of filenames written, in download order (empty when the
    page contains no matching image).
    """
    # On Python 3 the response body is bytes, which a str regex cannot scan.
    # (On Python 2 ``bytes`` is ``str`` and the data is used unchanged.)
    # Only the ASCII markup around the URL matters here, so undecodable
    # bytes are replaced rather than treated as an error.
    if isinstance(html, bytes) and not isinstance(html, str):
        html = html.decode('utf-8', 'replace')

    saved = []
    for num, imgurl in enumerate(JPG_SRC_RE.findall(html)):
        filename = '%d.jpg' % num
        urlretrieve(imgurl, filename)
        saved.append(filename)
    return saved


if __name__ == '__main__':
    # Guarded so importing this module does not hit the network.
    html = getHtml('http://tieba.baidu.com/p/1805615679')
    getImg(html)
评论(0)