代码如下:
#coding:utf8
import re
import urllib
def getHTML(url):
    """Fetch *url* and return the raw response body.

    Args:
        url: Address to open. It must carry an explicit scheme
            (``http://``, ``file://``, ...).

    Returns:
        Whatever ``read()`` yields for the opened resource: ``str`` on
        Python 2, ``bytes`` on Python 3.
    """
    from contextlib import closing

    # Prefer the Python 2 location so behaviour there is unchanged; fall
    # back to the Python 3 location when it does not exist.
    try:
        from urllib import urlopen
    except ImportError:
        from urllib.request import urlopen

    # closing() guarantees the connection is released even if read() raises;
    # the Python 2 response object is not itself a context manager.
    with closing(urlopen(url)) as page:
        return page.read()
def getImg(html, imgType):
    """Download every ``<imgType>!slider`` image referenced in *html*.

    An image is recognised by a ``src="..."`` attribute whose value contains
    a ``/``, ends in ``<imgType>!slider`` and is followed by ``" `` (closing
    quote plus one space). Each URL is printed and then saved in the current
    working directory as ``0.<imgType>``, ``1.<imgType>``, ... in the order
    the URLs appear in the page.

    Args:
        html: Page source. ``bytes`` (as returned by ``read()`` on Python 3)
            is accepted and decoded before matching.
        imgType: File extension without the dot, e.g. ``'jpg'``. It is
            matched literally.

    Returns:
        None.
    """
    # Prefer the Python 2 location so behaviour there is unchanged; fall
    # back to the Python 3 location when it does not exist.
    try:
        from urllib import urlretrieve
    except ImportError:
        from urllib.request import urlretrieve

    # On Python 2 ``bytes is str``, so this branch is never taken there.
    # Undecodable bytes are replaced rather than raising: only the URLs
    # inside src attributes are of interest (assumed to be ASCII).
    if isinstance(html, bytes) and not isinstance(html, str):
        html = html.decode('utf-8', 'replace')

    # [^"] keeps a match inside a single attribute value; a greedy ``.+``
    # would swallow everything up to the last matching image on the line.
    # re.escape() stops regex metacharacters in imgType from altering
    # the pattern.
    pattern = re.compile(
        r'src="([^"]*/[^"]+' + re.escape(imgType) + r'!slider)" '
    )

    for index, imgurl in enumerate(pattern.findall(html)):
        print(imgurl)
        urlretrieve(imgurl, '%s.%s' % (index, imgType))
# Fetch the jb51.net home page and save every "jpg!slider" image it references.
# The URL needs an explicit scheme: a bare "//host" form is not fetched over
# HTTP by urllib.
html = getHTML("http://www.jb51.net")
getImg(html, 'jpg')
新闻热点
疑难解答