首页 > 编程 > Python > 正文

Python实现批量下载图片的方法

2019-11-25 17:12:58
字体:
来源:转载
供稿:网友

本文实例讲述了Python实现批量下载图片的方法。分享给大家供大家参考。具体实现方法如下:

#!/usr/bin/env python#-*-coding:utf-8-*-'#Filename:download_file.pyimport os,sysimport reimport urllibimport urllib2base_url = 'xxx'array_url = list()pic_url = list()inner_url = list()def get_array_url(array_url,base_url):  content = urllib.urlopen(base_url).read()  array_url_a = re.findall(r'/rihan.*?.html',content)  for url in array_url_a:    url_a = 'xxx'+url    #print url_a    array_url.append(url_a)def get_inner_url(array_url,inner_url):  inner_url.append(array_url)  content = urllib.urlopen(array_url[10]).read()  content = content.replace(" ","")  url_a = re.findall(r'<li>.*?</li>',content)  for i in url_a:    url = re.findall(r'ahref=//'.*?.html//'target',i)    if len(url)>0:      # print url[0]      url_b = re.sub(r'ahref=//'','',url[0])      # print url_b      url_c = re.sub(r'//'target','',url_b)      url_c = 'http://xxx/'+re.sub(r'/.*/','',url_c)      inner_url.append(url_c)  del inner_url[1]  # print inner_urldef get_pic_url(pic_url,inner_url,array_url):  content = urllib.urlopen(array_url).read()  pic_url_a = re.findall(r'center.*?.jpg',content)  print 'bbbbbbbbb',len(pic_url_a)  pic_url_a = re.findall(r'http://.*.jpg',pic_url_a[0])  pic_url.append(pic_url_a[0])  j=2  for i in inner_url:    jj = '/'+str(j)+'.jpg'    pic = re.sub(r'/1.jpg',jj,pic_url_a[0])    pic_url.append(pic)    j = j+1  del pic_url[-1]  for i in pic_url:    print idef urlcallback(a,b,c):  """    call back function    a,已下载的数据块    b,数据块的大小    c,远程文件的大小  """  print "callback"  prec=100.0*a*b/c  if 100 < prec:    prec=100  print "%.2f%%"%(prec,)def download(img_url,file_num):    for img in img_url:      print img      img_name = re.sub(r'http://.*/','',img)      path = 'C:/'+str(file_num)+'/'+img_name      urllib.urlretrieve(img,path,urlcallback)get_array_url(array_url,base_url)file_num = 3#download(pic_url,file_num)get_inner_url(url,inner_url)get_pic_url(pic_url,inner_url,url)'''for url in array_url:  print url  # get_inner_url(url,inner_url) # get_pic_url(pic_url,inner_url)  get_inner_url(url,inner_url)  get_pic_url(pic_url,inner_url,url)  download(pic_url,file_num)  file_num = file_num+1  del inner_url[:]  del pic_url[:]'''

希望本文所述对大家的Python程序设计有所帮助。

发表评论 共有条评论
用户名: 密码:
验证码: 匿名发表