#coding=utf-8
#download pictures of the url
#usage: python downpicture.py www.baidu.com
import os
import sys
from html.parser import HTMLParser
from urllib.request import urlopen
from urllib.parse import urlparse
def getpicname(path):
  '''Return the file name component of a picture URL.

  Only the path part of the URL is examined, so a query string or
  fragment ("?v=1", "#top") never ends up in the returned name and never
  influences the extension check.

  path: URL (or bare path) of the picture.

  Returns the last path segment, e.g. 'pic.png', or None when that
  segment has no file extension.
  '''
  urlpath = urlparse(path)[2]
  # URL paths always use '/', independent of the local OS path separator.
  name = urlpath.rsplit('/', 1)[-1]
  if os.path.splitext(name)[1] == '':
    return None
  return name
def saveimgto(path, urls):
  '''Download every URL in urls into the local directory path.

  path: existing directory that receives the files.
  urls: iterable of absolute picture URLs.

  Each file is named by getpicname(url). URLs for which it returns None
  (no file extension) are skipped, since there is no name to save them
  under. When path is not a directory, prints 'path is invalid' and
  terminates through sys.exit(). Network and file errors propagate to
  the caller.
  '''
  if not os.path.isdir(path):
    print('path is invalid')
    sys.exit()
  for url in urls:
    name = getpicname(url)
    if name is None:
      continue
    # Fetch first so a failed request does not leave an empty file behind.
    with urlopen(url) as q:
      data = q.read()
    with open(os.path.join(path, name), 'wb') as of:
      of.write(data)
class myhtmlparser(HTMLParser):
  '''Collect the src attribute of every <img> tag fed to the parser.

  urls: list of the non-empty src values, in document order.
  num:  number of <img> start tags seen, with or without a usable src.
  '''
  def __init__(self):
    super().__init__()
    self.urls = []
    self.num = 0

  def handle_starttag(self, tag, attr):
    '''Record the src value(s) of an <img> tag; ignore every other tag.

    tag:  tag name as reported by HTMLParser.
    attr: list of (name, value) pairs for the tag's attributes.
    '''
    if tag.lower() != 'img':
      return
    # A valueless attribute (<img src>) is reported as None and src="" as
    # an empty string; neither is a URL, so both are dropped here.
    self.urls.extend(
      value for name, value in attr if name.lower() == 'src' and value)
    self.num += 1
if __name__ == '__main__':
  # Script entry point: fetch the page named on the command line, collect
  # the src of every <img> tag and download the pictures.
  #   argv[1]  page URL (the scheme may be omitted, http:// is assumed)
  #   argv[2]  optional target directory, defaults to D:\python\song

  # Local import: urljoin is only needed by this entry point.
  from urllib.parse import urljoin

  if len(sys.argv) < 2:
    print('usage: python downpicture.py <url> [target_dir]')
    sys.exit(1)
  url = sys.argv[1]
  # Prepend a scheme only when none was given; an https:// URL stays as is.
  if not url.startswith(('http://', 'https://')):
    url = 'http://' + url
  target = sys.argv[2] if len(sys.argv) > 2 else r'D:\python\song'
  with urlopen(url) as q:
    content = q.read().decode('utf-8', 'ignore')
  myparser = myhtmlparser()
  myparser.feed(content)
  # urljoin resolves '//host/x', '/x' and 'dir/x' against the page URL and
  # leaves absolute URLs untouched. Empty/None entries are dropped because
  # urljoin would turn them into the page URL itself.
  myparser.urls = [urljoin(url, u) for u in myparser.urls if u]
  saveimgto(target, myparser.urls)
  print('num of download pictures is {}'.format(myparser.num))

運行結果如下：

num of download pictures is 19

希望本文所述對大家的Python程序設計有所幫助。

您可能感興趣的文章:

通過代碼實例解析Pytest運行流程
這篇文章主要介紹了通過代碼實例解析Pytest運行流程,文中通過示例代碼介紹的非常詳細，對大家的學習或者工作具有一定的參考學習價值,需要的朋友可以參考下
2020-08-08
python列表推導式的原理及使用方法
這篇文章主要介紹了python列表推導式的原理及使用方法，列表推導式即list comprehension，有時也被翻譯為列表解析式，是一種創建列表的簡潔語法，更多詳細內容需要的小伙伴可以參考一下下面文章相關資料
2022-03-03
對網站內嵌gradio應用的輸入輸出做審核實現詳解
這篇文章主要為大家介紹了對網站內嵌gradio應用的輸入輸出做審核實現詳解，有需要的朋友可以借鑒參考下，希望能夠有所幫助，祝大家多多進步，早日升職加薪
2023-04-04
Python selenium的這三種等待方式一定要會!
今天給大家帶來的是關於Python的相關知識,文章圍繞著selenium三種等待方式展開,文中有非常詳細的介紹,需要的朋友可以參考下
2021-06-06
Python利用heapq實現一個優先級隊列的方法
今天小編就為大家分享一篇Python利用heapq實現一個優先級隊列的方法，具有很好的參考價值，希望對大家有所幫助。一起跟隨小編過來看看吧
2019-02-02
這篇文章主要介紹了python實現車輛跟隨滑模控制,採用指數趨近律、等速趨近律、準滑模控制的方法完成車輛跟隨問題的仿真，運行結果以圖片形式保存在同目錄下，需要的朋友可以參考下
2022-05-05