Python實現(xiàn)多線程下載腳本的示例代碼

更新時間：2020年04月03日 15:04:23 作者：LetheSec

這篇文章主要介紹了Python實現(xiàn)多線程下載腳本的示例代碼，文中通過示例代碼介紹的非常詳細，對大家的學習或者工作具有一定的參考學習價值，需要的朋友們下面隨著小編來一起學習學習吧

0x01 分析

一個簡單的多線程下載資源的Python腳本，主要實現(xiàn)部分包含兩個類：

Download類：包含download()和get_complete_rate()兩種方法。

download()方法種首先用 urlopen() 方法打開遠程資源并通過 Content-Length獲取資源的大小，然后計算每個線程應(yīng)該下載網(wǎng)絡(luò)資源的大小及對應(yīng)部分嗎，最后依次創(chuàng)建并啟動多個線程來下載網(wǎng)絡(luò)資源的指定部分。
get_complete_rate()則是用來返回已下載的部分占全部資源大小的比例，用來回顯進度。

ThreadDownload類：該線程類繼承了threading.Thread類，包含了一個run()方法。

run()方法主要負責每個線程讀取網(wǎng)絡(luò)數(shù)據(jù)并寫入本地。

0x02 代碼

# 文件名：ThreadDownload.py
import threading
from urllib.request import *


class Download:
  def __init__(self, link, file_path, thread_num):
    # 下載路徑
    self.link = link
    # 保存位置
    self.file_path = file_path
    # 使用多少線程
    self.thread_num = thread_num
    # 初始化threads數(shù)組
    self.threads = []

  def download(self):
    req = Request(url=self.link, method='GET')
    req.add_header('Accept', '*/*')
    req.add_header('Charset', 'UTF-8')
    req.add_header('Connection', 'Keep-Alive')
    f = urlopen(req)
    # 獲取要下載的文件的大小
    self.file_size = int(dict(f.headers).get('Content-Length', 0))
    f.close()
    # 計算每個線程要下載的資源的大小
    current_part_size = self.file_size // self.thread_num + 1
    for i in range(self.thread_num):
      # 計算每個線程下載的開始位置
      start_pos = i * current_part_size
      # 每個線程使用一個wb模式打開的文件進行下載
      t = open(self.file_path, 'wb')
      t.seek(start_pos, 0)
      # 創(chuàng)建下載線程
      td = ThreadDownload(self.link, start_pos, current_part_size, t)
      self.threads.append(td)
      td.start()

  # 獲下載的完成百分比
  def get_complete_rate(self):
    sum_size = 0
    for i in range(self.thread_num):
      sum_size += self.threads[i].length
    return sum_size / self.file_size

class ThreadDownload(threading.Thread):
  def __init__(self, link, start_pos, current_part_size, current_part):
    super().__init__() 
    # 下載路徑
    self.link = link
    # 當前線程的下載位置
    self.start_pos = start_pos
    # 定義當前線程負責下載的文件大小
    self.current_part_size = current_part_size
    # 當前文件需要下載的文件快
    self.current_part = current_part
    # 定義該線程已經(jīng)下載的字節(jié)數(shù)
    self.length = 0
  
  def run(self):
    req = Request(url = self.link, method='GET')
    req.add_header('Accept', '*/*')
    req.add_header('Charset', 'UTF-8')
    req.add_header('Connection', 'Keep-Alive')

    f = urlopen(req)
    # 跳過self.start_pos個字節(jié)，表明該線程只負責下載自己負責的那部分內(nèi)容
    for i in range(self.start_pos):
      f.read(1)
    # 讀取網(wǎng)絡(luò)數(shù)據(jù)，并寫入本地
    while self.length < self.current_part_size:
      data = f.read(1024)
      if data is None or len(data) <= 0:
        break
      self.current_part.write(data)
      # 累計該線程下載的總大小
      self.length += len(data)
    self.current_part.close()
    f.close()

#!/usr/bin/env python 
# -*- coding: utf-8 -*- 
# 文件名：thread_download-master.py

import sys
import time

from ThreadDownload import *


def show_process(dl):
  while dl.get_complete_rate() < 1:
    complete_rate = int(dl.get_complete_rate()*100) 
    print('\r' + '下載中···（已下載' + str(complete_rate) + '%）', end='', flush=True)
    time.sleep(0.01)


def main():
  try:  
    Link = input('[+]' + 'Link: ')
    file_path = input('[+]' + 'File Path: ')
    thread_number = input('[+]' + 'Thread Number: ')
    thread_number = int(thread_number)
    dl = Download(Link, file_path, thread_number)
    dl.download()
    print('\n開始下載!')
    show_process(dl)
    print('\r' + '下載中···（已下載' + '100%)', end='', flush=True)
    print('\n下載完成!')
  except Exception:
      print('Parameter Setting Error')
      sys.exit(1)

if __name__=='__main__':
    main()

0x03 運行結(jié)果

下載歌曲《男孩》為例，下載到./Download/目錄下并命名為男孩.mp3，設(shè)置5個線程：