|
1 |
| -from io import BufferedWriter |
2 |
| -import os |
3 |
| -import time |
4 |
| -import traceback |
5 |
| -from typing import Callable |
6 |
| -import requests |
7 |
| -from threading import Thread |
8 |
| -from exceptions import DownloadException |
9 |
| - |
10 |
| - |
11 |
class FileDownloader:
    """Download one URL to a local file, resuming a partial file if present.

    Progress and completion are delivered through the two optional callback
    attributes below. ``download_file`` blocks until the transfer ends;
    ``stop_download`` may be called from another thread to end it early.
    """

    # Invoked roughly once per second while a transfer runs, with
    # (basename, bytes received so far, expected bytes, bytes since last call).
    on_download_progress: Callable[[str, int, int, int], None] = None
    # Invoked once when download_file finishes, with (basename, error);
    # error is None when no exception occurred.
    on_download_completed: Callable[[str, Exception], None] = None
    url: str
    filename: str
    basename: str
    total_size: int
    download_size: int
    download_stop: bool
    prev_sec_download_size: int

    def __init__(self):
        self.download_stop = False
        self.download_size = 0
        self.completed = False
        self.total_size = 0
        self.prev_sec_download_size = 0
        self.report_thread = None

    @staticmethod
    def _content_length(headers) -> int:
        """Return the Content-Length header as an int, or 0 if absent/invalid."""
        try:
            return int(headers.get("Content-Length"))
        except (TypeError, ValueError):
            # Header missing (e.g. chunked transfer) or not numeric.
            return 0

    def download_file(self, url: str, file_path: str):
        """Download ``url`` into ``file_path`` and report the outcome.

        Exceptions are not raised to the caller; they are captured and passed
        to ``on_download_completed`` (when set) as its second argument.

        Args:
            url: Address to fetch.
            file_path: Destination path; an existing non-empty file is resumed.
        """
        self.url = url
        self.basename = os.path.basename(file_path)
        self.download_stop = False
        self.filename = file_path
        self.prev_sec_download_size = 0
        self.download_size = 0
        self.total_size = 0
        self.completed = False
        self.report_thread = None
        error = None
        report_thread = None
        response = None
        fw = None
        try:
            response, fw = self.__init_download(self.url, self.filename)
            # Size announced by this response; 0 when the server sends none.
            self.total_size = self._content_length(response.headers)
            if self.on_download_progress is not None:
                report_thread = self.__start_report_download_progress()
                self.report_thread = report_thread
            self.__start_download(response, fw)
        except Exception as e:
            error = e
        finally:
            self.completed = True
            if report_thread is not None:
                report_thread.join()
            # Normally already closed by __start_download; this covers a
            # failure between connecting and entering the transfer loop.
            for resource in (fw, response):
                if resource is not None:
                    try:
                        resource.close()
                    except Exception:
                        traceback.print_exc()

        if self.on_download_completed is not None:
            self.on_download_completed(self.basename, error)

    def __init_download(
        self, url: str, file_path: str
    ) -> "tuple[requests.Response, BufferedWriter]":
        """Open the HTTP stream and the destination file.

        Returns:
            The streaming response and a binary writer positioned for the
            bytes that response will deliver.

        Raises:
            requests.HTTPError: The server answered with an error status.
        """
        if os.path.exists(file_path):
            start_pos = os.path.getsize(file_path)
        else:
            parent_dir = os.path.dirname(file_path)
            # A bare filename has no directory part; makedirs("") would raise.
            if parent_dir:
                os.makedirs(parent_dir, exist_ok=True)
            start_pos = 0

        # Ask only for the missing tail when a partial file already exists.
        # TLS certificate verification is left at the library default (on).
        headers = {"Range": f"bytes={start_pos}-"} if start_pos > 0 else None
        response = requests.get(url, stream=True, headers=headers)
        try:
            # Never write an error page (404, 416, ...) into the target file.
            response.raise_for_status()
            # Append only if the server honoured the range (206); a plain 200
            # carries the whole body, so the file must be rewritten.
            resumed = start_pos > 0 and response.status_code == 206
            fw = open(file_path, "ab" if resumed else "wb")
        except Exception:
            response.close()
            raise

        return response, fw

    def __start_download(self, response: "requests.Response", fw: BufferedWriter):
        """Stream the response body to ``fw``, reconnecting on failure.

        Up to three reconnect attempts are made, one second apart.

        Raises:
            DownloadException: The transfer still failed after the retries.
        """
        import threading  # local: the module only imports Thread at top level

        retry = 0
        while True:
            try:
                if response is None:
                    # Previous attempt failed; reconnect inside the try so a
                    # failed reconnect also counts against the retry budget.
                    response, fw = self.__init_download(self.url, self.filename)
                with response, fw:
                    for chunk in response.iter_content(chunk_size=4096):
                        fw.write(chunk)
                        self.download_size += len(chunk)

                        if self.download_stop:
                            print(
                                f"FileDownloader thread {threading.get_native_id()} exit by stop"
                            )
                            break
                return
            except Exception as exc:
                traceback.print_exc()
                response = fw = None
                retry += 1
                if retry > 3:
                    raise DownloadException(self.url) from exc
                print(
                    f"FileDownloader thread {threading.get_native_id()} retry {retry} times"
                )
                time.sleep(1)

    def __start_report_download_progress(self):
        """Start and return the thread that emits progress callbacks."""
        report_thread = Thread(target=self.__report_download_progress)
        report_thread.start()
        return report_thread

    def __report_download_progress(self):
        """Call ``on_download_progress`` once per second until done or stopped."""
        while not self.download_stop and not self.completed:
            # Snapshot once so the reported total and the per-interval delta
            # agree even while the download thread keeps counting.
            current = self.download_size
            self.on_download_progress(
                self.basename,
                current,
                self.total_size,
                current - self.prev_sec_download_size,
            )

            self.prev_sec_download_size = current
            time.sleep(1)

    def stop_download(self):
        """Request that the running transfer stop after the current chunk."""
        self.download_stop = True
| 1 | +from io import BufferedWriter |
| 2 | +import os |
| 3 | +import time |
| 4 | +import traceback |
| 5 | +from typing import Callable |
| 6 | +import requests |
| 7 | +from threading import Thread |
| 8 | +from exceptions import DownloadException |
| 9 | + |
| 10 | + |
class FileDownloader:
    """Download one URL to a local file, resuming a partial file if present.

    Progress and completion are delivered through the two optional callback
    attributes below. ``download_file`` blocks until the transfer ends;
    ``stop_download`` may be called from another thread to end it early.
    """

    # Invoked roughly once per second while a transfer runs, with
    # (basename, bytes received so far, expected bytes, bytes since last call).
    on_download_progress: Callable[[str, int, int, int], None] = None
    # Invoked once when download_file finishes, with (basename, error);
    # error is None when no exception occurred.
    on_download_completed: Callable[[str, Exception], None] = None
    url: str
    filename: str
    basename: str
    total_size: int
    download_size: int
    download_stop: bool
    prev_sec_download_size: int

    def __init__(self):
        self.download_stop = False
        self.download_size = 0
        self.completed = False
        self.total_size = 0
        self.prev_sec_download_size = 0
        self.report_thread = None

    @staticmethod
    def _content_length(headers) -> int:
        """Return the Content-Length header as an int, or 0 if absent/invalid."""
        try:
            return int(headers.get("Content-Length"))
        except (TypeError, ValueError):
            # Header missing (e.g. chunked transfer) or not numeric.
            return 0

    def download_file(self, url: str, file_path: str):
        """Download ``url`` into ``file_path`` and report the outcome.

        Exceptions are not raised to the caller; they are captured and passed
        to ``on_download_completed`` (when set) as its second argument.

        Args:
            url: Address to fetch.
            file_path: Destination path; an existing non-empty file is resumed.
        """
        self.url = url
        self.basename = os.path.basename(file_path)
        self.download_stop = False
        self.filename = file_path
        self.prev_sec_download_size = 0
        self.download_size = 0
        self.total_size = 0
        self.completed = False
        self.report_thread = None
        error = None
        report_thread = None
        response = None
        fw = None
        try:
            response, fw = self.__init_download(self.url, self.filename)
            # Size announced by this response; 0 when the server sends none.
            self.total_size = self._content_length(response.headers)
            if self.on_download_progress is not None:
                report_thread = self.__start_report_download_progress()
                self.report_thread = report_thread
            self.__start_download(response, fw)
        except Exception as e:
            error = e
        finally:
            self.completed = True
            if report_thread is not None:
                report_thread.join()
            # Normally already closed by __start_download; this covers a
            # failure between connecting and entering the transfer loop.
            for resource in (fw, response):
                if resource is not None:
                    try:
                        resource.close()
                    except Exception:
                        traceback.print_exc()

        if self.on_download_completed is not None:
            self.on_download_completed(self.basename, error)

    def __init_download(
        self, url: str, file_path: str
    ) -> "tuple[requests.Response, BufferedWriter]":
        """Open the HTTP stream and the destination file.

        Returns:
            The streaming response and a binary writer positioned for the
            bytes that response will deliver.

        Raises:
            requests.HTTPError: The server answered with an error status.
        """
        if os.path.exists(file_path):
            start_pos = os.path.getsize(file_path)
        else:
            parent_dir = os.path.dirname(file_path)
            # A bare filename has no directory part; makedirs("") would raise.
            if parent_dir:
                os.makedirs(parent_dir, exist_ok=True)
            start_pos = 0

        # Ask only for the missing tail when a partial file already exists.
        headers = {"Range": f"bytes={start_pos}-"} if start_pos > 0 else None
        response = requests.get(url, stream=True, headers=headers)
        try:
            # Never write an error page (404, 416, ...) into the target file.
            response.raise_for_status()
            # Append only if the server honoured the range (206); a plain 200
            # carries the whole body, so the file must be rewritten.
            resumed = start_pos > 0 and response.status_code == 206
            fw = open(file_path, "ab" if resumed else "wb")
        except Exception:
            response.close()
            raise

        return response, fw

    def __start_download(self, response: "requests.Response", fw: BufferedWriter):
        """Stream the response body to ``fw``, reconnecting on failure.

        Up to three reconnect attempts are made, one second apart.

        Raises:
            DownloadException: The transfer still failed after the retries.
        """
        import threading  # local: the module only imports Thread at top level

        retry = 0
        while True:
            try:
                if response is None:
                    # Previous attempt failed; reconnect inside the try so a
                    # failed reconnect also counts against the retry budget.
                    response, fw = self.__init_download(self.url, self.filename)
                with response, fw:
                    for chunk in response.iter_content(chunk_size=4096):
                        fw.write(chunk)
                        self.download_size += len(chunk)

                        if self.download_stop:
                            print(
                                f"FileDownloader thread {threading.get_native_id()} exit by stop"
                            )
                            break
                return
            except Exception as exc:
                traceback.print_exc()
                response = fw = None
                retry += 1
                if retry > 3:
                    raise DownloadException(self.url) from exc
                print(
                    f"FileDownloader thread {threading.get_native_id()} retry {retry} times"
                )
                time.sleep(1)

    def __start_report_download_progress(self):
        """Start and return the thread that emits progress callbacks."""
        report_thread = Thread(target=self.__report_download_progress)
        report_thread.start()
        return report_thread

    def __report_download_progress(self):
        """Call ``on_download_progress`` once per second until done or stopped."""
        while not self.download_stop and not self.completed:
            # Snapshot once so the reported total and the per-interval delta
            # agree even while the download thread keeps counting.
            current = self.download_size
            self.on_download_progress(
                self.basename,
                current,
                self.total_size,
                current - self.prev_sec_download_size,
            )

            self.prev_sec_download_size = current
            time.sleep(1)

    def stop_download(self):
        """Request that the running transfer stop after the current chunk."""
        self.download_stop = True
0 commit comments