1
1
import time
2
2
import asyncio
3
3
4
- import richka
5
-
6
4
import aiohttp
7
5
8
- async def __download_range (session : aiohttp .ClientSession , url : str , start : int , end : int , destination : str ) -> None :
6
+ import richka
7
+ from .controller import Controller
8
+
9
+ async def __download_range (session : aiohttp .ClientSession , url : str , start : int , end : int , destination : str , controller : Controller = None ) -> None :
9
10
richka .logger .info (f'Downloading part { start } -{ end } of { url } to { destination } .' )
10
11
11
12
headers = {** richka .HEADERS , ** {'range' : f'bytes={ start } -{ end } ' }}
12
-
13
- async with session .get (url , headers = headers ) as response :
14
- content = await response .read ()
15
- with open (destination , 'r+b' ) as f :
16
- f .seek (start )
17
- f .write (content )
18
-
19
- richka .logger .info (f'Downloaded part { start } -{ end } of { destination } .' )
20
-
21
- async def __download_single (session : aiohttp .ClientSession , url : str , destination : str ) -> None :
13
+ retry_times = richka .RETRY_TIMES
14
+
15
+ while retry_times > 0 :
16
+ try :
17
+ async with session .get (url , headers = headers , timeout = aiohttp .ClientTimeout (sock_read = richka .TIMEOUT , sock_connect = richka .TIMEOUT )) as response :
18
+ with open (destination , 'r+b' ) as f :
19
+ f .seek (start )
20
+ # Read stream
21
+ length = 0
22
+ async for chunk in response .content .iter_chunked (richka .CHUNK_SIZE ):
23
+ while controller .paused :
24
+ await asyncio .sleep (1 )
25
+ # noinspection PyTypeChecker
26
+ f .write (chunk )
27
+ # noinspection PyTypeChecker
28
+ length += len (chunk )
29
+ # Update tracker
30
+ if controller is not None :
31
+ await controller .update_progress (length , chunk_id = f"{ start } -{ end } " )
32
+ break
33
+ except (aiohttp .ClientError , asyncio .TimeoutError ):
34
+ retry_times -= 1
35
+ richka .logger .info (f'Download part { start } -{ end } of { url } to { destination } failed for { richka .RETRY_TIMES - retry_times } times, retrying...' )
36
+ await asyncio .sleep (1 )
37
+
38
+ if retry_times > 0 :
39
+ richka .logger .info (f'Downloaded part { start } -{ end } of { url } to { destination } .' )
40
+ else :
41
+ raise TimeoutError (f'Download part { start } -{ end } of { url } to { destination } timed out.' )
42
+
43
+ async def __download_single (session : aiohttp .ClientSession , url : str , destination : str , controller : Controller = None ) -> None :
22
44
richka .logger .info (f'Downloading { url } to { destination } .' )
23
45
24
- async with session .get (url , headers = richka .HEADERS ) as response :
25
- content = await response .read ()
26
- with open (destination , 'r+b' ) as f :
27
- f .write (content )
28
-
29
- richka .logger .info (f'Downloaded { url } to { destination } .' )
30
-
31
- async def download (url : str , destination : str ) -> float :
46
+ retry_times = richka .RETRY_TIMES \
47
+
48
+ while retry_times > 0 :
49
+ try :
50
+ async with session .get (url , headers = richka .HEADERS , timeout = aiohttp .ClientTimeout (sock_read = richka .TIMEOUT , sock_connect = richka .TIMEOUT )) as response :
51
+ with open (destination , 'r+b' ) as f :
52
+ # Read stream
53
+ length = 0
54
+ async for chunk in response .content .iter_chunked (richka .CHUNK_SIZE ):
55
+ while controller .paused :
56
+ await asyncio .sleep (1 )
57
+ # noinspection PyTypeChecker
58
+ f .write (chunk )
59
+ # noinspection PyTypeChecker
60
+ length += len (chunk )
61
+ # Update tracker
62
+ if controller is not None :
63
+ await controller .update_progress (length )
64
+ break
65
+ except (aiohttp .ClientError , asyncio .TimeoutError ):
66
+ retry_times -= 1
67
+ richka .logger .info (f'Download { url } to { destination } failed for { richka .RETRY_TIMES - retry_times } times, retrying...' )
68
+ await asyncio .sleep (1 )
69
+
70
+ if retry_times > 0 :
71
+ richka .logger .info (f'Downloaded { url } to { destination } .' )
72
+ else :
73
+ raise TimeoutError (f'Download { url } to { destination } timed out.' )
74
+
75
+ async def download (url : str , destination : str , controller : Controller = None ) -> tuple [float , int ]:
76
+ """
77
+ Download a single file.
78
+ :param url: String Source URL.
79
+ :param destination: Destination Path.
80
+ :param controller: Download Controller.
81
+ :return: [Float, Integer] [Time Used, File Size]
82
+ """
32
83
async with aiohttp .ClientSession () as session :
33
84
# Get file size
34
85
async with session .head (url ) as response :
35
86
file_size = int (response .headers .get ('Content-Length' , 0 ))
36
87
37
- if not file_size or file_size / pow (1024 , 2 ) <= 10 :
88
+ if not file_size or file_size / pow (1024 , 2 ) <= richka . SLICE_THRESHOLD :
38
89
if not file_size :
39
90
richka .logger .info (f'Failed to get file size, directly downloading { url } .' )
40
91
else :
41
- richka .logger .info (f"Downloading { url } ({ file_size } ) to { destination } with signle mode." )
92
+ richka .logger .info (f"Downloading { url } ({ file_size } ) to { destination } with single mode." )
93
+ if controller is not None :
94
+ controller .total_size = file_size
42
95
43
96
# Create an empty file
44
97
with open (destination , 'wb' ) as f :
45
98
f .truncate (file_size )
46
99
47
100
# Start task
48
101
start_time = time .time ()
49
- await __download_single (session , url , destination )
102
+ await __download_single (session , url , destination , controller )
50
103
end_time = time .time ()
51
- return end_time - start_time
104
+ richka .logger .info (f"Downloaded { url } ({ file_size } ) to { destination } with single mode." )
105
+ return end_time - start_time , file_size
52
106
53
107
richka .logger .info (f'Downloading { url } ({ file_size } ) to { destination } with slicing mode.' )
108
+ if controller is not None :
109
+ controller .total_size = file_size
54
110
55
111
# Calc slice size
56
112
part_size = file_size // richka .COROUTINE_LIMIT
@@ -64,11 +120,12 @@ async def download(url: str, destination: str) -> float:
64
120
for i in range (richka .COROUTINE_LIMIT ):
65
121
start = i * part_size
66
122
end = (start + part_size - 1 ) if i < richka .COROUTINE_LIMIT - 1 else (file_size - 1 )
67
- task = __download_range (session , url , start , end , destination )
123
+ task = __download_range (session , url , start , end , destination , controller )
68
124
tasks .append (task )
69
125
70
126
# Start all task
71
127
start_time = time .time ()
72
128
await asyncio .gather (* tasks )
73
129
end_time = time .time ()
74
- return end_time - start_time
130
+ richka .logger .info (f'Downloaded { url } ({ file_size } ) to { destination } with slicing mode.' )
131
+ return end_time - start_time , file_size
0 commit comments