[downloader/http] Randomize HTTP chunk size

This commit is contained in:
Sergey M․ 2018-02-04 07:29:11 +07:00
parent e4a60912b8
commit b91a7a4e5e
No known key found for this signature in database
GPG Key ID: 2C393E0F18A9236D

View File

@@ -4,6 +4,7 @@
import os import os
import socket import socket
import time import time
import random
import re import re
from .common import FileDownloader from .common import FileDownloader
@@ -53,6 +54,7 @@ class DownloadContext(dict):
ctx.data_len = None ctx.data_len = None
ctx.block_size = self.params.get('buffersize', 1024) ctx.block_size = self.params.get('buffersize', 1024)
ctx.start_time = time.time() ctx.start_time = time.time()
ctx.chunk_size = None
if self.params.get('continuedl', True): if self.params.get('continuedl', True):
# Establish possible resume length # Establish possible resume length
@@ -82,17 +84,19 @@ def set_range(req, start, end):
req.add_header('Range', range_header) req.add_header('Range', range_header)
def establish_connection(): def establish_connection():
ctx.chunk_size = (random.randint(int(chunk_size * 0.95), chunk_size)
if not is_test and chunk_size else chunk_size)
if ctx.resume_len > 0: if ctx.resume_len > 0:
range_start = ctx.resume_len range_start = ctx.resume_len
if ctx.is_resume: if ctx.is_resume:
self.report_resuming_byte(ctx.resume_len) self.report_resuming_byte(ctx.resume_len)
ctx.open_mode = 'ab' ctx.open_mode = 'ab'
elif chunk_size > 0: elif ctx.chunk_size > 0:
range_start = 0 range_start = 0
else: else:
range_start = None range_start = None
ctx.is_resume = False ctx.is_resume = False
range_end = range_start + chunk_size - 1 if chunk_size else None range_end = range_start + ctx.chunk_size - 1 if ctx.chunk_size else None
if range_end and ctx.data_len is not None and range_end >= ctx.data_len: if range_end and ctx.data_len is not None and range_end >= ctx.data_len:
range_end = ctx.data_len - 1 range_end = ctx.data_len - 1
has_range = range_start is not None has_range = range_start is not None
@@ -119,7 +123,7 @@ def establish_connection():
content_len = int_or_none(content_range_m.group(3)) content_len = int_or_none(content_range_m.group(3))
accept_content_len = ( accept_content_len = (
# Non-chunked download # Non-chunked download
not chunk_size or not ctx.chunk_size or
# Chunked download and requested piece or # Chunked download and requested piece or
# its part is promised to be served # its part is promised to be served
content_range_end == range_end or content_range_end == range_end or
@@ -297,7 +301,7 @@ def retry(e):
if is_test and byte_counter == data_len: if is_test and byte_counter == data_len:
break break
if not is_test and chunk_size and ctx.data_len is not None and byte_counter < ctx.data_len: if not is_test and ctx.chunk_size and ctx.data_len is not None and byte_counter < ctx.data_len:
ctx.resume_len = byte_counter ctx.resume_len = byte_counter
# ctx.block_size = block_size # ctx.block_size = block_size
raise NextFragment() raise NextFragment()