2015-04-10 21:45:41 +02:00
|
|
|
# -*- coding: utf-8 -*-
|
|
|
|
|
2017-03-16 04:17:35 +01:00
|
|
|
# Copyright 2014-2017 Mike Fährmann
|
2015-04-10 21:45:41 +02:00
|
|
|
#
|
|
|
|
# This program is free software; you can redistribute it and/or modify
|
|
|
|
# it under the terms of the GNU General Public License version 2 as
|
|
|
|
# published by the Free Software Foundation.
|
|
|
|
|
2017-06-30 19:38:14 +02:00
|
|
|
"""Downloader module for http:// and https:// URLs"""
|
2015-04-10 21:45:41 +02:00
|
|
|
|
2016-09-30 12:32:48 +02:00
|
|
|
import mimetypes
|
2017-10-24 12:53:03 +02:00
|
|
|
from .common import DownloaderBase
|
2017-10-20 18:56:18 +02:00
|
|
|
from .. import config, util
|
2014-10-12 21:56:44 +02:00
|
|
|
|
|
|
|
|
2017-10-24 12:53:03 +02:00
|
|
|
class Downloader(DownloaderBase):
    """Downloader for http:// and https:// URLs.

    Class attributes are read once from the "downloader.http" section of
    the configuration when the class is created.
    """
    retries = config.interpolate(("downloader", "http", "retries",), 5)
    timeout = config.interpolate(("downloader", "http", "timeout",), 30)
    verify = config.interpolate(("downloader", "http", "verify",), True)

    def __init__(self, session, output):
        """Initialize the base downloader; no response is open yet."""
        DownloaderBase.__init__(self, session, output)
        self.response = None

    def connect(self, url, offset):
        """Send a streaming GET request for 'url'.

        A non-zero 'offset' is sent as a "Range: bytes=<offset>-" header
        to ask the server for the remaining part of the file only.

        Returns a tuple (offset, size):
        - offset: position the received data starts at
                  (0 if the server sends the complete file,
                   -1 if the server answered 416, i.e. the file is
                   already complete)
        - size:   the reported size passed through util.safe_int()

        Raises whatever response.raise_for_status() raises for
        HTTP error status codes.
        """
        headers = {}
        if offset:
            headers["Range"] = "bytes={}-".format(offset)

        self.response = self.session.request(
            "GET", url, stream=True, headers=headers, allow_redirects=True,
            timeout=self.timeout, verify=self.verify)

        code = self.response.status_code
        if code == 206:
            # partial content: total size is the part after the "/"
            # in "Content-Range: bytes <start>-<end>/<total>";
            # tolerate a missing header instead of raising KeyError
            content_range = self.response.headers.get("Content-Range", "")
            size = content_range.rpartition("/")[2]
        elif code == 416:
            # file is already complete
            return -1, 0
        else:
            if code != 200:
                self.response.raise_for_status()
            # 200, or any other non-error status that is not a partial
            # response: the Range header was not honored, so the body
            # (if any) starts at the beginning of the file
            offset = 0
            size = self.response.headers.get("Content-Length")

        return offset, util.safe_int(size)

    def receive(self, file):
        """Write the body of the current response to 'file' in chunks."""
        for data in self.response.iter_content(16384):
            file.write(data)

    def reset(self):
        """Close and discard the current response, if there is one."""
        # Compare against None explicitly: the truth value of a
        # requests Response object reflects its status code, so error
        # responses (e.g. 416) would otherwise never be closed.
        if self.response is not None:
            self.response.close()
            self.response = None

    def get_extension(self):
        """Return a filename extension based on the Content-Type header.

        Falls back to "image/jpeg" if the header is missing and to "txt"
        (with a warning) if no extension is known for the MIME type.
        """
        mtype = self.response.headers.get("Content-Type", "image/jpeg")
        # drop parameters such as "; charset=utf-8" and stray whitespace
        mtype = mtype.partition(";")[0].strip()
        exts = mimetypes.guess_all_extensions(mtype, strict=False)
        if exts:
            # deterministic choice: the lexicographically last candidate,
            # without its leading "."
            return max(exts)[1:]
        self.log.warning(
            "No filename extension found for MIME type '%s'", mtype)
        return "txt"
|