# pferd/PFERD/downloaders.py
"""
General downloaders useful in many situations
"""
2020-04-20 17:43:41 +02:00
from pathlib import Path
from typing import Any, Dict, Optional
import requests
import requests.auth
2020-04-20 18:50:23 +02:00
from .organizer import Organizer
2020-04-20 17:43:41 +02:00
from .tmp_dir import TmpDir
from .utils import stream_to_path
2020-04-20 19:27:26 +02:00
# pylint: disable=too-few-public-methods
2020-04-20 17:43:41 +02:00
class HttpDownloader:
    """Downloader for HTTP resources, optionally using HTTP basic auth.

    One requests session is created when the downloader is constructed and is
    reused for every call to ``download``.
    """

    def __init__(
        self,
        tmp_dir: TmpDir,
        organizer: Organizer,
        username: Optional[str],
        password: Optional[str],
    ):
        """Store the collaborators and credentials, then build the session.

        Args:
            tmp_dir: Provides the temporary file each download is written to.
            organizer: Receives each downloaded temporary file together with
                its target path.
            username: Basic auth user name. Auth is only configured when both
                this and ``password`` are truthy.
            password: Basic auth password.
        """
        self._tmp_dir = tmp_dir
        self._organizer = organizer
        # The credentials must be set before the session is built, because
        # _build_session reads them.
        self._username = username
        self._password = password
        self._session = self._build_session()

    def _build_session(self) -> requests.Session:
        """Return a new session, with basic auth attached if credentials exist."""
        session = requests.Session()
        if not self._username or not self._password:
            # Incomplete credentials: leave the session unauthenticated.
            return session

        session.auth = requests.auth.HTTPBasicAuth(self._username, self._password)
        return session

    def download(
        self,
        url: str,
        target_path: Path,
        parameters: Optional[Dict[str, Any]] = None,
    ) -> None:
        """Fetch ``url`` and pass the downloaded file to the organizer.

        Args:
            url: Address to send the GET request to.
            target_path: Path handed to the organizer along with the
                downloaded temporary file.
            parameters: Optional GET parameters; ``None`` is treated as an
                empty dict.

        Raises:
            Exception: If the response status code is not 200.
        """
        query = parameters or {}
        with self._session.get(url, params=query, stream=True) as response:
            if response.status_code != 200:
                raise Exception(
                    f"Could not download file, got response {response.status_code}"
                )

            # Stream the body into a temporary file, then pass that file to
            # the organizer.
            downloaded = self._tmp_dir.new_file()
            stream_to_path(response, downloaded)
            self._organizer.accept_file(downloaded, target_path)