2021-04-29 13:44:29 +02:00
|
|
|
import asyncio
|
|
|
|
import random
|
2021-04-29 16:52:00 +02:00
|
|
|
from pathlib import PurePath
|
2021-04-29 13:44:29 +02:00
|
|
|
from typing import Any
|
|
|
|
|
|
|
|
from rich.markup import escape
|
|
|
|
|
|
|
|
from ..crawler import Crawler
|
2021-04-29 15:26:10 +02:00
|
|
|
from ..utils import ainput
|
2021-04-29 13:44:29 +02:00
|
|
|
|
|
|
|
DUMMY_TREE = {
|
|
|
|
"Blätter": {
|
|
|
|
"Blatt_01.pdf": (),
|
|
|
|
"Blatt_02.pdf": (),
|
|
|
|
"Blatt_03.pdf": (),
|
|
|
|
"Blatt_04.pdf": (),
|
|
|
|
"Blatt_05.pdf": (),
|
2021-04-29 13:53:16 +02:00
|
|
|
"Lösungen": {
|
|
|
|
"Blatt_01_Lösung.pdf": (),
|
|
|
|
"Blatt_02_Lösung.pdf": (),
|
2021-04-29 15:26:10 +02:00
|
|
|
"Blatt_03_Lösung.pdf": True,
|
2021-04-29 13:53:16 +02:00
|
|
|
"Blatt_04_Lösung.pdf": (),
|
|
|
|
"Blatt_05_Lösung.pdf": (),
|
|
|
|
},
|
2021-04-29 13:44:29 +02:00
|
|
|
},
|
|
|
|
"Vorlesungsfolien": {
|
|
|
|
"VL_01.pdf": (),
|
|
|
|
"VL_02.pdf": (),
|
|
|
|
"VL_03.pdf": (),
|
|
|
|
"VL_04.pdf": (),
|
|
|
|
"VL_05.pdf": (),
|
|
|
|
},
|
|
|
|
"noch_mehr.txt": (),
|
|
|
|
"dateien.jar": (),
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
class DummyCrawler(Crawler):
|
|
|
|
async def crawl(self) -> None:
|
2021-04-29 16:52:00 +02:00
|
|
|
await self._crawl_entry(PurePath(), DUMMY_TREE)
|
2021-04-29 13:44:29 +02:00
|
|
|
|
2021-04-29 16:52:00 +02:00
|
|
|
async def _crawl_entry(self, path: PurePath, value: Any) -> None:
|
2021-04-29 15:26:10 +02:00
|
|
|
if value is True:
|
|
|
|
async with self.exclusive_output():
|
|
|
|
await ainput(f"File {path}, please press enter: ")
|
|
|
|
if value == () or value is True:
|
2021-04-29 13:44:29 +02:00
|
|
|
n = random.randint(5, 20)
|
2021-04-29 13:53:16 +02:00
|
|
|
async with self.download_bar(path, n) as bar:
|
2021-04-29 13:44:29 +02:00
|
|
|
await asyncio.sleep(random.random() / 2)
|
|
|
|
for i in range(n):
|
|
|
|
await asyncio.sleep(0.5)
|
|
|
|
bar.advance()
|
|
|
|
self.print(f"[green]Downloaded {escape(str(path))}")
|
|
|
|
else:
|
|
|
|
t = random.random() * 2 + 1
|
2021-04-29 13:53:16 +02:00
|
|
|
async with self.crawl_bar(path) as bar:
|
2021-04-29 13:44:29 +02:00
|
|
|
await asyncio.sleep(t)
|
|
|
|
tasks = [self._crawl_entry(path / k, v) for k, v in value.items()]
|
|
|
|
await asyncio.gather(*tasks)
|