1
0
mirror of https://github.com/Garmelon/PFERD.git synced 2023-12-21 10:23:01 +01:00
pferd/PFERD/cli/command_kit_ilias_web.py

121 lines
3.3 KiB
Python
Raw Normal View History

import argparse
import configparser
from pathlib import Path
from ..crawl.ilias.file_templates import Links
2021-05-26 10:52:04 +02:00
from ..logging import log
from .parser import (CRAWLER_PARSER, SUBPARSERS, BooleanOptionalAction, ParserLoadError, load_crawler,
show_value_error)
# Register the 'kit-ilias-web' subcommand, passing CRAWLER_PARSER as a parent
# parser so its arguments are available on this subcommand as well.
SUBPARSER = SUBPARSERS.add_parser("kit-ilias-web", parents=[CRAWLER_PARSER])

# Dedicated argument group for the options that are specific to this command.
GROUP = SUBPARSER.add_argument_group(
    title="kit-ilias-web crawler arguments",
    description="arguments for the 'kit-ilias-web' crawler",
)
# --- Positional arguments -------------------------------------------------
GROUP.add_argument(
    "target",
    type=str,
    metavar="TARGET",
    help="course id, 'desktop', or ILIAS URL to crawl"
)
GROUP.add_argument(
    "output",
    type=Path,
    metavar="OUTPUT",
    help="output directory"
)

# --- Authentication -------------------------------------------------------
# load() rejects --credential-file when it is combined with --username or
# --keyring, so these three options are not freely combinable.
GROUP.add_argument(
    "--username", "-u",
    type=str,
    metavar="USERNAME",
    help="user name for authentication"
)
GROUP.add_argument(
    "--keyring",
    action=BooleanOptionalAction,
    help="use the system keyring to store and retrieve passwords"
)
GROUP.add_argument(
    "--credential-file",
    type=Path,
    metavar="PATH",
    help="read username and password from a credential file"
)

# --- Crawler behaviour ----------------------------------------------------
# load() only copies these into the config when the parsed value is not None.
GROUP.add_argument(
    "--links",
    # Links.from_string is wrapped in show_value_error before being used as
    # the argparse type converter.
    type=show_value_error(Links.from_string),
    metavar="OPTION",
    help="how to represent external links"
)
GROUP.add_argument(
    "--link-redirect-delay",
    type=int,
    metavar="SECONDS",
    # Help text fixed: the original read "redirect to to their target".
    help="time before 'fancy' links redirect to their target (-1 to disable)"
)
GROUP.add_argument(
    "--videos",
    action=BooleanOptionalAction,
    help="crawl and download videos"
)
GROUP.add_argument(
    "--forums",
    action=BooleanOptionalAction,
    help="crawl and download forum posts"
)
GROUP.add_argument(
    "--http-timeout", "-t",
    type=float,
    metavar="SECONDS",
    help="timeout for all HTTP requests"
)
def load(
    args: argparse.Namespace,
    parser: configparser.ConfigParser,
) -> None:
    """Translate 'kit-ilias-web' command line arguments into config sections.

    Two sections are (re)created on ``parser``:

    * ``crawl:ilias`` -- the crawler section. It is first handed to
      ``load_crawler`` and then receives the type, target, output directory
      and auth reference, plus every optional setting that was given on the
      command line.
    * ``auth:ilias`` -- the authenticator section, whose type is
      ``credential-file``, ``keyring`` or ``simple`` depending on the
      arguments.

    Args:
        args: Parsed command line arguments of the 'kit-ilias-web' subcommand.
        parser: Config parser that is populated in place.

    Raises:
        ParserLoadError: If ``--credential-file`` is combined with
            ``--username`` or ``--keyring``.
    """
    log.explain("Creating config for command 'kit-ilias-web'")

    # Crawler section.
    parser["crawl:ilias"] = {}
    crawl = parser["crawl:ilias"]
    load_crawler(args, crawl)

    crawl["type"] = "kit-ilias-web"
    crawl["target"] = str(args.target)
    crawl["output_dir"] = str(args.output)
    crawl["auth"] = "auth:ilias"

    # Optional settings are only written when given on the command line.
    if args.links is not None:
        crawl["links"] = str(args.links.value)
    if args.link_redirect_delay is not None:
        crawl["link_redirect_delay"] = str(args.link_redirect_delay)
    for flag in ("videos", "forums"):
        enabled = getattr(args, flag)
        if enabled is not None:
            crawl[flag] = "yes" if enabled else "no"
    if args.http_timeout is not None:
        crawl["http_timeout"] = str(args.http_timeout)

    # Authenticator section.
    parser["auth:ilias"] = {}
    auth = parser["auth:ilias"]

    if args.credential_file is None:
        auth["type"] = "keyring" if args.keyring else "simple"
    else:
        # A credential file supplies the credentials itself, so it cannot be
        # combined with the other credential sources.
        if args.username is not None:
            raise ParserLoadError("--credential-file and --username can't be used together")
        if args.keyring:
            raise ParserLoadError("--credential-file and --keyring can't be used together")
        auth["type"] = "credential-file"
        auth["path"] = str(args.credential_file)

    # Only reachable with a username for 'keyring' and 'simple' auth; the
    # credential-file branch has already rejected it above.
    if args.username is not None:
        auth["username"] = args.username
# Store load() as the 'command' default of this subparser, so a namespace
# parsed for 'kit-ilias-web' carries the function that builds its config.
SUBPARSER.set_defaults(command=load)