]> git.scottworley.com Git - paperdoorknob/blob - args.py
Extensible, flag-controlled DOM filters
[paperdoorknob] / args.py
1 # paperdoorknob: Print glowfic
2 #
3 # This program is free software: you can redistribute it and/or modify it
4 # under the terms of the GNU General Public License as published by the
5 # Free Software Foundation, version 3.
6
7
8 from argparse import ArgumentParser
9 from contextlib import contextmanager
10 import os.path
11
12 from typing import Iterator
13
14 from xdg_base_dirs import xdg_cache_home
15
16 from domfilter import ApplyDOMFilters, DOMFilters
17 from fetch import CachingFetcher
18 from htmlfilter import ApplyHTMLFilters, HTMLFilters
19 from spec import Spec
20 from texify import PandocTexifier
21
22
23 def _command_line_parser() -> ArgumentParser:
24 parser = ArgumentParser(prog='paperdoorknob', description='Print glowfic')
25 parser.add_argument(
26 '--cache_path',
27 metavar='PATH',
28 help='Where to keep the http cache (instead of %(default)s)',
29 default=os.path.join(xdg_cache_home(), "paperdoorknob"))
30 parser.add_argument(
31 '--domfilters',
32 help='Which DOM filters to use (default: %(default)s)',
33 default=','.join(f[0] for f in DOMFilters))
34 parser.add_argument(
35 '--htmlfilters',
36 help='Which HTML filters to use (default: %(default)s)',
37 default=','.join(f[0] for f in HTMLFilters))
38 parser.add_argument(
39 '--out',
40 help='The filename stem at which to write output ' +
41 '(eg: "%(default)s" produces %(default)s.tex, %(default)s.pdf, etc.)',
42 default='book')
43 parser.add_argument('--pandoc', help='Location of the pandoc executable')
44 parser.add_argument(
45 '--timeout',
46 help='How long to wait for HTTP requests, in seconds',
47 default=30)
48 parser.add_argument('url', help='URL to retrieve')
49 return parser
50
51
52 @contextmanager
53 def spec_from_commandline_args() -> Iterator[Spec]:
54 args = _command_line_parser().parse_args()
55 with CachingFetcher(args.cache_path, args.timeout) as fetcher:
56 with open(args.out + '.tex', 'wb') as texout:
57 yield Spec(
58 args.url,
59 fetcher,
60 lambda x: ApplyHTMLFilters(args.htmlfilters, x),
61 lambda x: ApplyDOMFilters(args.domfilters, x),
62 PandocTexifier(args.pandoc or 'pandoc'),
63 texout)