]>
git.scottworley.com Git - paperdoorknob/blob - glowfic.py
a700995bf93f6950d2b63a403ee57c4f757c0d9a
1 # paperdoorknob: Print glowfic
3 # This program is free software: you can redistribute it and/or modify it
4 # under the terms of the GNU General Public License as published by the
5 # Free Software Foundation, version 3.
8 from abc
import ABC
, abstractmethod
9 from dataclasses
import dataclass
11 from urllib
.parse
import parse_qsl
, urlencode
, urlparse
, urlunparse
13 from typing
import Iterable
15 from bs4
import BeautifulSoup
16 from bs4
.element
import Tag
18 from images
import ImageStore
19 from texify
import Texifier
22 def _removeViewFromURL(url
: str) -> str:
24 old_qs
= parse_qsl(u
.query
)
25 new_qs
= [(k
, v
) for k
, v
in old_qs
if k
!= 'view']
26 return urlunparse(u
._replace
(query
=urlencode(new_qs
)))
def nonFlatURL(url: str) -> str:
    """Return the non-flat form of *url*.

    This is *url* with any ``view`` query parameter stripped, as done by
    ``_removeViewFromURL``.
    """
    without_view = _removeViewFromURL(url)
    return without_view
def flatURL(url: str) -> str:
    """Return *url* rewritten to carry exactly one ``view=flat`` parameter.

    Any existing ``view`` parameter is removed first, then ``view=flat``
    is appended after the remaining query parameters.
    """
    parts = urlparse(_removeViewFromURL(url))
    # Keep the surviving parameters in order and put the flat-view
    # selector last.
    query_pairs = parse_qsl(parts.query) + [('view', 'flat')]
    flat_query = urlencode(query_pairs)
    return urlunparse(parts._replace(query=flat_query))
39 @dataclass(frozen
=True)
43 screen_name
: Tag |
None
# We avoid the name "post" because the Glowfic community uses the term
# inconsistently:
#   * The Glowfic software sometimes uses "post" to refer to a whole thread
#     (in the URL), sometimes uses "post" to refer to chunks (in the CSS),
#     but mostly uses "post" to refer to just the first chunk in a thread
#     (in the HTML and UI).  The non-first chunks are "replies".
#   * Readers and this software don't need to distinguish first-chunks and
#     non-first-chunks.
#   * Humans in the community tend to use "posts" to mean chunks.
58 def chunkDOMs(html
: BeautifulSoup
) -> Iterable
[Tag
]:
62 text
= body
.find_next("div", class_
="post-post")
63 assert isinstance(text
, Tag
)
66 def the_replies() -> Iterable
[Tag
]:
67 rs
= html
.find_all("div", class_
="post-reply")
68 assert all(isinstance(r
, Tag
) for r
in rs
)
71 return itertools
.chain([text()], the_replies())
74 def makeChunk(chunk_dom
: Tag
, image_store
: ImageStore
) -> Chunk
:
76 def getIcon() -> str |
None:
77 icon_div
= chunk_dom
.find_next('div', class_
='post-icon')
80 icon_img
= icon_div
.find_next('img')
83 assert isinstance(icon_img
, Tag
)
84 return image_store
.get_image(icon_img
.attrs
['src'])
86 def getByClass(css_class
: str) -> Tag |
None:
87 tag
= chunk_dom
.find_next('div', class_
=css_class
)
88 assert tag
is None or isinstance(tag
, Tag
)
91 content
= chunk_dom
.find_next('div', class_
='post-content')
92 assert isinstance(content
, Tag
)
94 return Chunk(getIcon(),
95 getByClass('post-character'),
96 getByClass('post-screenname'),
97 getByClass('post-author'),
101 def renderIcon(icon_path
: str |
None, image_size
: float) -> str |
None:
102 params
= f
'width={image_size}mm,height={image_size}mm,keepaspectratio'
103 return f
'\\includegraphics[{params}]{{{icon_path}}}' if icon_path
else None
def renderChunk(self, chunk: Chunk) -> bytes:
    """Render one chunk to bytes.

    This implementation always raises NotImplementedError.  The classes
    in this file that derive from Layout each define their own
    renderChunk.
    NOTE(review): the enclosing class header and any decorator are not
    visible in this view -- presumably this is the Layout base class;
    confirm.
    """
    raise NotImplementedError()
class ContentOnlyLayout(Layout):
    """Layout that renders only a chunk's content."""

    def __init__(self, texifier: Texifier) -> None:
        """Store the texifier used to convert chunk content."""
        self._texifier = texifier

    def renderChunk(self, chunk: Chunk) -> bytes:
        """Return the texified content of *chunk* followed by a newline."""
        rendered = self._texifier.texify(chunk.content)
        return rendered + b'\n'
122 class BelowIconLayout(Layout
):
124 def __init__(self
, texifier
: Texifier
, image_size
: float) -> None:
125 self
._texifier
= texifier
126 self
._image
_size
= image_size
128 def renderChunk(self
, chunk
: Chunk
) -> bytes:
129 icon
= renderIcon(chunk
.icon
, self
._image
_size
)
130 meta
= [icon
.encode('UTF-8')] if icon
else []
131 meta
+= [self
._texifier
.texify(x
)
132 for x
in [chunk
.character
, chunk
.screen_name
, chunk
.author
]
135 return b
'''\\wrapstuffclear
136 \\begin{wrapstuff}[l]
138 \\begin{varwidth}{0.5\\textwidth}
139 \\smash{\\parbox[t][0pt]{0pt}{
140 \\setlength{\\fboxrule}{0.2pt}
141 \\setlength{\\fboxsep}{0pt}
143 \\fbox{\\hspace{107mm}}
158 self
._texifier
.texify(chunk
.content
))
161 class BesideIconLayout(Layout
):
163 def __init__(self
, texifier
: Texifier
, image_size
: float) -> None:
164 self
._texifier
= texifier
165 self
._image
_size
= image_size
167 def renderChunk(self
, chunk
: Chunk
) -> bytes:
168 icon
= renderIcon(chunk
.icon
, self
._image
_size
)
175 # Why is \textwidth not the width of the text?
176 # Why is the width of the text .765\textwidth?
177 return b
'''\\noindent\\fbox{
179 \\parbox[b]{.765\\textwidth}{
185 \\vspace{-0.75em}\\\\*
191 icon
.encode('UTF-8') if icon
else b
'',
192 b
'\\\\*'.join(self
._texifier
.texify(x
) for x
in meta
if x
is not None),
193 self
._texifier
.texify(chunk
.content
))