Remove the ContentParser class, use functions instead

It did not help, just added to the indent.
2023-11-06 18:14:21 +01:00 · 2023-11-06 18:14:21 +01:00 · 073dd3025c
commit 073dd3025c
parent a544453338
4 changed files with 394 additions and 391 deletions
--- a/toot/tui/overlays.py
+++ b/toot/tui/overlays.py
@ -7,7 +7,7 @@ from toot import __version__
 from toot import api
 from toot.tui.utils import highlight_keys
 from toot.tui.widgets import Button, EditBox, SelectableText
-from toot.tui.richtext import ContentParser
+from toot.tui.richtext import html_to_widgets


 class StatusSource(urwid.Padding):
@ -255,8 +255,6 @@ class Account(urwid.ListBox):
        super().__init__(walker)

    def generate_contents(self, account, relationship=None, last_action=None):
-        parser = ContentParser()
-
        if self.last_action and not self.last_action.startswith("Confirm"):
            yield Button(f"Confirm {self.last_action}", on_press=take_action, user_data=self)
            yield Button("Cancel", on_press=cancel_action, user_data=self)
@ -282,7 +280,7 @@ class Account(urwid.ListBox):
        if account["note"]:
            yield urwid.Divider()

-            widgetlist = parser.html_to_widgets(account["note"])
+            widgetlist = html_to_widgets(account["note"])
            for line in widgetlist:
                yield (line)

@ -317,7 +315,7 @@ class Account(urwid.ListBox):
                yield urwid.Divider()
                yield urwid.Text([("bold", f"{name.rstrip(':')}"), ":"])

-                widgetlist = parser.html_to_widgets(field["value"])
+                widgetlist = html_to_widgets(field["value"])
                for line in widgetlist:
                    yield (line)

--- a/toot/tui/poll.py
+++ b/toot/tui/poll.py
@ -4,7 +4,7 @@ from toot import api
 from toot.exceptions import ApiError
 from toot.utils.datetime import parse_datetime
 from .widgets import Button, CheckBox, RadioButton
-from .richtext import ContentParser
+from .richtext import html_to_widgets


 class Poll(urwid.ListBox):
@ -86,8 +86,7 @@ class Poll(urwid.ListBox):
    def generate_contents(self, status):
        yield urwid.Divider()

-        parser = ContentParser()
-        widgetlist = parser.html_to_widgets(status.data["content"])
+        widgetlist = html_to_widgets(status.data["content"])

        for line in widgetlist:
            yield (line)
--- a/toot/tui/richtext.py
+++ b/toot/tui/richtext.py
@ -16,430 +16,438 @@ STYLE_NAMES = [p[0] for p in PALETTE]
 BLOCK_TAGS = ["p", "pre", "li", "blockquote", "h1", "h2", "h3", "h4", "h5", "h6"]


-class ContentParser:
-    """Parse a limited subset of HTML and create urwid widgets."""
+def html_to_widgets(html, recovery_attempt=False) -> List[urwid.Widget]:
+    """Convert html to urwid widgets"""
+    widgets: List[urwid.Widget] = []
+    html = unicodedata.normalize("NFKC", html)
+    soup = parse_html(html)

-    def html_to_widgets(self, html, recovery_attempt=False) -> List[urwid.Widget]:
-        """Convert html to urwid widgets"""
-        widgets: List[urwid.Widget] = []
-        html = unicodedata.normalize("NFKC", html)
-        soup = parse_html(html)
-
-        first_tag = True
-        for e in soup.body or soup:
-            if isinstance(e, NavigableString):
-                if first_tag and not recovery_attempt:
-                    # if our first "tag" is a navigable string
-                    # the HTML is out of spec, doesn't start with a tag,
-                    # we see this in content from Pixelfed servers.
-                    # attempt a fix by wrapping the HTML with <p></p>
-                    return self.html_to_widgets(f"<p>{html}</p>", recovery_attempt=True)
-                else:
-                    continue
+    first_tag = True
+    for e in soup.body or soup:
+        if isinstance(e, NavigableString):
+            if first_tag and not recovery_attempt:
+                # if our first "tag" is a navigable string
+                # the HTML is out of spec, doesn't start with a tag,
+                # we see this in content from Pixelfed servers.
+                # attempt a fix by wrapping the HTML with <p></p>
+                return html_to_widgets(f"<p>{html}</p>", recovery_attempt=True)
            else:
-                name = e.name
-                # if our HTML starts with a tag, but not a block tag
-                # the HTML is out of spec. Attempt a fix by wrapping the
-                # HTML with <p></p>
-                if (first_tag and not recovery_attempt and name not in BLOCK_TAGS):
-                    return self.html_to_widgets(f"<p>{html}</p>", recovery_attempt=True)
-
-                markup = self.render(name, e)
-                first_tag = False
-
-            if not isinstance(markup, urwid.Widget):
-                # plaintext, so create a padded text widget
-                txt = self.text_to_widget("", markup)
-                markup = urwid.Padding(
-                    txt,
-                    align="left",
-                    width=("relative", 100),
-                    min_width=None,
-                )
-            widgets.append(markup)
-            # separate top level widgets with a blank line
-            widgets.append(urwid.Divider(" "))
-        return widgets[:-1]  # but suppress the last blank line
-
-    def inline_tag_to_text(self, tag) -> Tuple:
-        """Convert html tag to plain text with tag as attributes recursively"""
-        markups = self.process_inline_tag_children(tag)
-        if not markups:
-            return (tag.name, "")
-        return (tag.name, markups)
-
-    def process_inline_tag_children(self, tag) -> List:
-        """Recursively retrieve all children
-        and convert to a list of markup text"""
-        markups = []
-        for child in tag.children:
-            if isinstance(child, Tag):
-                markup = self.render(child.name, child)
-                markups.append(markup)
-            else:
-                markups.append(child)
-        return markups
-
-    def text_to_widget(self, attr, markup) -> urwid.Widget:
-        if not has_urwidgets:
-            return urwid.Text((attr, markup))
-
-        TRANSFORM = {
-            # convert http[s] URLs to Hyperlink widgets for nesting in a TextEmbed widget
-            re.compile(r"(^.+)\x03(.+$)"): lambda g: (
-                len(g[1]),
-                urwid.Filler(Hyperlink(g[2], anchor_attr, g[1])),
-            ),
-        }
-        markup_list = []
-
-        for run in markup:
-            if isinstance(run, tuple):
-                txt, attr_list = decompose_tagmarkup(run)
-                # find anchor titles with an ETX separator followed by href
-                m = re.match(r"(^.+)\x03(.+$)", txt)
-                if m:
-                    anchor_attr = self.get_best_anchor_attr(attr_list)
-                    markup_list.append(
-                        parse_text(
-                            txt,
-                            TRANSFORM,
-                            lambda pattern, groups, span: TRANSFORM[pattern](groups),
-                        )
-                    )
-                else:
-                    markup_list.append(run)
-            else:
-                markup_list.append(run)
-
-        return TextEmbed(markup_list)
-
-    def process_block_tag_children(self, tag) -> List[urwid.Widget]:
-        """Recursively retrieve all children
-        and convert to a list of widgets
-        any inline tags containing text will be
-        converted to Text widgets"""
-
-        pre_widget_markups = []
-        post_widget_markups = []
-        child_widgets = []
-        found_nested_widget = False
-
-        for child in tag.children:
-            if isinstance(child, Tag):
-                # child is a nested tag; process using custom method
-                # or default to inline_tag_to_text
-                result = self.render(child.name, child)
-                if isinstance(result, urwid.Widget):
-                    found_nested_widget = True
-                    child_widgets.append(result)
-                else:
-                    if not found_nested_widget:
-                        pre_widget_markups.append(result)
-                    else:
-                        post_widget_markups.append(result)
-            else:
-                # child is text; append to the appropriate markup list
-                if not found_nested_widget:
-                    pre_widget_markups.append(child)
-                else:
-                    post_widget_markups.append(child)
-
-        widget_list = []
-        if len(pre_widget_markups):
-            widget_list.append(self.text_to_widget(tag.name, pre_widget_markups))
-
-        if len(child_widgets):
-            widget_list += child_widgets
-
-        if len(post_widget_markups):
-            widget_list.append(self.text_to_widget(tag.name, post_widget_markups))
-
-        return widget_list
-
-    def get_urwid_attr_name(self, tag) -> str:
-        """Get the class name and translate to a
-        name suitable for use as an urwid
-        text attribute name"""
-
-        if "class" in tag.attrs:
-            clss = tag.attrs["class"]
-            if len(clss) > 0:
-                style_name = "class_" + "_".join(clss)
-                # return the class name, only if we
-                # find it as a defined palette name
-                if style_name in STYLE_NAMES:
-                    return style_name
-
-        # fallback to returning the tag name
-        return tag.name
-
-    # Tag handlers start here.
-    # Tags not explicitly listed are "supported" by
-    # rendering as text.
-    # Inline tags return a list of marked up text for urwid.Text
-    # Block tags return urwid.Widget
-
-    def basic_block_tag_handler(self, tag) -> urwid.Widget:
-        """default for block tags that need no special treatment"""
-        return urwid.Pile(self.process_block_tag_children(tag))
-
-    def get_best_anchor_attr(self, attrib_list) -> str:
-        if not attrib_list:
-            return ""
-        flat_al = list(flatten(attrib_list))
-
-        for a in flat_al[0]:
-            # ref: https://docs.joinmastodon.org/spec/activitypub/
-            # these are the class names (translated to attrib names)
-            # that we can support for display
-
-            try:
-                if a[0] in ["class_hashtag", "class_mention_hashtag", "class_mention"]:
-                    return a[0]
-            except KeyError:
                continue
+        else:
+            name = e.name
+            # if our HTML starts with a tag, but not a block tag
+            # the HTML is out of spec. Attempt a fix by wrapping the
+            # HTML with <p></p>
+            if (first_tag and not recovery_attempt and name not in BLOCK_TAGS):
+                return html_to_widgets(f"<p>{html}</p>", recovery_attempt=True)

-        return "a"
+            markup = render(name, e)
+            first_tag = False

-    def render(self, attr: str, content: str):
-        if attr in ["a"]:
-            return self.render_anchor(content)
-
-        if attr in ["blockquote"]:
-            return self.render_blockquote(content)
-
-        if attr in ["br"]:
-            return self.render_br(content)
-
-        if attr in ["em"]:
-            return self.render_em(content)
-
-        if attr in ["ol"]:
-            return self.render_ol(content)
-
-        if attr in ["pre"]:
-            return self.render_pre(content)
-
-        if attr in ["span"]:
-            return self.render_span(content)
-
-        if attr in ["b", "strong"]:
-            return self.render_strong(content)
-
-        if attr in ["ul"]:
-            return self.render_ul(content)
-
-        # Glitch-soc and Pleroma allow <H1>...<H6> in content
-        # Mastodon (PR #23913) does not; header tags are converted to <P><STRONG></STRONG></P>
-        if attr in ["p", "div", "li", "h1", "h2", "h3", "h4", "h5", "h6"]:
-            return self.basic_block_tag_handler(content)
-
-        # Fall back to inline_tag_to_text handler
-        return self.inline_tag_to_text(content)
-
-    def render_anchor(self, tag) -> Tuple:
-        """anchor tag handler"""
-
-        markups = self.process_inline_tag_children(tag)
-        if not markups:
-            return (tag.name, "")
-
-        href = tag.attrs["href"]
-        title, attrib_list = decompose_tagmarkup(markups)
-        if not attrib_list:
-            attrib_list = [tag]
-        if href and has_urwidgets:
-            # only if we have urwidgets loaded for OCS 8 hyperlinks:
-            # urlencode the path and query portions of the URL
-            href = urlencode_url(href)
-            # use ASCII ETX (end of record) as a
-            # delimiter between the title and the HREF
-            title += f"\x03{href}"
-
-        attr = self.get_best_anchor_attr(attrib_list)
-
-        if attr == "a":
-            # didn't find an attribute to use
-            # in the child markup, so let's
-            # try the anchor tag's own attributes
-
-            attr = self.get_urwid_attr_name(tag)
-
-        # hashtag anchors have a class of "mention hashtag"
-        # or "hashtag"
-        # we'll return style "class_mention_hashtag"
-        # or "class_hashtag"
-        # in that case; see corresponding palette entry
-        # in constants.py controlling hashtag highlighting
-
-        return (attr, title)
-
-    def render_blockquote(self, tag) -> urwid.Widget:
-        widget_list = self.process_block_tag_children(tag)
-        blockquote_widget = urwid.LineBox(
-            urwid.Padding(
-                urwid.Pile(widget_list),
+        if not isinstance(markup, urwid.Widget):
+            # plaintext, so create a padded text widget
+            txt = text_to_widget("", markup)
+            markup = urwid.Padding(
+                txt,
                align="left",
                width=("relative", 100),
                min_width=None,
-                left=1,
-                right=1,
-            ),
-            tlcorner="",
-            tline="",
-            lline="│",
-            trcorner="",
-            blcorner="",
-            rline="",
-            bline="",
-            brcorner="",
-        )
-        return urwid.Pile([urwid.AttrMap(blockquote_widget, "blockquote")])
+            )
+        widgets.append(markup)
+        # separate top level widgets with a blank line
+        widgets.append(urwid.Divider(" "))
+    return widgets[:-1]  # but suppress the last blank line

-    def render_br(self, tag) -> Tuple:
-        return ("br", "\n")

-    def render_em(self, tag) -> Tuple:
-        # to simplify the number of palette entries
-        # translate EM to I (italic)
-        markups = self.process_inline_tag_children(tag)
-        if not markups:
-            return ("i", "")
+def inline_tag_to_text(tag) -> Tuple:
+    """Convert html tag to plain text with tag as attributes recursively"""
+    markups = process_inline_tag_children(tag)
+    if not markups:
+        return (tag.name, "")
+    return (tag.name, markups)

-        # special case processing for bold and italic
-        for parent in tag.parents:
-            if parent.name == "b" or parent.name == "strong":
-                return ("bi", markups)

-        return ("i", markups)
+def process_inline_tag_children(tag) -> List:
+    """Recursively retrieve all children
+    and convert to a list of markup text"""
+    markups = []
+    for child in tag.children:
+        if isinstance(child, Tag):
+            markup = render(child.name, child)
+            markups.append(markup)
+        else:
+            markups.append(child)
+    return markups

-    def render_ol(self, tag) -> urwid.Widget:
-        """ordered list tag handler"""

-        widgets = []
-        list_item_num = 1
-        increment = -1 if tag.has_attr("reversed") else 1
+def text_to_widget(attr, markup) -> urwid.Widget:
+    if not has_urwidgets:
+        return urwid.Text((attr, markup))

-        # get ol start= attribute if present
-        if tag.has_attr("start") and len(tag.attrs["start"]) > 0:
-            try:
-                list_item_num = int(tag.attrs["start"])
-            except ValueError:
-                pass
+    TRANSFORM = {
+        # convert http[s] URLs to Hyperlink widgets for nesting in a TextEmbed widget
+        re.compile(r"(^.+)\x03(.+$)"): lambda g: (
+            len(g[1]),
+            urwid.Filler(Hyperlink(g[2], anchor_attr, g[1])),
+        ),
+    }
+    markup_list = []

-        for li in tag.find_all("li", recursive=False):
-            markup = self.render("li", li)
-
-            # li value= attribute will change the item number
-            # it also overrides any ol start= attribute
-
-            if li.has_attr("value") and len(li.attrs["value"]) > 0:
-                try:
-                    list_item_num = int(li.attrs["value"])
-                except ValueError:
-                    pass
-
-            if not isinstance(markup, urwid.Widget):
-                txt = self.text_to_widget("li", [str(list_item_num), ". ", markup])
-                # 1. foo, 2. bar, etc.
-                widgets.append(txt)
-            else:
-                txt = self.text_to_widget("li", [str(list_item_num), ". "])
-                columns = urwid.Columns(
-                    [txt, ("weight", 9999, markup)], dividechars=1, min_width=3
+    for run in markup:
+        if isinstance(run, tuple):
+            txt, attr_list = decompose_tagmarkup(run)
+            # find anchor titles with an ETX separator followed by href
+            m = re.match(r"(^.+)\x03(.+$)", txt)
+            if m:
+                anchor_attr = get_best_anchor_attr(attr_list)
+                markup_list.append(
+                    parse_text(
+                        txt,
+                        TRANSFORM,
+                        lambda pattern, groups, span: TRANSFORM[pattern](groups),
+                    )
                )
-                widgets.append(columns)
+            else:
+                markup_list.append(run)
+        else:
+            markup_list.append(run)

-            list_item_num += increment
+    return TextEmbed(markup_list)

-        return urwid.Pile(widgets)

-    def render_pre(self, tag) -> urwid.Widget:
-        # <PRE> tag spec says that text should not wrap,
-        # but horizontal screen space is at a premium
-        # and we have no horizontal scroll bar, so allow
-        # wrapping.
+def process_block_tag_children(tag) -> List[urwid.Widget]:
+    """Recursively retrieve all children
+    and convert to a list of widgets
+    any inline tags containing text will be
+    converted to Text widgets"""

-        widget_list = [urwid.Divider(" ")]
-        widget_list += self.process_block_tag_children(tag)
+    pre_widget_markups = []
+    post_widget_markups = []
+    child_widgets = []
+    found_nested_widget = False

-        pre_widget = urwid.Padding(
+    for child in tag.children:
+        if isinstance(child, Tag):
+            # child is a nested tag; process using custom method
+            # or default to inline_tag_to_text
+            result = render(child.name, child)
+            if isinstance(result, urwid.Widget):
+                found_nested_widget = True
+                child_widgets.append(result)
+            else:
+                if not found_nested_widget:
+                    pre_widget_markups.append(result)
+                else:
+                    post_widget_markups.append(result)
+        else:
+            # child is text; append to the appropriate markup list
+            if not found_nested_widget:
+                pre_widget_markups.append(child)
+            else:
+                post_widget_markups.append(child)
+
+    widget_list = []
+    if len(pre_widget_markups):
+        widget_list.append(text_to_widget(tag.name, pre_widget_markups))
+
+    if len(child_widgets):
+        widget_list += child_widgets
+
+    if len(post_widget_markups):
+        widget_list.append(text_to_widget(tag.name, post_widget_markups))
+
+    return widget_list
+
+
+def get_urwid_attr_name(tag) -> str:
+    """Get the class name and translate to a
+    name suitable for use as an urwid
+    text attribute name"""
+
+    if "class" in tag.attrs:
+        clss = tag.attrs["class"]
+        if len(clss) > 0:
+            style_name = "class_" + "_".join(clss)
+            # return the class name, only if we
+            # find it as a defined palette name
+            if style_name in STYLE_NAMES:
+                return style_name
+
+    # fallback to returning the tag name
+    return tag.name
+
+
+def basic_block_tag_handler(tag) -> urwid.Widget:
+    """default for block tags that need no special treatment"""
+    return urwid.Pile(process_block_tag_children(tag))
+
+
+def get_best_anchor_attr(attrib_list) -> str:
+    if not attrib_list:
+        return ""
+    flat_al = list(flatten(attrib_list))
+
+    for a in flat_al[0]:
+        # ref: https://docs.joinmastodon.org/spec/activitypub/
+        # these are the class names (translated to attrib names)
+        # that we can support for display
+
+        try:
+            if a[0] in ["class_hashtag", "class_mention_hashtag", "class_mention"]:
+                return a[0]
+        except KeyError:
+            continue
+
+    return "a"
+
+
+def render(attr: str, content: str):
+    if attr in ["a"]:
+        return render_anchor(content)
+
+    if attr in ["blockquote"]:
+        return render_blockquote(content)
+
+    if attr in ["br"]:
+        return render_br(content)
+
+    if attr in ["em"]:
+        return render_em(content)
+
+    if attr in ["ol"]:
+        return render_ol(content)
+
+    if attr in ["pre"]:
+        return render_pre(content)
+
+    if attr in ["span"]:
+        return render_span(content)
+
+    if attr in ["b", "strong"]:
+        return render_strong(content)
+
+    if attr in ["ul"]:
+        return render_ul(content)
+
+    # Glitch-soc and Pleroma allow <H1>...<H6> in content
+    # Mastodon (PR #23913) does not; header tags are converted to <P><STRONG></STRONG></P>
+    if attr in ["p", "div", "li", "h1", "h2", "h3", "h4", "h5", "h6"]:
+        return basic_block_tag_handler(content)
+
+    # Fall back to inline_tag_to_text handler
+    return inline_tag_to_text(content)
+
+
+def render_anchor(tag) -> Tuple:
+    """anchor tag handler"""
+
+    markups = process_inline_tag_children(tag)
+    if not markups:
+        return (tag.name, "")
+
+    href = tag.attrs["href"]
+    title, attrib_list = decompose_tagmarkup(markups)
+    if not attrib_list:
+        attrib_list = [tag]
+    if href and has_urwidgets:
+        # only if we have urwidgets loaded for OCS 8 hyperlinks:
+        # urlencode the path and query portions of the URL
+        href = urlencode_url(href)
+        # use ASCII ETX (end of record) as a
+        # delimiter between the title and the HREF
+        title += f"\x03{href}"
+
+    attr = get_best_anchor_attr(attrib_list)
+
+    if attr == "a":
+        # didn't find an attribute to use
+        # in the child markup, so let's
+        # try the anchor tag's own attributes
+
+        attr = get_urwid_attr_name(tag)
+
+    # hashtag anchors have a class of "mention hashtag"
+    # or "hashtag"
+    # we'll return style "class_mention_hashtag"
+    # or "class_hashtag"
+    # in that case; see corresponding palette entry
+    # in constants.py controlling hashtag highlighting
+
+    return (attr, title)
+
+
+def render_blockquote(tag) -> urwid.Widget:
+    widget_list = process_block_tag_children(tag)
+    blockquote_widget = urwid.LineBox(
+        urwid.Padding(
            urwid.Pile(widget_list),
            align="left",
            width=("relative", 100),
            min_width=None,
            left=1,
            right=1,
-        )
-        return urwid.Pile([urwid.AttrMap(pre_widget, "pre")])
+        ),
+        tlcorner="",
+        tline="",
+        lline="│",
+        trcorner="",
+        blcorner="",
+        rline="",
+        bline="",
+        brcorner="",
+    )
+    return urwid.Pile([urwid.AttrMap(blockquote_widget, "blockquote")])

-    def render_span(self, tag) -> Tuple:
-        markups = self.process_inline_tag_children(tag)

-        if not markups:
-            return (tag.name, "")
+def render_br(tag) -> Tuple:
+    return ("br", "\n")

-        # span inherits its parent's class definition
-        # unless it has a specific class definition
-        # of its own

-        if "class" in tag.attrs:
-            # uncomment the following code to hide all HTML marked
-            # invisible (generally, the http:// prefix of URLs)
-            # could be a user preference, it's only advisable if
-            # the terminal supports OCS 8 hyperlinks (and that's not
-            # automatically detectable)
+def render_em(tag) -> Tuple:
+    # to simplify the number of palette entries
+    # translate EM to I (italic)
+    markups = process_inline_tag_children(tag)
+    if not markups:
+        return ("i", "")

-            # if "invisible" in tag.attrs["class"]:
-            #     return (tag.name, "")
+    # special case processing for bold and italic
+    for parent in tag.parents:
+        if parent.name == "b" or parent.name == "strong":
+            return ("bi", markups)

-            style_name = self.get_urwid_attr_name(tag)
+    return ("i", markups)

-            if style_name != "span":
-                # unique class name matches an entry in our palette
-                return (style_name, markups)

-        if tag.parent:
-            return (self.get_urwid_attr_name(tag.parent), markups)
+def render_ol(tag) -> urwid.Widget:
+    """ordered list tag handler"""
+
+    widgets = []
+    list_item_num = 1
+    increment = -1 if tag.has_attr("reversed") else 1
+
+    # get ol start= attribute if present
+    if tag.has_attr("start") and len(tag.attrs["start"]) > 0:
+        try:
+            list_item_num = int(tag.attrs["start"])
+        except ValueError:
+            pass
+
+    for li in tag.find_all("li", recursive=False):
+        markup = render("li", li)
+
+        # li value= attribute will change the item number
+        # it also overrides any ol start= attribute
+
+        if li.has_attr("value") and len(li.attrs["value"]) > 0:
+            try:
+                list_item_num = int(li.attrs["value"])
+            except ValueError:
+                pass
+
+        if not isinstance(markup, urwid.Widget):
+            txt = text_to_widget("li", [str(list_item_num), ". ", markup])
+            # 1. foo, 2. bar, etc.
+            widgets.append(txt)
        else:
-            # fallback
-            return ("span", markups)
+            txt = text_to_widget("li", [str(list_item_num), ". "])
+            columns = urwid.Columns(
+                [txt, ("weight", 9999, markup)], dividechars=1, min_width=3
+            )
+            widgets.append(columns)

-    def render_strong(self, tag) -> Tuple:
-        # to simplify the number of palette entries
-        # translate STRONG to B (bold)
-        markups = self.process_inline_tag_children(tag)
-        if not markups:
-            return ("b", "")
+        list_item_num += increment

-        # special case processing for bold and italic
-        for parent in tag.parents:
-            if parent.name == "i" or parent.name == "em":
-                return ("bi", markups)
+    return urwid.Pile(widgets)

-        return ("b", markups)

-    def render_ul(self, tag) -> urwid.Widget:
-        """unordered list tag handler"""
+def render_pre(tag) -> urwid.Widget:
+    # <PRE> tag spec says that text should not wrap,
+    # but horizontal screen space is at a premium
+    # and we have no horizontal scroll bar, so allow
+    # wrapping.

-        widgets = []
+    widget_list = [urwid.Divider(" ")]
+    widget_list += process_block_tag_children(tag)

-        for li in tag.find_all("li", recursive=False):
-            markup = self.render("li", li)
+    pre_widget = urwid.Padding(
+        urwid.Pile(widget_list),
+        align="left",
+        width=("relative", 100),
+        min_width=None,
+        left=1,
+        right=1,
+    )
+    return urwid.Pile([urwid.AttrMap(pre_widget, "pre")])

-            if not isinstance(markup, urwid.Widget):
-                txt = self.text_to_widget("li", ["\N{bullet} ", markup])
-                # * foo, * bar, etc.
-                widgets.append(txt)
-            else:
-                txt = self.text_to_widget("li", ["\N{bullet} "])
-                columns = urwid.Columns(
-                    [txt, ("weight", 9999, markup)], dividechars=1, min_width=3
-                )
-                widgets.append(columns)

-        return urwid.Pile(widgets)
+def render_span(tag) -> Tuple:
+    markups = process_inline_tag_children(tag)
+
+    if not markups:
+        return (tag.name, "")
+
+    # span inherits its parent's class definition
+    # unless it has a specific class definition
+    # of its own
+
+    if "class" in tag.attrs:
+        # uncomment the following code to hide all HTML marked
+        # invisible (generally, the http:// prefix of URLs)
+        # could be a user preference, it's only advisable if
+        # the terminal supports OCS 8 hyperlinks (and that's not
+        # automatically detectable)
+
+        # if "invisible" in tag.attrs["class"]:
+        #     return (tag.name, "")
+
+        style_name = get_urwid_attr_name(tag)
+
+        if style_name != "span":
+            # unique class name matches an entry in our palette
+            return (style_name, markups)
+
+    if tag.parent:
+        return (get_urwid_attr_name(tag.parent), markups)
+    else:
+        # fallback
+        return ("span", markups)
+
+
+def render_strong(tag) -> Tuple:
+    # to simplify the number of palette entries
+    # translate STRONG to B (bold)
+    markups = process_inline_tag_children(tag)
+    if not markups:
+        return ("b", "")
+
+    # special case processing for bold and italic
+    for parent in tag.parents:
+        if parent.name == "i" or parent.name == "em":
+            return ("bi", markups)
+
+    return ("b", markups)
+
+
+def render_ul(tag) -> urwid.Widget:
+    """unordered list tag handler"""
+
+    widgets = []
+
+    for li in tag.find_all("li", recursive=False):
+        markup = render("li", li)
+
+        if not isinstance(markup, urwid.Widget):
+            txt = text_to_widget("li", ["\N{bullet} ", markup])
+            # * foo, * bar, etc.
+            widgets.append(txt)
+        else:
+            txt = text_to_widget("li", ["\N{bullet} "])
+            columns = urwid.Columns(
+                [txt, ("weight", 9999, markup)], dividechars=1, min_width=3
+            )
+            widgets.append(columns)
+
+    return urwid.Pile(widgets)


 def flatten(data):
--- a/toot/tui/timeline.py
+++ b/toot/tui/timeline.py
@ -6,6 +6,7 @@ import webbrowser
 from typing import List, Optional

 from toot.tui import app
+from toot.tui.richtext import html_to_widgets
 from toot.utils.datetime import parse_datetime, time_ago
 from toot.utils.language import language_name

@ -13,7 +14,6 @@ from toot.entities import Status
 from toot.tui.scroll import Scrollable, ScrollBar
 from toot.tui.utils import highlight_keys
 from toot.tui.widgets import SelectableText, SelectableColumns
-from toot.tui.richtext import ContentParser
 from toot.utils import urlencode_url
 from toot.tui.stubs.urwidgets import Hyperlink, TextEmbed, parse_text, has_urwidgets

@ -356,9 +356,7 @@ class StatusDetails(urwid.Pile):
            yield ("pack", urwid.Text(("content_warning", "Marked as sensitive. Press S to view.")))
        else:
            content = status.original.translation if status.original.show_translation else status.data["content"]
-
-            parser = ContentParser()
-            widgetlist = parser.html_to_widgets(content)
+            widgetlist = html_to_widgets(content)

            for line in widgetlist:
                yield (line)