Unicode normalize 'NFKC' incoming HTML text before rendering

2023-04-04 19:43:37 -04:00 · 2023-04-04 19:43:37 -04:00 · 0dba44ff5e
parent 874baf1ef0
commit 0dba44ff5e
1 changed file with 2 additions and 0 deletions
--- a/toot/tui/richtext.py
+++ b/toot/tui/richtext.py
@ -3,6 +3,7 @@ richtext
 """
 from typing import List
 import urwid
 import unicodedata
 from bs4 import BeautifulSoup
 from bs4.element import NavigableString, Tag
@ -14,6 +15,7 @@ class ContentParser:
    def html_to_widgets(self, html) -> List[urwid.Widget]:
        """Convert html to urwid widgets"""
        widgets: List[urwid.Widget] = []
        html = unicodedata.normalize('NFKC', html)
        soup = BeautifulSoup(html.replace("&apos;", "'"), "html.parser")
        for e in soup.body or soup:
            if isinstance(e, NavigableString):