Toot-Mastodon-CLI-TUI-clien.../toot/utils.py

# -*- coding: utf-8 -*-

import os
import re
import socket
import subprocess
import tempfile
import unicodedata
import warnings

from bs4 import BeautifulSoup

from toot.exceptions import ConsoleError


def str_bool(b):
    """Render a truthy/falsy value as the lowercase string the API expects.

    Returns "true" when `b` is truthy and "false" otherwise.
    """
    if b:
        return "true"
    return "false"


def get_text(html):
    """Return the plain text of an HTML fragment with every tag removed.

    `&apos;` entities are replaced by a literal apostrophe before parsing,
    and the extracted text is NFKC-normalized before being returned.
    """
    markup = html.replace('&apos;', "'")

    # BeautifulSoup emits a warning when the markup looks like a file name
    # (for instance a lone dot), suggesting that the file be opened instead.
    # Those warnings are silenced for the duration of the parse.
    with warnings.catch_warnings():
        warnings.simplefilter("ignore")
        soup = BeautifulSoup(markup, "html.parser")
        plain = soup.get_text()

    return unicodedata.normalize('NFKC', plain)


def parse_html(html):
    """Attempt to convert html to plain text while keeping line breaks.

    The markup is split into paragraphs on opening/closing `<p>` tags, and
    each paragraph is split into lines on `<br>` tags. Every resulting line
    is then converted to plain text with `get_text`.

    Returns a list of paragraphs, each being a list of lines.
    """
    # The \b after "p" restricts the match to real <p> tags. Without it the
    # pattern also matched any tag whose name merely starts with "p"
    # (<pre>, <picture>, <param>, ...) and treated it as a paragraph boundary.
    paragraphs = re.split(r"</?p\b[^>]*>", html)

    # Convert <br>s to line breaks and remove empty paragraphs
    paragraphs = [re.split(r"<br */?>", p) for p in paragraphs if p]

    # Convert each line in each paragraph to plain text:
    return [[get_text(line) for line in p] for p in paragraphs]


def format_content(content):
    """Turn the HTML contents of a Status into lines of plain text.

    This is a generator: it yields the lines of each paragraph in order,
    with a single empty string emitted between consecutive paragraphs.
    """
    for index, paragraph in enumerate(parse_html(content)):
        # Separate this paragraph from the previous one with a blank line.
        if index > 0:
            yield ""

        yield from paragraph


def domain_exists(name):
    """Return True if `name` can be resolved to an address, False otherwise.

    Names which cannot be resolved, as well as names which are not valid
    host names at all, both yield False.
    """
    try:
        socket.gethostbyname(name)
    except (OSError, UnicodeError):
        # OSError covers failed lookups. UnicodeError is raised before any
        # lookup happens when the name cannot be IDNA-encoded, e.g. when it
        # contains an empty label ("foo..bar") or a label longer than 63
        # characters; such a name cannot exist either.
        return False

    return True


def assert_domain_exists(domain):
    """Raise ConsoleError unless `domain_exists` reports that `domain` exists."""
    if domain_exists(domain):
        return

    message = "Domain {} not found".format(domain)
    raise ConsoleError(message)


# Name of the end-of-file key combination: Ctrl-Z when os.name is 'nt',
# Ctrl-D everywhere else.
EOF_KEY = "Ctrl-D" if os.name != 'nt' else "Ctrl-Z"


def multiline_input():
    """Read lines from the user until EOF and return them as one string.

    The lines are joined with newlines, and leading/trailing whitespace is
    stripped from the combined text.
    """
    collected = []

    # input() raises EOFError once the input is exhausted, which is what
    # ends the otherwise endless loop.
    try:
        while True:
            collected.append(input())
    except EOFError:
        pass

    joined = "\n".join(collected)
    return joined.strip()


# Appended to the text handed to the editor; being '#' lines, the instructions
# are dropped again when the edited text is read back.
EDITOR_INPUT_INSTRUCTIONS = """
# Please enter your toot. Lines starting with '#' will be ignored, and an empty
# message aborts the post.
"""


def editor_input(editor, initial_text):
    """Lets user input text using an editor.

    Writes `initial_text` (may be None or empty) followed by the editing
    instructions to a temporary file, runs `editor` with the file's path as
    its only argument, and reads the file back once the editor exits.

    Returns the edited text with lines starting with '#' removed and
    surrounding whitespace stripped, so a message consisting only of
    comments and blank lines comes back as an empty string.
    """
    initial_text = (initial_text or "") + EDITOR_INPUT_INSTRUCTIONS

    # The file is created with delete=False and closed before the editor is
    # started: on Windows a named temporary file cannot be opened a second
    # time while it is still open here.
    with tempfile.NamedTemporaryFile(delete=False) as f:
        f.write(initial_text.encode())
        path = f.name

    try:
        subprocess.run([editor, path])

        # Re-open by path instead of reusing the original handle: editors
        # which save by writing a new file over the old one would otherwise
        # leave us reading the stale, unedited contents.
        with open(path, "rb") as edited:
            text = edited.read().decode()
    finally:
        # Best-effort cleanup; the editor may already have removed the file.
        try:
            os.unlink(path)
        except FileNotFoundError:
            pass

    lines = text.strip().splitlines()
    lines = (line for line in lines if not line.startswith("#"))

    # Strip again after dropping the comment lines, so blank lines left
    # between the message and the instructions do not end up in the result.
    return "\n".join(lines).strip()
Rework status content wrapping 2017-04-24 16:25:34 +02:00			`# -*- coding: utf-8 -*-`

Make toot post prompt for input if no text is given fixes #82 2019-01-02 10:49:49 +01:00			`import os`
Rework status content wrapping 2017-04-24 16:25:34 +02:00			`import re`
Add instance command 2017-12-29 14:26:40 +01:00			`import socket`
Implement composing tweets using an editor fixes #90 2019-08-22 17:10:37 +02:00			`import subprocess`
			`import tempfile`
Normalize unicode 2018-01-21 16:39:40 +01:00			`import unicodedata`
Ignore bs4 warnings These are triggered by false positives and get printed to screen when running `toot curses`. 2019-02-13 13:38:37 +01:00			`import warnings`
Rework status content wrapping 2017-04-24 16:25:34 +02:00
			`from bs4 import BeautifulSoup`

Use http methods instead of requests directly 2017-12-30 16:30:35 +01:00			`from toot.exceptions import ConsoleError`

Rework status content wrapping 2017-04-24 16:25:34 +02:00
Make boolen params a bit less verbose 2019-01-24 11:18:28 +01:00			`def str_bool(b):`
			`"""Convert boolean to string, in the way expected by the API."""`
			`return "true" if b else "false"`


Rework status content wrapping 2017-04-24 16:25:34 +02:00			`def get_text(html):`
			`"""Converts html to text, strips all tags."""`
Ignore bs4 warnings These are triggered by false positives and get printed to screen when running `toot curses`. 2019-02-13 13:38:37 +01:00
			`# Ignore warnings made by BeautifulSoup, if passed something that looks like`
			`# a file (e.g. a dot which matches current dict), it will warn that the file`
			`# should be opened instead of passing a filename.`
			`with warnings.catch_warnings():`
			`warnings.simplefilter("ignore")`
			`text = BeautifulSoup(html.replace('&apos;', "'"), "html.parser").get_text()`
Normalize unicode 2018-01-21 16:39:40 +01:00
			`return unicodedata.normalize('NFKC', text)`
Rework status content wrapping 2017-04-24 16:25:34 +02:00

			`def parse_html(html):`
			`"""Attempt to convert html to plain text while keeping line breaks.`
			`Returns a list of paragraphs, each being a list of lines.`
			`"""`
			`paragraphs = re.split("</?p[^>]*>", html)`

			`# Convert <br>s to line breaks and remove empty paragraphs`
			`paragraphs = [re.split("<br */?>", p) for p in paragraphs if p]`

			`# Convert each line in each paragraph to plain text:`
			`return [[get_text(l) for l in p] for p in paragraphs]`


			`def format_content(content):`
			`"""Given a Status contents in HTML, converts it into lines of plain text.`

			`Returns a generator yielding lines of content.`
			`"""`

			`paragraphs = parse_html(content)`

			`first = True`

			`for paragraph in paragraphs:`
			`if not first:`
			`yield ""`

			`for line in paragraph:`
			`yield line`

			`first = False`
Add instance command 2017-12-29 14:26:40 +01:00

			`def domain_exists(name):`
			`try:`
			`socket.gethostbyname(name)`
			`return True`
			`except OSError:`
			`return False`
Use http methods instead of requests directly 2017-12-30 16:30:35 +01:00

			`def assert_domain_exists(domain):`
			`if not domain_exists(domain):`
			`raise ConsoleError("Domain {} not found".format(domain))`
Dynamically size the status list window This makes toot more usable on narrow screens. Still requires 60 columns minimum. fixes #26 2018-01-04 12:36:14 +01:00

Make toot post prompt for input if no text is given fixes #82 2019-01-02 10:49:49 +01:00			`EOF_KEY = "Ctrl-Z" if os.name == 'nt' else "Ctrl-D"`


			`def multiline_input():`
			`"""Lets user input multiple lines of text, terminated by EOF."""`
			`lines = []`
			`while True:`
			`try:`
			`lines.append(input())`
			`except EOFError:`
			`break`

			`return "\n".join(lines).strip()`
Implement composing tweets using an editor fixes #90 2019-08-22 17:10:37 +02:00

			`EDITOR_INPUT_INSTRUCTIONS = """`
			`# Please enter your toot. Lines starting with '#' will be ignored, and an empty`
			`# message aborts the post.`
			`"""`


			`def editor_input(editor, initial_text):`
			`"""Lets user input text using an editor."""`
			`initial_text = (initial_text or "") + EDITOR_INPUT_INSTRUCTIONS`

			`with tempfile.NamedTemporaryFile() as f:`
			`f.write(initial_text.encode())`
			`f.flush()`

			`subprocess.run([editor, f.name])`

			`f.seek(0)`
			`text = f.read().decode()`

			`lines = text.strip().splitlines()`
			`lines = (l for l in lines if not l.startswith("#"))`
			`return "\n".join(lines)`