microblog.pub/app/webfinger.py

91 lines
2.7 KiB
Python
Raw Normal View History

2022-06-22 20:11:22 +02:00
from typing import Any
from urllib.parse import urlparse
import httpx
from loguru import logger
2022-06-26 10:01:26 +02:00
from app import config
2022-07-15 20:50:27 +02:00
from app.utils.url import check_url
2022-06-22 20:11:22 +02:00
2022-06-30 00:28:07 +02:00
async def webfinger(
2022-06-22 20:11:22 +02:00
resource: str,
) -> dict[str, Any] | None: # noqa: C901
"""Mastodon-like WebFinger resolution to retrieve the activity stream Actor URL."""
logger.info(f"performing webfinger resolution for {resource}")
protos = ["https", "http"]
if resource.startswith("http://"):
protos.reverse()
host = urlparse(resource).netloc
elif resource.startswith("https://"):
host = urlparse(resource).netloc
else:
if resource.startswith("acct:"):
resource = resource[5:]
if resource.startswith("@"):
resource = resource[1:]
_, host = resource.split("@", 1)
resource = "acct:" + resource
is_404 = False
2022-06-30 00:28:07 +02:00
async with httpx.AsyncClient() as client:
for i, proto in enumerate(protos):
try:
url = f"{proto}://{host}/.well-known/webfinger"
2022-07-15 20:50:27 +02:00
check_url(url)
2022-06-30 00:28:07 +02:00
resp = await client.get(
url,
params={"resource": resource},
headers={
"User-Agent": config.USER_AGENT,
},
2022-07-08 12:10:20 +02:00
follow_redirects=True,
2022-06-30 00:28:07 +02:00
)
2022-07-08 12:10:20 +02:00
resp.raise_for_status()
2022-06-30 00:28:07 +02:00
break
except httpx.HTTPStatusError as http_error:
logger.exception("HTTP error")
if http_error.response.status_code in [403, 404, 410]:
is_404 = True
continue
raise
except httpx.HTTPError:
logger.exception("req failed")
# If we tried https first and the domain is "http only"
if i == 0:
continue
break
2022-06-22 20:11:22 +02:00
if is_404:
return None
2022-06-26 10:01:26 +02:00
return resp.json()
2022-06-22 20:11:22 +02:00
2022-06-30 00:28:07 +02:00
async def get_remote_follow_template(resource: str) -> str | None:
data = await webfinger(resource)
2022-06-22 20:11:22 +02:00
if data is None:
return None
for link in data["links"]:
if link.get("rel") == "http://ostatus.org/schema/1.0/subscribe":
return link.get("template")
return None
2022-06-30 00:28:07 +02:00
async def get_actor_url(resource: str) -> str | None:
2022-06-22 20:11:22 +02:00
"""Mastodon-like WebFinger resolution to retrieve the activity stream Actor URL.
Returns:
the Actor URL or None if the resolution failed.
"""
2022-06-30 00:28:07 +02:00
data = await webfinger(resource)
2022-06-22 20:11:22 +02:00
if data is None:
return None
for link in data["links"]:
if (
link.get("rel") == "self"
and link.get("type") == "application/activity+json"
):
return link.get("href")
return None