import httpx from bs4 import BeautifulSoup # type: ignore from fastapi import APIRouter from fastapi import Depends from fastapi import HTTPException from fastapi import Request from fastapi.responses import JSONResponse from loguru import logger from sqlalchemy import select from app import models from app.boxes import get_outbox_object_by_ap_id from app.database import AsyncSession from app.database import get_db_session from app.utils import microformats from app.utils.url import check_url from app.utils.url import is_url_valid router = APIRouter() def is_source_containing_target(source_html: str, target_url: str) -> bool: soup = BeautifulSoup(source_html, "html5lib") for link in soup.find_all("a"): h = link.get("href") if not is_url_valid(h): continue if h == target_url: return True return False @router.post("/webmentions") async def webmention_endpoint( request: Request, db_session: AsyncSession = Depends(get_db_session), ) -> JSONResponse: form_data = await request.form() try: source = form_data["source"] target = form_data["target"] if source == target: raise ValueError("source URL is the same as target") check_url(source) check_url(target) except Exception: logger.exception("Invalid webmention request") raise HTTPException(status_code=400, detail="Invalid payload") logger.info(f"Received webmention {source=} {target=}") existing_webmention_in_db = ( await db_session.execute( select(models.Webmention).where( models.Webmention.source == source, models.Webmention.target == target, ) ) ).scalar_one_or_none() if existing_webmention_in_db: logger.info("Found existing Webmention, will try to update or delete") mentioned_object = await get_outbox_object_by_ap_id(db_session, target) if not mentioned_object: logger.info(f"Invalid target {target=}") if existing_webmention_in_db: logger.info("Deleting existing Webmention") existing_webmention_in_db.is_deleted = True await db_session.commit() raise HTTPException(status_code=400, detail="Invalid target") is_webmention_deleted = False try: data_and_html = await microformats.fetch_and_parse(source) except microformats.URLNotFoundOrGone: is_webmention_deleted = True except httpx.HTTPError: raise HTTPException(status_code=500, detail=f"Fetch to process {source}") data, html = data_and_html is_target_found_in_source = is_source_containing_target(html, target) data, html = data_and_html if is_webmention_deleted or not is_target_found_in_source: logger.warning(f"target {target=} not found in source") if existing_webmention_in_db: logger.info("Deleting existing Webmention") mentioned_object.webmentions_count = mentioned_object.webmentions_count - 1 existing_webmention_in_db.is_deleted = True notif = models.Notification( notification_type=models.NotificationType.DELETED_WEBMENTION, outbox_object_id=mentioned_object.id, webmention_id=existing_webmention_in_db.id, ) db_session.add(notif) await db_session.commit() if not is_target_found_in_source: raise HTTPException( status_code=400, detail="target not found in source", ) else: return JSONResponse(content={}, status_code=200) if existing_webmention_in_db: # Undelete if needed existing_webmention_in_db.is_deleted = False existing_webmention_in_db.source_microformats = data notif = models.Notification( notification_type=models.NotificationType.UPDATED_WEBMENTION, outbox_object_id=mentioned_object.id, webmention_id=existing_webmention_in_db.id, ) db_session.add(notif) else: new_webmention = models.Webmention( source=source, target=target, source_microformats=data, outbox_object_id=mentioned_object.id, ) db_session.add(new_webmention) await db_session.flush() notif = models.Notification( notification_type=models.NotificationType.NEW_WEBMENTION, outbox_object_id=mentioned_object.id, webmention_id=new_webmention.id, ) db_session.add(notif) mentioned_object.webmentions_count = mentioned_object.webmentions_count + 1 await db_session.commit() return JSONResponse(content={}, status_code=200)