import base64 import os import sys import time from datetime import timezone from io import BytesIO from typing import Any from typing import MutableMapping from typing import Type import fastapi import httpx import starlette from asgiref.typing import ASGI3Application from asgiref.typing import ASGIReceiveCallable from asgiref.typing import ASGISendCallable from asgiref.typing import Scope from cachetools import LFUCache from fastapi import Depends from fastapi import FastAPI from fastapi import Form from fastapi import Request from fastapi import Response from fastapi.exception_handlers import http_exception_handler from fastapi.exceptions import HTTPException from fastapi.responses import FileResponse from fastapi.responses import PlainTextResponse from fastapi.responses import RedirectResponse from fastapi.responses import StreamingResponse from fastapi.staticfiles import StaticFiles from feedgen.feed import FeedGenerator # type: ignore from loguru import logger from PIL import Image from sqlalchemy import func from sqlalchemy import select from sqlalchemy.orm import joinedload from starlette.background import BackgroundTask from starlette.datastructures import Headers from starlette.datastructures import MutableHeaders from starlette.exceptions import HTTPException as StarletteHTTPException from starlette.responses import JSONResponse from starlette.types import Message from uvicorn.middleware.proxy_headers import ProxyHeadersMiddleware # type: ignore from app import activitypub as ap from app import admin from app import boxes from app import config from app import httpsig from app import indieauth from app import media from app import micropub from app import models from app import templates from app import webmentions from app.actor import LOCAL_ACTOR from app.actor import get_actors_metadata from app.boxes import public_outbox_objects_count from app.config import BASE_URL from app.config import DEBUG from app.config import DOMAIN from app.config import ID from app.config import USER_AGENT from app.config import USERNAME from app.config import is_activitypub_requested from app.config import verify_csrf_token from app.customization import get_custom_router from app.database import AsyncSession from app.database import async_session from app.database import get_db_session from app.incoming_activities import new_ap_incoming_activity from app.templates import is_current_user_admin from app.uploads import UPLOAD_DIR from app.utils import pagination from app.utils.emoji import EMOJIS_BY_NAME from app.utils.facepile import Face from app.utils.facepile import WebmentionReply from app.utils.facepile import merge_faces from app.utils.highlight import HIGHLIGHT_CSS_HASH from app.utils.url import check_url from app.webfinger import get_remote_follow_template # Only images <1MB will be cached, so 32MB of data will be cached _RESIZED_CACHE: MutableMapping[tuple[str, int], tuple[bytes, str, Any]] = LFUCache(32) # TODO(ts): # Next: # - self-destruct + move support and actions/tasks for # - doc for prune/move/delete # - fix issue with followers from a blocked server (skip it?) # - allow to share old notes # - only show 10 most recent threads in DMs # - prevent double accept/double follow # - UI support for updating posts # - indieauth tweaks # - support update post with history? class CustomMiddleware: """Raw ASGI middleware as using starlette base middleware causes issues with both: - Jinja2: https://github.com/encode/starlette/issues/472 - async SQLAchemy: https://github.com/tiangolo/fastapi/issues/4719 """ def __init__( self, app: ASGI3Application, ) -> None: self.app = app async def __call__( self, scope: Scope, receive: ASGIReceiveCallable, send: ASGISendCallable ) -> None: # We only care about HTTP requests if scope["type"] != "http": await self.app(scope, receive, send) return response_details = {"status_code": None} start_time = time.perf_counter() request_id = os.urandom(8).hex() async def send_wrapper(message: Message) -> None: if message["type"] == "http.response.start": # Extract the HTTP response status code response_details["status_code"] = message["status"] # And add the security headers headers = MutableHeaders(scope=message) headers["X-Request-ID"] = request_id headers["x-powered-by"] = "microblogpub" headers[ "referrer-policy" ] = "no-referrer, strict-origin-when-cross-origin" headers["x-content-type-options"] = "nosniff" headers["x-xss-protection"] = "1; mode=block" headers["x-frame-options"] = "DENY" headers["permissions-policy"] = "interest-cohort=()" headers["content-security-policy"] = ( ( f"default-src 'self'; " f"style-src 'self' 'sha256-{HIGHLIGHT_CSS_HASH}'; " f"frame-ancestors 'none'; base-uri 'self'; form-action 'self';" ) if not config.CUSTOM_CONTENT_SECURITY_POLICY else config.CUSTOM_CONTENT_SECURITY_POLICY.format( HIGHLIGHT_CSS_HASH=HIGHLIGHT_CSS_HASH ) ) if not DEBUG: headers["strict-transport-security"] = "max-age=63072000;" await send(message) # type: ignore # Make loguru ouput the request ID on every log statement within # the request with logger.contextualize(request_id=request_id): client_host, client_port = scope["client"] # type: ignore scheme = scope["scheme"] server_host, server_port = scope["server"] # type: ignore request_method = scope["method"] request_path = scope["path"] headers = Headers(raw=scope["headers"]) # type: ignore user_agent = headers.get("user-agent") logger.info( f"{client_host}:{client_port} - " f"{request_method} " f"{scheme}://{server_host}:{server_port}{request_path} - " f'"{user_agent}"' ) try: await self.app(scope, receive, send_wrapper) # type: ignore finally: elapsed_time = time.perf_counter() - start_time logger.info( f"status_code={response_details['status_code']} " f"{elapsed_time=:.2f}s" ) return None def _check_0rtt_early_data(request: Request) -> None: """Disable TLS1.3 0-RTT requests for non-GET.""" if request.headers.get("Early-Data", None) == "1" and request.method != "GET": raise fastapi.HTTPException(status_code=425, detail="Too early") app = FastAPI( docs_url=None, redoc_url=None, dependencies=[Depends(_check_0rtt_early_data)] ) app.mount( "/custom_emoji", StaticFiles(directory="data/custom_emoji"), name="custom_emoji", ) app.mount("/static", StaticFiles(directory="app/static"), name="static") app.include_router(admin.router, prefix="/admin") app.include_router(admin.unauthenticated_router, prefix="/admin") app.include_router(indieauth.router) app.include_router(micropub.router) app.include_router(webmentions.router) config.load_custom_routes() if custom_router := get_custom_router(): app.include_router(custom_router) # XXX: order matters, the proxy middleware needs to be last app.add_middleware(CustomMiddleware) app.add_middleware(ProxyHeadersMiddleware, trusted_hosts=config.CONFIG.trusted_hosts) logger.configure(extra={"request_id": "no_req_id"}) logger.remove() logger_format = ( "{time:YYYY-MM-DD HH:mm:ss.SSS} | " "{level: <8} | " "{name}:{function}:{line} | " "{extra[request_id]} - {message}" ) logger.add(sys.stdout, format=logger_format, level="DEBUG" if DEBUG else "INFO") @app.exception_handler(StarletteHTTPException) async def custom_http_exception_handler( request: Request, exc: StarletteHTTPException, ) -> templates.TemplateResponse | JSONResponse: accept_value = request.headers.get("accept") if ( accept_value and accept_value.startswith("text/html") and 400 <= exc.status_code < 600 ): async with async_session() as db_session: title = ( { 404: "Oops, nothing to see here", 500: "Oops, something went wrong", } ).get(exc.status_code, exc.detail) try: return await templates.render_template( db_session, request, "error.html", {"title": title}, status_code=exc.status_code, ) finally: await db_session.close() return await http_exception_handler(request, exc) class ActivityPubResponse(JSONResponse): media_type = "application/activity+json" async def redirect_to_remote_instance( request: Request, db_session: AsyncSession, url: str, ) -> templates.TemplateResponse: """ Similar to RedirectResponse, but uses a 200 response with HTML. Needed for remote redirects on form submission endpoints, since our CSP policy disallows remote form submission. https://github.com/w3c/webappsec-csp/issues/8#issuecomment-810108984 """ return await templates.render_template( db_session, request, "redirect_to_remote_instance.html", { "request": request, "url": url, }, headers={"Refresh": "0;url=" + url}, ) @app.get(config.NavBarItems.NOTES_PATH) async def index( request: Request, db_session: AsyncSession = Depends(get_db_session), page: int | None = None, ) -> templates.TemplateResponse | ActivityPubResponse: if is_activitypub_requested(request): return ActivityPubResponse(LOCAL_ACTOR.ap_actor) page = page or 1 where = ( models.OutboxObject.visibility == ap.VisibilityEnum.PUBLIC, models.OutboxObject.is_deleted.is_(False), models.OutboxObject.is_hidden_from_homepage.is_(False), models.OutboxObject.ap_type.in_(["Announce", "Note", "Video", "Question"]), ) q = select(models.OutboxObject).where(*where) total_count = await db_session.scalar( select(func.count(models.OutboxObject.id)).where(*where) ) page_size = 20 page_offset = (page - 1) * page_size outbox_objects_result = await db_session.scalars( q.options( joinedload(models.OutboxObject.outbox_object_attachments).options( joinedload(models.OutboxObjectAttachment.upload) ), joinedload(models.OutboxObject.relates_to_inbox_object).options( joinedload(models.InboxObject.actor), ), joinedload(models.OutboxObject.relates_to_outbox_object).options( joinedload(models.OutboxObject.outbox_object_attachments).options( joinedload(models.OutboxObjectAttachment.upload) ), ), ) .order_by(models.OutboxObject.is_pinned.desc()) .order_by(models.OutboxObject.ap_published_at.desc()) .offset(page_offset) .limit(page_size) ) outbox_objects = outbox_objects_result.unique().all() return await templates.render_template( db_session, request, "index.html", { "request": request, "objects": outbox_objects, "current_page": page, "has_next_page": page_offset + len(outbox_objects) < total_count, "has_previous_page": page > 1, }, ) @app.get("/articles") async def articles( request: Request, db_session: AsyncSession = Depends(get_db_session), _: httpsig.HTTPSigInfo = Depends(httpsig.httpsig_checker), page: int | None = None, ) -> templates.TemplateResponse | ActivityPubResponse: # TODO: special ActivityPub collection for Article where = ( models.OutboxObject.visibility == ap.VisibilityEnum.PUBLIC, models.OutboxObject.is_deleted.is_(False), models.OutboxObject.is_hidden_from_homepage.is_(False), models.OutboxObject.ap_type == "Article", ) q = select(models.OutboxObject).where(*where) outbox_objects_result = await db_session.scalars( q.options( joinedload(models.OutboxObject.outbox_object_attachments).options( joinedload(models.OutboxObjectAttachment.upload) ), joinedload(models.OutboxObject.relates_to_inbox_object).options( joinedload(models.InboxObject.actor), ), joinedload(models.OutboxObject.relates_to_outbox_object).options( joinedload(models.OutboxObject.outbox_object_attachments).options( joinedload(models.OutboxObjectAttachment.upload) ), ), ).order_by(models.OutboxObject.ap_published_at.desc()) ) outbox_objects = outbox_objects_result.unique().all() return await templates.render_template( db_session, request, "articles.html", { "request": request, "objects": outbox_objects, }, ) async def _build_followx_collection( db_session: AsyncSession, model_cls: Type[models.Following | models.Follower], path: str, page: bool | None, next_cursor: str | None, ) -> ap.RawObject: total_items = await db_session.scalar(select(func.count(model_cls.id))) if not page and not next_cursor: return { "@context": ap.AS_CTX, "id": ID + path, "first": ID + path + "?page=true", "type": "OrderedCollection", "totalItems": total_items, } q = select(model_cls).order_by(model_cls.created_at.desc()) # type: ignore if next_cursor: q = q.where( model_cls.created_at < pagination.decode_cursor(next_cursor) # type: ignore ) q = q.limit(20) items = [followx for followx in (await db_session.scalars(q)).all()] next_cursor = None if ( items and await db_session.scalar( select(func.count(model_cls.id)).where( model_cls.created_at < items[-1].created_at ) ) > 0 ): next_cursor = pagination.encode_cursor(items[-1].created_at) collection_page = { "@context": ap.AS_CTX, "id": ( ID + path + "?page=true" if not next_cursor else ID + path + f"?next_cursor={next_cursor}" ), "partOf": ID + path, "type": "OrderedCollectionPage", "orderedItems": [item.ap_actor_id for item in items], } if next_cursor: collection_page["next"] = ID + path + f"?next_cursor={next_cursor}" return collection_page async def _empty_followx_collection( db_session: AsyncSession, model_cls: Type[models.Following | models.Follower], path: str, ) -> ap.RawObject: total_items = await db_session.scalar(select(func.count(model_cls.id))) return { "@context": ap.AS_CTX, "id": ID + path, "type": "OrderedCollection", "totalItems": total_items, } @app.get("/followers") async def followers( request: Request, page: bool | None = None, next_cursor: str | None = None, prev_cursor: str | None = None, db_session: AsyncSession = Depends(get_db_session), _: httpsig.HTTPSigInfo = Depends(httpsig.httpsig_checker), ) -> ActivityPubResponse | templates.TemplateResponse: if is_activitypub_requested(request): maybe_access_token_info = await indieauth.check_access_token( request, db_session, ) if config.HIDES_FOLLOWERS and not maybe_access_token_info: return ActivityPubResponse( await _empty_followx_collection( db_session=db_session, model_cls=models.Follower, path="/followers", ) ) else: return ActivityPubResponse( await _build_followx_collection( db_session=db_session, model_cls=models.Follower, path="/followers", page=page, next_cursor=next_cursor, ) ) if config.HIDES_FOLLOWERS and not is_current_user_admin(request): raise HTTPException(status_code=404) # We only show the most recent 20 followers on the public website followers_result = await db_session.scalars( select(models.Follower) .options(joinedload(models.Follower.actor)) .order_by(models.Follower.created_at.desc()) .limit(20) ) followers = followers_result.unique().all() actors_metadata = {} if is_current_user_admin(request): actors_metadata = await get_actors_metadata( db_session, [f.actor for f in followers], ) return await templates.render_template( db_session, request, "followers.html", { "followers": followers, "actors_metadata": actors_metadata, }, ) @app.get("/following") async def following( request: Request, page: bool | None = None, next_cursor: str | None = None, prev_cursor: str | None = None, db_session: AsyncSession = Depends(get_db_session), _: httpsig.HTTPSigInfo = Depends(httpsig.httpsig_checker), ) -> ActivityPubResponse | templates.TemplateResponse: if is_activitypub_requested(request): maybe_access_token_info = await indieauth.check_access_token( request, db_session, ) if config.HIDES_FOLLOWING and not maybe_access_token_info: return ActivityPubResponse( await _empty_followx_collection( db_session=db_session, model_cls=models.Following, path="/following", ) ) else: return ActivityPubResponse( await _build_followx_collection( db_session=db_session, model_cls=models.Following, path="/following", page=page, next_cursor=next_cursor, ) ) if config.HIDES_FOLLOWING and not is_current_user_admin(request): raise HTTPException(status_code=404) # We only show the most recent 20 follows on the public website following = ( ( await db_session.scalars( select(models.Following) .options(joinedload(models.Following.actor)) .order_by(models.Following.created_at.desc()) .limit(20) ) ) .unique() .all() ) actors_metadata = {} if is_current_user_admin(request): actors_metadata = await get_actors_metadata( db_session, [f.actor for f in following], ) return await templates.render_template( db_session, request, "following.html", { "following": following, "actors_metadata": actors_metadata, }, ) @app.get("/outbox") async def outbox( request: Request, db_session: AsyncSession = Depends(get_db_session), _: httpsig.HTTPSigInfo = Depends(httpsig.httpsig_checker), ) -> ActivityPubResponse: maybe_access_token_info = await indieauth.check_access_token( request, db_session, ) # Default restrictions unless the request is authenticated with an access token restricted_where = [ models.OutboxObject.visibility == ap.VisibilityEnum.PUBLIC, models.OutboxObject.ap_type.in_(["Create", "Note", "Article", "Announce"]), ] # By design, we only show the last 20 public activities in the oubox outbox_objects = ( await db_session.scalars( select(models.OutboxObject) .where( models.OutboxObject.is_deleted.is_(False), *([] if maybe_access_token_info else restricted_where), ) .order_by(models.OutboxObject.ap_published_at.desc()) .limit(20) ) ).all() return ActivityPubResponse( { "@context": ap.AS_EXTENDED_CTX, "id": f"{ID}/outbox", "type": "OrderedCollection", "totalItems": len(outbox_objects), "orderedItems": [ ap.remove_context(ap.wrap_object_if_needed(a.ap_object)) for a in outbox_objects ], } ) @app.get("/featured") async def featured( db_session: AsyncSession = Depends(get_db_session), _: httpsig.HTTPSigInfo = Depends(httpsig.httpsig_checker), ) -> ActivityPubResponse: outbox_objects = ( await db_session.scalars( select(models.OutboxObject) .filter( models.OutboxObject.visibility == ap.VisibilityEnum.PUBLIC, models.OutboxObject.is_deleted.is_(False), models.OutboxObject.is_pinned.is_(True), ) .order_by(models.OutboxObject.ap_published_at.desc()) .limit(5) ) ).all() return ActivityPubResponse( { "@context": ap.AS_EXTENDED_CTX, "id": f"{ID}/featured", "type": "OrderedCollection", "totalItems": len(outbox_objects), "orderedItems": [ap.remove_context(a.ap_object) for a in outbox_objects], } ) async def _check_outbox_object_acl( request: Request, db_session: AsyncSession, ap_object: models.OutboxObject, httpsig_info: httpsig.HTTPSigInfo, ) -> None: if templates.is_current_user_admin(request): return None maybe_access_token_info = await indieauth.check_access_token( request, db_session, ) if maybe_access_token_info: # TODO: check scopes return None if ap_object.visibility in [ ap.VisibilityEnum.PUBLIC, ap.VisibilityEnum.UNLISTED, ]: return None elif ap_object.visibility == ap.VisibilityEnum.FOLLOWERS_ONLY: # Is the signing actor a follower? followers = await boxes.fetch_actor_collection( db_session, BASE_URL + "/followers" ) if httpsig_info.signed_by_ap_actor_id in [actor.ap_id for actor in followers]: return None elif ap_object.visibility == ap.VisibilityEnum.DIRECT: # Is the signing actor targeted in the object audience? audience = ap_object.ap_object.get("to", []) + ap_object.ap_object.get("cc", []) if httpsig_info.signed_by_ap_actor_id in audience: return None raise HTTPException(status_code=404) async def _fetch_likes( db_session: AsyncSession, outbox_object: models.OutboxObject, ) -> list[models.InboxObject]: return ( ( await db_session.scalars( select(models.InboxObject) .where( models.InboxObject.ap_type == "Like", models.InboxObject.activity_object_ap_id == outbox_object.ap_id, models.InboxObject.is_deleted.is_(False), ) .options(joinedload(models.InboxObject.actor)) .order_by(models.InboxObject.ap_published_at.desc()) .limit(10) ) ) .unique() .all() ) async def _fetch_shares( db_session: AsyncSession, outbox_object: models.OutboxObject, ) -> list[models.InboxObject]: return ( ( await db_session.scalars( select(models.InboxObject) .filter( models.InboxObject.ap_type == "Announce", models.InboxObject.activity_object_ap_id == outbox_object.ap_id, models.InboxObject.is_deleted.is_(False), ) .options(joinedload(models.InboxObject.actor)) .order_by(models.InboxObject.ap_published_at.desc()) .limit(10) ) ) .unique() .all() ) async def _fetch_webmentions( db_session: AsyncSession, outbox_object: models.OutboxObject, ) -> list[models.Webmention]: return ( await db_session.scalars( select(models.Webmention) .filter( models.Webmention.outbox_object_id == outbox_object.id, models.Webmention.is_deleted.is_(False), ) .limit(50) ) ).all() @app.get("/o/{public_id}") async def outbox_by_public_id( public_id: str, request: Request, db_session: AsyncSession = Depends(get_db_session), httpsig_info: httpsig.HTTPSigInfo = Depends(httpsig.httpsig_checker), ) -> ActivityPubResponse | templates.TemplateResponse | RedirectResponse: maybe_object = ( ( await db_session.execute( select(models.OutboxObject) .options( joinedload(models.OutboxObject.outbox_object_attachments).options( joinedload(models.OutboxObjectAttachment.upload) ) ) .where( models.OutboxObject.public_id == public_id, models.OutboxObject.is_deleted.is_(False), ) ) ) .unique() .scalar_one_or_none() ) if not maybe_object: raise HTTPException(status_code=404) await _check_outbox_object_acl(request, db_session, maybe_object, httpsig_info) if is_activitypub_requested(request): return ActivityPubResponse(maybe_object.ap_object) if maybe_object.ap_type == "Article": return RedirectResponse( f"{BASE_URL}/articles/{public_id[:7]}/{maybe_object.slug}", status_code=301, ) replies_tree = await boxes.get_replies_tree( db_session, maybe_object, is_current_user_admin=is_current_user_admin(request), ) webmentions = await _fetch_webmentions(db_session, maybe_object) likes = await _fetch_likes(db_session, maybe_object) shares = await _fetch_shares(db_session, maybe_object) return await templates.render_template( db_session, request, "object.html", { "replies_tree": _merge_replies(replies_tree, webmentions), "outbox_object": maybe_object, "likes": _merge_faces_from_inbox_object_and_webmentions( likes, webmentions, models.WebmentionType.LIKE, ), "shares": _merge_faces_from_inbox_object_and_webmentions( shares, webmentions, models.WebmentionType.REPOST, ), "webmentions": _filter_webmentions(webmentions), }, ) def _filter_webmentions( webmentions: list[models.Webmention], ) -> list[models.Webmention]: return [ wm for wm in webmentions if wm.webmention_type not in [ models.WebmentionType.LIKE, models.WebmentionType.REPOST, models.WebmentionType.REPLY, ] ] def _merge_faces_from_inbox_object_and_webmentions( inbox_objects: list[models.InboxObject], webmentions: list[models.Webmention], webmention_type: models.WebmentionType, ) -> list[Face]: wm_faces = [] for wm in webmentions: if wm.webmention_type != webmention_type: continue if face := Face.from_webmention(wm): wm_faces.append(face) return merge_faces( [Face.from_inbox_object(obj) for obj in inbox_objects] + wm_faces ) def _merge_replies( reply_tree_node: boxes.ReplyTreeNode, webmentions: list[models.Webmention], ) -> boxes.ReplyTreeNode: # TODO: return None as we update the object in place webmention_replies = [] for wm in [ wm for wm in webmentions if wm.webmention_type == models.WebmentionType.REPLY ]: if rep := WebmentionReply.from_webmention(wm): webmention_replies.append( boxes.ReplyTreeNode( ap_object=None, wm_reply=rep, is_requested=False, children=[], ) ) reply_tree_node.children = sorted( reply_tree_node.children + webmention_replies, key=lambda node: node.published_at, reverse=True, ) return reply_tree_node @app.get("/articles/{short_id}/{slug}") async def article_by_slug( short_id: str, slug: str, request: Request, db_session: AsyncSession = Depends(get_db_session), httpsig_info: httpsig.HTTPSigInfo = Depends(httpsig.httpsig_checker), ) -> ActivityPubResponse | templates.TemplateResponse | RedirectResponse: maybe_object = await boxes.get_outbox_object_by_slug_and_short_id( db_session, slug, short_id ) if not maybe_object: raise HTTPException(status_code=404) await _check_outbox_object_acl(request, db_session, maybe_object, httpsig_info) if is_activitypub_requested(request): return ActivityPubResponse(maybe_object.ap_object) replies_tree = await boxes.get_replies_tree( db_session, maybe_object, is_current_user_admin=is_current_user_admin(request), ) likes = await _fetch_likes(db_session, maybe_object) shares = await _fetch_shares(db_session, maybe_object) webmentions = await _fetch_webmentions(db_session, maybe_object) return await templates.render_template( db_session, request, "object.html", { "replies_tree": _merge_replies(replies_tree, webmentions), "outbox_object": maybe_object, "likes": _merge_faces_from_inbox_object_and_webmentions( likes, webmentions, models.WebmentionType.LIKE, ), "shares": _merge_faces_from_inbox_object_and_webmentions( shares, webmentions, models.WebmentionType.REPOST, ), "webmentions": _filter_webmentions(webmentions), }, ) @app.get("/o/{public_id}/activity") async def outbox_activity_by_public_id( public_id: str, request: Request, db_session: AsyncSession = Depends(get_db_session), httpsig_info: httpsig.HTTPSigInfo = Depends(httpsig.httpsig_checker), ) -> ActivityPubResponse: maybe_object = ( await db_session.execute( select(models.OutboxObject).where( models.OutboxObject.public_id == public_id, models.OutboxObject.is_deleted.is_(False), ) ) ).scalar_one_or_none() if not maybe_object: raise HTTPException(status_code=404) await _check_outbox_object_acl(request, db_session, maybe_object, httpsig_info) return ActivityPubResponse(ap.wrap_object(maybe_object.ap_object)) @app.get("/t/{tag}") async def tag_by_name( tag: str, request: Request, db_session: AsyncSession = Depends(get_db_session), _: httpsig.HTTPSigInfo = Depends(httpsig.httpsig_checker), ) -> ActivityPubResponse | templates.TemplateResponse: where = [ models.TaggedOutboxObject.tag == tag.lower(), models.OutboxObject.visibility == ap.VisibilityEnum.PUBLIC, models.OutboxObject.is_deleted.is_(False), ] tagged_count = await db_session.scalar( select(func.count(models.OutboxObject.id)) .join(models.TaggedOutboxObject) .where(*where) ) if is_activitypub_requested(request): if not tagged_count: raise HTTPException(status_code=404) outbox_object_ids = await db_session.execute( select(models.OutboxObject.ap_id) .join( models.TaggedOutboxObject, models.TaggedOutboxObject.outbox_object_id == models.OutboxObject.id, ) .where(*where) .order_by(models.OutboxObject.ap_published_at.desc()) .limit(20) ) return ActivityPubResponse( { "@context": ap.AS_CTX, "id": BASE_URL + f"/t/{tag.lower()}", "type": "OrderedCollection", "totalItems": tagged_count, "orderedItems": [ outbox_object.ap_id for outbox_object in outbox_object_ids ], } ) outbox_objects_result = await db_session.scalars( select(models.OutboxObject) .where(*where) .join( models.TaggedOutboxObject, models.TaggedOutboxObject.outbox_object_id == models.OutboxObject.id, ) .options( joinedload(models.OutboxObject.outbox_object_attachments).options( joinedload(models.OutboxObjectAttachment.upload) ) ) .order_by(models.OutboxObject.ap_published_at.desc()) .limit(20) ) outbox_objects = outbox_objects_result.unique().all() return await templates.render_template( db_session, request, "index.html", { "request": request, "objects": outbox_objects, }, status_code=200 if len(outbox_objects) else 404, ) @app.get("/e/{name}") def emoji_by_name(name: str) -> ActivityPubResponse: try: emoji = EMOJIS_BY_NAME[f":{name}:"] except KeyError: raise HTTPException(status_code=404) return ActivityPubResponse({"@context": ap.AS_EXTENDED_CTX, **emoji}) @app.post("/inbox") async def inbox( request: Request, db_session: AsyncSession = Depends(get_db_session), httpsig_info: httpsig.HTTPSigInfo = Depends(httpsig.enforce_httpsig), ) -> Response: # logger.info(f"headers={request.headers}") payload = await request.json() logger.info(f"{payload=}") await new_ap_incoming_activity(db_session, httpsig_info, payload) return Response(status_code=202) @app.get("/remote_follow") async def get_remote_follow( request: Request, db_session: AsyncSession = Depends(get_db_session), ) -> templates.TemplateResponse: return await templates.render_template( db_session, request, "remote_follow.html", {}, ) @app.post("/remote_follow") async def post_remote_follow( request: Request, db_session: AsyncSession = Depends(get_db_session), csrf_check: None = Depends(verify_csrf_token), profile: str = Form(), ) -> templates.TemplateResponse: if not profile.startswith("@"): profile = f"@{profile}" remote_follow_template = await get_remote_follow_template(profile) if not remote_follow_template: # TODO(ts): error message to user raise HTTPException(status_code=404) return await redirect_to_remote_instance( request, db_session, remote_follow_template.format(uri=ID), ) @app.get("/remote_interaction") async def remote_interaction( request: Request, ap_id: str, db_session: AsyncSession = Depends(get_db_session), ) -> templates.TemplateResponse: outbox_object = await boxes.get_outbox_object_by_ap_id( db_session, ap_id, ) if not outbox_object: raise HTTPException(status_code=404) return await templates.render_template( db_session, request, "remote_interact.html", {"outbox_object": outbox_object}, ) @app.post("/remote_interaction") async def post_remote_interaction( request: Request, db_session: AsyncSession = Depends(get_db_session), csrf_check: None = Depends(verify_csrf_token), profile: str = Form(), ap_id: str = Form(), ) -> templates.TemplateResponse: if not profile.startswith("@"): profile = f"@{profile}" remote_follow_template = await get_remote_follow_template(profile) if not remote_follow_template: # TODO(ts): error message to user raise HTTPException(status_code=404) return await redirect_to_remote_instance( request, db_session, remote_follow_template.format(uri=ID), ) @app.get("/.well-known/webfinger") async def wellknown_webfinger(resource: str) -> JSONResponse: """Exposes/servers WebFinger data.""" if resource not in [f"acct:{USERNAME}@{DOMAIN}", ID]: logger.info(f"Got invalid req for {resource}") raise HTTPException(status_code=404) out = { "subject": f"acct:{USERNAME}@{DOMAIN}", "aliases": [ID], "links": [ { "rel": "http://webfinger.net/rel/profile-page", "type": "text/html", "href": ID + "/", }, {"rel": "self", "type": "application/activity+json", "href": ID}, { "rel": "http://ostatus.org/schema/1.0/subscribe", "template": BASE_URL + "/admin/lookup?query={uri}", }, ], } return JSONResponse( out, media_type="application/jrd+json; charset=utf-8", headers={"Access-Control-Allow-Origin": "*"}, ) @app.get("/.well-known/nodeinfo") async def well_known_nodeinfo() -> dict[str, Any]: return { "links": [ { "rel": "http://nodeinfo.diaspora.software/ns/schema/2.1", "href": f"{BASE_URL}/nodeinfo", } ] } @app.get("/nodeinfo") async def nodeinfo( db_session: AsyncSession = Depends(get_db_session), ): local_posts = await public_outbox_objects_count(db_session) return JSONResponse( { "version": "2.1", "software": { "name": "microblogpub", "version": config.VERSION, "repository": "https://sr.ht/~tsileo/microblog.pub", "homepage": "https://docs.microblog.pub", }, "protocols": ["activitypub"], "services": {"inbound": [], "outbound": []}, "openRegistrations": False, "usage": {"users": {"total": 1}, "localPosts": local_posts}, "metadata": { "nodeName": LOCAL_ACTOR.handle, }, }, media_type=( "application/json; " "profile=http://nodeinfo.diaspora.software/ns/schema/2.1#" ), ) async def _proxy_get( proxy_client: httpx.AsyncClient, request: starlette.requests.Request, url: str, stream: bool, ) -> httpx.Response: # Request the URL (and filter request headers) proxy_req = proxy_client.build_request( request.method, url, headers=[ (k, v) for (k, v) in request.headers.raw if k.lower() not in [ b"host", b"cookie", b"x-forwarded-for", b"x-forwarded-proto", b"x-real-ip", b"user-agent", ] ] + [(b"user-agent", USER_AGENT.encode())], ) return await proxy_client.send(proxy_req, stream=stream) def _filter_proxy_resp_headers( proxy_resp: httpx.Response, allowed_headers: list[str], ) -> dict[str, str]: return { k: v for (k, v) in proxy_resp.headers.items() if k.lower() in allowed_headers } def _strip_content_type(headers: dict[str, str]) -> dict[str, str]: return {k: v for k, v in headers.items() if k.lower() != "content-type"} def _add_cache_control(headers: dict[str, str]) -> dict[str, str]: return {**headers, "Cache-Control": "max-age=31536000"} @app.get("/proxy/media/{exp}/{sig}/{encoded_url}") async def serve_proxy_media( request: Request, exp: int, sig: str, encoded_url: str, background_tasks: fastapi.BackgroundTasks, ) -> StreamingResponse | PlainTextResponse: # Decode the base64-encoded URL url = base64.urlsafe_b64decode(encoded_url).decode() check_url(url) media.verify_proxied_media_sig(exp, url, sig) proxy_client = httpx.AsyncClient( follow_redirects=True, timeout=httpx.Timeout(timeout=10.0), transport=httpx.AsyncHTTPTransport(retries=1), ) async def _close_proxy_client(): await proxy_client.aclose() background_tasks.add_task(_close_proxy_client) proxy_resp = await _proxy_get(proxy_client, request, url, stream=True) if proxy_resp.status_code >= 300: logger.info(f"failed to proxy {url}, got {proxy_resp.status_code}") await proxy_resp.aclose() return PlainTextResponse( status_code=proxy_resp.status_code, ) return StreamingResponse( proxy_resp.aiter_raw(), status_code=proxy_resp.status_code, headers=_add_cache_control( _filter_proxy_resp_headers( proxy_resp, [ "content-length", "content-type", "content-range", "accept-ranges", "etag", "expires", "date", "last-modified", ], ) ), background=BackgroundTask(proxy_resp.aclose), ) @app.get("/proxy/media/{exp}/{sig}/{encoded_url}/{size}") async def serve_proxy_media_resized( request: Request, exp: int, sig: str, encoded_url: str, size: int, background_tasks: fastapi.BackgroundTasks, ) -> PlainTextResponse: if size not in {50, 740}: raise ValueError("Unsupported size") is_webp_supported = "image/webp" in request.headers.get("accept") # Decode the base64-encoded URL url = base64.urlsafe_b64decode(encoded_url).decode() check_url(url) media.verify_proxied_media_sig(exp, url, sig) if (cached_resp := _RESIZED_CACHE.get((url, size))) and is_webp_supported: resized_content, resized_mimetype, resp_headers = cached_resp return PlainTextResponse( resized_content, media_type=resized_mimetype, headers=resp_headers, ) proxy_client = httpx.AsyncClient( follow_redirects=True, timeout=httpx.Timeout(timeout=10.0), transport=httpx.AsyncHTTPTransport(retries=1), ) async def _close_proxy_client(): await proxy_client.aclose() background_tasks.add_task(_close_proxy_client) proxy_resp = await _proxy_get(proxy_client, request, url, stream=False) if proxy_resp.status_code >= 300: logger.info(f"failed to proxy {url}, got {proxy_resp.status_code}") await proxy_resp.aclose() return PlainTextResponse( status_code=proxy_resp.status_code, ) # Filter the headers proxy_resp_headers = _add_cache_control( _filter_proxy_resp_headers( proxy_resp, [ "content-type", "etag", "expires", "last-modified", ], ) ) try: out = BytesIO(proxy_resp.content) i = Image.open(out) if getattr(i, "is_animated", False): raise ValueError i.thumbnail((size, size)) is_webp = False try: resized_buf = BytesIO() i.save(resized_buf, format="webp" if is_webp_supported else i.format) is_webp = is_webp_supported except Exception: logger.exception("Failed to create thumbnail") resized_buf = BytesIO() i.save(resized_buf, format=i.format) resized_buf.seek(0) resized_content = resized_buf.read() resized_mimetype = ( "image/webp" if is_webp else i.get_format_mimetype() # type: ignore ) # Only cache images < 1MB if len(resized_content) < 2**20: _RESIZED_CACHE[(url, size)] = ( resized_content, resized_mimetype, _strip_content_type(proxy_resp_headers), ) return PlainTextResponse( resized_content, media_type=resized_mimetype, headers=_strip_content_type(proxy_resp_headers), ) except ValueError: return PlainTextResponse( proxy_resp.content, headers=proxy_resp_headers, ) except Exception: logger.exception(f"Failed to resize {url} on the fly") return PlainTextResponse( proxy_resp.content, headers=proxy_resp_headers, ) @app.get("/attachments/{content_hash}/{filename}") async def serve_attachment( content_hash: str, filename: str, db_session: AsyncSession = Depends(get_db_session), ): upload = ( await db_session.execute( select(models.Upload).where( models.Upload.content_hash == content_hash, ) ) ).scalar_one_or_none() if not upload: raise HTTPException(status_code=404) return FileResponse( UPLOAD_DIR / content_hash, media_type=upload.content_type, headers={"Cache-Control": "max-age=31536000"}, ) @app.get("/attachments/thumbnails/{content_hash}/{filename}") async def serve_attachment_thumbnail( request: Request, content_hash: str, filename: str, db_session: AsyncSession = Depends(get_db_session), ): upload = ( await db_session.execute( select(models.Upload).where( models.Upload.content_hash == content_hash, ) ) ).scalar_one_or_none() if not upload or not upload.has_thumbnail: raise HTTPException(status_code=404) is_webp_supported = "image/webp" in request.headers.get("accept") if is_webp_supported: return FileResponse( UPLOAD_DIR / (content_hash + "_resized"), media_type="image/webp", headers={"Cache-Control": "max-age=31536000"}, ) else: return FileResponse( UPLOAD_DIR / content_hash, media_type=upload.content_type, headers={"Cache-Control": "max-age=31536000"}, ) @app.get("/robots.txt", response_class=PlainTextResponse) async def robots_file(): return """User-agent: * Disallow: /followers Disallow: /following Disallow: /admin Disallow: /remote_interaction Disallow: /remote_follow""" async def _get_outbox_for_feed(db_session: AsyncSession) -> list[models.OutboxObject]: return ( ( await db_session.scalars( select(models.OutboxObject) .where( models.OutboxObject.visibility == ap.VisibilityEnum.PUBLIC, models.OutboxObject.is_deleted.is_(False), models.OutboxObject.ap_type.in_(["Note", "Article", "Video"]), ) .options( joinedload(models.OutboxObject.outbox_object_attachments).options( joinedload(models.OutboxObjectAttachment.upload) ) ) .order_by(models.OutboxObject.ap_published_at.desc()) .limit(20) ) ) .unique() .all() ) @app.get("/feed.json") async def json_feed( db_session: AsyncSession = Depends(get_db_session), ) -> dict[str, Any]: outbox_objects = await _get_outbox_for_feed(db_session) data = [] for outbox_object in outbox_objects: if not outbox_object.ap_published_at: raise ValueError(f"{outbox_object} has no published date") data.append( { "id": outbox_object.public_id, "url": outbox_object.url, "content_html": outbox_object.content, "content_text": outbox_object.source, "date_published": outbox_object.ap_published_at.isoformat(), "attachments": [ {"url": a.url, "mime_type": a.media_type} for a in outbox_object.attachments ], } ) result = { "version": "https://jsonfeed.org/version/1", "title": f"{LOCAL_ACTOR.display_name}'s microblog'", "home_page_url": LOCAL_ACTOR.url, "feed_url": BASE_URL + "/feed.json", "author": { "name": LOCAL_ACTOR.display_name, "url": LOCAL_ACTOR.url, }, "items": data, } if LOCAL_ACTOR.icon_url: result["author"]["avatar"] = LOCAL_ACTOR.icon_url # type: ignore return result async def _gen_rss_feed( db_session: AsyncSession, ): fg = FeedGenerator() fg.id(BASE_URL + "/feed.rss") fg.title(f"{LOCAL_ACTOR.display_name}'s microblog") fg.description(f"{LOCAL_ACTOR.display_name}'s microblog") fg.author({"name": LOCAL_ACTOR.display_name}) fg.link(href=LOCAL_ACTOR.url, rel="alternate") if LOCAL_ACTOR.icon_url: fg.logo(LOCAL_ACTOR.icon_url) fg.language("en") outbox_objects = await _get_outbox_for_feed(db_session) for outbox_object in outbox_objects: if not outbox_object.ap_published_at: raise ValueError(f"{outbox_object} has no published date") content = outbox_object.content if content is None: raise ValueError("Should never happen") if outbox_object.attachments: for attachment in outbox_object.attachments: if attachment.type == "Image" or ( attachment.media_type and attachment.media_type.startswith("image") ): content += f'' # TODO(ts): other attachment types fe = fg.add_entry() fe.id(outbox_object.url) fe.link(href=outbox_object.url) fe.title(outbox_object.url) fe.description(content) fe.content(content) fe.published(outbox_object.ap_published_at.replace(tzinfo=timezone.utc)) return fg @app.get("/feed.rss") async def rss_feed( db_session: AsyncSession = Depends(get_db_session), ) -> PlainTextResponse: return PlainTextResponse( (await _gen_rss_feed(db_session)).rss_str(), headers={"Content-Type": "application/rss+xml"}, ) @app.get("/feed.atom") async def atom_feed( db_session: AsyncSession = Depends(get_db_session), ) -> PlainTextResponse: return PlainTextResponse( (await _gen_rss_feed(db_session)).atom_str(), headers={"Content-Type": "application/atom+xml"}, )