From 93ccb5dd32f4e3942d08814e5a86fb30c90c9ff6 Mon Sep 17 00:00:00 2001 From: Andrew Godwin Date: Sun, 4 Dec 2022 21:13:33 -0700 Subject: Make search work with URLs --- activities/views/search.py | 86 ++++++++++++++++++++++++++++++++++++++++++---- 1 file changed, 79 insertions(+), 7 deletions(-) (limited to 'activities/views') diff --git a/activities/views/search.py b/activities/views/search.py index 8bdef78..ab37e17 100644 --- a/activities/views/search.py +++ b/activities/views/search.py @@ -1,11 +1,14 @@ from typing import Set +import httpx from asgiref.sync import async_to_sync from django import forms from django.views.generic import FormView -from activities.models import Hashtag +from activities.models import Hashtag, Post +from core.ld import canonicalise from users.models import Domain, Identity, IdentityStates +from users.models.system_actor import SystemActor class Search(FormView): @@ -14,11 +17,20 @@ class Search(FormView): class form_class(forms.Form): query = forms.CharField( - help_text="Search for a user by @username@domain or hashtag by #tagname", + help_text="Search for:\nA user by @username@domain or their profile URL\nA hashtag by #tagname\nA post by its URL", widget=forms.TextInput(attrs={"type": "search", "autofocus": "autofocus"}), ) - def search_identities(self, query: str): + def search_identities_handle(self, query: str): + """ + Searches for identities by their handles + """ + + # Short circuit if it's obviously not for us + if "://" in query: + return set() + + # Try to fetch the user by handle query = query.lstrip("@") results: Set[Identity] = set() if "@" in query: @@ -52,12 +64,65 @@ class Search(FormView): results.add(identity) return results + def search_url(self, query: str) -> Post | Identity | None: + """ + Searches for an identity or post by URL. + """ + + # Short circuit if it's obviously not for us + if "://" not in query: + return None + + # Clean up query + query = query.strip() + + # Fetch the provided URL as the system actor to retrieve the AP JSON + try: + response = async_to_sync(SystemActor().signed_request)( + method="get", uri=query + ) + except (httpx.RequestError, httpx.ConnectError): + return None + if response.status_code >= 400: + return None + document = canonicalise(response.json(), include_security=True) + type = document.get("type", "unknown").lower() + + # Is it an identity? + if type == "person": + # Try and retrieve the profile by actor URI + identity = Identity.by_actor_uri(document["id"], create=True) + if identity and identity.state == IdentityStates.outdated: + async_to_sync(identity.fetch_actor)() + return identity + + # Is it a post? + elif type == "note": + # Try and retrieve the post by URI + # (we do not trust the JSON we just got - fetch from source!) + try: + post = Post.by_object_uri(document["id"], fetch=True) + # We may need to live-fetch the identity too + if post.author.state == IdentityStates.outdated: + async_to_sync(post.author.fetch_actor)() + return post + except Post.DoesNotExist: + return None + + # Dunno what it is + else: + return None + def search_hashtags(self, query: str): - results: Set[Hashtag] = set() + """ + Searches for hashtags by their name + """ - if "@" in query: - return results + # Short circuit out if it's obviously not a hashtag + if "@" in query or "://" in query: + return set() + results: Set[Hashtag] = set() query = query.lstrip("#") for hashtag in Hashtag.objects.public().hashtag_or_alias(query)[:10]: results.add(hashtag) @@ -68,10 +133,17 @@ class Search(FormView): def form_valid(self, form): query = form.cleaned_data["query"].lower() results = { - "identities": self.search_identities(query), + "identities": self.search_identities_handle(query), "hashtags": self.search_hashtags(query), + "posts": set(), } + url_result = self.search_url(query) + if isinstance(url_result, Identity): + results["identities"].add(url_result) + if isinstance(url_result, Post): + results["posts"].add(url_result) + # Render results context = self.get_context_data(form=form) context["results"] = results -- cgit v1.2.3