a9984c6da7
The original approach to searching with GIN indexes was to use `to_tsvector(text)` in the WHERE clause of the query. According to the PostgreSQL docs [pdoc], this form does not make use of the index, while `to_tsvector(config, text)` does. This commit changes the query to use the two-argument `to_tsvector()`. [pdoc]: https://www.postgresql.org/docs/12/textsearch-tables.html To obtain the search config in use, we query the database first. The `::regconfig::oid` hack is needed because Postgrex does not support the regconfig type directly [postgrexbug]. I convert to and from `oid` instead of `text` because, when tested against the actual DB, querying with the conversion via `text` was just as slow as the one-argument `to_tsvector()` variant. [postgrexbug]: https://github.com/elixir-ecto/postgrex/issues/502 BUG: https://git.pleroma.social/pleroma/pleroma/-/issues/2758
150 lines
4.1 KiB
Elixir
150 lines
4.1 KiB
Elixir
# Pleroma: A lightweight social networking server
|
|
# Copyright © 2017-2021 Pleroma Authors <https://pleroma.social/>
|
|
# SPDX-License-Identifier: AGPL-3.0-only
|
|
|
|
defmodule Pleroma.Activity.Search do
|
|
alias Pleroma.Activity
|
|
alias Pleroma.Object.Fetcher
|
|
alias Pleroma.Pagination
|
|
alias Pleroma.User
|
|
alias Pleroma.Web.ActivityPub.Visibility
|
|
|
|
require Pleroma.Constants
|
|
|
|
import Ecto.Query
|
|
|
|
@doc """
Searches public `Create` activities for `search_query` on behalf of `user`.

## Options

  * `:limit` - maximum number of results, capped at 40
  * `:offset` - number of results to skip (defaults to `0`)
  * `:author` - when a `Pleroma.User`, only that author's activities are searched

The paginated results are finally handed to `maybe_fetch/3`, which may prepend
an activity fetched by treating `search_query` as an object id. Any exception
raised inside the query pipeline is swallowed; in that case only the result of
`maybe_fetch/3` on an empty list is returned.
"""
def search(user, search_query, options \\ []) do
  index_type =
    case Pleroma.Config.get([:database, :rum_enabled]) do
      disabled when disabled in [nil, false] -> :gin
      _enabled -> :rum
    end

  # `min/2` follows term ordering, in which every number sorts before `nil`,
  # so a missing `:limit` option falls back to the cap of 40.
  limit = min(Keyword.get(options, :limit), 40)
  offset = Keyword.get(options, :offset, 0)
  author = Keyword.get(options, :author)

  # websearch_to_tsquery is only used from PostgreSQL 11 onwards.
  postgres_version = :persistent_term.get({Pleroma.Repo, :postgres_version})
  search_function = if postgres_version >= 11, do: :websearch, else: :plain

  # The RUM query clauses add their own ordering, so pagination skips its own.
  pagination_params = %{
    "offset" => offset,
    "limit" => limit,
    "skip_order" => index_type == :rum
  }

  try do
    Activity
    |> Activity.with_preloaded_object()
    |> Activity.restrict_deactivated_users()
    |> restrict_public()
    |> query_with(index_type, search_query, search_function)
    |> maybe_restrict_local(user)
    |> maybe_restrict_author(author)
    |> maybe_restrict_blocked(user)
    |> Pagination.fetch_paginated(pagination_params, :offset)
    |> maybe_fetch(user, search_query)
  rescue
    # Best effort: a failing database search still allows the direct fetch.
    _ -> maybe_fetch([], user, search_query)
  end
end
|
|
|
|
@doc """
Narrows `query` with `Activity.Queries.by_author/2` when `author` is a
`Pleroma.User` struct.

Any other value (for example `nil`) returns `query` unchanged.
"""
def maybe_restrict_author(query, author) do
  case author do
    %User{} -> Activity.Queries.by_author(query, author)
    _ -> query
  end
end
|
|
|
|
@doc """
Excludes from `query` the authors returned by `User.blocked_users_ap_ids/1`
when `user` is a `Pleroma.User` struct.

Any other value (for example `nil`) returns `query` unchanged.
"""
def maybe_restrict_blocked(query, user) do
  case user do
    %User{} ->
      blocked_ap_ids = User.blocked_users_ap_ids(user)
      Activity.Queries.exclude_authors(query, blocked_ap_ids)

    _ ->
      query
  end
end
|
|
|
|
# Keeps only activities whose data `type` is `Create` and whose recipients
# include the public address constant.
defp restrict_public(q) do
  q
  |> where([a, o], fragment("?->>'type' = 'Create'", a.data))
  |> where([a, o], ^Pleroma.Constants.as_public() in a.recipients)
end
|
|
|
|
# Returns the OID of the database's `default_text_search_config`.
#
# The setting is cast `::regconfig::oid` in SQL because Postgrex cannot handle
# the `regconfig` type directly
# (https://github.com/elixir-ecto/postgrex/issues/502). The search fragments
# cast the OID back with `?::oid::regconfig`.
defp default_text_search_config_oid do
  %{rows: [[oid]]} =
    Ecto.Adapters.SQL.query!(
      Pleroma.Repo,
      "select current_setting('default_text_search_config')::regconfig::oid;"
    )

  oid
end

# GIN search using `plainto_tsquery`.
#
# The two-argument `to_tsvector(config, text)` is used on purpose: per the
# PostgreSQL docs the one-argument form does not make use of the index.
defp query_with(q, :gin, search_query, :plain) do
  tsc = default_text_search_config_oid()

  from([a, o] in q,
    where:
      fragment(
        "to_tsvector(?::oid::regconfig, ?->>'content') @@ plainto_tsquery(?)",
        ^tsc,
        o.data,
        ^search_query
      )
  )
end

# GIN search using `websearch_to_tsquery`; otherwise identical to the `:plain`
# clause, including the explicit text search config for index usage.
defp query_with(q, :gin, search_query, :websearch) do
  tsc = default_text_search_config_oid()

  from([a, o] in q,
    where:
      fragment(
        "to_tsvector(?::oid::regconfig, ?->>'content') @@ websearch_to_tsquery(?)",
        ^tsc,
        o.data,
        ^search_query
      )
  )
end
|
|
|
|
# RUM search using `plainto_tsquery` against the object's `fts_content` column.
# Results are ordered by `inserted_at <=> now()::date`
# (NOTE(review): presumably RUM's distance operator, i.e. most recent first - confirm).
defp query_with(q, :rum, search_query, :plain) do
  q
  |> where([a, o], fragment("? @@ plainto_tsquery(?)", o.fts_content, ^search_query))
  |> order_by([a, o], [fragment("? <=> now()::date", o.inserted_at)])
end

# RUM search using `websearch_to_tsquery`; same ordering as the `:plain` clause.
defp query_with(q, :rum, search_query, :websearch) do
  q
  |> where([a, o], fragment("? @@ websearch_to_tsquery(?)", o.fts_content, ^search_query))
  |> order_by([a, o], [fragment("? <=> now()::date", o.inserted_at)])
end
|
|
|
|
# Applies the `[:instance, :limit_to_local_content]` setting (default
# `:unauthenticated`) to the query:
#
#   * `false`            - never restrict
#   * `:all`             - always restrict to local activities
#   * `:unauthenticated` - restrict only when `user` is not a `Pleroma.User`
#
# Any other setting value raises a `CaseClauseError`.
defp maybe_restrict_local(q, user) do
  setting = Pleroma.Config.get([:instance, :limit_to_local_content], :unauthenticated)

  case {setting, user} do
    {false, _} -> q
    {:all, _} -> restrict_local(q)
    {:unauthenticated, %User{}} -> q
    {:unauthenticated, _} -> restrict_local(q)
  end
end
|
|
|
|
# Keeps only rows whose `local` field is `true`.
defp restrict_local(q) do
  where(q, local: true)
end
|
|
|
|
# When `search_query` contains `http:` or `https:`, tries to fetch it as an
# object id and prepends the matching `Create` activity to `activities`,
# provided that activity is visible to `user`. In every other case the list is
# returned unchanged.
defp maybe_fetch(activities, user, search_query) do
  if Regex.match?(~r/https?:/, search_query) do
    case Fetcher.fetch_object_from_id(search_query) do
      {:ok, object} -> prepend_if_visible(activities, object, user)
      _ -> activities
    end
  else
    activities
  end
end

# Looks up the `Create` activity for `object` and prepends it to `activities`
# only when `Visibility.visible_for_user?/2` returns exactly `true`.
defp prepend_if_visible(activities, object, user) do
  case Activity.get_create_by_object_ap_id(object.data["id"]) do
    %Activity{} = activity ->
      case Visibility.visible_for_user?(activity, user) do
        true -> [activity | activities]
        _ -> activities
      end

    _ ->
      activities
  end
end
|
|
end
|