2019-07-10 05:13:23 +00:00
|
|
|
# Pleroma: A lightweight social networking server
|
2020-03-03 22:44:49 +00:00
|
|
|
# Copyright © 2017-2020 Pleroma Authors <https://pleroma.social/>
|
2019-07-10 05:13:23 +00:00
|
|
|
# SPDX-License-Identifier: AGPL-3.0-only
|
|
|
|
|
2019-01-23 15:37:25 +00:00
|
|
|
defmodule Pleroma.Instances.Instance do
|
|
|
|
@moduledoc "Instance."
|
|
|
|
|
2019-02-09 15:16:26 +00:00
|
|
|
alias Pleroma.Instances
|
2019-01-23 15:37:25 +00:00
|
|
|
alias Pleroma.Instances.Instance
|
2019-03-05 02:52:23 +00:00
|
|
|
alias Pleroma.Repo
|
2019-01-23 15:37:25 +00:00
|
|
|
|
|
|
|
use Ecto.Schema
|
|
|
|
|
2019-02-09 15:20:18 +00:00
|
|
|
import Ecto.Query
|
|
|
|
import Ecto.Changeset
|
2019-01-23 15:37:25 +00:00
|
|
|
|
2020-09-05 04:38:07 +00:00
|
|
|
require Logger
|
|
|
|
|
2019-01-23 15:37:25 +00:00
|
|
|
# Ecto schema for the "instances" table.
schema "instances" do
  # Host of the remote instance; required and unique-constrained in changeset/2.
  field(:host, :string)

  # Set by set_unreachable/2 and cleared (nil) by set_reachable/1.
  field(:unreachable_since, :naive_datetime_usec)

  # Favicon URL last produced by get_or_update_favicon/1 (may be nil).
  field(:favicon, :string)

  # Time of the last favicon scrape; compared against a 86_400 second window
  # in get_or_update_favicon/1.
  field(:favicon_updated_at, :naive_datetime)

  timestamps()
end
|
|
|
|
|
2019-01-28 12:25:06 +00:00
|
|
|
# Exposes Instances.host/1 as host/1 on this module. The other functions here
# call it on their `url_or_host` argument and use the result for lookups
# against (and inserts into) the `host` field.
defdelegate host(url_or_host), to: Instances
|
2019-01-24 16:15:23 +00:00
|
|
|
|
|
|
|
@doc """
Builds a changeset for an instance record.

Casts `:host`, `:unreachable_since`, `:favicon` and `:favicon_updated_at`
from `params`, requires `:host` to be present, and registers a unique
constraint on `:host`.
"""
def changeset(struct, params \\ %{}) do
  permitted_fields = [:host, :unreachable_since, :favicon, :favicon_updated_at]

  casted = cast(struct, params, permitted_fields)

  casted
  |> validate_required([:host])
  |> unique_constraint(:host)
end
|
|
|
|
|
2019-02-03 09:41:27 +00:00
|
|
|
@doc """
Filters a list of URLs or hosts down to the ones considered reachable.

Returns a map of `entry => unreachable_since` containing every binary entry
whose host either has no recorded `unreachable_since` (the value is then
`nil`) or whose `unreachable_since` is later than
`Instances.reachability_datetime_threshold/0`. Non-binary entries are never
part of the result. An empty list yields an empty map.
"""
def filter_reachable([]), do: %{}

def filter_reachable(urls_or_hosts) when is_list(urls_or_hosts) do
  # Falsy entries are passed through untouched and only dropped when their
  # string form is empty, exactly like the hosts derived from real entries.
  hosts =
    urls_or_hosts
    |> Enum.map(fn entry -> if entry, do: host(entry), else: entry end)
    |> Enum.reject(fn candidate -> to_string(candidate) == "" end)

  unreachable_since_by_host =
    Instance
    |> where([i], i.host in ^hosts)
    |> select([i], {i.host, i.unreachable_since})
    |> Repo.all()
    |> Map.new()

  threshold = Instances.reachability_datetime_threshold()

  urls_or_hosts
  |> Enum.filter(&is_binary/1)
  |> Enum.flat_map(fn entry ->
    since = Map.get(unreachable_since_by_host, host(entry))

    # Keep the entry when nothing is recorded for its host, or when the host
    # became unreachable after the threshold.
    if is_nil(since) or NaiveDateTime.compare(since, threshold) == :gt do
      [{entry, since}]
    else
      []
    end
  end)
  |> Map.new()
end
|
|
|
|
|
2019-01-28 12:25:06 +00:00
|
|
|
@doc """
Tells whether the given URL or host is considered reachable.

A binary argument is unreachable only when a record exists for its host with
`unreachable_since` at or before `Instances.reachability_datetime_threshold/0`.
Any non-binary argument is reported as reachable.
"""
def reachable?(url_or_host) when is_binary(url_or_host) do
  host = host(url_or_host)
  threshold = Instances.reachability_datetime_threshold()

  Instance
  |> where([i], i.host == ^host and i.unreachable_since <= ^threshold)
  |> select([i], true)
  |> Repo.one()
  |> is_nil()
end

def reachable?(_), do: true
|
|
|
|
|
2019-01-28 12:25:06 +00:00
|
|
|
@doc """
Clears `unreachable_since` on the record for the given URL or host.

Returns `{:ok, instance}` when a record exists and was updated (a failed
update raises a `MatchError`), `nil` when there is no record for the host,
and `{:error, nil}` for a non-binary argument.
"""
def set_reachable(url_or_host) when is_binary(url_or_host) do
  case Repo.get_by(Instance, %{host: host(url_or_host)}) do
    %Instance{} = record ->
      {:ok, _updated} =
        record
        |> changeset(%{unreachable_since: nil})
        |> Repo.update()

    not_found ->
      not_found
  end
end

def set_reachable(_), do: {:error, nil}
|
2019-01-24 14:37:23 +00:00
|
|
|
|
2019-01-28 12:25:06 +00:00
|
|
|
@doc """
Records that the given URL or host is unreachable.

`unreachable_since` is passed through `parse_datetime/1`; when that yields
`nil` the current UTC time is used instead.

  * No record for the host: a new one is inserted (result of `Repo.insert/1`).
  * The record already has an `unreachable_since` that is not later than the
    new value: it is left untouched and `{:ok, record}` is returned.
  * Otherwise the record is updated (result of `Repo.update/1`).

A non-binary `url_or_host` returns `{:error, nil}`.
"""
def set_unreachable(url_or_host, unreachable_since \\ nil)

def set_unreachable(url_or_host, unreachable_since) when is_binary(url_or_host) do
  since = parse_datetime(unreachable_since) || NaiveDateTime.utc_now()
  host = host(url_or_host)

  store = fn record ->
    record
    |> changeset(%{unreachable_since: since})
    |> Repo.update()
  end

  case Repo.get_by(Instance, %{host: host}) do
    nil ->
      %Instance{}
      |> changeset(%{unreachable_since: since, host: host})
      |> Repo.insert()

    %Instance{unreachable_since: nil} = record ->
      store.(record)

    %Instance{unreachable_since: recorded} = record ->
      # Only ever move the timestamp backwards: an equal or earlier recorded
      # value wins over the new one.
      if NaiveDateTime.compare(recorded, since) != :gt do
        {:ok, record}
      else
        store.(record)
      end
  end
end

def set_unreachable(_, _), do: {:error, nil}
|
2019-08-10 17:38:31 +00:00
|
|
|
|
|
|
|
# Normalises the `unreachable_since` argument of set_unreachable/2.
#
# A binary is parsed as an ISO 8601 naive datetime and the parsed
# `NaiveDateTime` itself is returned. `NaiveDateTime.from_iso8601/1` returns
# `{:ok, datetime}` / `{:error, reason}`; returning that tuple directly would
# always be truthy, defeating the caller's `|| NaiveDateTime.utc_now()`
# fallback and handing a tuple to `NaiveDateTime.compare/2`. An unparsable
# string therefore yields `nil` so the caller falls back to the current time.
#
# Any non-binary value (e.g. `nil` or a `NaiveDateTime`) is returned unchanged.
defp parse_datetime(datetime) when is_binary(datetime) do
  case NaiveDateTime.from_iso8601(datetime) do
    {:ok, parsed} -> parsed
    {:error, _reason} -> nil
  end
end

defp parse_datetime(datetime), do: datetime
|
2020-07-07 09:13:38 +00:00
|
|
|
|
|
|
|
@doc """
Returns the favicon URL for the instance at `instance_uri`, scraping it when
the stored value is missing or stale.

When a record exists for the URI's host and its `favicon_updated_at` is less
than 86_400 seconds old, the stored `favicon` is returned. Otherwise the
favicon is scraped, the record is updated (or inserted when none exists) with
the scraped value and the current time, and the scraped value is returned.

Any exception raised along the way is logged as a warning and `nil` is
returned.
"""
def get_or_update_favicon(%URI{host: host} = instance_uri) do
  record = Repo.get_by(Instance, %{host: host})
  now = NaiveDateTime.utc_now()

  fresh? =
    case record do
      %Instance{favicon_updated_at: updated_at} when not is_nil(updated_at) ->
        NaiveDateTime.diff(now, updated_at) < 86_400

      _ ->
        false
    end

  if fresh? do
    record.favicon
  else
    favicon = scrape_favicon(instance_uri)
    attrs = %{favicon: favicon, favicon_updated_at: now}

    # The persistence result is intentionally not inspected; the scraped
    # value is returned either way.
    case record do
      nil ->
        %Instance{}
        |> changeset(Map.put(attrs, :host, host))
        |> Repo.insert()

      %Instance{} ->
        record
        |> changeset(attrs)
        |> Repo.update()
    end

    favicon
  end
rescue
  e ->
    Logger.warn("Instance.get_or_update_favicon(\"#{host}\") error: #{inspect(e)}")
    nil
end
|
|
|
|
|
|
|
|
# Fetches `instance_uri` as HTML and returns the absolute URL of the first
# `link[rel=icon]` href found in the document, or `nil`.
#
# `nil` is returned when the HTTP request does not yield `{:ok, %Tesla.Env{}}`
# or when the document has no `link[rel=icon]` href. The href is matched as a
# binary inside the `with` so that a page without an icon simply falls through
# to `else`; previously the missing href (`nil`) was handed to `URI.merge/2`,
# which raised and produced a warning log entry for a perfectly normal page.
#
# Genuine failures (e.g. HTML that cannot be parsed, or a URI that cannot be
# merged onto) are still rescued, logged as a warning, and turned into `nil`.
defp scrape_favicon(%URI{} = instance_uri) do
  with {:ok, %Tesla.Env{body: html}} <-
         Pleroma.HTTP.get(to_string(instance_uri), [{"accept", "text/html"}], pool: :media),
       [favicon_rel | _] when is_binary(favicon_rel) <-
         html
         |> Floki.parse_document!()
         |> Floki.attribute("link[rel=icon]", "href") do
    # The href may be relative; resolve it against the instance URI.
    instance_uri
    |> URI.merge(favicon_rel)
    |> to_string()
  else
    _ -> nil
  end
rescue
  e ->
    Logger.warn(
      "Instance.scrape_favicon(\"#{to_string(instance_uri)}\") error: #{inspect(e)}"
    )

    nil
end
|
2019-01-23 15:37:25 +00:00
|
|
|
end
|