rich media: use cachex to avoid flooding remote servers
[akkoma] / lib / pleroma / web / rich_media / parser.ex
1 defmodule Pleroma.Web.RichMedia.Parser do
2 @parsers [Pleroma.Web.RichMedia.Parsers.OGP]
3
4 def parse(url) do
5 Cachex.fetch!(:rich_media_cache, url, fn _ ->
6 {:ok, %Tesla.Env{body: html}} = Pleroma.HTTP.get(url)
7
8 result = html |> maybe_parse() |> get_parsed_data()
9
10 {:commit, result}
11 end)
12 end
13
14 defp maybe_parse(html) do
15 Enum.reduce_while(@parsers, %{}, fn parser, acc ->
16 case parser.parse(html, acc) do
17 {:ok, data} -> {:halt, data}
18 {:error, _msg} -> {:cont, acc}
19 end
20 end)
21 end
22
23 defp get_parsed_data(data) when data == %{} do
24 {:error, "No metadata found"}
25 end
26
27 defp get_parsed_data(data) do
28 {:ok, data}
29 end
30 end