pleroma.database fill_old_hashtags: Add month_limit argument
authorHaelwenn (lanodan) Monnier <contact@hacktivis.me>
Tue, 22 Dec 2020 04:11:19 +0000 (05:11 +0100)
committerHaelwenn (lanodan) Monnier <contact@hacktivis.me>
Mon, 28 Dec 2020 10:05:25 +0000 (11:05 +0100)
docs/administration/CLI_tasks/database.md
lib/mix/tasks/pleroma/database.ex

index a2d2e8cdda516b57db0d2bdb322f7346a3f6876a..eb85381ffa779eb49af9f72cf6ac7fa04391fd04 100644 (file)
@@ -93,12 +93,14 @@ Can be safely re-run
 
 ## Fill hashtags for old objects
 
+Migrate hashags fields for old objects, from now to `months_limit` months.
+
 ```sh tab="OTP"
-./bin/pleroma_ctl database fill_old_hashtags
+./bin/pleroma_ctl database fill_old_hashtags <months_limit>
 ```
 
 ```sh tab="From Source"
-mix pleroma.database fill_old_hashtags
+mix pleroma.database fill_old_hashtags <months_limit>
 ```
 
 ## Vacuum the database
index 0c1343313118749930993926d4de8d3922fe6d19..a098525038e008b77fcadbfa6fce1aa651295e24 100644 (file)
@@ -128,47 +128,55 @@ defmodule Mix.Tasks.Pleroma.Database do
     |> Stream.run()
   end
 
-  def run(["fill_old_hashtags"]) do
+  def run(["fill_old_hashtags", month_limit]) do
     import Ecto.Query
 
     start_pleroma()
 
-    from(
-      o in Object,
-      where: fragment("(?)->>'hashtags' is null", o.data),
-      where: fragment("(?)->>'tag' != '[]'", o.data),
-      select: %{id: o.id, tag: fragment("(?)->>'tag'", o.data)},
-      order_by: [:desc, o.id]
-    )
-    |> Pleroma.Repo.chunk_stream(200, :batches)
-    |> Stream.each(fn objects ->
-      Repo.transaction(fn ->
-        objects_first = objects |> List.first()
-        objects_last = objects |> List.last()
-
-        Logger.info(
-          "fill_old_hashtags: #{objects_first.id} (#{objects_first.inserted_at}) -- #{
-            objects_last.id
-          } (#{objects_last.inserted_at})"
-        )
+    month_limit = String.to_integer(month_limit)
 
-        objects
-        |> Enum.map(fn object ->
-          tags =
-            object.tag
-            |> Jason.decode!()
-            |> Enum.filter(&is_bitstring(&1))
-
-          Object
-          |> where([o], o.id == ^object.id)
-          |> update([o],
-            set: [data: fragment("safe_jsonb_set(?, '{hashtags}', ?, true)", o.data, ^tags)]
+    if month_limit < 1 do
+      shell_error("Invalid `month_limit` argument, needs to be greater than 1")
+    else
+      time_limit = DateTime.utc_now() |> Timex.shift(months: -month_limit)
+
+      from(
+        o in Object,
+        where: fragment("(?)->>'hashtags' is null", o.data),
+        where: fragment("(?)->>'tag' != '[]'", o.data),
+        where: o.inserted_at < ^time_limit,
+        select: %{id: o.id, tag: fragment("(?)->>'tag'", o.data)}
+      )
+      |> Pleroma.Repo.chunk_stream(200, :batches)
+      |> Stream.each(fn objects ->
+        Repo.transaction(fn ->
+          objects_first = objects |> List.first()
+          objects_last = objects |> List.last()
+
+          Logger.info(
+            "fill_old_hashtags: #{objects_first.id} (#{objects_first.inserted_at}) -- #{
+              objects_last.id
+            } (#{objects_last.inserted_at})"
           )
-          |> Repo.update_all([], timeout: :infinity)
+
+          objects
+          |> Enum.map(fn object ->
+            tags =
+              object.tag
+              |> Jason.decode!()
+              |> Enum.filter(&is_bitstring(&1))
+
+            Object
+            |> where([o], o.id == ^object.id)
+            |> update([o],
+              set: [data: fragment("safe_jsonb_set(?, '{hashtags}', ?, true)", o.data, ^tags)]
+            )
+            |> Repo.update_all([], timeout: :infinity)
+          end)
         end)
       end)
-    end)
-    |> Stream.run()
+      |> Stream.run()
+    end
   end
 
   def run(["vacuum", args]) do