2021-08-15 12:53:04 -06:00
|
|
|
# Pleroma: A lightweight social networking server
|
|
|
|
# Copyright © 2017-2021 Pleroma Authors <https://pleroma.social/>
|
|
|
|
# SPDX-License-Identifier: AGPL-3.0-only
|
|
|
|
|
|
|
|
defmodule Mix.Tasks.Pleroma.Search.Meilisearch do
|
2021-08-16 01:18:01 -06:00
|
|
|
require Logger
|
2021-08-16 13:24:31 -06:00
|
|
|
require Pleroma.Constants
|
2021-08-15 12:53:04 -06:00
|
|
|
|
2021-08-16 01:18:01 -06:00
|
|
|
import Mix.Pleroma
|
2021-08-15 12:53:04 -06:00
|
|
|
import Ecto.Query
|
|
|
|
|
2021-08-23 11:21:46 -06:00
|
|
|
import Pleroma.Search.Meilisearch, only: [meili_post!: 2, meili_delete!: 1, meili_get!: 1]
|
2021-08-23 10:35:21 -06:00
|
|
|
|
2021-11-10 11:25:12 -07:00
|
|
|
# Handles the `index` subcommand: pushes public notes from the database into
# the Meilisearch `objects` index.
#
# Steps:
#   1. Configures the index's ranking rules and searchable attributes.
#   2. Streams matching objects from the database (inside a transaction, as
#      `Repo.stream/2` requires), converts each one with
#      `Pleroma.Search.Meilisearch.object_to_search_data/1` and drops the ones
#      that convert to `nil`.
#   3. Uploads the documents in chunks, printing a running progress counter.
#
# Options (taken from `args`):
#   * `--reindex` - before uploading, look every document up in Meilisearch
#     and only upload the ones it reports as `document_not_found`.
def run(["index" | args]) do
  start_pleroma()

  reindex? = "--reindex" in args

  meili_post!(
    "/indexes/objects/settings/ranking-rules",
    [
      "desc(published)",
      "words",
      "exactness",
      "proximity",
      "wordsPosition",
      "typo",
      "attribute"
    ]
  )

  meili_post!(
    "/indexes/objects/settings/searchable-attributes",
    [
      "content"
    ]
  )

  chunk_size = 10_000

  Pleroma.Repo.transaction(
    fn ->
      query =
        from(Pleroma.Object,
          # Only index public posts which are notes and have some text
          where:
            fragment("data->>'type' = 'Note'") and
              fragment("LENGTH(data->>'content') > 0") and
              fragment("data->'to' \\? ?", ^Pleroma.Constants.as_public()),
          order_by: [desc: fragment("data->'published'")]
        )

      count = Pleroma.Repo.aggregate(query, :count, :data)
      IO.puts("Entries to index: #{count}")

      query
      |> Pleroma.Repo.stream(timeout: :infinity)
      |> Stream.map(&Pleroma.Search.Meilisearch.object_to_search_data/1)
      |> Stream.reject(&is_nil/1)
      |> Stream.chunk_every(chunk_size)
      |> Stream.transform(0, fn objects, acc ->
        new_acc = acc + length(objects)

        # Reset to the beginning of the line and rewrite it
        IO.write("\rIndexed #{new_acc} entries")

        {[objects], new_acc}
      end)
      |> Stream.each(fn objects ->
        # The `--reindex` decision is the same for every object, so it is made
        # once per chunk instead of once per document.
        pending =
          if reindex? do
            Enum.filter(objects, fn o ->
              result = meili_get!("/indexes/objects/documents/#{o.id}")

              # Filter out the already indexed documents. This is true when the document does not exist
              result["errorCode"] == "document_not_found"
            end)
          else
            objects
          end

        # With `--reindex` a whole chunk may already be indexed; do not send
        # an empty batch to Meilisearch in that case.
        if pending != [] do
          result = meili_post!("/indexes/objects/documents", pending)

          # A response without "updateId" is treated as a failed upload.
          if not Map.has_key?(result, "updateId") do
            IO.puts("Failed to index: #{inspect(result)}")
          end
        end
      end)
      |> Stream.run()
    end,
    timeout: :infinity
  )

  # Terminate the progress line that was being rewritten with "\r".
  IO.write("\n")
end
|
2021-08-16 13:24:31 -06:00
|
|
|
|
|
|
|
# Handles the `clear` subcommand: starts the application and issues a DELETE
# against the documents collection of the `objects` index.
def run(["clear"]) do
  start_pleroma()

  documents_path = "/indexes/objects/documents"
  meili_delete!(documents_path)
end
|
|
|
|
|
|
|
|
# Handles the `show-private-key` subcommand: asks the configured Meilisearch
# instance for its keys, authenticating with `master_key`, and prints the
# "private" key from the response. If the response has no "private" entry,
# an error message containing the decoded response is printed instead.
def run(["show-private-key", master_key]) do
  start_pleroma()

  keys_url =
    [Pleroma.Search.Meilisearch, :url]
    |> Pleroma.Config.get()
    |> Path.join("/keys")

  auth_headers = [{"X-Meili-API-Key", master_key}]

  # Any transport-level failure crashes the task here on purpose.
  {:ok, response} = Pleroma.HTTP.get(keys_url, auth_headers)

  keys = Jason.decode!(response.body)

  case keys["private"] do
    missing when missing in [nil, false] ->
      IO.puts("Error fetching the key, check the master key is correct: #{inspect(keys)}")

    private_key ->
      IO.puts(private_key)
  end
end
|
2021-08-23 11:21:46 -06:00
|
|
|
|
|
|
|
# Handles the `stats` subcommand: fetches the stats of the `objects` index
# and prints its document count and whether it is currently indexing.
def run(["stats"]) do
  start_pleroma()

  stats = meili_get!("/indexes/objects/stats")

  document_count = stats["numberOfDocuments"]
  indexing = stats["isIndexing"]

  IO.puts("Number of entries: #{document_count}")
  IO.puts("Indexing? #{indexing}")
end
|
2021-08-15 12:53:04 -06:00
|
|
|
end
|