[#477] User: FTS and trigram search results mixing (to handle misspelled requests).

This commit is contained in:
Ivan Tashkinov 2019-01-18 10:35:45 +03:00
parent 0bc6d30f7d
commit ed8f55ab8e
3 changed files with 87 additions and 59 deletions

View File

@ -679,13 +679,35 @@ defmodule Pleroma.User do
end
# Searches users matching `query`, combining full-text (FTS) and trigram matches.
#
#   * `query`    - search string; leading "@" characters are removed before searching.
#   * `resolve`  - when truthy, `User.get_or_fetch_by_nickname/1` is called with the query.
#   * `for_user` - handed to `do_search/3`, which passes it on to `boost_search_results/2`.
#
# Returns the FTS results followed by the trigram results, de-duplicated by `id`.
#
# NOTE(review): this span comes from a rendered diff, so removed and added lines appear
# together without +/- markers — confirm against the real file before relying on it.
def search(query, resolve \\ false, for_user \\ nil) do
# strip the beginning @ off if there is a query
# Strip the beginning @ off if there is a query
# `String.trim_leading/2` removes every leading "@", not just the first one.
query = String.trim_leading(query, "@")
if resolve do
User.get_or_fetch_by_nickname(query)
# The result of this call is discarded; it is made only for its effect
# (presumably fetching the remote user so the searches below can find it — TODO confirm).
if resolve, do: User.get_or_fetch_by_nickname(query)
# Both strategies are run independently, each through `do_search/3`.
fts_results = do_search(fts_search_subquery(query), for_user)
trigram_results = do_search(trigram_search_subquery(query), for_user)
# `Enum.uniq_by/2` keeps the first occurrence, so a user found by both strategies
# stays at its FTS position and trigram-only hits follow.
Enum.uniq_by(fts_results ++ trigram_results, & &1.id)
end
# Runs one ranked search subquery and returns the boosted matches.
#
#   * `subquery` - an Ecto query whose rows expose a `search_rank` field.
#   * `for_user` - forwarded unchanged to `boost_search_results/2`.
#   * `options`  - supports `:limit`; a missing or `nil` limit falls back to 20.
#
# Rows are ordered by descending `search_rank` and limited in the database;
# rows whose rank is not above zero are dropped afterwards in Elixir.
defp do_search(subquery, for_user, options \\ []) do
  max_rows = options[:limit] || 20

  ranked =
    from(
      s in subquery(subquery),
      order_by: [desc: s.search_rank],
      limit: ^max_rows
    )

  ranked
  |> Repo.all()
  |> Enum.filter(fn row -> row.search_rank > 0 end)
  |> boost_search_results(for_user)
end
defp fts_search_subquery(query) do
processed_query =
query
|> String.replace(~r/\W+/, " ")
@ -694,7 +716,6 @@ defmodule Pleroma.User do
|> Enum.map(&(&1 <> ":*"))
|> Enum.join(" | ")
inner =
from(
u in User,
select_merge: %{
@ -715,21 +736,27 @@ defmodule Pleroma.User do
},
where: not is_nil(u.nickname)
)
end
q =
# Builds (without executing) the Ecto query used for the trigram-based search.
#
# Every user with a non-nil nickname is selected, with an extra `search_rank` field
# merged into the selection. The rank is the SQL `similarity()` of the search string
# against the nickname and name joined by a space; a NULL name is treated as ''.
#
# NOTE(review): `similarity` is presumably PostgreSQL's pg_trgm function — confirm the
# extension is enabled wherever this query runs.
defp trigram_search_subquery(query) do
from(
# NOTE(review): the next three lines reference `inner`, which is not defined in this
# function; they look like removed lines left over from the rendered diff — confirm.
s in subquery(inner),
order_by: [desc: s.search_rank],
limit: 20
u in User,
select_merge: %{
search_rank:
fragment(
"similarity(?, ? || ' ' || coalesce(?, ''))",
# The search string is interpolated with `^`, so it is sent as a query parameter.
^query,
u.nickname,
u.name
)
},
where: not is_nil(u.nickname)
)
end
results =
q
|> Repo.all()
|> Enum.filter(&(&1.search_rank > 0))
defp boost_search_results(results, nil), do: results
weighted_results =
if for_user do
defp boost_search_results(results, for_user) do
friends_ids = get_friends_ids(for_user)
followers_ids = get_followers_ids(for_user)
@ -752,11 +779,6 @@ defmodule Pleroma.User do
end
)
|> Enum.sort_by(&(-&1.search_rank))
else
results
end
weighted_results
end
def blocks_import(%User{} = blocker, blocked_identifiers) when is_list(blocked_identifiers) do

View File

@ -814,6 +814,12 @@ defmodule Pleroma.UserTest do
assert [u4.id, u3.id, u1.id] == Enum.map(User.search("lain@ple"), & &1.id)
end
# A query with a typo ("laiin") must still return the user named "lain".
test "finds users, handling misspelled requests" do
  lain = insert(:user, %{name: "lain"})

  found_ids =
    "laiin"
    |> User.search()
    |> Enum.map(fn found -> found.id end)

  assert [lain.id] == found_ids
end
test "finds users, boosting ranks of friends and followers" do
u1 = insert(:user)
u2 = insert(:user, %{name: "Doe"})

View File

@ -1656,7 +1656,7 @@ defmodule Pleroma.Web.TwitterAPI.ControllerTest do
test "it returns users, ordered by similarity", %{conn: conn} do
user = insert(:user, %{name: "eal"})
user_two = insert(:user, %{name: "eal me"})
_user_three = insert(:user, %{name: "ebn"})
_user_three = insert(:user, %{name: "zzz"})
resp =
conn