akkoma/lib/pleroma/web/metadata/opengraph.ex

157 lines
5 KiB
Elixir
Raw Normal View History

# Pleroma: A lightweight social networking server
# Copyright © 2017-2019 Pleroma Authors <https://pleroma.social/>
# SPDX-License-Identifier: AGPL-3.0-only
defmodule Pleroma.Web.Metadata.Providers.OpenGraph do
  @moduledoc """
  Metadata provider that renders Open Graph (`og:*`) tags for statuses and
  user profiles.

  Every tag is returned as a `{:meta, attributes, children}` tuple, where
  `attributes` is a keyword list holding `:property` and `:content`.
  """

  alias Pleroma.Formatter
  alias Pleroma.HTML
  alias Pleroma.User
  alias Pleroma.Web.MediaProxy
  alias Pleroma.Web.Metadata
  alias Pleroma.Web.Metadata.Providers.Provider

  @behaviour Provider

  # Media type prefixes that have an Open Graph counterpart (og:image, og:audio, og:video).
  @media_types ["image", "audio", "video"]

  # Scrubbed content consisting of only this character is treated as empty.
  @zero_width_space "\u200B"

  @doc """
  Builds the list of Open Graph meta tags.

  Two input shapes are supported:

    * `%{object: object, url: url, user: user}` - tags for a status. The
      scrubbed status text, wrapped in smart quotes, is appended to both
      `og:title` and `og:description`. The author's avatar is used as
      `og:image` when the status has no attachments or
      `Metadata.activity_nsfw?/1` returns true for it; otherwise the tags
      built from the attachments are used.
    * `%{user: user}` - tags for a user profile, with the scrubbed bio as
      `og:description` and the avatar as `og:image`.
  """
  @impl Provider
  def build_tags(%{object: object, url: url, user: user}) do
    attachments = build_attachments(object)
    scrubbed_content = scrub_html_and_truncate(object)

    content =
      if scrubbed_content != "" and scrubbed_content != @zero_width_space do
        # Opening and closing smart quotes must stay balanced.
        ": “" <> scrubbed_content <> "”"
      else
        ""
      end

    preview_tags =
      if attachments == [] or Metadata.activity_nsfw?(object) do
        avatar_tags(user)
      else
        attachments
      end

    # Most previews only show og:title which is inconvenient. Instagram
    # hacks this by putting the description in the title and making the
    # description longer prefixed by how many likes and shares the post
    # has. Here we use the descriptive nickname in the title, and expand
    # the full account & nickname in the description. We also use the
    # cute^Wevil smart quotes around the status text like Instagram, too.
    [
      {:meta, [property: "og:title", content: "#{user.name}" <> content], []},
      {:meta, [property: "og:url", content: url], []},
      {:meta, [property: "og:description", content: user_name_string(user) <> content], []},
      {:meta, [property: "og:type", content: "website"], []}
    ] ++ preview_tags
  end

  def build_tags(%{user: user}) do
    truncated_bio = scrub_html_and_truncate(user.bio || "")

    [
      {:meta, [property: "og:title", content: user_name_string(user)], []},
      {:meta, [property: "og:url", content: User.profile_url(user)], []},
      {:meta, [property: "og:description", content: truncated_bio], []},
      {:meta, [property: "og:type", content: "website"], []}
    ] ++ avatar_tags(user)
  end

  # The og:image tags for the user's avatar, with the hard-coded 150x150 size.
  defp avatar_tags(user) do
    [
      {:meta, [property: "og:image", content: attachment_url(User.avatar_url(user))], []},
      {:meta, [property: "og:image:width", content: 150], []},
      {:meta, [property: "og:image:height", content: 150], []}
    ]
  end

  # Collects the media tags of every attachment, in attachment order.
  # Objects without an "attachment" list yield no tags instead of raising.
  defp build_attachments(%{data: %{"attachment" => attachments}}) when is_list(attachments) do
    Enum.flat_map(attachments, fn attachment ->
      # Tag groups are prepended, so a later URL entry of the same attachment
      # ends up before an earlier one. List.wrap/1 tolerates a missing or
      # single (non-list) "url" value.
      attachment["url"]
      |> List.wrap()
      |> Enum.reduce([], fn url, acc -> url_tags(url) ++ acc end)
    end)
  end

  defp build_attachments(_object), do: []

  # Tags for a single URL entry of an attachment. Entries without a string
  # "mediaType", or with an unsupported one, produce no tags.
  #
  # TODO: Add additional properties to objects when we have the data available.
  # Also, Whatsapp only wants JPEG or PNGs. It seems that if we add a second og:image
  # object when a Video or GIF is attached it will display that in the Whatsapp Rich Preview.
  defp url_tags(%{"mediaType" => mime} = url) when is_binary(mime) do
    case Enum.find(@media_types, &String.starts_with?(mime, &1)) do
      "image" ->
        [
          {:meta, [property: "og:image", content: attachment_url(url["href"])], []},
          {:meta, [property: "og:image:width", content: 150], []},
          {:meta, [property: "og:image:height", content: 150], []}
        ]

      kind when kind in ["audio", "video"] ->
        [{:meta, [property: "og:" <> kind, content: attachment_url(url["href"])], []}]

      nil ->
        []
    end
  end

  defp url_tags(_url), do: []

  # Turns HTML into plain text suitable for a meta tag. Accepts either an
  # object, in which case the stripped HTML is obtained through
  # HTML.get_cached_stripped_html_for_object/3, or a raw binary.
  defp scrub_html_and_truncate(%{data: %{"content" => content}} = object) do
    content
    |> decode_and_replace_breaks()
    |> HTML.get_cached_stripped_html_for_object(object, __MODULE__)
    |> demojify_and_truncate()
  end

  defp scrub_html_and_truncate(content) when is_binary(content) do
    content
    |> decode_and_replace_breaks()
    |> HTML.strip_tags()
    |> demojify_and_truncate()
  end

  # html content comes from DB already encoded, decode first and scrub after.
  # <br> tags become spaces so adjacent lines do not run together once tags
  # are stripped.
  defp decode_and_replace_breaks(content) do
    content
    |> HtmlEntities.decode()
    |> String.replace(~r/<br\s?\/?>/, " ")
  end

  defp demojify_and_truncate(text) do
    text
    |> Formatter.demojify()
    |> Formatter.truncate()
  end

  # Media URLs are passed through MediaProxy.url/1.
  defp attachment_url(url) do
    MediaProxy.url(url)
  end

  # "Display Name (@nickname)". For local users the instance host is
  # appended to the nickname.
  # NOTE(review): presumably remote nicknames already carry their host - confirm.
  defp user_name_string(user) do
    "#{user.name} " <>
      if user.local do
        "(@#{user.nickname}@#{Pleroma.Web.Endpoint.host()})"
      else
        "(@#{user.nickname})"
      end
  end
end