2019-07-10 05:13:23 +00:00
|
|
|
|
# Pleroma: A lightweight social networking server
|
2020-03-03 22:44:49 +00:00
|
|
|
|
# Copyright © 2017-2020 Pleroma Authors <https://pleroma.social/>
|
2019-07-10 05:13:23 +00:00
|
|
|
|
# SPDX-License-Identifier: AGPL-3.0-only
|
|
|
|
|
|
2019-01-01 20:26:40 +00:00
|
|
|
|
defmodule Pleroma.Web.RichMedia.ParserTest do
|
|
|
|
|
use ExUnit.Case, async: true
|
|
|
|
|
|
2020-09-02 09:38:43 +00:00
|
|
|
|
alias Pleroma.Web.RichMedia.Parser
|
|
|
|
|
|
2019-01-01 20:26:40 +00:00
|
|
|
|
setup do
|
|
|
|
|
Tesla.Mock.mock(fn
|
|
|
|
|
%{
|
|
|
|
|
method: :get,
|
|
|
|
|
url: "http://example.com/ogp"
|
|
|
|
|
} ->
|
|
|
|
|
%Tesla.Env{status: 200, body: File.read!("test/fixtures/rich_media/ogp.html")}
|
2019-01-02 14:02:50 +00:00
|
|
|
|
|
2019-06-22 14:22:59 +00:00
|
|
|
|
%{
|
|
|
|
|
method: :get,
|
|
|
|
|
url: "http://example.com/non-ogp"
|
|
|
|
|
} ->
|
|
|
|
|
%Tesla.Env{status: 200, body: File.read!("test/fixtures/rich_media/non_ogp_embed.html")}
|
|
|
|
|
|
2019-06-22 13:12:57 +00:00
|
|
|
|
%{
|
|
|
|
|
method: :get,
|
|
|
|
|
url: "http://example.com/ogp-missing-title"
|
|
|
|
|
} ->
|
|
|
|
|
%Tesla.Env{
|
|
|
|
|
status: 200,
|
|
|
|
|
body: File.read!("test/fixtures/rich_media/ogp-missing-title.html")
|
|
|
|
|
}
|
|
|
|
|
|
2019-01-10 18:09:56 +00:00
|
|
|
|
%{
|
|
|
|
|
method: :get,
|
|
|
|
|
url: "http://example.com/twitter-card"
|
|
|
|
|
} ->
|
|
|
|
|
%Tesla.Env{status: 200, body: File.read!("test/fixtures/rich_media/twitter_card.html")}
|
|
|
|
|
|
2019-01-13 00:06:50 +00:00
|
|
|
|
%{
|
|
|
|
|
method: :get,
|
|
|
|
|
url: "http://example.com/oembed"
|
|
|
|
|
} ->
|
|
|
|
|
%Tesla.Env{status: 200, body: File.read!("test/fixtures/rich_media/oembed.html")}
|
|
|
|
|
|
|
|
|
|
%{
|
|
|
|
|
method: :get,
|
|
|
|
|
url: "http://example.com/oembed.json"
|
|
|
|
|
} ->
|
|
|
|
|
%Tesla.Env{status: 200, body: File.read!("test/fixtures/rich_media/oembed.json")}
|
|
|
|
|
|
2019-01-02 14:02:50 +00:00
|
|
|
|
%{method: :get, url: "http://example.com/empty"} ->
|
|
|
|
|
%Tesla.Env{status: 200, body: "hello"}
|
2020-09-02 09:38:43 +00:00
|
|
|
|
|
|
|
|
|
%{method: :get, url: "http://example.com/malformed"} ->
|
|
|
|
|
%Tesla.Env{status: 200, body: File.read!("test/fixtures/rich_media/malformed-data.html")}
|
|
|
|
|
|
|
|
|
|
%{method: :get, url: "http://example.com/error"} ->
|
|
|
|
|
{:error, :overload}
|
2020-09-14 12:38:00 +00:00
|
|
|
|
|
|
|
|
|
%{
|
|
|
|
|
method: :head,
|
|
|
|
|
url: "http://example.com/huge-page"
|
|
|
|
|
} ->
|
|
|
|
|
%Tesla.Env{
|
|
|
|
|
status: 200,
|
|
|
|
|
headers: [{"content-length", "2000001"}, {"content-type", "text/html"}]
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
%{
|
|
|
|
|
method: :head,
|
|
|
|
|
url: "http://example.com/pdf-file"
|
|
|
|
|
} ->
|
|
|
|
|
%Tesla.Env{
|
|
|
|
|
status: 200,
|
|
|
|
|
headers: [{"content-length", "1000000"}, {"content-type", "application/pdf"}]
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
%{method: :head} ->
|
|
|
|
|
%Tesla.Env{status: 404, body: "", headers: []}
|
2019-01-01 20:26:40 +00:00
|
|
|
|
end)
|
|
|
|
|
|
|
|
|
|
:ok
|
|
|
|
|
end
|
|
|
|
|
|
2019-01-02 14:02:50 +00:00
|
|
|
|
test "returns error when no metadata present" do
|
2020-09-02 09:38:43 +00:00
|
|
|
|
assert {:error, _} = Parser.parse("http://example.com/empty")
|
2019-01-02 14:02:50 +00:00
|
|
|
|
end
|
|
|
|
|
|
2019-06-22 14:22:59 +00:00
|
|
|
|
test "doesn't just add a title" do
|
2020-09-02 09:38:43 +00:00
|
|
|
|
assert Parser.parse("http://example.com/non-ogp") ==
|
2019-07-23 22:58:31 +00:00
|
|
|
|
{:error,
|
2020-06-09 17:49:24 +00:00
|
|
|
|
"Found metadata was invalid or incomplete: %{\"url\" => \"http://example.com/non-ogp\"}"}
|
2019-06-22 14:22:59 +00:00
|
|
|
|
end
|
|
|
|
|
|
2019-01-01 20:26:40 +00:00
|
|
|
|
test "parses ogp" do
|
2020-09-02 09:38:43 +00:00
|
|
|
|
assert Parser.parse("http://example.com/ogp") ==
|
2019-01-02 14:02:50 +00:00
|
|
|
|
{:ok,
|
|
|
|
|
%{
|
2020-06-09 17:49:24 +00:00
|
|
|
|
"image" => "http://ia.media-imdb.com/images/rock.jpg",
|
|
|
|
|
"title" => "The Rock",
|
|
|
|
|
"description" =>
|
2019-05-30 21:03:31 +00:00
|
|
|
|
"Directed by Michael Bay. With Sean Connery, Nicolas Cage, Ed Harris, John Spencer.",
|
2020-06-09 17:49:24 +00:00
|
|
|
|
"type" => "video.movie",
|
|
|
|
|
"url" => "http://example.com/ogp"
|
2019-01-02 14:02:50 +00:00
|
|
|
|
}}
|
2019-01-01 20:26:40 +00:00
|
|
|
|
end
|
2019-01-10 18:09:56 +00:00
|
|
|
|
|
2019-06-22 13:12:57 +00:00
|
|
|
|
test "falls back to <title> when ogp:title is missing" do
|
2020-09-02 09:38:43 +00:00
|
|
|
|
assert Parser.parse("http://example.com/ogp-missing-title") ==
|
2019-06-22 13:12:57 +00:00
|
|
|
|
{:ok,
|
|
|
|
|
%{
|
2020-06-09 17:49:24 +00:00
|
|
|
|
"image" => "http://ia.media-imdb.com/images/rock.jpg",
|
|
|
|
|
"title" => "The Rock (1996)",
|
|
|
|
|
"description" =>
|
2019-06-22 13:12:57 +00:00
|
|
|
|
"Directed by Michael Bay. With Sean Connery, Nicolas Cage, Ed Harris, John Spencer.",
|
2020-06-09 17:49:24 +00:00
|
|
|
|
"type" => "video.movie",
|
|
|
|
|
"url" => "http://example.com/ogp-missing-title"
|
2019-06-22 13:12:57 +00:00
|
|
|
|
}}
|
|
|
|
|
end
|
|
|
|
|
|
2019-01-10 18:09:56 +00:00
|
|
|
|
test "parses twitter card" do
|
2020-09-02 09:38:43 +00:00
|
|
|
|
assert Parser.parse("http://example.com/twitter-card") ==
|
2019-01-10 18:09:56 +00:00
|
|
|
|
{:ok,
|
|
|
|
|
%{
|
2020-06-09 17:49:24 +00:00
|
|
|
|
"card" => "summary",
|
|
|
|
|
"site" => "@flickr",
|
|
|
|
|
"image" => "https://farm6.staticflickr.com/5510/14338202952_93595258ff_z.jpg",
|
|
|
|
|
"title" => "Small Island Developing States Photo Submission",
|
|
|
|
|
"description" => "View the album on Flickr.",
|
|
|
|
|
"url" => "http://example.com/twitter-card"
|
2019-01-10 18:09:56 +00:00
|
|
|
|
}}
|
|
|
|
|
end
|
2019-01-13 00:06:50 +00:00
|
|
|
|
|
|
|
|
|
test "parses OEmbed" do
|
2020-09-02 09:38:43 +00:00
|
|
|
|
assert Parser.parse("http://example.com/oembed") ==
|
2019-01-13 00:06:50 +00:00
|
|
|
|
{:ok,
|
|
|
|
|
%{
|
2020-06-09 17:49:24 +00:00
|
|
|
|
"author_name" => "bees",
|
|
|
|
|
"author_url" => "https://www.flickr.com/photos/bees/",
|
|
|
|
|
"cache_age" => 3600,
|
|
|
|
|
"flickr_type" => "photo",
|
|
|
|
|
"height" => "768",
|
|
|
|
|
"html" =>
|
2019-01-13 00:06:50 +00:00
|
|
|
|
"<a data-flickr-embed=\"true\" href=\"https://www.flickr.com/photos/bees/2362225867/\" title=\"Bacon Lollys by bees, on Flickr\"><img src=\"https://farm4.staticflickr.com/3040/2362225867_4a87ab8baf_b.jpg\" width=\"1024\" height=\"768\" alt=\"Bacon Lollys\"></a><script async src=\"https://embedr.flickr.com/assets/client-code.js\" charset=\"utf-8\"></script>",
|
2020-06-09 17:49:24 +00:00
|
|
|
|
"license" => "All Rights Reserved",
|
|
|
|
|
"license_id" => 0,
|
|
|
|
|
"provider_name" => "Flickr",
|
|
|
|
|
"provider_url" => "https://www.flickr.com/",
|
|
|
|
|
"thumbnail_height" => 150,
|
|
|
|
|
"thumbnail_url" =>
|
|
|
|
|
"https://farm4.staticflickr.com/3040/2362225867_4a87ab8baf_q.jpg",
|
|
|
|
|
"thumbnail_width" => 150,
|
|
|
|
|
"title" => "Bacon Lollys",
|
|
|
|
|
"type" => "photo",
|
|
|
|
|
"url" => "http://example.com/oembed",
|
|
|
|
|
"version" => "1.0",
|
|
|
|
|
"web_page" => "https://www.flickr.com/photos/bees/2362225867/",
|
|
|
|
|
"web_page_short_url" => "https://flic.kr/p/4AK2sc",
|
|
|
|
|
"width" => "1024"
|
2019-01-13 00:06:50 +00:00
|
|
|
|
}}
|
|
|
|
|
end
|
2019-01-31 16:19:53 +00:00
|
|
|
|
|
|
|
|
|
test "rejects invalid OGP data" do
|
2020-09-02 09:38:43 +00:00
|
|
|
|
assert {:error, _} = Parser.parse("http://example.com/malformed")
|
|
|
|
|
end
|
|
|
|
|
|
|
|
|
|
test "returns error if getting page was not successful" do
|
|
|
|
|
assert {:error, :overload} = Parser.parse("http://example.com/error")
|
2019-01-31 16:19:53 +00:00
|
|
|
|
end
|
2020-09-14 12:38:00 +00:00
|
|
|
|
|
|
|
|
|
test "does a HEAD request to check if the body is too large" do
|
|
|
|
|
assert {:error, :body_too_large} = Parser.parse("http://example.com/huge-page")
|
|
|
|
|
end
|
|
|
|
|
|
|
|
|
|
test "does a HEAD request to check if the body is html" do
|
|
|
|
|
assert {:error, {:content_type, _}} = Parser.parse("http://example.com/pdf-file")
|
|
|
|
|
end
|
2019-01-01 20:26:40 +00:00
|
|
|
|
end
|