# frozen_string_literal: true require "pretty_text" RSpec.describe PrettyText do fab!(:user) fab!(:post) before { SiteSetting.enable_markdown_typographer = false } def n(html) html.strip end def cook(*args) PrettyText.cook(*args) end let(:wrapped_image) do "" end describe "Quoting" do context "with avatar" do let(:default_avatar) do "//test.localhost/uploads/default/avatars/42d/57c/46ce7ee487/{size}.png" end before { User.stubs(:default_template).returns(default_avatar) } it "correctly extracts usernames from the new quote format" do topic = Fabricate(:topic, title: "this is a test topic :slight_smile:") expected = <<~HTML HTML expect( cook( "[quote=\"Jeff, post:2, topic:#{topic.id}, username:codinghorror\"]\nddd\n[/quote]", topic_id: 1, ), ).to eq(n(expected)) end it "do off topic quoting with emoji unescape" do topic = Fabricate(:topic, title: "this is a test topic :slight_smile:") expected = <<~HTML HTML expect( cook("[quote=\"EvilTrout, post:2, topic:#{topic.id}\"]\nddd\n[/quote]", topic_id: 1), ).to eq(n(expected)) end context "with emojis" do let(:md) { <<~MD } > This is a quote with a regular emoji :upside_down_face: > This is a quote with an emoji shortcut :) > This is a quote with a Unicode emoji 😎 MD it "does not unescape emojis when emojis are disabled" do SiteSetting.enable_emoji = false html = <<~HTML

This is a quote with a regular emoji :upside_down_face:

This is a quote with an emoji shortcut :)

This is a quote with a Unicode emoji 😎

HTML expect(cook(md)).to eq(html.strip) end it "does not convert emoji shortcuts when emoji shortcuts are disabled" do SiteSetting.enable_emoji_shortcuts = false html = <<~HTML

This is a quote with a regular emoji

This is a quote with an emoji shortcut :)

This is a quote with a Unicode emoji

HTML expect(cook(md)).to eq(html.strip) end it "unescapes all emojis" do html = <<~HTML

This is a quote with a regular emoji

This is a quote with an emoji shortcut

This is a quote with a Unicode emoji

HTML expect(cook(md)).to eq(html.strip) end it "adds an only-emoji class when a line has only one emoji" do md = <<~MD ☹️ foo 😀 foo 😀 bar :smile_cat: :smile_cat: :smile_cat: :smile_cat: :smile_cat: :smile_cat: :smile_cat: baz? :smile_cat: 😀 😉 foo 😉 😉 😉 😉 😉 😉 😉 😉😉😉 😉 😉 😉 😉d😉 😉 😉 😉 😉d 😉😉😉😉 MD html = <<~HTML

foo
foo bar

baz?

foo

d:wink:
d

HTML expect(cook(md)).to eq(html.strip) end it "does use emoji CDN when enabled" do SiteSetting.external_emoji_url = "https://emoji.cdn.com" html = <<~HTML

This is a quote with a regular emoji

This is a quote with an emoji shortcut

This is a quote with a Unicode emoji

HTML expect(cook(md)).to eq(html.strip) end it "does use emoji CDN when others CDNs are also enabled" do set_cdn_url("https://cdn.com") setup_s3 SiteSetting.s3_cdn_url = "https://s3.cdn.com" SiteSetting.external_emoji_url = "https://emoji.cdn.com" html = <<~HTML

This is a quote with a regular emoji

This is a quote with an emoji shortcut

This is a quote with a Unicode emoji

HTML expect(cook(md)).to eq(html.strip) end end it "do off topic quoting of posts from secure categories" do category = Fabricate(:category, read_restricted: true) topic = Fabricate(:topic, title: "this is topic with secret category", category: category) expected = <<~HTML HTML expect( cook( "[quote=\"maja, post:3, topic:#{topic.id}\"]\nI have nothing to say.\n[/quote]", topic_id: 1, ), ).to eq(n(expected)) end it "do off topic quoting with the force_quote_link opt and no topic_id opt provided" do topic = Fabricate(:topic, title: "This is an off-topic topic") expected = <<~HTML HTML cooked = cook( "[quote=\"maja, post:3, topic:#{topic.id}\"]\nI have nothing to say.\n[/quote]", force_quote_link: true, ) expect(cooked).to eq(n(expected)) end it "indifferent about missing quotations" do md = <<~MD [quote=#{user.username}, post:123, topic:456, full:true] ddd [/quote] MD html = <<~HTML HTML expect(PrettyText.cook(md)).to eq(html.strip) end it "indifferent about curlies and no curlies" do md = <<~MD [quote=“#{user.username}, post:123, topic:456, full:true”] ddd [/quote] MD html = <<~HTML HTML expect(PrettyText.cook(md)).to eq(html.strip) end it "trims spaces on quote params" do md = <<~MD [quote="#{user.username}, post:555, topic: 666"] ddd [/quote] MD html = <<~HTML HTML expect(PrettyText.cook(md)).to eq(html.strip) end end context "with primary user group" do let(:default_avatar) do "//test.localhost/uploads/default/avatars/42d/57c/46ce7ee487/{size}.png" end fab!(:group) fab!(:user) { Fabricate(:user, primary_group: group) } before { User.stubs(:default_template).returns(default_avatar) } it "adds primary group class to referenced users quote" do topic = Fabricate(:topic, title: "this is a test topic") expected = <<~HTML HTML expect( cook( "[quote=\"#{user.username}, post:2, topic:#{topic.id}\"]\nddd\n[/quote]", topic_id: 1, ), ).to eq(n(expected)) end end it "can handle inline block bbcode" do cooked = PrettyText.cook("[quote]te **s** t[/quote]") html = <<~HTML HTML expect(cooked).to eq(html.strip) end it "handles bbcode edge cases" do expect(PrettyText.cook "[constructor]\ntest").to eq("

[constructor]
\ntest

") end it "can handle quote edge cases" do expect(PrettyText.cook("[quote]abc\ntest\n[/quote]")).not_to include("aside") expect(PrettyText.cook("[quote] \ntest\n[/quote] ")).to include("aside") expect(PrettyText.cook("a\n[quote]\ntest\n[/quote]\n\n\na")).to include("aside") expect(PrettyText.cook("- a\n[quote]\ntest\n[/quote]\n\n\na")).to include("aside") expect(PrettyText.cook("[quote]\ntest")).not_to include("aside") expect(PrettyText.cook("[quote]\ntest\n[/quote]z")).not_to include("aside") nested = <<~MD [quote] a [quote] b [/quote] c [/quote] MD cooked = PrettyText.cook(nested) expect(cooked.scan("aside").length).to eq(4) expect(cooked.scan("quote]").length).to eq(0) end context "with letter avatar" do context "with subfolder" do it "should have correct avatar url" do set_subfolder "/forum" md = <<~MD [quote="#{user.username}, post:123, topic:456, full:true"] ddd [/quote] MD expect(PrettyText.cook(md)).to include("/forum/letter_avatar_proxy") end end end end describe "Mentions" do it "can handle mentions after abbr" do expect(PrettyText.cook("test test\n\n@bob")).to eq( "

test test

@bob

", ) end it "should handle 3 mentions in a row" do expect( PrettyText.cook("@hello @hello @hello"), ).to match_html "

@hello @hello @hello

" end it "can handle mention edge cases" do expect(PrettyText.cook("hi\n@s")).to eq("

hi
\n@s

") expect(PrettyText.cook("hi\n@ss")).to eq("

hi
\n@ss

") expect(PrettyText.cook("hi\n@s.")).to eq("

hi
\n@s.

") expect(PrettyText.cook("hi\n@s.s")).to eq( "

hi
\n@s.s

", ) expect(PrettyText.cook("hi\n@.s.s")).to eq("

hi
\n@.s.s

") end it "handles user and group mentions correctly" do %w[User user2].each { |username| Fabricate(:user, username: username) } Fabricate(:group, name: "Group", mentionable_level: Group::ALIAS_LEVELS[:everyone]) Fabricate( :group, name: "Group2", mentionable_level: Group::ALIAS_LEVELS[:members_mods_and_admins], ) [ [ "hi @uSer! @user2 hi", '

hi @uSer! @user2 hi

', ], [ "hi\n@user. @GROUP @somemention @group2", %Q|

hi
\n@user. @GROUP @somemention @group2

|, ], ].each { |input, expected| expect(PrettyText.cook(input)).to eq(expected) } end context "with subfolder" do it "handles user and group mentions correctly" do set_subfolder "/forum" Fabricate(:user, username: "user1") Fabricate(:group, name: "groupA", mentionable_level: Group::ALIAS_LEVELS[:everyone]) input = "hi there @user1 and @groupA" expected = '

hi there @user1 and @groupA

' expect(PrettyText.cook(input)).to eq(expected) end end it "does not assign the notify class to a group that can't be mentioned" do group = Fabricate( :group, visibility_level: Group.visibility_levels[:members], mentionable_level: Group::ALIAS_LEVELS[:nobody], ) expect(PrettyText.cook("test @#{group.name} test")).to eq( %Q|

test @#{group.name} test

|, ) end it "assigns the notify class if the user can mention" do group = Fabricate( :group, visibility_level: Group.visibility_levels[:members], mentionable_level: Group::ALIAS_LEVELS[:members_mods_and_admins], ) expect(PrettyText.cook("test @#{group.name} test", user_id: Fabricate(:admin).id)).to eq( %Q|

test @#{group.name} test

|, ) end it "does not mention staged users" do user = Fabricate(:user, staged: true) expect(PrettyText.cook("something @#{user.username} something")).to eq( %Q|

something @#{user.username} something

|, ) end context "when mentions are disabled" do before { SiteSetting.enable_mentions = false } it "should not convert mentions to links" do expect(PrettyText.cook("hi @user")).to eq("

hi @user

") end end it "can handle mentions inside a hyperlink" do expect(PrettyText.cook(" @inner ")).to match_html "

@inner

" end it "can handle mentions inside a hyperlink" do expect( PrettyText.cook("[link @inner](http://site.com)"), ).to match_html '

link @inner

' end it "can handle a list of mentions" do expect(PrettyText.cook("@a,@b")).to match_html( '

@a,@b

', ) end it "should handle group mentions with a hyphen and without" do expect( PrettyText.cook("@hello @hello-hello"), ).to match_html "

@hello @hello-hello

" end it "should allow for @mentions to have punctuation" do expect(PrettyText.cook("hello @bob's @bob,@bob; @bob\"")).to match_html( "

hello @bob's @bob,@bob; @bob\"

", ) end it "should not treat a medium link as a mention" do expect(PrettyText.cook(". http://test/@sam")).not_to include("mention") end context "with Unicode usernames disabled" do before { SiteSetting.unicode_usernames = false } it "does not detect mention" do expect(PrettyText.cook("Hello @狮子")).to_not include("mention") end end context "with Unicode usernames enabled" do before { SiteSetting.unicode_usernames = true } it "does detect mention" do expect( PrettyText.cook("Hello @狮子"), ).to match_html '

Hello @狮子

' end end context "with pretty_text_extract_mentions modifier" do it "allows changing the mentions extracted" do cooked_html = <<~HTML

@test, @test-group, @test-custom, test1, this is a test

HTML extracted_mentions = PrettyText.extract_mentions(Nokogiri::HTML5.fragment(cooked_html)) expect(extracted_mentions).to contain_exactly("test", "test-group") Plugin::Instance .new .register_modifier(:pretty_text_extract_mentions) do |mentions, cooked_text| custom_mentions = cooked_text .css(".custom-mention") .map do |e| if (name = e.inner_text) name = name[1..-1] name = User.normalize_username(name) name end end mentions + custom_mentions end extracted_mentions = PrettyText.extract_mentions(Nokogiri::HTML5.fragment(cooked_html)) expect(extracted_mentions).to include("test", "test-group", "test-custom") ensure DiscoursePluginRegistry.clear_modifiers! end end end describe "code fences" do it "indents code correctly" do code = <<~MD X ``` # x ``` MD cooked = PrettyText.cook(code) html = <<~HTML

     #
             x

HTML expect(cooked).to eq(html.strip) end it "doesn't replace emoji in code blocks with our emoji sets if emoji is enabled" do expect(PrettyText.cook("```\n💣`\n```\n")).not_to match(/\:bomb\:/) end it "can include code class correctly" do SiteSetting.highlighted_languages += "|c++|structured-text|p21" # keep in mind spaces should be trimmed per spec expect(PrettyText.cook("``` ruby the mooby\n`````")).to eq( '

', ) expect(PrettyText.cook("```cpp\ncpp\n```")).to match_html( "

cpp\n

", ) expect(PrettyText.cook("```\ncpp\n```")).to match_html( "

cpp\n

", ) expect(PrettyText.cook("```text\ncpp\n```")).to match_html( "

cpp\n

", ) expect(PrettyText.cook("```custom\ncustom content\n```")).to match_html( "

custom content\n

", ) expect(PrettyText.cook("```custom foo=bar\ncustom content\n```")).to match_html( "

custom content

", ) expect(PrettyText.cook("```INVALID a=1, foo=bar , baz=2\n```")).to match_html( "

\n

", ) expect(PrettyText.cook("```text\n```")).to match_html( "

\n

", ) expect(PrettyText.cook("```auto\n```")).to match_html( "

\n

", ) expect(PrettyText.cook("```ruby startline=3 $%@#\n```")).to match_html( "

\n

", ) expect(PrettyText.cook("```mermaid a_-你=17\n```")).to match_html( "

\n

", ) expect( PrettyText.cook("```mermaid foo=\n```"), ).to match_html( "

\n

", ) # Check unicode bidi characters are stripped: expect(PrettyText.cook("```mermaid foo=\u202E begin admin o\u001C\n```")).to match_html( "

\n

", ) expect(PrettyText.cook("```c++\nc++\n```")).to match_html( "

c++\n

", ) expect(PrettyText.cook("```structured-text\nstructured-text\n```")).to match_html( "

structured-text\n

", ) expect(PrettyText.cook("```p21\np21\n```")).to match_html( "

p21\n

", ) expect( PrettyText.cook("

"), ).to match_html("

") end it "indents code correctly" do code = "X\n```\n\n #\n x\n```" cooked = PrettyText.cook(code) expect(cooked).to match_html( "

\n    #\n    x\n

", ) end it "does censor code fences" do begin %w[apple banana].each do |w| Fabricate(:watched_word, word: w, action: WatchedWord.actions[:censor]) end expect(PrettyText.cook("# banana")).not_to include("banana") ensure Discourse.redis.flushdb end end it "strips out unicode bidirectional (bidi) override characters and replaces with a highlighted span" do code = <<~MD X ```auto var isAdmin = false; /*‮ begin admin only */⁦ if (isAdmin) ⁩ ⁦ { console.log("You are an admin."); /* end admins only ‮*/⁦ } ``` MD cooked = PrettyText.cook(code) hidden_bidi_title = I18n.t("post.hidden_bidi_character") html = <<~HTML

var isAdmin = false;
        /*<U+202E> begin admin only */<U+2066> if (isAdmin) <U+2069> <U+2066> {
        console.log("You are an admin.");
        /* end admins only <U+202E>*/<U+2066> }

HTML expect(cooked).to eq(html.strip) end it "fuzzes all possible dangerous unicode bidirectional (bidi) override characters, making sure they are replaced" do bad_bidi = [ "\u202A", "\u202B", "\u202C", "\u202D", "\u202E", "\u2066", "\u2067", "\u2068", "\u2069", ] bad_bidi.each do |bidi| code = <<~MD ``` #{bidi} ``` MD cooked = PrettyText.cook(code) formatted_bidi = format("<U+%04X>", bidi.ord) html = <<~HTML

#{formatted_bidi}

HTML expect(cooked).to eq(html.strip) end end it "fuzzes all possible dangerous unicode bidirectional (bidi) override characters in solo code and pre nodes, making sure they are replaced" do bad_bidi = [ "\u202A", "\u202B", "\u202C", "\u202D", "\u202E", "\u2066", "\u2067", "\u2068", "\u2069", ] bad_bidi.each do |bidi| code = <<~MD #{bidi} MD cooked = PrettyText.cook(code) formatted_bidi = format("<U+%04X>", bidi.ord) html = <<~HTML

#{formatted_bidi}

HTML expect(cooked).to eq(html.strip) end bad_bidi.each do |bidi| code = <<~MD

#{bidi}

MD cooked = PrettyText.cook(code) formatted_bidi = format("<U+%04X>", bidi.ord) html = <<~HTML

#{formatted_bidi}

HTML expect(cooked).to eq(html.strip) end end end describe "rel attributes" do before do SiteSetting.add_rel_nofollow_to_user_content = true SiteSetting.exclude_rel_nofollow_domains = "foo.com|bar.com" end it "should inject nofollow in all user provided links" do expect(PrettyText.cook('cnn')).to match(/noopener nofollow ugc/) end it "should not inject nofollow in all local links" do expect( PrettyText.cook("cnn") !~ /nofollow ugc/, ).to eq(true) end it "should not inject nofollow in all subdomain links" do expect( PrettyText.cook( "cnn", ) !~ /nofollow ugc/, ).to eq(true) end it "should inject nofollow in all non subdomain links" do expect( PrettyText.cook( "cnn", ), ).to match(/nofollow ugc/) end it "should not inject nofollow for foo.com" do expect(PrettyText.cook("cnn") !~ /nofollow ugc/).to eq( true, ) end it "should inject nofollow for afoo.com" do expect(PrettyText.cook("cnn")).to match( /nofollow ugc/, ) end it "should not inject nofollow for bar.foo.com" do expect( PrettyText.cook("cnn") !~ /nofollow ugc/, ).to eq(true) end it "should not inject nofollow if omit_nofollow option is given" do expect( PrettyText.cook('cnn', omit_nofollow: true) !~ /nofollow ugc/, ).to eq(true) end it "adds the noopener attribute even if omit_nofollow option is given" do raw_html = 'Check out my site!' expect(PrettyText.cook(raw_html, omit_nofollow: true)).to match(/noopener/) end it "adds the noopener attribute even if omit_nofollow option is given" do raw_html = 'Check out my site!' expect(PrettyText.cook(raw_html, omit_nofollow: false)).to match(/noopener nofollow ugc/) end end describe "Excerpt" do it "sanitizes attempts to inject invalid attributes" do spinner = "", 100)).to eq("[image]") end context "with alt tags" do it "should keep alt tags" do expect( PrettyText.excerpt( "

", 100, ), ).to eq("[car]") end describe "when alt tag is empty" do it "should not keep alt tags" do expect(PrettyText.excerpt("

", 100)).to eq( "[#{I18n.t("excerpt_image")}]", ) end end end context "with title tags" do it "should keep title tags" do expect(PrettyText.excerpt("

", 100)).to eq( "[car]", ) end describe "when title tag is empty" do it "should not keep title tags" do expect(PrettyText.excerpt("

", 100)).to eq( "[#{I18n.t("excerpt_image")}]", ) end end end it "should convert images to markdown if the option is set" do expect( PrettyText.excerpt( "

", 100, markdown_images: true, ), ).to eq("![car](http://cnn.com/a.gif)") end it "replaces details / summary with the summary" do expect( PrettyText.excerpt("

expand

hello

", 6), ).to match_html "▶ expand" end it "should remove meta information" do expect( PrettyText.excerpt(wrapped_image, 100), ).to match_html "" end it "should strip images when option is set" do expect( PrettyText.excerpt("

", 100, strip_images: true), ).to be_blank expect( PrettyText.excerpt( "

Hello world!", 100, strip_images: true, ), ).to eq("Hello world!") end it "should strip images, but keep emojis when option is set" do emoji_image = "

" html = "

Hello world #{emoji_image}" expect(PrettyText.excerpt(html, 100, strip_images: true)).to eq("Hello world :heart:") expect( PrettyText.excerpt(html, 100, strip_images: true, keep_emoji_images: true), ).to match_html("Hello world #{emoji_image}") end end context "with emojis" do it "should remove broken emoji" do html = <<~HTML $\":bike:\"$ $\":cat:\"$ $\":discourse:\"$ HTML expect(PrettyText.excerpt(html, 7)).to eq(":bike: …") expect(PrettyText.excerpt(html, 8)).to eq(":bike: …") expect(PrettyText.excerpt(html, 9)).to eq(":bike: …") expect(PrettyText.excerpt(html, 10)).to eq(":bike: …") expect(PrettyText.excerpt(html, 11)).to eq(":bike: …") expect(PrettyText.excerpt(html, 12)).to eq(":bike: :cat: …") expect(PrettyText.excerpt(html, 13)).to eq(":bike: :cat: …") expect(PrettyText.excerpt(html, 14)).to eq(":bike: :cat: …") end end it "should have an option to strip links" do expect(PrettyText.excerpt("cnn", 100, strip_links: true)).to eq( "cnn", ) end it "should preserve links" do expect( PrettyText.excerpt("cnn", 100), ).to match_html "cnn" end it "should deal with special keys properly" do expect(PrettyText.excerpt("

", 100)).to eq("") end it "should truncate stuff properly" do expect(PrettyText.excerpt("hello world", 5)).to eq("hello…") expect(PrettyText.excerpt("
hello
world
", 6)).to eq("hello w…") end it "should insert a space between to Ps" do expect(PrettyText.excerpt("
a
b
", 5)).to eq("a b") end it "should strip quotes" do expect(PrettyText.excerpt("
a
b
boom", 5)).to eq( "boom", ) end it "should not count the surrounds of a link" do expect( PrettyText.excerpt("cnn", 3), ).to match_html "cnn" end it "uses an ellipsis instead of html entities if provided with the option" do expect( PrettyText.excerpt("cnn", 2, text_entities: true), ).to match_html "cn..." end it "should truncate links" do expect( PrettyText.excerpt("cnn", 2), ).to match_html "cn…" end it "doesn't extract empty quotes as links" do expect( PrettyText.extract_links("
not a linked quote
\n").to_a, ).to be_empty end it "doesn't extract links from elided parts" do expect( PrettyText.extract_links( "
cnn
\n", ).to_a, ).to be_empty end def extract_urls(text) PrettyText.extract_links(text).map(&:url).to_a end it "should be able to extract links" do expect(extract_urls("http://bla.com")).to eq(["http://cnn.com"]) end it "should extract links to topics" do expect(extract_urls("
aside
")).to eq( ["/t/321"], ) end it "does not extract links from hotlinked images" do html = <<~HTML
example

image 808×740 24.8 KB

HTML expect(extract_urls(html)).to eq(["https://example.com"]) end context "when lazy-videos" do it "should extract youtube url" do expect( extract_urls( "
", ), ).to eq(["https://www.youtube.com/watch?v=yXEuEUQIP3Q"]) end it "should extract vimeo url" do expect( extract_urls( "
", ), ).to eq(["https://vimeo.com/786646692"]) end it "should extract tiktok url" do expect( extract_urls( "
", ), ).to eq(["https://m.tiktok.com/v/6718335390845095173"]) end end it "should extract links to posts" do expect( extract_urls("
aside
"), ).to eq(["/t/1234/4567"]) end it "should not extract links to anchors" do expect(extract_urls("TOS")).to eq([]) end it "should not extract links inside quotes" do links = PrettyText.extract_links( " http://useless1.com
http://useless3.com http://useless4.com
http://useless2.com ", ) expect(links.map { |l| [l.url, l.is_quote] }.sort).to eq( [ ["http://body_only.com", false], ["http://body_and_quote.com", false], ["/t/1234", true], ].sort, ) end it "should not extract links inside oneboxes" do onebox = <<~HTML

twitter.com twitter.com

Example URL: example.com

HTML expect(PrettyText.extract_links(onebox).map(&:url)).to contain_exactly( "https://twitter.com/EDBPostgres/status/1402528437441634306", ) end it "should not preserve tags in code blocks" do expect( PrettyText.excerpt( "
<h3>Hours</h3>
", 100, ), ).to eq("<h3>Hours</h3>") end it "should handle nil" do expect(PrettyText.excerpt(nil, 100)).to eq("") end it "handles custom bbcode excerpt" do raw = <<~MD [excerpt] hello [site](https://site.com) [/excerpt] more stuff MD post = Fabricate(:post, raw: raw) expect(post.excerpt).to eq( "hello site", ) end it "handles div excerpt at the beginning of a post" do expect(PrettyText.excerpt("
hi
test", 100)).to eq("hi") end it "handles span excerpt at the beginning of a post" do expect(PrettyText.excerpt("hi test", 100)).to eq("hi") end it "ignores max excerpt length if a div excerpt is specified" do two_hundred = "123456789 " * 20 + "." text = two_hundred + "
#{two_hundred}
" + two_hundred expect(PrettyText.excerpt(text, 100)).to eq(two_hundred) end it "ignores max excerpt length if a span excerpt is specified" do two_hundred = "123456789 " * 20 + "." text = two_hundred + "#{two_hundred}" + two_hundred expect(PrettyText.excerpt(text, 100)).to eq(two_hundred) end it "unescapes html entities when we want text entities" do expect(PrettyText.excerpt("'", 500, text_entities: true)).to eq("'") end it "should have an option to preserve emoji images" do emoji_image = "" expect(PrettyText.excerpt(emoji_image, 100, keep_emoji_images: true)).to match_html( emoji_image, ) end it "should have an option to remap emoji to code points" do emoji_image = "I you " expect(PrettyText.excerpt(emoji_image, 100, remap_emoji: true)).to match_html( "I ❤ you :unknown:", ) end it "should have an option to preserve emoji codes" do emoji_code = "" expect(PrettyText.excerpt(emoji_code, 100)).to eq(":heart:") end context "with option to preserve onebox source" do it "should return the right excerpt" do onebox = "
\n
\n meta.discourse.org\n
\n
\n \n\n
Infrequent translation updates in stable branch
\n\n
Well, there's an Italian translation for \"New Topic\" in beta, it's been there since November 2014 and it works here on meta. Do you have any plugins installed? Try disabling them. I'm quite confident that it's either a plugin or a site...
\n\n
\n
\n \n \n
\n
\n
\n\n\n" expected = "meta.discourse.org" expect(PrettyText.excerpt(onebox, 100, keep_onebox_source: true)).to eq(expected) expect( PrettyText.excerpt("#{onebox}\n \n \n \n\n\n #{onebox}", 100, keep_onebox_source: true), ).to eq("#{expected}\n\n#{expected}") end it "should continue to strip quotes" do expect( PrettyText.excerpt( "
a
b
boom", 100, keep_onebox_source: true, ), ).to eq("boom") end end it "should strip audio/video" do html = <<~HTML
Listen to this!
HTML expect(PrettyText.excerpt(html, 100)).to eq("Listen to this!") html = <<~HTML

Watch this, but do not include the video in the excerpt.
HTML ellipsis = "…" excerpt_size = 40 excerpt = PrettyText.excerpt(html, excerpt_size) expect(excerpt.size).to eq(excerpt_size + ellipsis.size) expect(excerpt).to eq("Watch this, but do not include the video#{ellipsis}") end end describe "strip links" do it "returns blank for blank input" do expect(PrettyText.strip_links("")).to be_blank end it "does nothing to a string without links" do expect(PrettyText.strip_links("I'm the batman")).to eq("I'm the batman") end it "strips links but leaves the text content" do expect( PrettyText.strip_links( "I'm the linked batman", ), ).to eq("I'm the linked batman") end it "escapes the text content" do expect( PrettyText.strip_links( "I'm the linked <batman>", ), ).to eq("I'm the linked <batman>") end end describe "strip_image_wrapping" do def strip_image_wrapping(html) doc = Nokogiri::HTML5.fragment(html) described_class.strip_image_wrapping(doc) doc.to_html end it "doesn't change HTML when there's no wrapped image" do html = "" expect(strip_image_wrapping(html)).to eq(html) end it "strips the metadata" do expect( strip_image_wrapping(wrapped_image), ).to match_html "
" end end describe "format_for_email" do context "when (sub)domain" do before { Discourse.stubs(:base_path).returns("") } it "does not crash" do html = <<~HTML test HTML expect(described_class.format_for_email(html, post)).to eq <<~HTML test HTML end it "adds base url to relative links" do html = <<~HTML
@wiseguy, @trollol what do you guys think?
HTML expect(described_class.format_for_email(html, post)).to eq <<~HTML
@wiseguy, @trollol what do you guys think?
HTML end it "doesn't change external absolute links" do html = <<~HTML
Check out this guy.
HTML expect(described_class.format_for_email(html, post)).to eq(html) end it "doesn't change internal absolute links" do html = <<~HTML
Check out this guy.
HTML expect(described_class.format_for_email(html, post)).to eq(html) end it "can tolerate invalid URLs" do html = <<~HTML
Check out this guy.
HTML expect(described_class.format_for_email(html, post)).to eq(html) end it "doesn't change mailto" do html = <<~HTML
Contact me at this address.
HTML expect(described_class.format_for_email(html, post)).to eq(html) end it "prefers data-original-href attribute to get Vimeo iframe link and escapes it" do html = <<~HTML
Check out this video – .
HTML expect(described_class.format_for_email(html, post)).to match( Regexp.escape("https://vimeo.com/329875646/%3E%20%3Cscript%3Ealert(1)%3C/script%3E"), ) end it "creates a valid URL when data-original-href is missing from Vimeo link" do html = <<~HTML HTML expect(described_class.format_for_email(html, post)).to match( "https://vimeo.com/508864124/fcbbcc92fa", ) end describe "#convert_vimeo_iframes" do it "converts to <a>" do html = <<~HTML <p>This is a Vimeo link:</p> <iframe width="640" height="360" src="https://player.vimeo.com/video/1" data-original-href="https://vimeo.com/1" frameborder="0" allowfullscreen="" seamless="seamless" sandbox="allow-same-origin allow-scripts allow-forms allow-popups allow-popups-to-escape-sandbox allow-presentation"> HTML md = described_class.format_for_email(html, post) expect(md).not_to include("This is a Vimeo link:

https://vimeo.com/1
HTML end end describe "#strip_secure_uploads" do before do setup_s3 SiteSetting.s3_cdn_url = "https://s3.cdn.com" SiteSetting.secure_uploads = true SiteSetting.login_required = true end it "replaces secure video content" do html = <<~HTML HTML md = described_class.format_for_email(html, post) expect(md).not_to include(" Audio label HTML md = described_class.format_for_email(html, post) expect(md).not_to include(" HTML md = described_class.format_for_email(html, post) expect(md).not_to include(" HTML md = described_class.format_for_email(html, post) expect(md.scan(/stripped-secure-view-upload/).length).to eq(1) expect(md.scan(/Redacted/).length).to eq(1) end it "replaces secure images with a placeholder, keeping the url in an attribute" do url = "/secure-uploads/original/1X/testimage.png" html = <<~HTML HTML md = described_class.format_for_email(html, post) expect(md).not_to include("@wiseguy, @trollol what do you guys think?
HTML expect(described_class.format_for_email(html, post)).to eq <<~HTML
@wiseguy, @trollol what do you guys think?
HTML end it "doesn't change external absolute links" do html = <<~HTML
Check out this guy.
HTML expect(described_class.format_for_email(html, post)).to eq(html) end it "doesn't change internal absolute links" do html = <<~HTML
Check out this guy.
HTML expect(described_class.format_for_email(html, post)).to eq(html) end end end it "Is smart about linebreaks and IMG tags" do raw = <<~MD a a - li ``` test ``` ``` test ``` MD html = <<~HTML
a

a

li

test

test
HTML expect(PrettyText.cook(raw)).to eq(html.strip) end describe "emoji" do it "replaces unicode emoji with our emoji sets if emoji is enabled" do expect(PrettyText.cook("💣")).to match(/\:bomb\:/) end it "does not replace left right arrow" do expect(PrettyText.cook("↔")).to eq("
↔
") end it "doesn't replace emoji in inline code blocks with our emoji sets if emoji is enabled" do expect(PrettyText.cook("`💣`")).not_to match(/\:bomb\:/) end it "replaces some glyphs that are not in the emoji range" do expect(PrettyText.cook("☹")).to match(/\:frowning\:/) expect(PrettyText.cook("☺")).to match(/\:smiling_face\:/) expect(PrettyText.cook("☻")).to match(/\:slight_smile\:/) expect(PrettyText.cook("♡")).to match(/\:heart\:/) expect(PrettyText.cook("❤")).to match(/\:heart\:/) expect(PrettyText.cook("❤️")).to match(/\:heart\:/) # in emoji range but ensure it works along others end it "replaces digits" do expect(PrettyText.cook("🔢")).to match(/\:1234\:/) expect(PrettyText.cook("1️⃣")).to match(/\:one\:/) expect(PrettyText.cook("#️⃣")).to match(/\:hash\:/) expect(PrettyText.cook("*️⃣")).to match(/\:asterisk\:/) end it "doesn't replace unicode emoji if emoji is disabled" do SiteSetting.enable_emoji = false expect(PrettyText.cook("💣")).not_to match(/\:bomb\:/) end it "doesn't replace emoji if emoji is disabled" do SiteSetting.enable_emoji = false expect(PrettyText.cook(":bomb:")).to eq("
:bomb:
") end it "doesn't replace shortcuts if disabled" do SiteSetting.enable_emoji_shortcuts = false expect(PrettyText.cook(":)")).to eq("
:)
") end it "does replace shortcuts if enabled" do expect(PrettyText.cook(":)")).to match("smile") end it "replaces skin toned emoji" do expect(PrettyText.cook("hello 👱🏿‍♀️")).to eq( "
hello $\":blonde_woman:t6:\"$
", ) expect(PrettyText.cook("hello 👩‍🎤")).to eq( "
hello $\":woman_singer:\"$
", ) expect(PrettyText.cook("hello 👩🏾‍🎓")).to eq( "
hello $\":woman_student:t5:\"$
", ) expect(PrettyText.cook("hello 🤷‍♀️")).to eq( "
hello $\":woman_shrugging:\"$
", ) end it "correctly strips VARIATION SELECTOR-16 character (ufe0f) from some emojis" do expect(PrettyText.cook("❤️💣")).to match(/]+bomb[^>]+>/) end it "replaces Emoji from Unicode 14.0" do expect(PrettyText.cook("🫣")).to match(/\:face_with_peeking_eye\:/) end context "with subfolder" do it "prepends the subfolder path to the emoji url" do set_subfolder "/forum" expected = "src=\"/forum/images/emoji/twitter/grinning.png?v=#{Emoji::EMOJI_VERSION}\"" expect(PrettyText.cook("😀")).to include(expected) expect(PrettyText.cook(":grinning:")).to include(expected) end it "prepends the subfolder path even if it is part of the emoji url" do set_subfolder "/info" expected = "src=\"/info/images/emoji/twitter/information_source.png?v=#{Emoji::EMOJI_VERSION}\"" expect(PrettyText.cook("ℹ️")).to include(expected) expect(PrettyText.cook(":information_source:")).to include(expected) end end end describe "custom emoji" do it "replaces the custom emoji" do CustomEmoji.create!(name: "trout", upload: Fabricate(:upload)) Emoji.clear_cache expect(PrettyText.cook("hello :trout:")).to match(/]+trout[^>]+>/) end end describe "custom emoji translation" do before do PrettyText.reset_translations SiteSetting.enable_emoji = true SiteSetting.enable_emoji_shortcuts = true plugin = Plugin::Instance.new plugin.translate_emoji "0:)", "otter" end after do Plugin::CustomEmoji.clear_cache PrettyText.reset_translations end it "sets the custom translation" do expect(PrettyText.cook("hello 0:)")).to match(/otter/) end end it "replaces skin toned emoji" do expect(PrettyText.cook("hello 👱🏿‍♀️")).to eq( "
hello $\":blonde_woman:t6:\"$
", ) expect(PrettyText.cook("hello 👩‍🎤")).to eq( "
hello $\":woman_singer:\"$
", ) expect(PrettyText.cook("hello 👩🏾‍🎓")).to eq( "
hello $\":woman_student:t5:\"$
", ) expect(PrettyText.cook("hello 🤷‍♀️")).to eq( "
hello $\":woman_shrugging:\"$
", ) end it "should not treat a non emoji as an emoji" do expect(PrettyText.cook(":email,class_name:")).not_to include("emoji") end it "supports href schemes" do SiteSetting.allowed_href_schemes = "macappstore|steam" cooked = cook("[Steam URL Scheme](steam://store/452530)") expected = '
Steam URL Scheme
' expect(cooked).to eq(n expected) end it "supports forbidden schemes" do SiteSetting.allowed_href_schemes = "macappstore|itunes" cooked = cook("[Steam URL Scheme](steam://store/452530)") expected = "
Steam URL Scheme
" expect(cooked).to eq(n expected) end it "applies scheme restrictions to img[src] attributes" do SiteSetting.allowed_href_schemes = "steam" cooked = cook "![Steam URL Image](steam://store/452530) ![Other scheme image](itunes://store/452530)" expected = '

' expect(cooked).to eq(n expected) end it "applies scheme restrictions to track[src] and source[src]" do SiteSetting.allowed_href_schemes = "steam" cooked = cook <<~MD MD expect(cooked).to include <<~HTML HTML end it "applies scheme restrictions to source[srcset]" do SiteSetting.allowed_href_schemes = "steam" cooked = cook <<~MD MD expect(cooked).to include <<~HTML HTML end it "allows only tel URL scheme to start with a plus character" do SiteSetting.allowed_href_schemes = "tel|steam" cooked = cook("[Tel URL Scheme](tel://+452530579785)") expected = '
Tel URL Scheme
' expect(cooked).to eq(n expected) cooked2 = cook("[Steam URL Scheme](steam://+store/452530)") expected2 = "
Steam URL Scheme
" expect(cooked2).to eq(n expected2) end it "produces hashtag links" do user = Fabricate(:user) category = Fabricate(:category, name: "testing", slug: "testing") category2 = Fabricate(:category, name: "known", slug: "known") group = Fabricate(:group) private_category = Fabricate(:private_category, name: "secret", group: group, slug: "secret") tag = Fabricate(:tag, name: "known") Fabricate(:topic, tags: [tag]) cooked = PrettyText.cook(" #unknown::tag #known #known::tag #testing #secret", user_id: user.id) expect(cooked).to have_tag("span", text: "#unknown::tag", with: { class: "hashtag-raw" }) expect(cooked).to have_tag( "a", with: { class: "hashtag-cooked", href: category2.url, "data-type": "category", "data-slug": category2.slug, "data-id": category2.id, }, ) do with_tag("span", with: { class: "hashtag-icon-placeholder" }) end expect(cooked).to have_tag( "a", with: { class: "hashtag-cooked", href: category.url, "data-type": "category", "data-slug": category.slug, "data-id": category.id, }, ) do with_tag("span", with: { class: "hashtag-icon-placeholder" }) end expect(cooked).to have_tag( "a", with: { class: "hashtag-cooked", href: tag.url, "data-type": "tag", "data-slug": tag.name, "data-id": tag.id, }, ) do with_tag("span", with: { class: "hashtag-icon-placeholder" }) end expect(cooked).to have_tag("span", text: "#secret", with: { class: "hashtag-raw" }) # If the user hash access to the private category it should be cooked with the details + icon group.add(user) cooked = PrettyText.cook(" #unknown::tag #known #known::tag #testing #secret", user_id: user.id) expect(cooked).to have_tag( "a", with: { class: "hashtag-cooked", href: private_category.url, "data-type": "category", "data-slug": private_category.slug, "data-id": private_category.id, }, ) do with_tag("span", with: { class: "hashtag-icon-placeholder" }) end cooked = PrettyText.cook("[`a` #known::tag here](http://example.com)", user_id: user.id) html = <<~HTML
a #known::tag here
HTML expect(cooked).to eq(html.strip) cooked = PrettyText.cook("`a` #known::tag here", user_id: user.id) expect(cooked).to eq(html.strip) cooked = PrettyText.cook("test #known::tag", user_id: user.id) expect(cooked).to have_tag( "a", with: { class: "hashtag-cooked", href: tag.url, "data-type": "tag", "data-slug": tag.name, "data-id": tag.id, }, ) do with_tag("span", with: { class: "hashtag-icon-placeholder" }) end # ensure it does not fight with the autolinker expect(PrettyText.cook(" http://somewhere.com/#known")).not_to include("hashtag") expect(PrettyText.cook(" http://somewhere.com/?#known")).not_to include("hashtag") expect(PrettyText.cook(" http://somewhere.com/?abc#known")).not_to include("hashtag") end it "can handle mixed lists" do # known bug in old md engine cooked = PrettyText.cook("* a\n\n1. b") expect(cooked).to match_html("
\n
a
\n
\n
\n
b
\n
") end it "can handle traditional vs non traditional newlines" do SiteSetting.traditional_markdown_linebreaks = true expect(PrettyText.cook("1\n2")).to match_html "
1 2
" SiteSetting.traditional_markdown_linebreaks = false expect(PrettyText.cook("1\n2")).to match_html "
1
\n2
" end it "can handle emoji by name" do expected = <
HTML expect(PrettyText.cook(":smile::sunny:")).to eq(expected.strip) end it "handles emoji boundaries correctly" do cooked = PrettyText.cook("a,:man:t2:,b") expected = "
a, $\":man:t2:\"$ ,b
" expect(cooked).to match(expected.strip) end it "can handle emoji by translation" do expected = "
$\":wink:\"$
" expect(PrettyText.cook(";)")).to eq(expected) end it "can handle multiple emojis by translation" do cooked = PrettyText.cook(":) ;) :)") expect(cooked.split("img").length - 1).to eq(3) end it "handles emoji boundaries correctly" do expect(PrettyText.cook(",:)")).to include("emoji") expect(PrettyText.cook(":-)\n")).to include("emoji") expect(PrettyText.cook("a :)")).to include("emoji") expect(PrettyText.cook(":),")).not_to include("emoji") expect(PrettyText.cook("abcde ^:;-P")).to include("emoji") end describe "censoring" do after { Discourse.redis.flushdb } def expect_cooked_match(raw, expected_cooked) expect(PrettyText.cook(raw)).to eq(expected_cooked) end context "with basic words" do fab!(:watched_words) do %w[shucks whiz whizzer a**le badword* shuck$ café $uper].each do |word| Fabricate(:watched_word, action: WatchedWord.actions[:censor], word: word) end end it "works correctly" do expect_cooked_match("aw shucks, golly gee whiz.", "
aw ■■■■■■, golly gee ■■■■.
") end it "doesn't censor words unless they have boundaries." do expect_cooked_match( "you are a whizzard! I love cheesewhiz. Whiz.", "
you are a whizzard! I love cheesewhiz. ■■■■.
", ) end it "censors words even if previous partial matches exist." do expect_cooked_match( "you are a whizzer! I love cheesewhiz. Whiz.", "
you are a ■■■■■■■! I love cheesewhiz. ■■■■.
", ) end it "won't break links by censoring them." do expect_cooked_match( "The link still works. [whiz](http://www.whiz.com)", '
The link still works. ■■■■
', ) end it "escapes regexp characters" do expect_cooked_match("I have a pen, I have an a**le", "
I have a pen, I have an ■■■■■
") end it "works for words ending in non-word characters" do expect_cooked_match( "Aw shuck$, I can't fix the problem with money", "
Aw ■■■■■■, I can't fix the problem with money
", ) end it "works for words ending in accented characters" do expect_cooked_match("Let's go to a café today", "
Let's go to a ■■■■ today
") end it "works for words starting with non-word characters" do expect_cooked_match("Discourse is $uper amazing", "
Discourse is ■■■■■ amazing
") end it "handles * as wildcard" do expect_cooked_match("No badword or apple here plz.", "
No ■■■■■■■ or ■■■■■ here plz.
") end end context "with watched words as regular expressions" do before { SiteSetting.watched_words_regular_expressions = true } it "supports words as regular expressions" do %w[xyz* plee+ase].each do |word| Fabricate(:watched_word, action: WatchedWord.actions[:censor], word: word) end expect_cooked_match( "Pleased to meet you, but pleeeease call me later, xyz123", "
Pleased to meet you, but ■■■■■■■■■ call me later, ■■■123
", ) end it "supports custom boundaries" do Fabricate(:watched_word, action: WatchedWord.actions[:censor], word: "\\btown\\b") expect_cooked_match( "Meet downtown in your town at the townhouse on Main St.", "
Meet downtown in your ■■■■ at the townhouse on Main St.
", ) end end end describe "watched words - replace & link" do after { Discourse.redis.flushdb } # Makes sure that mini_racer/libv8-node env doesn't regress it "finishes in a timely matter" do sql = 1500.times.map { |i| <<~SQL }.join INSERT INTO watched_words (created_at, updated_at, word, action, replacement) VALUES ( :now, :now, 'word_#{i}', :action, 'replacement_#{i}' ); SQL DB.exec(sql, now: Time.current, action: WatchedWord.actions[:replace]) Fabricate( :watched_word, action: WatchedWord.actions[:replace], word: "nope", replacement: "yep", ) # Due to a bug in node 18.16 and lower this takes about 11s. # On node 18.19 and newer it takes about 250ms expect do Timeout.timeout(3) do expect(PrettyText.cook("abc nope def")).to match_html("
abc yep def
") end end.not_to raise_error end it "replaces words with other words" do Fabricate( :watched_word, action: WatchedWord.actions[:replace], word: "dolor sit*", replacement: "something else", ) expect(PrettyText.cook("Lorem ipsum dolor sit amet")).to match_html(<<~HTML)
Lorem ipsum something else amet
HTML expect(PrettyText.cook("Lorem ipsum dolor sits amet")).to match_html(<<~HTML)
Lorem ipsum something else amet
HTML expect(PrettyText.cook("Lorem ipsum dolor sittt amet")).to match_html(<<~HTML)
Lorem ipsum something else amet
HTML expect(PrettyText.cook("Lorem ipsum xdolor sit amet")).to match_html(<<~HTML)
Lorem ipsum xdolor sit amet
HTML end it "replaces words with wildcards" do Fabricate( :watched_word, action: WatchedWord.actions[:replace], word: "*dolor*", replacement: "something else", ) expect(PrettyText.cook("Lorem ipsum xdolorx sit amet")).to match_html(<<~HTML)
Lorem ipsum something else sit amet
HTML end it "replaces words with links" do Fabricate( :watched_word, action: WatchedWord.actions[:link], word: "meta", replacement: "https://meta.discourse.org", ) expect(PrettyText.cook("Meta is a Discourse forum")).to match_html(<<~HTML)
Meta is a Discourse forum
HTML end it "works with regex" do Fabricate( :watched_word, action: WatchedWord.actions[:replace], word: "f.o", replacement: "test", ) expect(PrettyText.cook("foo")).to match_html("
foo
") expect(PrettyText.cook("f.o")).to match_html("
test
") SiteSetting.watched_words_regular_expressions = true expect(PrettyText.cook("foo")).to match_html("
test
") expect(PrettyText.cook("f.o")).to match_html("
test
") end it "does not replace hashtags and mentions" do Fabricate(:user, username: "test") category = Fabricate(:category, slug: "test", name: "test") Fabricate( :watched_word, action: WatchedWord.actions[:replace], word: "test", replacement: "discourse", ) cooked = PrettyText.cook("@test #test test") expect(cooked).to have_tag("a", text: "@test", with: { class: "mention", href: "/u/test" }) expect(cooked).to have_tag( "a", text: "test", with: { class: "hashtag-cooked", href: "/c/test/#{category.id}", "data-type": "category", "data-slug": category.slug, "data-id": category.id, }, ) do with_tag("span", with: { class: "hashtag-icon-placeholder" }) end expect(cooked).to include("discourse") end it "does not replace hashtags and mentions when watched words are regular expressions" do SiteSetting.watched_words_regular_expressions = true Fabricate(:user, username: "test") category = Fabricate(:category, slug: "test", name: "test") Fabricate( :watched_word, action: WatchedWord.actions[:replace], word: "es", replacement: "discourse", ) cooked = PrettyText.cook("@test #test test") expect(cooked).to have_tag("a", text: "@test", with: { class: "mention", href: "/u/test" }) expect(cooked).to have_tag( "a", text: "test", with: { class: "hashtag-cooked", href: "/c/test/#{category.id}", "data-type": "category", "data-slug": category.slug, "data-id": category.id, }, ) do with_tag("span", with: { class: "hashtag-icon-placeholder" }) end expect(cooked).to include("tdiscourset") end it "supports overlapping words" do Fabricate( :watched_word, action: WatchedWord.actions[:link], word: "meta", replacement: "https://meta.discourse.org", ) Fabricate(:watched_word, action: WatchedWord.actions[:replace], word: "iz", replacement: "is") Fabricate( :watched_word, action: WatchedWord.actions[:link], word: "discourse", replacement: "https://discourse.org", ) expect(PrettyText.cook("Meta iz a Discourse forum")).to match_html(<<~HTML)
Meta is a Discourse forum
HTML end end it "supports typographer" do SiteSetting.enable_markdown_typographer = true expect(PrettyText.cook("->")).to eq("
→
") SiteSetting.enable_markdown_typographer = false expect(PrettyText.cook("->")).to eq("
->
") end it "uses quotation marks from site settings" do SiteSetting.enable_markdown_typographer = true expect(PrettyText.cook(%q|"Do you know," he said, "what 'Discourse' is?"|)).to eq( "
“Do you know,” he said, “what ‘Discourse’ is?”
", ) SiteSetting.markdown_typographer_quotation_marks = "„|“|‚|‘" expect(PrettyText.cook(%q|"Weißt du", sagte er, "was 'Discourse' ist?"|)).to eq( "
„Weißt du“, sagte er, „was ‚Discourse‘ ist?“
", ) end it "handles onebox correctly" do expect(PrettyText.cook("http://a.com\nhttp://b.com").split("onebox").length).to eq(3) expect(PrettyText.cook("http://a.com\n\nhttp://b.com").split("onebox").length).to eq(3) expect(PrettyText.cook("a\nhttp://a.com")).to include("onebox") expect(PrettyText.cook("> http://a.com")).not_to include("onebox") expect(PrettyText.cook("a\nhttp://a.com a")).not_to include("onebox") expect(PrettyText.cook("a\nhttp://a.com\na")).to include("onebox") expect(PrettyText.cook("http://a.com")).to include("onebox") expect(PrettyText.cook("http://a.com ")).to include("onebox") expect(PrettyText.cook("http://a.com a")).not_to include("onebox") expect(PrettyText.cook("- http://a.com")).not_to include("onebox") expect(PrettyText.cook("")).not_to include("onebox") expect(PrettyText.cook(" http://a.com")).not_to include("onebox") expect(PrettyText.cook("a\n http://a.com")).not_to include("onebox") expect(PrettyText.cook("sam@sam.com")).not_to include("onebox") expect(PrettyText.cook("\nhttp://a.com")).to include("onebox") end it "can handle bbcode" do expect(PrettyText.cook("a[b]b[/b]c")).to eq('
abc
') expect(PrettyText.cook("a[i]b[/i]c")).to eq('
abc
') end it "supports empty inline BBCode" do expect(PrettyText.cook("a[b][/b]c")).to eq('
ac
') end it "can handle bbcode after a newline" do # this is not 100% ideal cause we get an extra p here, but this is pretty rare expect(PrettyText.cook("a\n[code]code[/code]")).to eq( "
a
\n
code
", ) # this is fine expect(PrettyText.cook("a\na[code]code[/code]")).to eq("
a
\nacode
") end it "can onebox local topics" do op = post reply = Fabricate(:post, topic_id: op.topic_id) url = Discourse.base_url + reply.url quote = create_post(topic_id: op.topic.id, raw: "This is a sample reply with a quote\n\n#{url}") quote.reload expect(quote.cooked).not_to include("[quote") end it "supports tables" do markdown = <<~MD | Tables | Are | Cool | | ------------- |:-------------:| -----:| | col 3 is | right-aligned | $1600 | MD expected = <<~HTML

Tables Are Cool

col 3 is right-aligned $1600

HTML expect(PrettyText.cook(markdown)).to eq(expected.strip) end it "supports img bbcode" do cooked = PrettyText.cook "[img]http://www.image/test.png[/img]" html = "
$\"\"$
" expect(cooked).to eq(html) end it "supports img bbcode entities in attributes" do actual = PrettyText.cook "[img]http://aaa.com/?a=1&b=[/img]" expected = '
' expect(expected).to be_same_dom(actual) end it "supports email bbcode" do cooked = PrettyText.cook "[email]sam@sam.com[/email]" html = '
sam@sam.com
' expect(cooked).to eq(html) end it "supports url bbcode" do cooked = PrettyText.cook "[url]http://sam.com[/url]" html = '
http://sam.com
' expect(cooked).to eq(html) end it "supports nesting tags in url" do cooked = PrettyText.cook("[url=http://sam.com][b]I am sam[/b][/url]") html = '
I am sam
' expect(cooked).to eq(html) end it "supports query params in bbcode url" do cooked = PrettyText.cook( "[url=https://www.amazon.com/Camcorder-Hausbell-302S-Control-Infrared/dp/B01KLOA1PI/?tag=discourse]BBcode link[/url]", ) html = '
BBcode link
' expect(cooked).to eq(html) end it "supports inline code bbcode" do cooked = PrettyText.cook "Testing [code]codified **stuff** and `more` stuff[/code]" html = "
Testing codified **stuff** and `more` stuff
" expect(cooked).to eq(html) end it "supports block code bbcode" do cooked = PrettyText.cook "[code]\ncodified\n\n\n **stuff** and `more` stuff\n[/code]" html = "
codified\n\n\n **stuff** and `more` stuff
" expect(cooked).to eq(html) end it "support special handling for space in urls" do cooked = PrettyText.cook "http://testing.com?a%20b" html = '
http://testing.com?a%20b
' expect(cooked).to eq(html) end it "supports onebox for decoded urls" do cooked = PrettyText.cook "http://testing.com?a%50b" html = '
http://testing.com?aPb
' expect(cooked).to eq(html) end it "should sanitize the html" do expect(PrettyText.cook("alert(42)")).to eq "
alert(42)
" end it "should not onebox magically linked urls" do expect(PrettyText.cook("[url]site.com[/url]")).not_to include("onebox") end it "should sanitize the html" do expect(PrettyText.cook("
hi
")).to eq "
hi
" end it "should strip SCRIPT" do expect(PrettyText.cook("")).to eq "" expect(PrettyText.cook("
")).to eq "
" end it "strips script regardless of sanitize" do expect( PrettyText.cook("
", sanitize: false), ).to eq "
" end it "should allow sanitize bypass" do expect( PrettyText.cook("alert(42)", sanitize: false), ).to eq "
alert(42)
" end # custom rule used to specify image dimensions via alt tags describe "image dimensions" do it "allows title plus dimensions" do cooked = PrettyText.cook <<~MD ![title with | title|220x100](http://png.com/my.png) ![](http://png.com/my.png) ![|220x100](http://png.com/my.png) ![stuff](http://png.com/my.png) ![|220x100,50%](http://png.com/my.png "some title") MD html = <<~HTML

HTML expect(cooked).to eq(html.strip) end it "ignores whitespace and allows scaling by percent, width, height" do cooked = PrettyText.cook <<~MD ![|220x100, 50%](http://png.com/my.png) ![|220x100 , 50%](http://png.com/my.png) ![|220x100 ,50%](http://png.com/my.png) ![|220x100,150x](http://png.com/my.png) ![|220x100, x50](http://png.com/my.png) MD html = <<~HTML

HTML expect(cooked).to eq(html.strip) end end describe "upload decoding" do it "can decode upload:// for default setup" do set_cdn_url("https://cdn.com") upload = Fabricate(:upload) raw = <<~RAW ![upload](#{upload.short_url}) ![upload](#{upload.short_url} "some title to test") - ![upload](#{upload.short_url}) - test - ![upload](#{upload.short_url}) ![upload](#{upload.short_url.gsub(".png", "")}) Inline img
Block img
[some attachment](#{upload.short_url}) [some attachment|attachment](#{upload.short_url}) [some attachment|random](#{upload.short_url}) RAW cdn_url = Discourse.store.cdn_url(upload.url) cooked = <<~HTML

test

Inline img

Block img

some attachment

some attachment

some attachment|random
HTML expect(PrettyText.cook(raw)).to eq(cooked.strip) end it "can place a blank image if we can not find the upload" do raw = <<~MD ![upload](upload://abcABC.png) [some attachment|attachment](upload://abcdefg.png) MD cooked = <<~HTML

some attachment
HTML expect(PrettyText.cook(raw)).to eq(cooked.strip) end end it "can properly allowlist iframes" do SiteSetting.allowed_iframes = "https://bob.com/a|http://silly.com/?EMBED=" raw = <<~HTML HTML # we require explicit HTTPS here html = <<~HTML HTML cooked = PrettyText.cook(raw).strip expect(cooked).to eq(html.strip) end it "can skip relative paths in allowlist iframes" do SiteSetting.allowed_iframes = "https://bob.com/abc/def" raw = <<~HTML HTML html = <<~HTML HTML expect(PrettyText.cook(raw).strip).to eq(html.strip) end it "You can disable linkify" do md = "www.cnn.com test.it http://test.com https://test.ab https://a" cooked = PrettyText.cook(md) html = <<~HTML
www.cnn.com test.it http://test.com https://test.ab https://a
HTML expect(cooked).to eq(html.strip) # notice how cnn.com is no longer linked but it is SiteSetting.markdown_linkify_tlds = "not_com|it" cooked = PrettyText.cook(md) html = <<~HTML
www.cnn.com test.it http://test.com https://test.ab https://a
HTML expect(cooked).to eq(html.strip) # no tlds anymore SiteSetting.markdown_linkify_tlds = "" cooked = PrettyText.cook(md) html = <<~HTML
www.cnn.com test.it http://test.com https://test.ab https://a
HTML expect(cooked).to eq(html.strip) # lastly ... what about no linkify SiteSetting.enable_markdown_linkify = false cooked = PrettyText.cook(md) html = <<~HTML
www.cnn.com test.it http://test.com https://test.ab https://a
HTML end it "has a proper data whitelist on div" do cooked = PrettyText.cook("
test
") expect(cooked).to include("data-theme-a") end it "allowlists lang attribute" do cooked = PrettyText.cook( "
tester
tester
tester", ) expect(cooked).to eq( "
tester
tester
tester", ) end it "allowlists ruby tags" do # read all about ruby chars at: https://en.wikipedia.org/wiki/Ruby_character # basically it is super hard to remember every single rare letter when there are # so many, so ruby tags provide a hint. # html = (<<~MD).strip X 漢 ( ㄏㄢˋ ) MD cooked = PrettyText.cook html expect(cooked).to eq(html) end describe "d-wrap" do it "wraps the [wrap] tag inline" do cooked = PrettyText.cook("[wrap=toc]taco[/wrap]") html = <<~HTML

taco

HTML expect(cooked).to eq(html.strip) cooked = PrettyText.cook("Hello [wrap=toc id=1]taco[/wrap] world") html = <<~HTML
Hello taco world
HTML expect(cooked).to eq(html.strip) end it "wraps the [wrap] tag in block" do # can interfere with parsing SiteSetting.enable_markdown_typographer = true md = <<~MD [wrap=toc id=“a” aa='b"' bb="f'"] taco1 [/wrap] MD cooked = PrettyText.cook(md) html = <<~HTML

taco1

HTML expect(cooked).to eq(html.strip) end it "wraps the [wrap] tag without content" do md = <<~MD [wrap=toc] [/wrap] MD cooked = PrettyText.cook(md) html = <<~HTML
HTML expect(cooked).to eq(html.strip) end it "adds attributes as data-attributes" do cooked = PrettyText.cook("[wrap=toc name=\"single quote's\" id='1\"2']taco[/wrap]") html = <<~HTML

taco

HTML expect(cooked).to eq(html.strip) end it "prevents xss" do cooked = PrettyText.cook('[wrap=toc foo=""]taco[/wrap]') html = <<~HTML

taco

HTML expect(cooked).to eq(html.strip) end it "allows a limited set of attributes chars" do cooked = PrettyText.cook('[wrap=toc fo@"èk-"!io=bar]taco[/wrap]') html = <<~HTML
[wrap=toc fo@"èk-"!io=bar]taco[/wrap]
HTML expect(cooked).to eq(html.strip) end end it "adds anchor links to headings" do cooked = PrettyText.cook("# Hello world") html = <<~HTML
Hello world
HTML expect(cooked).to match_html(html) end describe "customizing markdown-it rules" do it "customizes the markdown-it rules correctly" do cooked = PrettyText.cook("This is some text **bold**", markdown_it_rules: []) expect(cooked).to eq("
This is some text **bold**
") cooked = PrettyText.cook("This is some text **bold**", markdown_it_rules: ["emphasis"]) expect(cooked).to eq("
This is some text bold
") end end describe "enabling/disabling features" do it "allows features to be overridden" do cooked = PrettyText.cook(":grin: @mention", features_override: []) expect(cooked).to eq("
:grin: @mention
") cooked = PrettyText.cook(":grin: @mention", features_override: ["emoji"]) expect(cooked).to eq( "
$\":grin:\"$ @mention
", ) cooked = PrettyText.cook(":grin: @mention", features_override: %w[mentions text-post-process]) expect(cooked).to eq("
:grin: @mention
") end end it "does not amend HTML when scrubbing" do md = <<~MD ~~\n\nhello\n\n~~ MD html = <<~HTML \n
hello
\n HTML cooked = PrettyText.cook(md) expect(cooked.strip).to eq(html.strip) end it "handles deprecations correctly" do Rails .logger .expects(:warn) .once .with("[PrettyText] Deprecation notice: Some deprecation message") PrettyText.v8.eval <<~JS require("discourse-common/lib/deprecated").default("Some deprecation message"); JS end describe "video thumbnails" do before do SiteSetting.authorized_extensions = "mp4|png" @video_upload = Fabricate(:upload, original_filename: "video.mp4", extension: "mp4") end after { Upload.where(original_filename: ["404.png", "#{@video_upload.sha1}.png"]).destroy_all } it "does not link to a thumbnail image if the video source is missing" do Fabricate(:upload, original_filename: "404.png", extension: "png") html = <<~HTML
HTML doc = Nokogiri::HTML5.fragment(html) described_class.add_video_placeholder_image(doc) expect(doc.to_html).to eq(html) end it "links to a thumbnail image if the video source is valid" do thumbnail = Fabricate(:upload, original_filename: "#{@video_upload.sha1}.png", extension: "png") html = <<~HTML
HTML doc = Nokogiri::HTML5.fragment(html) described_class.add_video_placeholder_image(doc) html_with_thumbnail = <<~HTML
HTML expect(doc.to_html).to eq(html_with_thumbnail) end end end