require "minitest/autorun" require "rails-html-sanitizer" require "rails/dom/testing/assertions/dom_assertions" puts Nokogiri::VERSION_INFO class SanitizersTest < Minitest::Test include Rails::Dom::Testing::Assertions::DomAssertions def test_sanitizer_sanitize_raises_not_implemented_error assert_raises NotImplementedError do Rails::Html::Sanitizer.new.sanitize('') end end def test_sanitize_nested_script assert_equal '<script>alert("XSS");</script>', safe_list_sanitize('alert("XSS");/', tags: %w(em)) end def test_sanitize_nested_script_in_style assert_equal '<script>alert("XSS");</script>', safe_list_sanitize('alert("XSS");/', tags: %w(em)) end class XpathRemovalTestSanitizer < Rails::Html::Sanitizer def sanitize(html, options = {}) fragment = Loofah.fragment(html) remove_xpaths(fragment, options[:xpaths]).to_s end end def test_remove_xpaths_removes_an_xpath html = %(

hello

) assert_equal %(

hello

), xpath_sanitize(html, xpaths: %w(.//script)) end def test_remove_xpaths_removes_all_occurrences_of_xpath html = %(

hello

) assert_equal %(

hello

), xpath_sanitize(html, xpaths: %w(.//script)) end def test_remove_xpaths_called_with_faulty_xpath assert_raises Nokogiri::XML::XPath::SyntaxError do xpath_sanitize('

hello

', xpaths: %w(..faulty_xpath)) end end def test_remove_xpaths_called_with_xpath_string assert_equal '', xpath_sanitize('', xpaths: './/a') end def test_remove_xpaths_called_with_enumerable_xpaths assert_equal '', xpath_sanitize('', xpaths: %w(.//a .//span)) end def test_strip_tags_with_quote input = '<" hi' expected = libxml_2_9_14_recovery_lt? ? %{<" hi} : %{ hi} assert_equal(expected, full_sanitize(input)) end def test_strip_invalid_html assert_equal "<<", full_sanitize("<<This is a test.\n\n\n\n

It no longer contains any HTML.

\n} assert_equal expected, full_sanitize(input) end def test_remove_unclosed_tags input = "This is <-- not\n a comment here." expected = libxml_2_9_14_recovery_lt? ? %{This is <-- not\n a comment here.} : %{This is } assert_equal(expected, full_sanitize(input)) end def test_strip_cdata input = "This has a ]]> here." expected = libxml_2_9_14_recovery_lt_bang? ? %{This has a <![CDATA[]]> here.} : %{This has a ]]> here.} assert_equal(expected, full_sanitize(input)) end def test_strip_unclosed_cdata input = "This has an unclosed ]] here..." expected = libxml_2_9_14_recovery_lt_bang? ? %{This has an unclosed <![CDATA[]] here...} : %{This has an unclosed ]] here...} assert_equal(expected, full_sanitize(input)) end def test_strip_blank_string assert_nil full_sanitize(nil) assert_equal "", full_sanitize("") assert_equal " ", full_sanitize(" ") end def test_strip_tags_with_plaintext assert_equal "Don't touch me", full_sanitize("Don't touch me") end def test_strip_tags_with_tags assert_equal "This is a test.", full_sanitize("

This is a test.

") end def test_escape_tags_with_many_open_quotes assert_equal "<<", full_sanitize("<<") end def test_strip_tags_with_sentence assert_equal "This is a test.", full_sanitize("This is a test.") end def test_strip_tags_with_comment assert_equal "This has a here.", full_sanitize("This has a here.") end def test_strip_tags_with_frozen_string assert_equal "Frozen string with no tags", full_sanitize("Frozen string with no tags".freeze) end def test_full_sanitize_respect_html_escaping_of_the_given_string assert_equal 'test\r\nstring', full_sanitize('test\r\nstring') assert_equal '&', full_sanitize('&') assert_equal '&', full_sanitize('&') assert_equal '&amp;', full_sanitize('&amp;') assert_equal 'omg <script>BOM</script>', full_sanitize('omg <script>BOM</script>') end def test_strip_links_with_tags_in_tags expected = "<a href='hello'>all day long</a>" input = "<a href='hello'>all day long</a>" assert_equal expected, link_sanitize(input) end def test_strip_links_with_unclosed_tags assert_equal "", link_sanitize("on my mind\nall day long") end def test_strip_links_leaves_nonlink_tags assert_equal "My mind\nall day long", link_sanitize("My mind\nall day long") end def test_strip_links_with_links assert_equal "0wn3d", link_sanitize("0wn3d") end def test_strip_links_with_linkception assert_equal "Magic", link_sanitize("Magic") end def test_sanitize_form assert_sanitized "
", '' end def test_sanitize_plaintext assert_sanitized "<span>foo</span></plaintext>", "<span>foo</span>" end def test_sanitize_script assert_sanitized "a b c<script language=\"Javascript\">blah blah blah</script>d e f", "a b cblah blah blahd e f" end def test_sanitize_js_handlers raw = %{onthis="do that" <a href="#" onclick="hello" name="foo" onbogus="remove me">hello</a>} assert_sanitized raw, %{onthis="do that" <a href="#" name="foo">hello</a>} end def test_sanitize_javascript_href raw = %{href="javascript:bang" <a href="javascript:bang" name="hello">foo</a>, <span href="javascript:bang">bar</span>} assert_sanitized raw, %{href="javascript:bang" <a name="hello">foo</a>, <span>bar</span>} end def test_sanitize_image_src raw = %{src="javascript:bang" <img src="javascript:bang" width="5">foo</img>, <span src="javascript:bang">bar</span>} assert_sanitized raw, %{src="javascript:bang" <img width="5">foo</img>, <span>bar</span>} end tags = Loofah::HTML5::SafeList::ALLOWED_ELEMENTS - %w(script form) tags.each do |tag_name| define_method "test_should_allow_#{tag_name}_tag" do scope_allowed_tags(tags) do assert_sanitized "start <#{tag_name} title=\"1\" onclick=\"foo\">foo <bad>bar</bad> baz</#{tag_name}> end", %(start <#{tag_name} title="1">foo bar baz</#{tag_name}> end) end end end def test_should_allow_anchors assert_sanitized %(<a href="foo" onclick="bar"><script>baz</script></a>), %(<a href=\"foo\">baz</a>) end def test_video_poster_sanitization scope_allowed_tags(%w(video)) do scope_allowed_attributes %w(src poster) do assert_sanitized %(<video src="videofile.ogg" autoplay poster="posterimage.jpg"></video>), %(<video src="videofile.ogg" poster="posterimage.jpg"></video>) assert_sanitized %(<video src="videofile.ogg" poster=javascript:alert(1)></video>), %(<video src="videofile.ogg"></video>) end end end # RFC 3986, sec 4.2 def test_allow_colons_in_path_component assert_sanitized "<a href=\"./this:that\">foo</a>" end %w(src width height alt).each do |img_attr| define_method "test_should_allow_image_#{img_attr}_attribute" do assert_sanitized %(<img #{img_attr}="foo" onclick="bar" />), %(<img #{img_attr}="foo" />) end end def test_should_handle_non_html assert_sanitized 'abc' end def test_should_handle_blank_text [nil, '', ' '].each { |blank| assert_sanitized blank } end def test_setting_allowed_tags_affects_sanitization scope_allowed_tags %w(u) do |sanitizer| assert_equal '<u></u>', sanitizer.sanitize('<a><u></u></a>') end end def test_setting_allowed_attributes_affects_sanitization scope_allowed_attributes %w(foo) do |sanitizer| input = '<a foo="hello" bar="world"></a>' assert_equal '<a foo="hello"></a>', sanitizer.sanitize(input) end end def test_custom_tags_overrides_allowed_tags scope_allowed_tags %(u) do |sanitizer| input = '<a><u></u></a>' assert_equal '<a></a>', sanitizer.sanitize(input, tags: %w(a)) end end def test_custom_attributes_overrides_allowed_attributes scope_allowed_attributes %(foo) do |sanitizer| input = '<a foo="hello" bar="world"></a>' assert_equal '<a bar="world"></a>', sanitizer.sanitize(input, attributes: %w(bar)) end end def test_should_allow_prune sanitizer = Rails::Html::SafeListSanitizer.new(prune: true) text = '<u>leave me <b>now</b></u>' assert_equal "<u>leave me </u>", sanitizer.sanitize(text, tags: %w(u)) end def test_should_allow_custom_tags text = "<u>foo</u>" assert_equal text, safe_list_sanitize(text, tags: %w(u)) end def test_should_allow_only_custom_tags text = "<u>foo</u> with <i>bar</i>" assert_equal "<u>foo</u> with bar", safe_list_sanitize(text, tags: %w(u)) end def test_should_allow_custom_tags_with_attributes text = %(<blockquote cite="http://example.com/">foo</blockquote>) assert_equal text, safe_list_sanitize(text) end def test_should_allow_custom_tags_with_custom_attributes text = %(<blockquote foo="bar">Lorem ipsum</blockquote>) assert_equal text, safe_list_sanitize(text, attributes: ['foo']) end def test_scrub_style_if_style_attribute_option_is_passed input = '<p style="color: #000; background-image: url(http://www.ragingplatypus.com/i/cam-full.jpg);"></p>' actual = safe_list_sanitize(input, attributes: %w(style)) assert_includes(['<p style="color: #000;"></p>', '<p style="color:#000;"></p>'], actual) end def test_should_raise_argument_error_if_tags_is_not_enumerable assert_raises ArgumentError do safe_list_sanitize('<a>some html</a>', tags: 'foo') end end def test_should_raise_argument_error_if_attributes_is_not_enumerable assert_raises ArgumentError do safe_list_sanitize('<a>some html</a>', attributes: 'foo') end end def test_should_not_accept_non_loofah_inheriting_scrubber scrubber = Object.new def scrubber.scrub(node); node.name = 'h1'; end assert_raises Loofah::ScrubberNotFound do safe_list_sanitize('<a>some html</a>', scrubber: scrubber) end end def test_should_accept_loofah_inheriting_scrubber scrubber = Loofah::Scrubber.new def scrubber.scrub(node); node.name = 'h1'; end html = "<script>hello!</script>" assert_equal "<h1>hello!</h1>", safe_list_sanitize(html, scrubber: scrubber) end def test_should_accept_loofah_scrubber_that_wraps_a_block scrubber = Loofah::Scrubber.new { |node| node.name = 'h1' } html = "<script>hello!</script>" assert_equal "<h1>hello!</h1>", safe_list_sanitize(html, scrubber: scrubber) end def test_custom_scrubber_takes_precedence_over_other_options scrubber = Loofah::Scrubber.new { |node| node.name = 'h1' } html = "<script>hello!</script>" assert_equal "<h1>hello!</h1>", safe_list_sanitize(html, scrubber: scrubber, tags: ['foo']) end [%w(img src), %w(a href)].each do |(tag, attr)| define_method "test_should_strip_#{attr}_attribute_in_#{tag}_with_bad_protocols" do assert_sanitized %(<#{tag} #{attr}="javascript:bang" title="1">boo</#{tag}>), %(<#{tag} title="1">boo</#{tag}>) end end def test_should_block_script_tag assert_sanitized %(<SCRIPT\nSRC=http://ha.ckers.org/xss.js></SCRIPT>), "" end def test_should_not_fall_for_xss_image_hack_with_uppercase_tags assert_sanitized %(<IMG """><SCRIPT>alert("XSS")</SCRIPT>">), %(<img>alert("XSS")"&gt;) end [%(<IMG SRC="javascript:alert('XSS');">), %(<IMG SRC=javascript:alert('XSS')>), %(<IMG SRC=JaVaScRiPt:alert('XSS')>), %(<IMG SRC=javascript:alert(&quot;XSS&quot;)>), %(<IMG SRC=javascript:alert(String.fromCharCode(88,83,83))>), %(<IMG SRC=&#106;&#97;&#118;&#97;&#115;&#99;&#114;&#105;&#112;&#116;&#58;&#97;&#108;&#101;&#114;&#116;&#40;&#39;&#88;&#83;&#83;&#39;&#41;>), %(<IMG SRC=&#0000106&#0000097&#0000118&#0000097&#0000115&#0000099&#0000114&#0000105&#0000112&#0000116&#0000058&#0000097&#0000108&#0000101&#0000114&#0000116&#0000040&#0000039&#0000088&#0000083&#0000083&#0000039&#0000041>), %(<IMG SRC=&#x6A&#x61&#x76&#x61&#x73&#x63&#x72&#x69&#x70&#x74&#x3A&#x61&#x6C&#x65&#x72&#x74&#x28&#x27&#x58&#x53&#x53&#x27&#x29>), %(<IMG SRC="jav\tascript:alert('XSS');">), %(<IMG SRC="jav&#x09;ascript:alert('XSS');">), %(<IMG SRC="jav&#x0A;ascript:alert('XSS');">), %(<IMG SRC="jav&#x0D;ascript:alert('XSS');">), %(<IMG SRC=" &#14; javascript:alert('XSS');">), %(<IMG SRC="javascript&#x3a;alert('XSS');">), %(<IMG SRC=`javascript:alert("RSnake says, 'XSS'")`>)].each do |img_hack| define_method "test_should_not_fall_for_xss_image_hack_#{img_hack}" do assert_sanitized img_hack, "<img>" end end def test_should_sanitize_tag_broken_up_by_null assert_sanitized %(<SCR\0IPT>alert(\"XSS\")</SCR\0IPT>), "" end def test_should_sanitize_invalid_script_tag assert_sanitized %(<SCRIPT/XSS SRC="http://ha.ckers.org/xss.js"></SCRIPT>), "" end def test_should_sanitize_script_tag_with_multiple_open_brackets assert_sanitized %(<<SCRIPT>alert("XSS");//<</SCRIPT>), "&lt;alert(\"XSS\");//&lt;" assert_sanitized %(<iframe src=http://ha.ckers.org/scriptlet.html\n<a), "" end def test_should_sanitize_unclosed_script assert_sanitized %(<SCRIPT SRC=http://ha.ckers.org/xss.js?<B>), "" end def test_should_sanitize_half_open_scripts assert_sanitized %(<IMG SRC="javascript:alert('XSS')"), "<img>" end def test_should_not_fall_for_ridiculous_hack img_hack = %(<IMG\nSRC\n=\n"\nj\na\nv\na\ns\nc\nr\ni\np\nt\n:\na\nl\ne\nr\nt\n(\n'\nX\nS\nS\n'\n)\n"\n>) assert_sanitized img_hack, "<img>" end def test_should_sanitize_attributes assert_sanitized %(<SPAN title="'><script>alert()</script>">blah</SPAN>), %(<span title="#{CGI.escapeHTML "'><script>alert()</script>"}">blah</span>) end def test_should_sanitize_illegal_style_properties raw = %(display:block; position:absolute; left:0; top:0; width:100%; height:100%; z-index:1; background-color:black; background-image:url(http://www.ragingplatypus.com/i/cam-full.jpg); background-x:center; background-y:center; background-repeat:repeat;) expected = %(display:block;width:100%;height:100%;background-color:black;background-x:center;background-y:center;) assert_equal expected, sanitize_css(raw) end def test_should_sanitize_with_trailing_space raw = "display:block; " expected = "display:block;" assert_equal expected, sanitize_css(raw) end def test_should_sanitize_xul_style_attributes raw = %(-moz-binding:url('http://ha.ckers.org/xssmoz.xml#xss')) assert_equal '', sanitize_css(raw) end def test_should_sanitize_invalid_tag_names assert_sanitized(%(a b c<script/XSS src="http://ha.ckers.org/xss.js"></script>d e f), "a b cd e f") end def test_should_sanitize_non_alpha_and_non_digit_characters_in_tags assert_sanitized('<a onclick!#$%&()*~+-_.,:;?@[/|\]^`=alert("XSS")>foo</a>', "<a>foo</a>") end def test_should_sanitize_invalid_tag_names_in_single_tags assert_sanitized('<img/src="http://ha.ckers.org/xss.js"/>', "<img />") end def test_should_sanitize_img_dynsrc_lowsrc assert_sanitized(%(<img lowsrc="javascript:alert('XSS')" />), "<img />") end def test_should_sanitize_div_background_image_unicode_encoded [ convert_to_css_hex("url(javascript:alert(1))", false), convert_to_css_hex("url(javascript:alert(1))", true), convert_to_css_hex("url(https://example.com)", false), convert_to_css_hex("url(https://example.com)", true), ].each do |propval| raw = "background-image:" + propval assert_empty(sanitize_css(raw)) end end def test_should_allow_div_background_image_unicode_encoded_safe_functions [ convert_to_css_hex("rgb(255,0,0)", false), convert_to_css_hex("rgb(255,0,0)", true), ].each do |propval| raw = "background-image:" + propval assert_includes(sanitize_css(raw), "background-image") end end def test_should_sanitize_div_style_expression raw = %(width: expression(alert('XSS'));) assert_equal '', sanitize_css(raw) end def test_should_sanitize_across_newlines raw = %(\nwidth:\nexpression(alert('XSS'));\n) assert_equal '', sanitize_css(raw) end def test_should_sanitize_img_vbscript assert_sanitized %(<img src='vbscript:msgbox("XSS")' />), '<img />' end def test_should_sanitize_cdata_section input = "<![CDATA[<span>section</span>]]>" expected = libxml_2_9_14_recovery_lt_bang? ? %{&lt;![CDATA[<span>section</span>]]&gt;} : %{section]]&gt;} assert_sanitized(input, expected) end def test_should_sanitize_unterminated_cdata_section input = "<![CDATA[<span>neverending..." expected = libxml_2_9_14_recovery_lt_bang? ? %{&lt;![CDATA[<span>neverending...</span>} : %{neverending...} assert_sanitized(input, expected) end def test_should_not_mangle_urls_with_ampersand assert_sanitized %{<a href=\"http://www.domain.com?var1=1&amp;var2=2\">my link</a>} end def test_should_sanitize_neverending_attribute assert_sanitized "<span class=\"\\", "<span class=\"\\\">" end [ %(<a href="javascript&#x3a;alert('XSS');">), %(<a href="javascript&#x003a;alert('XSS');">), %(<a href="javascript&#x3A;alert('XSS');">), %(<a href="javascript&#x003A;alert('XSS');">) ].each_with_index do |enc_hack, i| define_method "test_x03a_handling_#{i+1}" do assert_sanitized enc_hack, "<a>" end end def test_x03a_legitimate assert_sanitized %(<a href="http&#x3a;//legit">), %(<a href="http://legit">) assert_sanitized %(<a href="http&#x3A;//legit">), %(<a href="http://legit">) end def test_sanitize_ascii_8bit_string safe_list_sanitize('<a>hello</a>'.encode('ASCII-8BIT')).tap do |sanitized| assert_equal '<a>hello</a>', sanitized assert_equal Encoding::UTF_8, sanitized.encoding end end def test_sanitize_data_attributes assert_sanitized %(<a href="/blah" data-method="post">foo</a>), %(<a href="/blah">foo</a>) assert_sanitized %(<a data-remote="true" data-type="script" data-method="get" data-cross-domain="true" href="attack.js">Launch the missiles</a>), %(<a href="attack.js">Launch the missiles</a>) end def test_allow_data_attribute_if_requested text = %(<a data-foo="foo">foo</a>) assert_equal %(<a data-foo="foo">foo</a>), safe_list_sanitize(text, attributes: ['data-foo']) end def test_uri_escaping_of_href_attr_in_a_tag_in_safe_list_sanitizer skip if RUBY_VERSION < "2.3" html = %{<a href='examp<!--" unsafeattr=foo()>-->le.com'>test</a>} text = safe_list_sanitize(html) acceptable_results = [ # nokogiri w/vendored+patched libxml2 %{<a href="examp&lt;!--%22%20unsafeattr=foo()&gt;--&gt;le.com">test</a>}, # nokogiri w/ system libxml2 %{<a href="examp<!--%22%20unsafeattr=foo()>-->le.com">test</a>}, ] assert_includes(acceptable_results, text) end def test_uri_escaping_of_src_attr_in_a_tag_in_safe_list_sanitizer skip if RUBY_VERSION < "2.3" html = %{<a src='examp<!--" unsafeattr=foo()>-->le.com'>test</a>} text = safe_list_sanitize(html) acceptable_results = [ # nokogiri w/vendored+patched libxml2 %{<a src="examp&lt;!--%22%20unsafeattr=foo()&gt;--&gt;le.com">test</a>}, # nokogiri w/system libxml2 %{<a src="examp<!--%22%20unsafeattr=foo()>-->le.com">test</a>}, ] assert_includes(acceptable_results, text) end def test_uri_escaping_of_name_attr_in_a_tag_in_safe_list_sanitizer skip if RUBY_VERSION < "2.3" html = %{<a name='examp<!--" unsafeattr=foo()>-->le.com'>test</a>} text = safe_list_sanitize(html) acceptable_results = [ # nokogiri w/vendored+patched libxml2 %{<a name="examp&lt;!--%22%20unsafeattr=foo()&gt;--&gt;le.com">test</a>}, # nokogiri w/system libxml2 %{<a name="examp<!--%22%20unsafeattr=foo()>-->le.com">test</a>}, ] assert_includes(acceptable_results, text) end def test_uri_escaping_of_name_action_in_a_tag_in_safe_list_sanitizer skip if RUBY_VERSION < "2.3" html = %{<a action='examp<!--" unsafeattr=foo()>-->le.com'>test</a>} text = safe_list_sanitize(html, attributes: ['action']) acceptable_results = [ # nokogiri w/vendored+patched libxml2 %{<a action="examp&lt;!--%22%20unsafeattr=foo()&gt;--&gt;le.com">test</a>}, # nokogiri w/system libxml2 %{<a action="examp<!--%22%20unsafeattr=foo()>-->le.com">test</a>}, ] assert_includes(acceptable_results, text) end def test_exclude_node_type_processing_instructions assert_equal("<div>text</div><b>text</b>", safe_list_sanitize("<div>text</div><?div content><b>text</b>")) end def test_exclude_node_type_comment assert_equal("<div>text</div><b>text</b>", safe_list_sanitize("<div>text</div><!-- comment --><b>text</b>")) end %w[text/plain text/css image/png image/gif image/jpeg].each do |mediatype| define_method "test_mediatype_#{mediatype}_allowed" do input = %Q(<img src="data:#{mediatype};base64,PHNjcmlwdD5hbGVydCgnWFNTJyk8L3NjcmlwdD4=">) expected = input actual = safe_list_sanitize(input) assert_equal(expected, actual) input = %Q(<img src="DATA:#{mediatype};base64,PHNjcmlwdD5hbGVydCgnWFNTJyk8L3NjcmlwdD4=">) expected = input actual = safe_list_sanitize(input) assert_equal(expected, actual) end end def test_mediatype_text_html_disallowed input = %q(<img src="data:text/html;base64,PHNjcmlwdD5hbGVydCgnWFNTJyk8L3NjcmlwdD4=">) expected = %q(<img>) actual = safe_list_sanitize(input) assert_equal(expected, actual) input = %q(<img src="DATA:text/html;base64,PHNjcmlwdD5hbGVydCgnWFNTJyk8L3NjcmlwdD4=">) expected = %q(<img>) actual = safe_list_sanitize(input) assert_equal(expected, actual) end def test_mediatype_image_svg_xml_disallowed input = %q(<img src="data:image/svg+xml;base64,PHNjcmlwdD5hbGVydCgnWFNTJyk8L3NjcmlwdD4=">) expected = %q(<img>) actual = safe_list_sanitize(input) assert_equal(expected, actual) input = %q(<img src="DATA:image/svg+xml;base64,PHNjcmlwdD5hbGVydCgnWFNTJyk8L3NjcmlwdD4=">) expected = %q(<img>) actual = safe_list_sanitize(input) assert_equal(expected, actual) end def test_mediatype_other_disallowed input = %q(<a href="data:foo;base64,PHNjcmlwdD5hbGVydCgnWFNTJyk8L3NjcmlwdD4=">foo</a>) expected = %q(<a>foo</a>) actual = safe_list_sanitize(input) assert_equal(expected, actual) input = %q(<a href="DATA:foo;base64,PHNjcmlwdD5hbGVydCgnWFNTJyk8L3NjcmlwdD4=">foo</a>) expected = %q(<a>foo</a>) actual = safe_list_sanitize(input) assert_equal(expected, actual) end def test_scrubbing_svg_attr_values_that_allow_ref input = %Q(<div fill="yellow url(http://bad.com/) #fff">hey</div>) expected = %Q(<div fill="yellow #fff">hey</div>) actual = scope_allowed_attributes %w(fill) do safe_list_sanitize(input) end assert_equal(expected, actual) end def test_style_with_css_payload input, tags = "<style>div > span { background: \"red\"; }</style>", ["style"] expected = "<style>div &gt; span { background: \"red\"; }</style>" actual = safe_list_sanitize(input, tags: tags) assert_equal(expected, actual) end def test_combination_of_select_and_style_with_css_payload input, tags = "<select><style>div > span { background: \"red\"; }</style></select>", ["select", "style"] expected = "<select><style>div &gt; span { background: \"red\"; }</style></select>" actual = safe_list_sanitize(input, tags: tags) assert_equal(expected, actual) end def test_combination_of_select_and_style_with_script_payload input, tags = "<select><style><script>alert(1)</script></style></select>", ["select", "style"] expected = "<select><style>&lt;script&gt;alert(1)&lt;/script&gt;</style></select>" actual = safe_list_sanitize(input, tags: tags) assert_equal(expected, actual) end def test_combination_of_svg_and_style_with_script_payload input, tags = "<svg><style><script>alert(1)</script></style></svg>", ["svg", "style"] expected = "<svg><style>&lt;script&gt;alert(1)&lt;/script&gt;</style></svg>" actual = safe_list_sanitize(input, tags: tags) assert_equal(expected, actual) end def test_combination_of_math_and_style_with_img_payload input, tags = "<math><style><img src=x onerror=alert(1)></style></math>", ["math", "style"] expected = "<math><style>&lt;img src=x onerror=alert(1)&gt;</style></math>" actual = safe_list_sanitize(input, tags: tags) assert_equal(expected, actual) input, tags = "<math><style><img src=x onerror=alert(1)></style></math>", ["math", "style", "img"] expected = "<math><style>&lt;img src=x onerror=alert(1)&gt;</style></math>" actual = safe_list_sanitize(input, tags: tags) assert_equal(expected, actual) end def test_combination_of_svg_and_style_with_img_payload input, tags = "<svg><style><img src=x onerror=alert(1)></style></svg>", ["svg", "style"] expected = "<svg><style>&lt;img src=x onerror=alert(1)&gt;</style></svg>" actual = safe_list_sanitize(input, tags: tags) assert_equal(expected, actual) input, tags = "<svg><style><img src=x onerror=alert(1)></style></svg>", ["svg", "style", "img"] expected = "<svg><style>&lt;img src=x onerror=alert(1)&gt;</style></svg>" actual = safe_list_sanitize(input, tags: tags) assert_equal(expected, actual) end protected def xpath_sanitize(input, options = {}) XpathRemovalTestSanitizer.new.sanitize(input, options) end def full_sanitize(input, options = {}) Rails::Html::FullSanitizer.new.sanitize(input, options) end def link_sanitize(input, options = {}) Rails::Html::LinkSanitizer.new.sanitize(input, options) end def safe_list_sanitize(input, options = {}) Rails::Html::SafeListSanitizer.new.sanitize(input, options) end def assert_sanitized(input, expected = nil) if input assert_dom_equal expected || input, safe_list_sanitize(input) else assert_nil safe_list_sanitize(input) end end def sanitize_css(input) Rails::Html::SafeListSanitizer.new.sanitize_css(input) end def scope_allowed_tags(tags) old_tags = Rails::Html::SafeListSanitizer.allowed_tags Rails::Html::SafeListSanitizer.allowed_tags = tags yield Rails::Html::SafeListSanitizer.new ensure Rails::Html::SafeListSanitizer.allowed_tags = old_tags end def scope_allowed_attributes(attributes) old_attributes = Rails::Html::SafeListSanitizer.allowed_attributes Rails::Html::SafeListSanitizer.allowed_attributes = attributes yield Rails::Html::SafeListSanitizer.new ensure Rails::Html::SafeListSanitizer.allowed_attributes = old_attributes end # note that this is used for testing CSS hex encoding: \\[0-9a-f]{1,6} def convert_to_css_hex(string, escape_parens=false) string.chars.map do |c| if !escape_parens && (c == "(" || c == ")") c else format('\00%02X', c.ord) end end.join end def libxml_2_9_14_recovery_lt? # changed in 2.9.14, see https://github.com/sparklemotion/nokogiri/releases/tag/v1.13.5 Nokogiri.method(:uses_libxml?).arity == -1 && Nokogiri.uses_libxml?(">= 2.9.14") end def libxml_2_9_14_recovery_lt_bang? # changed in 2.9.14, see https://github.com/sparklemotion/nokogiri/releases/tag/v1.13.5 # then reverted in 2.10.0, see https://gitlab.gnome.org/GNOME/libxml2/-/issues/380 Nokogiri.method(:uses_libxml?).arity == -1 && Nokogiri.uses_libxml?("= 2.9.14") end end