<?php

namespace core;

/**
 * HTMLPurifier test case.
 *
 * Exercises purify_html(), is_purify_html_necessary() and format_text() with
 * a range of inputs and compares the cleaned output with the expected text.
 *
 * @package    core
 * @category   test
 * @copyright  2012 Petr Skoda {@link http://skodak.org}
 * @license    http://www.gnu.org/copyleft/gpl.html GNU GPL v3 or later
 */
class htmlpurifier_test extends \basic_testcase {

    /**
     * Verify _blank target is allowed.
     */
    public function test_allow_blank_target() {
        // See MDL-52651 for an explanation as to why the rel="noreferrer" attribute is expected here.
        // Also note we do not need to test links with an existing rel attribute as the HTML Purifier is configured to remove
        // the rel attribute.
        $text = 'Some link';
        $expected = 'Some link';
        $result = format_text($text, FORMAT_HTML);
        $this->assertSame($expected, $result);

        $result = format_text('Some link', FORMAT_HTML);
        $this->assertSame('Some link', $result);
    }

    /**
     * Verify our nolink tag is accepted.
     */
    public function test_nolink() {
        // We can not use format text because nolink changes result.
        $text = "\nno filters\n";
        $result = purify_html($text, []);
        $this->assertSame($text, $result);

        $text = "xxxxx\nxxx\n";
        $result = purify_html($text, []);
        $this->assertSame($text, $result);

        // Ensure nolink doesn't force open tags to be closed, so can be virtually everywhere.
        $text = "\n\nno filters\n\n";
        $result = purify_html($text, []);
        $this->assertSame($text, $result);
    }

    /**
     * Verify our tex tag is accepted.
     */
    public function test_tex() {
        $text = 'a+b=c';
        $result = purify_html($text, []);
        $this->assertSame($text, $result);
    }

    /**
     * Verify our algebra tag is accepted.
     */
    public function test_algebra() {
        $text = 'a+b=c';
        $result = purify_html($text, []);
        $this->assertSame($text, $result);
    }

    /**
     * Verify our hacky multilang works.
     */
    public function test_multilang() {
        $text = 'hmmmhm';
        $result = purify_html($text, []);
        $this->assertSame($text, $result);

        $text = 'hmmmhm';
        $result = purify_html($text, []);
        $this->assertSame($text, $result);

        // This input is expected to be altered by the purifier.
        $text = 'hmmm';
        $result = purify_html($text, []);
        $this->assertNotSame($text, $result);

        // Keep standard lang tags.
        $text = 'asas';
        $result = purify_html($text, []);
        $this->assertSame($text, $result);

        $text = 'xxxxxx';
        $result = purify_html($text, []);
        $this->assertSame($text, $result);
    }

    /**
     * Tests the 'allowid' option for format_text.
     */
    public function test_format_text_allowid() {
        // Start off by not allowing ids (default).
        $options = [
            'allowid' => false,
        ];
        $result = format_text("\nFrog\n", FORMAT_HTML, $options);
        $this->assertSame("\nFrog\n", $result);

        // Now allow ids.
        $options['allowid'] = true;
        $result = format_text("\nFrog\n", FORMAT_HTML, $options);
        $this->assertSame("\nFrog\n", $result);
    }

    /**
     * Verify that purify_html() output follows the $CFG->allowobjectembed setting.
     *
     * The setting must be '0' on entry; it is switched to '1' for one check and
     * then put back to '0' before the final check.
     */
    public function test_allowobjectembed() {
        global $CFG;

        $this->assertSame('0', $CFG->allowobjectembed);

        $text = ' hmmm';
        $result = purify_html($text, []);
        $this->assertSame('hmmm', trim($result));

        $CFG->allowobjectembed = '1';
        try {
            $expected = ' hmmm';
            $result = purify_html($text, []);
            // Line breaks are ignored in this comparison.
            $this->assertSame(str_replace("\n", '', $expected), str_replace("\n", '', $result));
        } finally {
            // Always restore the default so a failed assertion cannot leak the setting into later tests.
            $CFG->allowobjectembed = '0';
        }

        $result = purify_html($text, []);
        $this->assertSame('hmmm', trim($result));
    }

    /**
     * Test if linebreaks kept unchanged.
     */
    public function test_line_breaking() {
        $text = "\n\raa\rsss\nsss\r";
        $this->assertSame($text, purify_html($text));
    }

    /**
     * Test fixing of strict problems.
     */
    public function test_tidy() {
        $text = "\n\nxx";
        $this->assertSame("\n\nxx\n\n", purify_html($text));

        $text = "\n\nxx\n\n";
        $this->assertSame("\n\nxx\n\n", purify_html($text));

        $text = "xx\n";
        $this->assertSame("xx\n", purify_html($text));
    }

    /**
     * Test nesting - this used to cause problems in earlier versions.
     */
    public function test_nested_lists() {
        $text = "";
        $this->assertSame($text, purify_html($text));
    }

    /**
     * Test that XSS protection works, complete smoke tests are in htmlpurifier itself.
     */
    public function test_cleaning_nastiness() {
        $text = "xx";
        $this->assertSame('xx', purify_html($text));

        $text = "\nxx\n";
        $this->assertSame("\nxx\n", purify_html($text));

        $text = "\nxx\n";
        $this->assertSame("\nxx\n", purify_html($text));

        $text = 'xx';
        $this->assertSame('xx', purify_html($text));

        $text = 'xx';
        $this->assertSame('xx', purify_html($text));

        $text = 'xx';
        $this->assertSame('xx', purify_html($text));

        $text = "x\nx";
        $this->assertSame('xx', purify_html($text));
    }

    /**
     * Test internal function used for clean_text() speedup.
     */
    public function test_is_purify_html_necessary() {
        // First our shortcuts.
        $text = "";
        $this->assertFalse(is_purify_html_necessary($text));
        $this->assertSame($text, purify_html($text));

        $text = "666";
        $this->assertFalse(is_purify_html_necessary($text));
        $this->assertSame($text, purify_html($text));

        $text = "abc\ndef \" ' ";
        $this->assertFalse(is_purify_html_necessary($text));
        $this->assertSame($text, purify_html($text));

        $text = "abc\n\n\ndef\n\nefg\n\nhij\n\n";
        $this->assertFalse(is_purify_html_necessary($text));
        $this->assertSame($text, purify_html($text));

        $text = "\nabc\n\n\ndefefghi\nj\n\n";
        $this->assertFalse(is_purify_html_necessary($text));
        $this->assertSame($text, purify_html($text));

        // Now failures.
        $text = " ";
        $this->assertTrue(is_purify_html_necessary($text));

        $text = "Gin & Tonic";
        $this->assertTrue(is_purify_html_necessary($text));

        $text = "Gin > Tonic";
        $this->assertTrue(is_purify_html_necessary($text));

        $text = "Gin < Tonic";
        $this->assertTrue(is_purify_html_necessary($text));

        $text = "\nabc\n";
        $this->assertTrue(is_purify_html_necessary($text));

        $text = "abc";
        $this->assertTrue(is_purify_html_necessary($text));

        $text = "\nabc";
        $this->assertTrue(is_purify_html_necessary($text));

        $text = "\n\nabc\n\n";
        $this->assertTrue(is_purify_html_necessary($text));

        $text = "\n\nabc\n\n";
        $this->assertTrue(is_purify_html_necessary($text));

        $text = "\n\nabc";
        $this->assertTrue(is_purify_html_necessary($text));
    }

    /**
     * Verify which link schemes survive purify_html().
     *
     * Standard and Moodle-specific schemes must come back unchanged, while
     * borked or dangerous ones must be reduced to the bare link text.
     */
    public function test_allowed_schemes() {
        // First standard schemas.
        $text = 'link';
        $this->assertSame($text, purify_html($text));

        $text = 'link';
        $this->assertSame($text, purify_html($text));

        $text = 'link';
        $this->assertSame($text, purify_html($text));

        $text = 'link';
        $this->assertSame($text, purify_html($text));

        $text = 'link';
        $this->assertSame($text, purify_html($text));

        $text = 'link';
        $this->assertSame($text, purify_html($text));

        // Extra schemes allowed in moodle.
        $text = 'link';
        $this->assertSame($text, purify_html($text));

        $text = 'link';
        $this->assertSame($text, purify_html($text));

        $text = 'link';
        $this->assertSame($text, purify_html($text));

        $text = 'link';
        $this->assertSame($text, purify_html($text));

        $text = 'link';
        $this->assertSame($text, purify_html($text));

        $text = 'link';
        $this->assertSame($text, purify_html($text));

        // Now some borked or dangerous schemes.
        $text = 'link';
        $this->assertSame('link', purify_html($text));

        $text = 'link';
        $this->assertSame('link', purify_html($text));
    }

    /**
     * Test non-ascii domain names
     */
    public function test_idn() {
        // Example of domain that gives the same result in IDNA2003 and IDNA2008 .
        $text = 'правительство.рф';
        $expected = 'правительство.рф';
        $this->assertSame($expected, purify_html($text));

        // Examples of deviations from http://www.unicode.org/reports/tr46/#Table_Deviation_Characters .
        $text = 'teßt.de';
        $expected = 'teßt.de';
        $this->assertSame($expected, purify_html($text));

        $text = 'http://βόλος.com';
        $expected = 'http://βόλος.com';
        $this->assertSame($expected, purify_html($text));

        $text = 'http://نامه‌ای.com';
        $expected = 'http://نامه‌ای.com';
        $this->assertSame($expected, purify_html($text));
    }

    /**
     * Tests media tags.
     *
     * @dataProvider media_tags_provider
     * @param string $mediatag HTML media tag
     * @param string $expected expected result
     */
    public function test_media_tags($mediatag, $expected) {
        $actual = format_text($mediatag, FORMAT_MOODLE, ['filter' => false]);
        $this->assertEquals($expected, $actual);
    }

    /**
     * Test cases for the test_media_tags test.
     *
     * @return array data sets keyed by "<prefix>/<attribute>" (or a plain label),
     *               each holding the input markup and the expected output
     */
    public function media_tags_provider() {
        // Takes an array of attributes, then generates a test for each of them.
        // Both templates are sprintf() formats that receive the attribute as their only argument.
        $generatetestcases = static function($prefix, array $attrs, array $templates) {
            $testcases = [];
            foreach ($attrs as $attr) {
                // Array union keeps the first data set should the same attribute be listed twice.
                $testcases += [
                    $prefix . '/' . $attr => [
                        sprintf($templates[0], $attr),
                        sprintf($templates[1], $attr),
                    ],
                ];
            }
            return $testcases;
        };

        $audioattrs = [
            'preload="auto"',
            'autoplay=""',
            'loop=""',
            'muted=""',
            'controls=""',
            'crossorigin="anonymous"',
            'crossorigin="use-credentials"',
        ];
        $videoattrs = [
            'crossorigin="anonymous"',
            'crossorigin="use-credentials"',
            'poster="https://upload.wikimedia.org/wikipedia/en/1/14/Space_jam.jpg"',
            'preload="auto"',
            'autoplay=""',
            'playsinline=""',
            'loop=""',
            'muted=""',
            'controls=""',
            'width="420"',
            'height="69"',
        ];

        // The src attribute has to be appended with array_merge(): the "+" operator on two lists keeps the
        // left-hand value for index 0 and would silently drop the src test case.
        $audioattrswithsrc = array_merge($audioattrs, ['src="http://example.com/jam.wav"']);
        $videoattrswithsrc = array_merge($videoattrs, ['src="http://example.com/prettygood.mp4"']);

        return $generatetestcases('Plain audio', $audioattrswithsrc, [
                '',
                "\n\n",
            ]) + $generatetestcases('Audio with one source', $audioattrs, [
                '',
                "\n" . '' . "\n",
            ]) + $generatetestcases('Audio with multiple sources', $audioattrs, [
                '',
                "\n" . '' . "\n",
            ]) + $generatetestcases('Audio with sources and tracks', $audioattrs, [
                '',
                "\n" . '' . "\n",
            ]) + $generatetestcases('Plain video', $videoattrswithsrc, [
                '',
                "\n",
            ]) + $generatetestcases('Video with illegal subtag', $videoattrswithsrc, [
                '',
                "\n",
            ]) + $generatetestcases('Video with legal subtag', $videoattrswithsrc, [
                '',
                "\n",
            ]) + $generatetestcases('Video inside an inline tag', $videoattrswithsrc, [
                '',
                "\n",
            ]) + $generatetestcases('Video inside a block tag', $videoattrswithsrc, [
                "\n\n",
                "\n\n",
            ]) + $generatetestcases('Source tag without video or audio', $videoattrs, [
                'some text the end',
                "\nsome text the end\n",
            ]) + $generatetestcases('Video with one source', $videoattrs, [
                '',
                "\n" . '' . "\n",
            ]) + $generatetestcases('Video with multiple sources', $videoattrs, [
                '',
                "\n" . '' . "\n",
            // NOTE(review): the next case is labelled "Video" but iterates $audioattrs - confirm whether
            // $videoattrs was intended.
            ]) + $generatetestcases('Video with sources and tracks', $audioattrs, [
                '',
                "\n" . '' . "\n",
            ]) + ['Video with invalid crossorigin' => [
                '',
                "\n" . '' . "\n",
            ]] + ['Audio with invalid crossorigin' => [
                '',
                "\n" . '' . "\n",
            ]] + ['Other attributes' => [
                '',
                "\n" . '' . "\n",
            ]];
    }
}