class FilterUnitTestCase extends BackdropUnitTestCase {
/**
 * Tests the line break filter callback, _filter_autop().
 *
 * Each entry of $tests maps an input string to a list of substrings that
 * must (TRUE) or must not (FALSE) occur in the filtered output; the pairs
 * are evaluated by assertFilteredString(). "\n" escapes are used instead of
 * literal newlines so the expectations stay readable.
 */
function testLineBreakFilter() {
  // Minimal stand-in for a filter object: only the callback is needed.
  $filter = new stdClass();
  $filter->callback = '_filter_autop';

  $tests = array(
    // A single newline becomes <br />, a blank line separates paragraphs.
    "aaa\nbbb\n\nccc" => array(
      "<p>aaa<br />\nbbb</p>\n<p>ccc</p>" => TRUE,
    ),
    // The contents of these block-level elements must come back untouched.
    "<script>aaa\nbbb\n\nccc</script>\n<style>aaa\nbbb\n\nccc</style>\n<pre>aaa\nbbb\n\nccc</pre>\n<object>aaa\nbbb\n\nccc</object>\n<iframe>aaa\nbbb\n\nccc</iframe>\n" => array(
      "<script>aaa\nbbb\n\nccc</script>" => TRUE,
      "<style>aaa\nbbb\n\nccc</style>" => TRUE,
      "<pre>aaa\nbbb\n\nccc</pre>" => TRUE,
      "<object>aaa\nbbb\n\nccc</object>" => TRUE,
      "<iframe>aaa\nbbb\n\nccc</iframe>" => TRUE,
    ),
    // HTML comments, single-line and multi-line, are preserved verbatim.
    "One. <!-- comment --> Two.\n<!--\nThree.\n-->\n" => array(
      '<!-- comment -->' => TRUE,
      "<!--\nThree.\n-->" => TRUE,
    ),
    // Nested block elements must still yield matching paragraph tags.
    '<p><div> </div></p>' => array(
      "<p>\n<div> </div>\n</p>" => TRUE,
    ),
    '<div><p> </p></div>' => array(
      "<div>\n</div>" => TRUE,
    ),
    '<blockquote><pre>aaa</pre></blockquote>' => array(
      "<blockquote><pre>aaa</pre></blockquote>" => TRUE,
    ),
    "<pre>aaa\nbbb\nccc</pre>\nddd\neee" => array(
      "<pre>aaa\nbbb\nccc</pre>" => TRUE,
      "<p>ddd<br />\neee</p>" => TRUE,
    ),
    // Text following a comment is still split into paragraphs.
    "aaa<!--comment-->\n\nbbb\n\nccc\n\nddd<!--comment\nwith line break-->\n\neee\n\nfff" => array(
      "<p>aaa</p>\n<!--comment--><p>\nbbb</p>\n<p>ccc</p>\n<p>ddd</p>" => TRUE,
      "<!--comment\nwith line break--><p>\neee</p>\n<p>fff</p>" => TRUE,
    ),
    // A comment inside <pre> must not re-enable processing inside the <pre>.
    "<pre>aaa\nbbb<!-- comment -->\n\nccc</pre>\nddd" => array(
      "<pre>aaa\nbbb<!-- comment -->\n\nccc</pre>" => TRUE,
    ),
    // An <iframe> must not be wrapped in a paragraph.
    "<iframe>aaa</iframe>\n\n" => array(
      "<p><iframe>aaa</iframe></p>" => FALSE,
    ),
    // Indented content inside block elements: no <br /> directly before the
    // closing tag, and none where a <br> is already present.
    "<h3>\n indented line\n</h3>" => array(
      "<h3>\n indented line\n</h3>" => TRUE,
      "<h3>\n indented line<br />\n</h3>" => FALSE,
    ),
    "<p>\n indented line\n second indented line\n</p>" => array(
      "<p>\n indented line<br />\n second indented line\n</p>" => TRUE,
      "<p>\n indented line<br />\n second indented line<br />\n</p>" => FALSE,
      "<p>\n indented line\n second indented line\n</p>" => FALSE,
    ),
    "<p>\n line before break<br>\n line after break</p>" => array(
      "<p>\n line before break<br />\n line after break</p>" => TRUE,
      "<p>\n line before break<br><br />\n line after break</p>" => FALSE,
      "<p>\n line before break<br /><br />\n line after break</p>" => FALSE,
    ),
  );
  $this->assertFilteredString($filter, $tests);

  // Feed a string as long as the larger of the two PCRE limits. ini_get()
  // returns strings, so normalize to an integer length explicitly.
  $limit = (int) max(ini_get('pcre.backtrack_limit'), ini_get('pcre.recursion_limit'));
  $source = $this->randomName($limit);
  $result = _filter_autop($source);
  $success = $this->assertEqual($result, '<p>' . $source . "</p>\n", 'Line break filter can process very long strings.');
  if (!$success) {
    // Dump both strings to the verbose log to help diagnose the failure.
    $this->verbose("\n" . $source . "\n<hr />\n" . $result);
  }
}
/**
 * Tests filter_xss() against a catalogue of XSS evasion techniques.
 *
 * Every case feeds one crafted string to filter_xss() (optionally with a
 * list of allowed tags) and asserts, after entity decoding and lowercasing
 * (see assertNoNormalized()), that the dangerous token is absent from the
 * output. The final cases check that harmless text and entities survive.
 */
function testFilterXSS() {
  // Tag stripping: ways of sneaking a disallowed tag past the filter.
  $f = filter_xss('<script>alert(0)</script>');
  $this->assertNoNormalized($f, 'script', 'HTML tag stripping -- simple script without special characters.');

  $f = filter_xss('<script src="" />');
  $this->assertNoNormalized($f, 'script', 'HTML tag stripping -- empty script with source.');

  $f = filter_xss('<ScRipt sRc=>');
  $this->assertNoNormalized($f, 'script', 'HTML tag stripping evasion -- varying case.');

  $f = filter_xss("<script\nsrc\n=\n\n>");
  $this->assertNoNormalized($f, 'script', 'HTML tag stripping evasion -- multiline tag.');

  $f = filter_xss('<script/a src=></script>');
  $this->assertNoNormalized($f, 'script', 'HTML tag stripping evasion -- non whitespace character after tag name.');

  $f = filter_xss('<script/src=></script>');
  $this->assertNoNormalized($f, 'script', 'HTML tag stripping evasion -- no space between tag and attribute.');

  // Only the tail "ipt" is checked because the NUL bytes split the tag name.
  $f = filter_xss("<\0scr\0ipt>alert(0)</script>");
  $this->assertNoNormalized($f, 'ipt', 'HTML tag stripping evasion -- breaking HTML with nulls.');

  $f = filter_xss("<scrscriptipt src=>");
  $this->assertNoNormalized($f, 'script', 'HTML tag stripping evasion -- filter just removing "script".');

  $f = filter_xss('<<script>alert(0);//<</script>');
  $this->assertNoNormalized($f, 'script', 'HTML tag stripping evasion -- double opening brackets.');

  $f = filter_xss('<script src=<b>');
  $this->assertNoNormalized($f, 'script', 'HTML tag stripping evasion -- no closing tag.');

  $f = filter_xss('<script>>');
  $this->assertNoNormalized($f, 'script', 'HTML tag stripping evasion -- double closing tag.');

  $f = filter_xss('<script src=//>');
  $this->assertNoNormalized($f, 'script', 'HTML tag stripping evasion -- no scheme or ending slash.');

  $f = filter_xss('<script src=');
  $this->assertNoNormalized($f, 'script', 'HTML tag stripping evasion -- no closing bracket.');

  $f = filter_xss('<script src= <');
  $this->assertNoNormalized($f, 'script', 'HTML tag stripping evasion -- opening instead of closing bracket.');

  $f = filter_xss('<nosuchtag attribute="newScriptInjectionVector">');
  $this->assertNoNormalized($f, 'nosuchtag', 'HTML tag stripping evasion -- unknown tag.');

  $f = filter_xss('<?xml:namespace ns="urn:schemas-microsoft-com:time">');
  $this->assertTrue(stripos($f, '<?xml') === FALSE, 'HTML tag stripping evasion -- starting with a question sign (processing instructions).');

  $f = filter_xss('<t:set attributeName="innerHTML" to="<script defer>alert(0)</script>">');
  $this->assertNoNormalized($f, 't:set', 'HTML tag stripping evasion -- colon in the tag name (namespaces\' tricks).');

  $f = filter_xss('<img """><script>alert(0)</script>', array('img'));
  $this->assertNoNormalized($f, 'script', 'HTML tag stripping evasion -- a malformed image tag.');

  $f = filter_xss('<blockquote><script>alert(0)</script></blockquote>', array('blockquote'));
  $this->assertNoNormalized($f, 'script', 'HTML tag stripping evasion -- script in a blockquote.');

  $f = filter_xss("<!--[if true]><script>alert(0)</script><![endif]-->");
  $this->assertNoNormalized($f, 'script', 'HTML tag stripping evasion -- script within a comment.');

  // Attribute removal: event handlers and style on otherwise allowed tags.
  $f = filter_xss('<p onmouseover="">', array('p'));
  $this->assertNoNormalized($f, 'onmouseover', 'HTML filter attributes removal -- events, no evasion.');

  $f = filter_xss('<li style="list-style-image: url(javascript:alert(0))">', array('li'));
  $this->assertNoNormalized($f, 'style', 'HTML filter attributes removal -- style, no evasion.');

  $f = filter_xss('<img onerror   =alert(0)>', array('img'));
  $this->assertNoNormalized($f, 'onerror', 'HTML filter attributes removal evasion -- spaces before equals sign.');

  $f = filter_xss('<img onabort!#$%&()*~+-_.,:;?@[/|\]^`=alert(0)>', array('img'));
  $this->assertNoNormalized($f, 'onabort', 'HTML filter attributes removal evasion -- non alphanumeric characters before equals sign.');

  $f = filter_xss('<img oNmediAError=alert(0)>', array('img'));
  $this->assertNoNormalized($f, 'onmediaerror', 'HTML filter attributes removal evasion -- varying case.');

  $f = filter_xss("<img o\0nfocus\0=alert(0)>", array('img'));
  $this->assertNoNormalized($f, 'focus', 'HTML filter attributes removal evasion -- breaking with nulls.');

  // Scheme clearing: dangerous URL schemes inside attribute values.
  $f = filter_xss('<img src="javascript:alert(0)">', array('img'));
  $this->assertNoNormalized($f, 'javascript', 'HTML scheme clearing -- no evasion.');

  $f = filter_xss('<img src=javascript:alert(0)>', array('img'));
  $this->assertNoNormalized($f, 'javascript', 'HTML scheme clearing evasion -- no quotes.');

  $f = filter_xss('<img src="javascript:confirm(0)">', array('img'));
  $this->assertNoNormalized($f, 'javascript', 'HTML scheme clearing evasion -- no alert ;)');

  $f = filter_xss('<img src=`javascript:alert(0)`>', array('img'));
  $this->assertNoNormalized($f, 'javascript', 'HTML scheme clearing evasion -- grave accents.');

  $f = filter_xss('<img dynsrc="javascript:alert(0)">', array('img'));
  $this->assertNoNormalized($f, 'javascript', 'HTML scheme clearing -- rare attribute.');

  $f = filter_xss('<table background="javascript:alert(0)">', array('table'));
  $this->assertNoNormalized($f, 'javascript', 'HTML scheme clearing -- another tag.');

  $f = filter_xss('<base href="javascript:alert(0);//">', array('base'));
  $this->assertNoNormalized($f, 'javascript', 'HTML scheme clearing -- one more attribute and tag.');

  $f = filter_xss('<img src="jaVaSCriPt:alert(0)">', array('img'));
  $this->assertNoNormalized($f, 'javascript', 'HTML scheme clearing evasion -- varying case.');

  // "javascript:alert(0)" spelled entirely with numeric character
  // references: decimal, zero-padded decimal without semicolons, and hex.
  $f = filter_xss('<img src=&#106;&#97;&#118;&#97;&#115;&#99;&#114;&#105;&#112;&#116;&#58;&#97;&#108;&#101;&#114;&#116;&#40;&#48;&#41;>', array('img'));
  $this->assertNoNormalized($f, 'javascript', 'HTML scheme clearing evasion -- UTF-8 decimal encoding.');

  $f = filter_xss('<img src=&#0000106&#0000097&#0000118&#0000097&#0000115&#0000099&#0000114&#0000105&#0000112&#0000116&#0000058&#0000097&#0000108&#0000101&#0000114&#0000116&#0000040&#0000048&#0000041>', array('img'));
  $this->assertNoNormalized($f, 'javascript', 'HTML scheme clearing evasion -- long UTF-8 encoding.');

  $f = filter_xss('<img src=&#x6A&#x61&#x76&#x61&#x73&#x63&#x72&#x69&#x70&#x74&#x3A&#x61&#x6C&#x65&#x72&#x74&#x28&#x30&#x29>', array('img'));
  $this->assertNoNormalized($f, 'javascript', 'HTML scheme clearing evasion -- UTF-8 hex encoding.');

  // Whitespace and control characters splitting the scheme name, both raw
  // and as character references.
  $f = filter_xss("<img src=\"jav\tascript:alert(0)\">", array('img'));
  $this->assertNoNormalized($f, 'script', 'HTML scheme clearing evasion -- an embedded tab.');

  $f = filter_xss('<img src="jav&#x09;ascript:alert(0)">', array('img'));
  $this->assertNoNormalized($f, 'script', 'HTML scheme clearing evasion -- an encoded, embedded tab.');

  $f = filter_xss('<img src="jav&#x0A;ascript:alert(0)">', array('img'));
  $this->assertNoNormalized($f, 'script', 'HTML scheme clearing evasion -- an encoded, embedded newline.');

  $f = filter_xss('<img src="jav&#x0D;ascript:alert(0)">', array('img'));
  $this->assertNoNormalized($f, 'script', 'HTML scheme clearing evasion -- an encoded, embedded carriage return.');

  $f = filter_xss("<img src=\"\n\n\nj\na\nva\ns\ncript:alert(0)\">", array('img'));
  $this->assertNoNormalized($f, 'cript', 'HTML scheme clearing evasion -- broken into many lines.');

  $f = filter_xss("<img src=\"jav\0a\0\0cript:alert(0)\">", array('img'));
  $this->assertNoNormalized($f, 'cript', 'HTML scheme clearing evasion -- embedded nulls.');

  $f = filter_xss('<img src=" &#14;  javascript:alert(0)">', array('img'));
  $this->assertNoNormalized($f, 'javascript', 'HTML scheme clearing evasion -- spaces and metacharacters before scheme.');

  $f = filter_xss('<img src="vbscript:msgbox(0)">', array('img'));
  $this->assertNoNormalized($f, 'vbscript', 'HTML scheme clearing evasion -- another scheme.');

  $f = filter_xss('<img src="nosuchscheme:notice(0)">', array('img'));
  $this->assertNoNormalized($f, 'nosuchscheme', 'HTML scheme clearing evasion -- unknown scheme.');

  $f = filter_xss('<br size="&{alert(0)}">', array('br'));
  $this->assertNoNormalized($f, 'alert', 'Netscape 4.x javascript entities.');

  // Invalid and overlong UTF-8 byte sequences.
  $f = filter_xss("<p arg=\"\xe0\">\" style=\"background-image: url(javascript:alert(0));\"\xe0<p>", array('p'));
  $this->assertNoNormalized($f, 'style', 'HTML filter -- invalid UTF-8.');

  $f = filter_xss("\xc0aaa");
  $this->assertEqual($f, '', 'HTML filter -- overlong UTF-8 sequences.');

  // Numeric entities at increasing levels of encoding. assertNormalized()
  // decodes the output once, so each expectation is one level below its
  // input.
  $f = filter_xss("Who&#039;s Online");
  $this->assertNormalized($f, "who's online", 'HTML filter -- html entity number');

  $f = filter_xss("Who&amp;#039;s Online");
  $this->assertNormalized($f, "who&#039;s online", 'HTML filter -- encoded html entity number');

  $f = filter_xss("Who&amp;amp;#039; Online");
  $this->assertNormalized($f, "who&amp;#039; online", 'HTML filter -- double encoded html entity number');
}
/**
 * Tests _filter_html() with a typical allowed-tags configuration.
 *
 * Tags and attributes outside the 'allowed_html' list must disappear from
 * the output, while the custom element <test-element>, which is on the
 * list, must be kept.
 */
function testHtmlFilter() {
  // Minimal stand-in for a filter object: only the settings are needed.
  $filter = new stdClass();
  $filter->settings = array(
    'allowed_html' => '<a> <em> <strong> <cite> <blockquote> <code> <ul> <ol> <li> <dl> <dt> <dd> <h3> <h4> <h5> <p> <test-element>',
    'filter_html_help' => 1,
    'filter_html_nofollow' => 0,
  );

  // Tags that are not in the allowed list.
  $f = _filter_html('<script />', $filter);
  $this->assertNoNormalized($f, 'script', 'HTML filter should always remove script tags.');

  $f = _filter_html('<iframe />', $filter);
  $this->assertNoNormalized($f, 'iframe', 'HTML filter should always remove iframe tags.');

  $f = _filter_html('<object />', $filter);
  $this->assertNoNormalized($f, 'object', 'HTML filter should always remove object tags.');

  $f = _filter_html('<style />', $filter);
  $this->assertNoNormalized($f, 'style', 'HTML filter should always remove style tags.');

  $f = _filter_html('<img />', $filter);
  $this->assertNoNormalized($f, 'img', 'HTML filter should remove img tags on default.');

  // Look for "input" here: searching for "img" could never fail on this
  // input and therefore verified nothing.
  $f = _filter_html('<input />', $filter);
  $this->assertNoNormalized($f, 'input', 'HTML filter should remove input tags on default.');

  // Attributes that must be dropped even on allowed tags.
  $f = _filter_html('<p style="display: none;" />', $filter);
  $this->assertNoNormalized($f, 'style', 'HTML filter should remove style attribute on default.');

  $f = _filter_html('<p onerror="alert(0);" />', $filter);
  $this->assertNoNormalized($f, 'onerror', 'HTML filter should remove on* attributes on default.');

  $f = _filter_html('<code onerror>&nbsp;</code>', $filter);
  $this->assertNoNormalized($f, 'onerror', 'HTML filter should remove empty on* attributes on default.');

  // A hyphenated custom element that is explicitly allowed.
  $f = _filter_html('<test-element></test-element>', $filter);
  $this->assertNormalized($f, 'test-element', 'HTML filter should allow custom elements.');
}
/**
 * Tests the rel="nofollow" spam deterrent of _filter_html().
 *
 * With 'filter_html_nofollow' enabled and only <a> allowed, every link in
 * the output must carry rel="nofollow", however the anchor tag is spelled
 * and even when the input supplies its own rel attribute.
 */
function testNoFollowFilter() {
  // Minimal stand-in for a filter object: only the settings are needed.
  $filter = new stdClass();
  $filter->settings = array(
    'allowed_html' => '<a>',
    'filter_html_help' => 1,
    'filter_html_nofollow' => 1,
  );

  $f = _filter_html('<a href="">text</a>', $filter);
  $this->assertNormalized($f, 'rel="nofollow"', 'Spam deterrent -- no evasion.');

  $f = _filter_html('<A href="">text</a>', $filter);
  $this->assertNormalized($f, 'rel="nofollow"', 'Spam deterrent evasion -- capital A.');

  $f = _filter_html("<a/href=\"\">text</a>", $filter);
  $this->assertNormalized($f, 'rel="nofollow"', 'Spam deterrent evasion -- non whitespace character after tag name.');

  $f = _filter_html("<\0a\0 href=\"\">text</a>", $filter);
  $this->assertNormalized($f, 'rel="nofollow"', 'Spam deterrent evasion -- some nulls.');

  // A user-supplied rel value must be replaced, not kept alongside.
  $f = _filter_html('<a href="" rel="follow">text</a>', $filter);
  $this->assertNoNormalized($f, 'rel="follow"', 'Spam deterrent evasion -- with rel set - rel="follow" removed.');
  $this->assertNormalized($f, 'rel="nofollow"', 'Spam deterrent evasion -- with rel set - rel="nofollow" added.');
}
/**
 * Tests that filter_xss_admin() still removes the most dangerous tags.
 */
function testFilterXSSAdmin() {
  $f = filter_xss_admin('<object />');
  $this->assertNoNormalized($f, 'object', 'Admin HTML filter -- should not allow object tag.');

  $f = filter_xss_admin('<script />');
  $this->assertNoNormalized($f, 'script', 'Admin HTML filter -- should not allow script tag.');

  // The input consists solely of forbidden tags, so nothing may remain.
  $f = filter_xss_admin('<style /><iframe /><frame /><frameset /><meta /><link /><embed /><applet /><param /><layer />');
  $this->assertEqual($f, '', 'Admin HTML filter -- should never allow some tags.');
}
/**
 * Tests the HTML escaping filter callback, _filter_html_escape().
 *
 * The expectations require that markup and quotes come back as entities and
 * that the leading and trailing whitespace of the input is not present in
 * the output.
 */
function testHtmlEscapeFilter() {
  // Minimal stand-in for a filter object: only the callback is needed.
  $filter = new stdClass();
  $filter->callback = '_filter_html_escape';

  $tests = array(
    " One. <!-- \"comment\" --> Two'.\n<p>Three.</p>\n " => array(
      // Markup, double quotes and the apostrophe are all entity-encoded.
      "One. &lt;!-- &quot;comment&quot; --&gt; Two&#039;.\n&lt;p&gt;Three.&lt;/p&gt;" => TRUE,
      // Surrounding whitespace must not be present in the output.
      ' One.' => FALSE,
      "</p>\n " => FALSE,
    ),
  );
  $this->assertFilteredString($filter, $tests);
}
/**
 * Tests the URL filter callback, _filter_url().
 *
 * Builds several $tests tables (input text => substrings expected or not
 * expected in the output) and runs each through assertFilteredString(),
 * first with 'filter_url_length' set to 496 and finally with 20.
 *
 * NOTE(review): in this copy of the file many test inputs and expectations
 * look truncated (empty href values, missing URLs, unterminated arrays).
 * Verify the literals against the upstream test before relying on them.
 */
function testUrlFilter() {
// Minimal stand-in for a filter object: callback plus settings.
$filter = new stdClass();
$filter->callback = '_filter_url';
$filter->settings = array(
'filter_url_length' => 496,
// Fixtures for the e-mail cases: one value built from 254 repeated
// characters, one from 255. NOTE(review): the domain parts appear to be
// missing from these literals — confirm.
$long_email = str_repeat('a', 254) . '';
$too_long_email = str_repeat('b', 255) . '';
$email_with_plus_sign = '';
$tests = array(
' or
' => array(
'<a href=""></a>' => TRUE,
'<a href=""></a>' => TRUE,
' or or ' . $email_with_plus_sign . ' or ' . $long_email . ' but not ' . $too_long_email . '
' => array(
'<a href=""></a>' => TRUE,
'<a href=""></a>' => TRUE,
'<a href="mailto:' . $long_email . '">' . $long_email . '</a>' => TRUE,
'<a href="mailto:' . $too_long_email . '">' . $too_long_email . '</a>' => FALSE,
'<a href="mailto:' . $email_with_plus_sign . '">' . $email_with_plus_sign . '</a>' => TRUE,
' or[baz]=beer#fragment or[baz]=beer#fragment!/example/status/22376963142324226
' => array(
'<a href=""></a>' => TRUE,
'<a href=""></a>' => TRUE,
'<a href="[baz]=beer#fragment">[baz]=beer#fragment</a>' => TRUE,
'<a href="[baz]=beer#fragment">[baz]=beer#fragment</a>' => TRUE,
'<a href="!/example/status/22376963142324226">!/example/status/22376963142324226</a>' => TRUE,
'<a href=""></a>' => TRUE,
'<a href="sftp://user@nonstandardport:222/dir">sftp://user@nonstandardport:222/dir</a>' => TRUE,
'<a href="ssh://">ssh://</a>' => TRUE,
' => array(
'<a href=""></a>' => TRUE,
'<a href=""></a>' => TRUE,
// cspell:disable-next-line
www.ex.ex or www.example.example or www.toolongdomainexampledomainexampledomainexampledomainexampledomain or
' => array(
'<a href="http://www.ex.ex">www.ex.ex</a>' => TRUE,
'<a href="http://www.example.example">www.example.example</a>' => TRUE,
'http://www.toolong' => FALSE,
'<a href=""></a>' => TRUE,
not foo://
' => array(
'href=""' => TRUE,
'href=""' => TRUE,
'href="news://"' => TRUE,
'href="telnet://example"' => TRUE,
'href="irc://"' => TRUE,
'href="ssh://odd.geek"' => TRUE,
'href="s"' => TRUE,
'href="webcal://calendar"' => TRUE,
'href="rtsp://"' => TRUE,
'href="foo://"' => FALSE,
'not foo://' => TRUE,
$this->assertFilteredString($filter, $tests);
$tests = array(
Partial URL with trailing period
Email with trailing comma,
Absolute URL with trailing question
Query string with trailing exclamation!
Partial URL with 3 trailing www.partial.periods...
Email with 3 trailing!!!
Absolute URL and query string with 2 different punctuation characters (
' => array(
'period <a href=""></a>.' => TRUE,
'comma <a href=""></a>,' => TRUE,
'question <a href=""></a>?' => TRUE,
'exclamation <a href=""></a>!' => TRUE,
'trailing <a href="http://www.partial.periods">www.partial.periods</a>...' => TRUE,
'trailing <a href=""></a>!!!' => TRUE,
'characters (<a href=""></a>).' => TRUE,
' => array(
'(<a href=""></a>)' => TRUE,
$this->assertFilteredString($filter, $tests);
$tests = array(
<p xmlns="" />
<p xmlns="">
An <a href="" title="Read more at">anchor</a>.
' => array(
'<p xmlns="" />' => TRUE,
'<p xmlns="">' => TRUE,
'href=""' => FALSE,
'href=""' => FALSE,
'An <a href="" title="Read more at">anchor</a>.' => TRUE,
Not <a href="foo"></a> or <a href=""></a>
but <strong></strong> or <em></em>
' => array(
'<a href="foo"></a>' => TRUE,
'href=""' => FALSE,
'<a href=""></a>' => TRUE,
'<strong><a href=""></a></strong>' => TRUE,
'<em><a href=""></a></em>' => TRUE,
Test <code>using the code tag</code>.
' => array(
'href' => FALSE,
'http' => FALSE,
Quoted text linking to, written by, originating from <code>@see or <em></em> bla bla</code>.
' => array(
'href=""' => TRUE,
'href=""' => TRUE,
'href=""' => TRUE,
'' => FALSE,
'' => FALSE,
'Intro.' => TRUE,
'Outro.' => TRUE,
Unknown tag <x>containing x and</x>? And a tag <pooh>beginning with p and containing www.example.pooh with p?</pooh>
' => array(
'href=""' => TRUE,
'href="http://www.example.pooh"' => TRUE,
<p>Test <br/>: This is a example <strong>with</strong> various tags. *<br/>
It is important to *<br/>test different URLs and in the same paragraph. *<br>
HTML soup by can literally contain *img*<img> anything. Just a with thrown in. from with extra
' => array(
'href=""' => TRUE,
'href=""' => TRUE,
'href=""' => TRUE,
'href=""' => TRUE,
'href=""' => TRUE,
'href=""' => TRUE,
'href=""' => TRUE,
'href=""' => TRUE,
'href=""' => TRUE,
'href=""' => TRUE,
'href=""' => TRUE,
'href=""' => TRUE,
// @see
var exampleUrl = "";
// @see
var exampleUrl = "";
' => array(
'href=""' => FALSE,
'href=""' => FALSE,
<style>body {
background: url(;
' => array(
'href' => FALSE,
<!-- Skip any URLs like in comments -->
' => array(
'href' => FALSE,
<!-- Skip any URLs like with a newline in comments -->
' => array(
'href' => FALSE,
<!-- Skip any URLs like in comments. <p>Also ignore http://commented.out/markup.</p> -->
' => array(
'href' => FALSE,
<dd>Some text around by</dd>
' => array(
'href=""' => TRUE,
'href=""' => TRUE,
'href=""' => TRUE,
'href=""' => TRUE,
'href=""' => TRUE,
'href=""' => TRUE,
<li class="odd"></li>
' => array(
'<div><a href=""></a></div>' => TRUE,
'<li><a href=""></a></li>' => TRUE,
'<li class="odd"><a href=""></a></li>' => TRUE,
<p class="nolink"></p>
<p class="no-link"></p>
<span class="link nolink button"></span>
<div id="divitis" class="nolink" alt="Alt text"></div>
<p class="nolink"></p>
<p class="nolink2"></p>
<span class="link nolink button"></span>
<div id="divitis" class="nolink" alt="Alt text"></div>
' => array(
'<p class="nolink"><a href=""></a></p>' => FALSE,
'<p class="no-link"><a href=""></a></p>' => TRUE,
'<span class="link nolink button"><a href=""></a></span>' => FALSE,
'<div id="divitis" class="nolink" alt="Alt text"><a href=""></a></div>' => FALSE,
'<p class="nolink"><a href=""></a></p>' => FALSE,
'<p class="nolink2"><a href=""></a></p>' => TRUE,
'<span class="link nolink button"><a href=""></a></span>' => FALSE,
'<div id="divitis" class="nolink" alt="Alt text"><a href=""></a></div>' => FALSE,
$this->assertFilteredString($filter, $tests);
$filter->settings['filter_url_length'] = 20;
$tests = array(
'' => array(
'<a href=""></a>' => TRUE,
$this->assertFilteredString($filter, $tests);
/**
 * Asserts that filtered text does or does not contain given substrings.
 *
 * @param object $filter
 *   Filter object whose 'callback' property names the function to invoke.
 *   The callback is called as callback($source, $filter).
 * @param array $tests
 *   Associative array keyed by the source string to filter. Each value is
 *   an array whose keys are substrings to look for in the filtered result
 *   and whose values are TRUE if the substring must be present or FALSE if
 *   it must be absent.
 */
function assertFilteredString($filter, $tests) {
  // The callback is the same for every source, so resolve it once.
  $function = $filter->callback;

  foreach ($tests as $source => $tasks) {
    $result = $function($source, $filter);

    foreach ($tasks as $value => $is_expected) {
      // PHP converts numeric-looking array keys to integers; strpos() needs
      // a string needle to search for the text rather than misinterpret it.
      $found = strpos($result, (string) $value) !== FALSE;

      // assertIdentical() is deliberately not used; a plain boolean check
      // on the strpos() outcome is easier to read.
      $template = $is_expected ? '@source: @value found.' : '@source: @value not found.';
      $message = format_string($template, array(
        '@source' => var_export($source, TRUE),
        '@value' => var_export($value, TRUE),
      ));
      $success = $this->assertTrue($is_expected ? $found : !$found, $message);

      if (!$success) {
        // Dump source, result and needle to the verbose log for debugging.
        $this->verbose('Source:<pre>' . check_plain(var_export($source, TRUE)) . '</pre>'
          . '<hr />Result:<pre>' . check_plain(var_export($result, TRUE)) . '</pre>'
          . '<hr />' . ($is_expected ? 'Expected:' : 'Not expected:')
          . '<pre>' . check_plain(var_export($value, TRUE)) . '</pre>'
        );
      }
    }
  }
}
/**
 * Tests _filter_url() on a complete HTML document.
 *
 * Reads the fixture pair filter.url-input.txt / filter.url-output.txt from
 * the filter module's tests directory and requires the filtered input to be
 * identical to the stored output.
 */
function testUrlFilterContent() {
  // Minimal stand-in for a filter object: only the settings are needed.
  $filter = new stdClass();
  $filter->settings = array(
    'filter_url_length' => 496,
  );

  $path = backdrop_get_path('module', 'filter') . '/tests';
  $input = file_get_contents($path . '/filter.url-input.txt');
  $expected = file_get_contents($path . '/filter.url-output.txt');

  $result = _filter_url($input, $filter);
  $this->assertIdentical($result, $expected, 'Complex HTML document was correctly processed.');
}
/**
 * Tests the image alignment filter callback, _filter_image_align().
 *
 * The expectations require data-align values of right, left and center to
 * become align-* classes (appended to any existing class), the data-align
 * attribute to be removed, and the value "bottom" to produce no class.
 */
function testImageAlignFilter() {
  // Minimal stand-in for a filter object: only the callback is needed.
  $filter = new stdClass();
  $filter->callback = '_filter_image_align';

  // The heredoc body and its terminator stay at column 0 so the literal is
  // valid on every PHP version.
  $input = <<<EOF
<p><img src="foo.png" width="100" height="100" data-align="right" /></p>
<p><img src="foo.png" width="100" height="100" data-align="left" /></p>
<p><img src="foo.png" width="100" height="100" data-align="center" /></p>
<p><img src="foo.png" width="100" height="100" data-align="bottom" /></p>
<p><img src="foo.png" class="foo" data-align="right" /></p>
<blockquote data-align="left">
A quote
</blockquote>
<p class="foo" data-align="center">
Centered paragraph.
</p>
EOF;

  $tests = array(
    $input => array(
      '<img src="foo.png" width="100" height="100" class="align-right" />' => TRUE,
      '<img src="foo.png" width="100" height="100" class="align-left" />' => TRUE,
      '<img src="foo.png" width="100" height="100" class="align-center" />' => TRUE,
      // "bottom" yields no class; the attribute is simply dropped.
      '<img src="foo.png" width="100" height="100" />' => TRUE,
      '<img src="foo.png" width="100" height="100" class="align-bottom" />' => FALSE,
      // An existing class is kept and the alignment class is appended.
      '<img src="foo.png" class="foo align-right" />' => TRUE,
      // Elements other than images are handled as well.
      '<blockquote class="align-left">' => TRUE,
      '<p class="foo align-center">' => TRUE,
      // The output must remain a fragment without a document wrapper.
      '<body>' => FALSE,
    ),
  );
  $this->assertFilteredString($filter, $tests);
}
/**
 * Tests the image caption filter callback, _filter_image_caption().
 *
 * The expectations require an <img> with a data-caption attribute to be
 * wrapped in <figure class="caption caption-img"> with a <figcaption>,
 * link and bold markup in the caption to be kept, and a <div> in the
 * caption to be stripped down to its text.
 */
function testImageAlignCaption() {
  // Minimal stand-in for a filter object: only the callback is needed.
  $filter = new stdClass();
  $filter->callback = '_filter_image_caption';

  // Markup inside data-caption is entity-encoded; raw quotes or angle
  // brackets would end the attribute value early. The heredoc body and its
  // terminator stay at column 0 so the literal is valid on every PHP
  // version.
  $input = <<<EOF
<img data-caption="Simple caption" src="foo.png" />
<img data-caption="The caption with a &lt;a href=&quot;/foo&quot;&gt; link&lt;/a&gt;.&lt;strong&gt; Bold tag.&lt;/strong&gt;" src="foo.png" />
<img data-caption="The caption with a &lt;div&gt;not allowed tag&lt;/div&gt;." src="foo.png" />
EOF;

  $tests = array(
    $input => array(
      '<figure class="caption caption-img"><img src="foo.png" /><figcaption>Simple caption</figcaption></figure>' => TRUE,
      '<figure class="caption caption-img"><img src="foo.png" /><figcaption>The caption with a <a href="/foo"> link</a>.<strong> Bold tag.</strong></figcaption></figure>' => TRUE,
      // The <div> is removed but its text content stays.
      '<figure class="caption caption-img"><img src="foo.png" /><figcaption>The caption with a not allowed tag.</figcaption></figure>' => TRUE,
      '<figure class="caption caption-img"><img src="foo.png" /><figcaption>The caption with a <div>not allowed tag</div>.</figcaption></figure>' => FALSE,
      // The output must remain a fragment without a document wrapper.
      '<body>' => FALSE,
    ),
  );
  $this->assertFilteredString($filter, $tests);
}
/**
 * Tests the HTML corrector, _filter_htmlcorrector().
 *
 * Each case passes a markup fragment to _filter_htmlcorrector() and compares
 * the return value with the expected corrected markup using assertEqual().
 *
 * NOTE(review): the expectation strings of the CDATA cases at the end of
 * this method look truncated in this copy (unterminated literals and calls).
 * Verify them against the upstream test before relying on them.
 */
function testHtmlCorrectorFilter() {
// Unclosed tags are closed.
$f = _filter_htmlcorrector('<p>text');
$this->assertEqual($f, '<p>text</p>', 'HTML corrector -- tag closing at the end of input.');
$f = _filter_htmlcorrector('<p>text<p><p>text');
$this->assertEqual($f, '<p>text</p><p></p><p>text</p>', 'HTML corrector -- tag closing.');
$f = _filter_htmlcorrector("<ul><li>e1<li>e2");
$this->assertEqual($f, "<ul><li>e1</li><li>e2</li></ul>", 'HTML corrector -- unclosed list tags.');
$f = _filter_htmlcorrector('<div id="d">content');
$this->assertEqual($f, '<div id="d">content</div>', 'HTML corrector -- unclosed tag with attribute.');
// Void elements get an XHTML-style closing slash.
$f = _filter_htmlcorrector('<hr><br>');
$this->assertEqual($f, '<hr /><br />', 'HTML corrector -- XHTML closing slash.');
// Tag names are lowercased.
$f = _filter_htmlcorrector('<P>test</P>');
$this->assertEqual($f, '<p>test</p>', 'HTML corrector -- Convert uppercased tags to proper lowercased ones.');
$f = _filter_htmlcorrector('<P>test</p>');
$this->assertEqual($f, '<p>test</p>', 'HTML corrector -- Convert uppercased tags to proper lowercased ones.');
// Well-formed XHTML passes through, with spacing before the slash normalized.
$f = _filter_htmlcorrector('test<hr />');
$this->assertEqual($f, 'test<hr />', 'HTML corrector -- Let proper XHTML pass through.');
$f = _filter_htmlcorrector('test<hr/>');
$this->assertEqual($f, 'test<hr />', 'HTML corrector -- Let proper XHTML pass through, but ensure there is a single space before the closing slash.');
$f = _filter_htmlcorrector('test<hr />');
$this->assertEqual($f, 'test<hr />', 'HTML corrector -- Let proper XHTML pass through, but ensure there are not too many spaces before the closing slash.');
$f = _filter_htmlcorrector('<span class="test" />');
$this->assertEqual($f, '<span class="test"></span>', 'HTML corrector -- Convert XHTML that is properly formed but that would not be compatible with typical HTML user agents.');
// Single (void) tags are closed automatically.
$f = _filter_htmlcorrector('test1<br class="test">test2');
$this->assertEqual($f, 'test1<br class="test" />test2', 'HTML corrector -- Automatically close single tags.');
$f = _filter_htmlcorrector('line1<hr>line2');
$this->assertEqual($f, 'line1<hr />line2', 'HTML corrector -- Automatically close single tags.');
$f = _filter_htmlcorrector('line1<HR>line2');
$this->assertEqual($f, 'line1<hr />line2', 'HTML corrector -- Automatically close single tags.');
$f = _filter_htmlcorrector('<img src="">test</img>');
$this->assertEqual($f, '<img src="" />test', 'HTML corrector -- Automatically close single tags.');
$f = _filter_htmlcorrector('<br></br>');
$this->assertEqual($f, '<br />', "HTML corrector -- Transform empty tags to a single closed tag if the tag's content model is EMPTY.");
$f = _filter_htmlcorrector('<div></div>');
$this->assertEqual($f, '<div></div>', "HTML corrector -- Do not transform empty tags to a single closed tag if the tag's content model is not EMPTY.");
// Block-level elements are moved out of <p>, and bad nesting is repaired.
$f = _filter_htmlcorrector('<p>line1<br/><hr/>line2</p>');
$this->assertEqual($f, '<p>line1<br /></p><hr />line2', 'HTML corrector -- Move non-inline elements outside of inline containers.');
$f = _filter_htmlcorrector('<p>line1<div>line2</div></p>');
$this->assertEqual($f, '<p>line1</p><div>line2</div>', 'HTML corrector -- Move non-inline elements outside of inline containers.');
// The strings below are single-quoted, so \n is a literal backslash + n.
$f = _filter_htmlcorrector('<p>test<p>test</p>\n');
$this->assertEqual($f, '<p>test</p><p>test</p>\n', 'HTML corrector -- Auto-close improperly nested tags.');
$f = _filter_htmlcorrector('<p>Line1<br><STRONG>bold stuff</b>');
$this->assertEqual($f, '<p>Line1<br /><strong>bold stuff</strong></p>', 'HTML corrector -- Properly close unclosed tags, and remove useless closing tags.');
// HTML comments, including multi-line ones containing markup, stay as they are.
$f = _filter_htmlcorrector('test <!-- this is a comment -->');
$this->assertEqual($f, 'test <!-- this is a comment -->', 'HTML corrector -- Do not touch HTML comments.');
$f = _filter_htmlcorrector('test <!--this is a comment-->');
$this->assertEqual($f, 'test <!--this is a comment-->', 'HTML corrector -- Do not touch HTML comments.');
$f = _filter_htmlcorrector('test <!-- comment <p>another
<strong>multiple</strong> line
comment</p> -->');
$this->assertEqual($f, 'test <!-- comment <p>another
<strong>multiple</strong> line
comment</p> -->', 'HTML corrector -- Do not touch HTML comments.');
$f = _filter_htmlcorrector('test <!-- comment <p>another comment</p> -->');
$this->assertEqual($f, 'test <!-- comment <p>another comment</p> -->', 'HTML corrector -- Do not touch HTML comments.');
$f = _filter_htmlcorrector('test <!--break-->');
$this->assertEqual($f, 'test <!--break-->', 'HTML corrector -- Do not touch HTML comments.');
$f = _filter_htmlcorrector('<p>test\n</p>\n');
$this->assertEqual($f, '<p>test\n</p>\n', 'HTML corrector -- New-lines are accepted and kept as-is.');
// Non-ASCII (Arabic) text must come back unchanged.
$f = _filter_htmlcorrector('<p>دروبال');
$this->assertEqual($f, '<p>دروبال</p>', 'HTML corrector -- Encoding is correctly kept.');
// <script> and <style> contents are expected to be wrapped in CDATA markers.
$f = _filter_htmlcorrector('<script type="text/javascript">alert("test")</script>');
$this->assertEqual($f, '<script type="text/javascript">
<!--//--><![CDATA[// ><!--
</script>', 'HTML corrector -- CDATA added to script element');
$f = _filter_htmlcorrector('<p><script type="text/javascript">alert("test")</script></p>');
$this->assertEqual($f, '<p><script type="text/javascript">
<!--//--><![CDATA[// ><!--
</script></p>', 'HTML corrector -- CDATA added to a nested script element');
$f = _filter_htmlcorrector('<p><style> /* Styling */ body {color:red}</style></p>');
$this->assertEqual($f, '<p><style>
<!--/*--><![CDATA[/* ><!--*/
/* Styling */ body {color:red}
</style></p>', 'HTML corrector -- CDATA added to a style element.');
$filtered_data = _filter_htmlcorrector('<p><style>
/* Styling */
body {color:red}
$this->assertEqual($filtered_data, '<p><style>
<!--/*--><![CDATA[/* ><!--*/
/* Styling */
body {color:red}
format_string('HTML corrector -- Existing cdata section @pattern_name properly escaped', array('@pattern_name' => '/*<![CDATA[*/'))
$filtered_data = _filter_htmlcorrector('<p><style>
<!--/*--><![CDATA[/* ><!--*/
/* Styling */
body {color:red}
$this->assertEqual($filtered_data, '<p><style>
<!--/*--><![CDATA[/* ><!--*/
<!--/*--><![CDATA[/* ><!--*/
/* Styling */
body {color:red}
format_string('HTML corrector -- Existing cdata section @pattern_name properly escaped', array('@pattern_name' => '<!--/*--><![CDATA[/* ><!--*/'))
$filtered_data = _filter_htmlcorrector('<p><script type="text/javascript">
<!--//--><![CDATA[// ><!--
$this->assertEqual($filtered_data, '<p><script type="text/javascript">
<!--//--><![CDATA[// ><!--
<!--//--><![CDATA[// ><!--
format_string('HTML corrector -- Existing cdata section @pattern_name properly escaped', array('@pattern_name' => '<!--//--><![CDATA[// ><!--'))
$filtered_data = _filter_htmlcorrector('<p><script type="text/javascript">
// <![CDATA[
// ]]>
$this->assertEqual($filtered_data, '<p><script type="text/javascript">
<!--//--><![CDATA[// ><!--
// <![CDATA[
// ]]]]><![CDATA[>
format_string('HTML corrector -- Existing cdata section @pattern_name properly escaped', array('@pattern_name' => '// <![CDATA['))
/**
 * Asserts that a text contains a needle after normalization.
 *
 * The haystack is passed through decode_entities() and strtolower() before
 * the search, so the needle should be given in lowercase, decoded form.
 *
 * @param string $haystack
 *   Text to search in.
 * @param string $needle
 *   Text that must occur in the normalized haystack.
 * @param string $message
 *   Assertion message.
 * @param string $group
 *   Assertion group.
 *
 * @return
 *   The return value of assertTrue().
 */
function assertNormalized($haystack, $needle, $message = '', $group = 'Other') {
  $normalized = strtolower(decode_entities($haystack));
  return $this->assertTrue(strpos($normalized, $needle) !== FALSE, $message, $group);
}
/**
 * Asserts that a text does not contain a needle after normalization.
 *
 * The haystack is passed through decode_entities() and strtolower() before
 * the search, so the needle should be given in lowercase, decoded form.
 *
 * @param string $haystack
 *   Text to search in.
 * @param string $needle
 *   Text that must not occur in the normalized haystack.
 * @param string $message
 *   Assertion message.
 * @param string $group
 *   Assertion group.
 *
 * @return
 *   The return value of assertTrue().
 */
function assertNoNormalized($haystack, $needle, $message = '', $group = 'Other') {
  $normalized = strtolower(decode_entities($haystack));
  return $this->assertTrue(strpos($normalized, $needle) === FALSE, $message, $group);
}