'Filter administration functionality',
      'description' => 'Thoroughly test the administrative interface of the filter module.',
      'group' => 'Filter',
    );
  }

  /**
   * Test filter administration functionality.
   *
   * Walks through the text format administration pages as an administrator
   * (changing the default format, editing the allowed tags, reordering filters,
   * adding and deleting a format), then posts a node as a regular user, and
   * finally reverts the settings that were changed.
   */
  function testFilterAdmin() {
    // URL filter.
    $first_filter = 2;
    // Line filter.
    $second_filter = 1;

    // Create users.
    $admin_user = $this->drupalCreateUser(array('administer filters'));
    $web_user = $this->drupalCreateUser(array('create page content'));
    $this->drupalLogin($admin_user);

    list($filtered, $full) = $this->checkFilterFormats();

    // Change default filter.
    $edit = array();
    $edit['default'] = $full;
    $this->drupalPost('admin/settings/formats', $edit, t('Save changes'));
    $this->assertText(t('Default format updated.'), t('Default filter updated successfully.'));
    $this->assertNoRaw('admin/settings/formats/delete/' . $full, t('Delete link not found.'));

    // Add an additional tag.
    // NOTE(review): the allowed-tags value below is a single space although the
    // assertions talk about an added tag; the markup looks like it was lost
    // when this file was extracted -- confirm against the canonical file.
    $edit = array();
    $edit['allowed_html_1'] = ' ';
    $this->drupalPost('admin/settings/formats/' . $filtered . '/configure', $edit, t('Save configuration'));
    $this->assertText(t('The configuration options have been saved.'), t('Allowed HTML tag added.'));
    $this->assertRaw(htmlentities($edit['allowed_html_1']), t('Tag displayed.'));

    // Saving the configuration is expected to leave {cache_filter} empty.
    $result = db_query('SELECT * FROM {cache_filter}')->fetchObject();
    $this->assertFalse($result, t('Cache cleared.'));

    // Reorder filters.
    $edit = array();
    $edit['weights[filter/' . $second_filter . ']'] = 1;
    $edit['weights[filter/' . $first_filter . ']'] = 2;
    $this->drupalPost('admin/settings/formats/' . $filtered . '/order', $edit, t('Save configuration'));
    $this->assertText(t('The filter ordering has been saved.'), t('Order saved successfully.'));

    // Collect only the two filters under test, in stored weight order.
    $result = db_query('SELECT * FROM {filter} WHERE format = :format ORDER BY weight ASC', array(':format' => $filtered));
    $filters = array();
    foreach ($result as $filter) {
      if ($filter->delta == $second_filter || $filter->delta == $first_filter) {
        $filters[] = $filter;
      }
    }
    $this->assertTrue(($filters[0]->delta == $second_filter && $filters[1]->delta == $first_filter), t('Order confirmed.'));

    // Add filter.
    $edit = array();
    $edit['name'] = $this->randomName();
    $edit['roles[2]'] = TRUE;
    $edit['filters[filter/' . $second_filter . ']'] = TRUE;
    $edit['filters[filter/' . $first_filter . ']'] = TRUE;
    $this->drupalPost('admin/settings/formats/add', $edit, t('Save configuration'));
    $this->assertRaw(t('Added text format %format.', array('%format' => $edit['name'])), t('New filter created.'));

    // getFilter() hands back the result of fetchObject(), which is FALSE (not
    // NULL) when no row matches, so test for emptiness instead of NULL.
    $format = $this->getFilter($edit['name']);
    $this->assertTrue(!empty($format), t('Format found in database.'));

    if (!empty($format)) {
      $this->assertFieldByName('roles[2]', '', t('Role found.'));
      $this->assertFieldByName('filters[filter/' . $second_filter . ']', '', t('Line break filter found.'));
      $this->assertFieldByName('filters[filter/' . $first_filter . ']', '', t('Url filter found.'));

      // Delete new filter.
      $this->drupalPost('admin/settings/formats/delete/' . $format->format, array(), t('Delete'));
      $this->assertRaw(t('Deleted text format %format.', array('%format' => $edit['name'])), t('Format successfully deleted.'));
    }

    // Change default filter back.
    $edit = array();
    $edit['default'] = $filtered;
    $this->drupalPost('admin/settings/formats', $edit, t('Save changes'));
    $this->assertText(t('Default format updated.'), t('Default filter updated successfully.'));
    $this->assertNoRaw('admin/settings/formats/delete/' . $filtered, t('Delete link not found.'));

    // Allow authenticated users on full HTML.
    $edit = array();
    $edit['roles[2]'] = TRUE;
    $this->drupalPost('admin/settings/formats/' . $full, $edit, t('Save configuration'));
    $this->assertText(t('The text format settings have been updated.'), t('Full HTML format successfully updated.'));

    // Switch user.
    $this->drupalLogout();
    $this->drupalLogin($web_user);

    $this->drupalGet('node/add/page');
    // NOTE(review): the raw string asserted here is empty; presumably it was
    // markup identifying the Full HTML option -- confirm.
    $this->assertRaw('', t('Full HTML filter accessible.'));

    // Use filtered HTML and see if it removes tags that are not allowed.
    $body = $this->randomName();
    $extra_text = 'text';

    $edit = array();
    $edit['title'] = $this->randomName();
    $edit['body[0][value]'] = $body . '' . $extra_text . '';
    $edit['body[0][value_format]'] = $filtered;
    $this->drupalPost('node/add/page', $edit, t('Save'));
    $this->assertRaw(t('Page %title has been created.', array('%title' => $edit['title'])), t('Filtered node created.'));

    $node = $this->drupalGetNodeByTitle($edit['title']);
    $this->assertTrue($node, t('Node found in database.'));

    $this->drupalGet('node/' . $node->nid);
    $this->assertText($body . $extra_text, t('Filter removed invalid tag.'));

    // Switch user.
    $this->drupalLogout();
    $this->drupalLogin($admin_user);

    // Clean up.
    // Allowed tags.
    $edit = array();
    $edit['allowed_html_1'] = ' ';
    $this->drupalPost('admin/settings/formats/' . $filtered . '/configure', $edit, t('Save configuration'));
    $this->assertText(t('The configuration options have been saved.'), t('Changes reverted.'));

    // Full HTML.
    $edit = array();
    $edit['roles[2]'] = FALSE;
    $this->drupalPost('admin/settings/formats/' . $full, $edit, t('Save configuration'));
    $this->assertText(t('The text format settings have been updated.'), t('Full HTML format successfully reverted.'));

    // Filter order.
    $edit = array();
    $edit['weights[filter/' . $second_filter . ']'] = 2;
    $edit['weights[filter/' . $first_filter . ']'] = 1;
    $this->drupalPost('admin/settings/formats/' . $filtered . '/order', $edit, t('Save configuration'));
    $this->assertText(t('The filter ordering has been saved.'), t('Order successfully reverted.'));
  }

  /**
   * Query the database to get the two basic formats.
   *
   * Looks the formats up by their names, 'Filtered HTML' and 'Full HTML'.
   *
   * @return
   *   An array containing filtered and full filter ids, in that order. An id is
   *   -1 when no format with the corresponding name exists.
   */
  function checkFilterFormats() {
    $result = db_query('SELECT format, name FROM {filter_format}');

    $filtered = -1;
    $full = -1;
    foreach ($result as $format) {
      if ($format->name == 'Filtered HTML') {
        $filtered = $format->format;
      }
      elseif ($format->name == 'Full HTML') {
        $full = $format->format;
      }
    }

    return array($filtered, $full);
  }

  /**
   * Get filter by name.
   *
   * @param $name
   *   Name of filter to find.
   * @return
   *   The matching {filter_format} row as an object. This is the result of
   *   fetchObject(), which is FALSE when no row matches.
   */
  function getFilter($name) {
    return db_query("SELECT * FROM {filter_format} WHERE name = :name", array(':name' => $name))->fetchObject();
  }
}

/**
 * Tests the individual core filters by calling the filter functions directly.
 *
 * NOTE(review): many string literals passed to the filter functions in this
 * class are empty or whitespace-only even though the assertion messages next to
 * them describe specific markup (script tags, attributes, entities). They look
 * like they lost their HTML when this file was extracted; confirm against the
 * canonical file before relying on these tests. In particular, the empty
 * needles given to substr_count() are rejected by PHP.
 */
class FilterTestCase extends DrupalWebTestCase {
  protected $format;

  public static function getInfo() {
    return array(
      'name' => 'Core filters',
      'description' => 'Filter each filter individually: Convert URLs into links, Convert line breaks, Correct broken HTML, Escape all HTML, Limit allowed HTML tags.',
      'group' => 'Filter',
    );
  }

  /**
   * Logs in a user who may administer filters and create page content.
   */
  function setUp() {
    parent::setUp();

    $admin_user = $this->drupalCreateUser(array('administer filters', 'create page content'));
    $this->drupalLogin($admin_user);
  }

  /**
   * Test the line break filter.
   */
  function testLineBreakFilter() {
    // Single line breaks should be changed to line break tags, while paragraphs
    // separated with double line breaks should be enclosed in paragraph tags.
    $f = _filter_autop("aaa\nbbb\n\nccc");
    $this->assertEqual(str_replace("\n", '', $f), "aaa bbb ccc", t('Line breaking basic case.'));

    // Text within some contexts should not be processed.
    $f = _filter_autop("");
    $this->assertEqual($f, "", t('Line breaking -- do not break scripts.'));

    $f = _filter_autop(' ');
    $this->assertEqual(substr_count($f, ''), substr_count($f, ''), t('Make sure line breaking produces matching paragraph tags.'));

    $f = _filter_autop(' ');
    $this->assertEqual(substr_count($f, ''), substr_count($f, ''), t('Make sure line breaking produces matching paragraph tags.'));

    $f = _filter_autop('aaa');
    $this->assertEqual(substr_count($f, ''), substr_count($f, ''), t('Make sure line breaking produces matching paragraph tags.'));

    // Feed the filter a string as long as the larger of the two PCRE limits to
    // check that it still returns output.
    $limit = max(ini_get('pcre.backtrack_limit'), ini_get('pcre.recursion_limit'));
    $f = _filter_autop($this->randomName($limit));
    $this->assertNotEqual($f, '', t('Make sure line breaking can process long strings.'));
  }

  /**
   * Test limiting allowed tags, XSS prevention and adding 'nofollow' to links.
   *
   * XSS tests assume that script is disallowed by default and src is allowed
   * by default, but on* and style are disallowed.
   *
   * Script injection vectors mostly adopted from http://ha.ckers.org/xss.html.
   *
   * Relevant CVEs:
   * - CVE-2002-1806, ~CVE-2005-0682, ~CVE-2005-2106, CVE-2005-3973,
   *   CVE-2006-1226 (= rev. 1.112?), CVE-2008-0273, CVE-2008-3740.
   */
  function testHtmlFilter() {
    // Tag stripping, different ways to work around removal of HTML tags.
    $f = filter_xss('');
    $this->assertNoNormalized($f, 'script', t('HTML tag stripping -- simple script without special characters.'));

    $f = filter_xss('');
    $this->assertNoNormalized($f, 'script', t('HTML tag stripping evasion -- non whitespace character after tag name.'));

    $f = filter_xss('');
    $this->assertNoNormalized($f, 'script', t('HTML tag stripping evasion -- no space between tag and attribute.'));

    // Null between < and tag name works at least with IE6.
    $f = filter_xss("<\0scr\0ipt>alert(0)");
    $this->assertNoNormalized($f, 'ipt', t('HTML tag stripping evasion -- breaking HTML with nulls.'));

    $f = filter_xss("");
    $this->assertNoNormalized($f, 'script', t('HTML tag stripping evasion -- filter just removing "script".'));

    $f = filter_xss('<');
    $this->assertNoNormalized($f, 'script', t('HTML tag stripping evasion -- double opening brackets.'));

    $f = filter_xss('', array('img'));
    $this->assertNoNormalized($f, 'script', t('HTML tag stripping evasion -- a malformed image tag.'));

    $f = filter_xss('', array('blockquote'));
    $this->assertNoNormalized($f, 'script', t('HTML tag stripping evasion -- script in a blockqoute.'));

    $f = filter_xss("");
    $this->assertNoNormalized($f, 'script', t('HTML tag stripping evasion -- script within a comment.'));

    // Dangerous attributes removal.
    $f = filter_xss('', array('p'));
    $this->assertNoNormalized($f, 'onmouseover', t('HTML filter attributes removal -- events, no evasion.'));

    $f = filter_xss(' ', array('li'));
    $this->assertNoNormalized($f, 'style', t('HTML filter attributes removal -- style, no evasion.'));

    $f = filter_xss('', array('img'));
    $this->assertNoNormalized($f, 'onerror', t('HTML filter attributes removal evasion -- spaces before equals sign.'));

    $f = filter_xss('', array('img'));
    $this->assertNoNormalized($f, 'onabort', t('HTML filter attributes removal evasion -- non alphanumeric characters before equals sign.'));

    $f = filter_xss('', array('img'));
    $this->assertNoNormalized($f, 'onmediaerror', t('HTML filter attributes removal evasion -- varying case.'));

    // Works at least with IE6.
    $f = filter_xss("", array('img'));
    $this->assertNoNormalized($f, 'focus', t('HTML filter attributes removal evasion -- breaking with nulls.'));

    // Only whitelisted scheme names allowed in attributes.
    $f = filter_xss('', array('img'));
    $this->assertNoNormalized($f, 'javascript', t('HTML scheme clearing -- no evasion.'));

    $f = filter_xss('', array('img'));
    $this->assertNoNormalized($f, 'javascript', t('HTML scheme clearing evasion -- no quotes.'));

    // A bit like CVE-2006-0070.
    $f = filter_xss('', array('img'));
    $this->assertNoNormalized($f, 'javascript', t('HTML scheme clearing evasion -- no alert ;)'));

    $f = filter_xss('', array('img'));
    $this->assertNoNormalized($f, 'javascript', t('HTML scheme clearing evasion -- grave accents.'));

    $f = filter_xss('', array('img'));
    $this->assertNoNormalized($f, 'javascript', t('HTML scheme clearing -- rare attribute.'));

    $f = filter_xss('', array('table'));
    $this->assertNoNormalized($f, 'javascript', t('HTML scheme clearing -- another tag.'));

    $f = filter_xss('', array('base'));
    $this->assertNoNormalized($f, 'javascript', t('HTML scheme clearing -- one more attribute and tag.'));

    $f = filter_xss('', array('img'));
    $this->assertNoNormalized($f, 'javascript', t('HTML scheme clearing evasion -- varying case.'));

    $f = filter_xss('', array('img'));
    $this->assertNoNormalized($f, 'javascript', t('HTML scheme clearing evasion -- UTF-8 decimal encoding.'));

    $f = filter_xss('', array('img'));
    $this->assertNoNormalized($f, 'javascript', t('HTML scheme clearing evasion -- long UTF-8 encoding.'));

    $f = filter_xss('', array('img'));
    $this->assertNoNormalized($f, 'javascript', t('HTML scheme clearing evasion -- UTF-8 hex encoding.'));

    $f = filter_xss("", array('img'));
    $this->assertNoNormalized($f, 'script', t('HTML scheme clearing evasion -- an embedded tab.'));

    $f = filter_xss('', array('img'));
    $this->assertNoNormalized($f, 'script', t('HTML scheme clearing evasion -- an encoded, embedded tab.'));

    $f = filter_xss('', array('img'));
    $this->assertNoNormalized($f, 'script', t('HTML scheme clearing evasion -- an encoded, embedded newline.'));

    // With this test would fail, but the entity gets turned into
    // , so it's OK.
    // NOTE(review): the entity names seem to be missing from the comment above;
    // presumably it refers to the encoded carriage return tested next -- confirm.
    $f = filter_xss('', array('img'));
    $this->assertNoNormalized($f, 'script', t('HTML scheme clearing evasion -- an encoded, embedded carriage return.'));

    $f = filter_xss("", array('img'));
    $this->assertNoNormalized($f, 'cript', t('HTML scheme clearing evasion -- broken into many lines.'));

    $f = filter_xss("", array('img'));
    $this->assertNoNormalized($f, 'cript', t('HTML scheme clearing evasion -- embedded nulls.'));

    $f = filter_xss('', array('img'));
    $this->assertNoNormalized($f, 'javascript', t('HTML scheme clearing evasion -- spaces and metacharacters before scheme.'));

    $f = filter_xss('', array('img'));
    $this->assertNoNormalized($f, 'vbscript', t('HTML scheme clearing evasion -- another scheme.'));

    $f = filter_xss('', array('img'));
    $this->assertNoNormalized($f, 'nosuchscheme', t('HTML scheme clearing evasion -- unknown scheme.'));

    // Netscape 4.x javascript entities.
    $f = filter_xss(' ', array('br'));
    $this->assertNoNormalized($f, 'alert', t('Netscape 4.x javascript entities.'));

    // DRUPAL-SA-2008-006: Invalid UTF-8, these only work as reflected XSS with
    // Internet Explorer 6.
    $f = filter_xss("\" style=\"background-image: url(javascript:alert(0));\"\xe0 ", array('p'));
    $this->assertNoNormalized($f, 'style', t('HTML filter -- invalid UTF-8.'));

    $f = filter_xss("\xc0aaa");
    $this->assertEqual($f, '', t('HTML filter -- overlong UTF-8 sequences.'));

    $f = filter_xss("Who's Online");
    $this->assertNormalized($f, "who's online", t('HTML filter -- html entity number'));

    $f = filter_xss("Who's Online");
    $this->assertNormalized($f, "who's online", t('HTML filter -- encoded html entity number'));

    $f = filter_xss("Who&#039; Online");
    $this->assertNormalized($f, "who' online", t('HTML filter -- double encoded html entity number'));
  }

  /**
   * Test filter settings, defaults, access restrictions and similar.
   *
   * @todo This is for functions like filter_filter and check_markup, whose
   *   functionality is not completely focused on filtering. Some ideas:
   *   restricting formats according to user permissions, proper cache
   *   handling, defaults -- allowed tags/attributes/protocols.
   *
   * @todo It is possible to add script, iframe etc. to allowed tags, but this
   *   makes HTML filter completely ineffective.
   *
   * @todo Class, id, name and xmlns should be added to disallowed attributes,
   *   or better a whitelist approach should be used for that too.
   */
  function testFilter() {
    // Check that access restriction really works.

    // HTML filter is not able to secure some tags, these should never be
    // allowed.
    $f = filter_filter('process', 0, 'no_such_format', '', 'f');
    $this->assertEqual($f, '', t('Converting URLs -- do not process scripts.'));

    // Addresses in attributes should not be converted.
    $f = _filter_url(' ', 'f');
    $this->assertEqual($f, ' ', t('Converting URLs -- do not convert addresses in attributes.'));

    $f = _filter_url('text', 'f');
    $this->assertEqual($f, 'text', t('Converting URLs -- do not break existing links with custom title attribute.'));

    // Even though a dot at the end of a URL can indicate a fully qualified
    // domain name, such usage is rare compared to using a link at the end
    // of a sentence, so remove the dot from the link.
    // @todo It can also be used at the end of a filename or a query string.
    $f = _filter_url('www.example.com.', 'f');
    $this->assertEqual($f, 'www.example.com.', t('Converting URLs -- do not recognize a dot at the end of a domain name (FQDNs).'));

    $f = _filter_url('http://www.example.com.', 'f');
    $this->assertEqual($f, 'http://www.example.com.', t('Converting URLs -- do not recognize a dot at the end of an URL (FQDNs).'));

    $f = _filter_url('www.example.com/index.php?a=.', 'f');
    $this->assertEqual($f, 'www.example.com/index.php?a=.', t('Converting URLs -- do forget about a dot at the end of a query string.'));
  }

  /**
   * Test the HTML corrector.
   *
   * @todo This test could really use some validity checking function.
   */
  function testHtmlCorrector() {
    // Tag closing.
    $f = _filter_htmlcorrector(' text');
    $this->assertEqual($f, ' text', t('HTML corrector -- tag closing at the end of input.'));

    $f = _filter_htmlcorrector('text text');
    $this->assertEqual($f, ' text text', t('HTML corrector -- tag closing.'));

    $f = _filter_htmlcorrector("e1 e2");
    $this->assertEqual($f, "e1 e2", t('HTML corrector -- unclosed list tags.'));

    $f = _filter_htmlcorrector('content');
    $this->assertEqual($f, 'content', t('HTML corrector -- unclosed tag with attribute.'));

    // XHTML slash for empty elements.
    $f = _filter_htmlcorrector(' ');
    $this->assertEqual($f, ' ', t('HTML corrector -- XHTML closing slash.'));
  }

  /**
   * Creates a text format with a single filter enabled via the add form.
   *
   * @param $filter
   *   Delta of the filter module's filter to enable in the new format.
   * @return
   *   The new {filter_format} row as an object. This is the result of
   *   fetchObject(), which is FALSE when the format was not saved.
   */
  function createFormat($filter) {
    $edit = array(
      'name' => $this->randomName(),
      'roles[2]' => TRUE,
      'filters[filter/' . $filter . ']' => TRUE,
    );
    // Use the same add-format path as the rest of this file
    // ('admin/settings/formats/...').
    $this->drupalPost('admin/settings/formats/add', $edit, t('Save configuration'));
    return db_query("SELECT * FROM {filter_format} WHERE name = :name", array(':name' => $edit['name']))->fetchObject();
  }

  /**
   * Deletes a text format through the delete confirmation form.
   *
   * @param $format
   *   A format object as returned by createFormat(). Empty values (NULL, or the
   *   FALSE that createFormat() yields when nothing was saved) are ignored.
   */
  function deleteFormat($format) {
    if (!empty($format)) {
      $this->drupalPost('admin/settings/formats/delete/' . $format->format, array(), t('Delete'));
    }
  }

  /**
   * Asserts that text, lowercased and with HTML entities decoded, contains a given string.
   *
   * Otherwise fails the test with a given message, similar to all the
   * SimpleTest assert* functions.
   *
   * Note that this does not remove nulls, new lines and other characters that
   * could be used to obscure a tag or an attribute name.
   *
   * @param $haystack
   *   Text to look in.
   * @param $needle
   *   Lowercase, plain text to look for.
   * @param $message
   *   Message to display if failed.
   * @param $group
   *   The group this message belongs to, defaults to 'Other'.
   * @return
   *   TRUE on pass, FALSE on fail.
   */
  function assertNormalized($haystack, $needle, $message = '', $group = 'Other') {
    return $this->assertTrue(strpos(strtolower(decode_entities($haystack)), $needle) !== FALSE, $message, $group);
  }

  /**
   * Asserts that text, lowercased and with HTML entities decoded, does not contain a given string.
   *
   * Otherwise fails the test with a given message, similar to all the
   * SimpleTest assert* functions.
   *
   * Note that this does not remove nulls, new lines, and other characters that
   * could be used to obscure a tag or an attribute name.
   *
   * @param $haystack
   *   Text to look in.
   * @param $needle
   *   Lowercase, plain text to look for.
   * @param $message
   *   Message to display if failed.
   * @param $group
   *   The group this message belongs to, defaults to 'Other'.
   * @return
   *   TRUE on pass, FALSE on fail.
   */
  function assertNoNormalized($haystack, $needle, $message = '', $group = 'Other') {
    return $this->assertTrue(strpos(strtolower(decode_entities($haystack)), $needle) === FALSE, $message, $group);
  }
}