<?php require_once('common.php'); function formatCode($string) { return str_replace( array("\t", '»', '\0(null)'), array('<strong>\t</strong>', '<span class="linebreak">»</span>', '<strong>\0</strong>'), escapeHTML( str_replace("\0", '\0(null)', wordwrap($string, 28, " »\n", true) ) ) ); } ?><!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd"> <html> <head> <title>HTML Purifier XSS Attacks Smoketest</title> <meta http-equiv="Content-Type" content="text/html; charset=UTF-8" /> <style type="text/css"> .scroll {overflow:auto; width:100%;} .even {background:#EAEAEA;} thead th {border-bottom:1px solid #000;} pre strong {color:#00C;} pre .linebreak {color:#AAA;font-weight:100;} </style> </head> <body> <h1>HTML Purifier XSS Attacks Smoketest</h1> <p>XSS attacks are from <a href="http://ha.ckers.org/xss.html">http://ha.ckers.org/xss.html</a>.</p> <p><strong>Caveats:</strong> <tt>Google.com</tt> has been programatically disallowed, but as you can see, there are ways of getting around that, so coverage in this area is not complete. Most XSS broadcasts its presence by spawning an alert dialogue. The displayed code is not strictly correct, as linebreaks have been forced for readability. Linewraps have been marked with <tt>»</tt>. Some tests are omitted for your convenience. Not all control characters are displayed.</p> <h2>Test</h2> <?php if (version_compare(PHP_VERSION, '5', '<')) exit('<p>Requires PHP 5.</p>'); $xml = simplexml_load_file('xssAttacks.xml'); // programatically disallow google.com for URI evasion tests // not complete $config = HTMLPurifier_Config::createDefault(); $config->set('URI.HostBlacklist', array('google.com')); $purifier = new HTMLPurifier($config); ?> <table cellspacing="0" cellpadding="2"> <thead><tr><th>Name</th><th width="30%">Raw</th><th>Output</th><th>Render</th></tr></thead> <tbody> <?php $i = 0; foreach ($xml->attack as $attack) { $code = $attack->code; // custom code for null byte injection tests if (substr($code, 0, 7) == 'perl -e') { $code = substr($code, $i=strpos($code, '"')+1, strrpos($code, '"') - $i); $code = str_replace('\0', "\0", $code); } // disable vectors we cannot test in any meaningful way if ($code == 'See Below') continue; // event handlers, whitelist defeats if ($attack->name == 'OBJECT w/Flash 2') continue; // requires ActionScript if ($attack->name == 'IMG Embedded commands 2') continue; // is an HTTP response // custom code for US-ASCII, which couldn't be expressed in XML without encoding if ($attack->name == 'US-ASCII encoding') $code = urldecode($code); ?> <tr<?php if ($i++ % 2) {echo ' class="even"';} ?>> <td><?php echo escapeHTML($attack->name); ?></td> <td><pre><?php echo formatCode($code); ?></pre></td> <?php $pure_html = $purifier->purify($code); ?> <td><pre><?php echo formatCode($pure_html); ?></pre></td> <td><div class="scroll"><?php echo $pure_html ?></div></td> </tr> <?php } ?> </tbody> </table> </body> </html> <?php // vim: et sw=4 sts=4