0
0
mirror of https://github.com/ezyang/htmlpurifier.git synced 2024-09-20 03:05:18 +00:00
htmlpurifier/benchmarks/Lexer.php

120 lines
2.9 KiB
PHP
Raw Normal View History

<?php
// emulates inserting a dir called HTMLPurifier into your class dir
set_include_path(get_include_path() . PATH_SEPARATOR . '../../');
require_once 'HTMLPurifier/Lexer/DirectLex.php';
require_once 'HTMLPurifier/Lexer/PEARSax3.php';
// PEAR
require_once 'Benchmark/Timer.php'; // to do the timing
require_once 'Text/Password.php'; // for generating random input
// custom timer subclass that renders its benchmark markers as one HTML table row
/**
 * Benchmark_Timer subclass whose getOutput() renders the recorded markers
 * as a single HTML <tr>: one label cell followed by one right-aligned cell
 * per marker (the 'Start' and 'Stop' markers are left out).
 */
class TinyTimer extends Benchmark_Timer
{
    // Row label; stored already HTML-escaped by the constructor.
    var $name;

    /**
     * @param string $name Label for the row; passed through htmlentities().
     * @param bool   $auto Forwarded unchanged to the Benchmark_Timer constructor.
     */
    function TinyTimer($name, $auto = false) {
        $this->name = htmlentities($name);
        $this->Benchmark_Timer($auto);
    }

    /**
     * Builds the table row for this timer.
     *
     * @return string '<tr>' + label cell + one cell per marker 'diff' + '</tr>'
     */
    function getOutput() {
        // The original invoked TimeElapsed() before reading the profile and
        // ignored the result; the call is kept in the same position in case
        // the parent implementation has side effects -- TODO confirm.
        $this->TimeElapsed();

        $cells = array("<td>{$this->name}</td>");
        foreach ($this->getProfiling() as $marker) {
            // Only the user-defined markers get a column.
            if (in_array($marker['name'], array('Start', 'Stop'))) {
                continue;
            }
            $cells[] = '<td align="right">' . $marker['diff'] . "</td>";
        }

        return '<tr>' . implode('', $cells) . '</tr>';
    }
}
?>
<html>
<head>
<title>Benchmark: DirectLex versus PEAR's XML_HTMLSax3</title>
</head>
<body>
<h1>Benchmark: DirectLex versus PEAR's XML_HTMLSax3</h1>
<table border="1">
<tr><th>Case</th><th>DirectLex</th><th>XML_HTMLSax3</th></tr>
<?php
/**
 * Times both lexers on one document and displays the result.
 *
 * A marker is set after each tokenizeHTML() call, so the 'HTMLPurifier_Lexer'
 * marker covers the DirectLex run and 'HTMLPurifier_Lexer_Sax' covers the
 * PEARSax3 run.
 *
 * @param string $name     Label handed to TinyTimer for this case.
 * @param string $document HTML text passed to each lexer's tokenizeHTML().
 */
function do_benchmark($name, $document) {
    $stopwatch = new TinyTimer($name);
    $stopwatch->start();

    // First contender: DirectLex. The result is kept in a local (unused
    // otherwise) so it stays alive until the function returns, as before.
    $tokenizer = new HTMLPurifier_Lexer_DirectLex();
    $directTokens = $tokenizer->tokenizeHTML($document);
    $stopwatch->setMarker('HTMLPurifier_Lexer');

    // Second contender: the PEAR SAX3 based lexer, same variable reused.
    $tokenizer = new HTMLPurifier_Lexer_PEARSax3();
    $saxTokens = $tokenizer->tokenizeHTML($document);
    $stopwatch->setMarker('HTMLPurifier_Lexer_Sax');

    $stopwatch->stop();
    // display() is inherited from Benchmark_Timer; presumably it prints
    // getOutput(), i.e. the table row -- confirm against the PEAR class.
    $stopwatch->display();
}
// sample of html pages
// Benchmark every file in $dir whose name ends in ".html".
$dir = 'samples/Lexer';
$dh = opendir($dir);
// opendir() returns false on failure; calling readdir() on that value is an
// error (a TypeError on PHP 8), so the loop only runs with a valid handle.
if ($dh !== false) {
    while (false !== ($filename = readdir($dh))) {
        // Compare the last five characters. The previous strpos() test looked
        // at the FIRST ".html" in the name, so "a.html.html" was skipped.
        if (substr($filename, -5) !== '.html') continue;
        $document = file_get_contents($dir . '/' . $filename);
        // Unreadable file: nothing meaningful to benchmark.
        if ($document === false) continue;
        do_benchmark("File: $filename", $document);
    }
    // Release the directory handle once the listing is exhausted.
    closedir($dh);
}
// crashers
// Malformed fragments (the "crashers"); each one doubles as its own label.
$snippets = array(
    '<a href="foo>',
    '<a "=>',
);
foreach ($snippets as $snippet) {
    do_benchmark($snippet, $snippet);
}

// Random input built by PEAR's Text_Password; presumably 80 characters drawn
// from the given character list -- confirm against Text_Password::create().
// $random is kept because it is echoed below the results table.
$random = Text_Password::create(
    80,
    'unpronounceable',
    'qwerty <>="\''
);
do_benchmark('Random input', $random);
?></table>
<?php
// Print the generated random input, HTML-escaped, so a run can be inspected.
// Multi-argument echo writes the same pieces in the same order as the
// original concatenation.
echo '<div>Random input was: ',
    '<span colspan="4" style="font-family:monospace;">',
    htmlentities($random),
    '</span></div>';
?>
</body></html>