0
0
mirror of https://github.com/ezyang/htmlpurifier.git synced 2025-01-05 06:01:52 +00:00

[2.0.1] Revamp error collector scheme: we now have custom mocks and an exchange of responsibilities

- Fix oversight in AutoParagraph dealing with armor.
- Order errors with no line number last
- Language object now needs $config and $context objects to do parameterized objects
- Auto-close notice added
- Token constructors accept line numbers

git-svn-id: http://htmlpurifier.org/svnroot/htmlpurifier/trunk@1245 48356398-32a2-884e-a903-53898d9a118a
This commit is contained in:
Edward Z. Yang 2007-06-26 19:33:37 +00:00
parent 275932ec05
commit 6a95d91a1a
17 changed files with 248 additions and 109 deletions

View File

@ -54,14 +54,6 @@ require_once 'HTMLPurifier/Encoder.php';
require_once 'HTMLPurifier/ErrorCollector.php'; require_once 'HTMLPurifier/ErrorCollector.php';
require_once 'HTMLPurifier/LanguageFactory.php'; require_once 'HTMLPurifier/LanguageFactory.php';
HTMLPurifier_ConfigSchema::define(
'Core', 'Language', 'en', 'string', '
ISO 639 language code for localizable things in HTML Purifier to use,
which is mainly error reporting. There is currently only an English (en)
translation, so this directive is currently useless.
This directive has been available since 2.0.0.
');
HTMLPurifier_ConfigSchema::define( HTMLPurifier_ConfigSchema::define(
'Core', 'CollectErrors', false, 'bool', ' 'Core', 'CollectErrors', false, 'bool', '
Whether or not to collect errors found while filtering the document. This Whether or not to collect errors found while filtering the document. This
@ -148,7 +140,7 @@ class HTMLPurifier
if ($config->get('Core', 'CollectErrors')) { if ($config->get('Core', 'CollectErrors')) {
// may get moved out if other facilities use it // may get moved out if other facilities use it
$language_factory = HTMLPurifier_LanguageFactory::instance(); $language_factory = HTMLPurifier_LanguageFactory::instance();
$language = $language_factory->create($config->get('Core', 'Language')); $language = $language_factory->create($config, $context);
$context->register('Locale', $language); $context->register('Locale', $language);
$error_collector = new HTMLPurifier_ErrorCollector($context); $error_collector = new HTMLPurifier_ErrorCollector($context);

View File

@ -27,36 +27,35 @@ class HTMLPurifier_ErrorCollector
* @param $msg string Error message text * @param $msg string Error message text
*/ */
function send($severity, $msg, $args = array()) { function send($severity, $msg, $args = array()) {
if (func_num_args() == 2) {
$msg = $this->locale->getMessage($msg);
} else {
// setup one-based array if necessary
if (!is_array($args)) { if (!is_array($args)) {
$args = func_get_args(); $args = func_get_args();
array_shift($args); array_shift($args);
unset($args[0]); unset($args[0]);
} }
$msg = $this->locale->formatMessage($msg, $args);
}
$token = $this->context->get('CurrentToken', true); $token = $this->context->get('CurrentToken', true);
$line = $token ? $token->line : $this->context->get('CurrentLine', true); $line = $token ? $token->line : $this->context->get('CurrentLine', true);
$attr = $this->context->get('CurrentAttr', true); $attr = $this->context->get('CurrentAttr', true);
// perform special substitutions
// Currently defined: $CurrentToken.Name, $CurrentToken.Serialized, // perform special substitutions, also add custom parameters
// $CurrentAttr.Name, $CurrentAttr.Value
if (strpos($msg, '$') !== false) {
$subst = array(); $subst = array();
if (!is_null($token)) { if (!is_null($token)) {
if (isset($token->name)) $subst['$CurrentToken.Name'] = $token->name; $args['CurrentToken'] = $token;
$subst['$CurrentToken.Serialized'] = $this->generator->generateFromToken($token);
} }
if (!is_null($attr)) { if (!is_null($attr)) {
$subst['$CurrentAttr.Name'] = $attr; $subst['$CurrentAttr.Name'] = $attr;
if (isset($token->attr[$attr])) $subst['$CurrentAttr.Value'] = $token->attr[$attr]; if (isset($token->attr[$attr])) $subst['$CurrentAttr.Value'] = $token->attr[$attr];
} }
if (!empty($subst)) $msg = strtr($msg, $subst);
if (empty($args)) {
$msg = $this->locale->getMessage($msg);
} else {
$msg = $this->locale->formatMessage($msg, $args);
} }
if (!empty($subst)) $msg = strtr($msg, $subst);
$this->errors[] = array($line, $severity, $msg); $this->errors[] = array($line, $severity, $msg);
} }
@ -74,8 +73,6 @@ class HTMLPurifier_ErrorCollector
* @param $config Configuration array, vital for HTML output nature * @param $config Configuration array, vital for HTML output nature
*/ */
function getHTMLFormatted($config) { function getHTMLFormatted($config) {
$generator = new HTMLPurifier_Generator();
$generator->generateFromTokens(array(), $config, $this->context); // initialize
$ret = array(); $ret = array();
$errors = $this->errors; $errors = $this->errors;
@ -83,20 +80,22 @@ class HTMLPurifier_ErrorCollector
// sort error array by line // sort error array by line
// line numbers are enabled if they aren't explicitly disabled // line numbers are enabled if they aren't explicitly disabled
if ($config->get('Core', 'MaintainLineNumbers') !== false) { if ($config->get('Core', 'MaintainLineNumbers') !== false) {
$has_line = array();
$lines = array(); $lines = array();
$original_order = array(); $original_order = array();
foreach ($errors as $i => $error) { foreach ($errors as $i => $error) {
$has_line[] = (int) (bool) $error[0];
$lines[] = $error[0]; $lines[] = $error[0];
$original_order[] = $i; $original_order[] = $i;
} }
array_multisort($lines, SORT_ASC, $original_order, SORT_ASC, $errors); array_multisort($has_line, SORT_DESC, $lines, SORT_ASC, $original_order, SORT_ASC, $errors);
} }
foreach ($errors as $error) { foreach ($errors as $error) {
list($line, $severity, $msg) = $error; list($line, $severity, $msg) = $error;
$string = ''; $string = '';
$string .= $this->locale->getErrorName($severity) . ': '; $string .= $this->locale->getErrorName($severity) . ': ';
$string .= $generator->escape($msg); $string .= $this->generator->escape($msg);
if ($line) { if ($line) {
// have javascript link generation that causes // have javascript link generation that causes
// textarea to skip to the specified line // textarea to skip to the specified line

View File

@ -38,7 +38,7 @@ class HTMLPurifier_Injector_AutoParagraph extends HTMLPurifier_Injector
if (empty($this->currentNesting)) { if (empty($this->currentNesting)) {
if (!$this->allowsElement('p')) return; if (!$this->allowsElement('p')) return;
// case 1: we're in root node (and it allows paragraphs) // case 1: we're in root node (and it allows paragraphs)
$token = array(new HTMLPurifier_Token_Start('p')); $token = array($this->_pStart());
$this->_splitText($text, $token); $this->_splitText($text, $token);
} elseif ($this->currentNesting[count($this->currentNesting)-1]->name == 'p') { } elseif ($this->currentNesting[count($this->currentNesting)-1]->name == 'p') {
// case 2: we're in a paragraph // case 2: we're in a paragraph
@ -229,7 +229,6 @@ class HTMLPurifier_Injector_AutoParagraph extends HTMLPurifier_Injector
array_pop($result); array_pop($result);
} }
} }
/** /**

View File

@ -31,6 +31,16 @@ class HTMLPurifier_Language
*/ */
var $_loaded = false; var $_loaded = false;
/**
* Instances of HTMLPurifier_Config and HTMLPurifier_Context
*/
var $config, $context;
function HTMLPurifier_Language($config, &$context) {
$this->config = $config;
$this->context =& $context;
}
/** /**
* Loads language object with necessary info from factory cache * Loads language object with necessary info from factory cache
* @note This is a lazy loader * @note This is a lazy loader
@ -73,16 +83,38 @@ class HTMLPurifier_Language
* @param $key string identifier of message * @param $key string identifier of message
* @param $args Parameters to substitute in * @param $args Parameters to substitute in
* @return string localised message * @return string localised message
* @todo Implement conditionals? Right now, some messages make
* reference to line numbers, but those aren't always available
*/ */
function formatMessage($key, $args = array()) { function formatMessage($key, $args = array()) {
if (!$this->_loaded) $this->load(); if (!$this->_loaded) $this->load();
if (!isset($this->messages[$key])) return "[$key]"; if (!isset($this->messages[$key])) return "[$key]";
$raw = $this->messages[$key]; $raw = $this->messages[$key];
$substitutions = array(); $subst = array();
$generator = false;
foreach ($args as $i => $value) { foreach ($args as $i => $value) {
$substitutions['$' . $i] = $value; if (is_object($value)) {
// complicated stuff
if (!$generator) $generator = $this->context->get('Generator');
// assuming it's a token
if (isset($value->name)) $subst['$'.$i.'.Name'] = $value->name;
if (isset($value->data)) $subst['$'.$i.'.Data'] = $value->data;
$subst['$'.$i.'.Compact'] =
$subst['$'.$i.'.Serialized'] = $generator->generateFromToken($value);
// a more complex algorithm for compact representation
// could be introduced for all types of tokens. This
// may need to be factored out into a dedicated class
if (!empty($value->attr)) {
$stripped_token = $value->copy();
$stripped_token->attr = array();
$subst['$'.$i.'.Compact'] = $generator->generateFromToken($stripped_token);
} }
return strtr($raw, $substitutions); $subst['$'.$i.'.Line'] = $value->line ? $value->line : 'unknown';
continue;
}
$subst['$' . $i] = $value;
}
return strtr($raw, $subst);
} }
} }

View File

@ -17,19 +17,20 @@ $messages = array(
'Lexer: Missing end quote' => 'Attribute declaration has no end quote', 'Lexer: Missing end quote' => 'Attribute declaration has no end quote',
'Strategy_RemoveForeignElements: Tag transform' => '<$1> element transformed into $CurrentToken.Serialized', 'Strategy_RemoveForeignElements: Tag transform' => '<$1> element transformed into $CurrentToken.Serialized',
'Strategy_RemoveForeignElements: Missing required attribute' => '<$1> element missing required attribute $2', 'Strategy_RemoveForeignElements: Missing required attribute' => '$CurrentToken.Compact element missing required attribute $1',
'Strategy_RemoveForeignElements: Foreign element to text' => 'Unrecognized $CurrentToken.Serialized tag converted to text', 'Strategy_RemoveForeignElements: Foreign element to text' => 'Unrecognized $CurrentToken.Serialized tag converted to text',
'Strategy_RemoveForeignElements: Foreign element removed' => 'Unrecognized $CurrentToken.Serialized tag removed', 'Strategy_RemoveForeignElements: Foreign element removed' => 'Unrecognized $CurrentToken.Serialized tag removed',
'Strategy_RemoveForeignElements: Comment removed' => 'Comment containing "$1" removed', 'Strategy_RemoveForeignElements: Comment removed' => 'Comment containing "$CurrentToken.Data" removed',
'Strategy_RemoveForeignElements: Script removed' => 'Inline scripting removed', 'Strategy_RemoveForeignElements: Script removed' => 'Script removed',
'Strategy_RemoveForeignElements: Token removed to end' => 'Tags and text starting from $1 element where removed to end', 'Strategy_RemoveForeignElements: Token removed to end' => 'Tags and text starting from $1 element where removed to end',
'Strategy_MakeWellFormed: Unnecessary end tag removed' => 'Unnecessary </$1> tag removed', 'Strategy_MakeWellFormed: Unnecessary end tag removed' => 'Unnecessary $CurrentToken.Serialized tag removed',
'Strategy_MakeWellFormed: Unnecessary end tag to text' => 'Unnecessary </$1> tag converted to text', 'Strategy_MakeWellFormed: Unnecessary end tag to text' => 'Unnecessary $CurrentToken.Serialized tag converted to text',
'Strategy_MakeWellFormed: Stray end tag removed' => 'Stray </$1> tag removed', 'Strategy_MakeWellFormed: Tag auto closed' => '$1.Compact started on line $1.Line auto-closed by $CurrentToken.Compact',
'Strategy_MakeWellFormed: Stray end tag to text' => 'Stray </$1> tag converted to text', 'Strategy_MakeWellFormed: Stray end tag removed' => 'Stray $CurrentToken.Serialized tag removed',
'Strategy_MakeWellFormed: Tag closed by element end' => '<$1> tag closed by end of $CurrentToken.Serialized', 'Strategy_MakeWellFormed: Stray end tag to text' => 'Stray $CurrentToken.Serialized tag converted to text',
'Strategy_MakeWellFormed: Tag closed by document end' => '<$1> tag closed by end of document', 'Strategy_MakeWellFormed: Tag closed by element end' => '$1.Compact tag started on line $1.Line closed by end of $CurrentToken.Serialized',
'Strategy_MakeWellFormed: Tag closed by document end' => '$1.Compact tag started on line $1.Line closed by end of document',
); );

View File

@ -3,6 +3,14 @@
require_once 'HTMLPurifier/Language.php'; require_once 'HTMLPurifier/Language.php';
require_once 'HTMLPurifier/AttrDef/Lang.php'; require_once 'HTMLPurifier/AttrDef/Lang.php';
HTMLPurifier_ConfigSchema::define(
'Core', 'Language', 'en', 'string', '
ISO 639 language code for localizable things in HTML Purifier to use,
which is mainly error reporting. There is currently only an English (en)
translation, so this directive is currently useless.
This directive has been available since 2.0.0.
');
/** /**
* Class responsible for generating HTMLPurifier_Language objects, managing * Class responsible for generating HTMLPurifier_Language objects, managing
* caching and fallbacks. * caching and fallbacks.
@ -79,12 +87,15 @@ class HTMLPurifier_LanguageFactory
/** /**
* Creates a language object, handles class fallbacks * Creates a language object, handles class fallbacks
* @param $code string language code * @param $config Instance of HTMLPurifier_Config
* @param $context Instance of HTMLPurifier_Context
*/ */
function create($code) { function create($config, &$context) {
$config = $context = false; // hope it doesn't use these! // validate language code
$code = $this->validator->validate($code, $config, $context); $code = $this->validator->validate(
$config->get('Core', 'Language'), $config, $context
);
if ($code === false) $code = 'en'; // malformed code becomes English if ($code === false) $code = 'en'; // malformed code becomes English
$pcode = str_replace('-', '_', $code); // make valid PHP classname $pcode = str_replace('-', '_', $code); // make valid PHP classname
@ -111,7 +122,7 @@ class HTMLPurifier_LanguageFactory
$lang = HTMLPurifier_LanguageFactory::factory( $fallback ); $lang = HTMLPurifier_LanguageFactory::factory( $fallback );
$depth--; $depth--;
} else { } else {
$lang = new $class; $lang = new $class($config, $context);
} }
$lang->code = $code; $lang->code = $code;

View File

@ -153,6 +153,7 @@ class HTMLPurifier_Strategy_MakeWellFormed extends HTMLPurifier_Strategy
// if the token is not allowed by the parent, auto-close // if the token is not allowed by the parent, auto-close
// the parent // the parent
if (!isset($parent_info->child->elements[$token->name])) { if (!isset($parent_info->child->elements[$token->name])) {
if ($e) $e->send(E_NOTICE, 'Strategy_MakeWellFormed: Tag auto closed', $parent);
// close the parent, then append the token // close the parent, then append the token
$result[] = new HTMLPurifier_Token_End($parent->name); $result[] = new HTMLPurifier_Token_End($parent->name);
$result[] = $token; $result[] = $token;
@ -182,12 +183,12 @@ class HTMLPurifier_Strategy_MakeWellFormed extends HTMLPurifier_Strategy
// make sure that we have something open // make sure that we have something open
if (empty($this->currentNesting)) { if (empty($this->currentNesting)) {
if ($escape_invalid_tags) { if ($escape_invalid_tags) {
if ($e) $e->send(E_WARNING, 'Strategy_MakeWellFormed: Unnecessary end tag to text', $token->name); if ($e) $e->send(E_WARNING, 'Strategy_MakeWellFormed: Unnecessary end tag to text');
$result[] = new HTMLPurifier_Token_Text( $result[] = new HTMLPurifier_Token_Text(
$generator->generateFromToken($token, $config, $context) $generator->generateFromToken($token, $config, $context)
); );
} elseif ($e) { } elseif ($e) {
$e->send(E_WARNING, 'Strategy_MakeWellFormed: Unnecessary end tag removed', $token->name); $e->send(E_WARNING, 'Strategy_MakeWellFormed: Unnecessary end tag removed');
} }
continue; continue;
} }
@ -223,9 +224,9 @@ class HTMLPurifier_Strategy_MakeWellFormed extends HTMLPurifier_Strategy
$result[] = new HTMLPurifier_Token_Text( $result[] = new HTMLPurifier_Token_Text(
$generator->generateFromToken($token, $config, $context) $generator->generateFromToken($token, $config, $context)
); );
if ($e) $e->send(E_WARNING, 'Strategy_MakeWellFormed: Stray end tag to text', $token->name); if ($e) $e->send(E_WARNING, 'Strategy_MakeWellFormed: Stray end tag to text');
} elseif ($e) { } elseif ($e) {
$e->send(E_WARNING, 'Strategy_MakeWellFormed: Stray end tag removed', $token->name); $e->send(E_WARNING, 'Strategy_MakeWellFormed: Stray end tag removed');
} }
continue; continue;
} }
@ -235,7 +236,7 @@ class HTMLPurifier_Strategy_MakeWellFormed extends HTMLPurifier_Strategy
$size = count($skipped_tags); $size = count($skipped_tags);
for ($i = $size - 1; $i > 0; $i--) { for ($i = $size - 1; $i > 0; $i--) {
if ($e && !isset($skipped_tags[$i]->armor['MakeWellFormed_TagClosedError'])) { if ($e && !isset($skipped_tags[$i]->armor['MakeWellFormed_TagClosedError'])) {
$e->send(E_NOTICE, 'Strategy_MakeWellFormed: Tag closed by element end', $skipped_tags[$i]->name); $e->send(E_NOTICE, 'Strategy_MakeWellFormed: Tag closed by element end', $skipped_tags[$i]);
} }
$result[] = new HTMLPurifier_Token_End($skipped_tags[$i]->name); $result[] = new HTMLPurifier_Token_End($skipped_tags[$i]->name);
} }
@ -244,25 +245,25 @@ class HTMLPurifier_Strategy_MakeWellFormed extends HTMLPurifier_Strategy
} }
$context->destroy('CurrentNesting');
$context->destroy('InputTokens');
$context->destroy('InputIndex');
$context->destroy('CurrentToken');
// we're at the end now, fix all still unclosed tags // we're at the end now, fix all still unclosed tags
// not using processToken() because at this point we don't // not using processToken() because at this point we don't
// care about current nesting // care about current nesting
if (!empty($this->currentNesting)) { if (!empty($this->currentNesting)) {
$size = count($this->currentNesting); $size = count($this->currentNesting);
for ($i = $size - 1; $i >= 0; $i--) { for ($i = $size - 1; $i >= 0; $i--) {
if ($e && !isset($skipped_tags[$i]->armor['MakeWellFormed_TagClosedError'])) { if ($e && !isset($this->currentNesting[$i]->armor['MakeWellFormed_TagClosedError'])) {
$e->send(E_NOTICE, 'Strategy_MakeWellFormed: Tag closed by document end', $this->currentNesting[$i]->name); $e->send(E_NOTICE, 'Strategy_MakeWellFormed: Tag closed by document end', $this->currentNesting[$i]);
} }
$result[] = $result[] =
new HTMLPurifier_Token_End($this->currentNesting[$i]->name); new HTMLPurifier_Token_End($this->currentNesting[$i]->name);
} }
} }
$context->destroy('CurrentNesting');
$context->destroy('InputTokens');
$context->destroy('InputIndex');
$context->destroy('CurrentToken');
unset($this->outputTokens, $this->injectors, $this->currentInjector, unset($this->outputTokens, $this->injectors, $this->currentInjector,
$this->currentNesting, $this->inputTokens, $this->inputIndex); $this->currentNesting, $this->inputTokens, $this->inputIndex);

View File

@ -100,7 +100,7 @@ class HTMLPurifier_Strategy_RemoveForeignElements extends HTMLPurifier_Strategy
} }
} }
if (!$ok) { if (!$ok) {
if ($e) $e->send(E_ERROR, 'Strategy_RemoveForeignElements: Missing required attribute', $token->name, $name); if ($e) $e->send(E_ERROR, 'Strategy_RemoveForeignElements: Missing required attribute', $name);
continue; continue;
} }
$token->armor['ValidateAttributes'] = true; $token->armor['ValidateAttributes'] = true;
@ -143,7 +143,7 @@ class HTMLPurifier_Strategy_RemoveForeignElements extends HTMLPurifier_Strategy
$token = new HTMLPurifier_Token_Text($data); $token = new HTMLPurifier_Token_Text($data);
} else { } else {
// strip comments // strip comments
if ($e) $e->send(E_NOTICE, 'Strategy_RemoveForeignElements: Comment removed', $token->data); if ($e) $e->send(E_NOTICE, 'Strategy_RemoveForeignElements: Comment removed');
continue; continue;
} }
} elseif ($token->type == 'text') { } elseif ($token->type == 'text') {

View File

@ -66,7 +66,7 @@ class HTMLPurifier_Token_Tag extends HTMLPurifier_Token // abstract
* @param $name String name. * @param $name String name.
* @param $attr Associative array of attributes. * @param $attr Associative array of attributes.
*/ */
function HTMLPurifier_Token_Tag($name, $attr = array()) { function HTMLPurifier_Token_Tag($name, $attr = array(), $line = null) {
$this->name = ctype_lower($name) ? $name : strtolower($name); $this->name = ctype_lower($name) ? $name : strtolower($name);
foreach ($attr as $key => $value) { foreach ($attr as $key => $value) {
// normalization only necessary when key is not lowercase // normalization only necessary when key is not lowercase
@ -81,6 +81,7 @@ class HTMLPurifier_Token_Tag extends HTMLPurifier_Token // abstract
} }
} }
$this->attr = $attr; $this->attr = $attr;
$this->line = $line;
} }
} }
@ -134,9 +135,10 @@ class HTMLPurifier_Token_Text extends HTMLPurifier_Token
* *
* @param $data String parsed character data. * @param $data String parsed character data.
*/ */
function HTMLPurifier_Token_Text($data) { function HTMLPurifier_Token_Text($data, $line = null) {
$this->data = $data; $this->data = $data;
$this->is_whitespace = ctype_space($data); $this->is_whitespace = ctype_space($data);
$this->line = $line;
} }
} }
@ -153,8 +155,9 @@ class HTMLPurifier_Token_Comment extends HTMLPurifier_Token
* *
* @param $data String comment data. * @param $data String comment data.
*/ */
function HTMLPurifier_Token_Comment($data) { function HTMLPurifier_Token_Comment($data, $line = null) {
$this->data = $data; $this->data = $data;
$this->line = $line;
} }
} }

View File

@ -0,0 +1,47 @@
<?php
require_once 'HTMLPurifier/ErrorCollector.php';
generate_mock_once('HTMLPurifier_ErrorCollector');
/**
* Extended error collector mock that has the ability to expect context
*/
class HTMLPurifier_ErrorCollectorEMock extends HTMLPurifier_ErrorCollectorMock
{
var $_context;
var $_expected_context = array();
var $_expected_context_at = array();
function prepare(&$context) {
$this->_context =& $context;
}
function expectContext($key, $value) {
$this->_expected_context[$key] = $value;
}
function expectContextAt($step, $key, $value) {
$this->_expected_context_at[$step][$key] = $value;
}
function send() {
// test for context
$test = &$this->_getCurrentTestCase();
foreach ($this->_expected_context as $key => $value) {
$test->assertEqual($value, $this->_context->get($key));
}
$step = $this->getCallCount('send');
if (isset($this->_expected_context_at[$step])) {
foreach ($this->_expected_context_at[$step] as $key => $value) {
$test->assertEqual($value, $this->_context->get($key));
}
}
// boilerplate mock code, does not have return value or references
$args = func_get_args();
$this->_invoke('send', $args);
}
}
?>

View File

@ -26,7 +26,7 @@ class HTMLPurifier_ErrorCollectorTest extends UnitTestCase
$context->register('Locale', $language); $context->register('Locale', $language);
$context->register('CurrentLine', $line); $context->register('CurrentLine', $line);
$generator = new HTMLPurifier_GeneratorMock(); $generator = new HTMLPurifier_Generator();
$context->register('Generator', $generator); $context->register('Generator', $generator);
$collector = new HTMLPurifier_ErrorCollector($context); $collector = new HTMLPurifier_ErrorCollector($context);
@ -60,7 +60,7 @@ class HTMLPurifier_ErrorCollectorTest extends UnitTestCase
$context = new HTMLPurifier_Context(); $context = new HTMLPurifier_Context();
$context->register('Locale', $language); $context->register('Locale', $language);
$generator = new HTMLPurifier_GeneratorMock(); $generator = new HTMLPurifier_Generator();
$context->register('Generator', $generator); $context->register('Generator', $generator);
$collector = new HTMLPurifier_ErrorCollector($context); $collector = new HTMLPurifier_ErrorCollector($context);
@ -77,7 +77,7 @@ class HTMLPurifier_ErrorCollectorTest extends UnitTestCase
$context = new HTMLPurifier_Context(); $context = new HTMLPurifier_Context();
$context->register('Locale', $language); $context->register('Locale', $language);
$generator = new HTMLPurifier_GeneratorMock(); $generator = new HTMLPurifier_Generator();
$context->register('Generator', $generator); $context->register('Generator', $generator);
$collector = new HTMLPurifier_ErrorCollector($context); $collector = new HTMLPurifier_ErrorCollector($context);
@ -100,32 +100,36 @@ class HTMLPurifier_ErrorCollectorTest extends UnitTestCase
function testContextSubstitutions() { function testContextSubstitutions() {
$language = new HTMLPurifier_LanguageMock(); $language = new HTMLPurifier_LanguageMock();
$language->setReturnValue('getMessage',
'$CurrentToken.Name, $CurrentToken.Serialized', array('message-token'));
$language->setReturnValue('getMessage',
'$CurrentAttr.Name => $CurrentAttr.Value', array('message-attr'));
$context = new HTMLPurifier_Context(); $context = new HTMLPurifier_Context();
$context->register('Locale', $language); $context->register('Locale', $language);
$current_token = new HTMLPurifier_Token_Start('a', array('href' => 'http://example.com')); $generator = new HTMLPurifier_Generator();
$current_token->line = 32;
$current_attr = 'href';
$generator = new HTMLPurifier_GeneratorMock();
$generator->setReturnValue('generateFromToken', '<a href="http://example.com">', array($current_token));
$context->register('Generator', $generator); $context->register('Generator', $generator);
$current_token = false;
$context->register('CurrentToken', $current_token);
$collector = new HTMLPurifier_ErrorCollector($context); $collector = new HTMLPurifier_ErrorCollector($context);
$context->register('CurrentToken', $current_token); // 0
$collector->send(E_NOTICE, 'message-token'); $current_token = new HTMLPurifier_Token_Start('a', array('href' => 'http://example.com'), 32);
$language->setReturnValue('formatMessage', 'Token message',
array('message-data-token', array('CurrentToken' => $current_token)));
$collector->send(E_NOTICE, 'message-data-token');
$current_attr = 'href';
$language->setReturnValue('formatMessage', '$CurrentAttr.Name => $CurrentAttr.Value',
array('message-attr', array('CurrentToken' => $current_token)));
// 1
$collector->send(E_NOTICE, 'message-attr'); // test when context isn't available $collector->send(E_NOTICE, 'message-attr'); // test when context isn't available
// 2
$context->register('CurrentAttr', $current_attr); $context->register('CurrentAttr', $current_attr);
$collector->send(E_NOTICE, 'message-attr'); $collector->send(E_NOTICE, 'message-attr');
$result = array( $result = array(
0 => array(32, E_NOTICE, 'a, <a href="http://example.com">'), 0 => array(32, E_NOTICE, 'Token message'),
1 => array(32, E_NOTICE, '$CurrentAttr.Name => $CurrentAttr.Value'), 1 => array(32, E_NOTICE, '$CurrentAttr.Name => $CurrentAttr.Value'),
2 => array(32, E_NOTICE, 'href => http://example.com') 2 => array(32, E_NOTICE, 'href => http://example.com')
); );

View File

@ -1,6 +1,6 @@
<?php <?php
require_once 'HTMLPurifier/ErrorCollector.php'; require_once 'HTMLPurifier/ErrorCollectorEMock.php';
require_once 'HTMLPurifier/Lexer/DirectLex.php'; require_once 'HTMLPurifier/Lexer/DirectLex.php';
class HTMLPurifier_ErrorsHarness extends UnitTestCase class HTMLPurifier_ErrorsHarness extends UnitTestCase
@ -13,7 +13,8 @@ class HTMLPurifier_ErrorsHarness extends UnitTestCase
$this->config = HTMLPurifier_Config::create(array('Core.CollectErrors' => true)); $this->config = HTMLPurifier_Config::create(array('Core.CollectErrors' => true));
$this->context = new HTMLPurifier_Context(); $this->context = new HTMLPurifier_Context();
generate_mock_once('HTMLPurifier_ErrorCollector'); generate_mock_once('HTMLPurifier_ErrorCollector');
$this->collector = new HTMLPurifier_ErrorCollectorMock(); $this->collector = new HTMLPurifier_ErrorCollectorEMock();
$this->collector->prepare($this->context);
$this->context->register('ErrorCollector', $this->collector); $this->context->register('ErrorCollector', $this->collector);
} }
@ -22,6 +23,10 @@ class HTMLPurifier_ErrorsHarness extends UnitTestCase
$this->collector->expectOnce('send', $args); $this->collector->expectOnce('send', $args);
} }
function expectContext($key, $value) {
$this->collector->expectContext($key, $value);
}
} }
?> ?>

View File

@ -9,7 +9,9 @@ class HTMLPurifier_LanguageFactoryTest extends UnitTestCase
$factory = HTMLPurifier_LanguageFactory::instance(); $factory = HTMLPurifier_LanguageFactory::instance();
$language = $factory->create('en'); $config = HTMLPurifier_Config::create(array('Core.Language' => 'en'));
$context = new HTMLPurifier_Context();
$language = $factory->create($config, $context);
$this->assertIsA($language, 'HTMLPurifier_Language'); $this->assertIsA($language, 'HTMLPurifier_Language');
$this->assertIdentical($language->code, 'en'); $this->assertIdentical($language->code, 'en');
@ -27,7 +29,10 @@ class HTMLPurifier_LanguageFactoryTest extends UnitTestCase
$factory = HTMLPurifier_LanguageFactory::instance(); $factory = HTMLPurifier_LanguageFactory::instance();
$language = $factory->create('en-x-test'); $config = HTMLPurifier_Config::create(array('Core.Language' => 'en-x-test'));
$context = new HTMLPurifier_Context();
$language = $factory->create($config, $context);
$this->assertIsA($language, 'HTMLPurifier_Language_en_x_test'); $this->assertIsA($language, 'HTMLPurifier_Language_en_x_test');
$this->assertIdentical($language->code, 'en-x-test'); $this->assertIdentical($language->code, 'en-x-test');

View File

@ -8,7 +8,9 @@ class HTMLPurifier_LanguageTest extends UnitTestCase
var $lang; var $lang;
function test_getMessage() { function test_getMessage() {
$lang = new HTMLPurifier_Language(); $config = HTMLPurifier_Config::createDefault();
$context = new HTMLPurifier_Context();
$lang = new HTMLPurifier_Language($config, $context);
$lang->_loaded = true; $lang->_loaded = true;
$lang->messages['HTMLPurifier'] = 'HTML Purifier'; $lang->messages['HTMLPurifier'] = 'HTML Purifier';
$this->assertIdentical($lang->getMessage('HTMLPurifier'), 'HTML Purifier'); $this->assertIdentical($lang->getMessage('HTMLPurifier'), 'HTML Purifier');
@ -16,12 +18,31 @@ class HTMLPurifier_LanguageTest extends UnitTestCase
} }
function test_formatMessage() { function test_formatMessage() {
$lang = new HTMLPurifier_Language(); $config = HTMLPurifier_Config::createDefault();
$context = new HTMLPurifier_Context();
$lang = new HTMLPurifier_Language($config, $context);
$lang->_loaded = true; $lang->_loaded = true;
$lang->messages['LanguageTest: Error'] = 'Error is $1 on line $2'; $lang->messages['LanguageTest: Error'] = 'Error is $1 on line $2';
$this->assertIdentical($lang->formatMessage('LanguageTest: Error', array(1=>'fatal', 32)), 'Error is fatal on line 32'); $this->assertIdentical($lang->formatMessage('LanguageTest: Error', array(1=>'fatal', 32)), 'Error is fatal on line 32');
} }
function test_formatMessage_complexParameter() {
$config = HTMLPurifier_Config::createDefault();
$context = new HTMLPurifier_Context();
$generator = new HTMLPurifier_Generator(); // replace with mock if this gets icky
$context->register('Generator', $generator);
$lang = new HTMLPurifier_Language($config, $context);
$lang->_loaded = true;
$lang->messages['LanguageTest: Element info'] = 'Element Token: $1.Name, $1.Serialized, $1.Compact, $1.Line';
$lang->messages['LanguageTest: Data info'] = 'Data Token: $1.Data, $1.Serialized, $1.Compact, $1.Line';
$this->assertIdentical($lang->formatMessage('LanguageTest: Element info',
array(1=>new HTMLPurifier_Token_Start('a', array('href'=>'http://example.com'), 18))),
'Element Token: a, <a href="http://example.com">, <a>, 18');
$this->assertIdentical($lang->formatMessage('LanguageTest: Data info',
array(1=>new HTMLPurifier_Token_Text('data>', 23))),
'Data Token: data>, data&gt;, data&gt;, 23');
}
} }
?> ?>

View File

@ -18,19 +18,24 @@ class HTMLPurifier_Lexer_DirectLex_ErrorsTest extends HTMLPurifier_ErrorsHarness
function testUnclosedComment() { function testUnclosedComment() {
$this->expectErrorCollection(E_WARNING, 'Lexer: Unclosed comment'); $this->expectErrorCollection(E_WARNING, 'Lexer: Unclosed comment');
$this->expectContext('CurrentLine', 1);
$this->invoke('<!-- >'); $this->invoke('<!-- >');
} }
function testUnescapedLt() { function testUnescapedLt() {
$this->expectErrorCollection(E_NOTICE, 'Lexer: Unescaped lt'); $this->expectErrorCollection(E_NOTICE, 'Lexer: Unescaped lt');
$this->expectContext('CurrentLine', 1);
$this->invoke('< foo>'); $this->invoke('< foo>');
} }
function testMissingGt() { function testMissingGt() {
$this->expectErrorCollection(E_WARNING, 'Lexer: Missing gt'); $this->expectErrorCollection(E_WARNING, 'Lexer: Missing gt');
$this->expectContext('CurrentLine', 1);
$this->invoke('<a href=""'); $this->invoke('<a href=""');
} }
// these are sub-errors, will only be thrown in context of collector
function testMissingAttributeKey1() { function testMissingAttributeKey1() {
$this->expectErrorCollection(E_ERROR, 'Lexer: Missing attribute key'); $this->expectErrorCollection(E_ERROR, 'Lexer: Missing attribute key');
$this->invokeAttr('=""'); $this->invokeAttr('=""');

View File

@ -16,34 +16,44 @@ class HTMLPurifier_Strategy_MakeWellFormed_ErrorsTest extends HTMLPurifier_Strat
} }
function testUnnecessaryEndTagRemoved() { function testUnnecessaryEndTagRemoved() {
$this->expectErrorCollection(E_WARNING, 'Strategy_MakeWellFormed: Unnecessary end tag removed', 'b'); $this->expectErrorCollection(E_WARNING, 'Strategy_MakeWellFormed: Unnecessary end tag removed');
$this->expectContext('CurrentToken', new HTMLPurifier_Token_End('b', array(), 1));
$this->invoke('</b>'); $this->invoke('</b>');
} }
function testUnnecessaryEndTagToText() { function testUnnecessaryEndTagToText() {
$this->config->set('Core', 'EscapeInvalidTags', true); $this->config->set('Core', 'EscapeInvalidTags', true);
$this->expectErrorCollection(E_WARNING, 'Strategy_MakeWellFormed: Unnecessary end tag to text', 'b'); $this->expectErrorCollection(E_WARNING, 'Strategy_MakeWellFormed: Unnecessary end tag to text');
$this->expectContext('CurrentToken', new HTMLPurifier_Token_End('b', array(), 1));
$this->invoke('</b>'); $this->invoke('</b>');
} }
function testTagAutoClosed() {
$this->expectErrorCollection(E_NOTICE, 'Strategy_MakeWellFormed: Tag auto closed', new HTMLPurifier_Token_Start('b', array(), 1));
$this->expectContext('CurrentToken', new HTMLPurifier_Token_Start('div', array(), 1));
$this->invoke('<b>Foo<div>Bar</div>');
}
function testStrayEndTagRemoved() { function testStrayEndTagRemoved() {
$this->expectErrorCollection(E_WARNING, 'Strategy_MakeWellFormed: Stray end tag removed', 'b'); $this->expectErrorCollection(E_WARNING, 'Strategy_MakeWellFormed: Stray end tag removed');
$this->expectContext('CurrentToken', new HTMLPurifier_Token_End('b', array(), 1));
$this->invoke('<i></b></i>'); $this->invoke('<i></b></i>');
} }
function testStrayEndTagToText() { function testStrayEndTagToText() {
$this->config->set('Core', 'EscapeInvalidTags', true); $this->config->set('Core', 'EscapeInvalidTags', true);
$this->expectErrorCollection(E_WARNING, 'Strategy_MakeWellFormed: Stray end tag to text', 'b'); $this->expectErrorCollection(E_WARNING, 'Strategy_MakeWellFormed: Stray end tag to text');
$this->expectContext('CurrentToken', new HTMLPurifier_Token_End('b', array(), 1));
$this->invoke('<i></b></i>'); $this->invoke('<i></b></i>');
} }
function testTagClosedByElementEnd() { function testTagClosedByElementEnd() {
$this->expectErrorCollection(E_NOTICE, 'Strategy_MakeWellFormed: Tag closed by element end', 'b'); $this->expectErrorCollection(E_NOTICE, 'Strategy_MakeWellFormed: Tag closed by element end', new HTMLPurifier_Token_Start('b', array(), 1));
$this->invoke('<i><b>Foobar</i>'); $this->invoke('<i><b>Foobar</i>');
} }
function testTagClosedByDocumentEnd() { function testTagClosedByDocumentEnd() {
$this->expectErrorCollection(E_NOTICE, 'Strategy_MakeWellFormed: Tag closed by document end', 'b'); $this->expectErrorCollection(E_NOTICE, 'Strategy_MakeWellFormed: Tag closed by document end', new HTMLPurifier_Token_Start('b', array(), 1));
$this->invoke('<b>Foobar'); $this->invoke('<b>Foobar');
} }

View File

@ -16,37 +16,41 @@ class HTMLPurifier_Strategy_RemoveForeignElements_ErrorsTest extends HTMLPurifie
} }
function testTagTransform() { function testTagTransform() {
// uses $CurrentToken.Serialized
$this->expectErrorCollection(E_NOTICE, 'Strategy_RemoveForeignElements: Tag transform', 'center'); $this->expectErrorCollection(E_NOTICE, 'Strategy_RemoveForeignElements: Tag transform', 'center');
$this->expectContext('CurrentToken', new HTMLPurifier_Token_Start('div', array('style' => 'text-align:center;'), 1));
$this->invoke('<center>'); $this->invoke('<center>');
} }
function testMissingRequiredAttr() { function testMissingRequiredAttr() {
// a little fragile, since img has two required attributes // a little fragile, since img has two required attributes
$this->expectErrorCollection(E_ERROR, 'Strategy_RemoveForeignElements: Missing required attribute', 'img', 'alt'); $this->expectErrorCollection(E_ERROR, 'Strategy_RemoveForeignElements: Missing required attribute', 'alt');
$this->expectContext('CurrentToken', new HTMLPurifier_Token_Empty('img', array(), 1));
$this->invoke('<img />'); $this->invoke('<img />');
} }
function testForeignElementToText() { function testForeignElementToText() {
// uses $CurrentToken.Serialized
$this->config->set('Core', 'EscapeInvalidTags', true); $this->config->set('Core', 'EscapeInvalidTags', true);
$this->expectErrorCollection(E_WARNING, 'Strategy_RemoveForeignElements: Foreign element to text'); $this->expectErrorCollection(E_WARNING, 'Strategy_RemoveForeignElements: Foreign element to text');
$this->invoke('<cannot-possibly-exist-element>'); $this->expectContext('CurrentToken', new HTMLPurifier_Token_Start('invalid', array(), 1));
$this->invoke('<invalid>');
} }
function testForeignElementRemoved() { function testForeignElementRemoved() {
// uses $CurrentToken.Serialized // uses $CurrentToken.Serialized
$this->expectErrorCollection(E_ERROR, 'Strategy_RemoveForeignElements: Foreign element removed'); $this->expectErrorCollection(E_ERROR, 'Strategy_RemoveForeignElements: Foreign element removed');
$this->invoke('<cannot-possibly-exist-element>'); $this->expectContext('CurrentToken', new HTMLPurifier_Token_Start('invalid', array(), 1));
$this->invoke('<invalid>');
} }
function testCommentRemoved() { function testCommentRemoved() {
$this->expectErrorCollection(E_NOTICE, 'Strategy_RemoveForeignElements: Comment removed', ' test '); $this->expectErrorCollection(E_NOTICE, 'Strategy_RemoveForeignElements: Comment removed');
$this->expectContext('CurrentToken', new HTMLPurifier_Token_Comment(' test ', 1));
$this->invoke('<!-- test -->'); $this->invoke('<!-- test -->');
} }
function testScriptRemoved() { function testScriptRemoved() {
$this->collector->expectAt(0, 'send', array(E_ERROR, 'Strategy_RemoveForeignElements: Script removed')); $this->collector->expectAt(0, 'send', array(E_ERROR, 'Strategy_RemoveForeignElements: Script removed'));
$this->collector->expectContextAt(0, 'CurrentToken', new HTMLPurifier_Token_Start('script', array(), 1));
$this->collector->expectAt(1, 'send', array(E_ERROR, 'Strategy_RemoveForeignElements: Token removed to end', 'script')); $this->collector->expectAt(1, 'send', array(E_ERROR, 'Strategy_RemoveForeignElements: Token removed to end', 'script'));
$this->invoke('<script>asdf'); $this->invoke('<script>asdf');
} }