attrTypes = new HTMLPurifier_AttrTypes(); if (!$blank) $this->initialize(); } function initialize() { $this->initialized = true; // load default modules to the recognized modules list (not active) $modules = array( // define 'CommonAttributes', 'Text', 'Hypertext', 'List', 'Presentation', 'Edit', 'Bdo', 'Tables', 'Image', 'StyleAttribute', 'Target', 'Scripting', // define-redefine 'Legacy', // redefine 'TransformToStrict', 'TransformToXHTML11' ); foreach ($modules as $module) { $this->addModule($module); } // these doctype definitions should be placed somewhere else $common = array( 'CommonAttributes', 'Text', 'Hypertext', 'List', 'Presentation', 'Edit', 'Bdo', 'Tables', 'Image', 'StyleAttribute', 'Scripting' ); $transitional = array('Legacy', 'Target'); $d =& $this->addDoctype('HTML 4.01 Transitional'); $d->modules = array_merge($common, $transitional); $d->modulesForMode['correctional'] = array('TransformToStrict'); $d =& $this->addDoctype('XHTML 1.0 Transitional'); $d->modules = array_merge($common, $transitional); $d->modulesForMode['correctional'] = array('TransformToStrict'); $d =& $this->addDoctype('HTML 4.01 Strict'); $d->modules = array_merge($common); $d->modulesForMode['lenient'] = array('TransformToStrict'); $d =& $this->addDoctype('XHTML 1.0 Strict'); $d->modules = array_merge($common); $d->modulesForMode['lenient'] = array('TransformToStrict'); $d =& $this->addDoctype('XHTML 1.1'); $d->modules = array_merge($common); $d->modulesForMode['lenient'] = array('TransformToStrict', 'TransformToXHTML11'); $this->autoDoctype = '*'; } /** * @temporary */ function &addDoctype($name) { $this->doctypes[$name] = new HTMLPurifier_Doctype(); $this->doctypes[$name]->name = $name; return $this->doctypes[$name]; } /** * Adds a module to the recognized module list. This does not * do anything else: the module must be added to a corresponding * collection to be "activated". * @param $module Mixed: string module name, with or without * HTMLPurifier_HTMLModule prefix, or instance of * subclass of HTMLPurifier_HTMLModule. * @note This function will not call autoload, you must instantiate * (and thus invoke) autoload outside the method. * @note If a string is passed as a module name, different variants * will be tested in this order: * - Check for HTMLPurifier_HTMLModule_$name * - Check all prefixes with $name in order they were added * - Check for literal object name * - Throw fatal error * If your object name collides with an internal class, specify * your module manually. */ function addModule($module) { if (is_string($module)) { $original_module = $module; $ok = false; foreach ($this->prefixes as $prefix) { $module = $prefix . $original_module; if ($this->_classExists($module)) { $ok = true; break; } } if (!$ok) { $module = $original_module; if (!$this->_classExists($module)) { trigger_error($original_module . ' module does not exist', E_USER_ERROR); return; } } $module = new $module(); } $module->order = $this->counter++; // assign then increment $this->modules[$module->name] = $module; if ($this->autoDoctype !== false && $this->autoCollection !== false) { $this->collections[$this->autoCollection][$this->autoDoctype][] = $module->name; } } /** * Safely tests for class existence without invoking __autoload in PHP5 * @param $name String class name to test * @private */ function _classExists($name) { static $is_php_4 = null; if ($is_php_4 === null) { $is_php_4 = version_compare(PHP_VERSION, '5', '<'); } if ($is_php_4) { return class_exists($name); } else { return class_exists($name, false); } } /** * Adds a class prefix that addModule() will use to resolve a * string name to a concrete class */ function addPrefix($prefix) { $this->prefixes[] = (string) $prefix; } function setup($config) { // retrieve the doctype $this->doctype = $this->getDoctype($config); if (isset($this->doctypeAliases[$this->doctype])) { // resolve alias $this->doctype = $this->doctypeAliases[$this->doctype]; } // retrieve object instance of doctype $doctype = $this->doctypes[$this->doctype]; $modules = $doctype->modules; foreach ($doctype->modulesForMode as $mode => $mode_modules) { // TODO: test if $mode is active $modules = array_merge($modules, $mode_modules); } foreach ($modules as $module) { $this->validModules[$module] = $this->modules[$module]; } // setup lookup table based on all valid modules foreach ($this->validModules as $module) { foreach ($module->info as $name => $def) { if (!isset($this->elementLookup[$name])) { $this->elementLookup[$name] = array(); } $this->elementLookup[$name][] = $module->name; } } // note the different choice $this->contentSets = new HTMLPurifier_ContentSets( // content set assembly deals with all possible modules, // not just ones deemed to be "safe" $this->validModules ); $this->attrCollections = new HTMLPurifier_AttrCollections( $this->attrTypes, // there is no way to directly disable a global attribute, // but using AllowedAttributes or simply not including // the module in your custom doctype should be sufficient $this->validModules ); } /** * Retrieves the doctype from the configuration object */ function getDoctype($config) { $doctype = $config->get('HTML', 'Doctype'); if ($doctype !== null) { return $doctype; } if (!$this->initialized) { // don't do HTML-oriented backwards compatibility stuff // use either the auto-doctype, or the catch-all doctype return $this->autoDoctype ? $this->autoDoctype : '*'; } // this is backwards-compatibility stuff if ($config->get('Core', 'XHTML')) { $doctype = 'XHTML 1.0'; } else { $doctype = 'HTML 4.01'; } if ($config->get('HTML', 'Strict')) { $doctype .= ' Strict'; } else { $doctype .= ' Transitional'; } return $doctype; } /** * Retrieves merged element definitions. * @param $config Instance of HTMLPurifier_Config, for determining * stray elements. */ function getElements($config) { $elements = array(); foreach ($this->validModules as $module) { foreach ($module->info as $name => $v) { if (isset($elements[$name])) continue; // if element is not safe, don't use it if (!$this->trusted && ($v->safe === false)) continue; $elements[$name] = $this->getElement($name, $config); } } // remove dud elements foreach ($elements as $n => $v) { if ($v === false) unset($elements[$n]); } return $elements; } /** * Retrieves a single merged element definition * @param $name Name of element * @param $config Instance of HTMLPurifier_Config, may not be necessary. */ function getElement($name, $config) { $def = false; $modules = $this->validModules; if (!isset($this->elementLookup[$name])) { return false; } foreach($this->elementLookup[$name] as $module_name) { $module = $modules[$module_name]; $new_def = $module->info[$name]; // refuse to create/merge in a definition that is deemed unsafe if (!$this->trusted && ($new_def->safe === false)) { $def = false; continue; } if (!$def && $new_def->standalone) { // element with unknown safety is not to be trusted. // however, a merge-in definition with undefined safety // is fine if (!$new_def->safe) continue; $def = $new_def; } elseif ($def) { $def->mergeIn($new_def); } else { // could "save it for another day": // non-standalone definitions that don't have a standalone // to merge into could be deferred to the end continue; } // attribute value expansions $this->attrCollections->performInclusions($def->attr); $this->attrCollections->expandIdentifiers($def->attr, $this->attrTypes); // descendants_are_inline, for ChildDef_Chameleon if (is_string($def->content_model) && strpos($def->content_model, 'Inline') !== false) { if ($name != 'del' && $name != 'ins') { // this is for you, ins/del $def->descendants_are_inline = true; } } $this->contentSets->generateChildDef($def, $module); } return $def; } } ?>