mirror of
https://github.com/ezyang/htmlpurifier.git
synced 2024-11-08 23:08:42 +00:00
e99520ab96
git-svn-id: http://htmlpurifier.org/svnroot/htmlpurifier/trunk@1253 48356398-32a2-884e-a903-53898d9a118a
188 lines
5.9 KiB
PHP
188 lines
5.9 KiB
PHP
<?php
|
|
|
|
/**
 * Structure that stores an HTML element definition. Used by
 * HTMLPurifier_HTMLDefinition and HTMLPurifier_HTMLModule.
 * @note This class is inspected by HTMLPurifier_Printer_HTMLDefinition.
 *       Please update that class too.
 */
class HTMLPurifier_ElementDef
{

    /**
     * Does the definition work by itself, or is it created solely
     * for the purpose of merging into another definition?
     * @public
     */
    public $standalone = true;

    /**
     * Associative array of attribute name to HTMLPurifier_AttrDef
     * @note Before being processed by HTMLPurifier_AttrCollections
     *       when modules are finalized during
     *       HTMLPurifier_HTMLDefinition->setup(), this array may also
     *       contain an array at index 0 that indicates which attribute
     *       collections to load into the full array. It may also
     *       contain string identifiers in lieu of HTMLPurifier_AttrDef,
     *       see HTMLPurifier_AttrTypes on how they are expanded during
     *       HTMLPurifier_HTMLDefinition->setup() processing.
     * @public
     */
    public $attr = array();

    /**
     * Indexed list of tag's HTMLPurifier_AttrTransform to be done before validation
     * @public
     */
    public $attr_transform_pre = array();

    /**
     * Indexed list of tag's HTMLPurifier_AttrTransform to be done after validation
     * @public
     */
    public $attr_transform_post = array();

    /**
     * HTMLPurifier_ChildDef of this tag.
     * @note mergeIn() resets this to false whenever the merged-in
     *       definition supplies a content model or content model type.
     * @public
     */
    public $child;

    /**
     * Abstract string representation of internal ChildDef rules. See
     * HTMLPurifier_ContentSets for how this is parsed and then transformed
     * into an HTMLPurifier_ChildDef.
     * @warning This is a temporary variable that is not available after
     *          being processed by HTMLDefinition
     * @public
     */
    public $content_model;

    /**
     * Value of $child->type, used to determine which ChildDef to use,
     * used in combination with $content_model.
     * @warning This must be lowercase
     * @warning This is a temporary variable that is not available after
     *          being processed by HTMLDefinition
     * @public
     */
    public $content_model_type;

    /**
     * Does the element have a content model (#PCDATA | Inline)*? This
     * is important for chameleon ins and del processing in
     * HTMLPurifier_ChildDef_Chameleon. Dynamically set: modules don't
     * have to worry about this one.
     * @public
     */
    public $descendants_are_inline = false;

    /**
     * List of the names of required attributes this element has. Dynamically
     * populated.
     * @public
     */
    public $required_attr = array();

    /**
     * Lookup table of tags excluded from all descendants of this tag.
     * @note SGML permits exclusions for all descendants, but this is
     *       not possible with DTDs or XML Schemas. W3C has elected to
     *       use complicated compositions of content_models to simulate
     *       exclusion for children, but we go the simpler, SGML-style
     *       route of flat-out exclusions, which correctly apply to
     *       all descendants and not just children. Note that the XHTML
     *       Modularization Abstract Modules are blithely unaware of such
     *       distinctions.
     * @public
     */
    public $excludes = array();

    /**
     * Is this element safe for untrusted users to use?
     * Left as null until set; mergeIn() only copies a non-null value.
     * @public
     */
    public $safe;

    /**
     * Low-level factory constructor for creating new standalone element defs.
     *
     * Declared static so that it can be invoked as
     * HTMLPurifier_ElementDef::create(...) on PHP versions that refuse
     * static calls to instance methods.
     *
     * @param $safe Whether the element is safe for untrusted users; cast to bool
     * @param $content_model Value stored in $content_model
     * @param $content_model_type Value stored in $content_model_type
     * @param $attr Value stored in $attr
     * @return New HTMLPurifier_ElementDef with the four fields populated and
     *         every other property at its default
     * @static
     */
    public static function create($safe, $content_model, $content_model_type, $attr) {
        $def = new HTMLPurifier_ElementDef();
        $def->safe = (bool) $safe;
        $def->content_model = $content_model;
        $def->content_model_type = $content_model_type;
        $def->attr = $attr;
        return $def;
    }

    /**
     * Merges the values of another element definition into this one.
     * Values from the new element def take precedence if a value is
     * not mergeable.
     *
     * @param $def HTMLPurifier_ElementDef whose values are merged into $this
     */
    public function mergeIn($def) {

        // later keys take precedence
        foreach ($def->attr as $name => $value) {
            if ($name === 0) {
                // index 0 carries the attribute collection includes: they
                // are appended, so there is no way to override an include
                foreach ($value as $include) {
                    $this->attr[0][] = $include;
                }
                continue;
            }
            if ($value === false) {
                // an exact false is the marker for "remove this attribute"
                unset($this->attr[$name]);
                continue;
            }
            $this->attr[$name] = $value;
        }
        $this->_mergeAssocArray($this->attr_transform_pre, $def->attr_transform_pre);
        $this->_mergeAssocArray($this->attr_transform_post, $def->attr_transform_post);
        $this->_mergeAssocArray($this->excludes, $def->excludes);

        if (!empty($def->content_model)) {
            if ($this->content_model === null || $this->content_model === '') {
                // nothing to extend: adopt the new model as-is instead of
                // producing a string with a dangling leading ' | '
                $this->content_model = $def->content_model;
            } else {
                $this->content_model .= ' | ' . $def->content_model;
            }
            // the content model changed, so any existing child def is stale
            $this->child = false;
        }
        if (!empty($def->content_model_type)) {
            $this->content_model_type = $def->content_model_type;
            $this->child = false;
        }
        // an explicit child def on the incoming definition wins over the resets above
        if (!is_null($def->child)) {
            $this->child = $def->child;
        }
        // only ever switched on by a merge, never switched off
        if ($def->descendants_are_inline) {
            $this->descendants_are_inline = $def->descendants_are_inline;
        }
        if (!is_null($def->safe)) {
            $this->safe = $def->safe;
        }

    }

    /**
     * Merges one array into another; a value that is exactly false in $a2
     * removes the corresponding key from $a1 instead of being copied.
     * @param $a1 Array by reference that is merged into
     * @param $a2 Array that merges into $a1
     */
    public function _mergeAssocArray(&$a1, $a2) {
        foreach ($a2 as $k => $v) {
            if ($v === false) {
                unset($a1[$k]);
                continue;
            }
            $a1[$k] = $v;
        }
    }

    /**
     * Retrieves a copy of the element definition.
     *
     * The copy is produced by a serialize()/unserialize() round-trip of
     * $this, so every property value must be serializable.
     *
     * @return Copy of this HTMLPurifier_ElementDef
     */
    public function copy() {
        return unserialize(serialize($this));
    }

}
|
|
|
|
|