mirror of
https://github.com/ezyang/htmlpurifier.git
synced 2025-01-24 14:21:52 +00:00
MOODLE-556: Normalization of whitespace in MathML token elements
This commit is contained in:
parent
e8f71f91da
commit
a721ae0ae6
@ -192,6 +192,7 @@ require 'HTMLPurifier/HTMLModule/Tidy/XHTML.php';
|
||||
require 'HTMLPurifier/Injector/AutoParagraph.php';
|
||||
require 'HTMLPurifier/Injector/DisplayLinkURI.php';
|
||||
require 'HTMLPurifier/Injector/Linkify.php';
|
||||
require 'HTMLPurifier/Injector/MathSpaceNormalize.php';
|
||||
require 'HTMLPurifier/Injector/PurifierLinkify.php';
|
||||
require 'HTMLPurifier/Injector/RemoveEmpty.php';
|
||||
require 'HTMLPurifier/Injector/RemoveSpansWithoutAttributes.php';
|
||||
|
@ -186,6 +186,7 @@ require_once $__dir . '/HTMLPurifier/HTMLModule/Tidy/XHTML.php';
|
||||
require_once $__dir . '/HTMLPurifier/Injector/AutoParagraph.php';
|
||||
require_once $__dir . '/HTMLPurifier/Injector/DisplayLinkURI.php';
|
||||
require_once $__dir . '/HTMLPurifier/Injector/Linkify.php';
|
||||
require_once $__dir . '/HTMLPurifier/Injector/MathSpaceNormalize.php';
|
||||
require_once $__dir . '/HTMLPurifier/Injector/PurifierLinkify.php';
|
||||
require_once $__dir . '/HTMLPurifier/Injector/RemoveEmpty.php';
|
||||
require_once $__dir . '/HTMLPurifier/Injector/RemoveSpansWithoutAttributes.php';
|
||||
|
@ -19,6 +19,9 @@ class HTMLPurifier_HTMLModule_Math extends HTMLPurifier_HTMLModule
|
||||
public function setup($config)
|
||||
{
|
||||
|
||||
// Normalize whitespace inside text elements as per MathML spec 2.1.7
|
||||
$this->info_injector[] = new HTMLPurifier_Injector_MathSpaceNormalize();
|
||||
|
||||
/*****************************************************************
|
||||
* Meta variables
|
||||
* Used in this file to simplify code and help adapt the DTD
|
||||
|
40
library/HTMLPurifier/Injector/MathSpaceNormalize.php
Normal file
40
library/HTMLPurifier/Injector/MathSpaceNormalize.php
Normal file
@ -0,0 +1,40 @@
|
||||
<?php
|
||||
|
||||
class HTMLPurifier_Injector_MathSpaceNormalize extends HTMLPurifier_Injector
|
||||
{
|
||||
|
||||
/**
|
||||
* Elements to apply handleText to.
|
||||
* These are those that accept #PCDATA except <cs> and <cbytes>.
|
||||
* @type array
|
||||
*/
|
||||
protected $tags = array('mi', 'mn', 'mo', 'ms', 'mtext', 'ci', 'cn', 'csymbol', 'annotation');
|
||||
|
||||
/**
|
||||
* @param HTMLPurifier_Token $token
|
||||
*/
|
||||
public function handleText(&$token)
|
||||
{
|
||||
|
||||
// No parent tag => return to avoid error on following line
|
||||
if (count($this->currentNesting) == 0) {
|
||||
return;
|
||||
}
|
||||
|
||||
// Get the parent tag
|
||||
$parent_token = $this->currentNesting[count($this->currentNesting) - 1];
|
||||
|
||||
// If we're not in a "token element" (specified in $tags above), return
|
||||
if ($parent_token === null || !in_array($parent_token->name, $this->tags)) {
|
||||
return;
|
||||
}
|
||||
|
||||
// Replace as per the MathML specification, section 2.1.7
|
||||
$token->data = preg_replace(
|
||||
'/[ \t\n\r]+/',
|
||||
' ',
|
||||
trim($token->data) // Using trim($token->data, ' \t\n\r') trims t,n,r
|
||||
);
|
||||
}
|
||||
|
||||
}
|
Loading…
Reference in New Issue
Block a user