0
0
mirror of https://github.com/ezyang/htmlpurifier.git synced 2025-01-05 06:01:52 +00:00

[3.1.0] Add multi-parse capability for StringHash

git-svn-id: http://htmlpurifier.org/svnroot/htmlpurifier/trunk@1624 48356398-32a2-884e-a903-53898d9a118a
This commit is contained in:
Edward Z. Yang 2008-03-23 00:02:37 +00:00
parent b8f00ace1a
commit 848795d4a0
3 changed files with 89 additions and 10 deletions

View File

@ -21,21 +21,60 @@
* *
* We use this as an easy to use file-format for configuration schema * We use this as an easy to use file-format for configuration schema
* files, but the class itself is usage agnostic. * files, but the class itself is usage agnostic.
*
* You can use ---- to forcibly terminate parsing of a single string-hash;
* this marker is used in multi string-hashes to delimit boundaries.
*/ */
class HTMLPurifier_StringHashParser class HTMLPurifier_StringHashParser
{ {
public $default = 'ID'; public $default = 'ID';
/**
* Parses a file that contains a single string-hash.
*/
public function parseFile($file) { public function parseFile($file) {
if (!file_exists($file)) return false; if (!file_exists($file)) return false;
$fh = fopen($file, 'r'); $fh = fopen($file, 'r');
if (!$fh) return false;
$ret = $this->parseHandle($fh);
fclose($fh);
return $ret;
}
/**
* Parses a file that contains multiple string-hashes delimited by '----'
*/
public function parseMultiFile($file) {
if (!file_exists($file)) return false;
$ret = array();
$fh = fopen($file, 'r');
if (!$fh) return false;
while (!feof($fh)) {
$ret[] = $this->parseHandle($fh);
}
fclose($fh);
return $ret;
}
/**
* Internal parser that acepts a file handle.
* @note While it's possible to simulate in-memory parsing by using
* custom stream wrappers, if such a use-case arises we should
* factor out the file handle into its own class.
* @param $fh File handle with pointer at start of valid string-hash
* block.
*/
protected function parseHandle($fh) {
$state = false; $state = false;
$single = false; $single = false;
$ret = array(); $ret = array();
while (($line = fgets($fh)) !== false) { do {
$line = fgets($fh);
if ($line === false) break;
$line = rtrim($line, "\n\r"); $line = rtrim($line, "\n\r");
if (!$state && $line === '') continue; if (!$state && $line === '') continue;
if ($line === '----') break;
if (strncmp('--', $line, 2) === 0) { if (strncmp('--', $line, 2) === 0) {
// Multiline declaration // Multiline declaration
$state = trim($line, '- '); $state = trim($line, '- ');
@ -58,8 +97,7 @@ class HTMLPurifier_StringHashParser
if (!isset($ret[$state])) $ret[$state] = ''; if (!isset($ret[$state])) $ret[$state] = '';
$ret[$state] .= "$line\n"; $ret[$state] .= "$line\n";
} }
} } while (!feof($fh));
fclose($fh);
return $ret; return $ret;
} }

View File

@ -0,0 +1,18 @@
Namespace.Directive
TYPE: string
CHAIN-ME: 2
--DESCRIPTION--
Multiline
stuff
--FOR-WHO--
Single multiline
----
Namespace.Directive2
TYPE: integer
CHAIN-ME: 3
--DESCRIPTION--
M
stuff
--FOR-WHO--
Single multiline2

View File

@ -11,19 +11,19 @@ class HTMLPurifier_StringHashParserTest extends UnitTestCase
*/ */
protected $parser; protected $parser;
function setup() { public function setup() {
$this->parser = new HTMLPurifier_StringHashParser(); $this->parser = new HTMLPurifier_StringHashParser();
} }
/** /**
* Assert that $file gets parsed into the form of $expect * Assert that $file gets parsed into the form of $expect
*/ */
function assertParse($file, $expect) { public function assertParse($file, $expect) {
$result = $this->parser->parseFile(dirname(__FILE__) . '/StringHashParser/' . $file); $result = $this->parser->parseFile(dirname(__FILE__) . '/StringHashParser/' . $file);
$this->assertIdentical($result, $expect); $this->assertIdentical($result, $expect);
} }
function testSimple() { public function testSimple() {
$this->assertParse('Simple.txt', array( $this->assertParse('Simple.txt', array(
'ID' => 'Namespace.Directive', 'ID' => 'Namespace.Directive',
'TYPE' => 'string', 'TYPE' => 'string',
@ -33,26 +33,26 @@ class HTMLPurifier_StringHashParserTest extends UnitTestCase
)); ));
} }
function testOverrideSingle() { public function testOverrideSingle() {
$this->assertParse('OverrideSingle.txt', array( $this->assertParse('OverrideSingle.txt', array(
'KEY' => 'New', 'KEY' => 'New',
)); ));
} }
function testAppendMultiline() { public function testAppendMultiline() {
$this->assertParse('AppendMultiline.txt', array( $this->assertParse('AppendMultiline.txt', array(
'KEY' => "Line1\nLine2\n", 'KEY' => "Line1\nLine2\n",
)); ));
} }
function testDefault() { public function testDefault() {
$this->parser->default = 'NEW-ID'; $this->parser->default = 'NEW-ID';
$this->assertParse('Default.txt', array( $this->assertParse('Default.txt', array(
'NEW-ID' => 'DefaultValue', 'NEW-ID' => 'DefaultValue',
)); ));
} }
function testError() { public function testError() {
try { try {
$this->parser->parseFile('NoExist.txt'); $this->parser->parseFile('NoExist.txt');
} catch (HTMLPurifier_ConfigSchema_Exception $e) { } catch (HTMLPurifier_ConfigSchema_Exception $e) {
@ -60,4 +60,27 @@ class HTMLPurifier_StringHashParserTest extends UnitTestCase
} }
} }
public function testParseMultiple() {
$result = $this->parser->parseMultiFile(dirname(__FILE__) . '/StringHashParser/Multi.txt');
$this->assertIdentical(
$result,
array(
array(
'ID' => 'Namespace.Directive',
'TYPE' => 'string',
'CHAIN-ME' => '2',
'DESCRIPTION' => "Multiline\nstuff\n",
'FOR-WHO' => "Single multiline\n",
),
array(
'ID' => 'Namespace.Directive2',
'TYPE' => 'integer',
'CHAIN-ME' => '3',
'DESCRIPTION' => "M\nstuff\n",
'FOR-WHO' => "Single multiline2\n",
)
)
);
}
} }