mirror of
https://github.com/ezyang/htmlpurifier.git
synced 2024-12-22 08:21:52 +00:00
fac747bdbd
With minor corrections. Signed-off-by: Marcus Bointon <marcus@synchromedia.co.uk> Signed-off-by: Edward Z. Yang <ezyang@mit.edu>
137 lines
3.6 KiB
PHP
137 lines
3.6 KiB
PHP
<?php
|
|
|
|
/**
|
|
* Parses string hash files. File format is as such:
|
|
*
|
|
* DefaultKeyValue
|
|
* KEY: Value
|
|
* KEY2: Value2
|
|
* --MULTILINE-KEY--
|
|
* Multiline
|
|
* value.
|
|
*
|
|
* Which would output something similar to:
|
|
*
|
|
* array(
|
|
* 'ID' => 'DefaultKeyValue',
|
|
* 'KEY' => 'Value',
|
|
* 'KEY2' => 'Value2',
|
|
* 'MULTILINE-KEY' => "Multiline\nvalue.\n",
|
|
* )
|
|
*
|
|
* We use this as an easy to use file-format for configuration schema
|
|
* files, but the class itself is usage agnostic.
|
|
*
|
|
* You can use ---- to forcibly terminate parsing of a single string-hash;
|
|
* this marker is used in multi string-hashes to delimit boundaries.
|
|
*/
|
|
class HTMLPurifier_StringHashParser
|
|
{
|
|
|
|
/**
|
|
* @type string
|
|
*/
|
|
public $default = 'ID';
|
|
|
|
/**
|
|
* Parses a file that contains a single string-hash.
|
|
* @param string $file
|
|
* @return array
|
|
*/
|
|
public function parseFile($file)
|
|
{
|
|
if (!file_exists($file)) {
|
|
return false;
|
|
}
|
|
$fh = fopen($file, 'r');
|
|
if (!$fh) {
|
|
return false;
|
|
}
|
|
$ret = $this->parseHandle($fh);
|
|
fclose($fh);
|
|
return $ret;
|
|
}
|
|
|
|
/**
|
|
* Parses a file that contains multiple string-hashes delimited by '----'
|
|
* @param string $file
|
|
* @return array
|
|
*/
|
|
public function parseMultiFile($file)
|
|
{
|
|
if (!file_exists($file)) {
|
|
return false;
|
|
}
|
|
$ret = array();
|
|
$fh = fopen($file, 'r');
|
|
if (!$fh) {
|
|
return false;
|
|
}
|
|
while (!feof($fh)) {
|
|
$ret[] = $this->parseHandle($fh);
|
|
}
|
|
fclose($fh);
|
|
return $ret;
|
|
}
|
|
|
|
/**
|
|
* Internal parser that acepts a file handle.
|
|
* @note While it's possible to simulate in-memory parsing by using
|
|
* custom stream wrappers, if such a use-case arises we should
|
|
* factor out the file handle into its own class.
|
|
* @param resource $fh File handle with pointer at start of valid string-hash
|
|
* block.
|
|
* @return array
|
|
*/
|
|
protected function parseHandle($fh)
|
|
{
|
|
$state = false;
|
|
$single = false;
|
|
$ret = array();
|
|
do {
|
|
$line = fgets($fh);
|
|
if ($line === false) {
|
|
break;
|
|
}
|
|
$line = rtrim($line, "\n\r");
|
|
if (!$state && $line === '') {
|
|
continue;
|
|
}
|
|
if ($line === '----') {
|
|
break;
|
|
}
|
|
if (strncmp('--#', $line, 3) === 0) {
|
|
// Comment
|
|
continue;
|
|
} elseif (strncmp('--', $line, 2) === 0) {
|
|
// Multiline declaration
|
|
$state = trim($line, '- ');
|
|
if (!isset($ret[$state])) {
|
|
$ret[$state] = '';
|
|
}
|
|
continue;
|
|
} elseif (!$state) {
|
|
$single = true;
|
|
if (strpos($line, ':') !== false) {
|
|
// Single-line declaration
|
|
list($state, $line) = explode(':', $line, 2);
|
|
$line = trim($line);
|
|
} else {
|
|
// Use default declaration
|
|
$state = $this->default;
|
|
}
|
|
}
|
|
if ($single) {
|
|
$ret[$state] = $line;
|
|
$single = false;
|
|
$state = false;
|
|
} else {
|
|
$ret[$state] .= "$line\n";
|
|
}
|
|
} while (!feof($fh));
|
|
return $ret;
|
|
}
|
|
}
|
|
|
|
// vim: et sw=4 sts=4
|