4 * Custom validation class, accepts DTD child definitions
6 * @warning Currently this class is an all or nothing proposition, that is,
7 * it will only give a bool return value.
9 class HTMLPurifier_ChildDef_Custom
extends HTMLPurifier_ChildDef
11 public $type = 'custom';
12 public $allow_empty = false;
14 * Allowed child pattern as defined by the DTD
18 * PCRE regex derived from $dtd_regex
23 * @param $dtd_regex Allowed child pattern from the DTD
25 public function __construct($dtd_regex) {
26 $this->dtd_regex
= $dtd_regex;
27 $this->_compileRegex();
30 * Compiles the PCRE regex from a DTD regex ($dtd_regex to $_pcre_regex)
32 protected function _compileRegex() {
33 $raw = str_replace(' ', '', $this->dtd_regex
);
37 $el = '[#a-zA-Z0-9_.-]+';
40 // COMPLICATED! AND MIGHT BE BUGGY! I HAVE NO CLUE WHAT I'M
41 // DOING! Seriously: if there's problems, please report them.
43 // collect all elements into the $elements array
44 preg_match_all("/$el/", $reg, $matches);
45 foreach ($matches[0] as $match) {
46 $this->elements
[$match] = true;
49 // setup all elements as parentheticals with leading commas
50 $reg = preg_replace("/$el/", '(,\\0)', $reg);
52 // remove commas when they were not solicited
53 $reg = preg_replace("/([^,(|]\(+),/", '\\1', $reg);
55 // remove all non-paranthetical commas: they are handled by first regex
56 $reg = preg_replace("/,\(/", '(', $reg);
58 $this->_pcre_regex
= $reg;
60 public function validateChildren($tokens_of_children, $config, $context) {
61 $list_of_children = '';
62 $nesting = 0; // depth into the nest
63 foreach ($tokens_of_children as $token) {
64 if (!empty($token->is_whitespace
)) continue;
66 $is_child = ($nesting == 0); // direct
68 if ($token instanceof HTMLPurifier_Token_Start
) {
70 } elseif ($token instanceof HTMLPurifier_Token_End
) {
75 $list_of_children .= $token->name
. ',';
78 // add leading comma to deal with stray comma declarations
79 $list_of_children = ',' . rtrim($list_of_children, ',');
82 '/^,?'.$this->_pcre_regex
.'$/',