/**
 * Tokenizes an HTML string by feeding it through an XML_HTMLSax3 parser.
 *
 * The token buffer and the "last token was empty" flag are reset, the
 * input is passed through $this->normalize(), and the parser is then run
 * with this object registered as the receiver of its open/close, data and
 * escape callbacks. While the parser runs, muteStrictErrorHandler() is
 * installed as the PHP error handler; the handler is restored afterwards,
 * even if parsing throws.
 *
 * @param string $string  HTML to tokenize
 * @param mixed  $config  forwarded unchanged to normalize()
 * @param mixed  $context forwarded unchanged to normalize()
 * @return array contents of $this->tokens once parsing has finished
 *               (presumably filled in by the registered handlers)
 */
public function tokenizeHTML($string, $config, $context)
{
    $this->tokens = array();
    $this->last_token_was_empty = false;

    $string = $this->normalize($string, $config, $context);

    // Remember whatever handler was active so it stays reachable through
    // $this->parent_handler while ours is installed.
    $this->parent_handler = set_error_handler(array($this, 'muteStrictErrorHandler'));

    try {
        $parser = new XML_HTMLSax3();
        $parser->set_object($this);
        $parser->set_element_handler('openHandler', 'closeHandler');
        $parser->set_data_handler('dataHandler');
        $parser->set_escape_handler('escapeHandler');

        // doesn't seem to work correctly for attributes
        $parser->set_option('XML_OPTION_ENTITIES_PARSED', 1);

        $parser->parse($string);
    } finally {
        // Always pop our handler off the stack; otherwise an exception
        // raised during parsing would leave it installed for all later code.
        restore_error_handler();
    }

    return $this->tokens;
}
/**
 * Runs an HTML string through XML_HTMLSax3 and returns the token buffer.
 *
 * The buffer in $this->tokens is cleared first, the input is passed
 * through $this->normalize(), and this object is registered with the
 * parser as the target of its element, data and escape callbacks.
 *
 * @param string $string  HTML to tokenize
 * @param mixed  $config  forwarded unchanged to normalize()
 * @param mixed  $context forwarded to normalize(); taken by reference
 * @return array contents of $this->tokens after the parse
 */
function tokenizeHTML($string, $config, &$context)
{
    // Start from an empty buffer on every call.
    $this->tokens = array();

    $normalized = $this->normalize($string, $config, $context);

    $sax = new XML_HTMLSax3();
    $sax->set_object($this);
    $sax->set_element_handler('openHandler', 'closeHandler');
    $sax->set_data_handler('dataHandler');
    $sax->set_escape_handler('escapeHandler');

    // doesn't seem to work correctly for attributes
    $sax->set_option('XML_OPTION_ENTITIES_PARSED', 1);

    $sax->parse($normalized);

    return $this->tokens;
}
/**
 * Parses the given markup with a fresh XML_HTMLSax3 instance.
 *
 * This object is registered as the callback target for element
 * open/close, character data and escape events, and the parser's
 * XML_OPTION_TRIM_DATA_NODES option is set to 0 before parsing starts.
 * Nothing is returned; any results come from the handler methods.
 *
 * @param string $data markup to parse
 * @access public
 */
function parse($data)
{
    $sax = new XML_HTMLSax3();

    // Route every parser event to methods on this object.
    $sax->set_object($this);
    $sax->set_element_handler('openHandler', 'closeHandler');
    $sax->set_data_handler('dataHandler');
    $sax->set_escape_handler('escapeHandler');

    $sax->set_option('XML_OPTION_TRIM_DATA_NODES', 0);

    $sax->parse($data);
}