2007-07-19 12:40:28 +02:00
|
|
|
<?php
|
|
|
|
|
2008-02-25 03:10:37 +01:00
|
|
|
/**
|
|
|
|
* @package sapphire
|
|
|
|
* @subpackage misc
|
|
|
|
*/
|
|
|
|
|
2007-07-19 12:40:28 +02:00
|
|
|
/**
|
|
|
|
* Base class for XML parsers
|
2008-02-25 03:10:37 +01:00
|
|
|
* @package sapphire
|
|
|
|
* @subpackage misc
|
2007-07-19 12:40:28 +02:00
|
|
|
*/
|
|
|
|
class XML extends Object {
|
|
|
|
protected $parser;
|
|
|
|
protected $context, $attributeStore;
|
|
|
|
protected $parsed;
|
|
|
|
protected $collatedText;
|
|
|
|
|
|
|
|
|
|
|
|
function tidyXHTML($content) {
|
|
|
|
$cleanFile = TEMP_FOLDER . "/cleaner.tmp";
|
|
|
|
$fh = fopen($cleanFile,"w");
|
|
|
|
fwrite($fh, $content);
|
|
|
|
fclose($fh);
|
|
|
|
|
|
|
|
if(file_exists($cleanFile)) {
|
|
|
|
$result = `tidy -asxhtml $cleanFile`;
|
|
|
|
unlink($cleanFile);
|
|
|
|
return $result;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
function parse($content, $recursive = false) {
|
|
|
|
$this->parser = xml_parser_create('UTF-8');
|
|
|
|
|
|
|
|
// Andrew keeps giving me the wrong FSKING encoding! :-P
|
|
|
|
$content = ereg_replace('encoding="[^"]+"','encoding="utf-8"', $content);
|
|
|
|
|
|
|
|
xml_parser_set_option($this->parser, XML_OPTION_CASE_FOLDING, false);
|
|
|
|
//xml_parser_set_option($this->parser, XML_OPTION_TARGET_ENCODING, 'UTF-8');
|
|
|
|
xml_set_object($this->parser, $this);
|
|
|
|
xml_set_element_handler($this->parser, "tag_open", "tag_close");
|
|
|
|
xml_set_character_data_handler($this->parser, "cdata");
|
|
|
|
|
|
|
|
$this->parsed = null;
|
|
|
|
$this->context = array();
|
|
|
|
$this->attributeStore = array();
|
|
|
|
|
|
|
|
xml_parse($this->parser, $content);
|
|
|
|
|
|
|
|
// Handle a bad encoding type by forcing ISO-8859-15
|
|
|
|
if(xml_get_error_code($this->parser) == 32 && !$recursive) {
|
|
|
|
$content = ereg_replace('encoding="[^"]+"','encoding="utf-8"', $content);
|
|
|
|
return $this->parse($content, true);
|
|
|
|
}
|
|
|
|
|
|
|
|
if($err = xml_get_error_code($this->parser)) {
|
|
|
|
user_error("XML parser broke with error $err:" . xml_error_string($err), E_USER_ERROR);
|
|
|
|
}
|
|
|
|
|
|
|
|
return $this->parsed;
|
|
|
|
}
|
|
|
|
|
|
|
|
function inContext() {
|
|
|
|
$items = func_get_args();
|
|
|
|
$i=0;
|
|
|
|
foreach($items as $item) {
|
|
|
|
while($i < sizeof($this->context)) {
|
|
|
|
if($this->context[$i] == $item) break;
|
|
|
|
$i++;
|
|
|
|
}
|
|
|
|
if($this->context[$i] != $item) return false;
|
|
|
|
}
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
function stackActionFor($tag) {
|
|
|
|
for($i=sizeof($this->contextStack)-1;$i>=0;$i--) {
|
|
|
|
if($this->context[$i]['tag'] == $tag) return $this->contextStack[$i]['action'];
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
function tag_open($parser, $tag, $attributes) {
|
|
|
|
// Strip namespaces out of tags and attributes
|
|
|
|
$tag = ereg_replace('[^:]+:','',$tag);
|
|
|
|
if($attributes) foreach($attributes as $k => $v) $newAttributes[ereg_replace('[^:]+:','',$k)] = $v;
|
2007-11-26 05:20:19 +01:00
|
|
|
$attributes = isset($newAttributes) ? $newAttributes : $attributes;
|
2007-07-19 12:40:28 +02:00
|
|
|
|
|
|
|
|
2007-11-26 05:20:19 +01:00
|
|
|
if(isset($attributes['class'])) {
|
2007-07-19 12:40:28 +02:00
|
|
|
$this->context[] = "$tag.{$attributes['class']}";
|
|
|
|
} else {
|
|
|
|
$this->context[] = $tag;
|
|
|
|
}
|
|
|
|
$this->attributeStore[] = $attributes;
|
|
|
|
|
|
|
|
$this->collatedText = "";
|
|
|
|
|
|
|
|
$tagProcessorFunc = "process_$tag";
|
|
|
|
if($this->hasMethod($tagProcessorFunc)) {
|
|
|
|
$this->$tagProcessorFunc($attributes);
|
2007-11-26 05:20:19 +01:00
|
|
|
}elseif($this->hasMethod($tagProcessorFunc = "process_tag")){
|
|
|
|
$this->$tagProcessorFunc($tag, $attributes);
|
2007-07-19 12:40:28 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
if($attributes) foreach($attributes as $k => $v) {
|
|
|
|
$attProcessorFunc = "processatt_$k";
|
|
|
|
if($this->hasMethod($attProcessorFunc)) {
|
|
|
|
$this->$attProcessorFunc($tag, $attributes);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
function tag_close($parser, $tag) {
|
|
|
|
$tag = ereg_replace('[^:]+:','',$tag);
|
|
|
|
|
|
|
|
array_pop($this->context);
|
|
|
|
$attributes = array_pop($this->attributeStore);
|
|
|
|
|
|
|
|
if(method_exists($this, $funcName = "process_{$tag}_end")) {
|
|
|
|
$this->$funcName($this->collatedText, $attributes);
|
2007-11-26 05:20:19 +01:00
|
|
|
}elseif(method_exists($this,$funcName = "process_tag_end")){
|
|
|
|
// else run default method
|
|
|
|
$this->$funcName($tag,$this->collatedText, $attributes);
|
2007-07-19 12:40:28 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
$this->collatedText = "";
|
|
|
|
}
|
|
|
|
|
|
|
|
function cdata($parser, $cdata) {
|
|
|
|
$this->collatedText .= $cdata;
|
|
|
|
}
|
|
|
|
}
|