394 lines
		
	
	
	
		
			12 KiB
		
	
	
	
		
			PHP
		
	
	
	
	
	
			
		
		
	
	
			394 lines
		
	
	
	
		
			12 KiB
		
	
	
	
		
			PHP
		
	
	
	
	
	
| <?php
 | |
| /**
 | |
|  * Atom Syndication Format PHP Library
 | |
|  *
 | |
|  * @package AtomLib
 | |
|  * @link http://code.google.com/p/phpatomlib/
 | |
|  *
 | |
|  * @author Elias Torres <elias@torrez.us>
 | |
|  * @version 0.4
 | |
|  * @since 2.3.0
 | |
|  */
 | |
| 
 | |
| /**
 | |
|  * Structure that store common Atom Feed Properties
 | |
|  *
 | |
|  * @package AtomLib
 | |
|  */
 | |
| class AtomFeed {
 | |
| 	/**
 | |
| 	 * Stores Links
 | |
| 	 * @var array
 | |
| 	 * @access public
 | |
| 	 */
 | |
|     var $links = array();
 | |
|     /**
 | |
|      * Stores Categories
 | |
|      * @var array
 | |
|      * @access public
 | |
|      */
 | |
|     var $categories = array();
 | |
| 	/**
 | |
| 	 * Stores Entries
 | |
| 	 *
 | |
| 	 * @var array
 | |
| 	 * @access public
 | |
| 	 */
 | |
|     var $entries = array();
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * Structure that store Atom Entry Properties
 | |
|  *
 | |
|  * @package AtomLib
 | |
|  */
 | |
| class AtomEntry {
 | |
| 	/**
 | |
| 	 * Stores Links
 | |
| 	 * @var array
 | |
| 	 * @access public
 | |
| 	 */
 | |
|     var $links = array();
 | |
|     /**
 | |
|      * Stores Categories
 | |
|      * @var array
 | |
| 	 * @access public
 | |
|      */
 | |
|     var $categories = array();
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * AtomLib Atom Parser API
 | |
|  *
 | |
|  * @package AtomLib
 | |
|  */
 | |
| class AtomParser {
 | |
| 
 | |
|     var $NS = 'http://www.w3.org/2005/Atom';
 | |
|     var $ATOM_CONTENT_ELEMENTS = array('content','summary','title','subtitle','rights');
 | |
|     var $ATOM_SIMPLE_ELEMENTS = array('id','updated','published','draft');
 | |
| 
 | |
|     var $debug = false;
 | |
| 
 | |
|     var $depth = 0;
 | |
|     var $indent = 2;
 | |
|     var $in_content;
 | |
|     var $ns_contexts = array();
 | |
|     var $ns_decls = array();
 | |
|     var $content_ns_decls = array();
 | |
|     var $content_ns_contexts = array();
 | |
|     var $is_xhtml = false;
 | |
|     var $is_html = false;
 | |
|     var $is_text = true;
 | |
|     var $skipped_div = false;
 | |
| 
 | |
|     var $FILE = "php://input";
 | |
| 
 | |
|     var $feed;
 | |
|     var $current;
 | |
| 
 | |
| 	/**
 | |
| 	 * PHP5 constructor.
 | |
| 	 */
 | |
|     function __construct() {
 | |
| 
 | |
|         $this->feed = new AtomFeed();
 | |
|         $this->current = null;
 | |
|         $this->map_attrs_func = array( __CLASS__, 'map_attrs' );
 | |
|         $this->map_xmlns_func = array( __CLASS__, 'map_xmlns' );
 | |
|     }
 | |
| 
 | |
| 	/**
 | |
| 	 * PHP4 constructor.
 | |
| 	 */
 | |
| 	public function AtomParser() {
 | |
| 		self::__construct();
 | |
| 	}
 | |
| 
 | |
| 	/**
 | |
| 	 * Map attributes to key="val"
 | |
| 	 *
 | |
| 	 * @param string $k Key
 | |
| 	 * @param string $v Value
 | |
| 	 * @return string
 | |
| 	 */
 | |
| 	public static function map_attrs($k, $v) {
 | |
| 		return "$k=\"$v\"";
 | |
| 	}
 | |
| 
 | |
| 	/**
 | |
| 	 * Map XML namespace to string.
 | |
| 	 *
 | |
| 	 * @param indexish $p XML Namespace element index
 | |
| 	 * @param array $n Two-element array pair. [ 0 => {namespace}, 1 => {url} ]
 | |
| 	 * @return string 'xmlns="{url}"' or 'xmlns:{namespace}="{url}"'
 | |
| 	 */
 | |
| 	public static function map_xmlns($p, $n) {
 | |
| 		$xd = "xmlns";
 | |
| 		if( 0 < strlen($n[0]) ) {
 | |
| 			$xd .= ":{$n[0]}";
 | |
| 		}
 | |
| 		return "{$xd}=\"{$n[1]}\"";
 | |
| 	}
 | |
| 
 | |
|     function _p($msg) {
 | |
|         if($this->debug) {
 | |
|             print str_repeat(" ", $this->depth * $this->indent) . $msg ."\n";
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     function error_handler($log_level, $log_text, $error_file, $error_line) {
 | |
|         $this->error = $log_text;
 | |
|     }
 | |
| 
 | |
|     function parse() {
 | |
| 
 | |
|         set_error_handler(array(&$this, 'error_handler'));
 | |
| 
 | |
|         array_unshift($this->ns_contexts, array());
 | |
| 
 | |
|         if ( ! function_exists( 'xml_parser_create_ns' ) ) {
 | |
|         	trigger_error( __( "PHP's XML extension is not available. Please contact your hosting provider to enable PHP's XML extension." ) );
 | |
|         	return false;
 | |
|         }
 | |
| 
 | |
|         $parser = xml_parser_create_ns();
 | |
|         xml_set_object($parser, $this);
 | |
|         xml_set_element_handler($parser, "start_element", "end_element");
 | |
|         xml_parser_set_option($parser,XML_OPTION_CASE_FOLDING,0);
 | |
|         xml_parser_set_option($parser,XML_OPTION_SKIP_WHITE,0);
 | |
|         xml_set_character_data_handler($parser, "cdata");
 | |
|         xml_set_default_handler($parser, "_default");
 | |
|         xml_set_start_namespace_decl_handler($parser, "start_ns");
 | |
|         xml_set_end_namespace_decl_handler($parser, "end_ns");
 | |
| 
 | |
|         $this->content = '';
 | |
| 
 | |
|         $ret = true;
 | |
| 
 | |
|         $fp = fopen($this->FILE, "r");
 | |
|         while ($data = fread($fp, 4096)) {
 | |
|             if($this->debug) $this->content .= $data;
 | |
| 
 | |
|             if(!xml_parse($parser, $data, feof($fp))) {
 | |
|                 /* translators: 1: error message, 2: line number */
 | |
|                 trigger_error(sprintf(__('XML Error: %1$s at line %2$s')."\n",
 | |
|                     xml_error_string(xml_get_error_code($parser)),
 | |
|                     xml_get_current_line_number($parser)));
 | |
|                 $ret = false;
 | |
|                 break;
 | |
|             }
 | |
|         }
 | |
|         fclose($fp);
 | |
| 
 | |
|         xml_parser_free($parser);
 | |
| 
 | |
|         restore_error_handler();
 | |
| 
 | |
|         return $ret;
 | |
|     }
 | |
| 
 | |
|     function start_element($parser, $name, $attrs) {
 | |
| 
 | |
|         $tag = array_pop(explode(":", $name));
 | |
| 
 | |
|         switch($name) {
 | |
|             case $this->NS . ':feed':
 | |
|                 $this->current = $this->feed;
 | |
|                 break;
 | |
|             case $this->NS . ':entry':
 | |
|                 $this->current = new AtomEntry();
 | |
|                 break;
 | |
|         };
 | |
| 
 | |
|         $this->_p("start_element('$name')");
 | |
|         #$this->_p(print_r($this->ns_contexts,true));
 | |
|         #$this->_p('current(' . $this->current . ')');
 | |
| 
 | |
|         array_unshift($this->ns_contexts, $this->ns_decls);
 | |
| 
 | |
|         $this->depth++;
 | |
| 
 | |
|         if(!empty($this->in_content)) {
 | |
| 
 | |
|             $this->content_ns_decls = array();
 | |
| 
 | |
|             if($this->is_html || $this->is_text)
 | |
|                 trigger_error("Invalid content in element found. Content must not be of type text or html if it contains markup.");
 | |
| 
 | |
|             $attrs_prefix = array();
 | |
| 
 | |
|             // resolve prefixes for attributes
 | |
|             foreach($attrs as $key => $value) {
 | |
|                 $with_prefix = $this->ns_to_prefix($key, true);
 | |
|                 $attrs_prefix[$with_prefix[1]] = $this->xml_escape($value);
 | |
|             }
 | |
| 
 | |
|             $attrs_str = join(' ', array_map($this->map_attrs_func, array_keys($attrs_prefix), array_values($attrs_prefix)));
 | |
|             if(strlen($attrs_str) > 0) {
 | |
|                 $attrs_str = " " . $attrs_str;
 | |
|             }
 | |
| 
 | |
|             $with_prefix = $this->ns_to_prefix($name);
 | |
| 
 | |
|             if(!$this->is_declared_content_ns($with_prefix[0])) {
 | |
|                 array_push($this->content_ns_decls, $with_prefix[0]);
 | |
|             }
 | |
| 
 | |
|             $xmlns_str = '';
 | |
|             if(count($this->content_ns_decls) > 0) {
 | |
|                 array_unshift($this->content_ns_contexts, $this->content_ns_decls);
 | |
|                 $xmlns_str .= join(' ', array_map($this->map_xmlns_func, array_keys($this->content_ns_contexts[0]), array_values($this->content_ns_contexts[0])));
 | |
|                 if(strlen($xmlns_str) > 0) {
 | |
|                     $xmlns_str = " " . $xmlns_str;
 | |
|                 }
 | |
|             }
 | |
| 
 | |
|             array_push($this->in_content, array($tag, $this->depth, "<". $with_prefix[1] ."{$xmlns_str}{$attrs_str}" . ">"));
 | |
| 
 | |
|         } else if(in_array($tag, $this->ATOM_CONTENT_ELEMENTS) || in_array($tag, $this->ATOM_SIMPLE_ELEMENTS)) {
 | |
|             $this->in_content = array();
 | |
|             $this->is_xhtml = $attrs['type'] == 'xhtml';
 | |
|             $this->is_html = $attrs['type'] == 'html' || $attrs['type'] == 'text/html';
 | |
|             $this->is_text = !in_array('type',array_keys($attrs)) || $attrs['type'] == 'text';
 | |
|             $type = $this->is_xhtml ? 'XHTML' : ($this->is_html ? 'HTML' : ($this->is_text ? 'TEXT' : $attrs['type']));
 | |
| 
 | |
|             if(in_array('src',array_keys($attrs))) {
 | |
|                 $this->current->$tag = $attrs;
 | |
|             } else {
 | |
|                 array_push($this->in_content, array($tag,$this->depth, $type));
 | |
|             }
 | |
|         } else if($tag == 'link') {
 | |
|             array_push($this->current->links, $attrs);
 | |
|         } else if($tag == 'category') {
 | |
|             array_push($this->current->categories, $attrs);
 | |
|         }
 | |
| 
 | |
|         $this->ns_decls = array();
 | |
|     }
 | |
| 
 | |
|     function end_element($parser, $name) {
 | |
| 
 | |
|         $tag = array_pop(explode(":", $name));
 | |
| 
 | |
|         $ccount = count($this->in_content);
 | |
| 
 | |
|         # if we are *in* content, then let's proceed to serialize it
 | |
|         if(!empty($this->in_content)) {
 | |
|             # if we are ending the original content element
 | |
|             # then let's finalize the content
 | |
|             if($this->in_content[0][0] == $tag &&
 | |
|                 $this->in_content[0][1] == $this->depth) {
 | |
|                 $origtype = $this->in_content[0][2];
 | |
|                 array_shift($this->in_content);
 | |
|                 $newcontent = array();
 | |
|                 foreach($this->in_content as $c) {
 | |
|                     if(count($c) == 3) {
 | |
|                         array_push($newcontent, $c[2]);
 | |
|                     } else {
 | |
|                         if($this->is_xhtml || $this->is_text) {
 | |
|                             array_push($newcontent, $this->xml_escape($c));
 | |
|                         } else {
 | |
|                             array_push($newcontent, $c);
 | |
|                         }
 | |
|                     }
 | |
|                 }
 | |
|                 if(in_array($tag, $this->ATOM_CONTENT_ELEMENTS)) {
 | |
|                     $this->current->$tag = array($origtype, join('',$newcontent));
 | |
|                 } else {
 | |
|                     $this->current->$tag = join('',$newcontent);
 | |
|                 }
 | |
|                 $this->in_content = array();
 | |
|             } else if($this->in_content[$ccount-1][0] == $tag &&
 | |
|                 $this->in_content[$ccount-1][1] == $this->depth) {
 | |
|                 $this->in_content[$ccount-1][2] = substr($this->in_content[$ccount-1][2],0,-1) . "/>";
 | |
|             } else {
 | |
|                 # else, just finalize the current element's content
 | |
|                 $endtag = $this->ns_to_prefix($name);
 | |
|                 array_push($this->in_content, array($tag, $this->depth, "</$endtag[1]>"));
 | |
|             }
 | |
|         }
 | |
| 
 | |
|         array_shift($this->ns_contexts);
 | |
| 
 | |
|         $this->depth--;
 | |
| 
 | |
|         if($name == ($this->NS . ':entry')) {
 | |
|             array_push($this->feed->entries, $this->current);
 | |
|             $this->current = null;
 | |
|         }
 | |
| 
 | |
|         $this->_p("end_element('$name')");
 | |
|     }
 | |
| 
 | |
|     function start_ns($parser, $prefix, $uri) {
 | |
|         $this->_p("starting: " . $prefix . ":" . $uri);
 | |
|         array_push($this->ns_decls, array($prefix,$uri));
 | |
|     }
 | |
| 
 | |
|     function end_ns($parser, $prefix) {
 | |
|         $this->_p("ending: #" . $prefix . "#");
 | |
|     }
 | |
| 
 | |
|     function cdata($parser, $data) {
 | |
|         $this->_p("data: #" . str_replace(array("\n"), array("\\n"), trim($data)) . "#");
 | |
|         if(!empty($this->in_content)) {
 | |
|             array_push($this->in_content, $data);
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     function _default($parser, $data) {
 | |
|         # when does this gets called?
 | |
|     }
 | |
| 
 | |
| 
 | |
|     function ns_to_prefix($qname, $attr=false) {
 | |
|         # split 'http://www.w3.org/1999/xhtml:div' into ('http','//www.w3.org/1999/xhtml','div')
 | |
|         $components = explode(":", $qname);
 | |
| 
 | |
|         # grab the last one (e.g 'div')
 | |
|         $name = array_pop($components);
 | |
| 
 | |
|         if(!empty($components)) {
 | |
|             # re-join back the namespace component
 | |
|             $ns = join(":",$components);
 | |
|             foreach($this->ns_contexts as $context) {
 | |
|                 foreach($context as $mapping) {
 | |
|                     if($mapping[1] == $ns && strlen($mapping[0]) > 0) {
 | |
|                         return array($mapping, "$mapping[0]:$name");
 | |
|                     }
 | |
|                 }
 | |
|             }
 | |
|         }
 | |
| 
 | |
|         if($attr) {
 | |
|             return array(null, $name);
 | |
|         } else {
 | |
|             foreach($this->ns_contexts as $context) {
 | |
|                 foreach($context as $mapping) {
 | |
|                     if(strlen($mapping[0]) == 0) {
 | |
|                         return array($mapping, $name);
 | |
|                     }
 | |
|                 }
 | |
|             }
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     function is_declared_content_ns($new_mapping) {
 | |
|         foreach($this->content_ns_contexts as $context) {
 | |
|             foreach($context as $mapping) {
 | |
|                 if($new_mapping == $mapping) {
 | |
|                     return true;
 | |
|                 }
 | |
|             }
 | |
|         }
 | |
|         return false;
 | |
|     }
 | |
| 
 | |
|     function xml_escape($string)
 | |
|     {
 | |
|              return str_replace(array('&','"',"'",'<','>'),
 | |
|                 array('&','"',''','<','>'),
 | |
|                 $string );
 | |
|     }
 | |
| }
 |