(bug 14901) Email notification mistakes log action for new page creation
[lhc/web/wiklou.git] / includes / XmlTypeCheck.php
index 09b8c20..b95dd6a 100644 (file)
@@ -1,4 +1,24 @@
 <?php
+/**
+ * XML syntax and type checker.
+ *
+ * This program is free software; you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License as published by
+ * the Free Software Foundation; either version 2 of the License, or
+ * (at your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License along
+ * with this program; if not, write to the Free Software Foundation, Inc.,
+ * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
+ * http://www.gnu.org/copyleft/gpl.html
+ *
+ * @file
+ */
 
 class XmlTypeCheck {
        /**
@@ -7,87 +27,100 @@ class XmlTypeCheck {
         */
        public $wellFormed = false;
 
+       /**
+        * Will be set to true if the optional element filter returned
+        * a match at some point.
+        */
+       public $filterMatch = false;
+
        /**
         * Name of the document's root element, including any namespace
         * as an expanded URL.
         */
        public $rootElement = '';
 
-       private $softNamespaces;
-       private $namespaces = array();
-
        /**
         * @param $file string filename
-        * @param $softNamespaces bool
-        *        If set to true, use of undeclared XML namespaces will be ignored.
-        *        This matches the behavior of rsvg, but more compliant consumers
-        *        such as Firefox will reject such files.
-        *        Leave off for the default, stricter checks.
+        * @param $filterCallback callable (optional)
+        *        Function called from the SAX element handler event to do
+        *        additional custom validity checks. It receives the element name
+        *        (with its namespace) and attributes, but not the text contents.
+        *        The filter should return true to set $this->filterMatch.
         */
-       function __construct( $file, $softNamespaces=false ) {
-               $this->softNamespaces = $softNamespaces;
+       function __construct( $file, $filterCallback=null ) {
+               $this->filterCallback = $filterCallback;
                $this->run( $file );
        }
 
+       /**
+        * Get the root element. Simple accessor to $rootElement
+        *
+        * @return string
+        */
+       public function getRootElement() {
+               return $this->rootElement;
+       }
+
+       /**
+        * @param $fname string filename of the XML file to parse
+        */
        private function run( $fname ) {
-               if( $this->softNamespaces ) {
-                       $parser = xml_parser_create( 'UTF-8' );
-               } else {
-                       $parser = xml_parser_create_ns( 'UTF-8' );
-               }
+               $parser = xml_parser_create_ns( 'UTF-8' );
 
                // case folding violates XML standard, turn it off
                xml_parser_set_option( $parser, XML_OPTION_CASE_FOLDING, false );
 
-               xml_set_element_handler( $parser, array( $this, 'elementOpen' ), false );
+               xml_set_element_handler( $parser, array( $this, 'rootElementOpen' ), false );
+
+               if ( file_exists( $fname ) ) {
+                       $file = fopen( $fname, "rb" );
+                       if ( $file ) {
+                               do {
+                                       $chunk = fread( $file, 32768 );
+                                       $ret = xml_parse( $parser, $chunk, feof( $file ) );
+                                       if( $ret == 0 ) {
+                                               // XML isn't well-formed!
+                                               fclose( $file );
+                                               xml_parser_free( $parser );
+                                               return;
+                                       }
+                               } while( !feof( $file ) );
 
-               $file = fopen( $fname, "rb" );
-               do {
-                       $chunk = fread( $file, 32768 );
-                       $ret = xml_parse( $parser, $chunk, feof( $file ) );
-                       if( $ret == 0 ) {
-                               // XML isn't well-formed!
                                fclose( $file );
-                               xml_parser_free( $parser );
-                               return;
                        }
-               } while( !feof( $file ) );
+               }
 
                $this->wellFormed = true;
 
-               fclose( $file );
                xml_parser_free( $parser );
        }
 
-       private function elementOpen( $parser, $name, $attribs ) {
-               if( $this->softNamespaces ) {
-                       // Check namespaces manually, so expat doesn't throw
-                       // errors on use of undeclared namespaces.
-                       foreach( $attribs as $attrib => $val ) {
-                               if( $attrib == 'xmlns' ) {
-                                       $this->namespaces[''] = $val;
-                               } elseif( substr( $attrib, 0, strlen( 'xmlns:' ) ) == 'xmlns:' ) {
-                                       $this->namespaces[substr( $attrib, strlen( 'xmlns:' ) )] = $val;
-                               }
-                       }
-
-                       if( strpos( $name, ':' ) === false ) {
-                               $ns = '';
-                               $subname = $name;
-                       } else {
-                               list( $ns, $subname ) = explode( ':', $name, 2 );
-                       }
+       /**
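+        * @param $parser XML parser that fired the event
+        * @param $name string name of the element being opened
+        * @param $attribs array attributes of the element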
+        */
+       private function rootElementOpen( $parser, $name, $attribs ) {
+               $this->rootElement = $name;
 
-                       if( isset( $this->namespaces[$ns] ) ) {
-                               $name = $this->namespaces[$ns] . ':' . $subname;
-                       } else {
-                               // Technically this is invalid for XML with Namespaces.
-                               // But..... we'll just let it slide in soft mode.
-                       }
+               if( is_callable( $this->filterCallback ) ) {
+                       xml_set_element_handler( $parser, array( $this, 'elementOpen' ), false );
+                       $this->elementOpen( $parser, $name, $attribs );
+               } else {
+                       // We only need the first open element
+                       xml_set_element_handler( $parser, false, false );
                }
+       }
 
-               // We only need the first open element
-               $this->rootElement = $name;
-               xml_set_element_handler( $parser, false, false );
+       /**
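+        * @param $parser XML parser that fired the event
+        * @param $name string name of the element being opened
+        * @param $attribs array attributes of the element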
+        */
+       private function elementOpen( $parser, $name, $attribs ) {
+               if( call_user_func( $this->filterCallback, $name, $attribs ) ) {
+                       // Filter hit!
+                       $this->filterMatch = true;
+               }
        }
 }