[239] | 1 | /*
|
---|
| 2 | Copyright (c) 2003-2011, CKSource - Frederico Knabben. All rights reserved.
|
---|
| 3 | For licensing, see LICENSE.html or http://ckeditor.com/license
|
---|
| 4 | */
|
---|
| 5 |
|
---|
/**
 * Creates a {@link CKEDITOR.htmlParser} class instance.
 * @class Provides an "event like" system to parse strings of HTML data.
 * The parser is a regex based tokenizer: it does not build a tree, it only
 * reports the tokens it finds through the overridable "on*" functions.
 * @example
 * var parser = new CKEDITOR.htmlParser();
 * parser.onTagOpen = function( tagName, attributes, selfClosing )
 *     {
 *         alert( tagName );
 *     };
 * parser.parse( '&lt;p&gt;Some &lt;b&gt;text&lt;/b&gt;.&lt;/p&gt;' );
 */
CKEDITOR.htmlParser = function()
{
	this._ =
	{
		// Tokenizer for closing tags, comments and opening tags. Groups:
		//   1 : tag name of a closing tag (everything between "</" and ">").
		//   2 : comment text.
		//   3 : tag name of an opening tag. "/" is excluded from the name so
		//       that "<br/>" yields "br" and leaves the slash to group 4.
		//   4 : raw attributes part of an opening tag, including the
		//       trailing "/" of a self-closing tag when present.
		htmlPartsRegex : new RegExp( '<(?:(?:\\/([^>]+)>)|(?:!--([\\S\\s]*?)-->)|(?:([^\\/\\s>]+)\\s*((?:(?:"[^"]*")|(?:\'[^\']*\')|[^"\'>])*)\\/?>))', 'g' )
	};
};

(function()
{
	// Matches one attribute at a time. Groups: 1 = name, 2 = double quoted
	// value, 3 = single quoted value, 4 = unquoted value.
	var attribsRegex = /([\w\-:.]+)(?:(?:\s*=\s*(?:(?:"([^"]*)")|(?:'([^']*)')|([^\s>]+)))|(?=\s|$))/g,

		// Boolean attributes: when found without a value, the attribute name
		// is used as its value (e.g. checked="checked").
		emptyAttribs = {checked:1,compact:1,declare:1,defer:1,disabled:1,ismap:1,multiple:1,nohref:1,noresize:1,noshade:1,nowrap:1,readonly:1,selected:1},

		hasOwn = Object.prototype.hasOwnProperty,
		trailingSpacesRegex = /\s+$/;

	CKEDITOR.htmlParser.prototype =
	{
		/**
		 * Function to be fired when a tag opener is found. This function
		 * should be overridden when using this class.
		 * @param {String} tagName The tag name. The name is guaranteed to be
		 *		lowercased.
		 * @param {Object} attributes An object containing all tag attributes. Each
		 *		property in this object represents an attribute name and its
		 *		value is the attribute value.
		 * @param {Boolean} selfClosing true if the tag closes itself, false if the
		 *		tag doesn't.
		 * @example
		 * var parser = new CKEDITOR.htmlParser();
		 * parser.onTagOpen = function( tagName, attributes, selfClosing )
		 *     {
		 *         alert( tagName );  // e.g. "b"
		 *     };
		 * parser.parse( "&lt;!-- Example --&gt;&lt;b&gt;Hello&lt;/b&gt;" );
		 */
		onTagOpen	: function() {},

		/**
		 * Function to be fired when a tag closer is found. This function
		 * should be overridden when using this class.
		 * @param {String} tagName The tag name. The name is guaranteed to be
		 *		lowercased.
		 * @example
		 * var parser = new CKEDITOR.htmlParser();
		 * parser.onTagClose = function( tagName )
		 *     {
		 *         alert( tagName );  // e.g. "b"
		 *     };
		 * parser.parse( "&lt;!-- Example --&gt;&lt;b&gt;Hello&lt;/b&gt;" );
		 */
		onTagClose	: function() {},

		/**
		 * Function to be fired when text is found. This function
		 * should be overridden when using this class.
		 * @param {String} text The text found.
		 * @example
		 * var parser = new CKEDITOR.htmlParser();
		 * parser.onText = function( text )
		 *     {
		 *         alert( text );  // e.g. "Hello"
		 *     };
		 * parser.parse( "&lt;!-- Example --&gt;&lt;b&gt;Hello&lt;/b&gt;" );
		 */
		onText		: function() {},

		/**
		 * Function to be fired when the raw content of a CDATA element (an
		 * element listed in CKEDITOR.dtd.$cdata) is found. This function
		 * should be overridden when using this class.
		 * @param {String} cdata The CDATA found.
		 * @example
		 * var parser = new CKEDITOR.htmlParser();
		 * parser.onCDATA = function( cdata )
		 *     {
		 *         alert( cdata );  // e.g. "var hello;"
		 *     };
		 * parser.parse( "&lt;script&gt;var hello;&lt;/script&gt;" );
		 */
		onCDATA		: function() {},

		/**
		 * Function to be fired when a comment is found. This function
		 * should be overridden when using this class.
		 * @param {String} comment The comment text.
		 * @example
		 * var parser = new CKEDITOR.htmlParser();
		 * parser.onComment = function( comment )
		 *     {
		 *         alert( comment );  // e.g. " Example "
		 *     };
		 * parser.parse( "&lt;!-- Example --&gt;&lt;b&gt;Hello&lt;/b&gt;" );
		 */
		onComment	: function() {},

		/**
		 * Parses text, looking for HTML tokens, like tag openers or closers,
		 * or comments. This function fires the onTagOpen, onTagClose, onText,
		 * onCDATA and onComment functions during its execution.
		 *
		 * While inside an element listed in CKEDITOR.dtd.$cdata, everything
		 * up to the matching closing tag is collected verbatim and sent in a
		 * single onCDATA call. If the input ends before that closing tag is
		 * found, the data collected so far is still sent through onCDATA.
		 * @param {String} html The HTML to be parsed.
		 * @example
		 * var parser = new CKEDITOR.htmlParser();
		 * // The onTagOpen, onTagClose, onText, onCDATA and onComment
		 * // functions should be overridden at this point.
		 * parser.parse( "&lt;!-- Example --&gt;&lt;b&gt;Hello&lt;/b&gt;" );
		 */
		parse : function( html )
		{
			var regex = this._.htmlPartsRegex,
				parts,
				tagName,
				nextIndex = 0,
				cdata;	// The collected data inside a CDATA section.

			for ( ;; )
			{
				// The scan position is owned by this call (nextIndex), not by
				// the shared regex object: a handler that throws, or that
				// calls parse() again on this instance, would otherwise leave
				// a stale lastIndex behind and corrupt this or the next scan.
				regex.lastIndex = nextIndex;
				parts = regex.exec( html );

				if ( !parts )
					break;

				var tagIndex = parts.index,
					// Read before any handler runs, for the reason above.
					matchEnd = regex.lastIndex;

				if ( tagIndex > nextIndex )
				{
					var text = html.substring( nextIndex, tagIndex );

					if ( cdata )
						cdata.push( text );
					else
						this.onText( text );
				}

				nextIndex = matchEnd;

				/*
				 "parts" is an array with the following items:
					0 : The entire match for opening/closing tags and comments.
					1 : Group filled with the tag name for closing tags.
					2 : Group filled with the comment text.
					3 : Group filled with the tag name for opening tags.
					4 : Group filled with the attributes part of opening tags.
				 */

				// Closing tag
				if ( ( tagName = parts[ 1 ] ) )
				{
					// Whitespace is allowed before the ">" of a closing tag
					// ("</script >"), and it is not part of the name.
					tagName = tagName.replace( trailingSpacesRegex, '' ).toLowerCase();

					if ( cdata && CKEDITOR.dtd.$cdata[ tagName ] )
					{
						// Send the CDATA data.
						this.onCDATA( cdata.join('') );
						cdata = null;
					}

					// A closing tag found inside CDATA that doesn't end it
					// falls through, to be saved as raw data below.
					if ( !cdata )
					{
						this.onTagClose( tagName );
						continue;
					}
				}

				// If CDATA is enabled, just save the raw match.
				if ( cdata )
				{
					cdata.push( parts[ 0 ] );
					continue;
				}

				// Opening tag
				if ( ( tagName = parts[ 3 ] ) )
				{
					tagName = tagName.toLowerCase();

					// There are some tag names that can break things, so let's
					// simply ignore them when parsing. (#5224)
					if ( /="/.test( tagName ) )
						continue;

					var attribs = {},
						attribMatch,
						attribsPart = parts[ 4 ],
						// The "/" of a self-closing tag is captured at the
						// end of the attributes part.
						selfClosing = !!( attribsPart && attribsPart.charAt( attribsPart.length - 1 ) == '/' );

					if ( attribsPart )
					{
						// This loop always runs until exec() returns null,
						// which resets the shared regex for the next use.
						while ( ( attribMatch = attribsRegex.exec( attribsPart ) ) )
						{
							var attName = attribMatch[1].toLowerCase(),
								attValue = attribMatch[2] || attribMatch[3] || attribMatch[4] || '';

							// Own-property check, so that names inherited from
							// Object.prototype (e.g. "constructor") are not
							// taken for boolean attributes.
							if ( !attValue && hasOwn.call( emptyAttribs, attName ) )
								attribs[ attName ] = attName;
							else
								attribs[ attName ] = attValue;
						}
					}

					this.onTagOpen( tagName, attribs, selfClosing );

					// Open CDATA mode when finding the appropriate tags.
					if ( !cdata && CKEDITOR.dtd.$cdata[ tagName ] )
						cdata = [];

					continue;
				}

				// Comment
				if ( ( tagName = parts[ 2 ] ) )
					this.onComment( tagName );
			}

			var tail = html.length > nextIndex ? html.substring( nextIndex, html.length ) : '';

			if ( cdata )
			{
				// The input ended inside a CDATA element: send what has been
				// collected instead of silently dropping it.
				if ( tail )
					cdata.push( tail );

				if ( cdata.length )
					this.onCDATA( cdata.join('') );
			}
			else if ( tail )
				this.onText( tail );
		}
	};
})();
|
---|