2 Copyright (c) 2003-2011, CKSource - Frederico Knabben. All rights reserved.
\r
3 For licensing, see LICENSE.html or http://ckeditor.com/license
\r
// Regex to scan for &nbsp; at the end of blocks, which are actually placeholders.
// Safari transforms the &nbsp; to \xa0. (#4172)
// Leading tabs, line breaks and plain spaces are tolerated, but the text must
// end with exactly one filler (the "&nbsp;" entity or the \xa0 character).
var tailNbspRegex = /^[\t\r\n ]*(?:&nbsp;|\xa0)$/;

// Marker written at the start of the HTML comments that carry protected source.
var protectedSourceMarker = '{cke_protected}';
\r
/**
 * Return the last non-space child node of the block (#4344).
 * Trailing text nodes whose value trims to an empty string are skipped.
 * @param {Object} block Node exposing a "children" array.
 * @returns {Object|undefined} The last child that is not a whitespace-only
 *		text node, or undefined when there is none.
 */
function lastNoneSpaceChild( block )
{
	var children = block.children,
		index = children.length - 1,
		last = children[ index ];

	// Walk backwards; reading index -1 yields undefined, which ends the loop.
	while ( last && last.type == CKEDITOR.NODE_TEXT && !CKEDITOR.tools.trim( last.value ) )
		last = children[ --index ];

	return last;
}
\r
/**
 * Remove the filler node found at the end of a block.
 *
 * If we're converting from source or we're not in IE, a tailing BR node is
 * removed. Also, any &nbsp; at the end of blocks are fillers, remove them
 * as well.
 * @param {Object} block Node exposing a "children" array.
 * @param {Boolean} [fromSource] Whether the conversion is from source.
 */
function trimFillers( block, fromSource )
{
	var children = block.children,
		lastChild = lastNoneSpaceChild( block );

	// Nothing to trim in an empty (or whitespace-only) block.
	if ( !lastChild )
		return;

	// NOTE(review): pop() drops the physically last child; this assumes it is
	// the node returned by lastNoneSpaceChild() - confirm for blocks that end
	// with whitespace-only text nodes.
	if ( ( fromSource || !CKEDITOR.env.ie ) && lastChild.type == CKEDITOR.NODE_ELEMENT && lastChild.name == 'br' )
		children.pop();

	if ( lastChild.type == CKEDITOR.NODE_TEXT && tailNbspRegex.test( lastChild.value ) )
		children.pop();
}
\r
/**
 * Tell whether a block needs a filler node appended to it.
 * @param {Object} block Element node being checked.
 * @param {Boolean} fromSource Whether the conversion is from source.
 * @param {Boolean|Number|Function} [extendEmptyBlock] Only consulted when not
 *		converting from source: a falsy value disables the extension, and a
 *		function disables it when it returns exactly false for the block.
 * @returns {Boolean}
 */
function blockNeedsExtension( block, fromSource, extendEmptyBlock )
{
	if ( !fromSource && ( !extendEmptyBlock ||
		typeof extendEmptyBlock == 'function' && ( extendEmptyBlock( block ) === false ) ) )
		return false;

	// 1. For IE version >=8, empty blocks are displayed correctly themself in wysiwiyg;
	// 2. For the rest, at least table cell and list item need no filler space.
	if ( fromSource && CKEDITOR.env.ie &&
		( document.documentMode > 7
		|| block.name in CKEDITOR.dtd.tr
		|| block.name in CKEDITOR.dtd.$listItem ) )
		return false;

	var lastChild = lastNoneSpaceChild( block );

	// An empty block always needs the extension.
	if ( !lastChild )
		return true;

	return lastChild.type == CKEDITOR.NODE_ELEMENT && lastChild.name == 'br'
		// Some of the controls in form needs extension too,
		// to move cursor at the end of the form. (#4791)
		|| block.name == 'form' && lastChild.name == 'input';
}
\r
/**
 * Build a filter rule that normalizes the filler at the end of a block.
 * @param {Boolean} [isOutput] Truthy when the rule is used for data output;
 *		otherwise the rule treats the conversion as coming from source.
 * @param {Boolean|Number|Function} [emptyBlockFiller] Passed through to
 *		blockNeedsExtension() as its "extendEmptyBlock" argument.
 * @returns {Function} Rule taking the element node to process.
 */
function getBlockExtension( isOutput, emptyBlockFiller )
{
	return function( node )
	{
		trimFillers( node, !isOutput );

		if ( !blockNeedsExtension( node, !isOutput, emptyBlockFiller ) )
			return;

		// Output and IE get a non-breaking space, everything else a <br>.
		if ( isOutput || CKEDITOR.env.ie )
			node.add( new CKEDITOR.htmlParser.text( '\xa0' ) );
		else
			node.add( new CKEDITOR.htmlParser.element( 'br', {} ) );
	};
}
\r
var dtd = CKEDITOR.dtd;

// Define orders of table elements.
var tableOrder = [ 'caption', 'colgroup', 'col', 'thead', 'tfoot', 'tbody' ];

// Find out the list of block-like tags that can contain <br>.
var blockLikeTags = CKEDITOR.tools.extend( {}, dtd.$block, dtd.$listItem, dtd.$tableContent );
for ( var i in blockLikeTags )
{
	// Drop every tag whose DTD entry does not allow a <br> child.
	if ( ! ( 'br' in dtd[i] ) )
		delete blockLikeTags[i];
}
// We just avoid filler in <pre> right now.
// TODO: Support filler for <pre>, line break is also occupy line height.
delete blockLikeTags.pre;
\r
// Default rules applied by the data filter (registered on
// dataProcessor.dataFilter by the plugin).
var defaultDataFilterRules =
{
	elements :
	{
		// Flag links that carry a saved name with the "cke_anchor" class,
		// appending it to any class already present.
		a : function( element )
		{
			var attrs = element.attributes;
			if ( attrs && attrs[ 'data-cke-saved-name' ] )
				attrs[ 'class' ] = ( attrs[ 'class' ] ? attrs[ 'class' ] + ' ' : '' ) + 'cke_anchor';
		}
	},

	attributeNames :
	[
		// Event attributes (onXYZ) must not be directly set. They can become
		// active in the editing area (IE|WebKit).
		[ ( /^on/ ), 'data-cke-pa-on' ]
	]
};
\r
// Data filter rules for block-like tags: one filler-normalizing rule per tag,
// built without arguments (i.e. not in output mode).
var defaultDataBlockFilterRules = { elements : {} };

for ( var i in blockLikeTags )
	defaultDataBlockFilterRules.elements[ i ] = getBlockExtension();
\r
// Default rules applied by the HTML (output) filter (registered on
// dataProcessor.htmlFilter by the plugin).
var defaultHtmlFilterRules =
{
	elementNames :
	[
		// Remove the "cke:" namespace prefix.
		[ ( /^cke:/ ), '' ],

		// Ignore <?xml:namespace> tags.
		[ ( /^\?xml:namespace$/ ), '' ]
	],

	attributeNames :
	[
		// Attributes saved for changes and protected attributes.
		[ ( /^data-cke-(saved|pa)-/ ), '' ],

		// All "data-cke-" attributes are to be ignored.
		[ ( /^data-cke-.*/ ), '' ],

		[ 'hidefocus', '' ]
	],

	elements :
	{
		$ : function( element )
		{
			var attribs = element.attributes;

			if ( attribs )
			{
				// Elements marked as temporary are to be ignored.
				if ( attribs[ 'data-cke-temp' ] )
					return false;

				// Remove duplicated attributes - #3789.
				var attributeNames = [ 'name', 'href', 'src' ],
					savedAttributeName;
				for ( var i = 0 ; i < attributeNames.length ; i++ )
				{
					savedAttributeName = 'data-cke-saved-' + attributeNames[ i ];
					savedAttributeName in attribs && ( delete attribs[ attributeNames[ i ] ] );
				}
			}

			return element;
		},

		// The contents of table should be in correct order (#4809).
		table : function( element )
		{
			var children = element.children;
			children.sort( function ( node1, node2 )
			{
				// Only two element nodes are ordered against each other.
				if ( node1.type != CKEDITOR.NODE_ELEMENT || node2.type != node1.type )
					return 0;

				// Rank difference, so that equally ranked elements compare
				// as equal instead of both being reported as "smaller".
				return CKEDITOR.tools.indexOf( tableOrder, node1.name ) -
					CKEDITOR.tools.indexOf( tableOrder, node2.name );
			} );
		},

		embed : function( element )
		{
			var parent = element.parent;

			// If the <embed> is child of a <object>, copy the width
			// and height attributes from it.
			if ( parent && parent.name == 'object' )
			{
				var parentWidth = parent.attributes.width,
					parentHeight = parent.attributes.height;
				parentWidth && ( element.attributes.width = parentWidth );
				parentHeight && ( element.attributes.height = parentHeight );
			}
		},

		// Restore param elements into self-closing.
		param : function( param )
		{
			param.children = [];
			param.isEmpty = true;
			return param;
		},

		// Remove empty link but not empty anchor.(#3829)
		a : function( element )
		{
			if ( !( element.children.length ||
					element.attributes.name ||
					element.attributes[ 'data-cke-saved-name' ] ) )
			{
				return false;
			}
		},

		// Remove dummy span in webkit.
		span: function( element )
		{
			if ( element.attributes[ 'class' ] == 'Apple-style-span' )
				delete element.name;
		},

		// Empty <pre> in IE is reported with filler node (&nbsp;).
		pre : function( element ) { CKEDITOR.env.ie && trimFillers( element ); },

		html : function( element )
		{
			delete element.attributes.contenteditable;
			delete element.attributes[ 'class' ];
		},

		body : function( element )
		{
			delete element.attributes.spellcheck;
			delete element.attributes.contenteditable;
		},

		style : function( element )
		{
			var child = element.children[ 0 ];
			child && child.value && ( child.value = CKEDITOR.tools.trim( child.value ));

			if ( !element.attributes.type )
				element.attributes.type = 'text/css';
		},

		title : function( element )
		{
			var titleText = element.children[ 0 ];
			titleText && ( titleText.value = element.attributes[ 'data-cke-title' ] || '' );
		}
	},

	attributes :
	{
		'class' : function( value, element )
		{
			// Remove all class names starting with "cke_".
			return CKEDITOR.tools.ltrim( value.replace( /(?:^|\s+)cke_[^\s]*/g, '' ) ) || false;
		}
	}
};
\r
if ( CKEDITOR.env.ie )
{
	// IE outputs style attribute in capital letters. We should convert
	// them back to lower case, while not hurting the values (#5930)
	defaultHtmlFilterRules.attributes.style = function( value, element )
	{
		// Each match runs from the start of the value (or a ";") up to the
		// next ":", i.e. it covers a property name and never its value.
		return value.replace( /(^|;)([^\:]+)/g, function( match )
			{
				return match.toLowerCase();
			});
	};
}
\r
/**
 * Force an element to be non-editable, remembering its previous state in the
 * "data-cke-editable" attribute.
 * @param {Object} element Element node exposing an "attributes" map.
 */
function protectReadOnly( element )
{
	var attrs = element.attributes;

	// We should flag that the element was locked by our code so
	// it'll be editable by the editor functions (#6046).
	// 'true' records an explicit contenteditable value, 1 records that the
	// attribute was absent.
	if ( attrs.contenteditable != "false" )
		attrs[ 'data-cke-editable' ] = attrs.contenteditable ? 'true' : 1;

	attrs.contenteditable = "false";
}
\r
/**
 * Undo protectReadOnly(): restore the "contenteditable" state recorded in the
 * "data-cke-editable" attribute. Elements without the marker are untouched.
 * @param {Object} element Element node exposing an "attributes" map.
 */
function unprotectReadyOnly( element )
{
	var attrs = element.attributes;

	// The marker is written as the number 1 but arrives as the string "1"
	// once it has been through markup, so compare on the string form.
	switch ( String( attrs[ 'data-cke-editable' ] ) )
	{
		case 'true':	attrs.contenteditable = 'true';	break;
		case '1':		delete attrs.contenteditable;	break;
	}
}
\r
// Disable form elements editing mode provided by some browers. (#5746)
// The data filter locks the controls, the HTML filter restores them.
for ( var i in { input : 1, textarea : 1 } )
{
	defaultDataFilterRules.elements[ i ] = protectReadOnly;
	defaultHtmlFilterRules.elements[ i ] = unprotectReadyOnly;
}
\r
// Opening tags whose URL/name attributes get a "data-cke-saved-" copy.
var protectElementRegex = /<(a|area|img|input)\b([^>]*)>/gi,
	protectAttributeRegex = /\b(href|src|name)\s*=\s*(?:(?:"[^"]*")|(?:'[^']*')|(?:[^ "'>]+))/gi;

// Each <style> block is matched on its own (lazy body), so markup sitting
// between two style blocks is left alone.
var protectElementsRegex = /(?:<style(?=[ >])[^>]*>[\s\S]*?<\/style>)|(?:<(?:link|meta|base)[^>]*>)/gi,
	encodedElementsRegex = /<cke:encoded>([^<]*)<\/cke:encoded>/gi;

var protectElementNamesRegex = /(<\/?)((?:object|embed|param|html|body|head|title)[^>]*>)/gi,
	unprotectElementNamesRegex = /(<\/?)cke:((?:html|body|head|title)[^>]*>)/gi;

var protectSelfClosingRegex = /<cke:(param|embed)([^>]*?)\/?>(?!\s*<\/cke:\1)/gi;

/**
 * Duplicate the href/src/name attributes of a, area, img and input tags into
 * "data-cke-saved-*" attributes.
 * @param {String} html
 * @returns {String}
 */
function protectAttributes( html )
{
	return html.replace( protectElementRegex, function( element, tag, attributes )
	{
		return '<' + tag + attributes.replace( protectAttributeRegex, function( fullAttr, attrName )
		{
			// We should not rewrite the existed protected attributes, e.g. clipboard content from editor. (#5218)
			if ( attributes.indexOf( 'data-cke-saved-' + attrName ) == -1 )
				return ' data-cke-saved-' + fullAttr + ' ' + fullAttr;

			return fullAttr;
		}) + '>';
	});
}

/**
 * Replace <style> blocks and <link>/<meta>/<base> tags by a <cke:encoded>
 * element holding their URI-encoded markup.
 * @param {String} html
 * @returns {String}
 */
function protectElements( html )
{
	return html.replace( protectElementsRegex, function( match )
	{
		return '<cke:encoded>' + encodeURIComponent( match ) + '</cke:encoded>';
	});
}

/**
 * Reverse protectElements(): decode every <cke:encoded> element.
 * @param {String} html
 * @returns {String}
 */
function unprotectElements( html )
{
	return html.replace( encodedElementsRegex, function( match, encoded )
	{
		return decodeURIComponent( encoded );
	});
}

/**
 * Prefix object, embed, param, html, body, head and title tag names with "cke:".
 * @param {String} html
 * @returns {String}
 */
function protectElementsNames( html )
{
	return html.replace( protectElementNamesRegex, '$1cke:$2');
}

/**
 * Remove the "cke:" prefix from html, body, head and title tag names.
 * @param {String} html
 * @returns {String}
 */
function unprotectElementNames( html )
{
	return html.replace( unprotectElementNamesRegex, '$1$2' );
}

/**
 * Turn <cke:param> and <cke:embed> tags that are not directly followed by
 * their closing tag into an explicit open/close pair.
 * @param {String} html
 * @returns {String}
 */
function protectSelfClosingElements( html )
{
	return html.replace( protectSelfClosingRegex, '<cke:$1$2></cke:$1>' );
}
\r
/**
 * Duplicate the line break that directly follows a <pre> opening tag.
 * @param {String} html
 * @returns {String}
 */
function protectPreFormatted( html )
{
	return html.replace( /(<pre\b[^>]*>)(\r\n|\n)/g, '$1$2$2' );
}
\r
/**
 * Wrap every HTML comment that is not already a protected-source comment
 * into a protected comment flagged with "{C}".
 * @param {String} html
 * @returns {String}
 */
function protectRealComments( html )
{
	return html.replace( /<!--(?!\{cke_protected\})[\s\S]+?-->/g, function( match )
		{
			// "--" is not touched by encodeURIComponent; it is encoded by
			// hand so the payload holds no double hyphen.
			return '<!--' + protectedSourceMarker +
					'{C}' +
					encodeURIComponent( match ).replace( /--/g, '%2D%2D' ) +
					'-->';
		});
}
\r
/**
 * Reverse protectRealComments(): decode every protected comment flagged
 * with "{C}" back into its original markup.
 * @param {String} html
 * @returns {String}
 */
function unprotectRealComments( html )
{
	return html.replace( /<!--\{cke_protected\}\{C\}([\s\S]+?)-->/g, function( match, data )
		{
			return decodeURIComponent( data );
		});
}
\r
/**
 * Restore protected source: decode the protected comments, then replace each
 * "{cke_protected_N}" placeholder by entry N of the editor data store.
 * @param {String} html
 * @param {Object} editor Editor instance; "editor._.dataStore" is read.
 * @returns {String}
 */
function unprotectSource( html, editor )
{
	var store = editor._.dataStore;

	return html.replace( /<!--\{cke_protected\}([\s\S]+?)-->/g, function( match, data )
		{
			return decodeURIComponent( data );
		}).replace( /\{cke_protected_(\d+)\}/g, function( match, id )
		{
			// Unknown ids, or a missing store, yield an empty string.
			return store && store[ id ] || '';
		});
}
\r
/**
 * Hide comments, <script>, <noscript> and everything matched by
 * "config.protectedSource" behind protected HTML comments. Protected pieces
 * found inside quoted strings are moved to the editor data store and replaced
 * by "{cke_protected_N}" placeholders instead.
 * @param {String} data
 * @param {Object} editor Editor instance; "editor.config.protectedSource" is
 *		read and "editor._.dataStore" is created when missing.
 * @returns {String}
 */
function protectSource( data, editor )
{
	var protectedHtml = [],
		protectRegexes = editor.config.protectedSource,
		store = editor._.dataStore || ( editor._.dataStore = { id : 1 } ),
		tempRegex = /<\!--\{cke_temp(comment)?\}(\d*?)-->/g;

	var regexes =
		[
			// Script tags will also be forced to be protected, otherwise
			// IE will execute them.
			( /<script[\s\S]*?<\/script>/gi ),

			// <noscript> tags (get lost in IE and messed up in FF).
			/<noscript[\s\S]*?<\/noscript>/gi
		]
		// An unset setting must not add an "undefined" pattern to the list.
		.concat( protectRegexes || [] );

	// First of any other protection, we must protect all comments
	// to avoid loosing them (of course, IE related).
	// Note that we use a different tag for comments, as we need to
	// transform them when applying filters.
	data = data.replace( (/<!--[\s\S]*?-->/g), function( match )
		{
			return '<!--{cke_tempcomment}' + ( protectedHtml.push( match ) - 1 ) + '-->';
		});

	for ( var i = 0 ; i < regexes.length ; i++ )
	{
		data = data.replace( regexes[i], function( match )
			{
				match = match.replace( tempRegex, 		// There could be protected source inside another one. (#3869).
					function( $, isComment, id )
					{
						return protectedHtml[ id ];
					}
				);

				// Avoid protecting over protected, e.g. /\{.*?\}/
				return ( /cke_temp(comment)?/ ).test( match ) ? match
					: '<!--{cke_temp}' + ( protectedHtml.push( match ) - 1 ) + '-->';
			});
	}

	// Turn the temporary placeholders into the final protected comments.
	data = data.replace( tempRegex, function( $, isComment, id )
		{
			return '<!--' + protectedSourceMarker +
					( isComment ? '{C}' : '' ) +
					encodeURIComponent( protectedHtml[ id ] ).replace( /--/g, '%2D%2D' ) +
					'-->';
		}
	);

	// Different protection pattern is used for those that
	// live in attributes to avoid from being HTML encoded.
	return data.replace( /(['"]).*?\1/g, function ( match )
	{
		return match.replace( /<!--\{cke_protected\}([\s\S]+?)-->/g, function( match, data )
		{
			store[ store.id ] = decodeURIComponent( data );
			return '{cke_protected_'+ ( store.id++ ) + '}';
		});
	});
}
\r
// Registers the plugin: creates the editor data processor and loads the
// default filter rules into it.
CKEDITOR.plugins.add( 'htmldataprocessor',
{
	requires : [ 'htmlwriter' ],

	init : function( editor )
	{
		var dataProcessor = editor.dataProcessor = new CKEDITOR.htmlDataProcessor( editor );

		dataProcessor.writer.forceSimpleAmpersand = editor.config.forceSimpleAmpersand;

		dataProcessor.dataFilter.addRules( defaultDataFilterRules );
		dataProcessor.dataFilter.addRules( defaultDataBlockFilterRules );
		dataProcessor.htmlFilter.addRules( defaultHtmlFilterRules );

		// Output rules for block-like tags depend on the editor configuration,
		// so they are built per editor instance.
		var defaultHtmlBlockFilterRules = { elements : {} };
		for ( var tagName in blockLikeTags )
			defaultHtmlBlockFilterRules.elements[ tagName ] = getBlockExtension( true, editor.config.fillEmptyBlocks );

		dataProcessor.htmlFilter.addRules( defaultHtmlBlockFilterRules );
	},

	onLoad : function()
	{
		// Empty blocks are filled by default.
		! ( 'fillEmptyBlocks' in CKEDITOR.config ) && ( CKEDITOR.config.fillEmptyBlocks = 1 );
	}
});
\r
/**
 * Data processor bound to one editor instance. It owns an HTML writer and two
 * parser filters: "dataFilter" is applied by toHtml(), "htmlFilter" by
 * toDataFormat().
 * @constructor
 * @param {Object} editor The editor instance the processor belongs to.
 */
CKEDITOR.htmlDataProcessor = function( editor )
{
	this.editor = editor;

	this.writer = new CKEDITOR.htmlWriter();
	this.dataFilter = new CKEDITOR.htmlParser.filter();
	this.htmlFilter = new CKEDITOR.htmlParser.filter();
};
\r
CKEDITOR.htmlDataProcessor.prototype =
{
	/**
	 * Convert source data into the HTML used in the editing area: protect the
	 * fragile parts, let the browser fix the structure, then parse the result
	 * and apply the data filter.
	 * @param {String} data The source data.
	 * @param {String} [fixForBody] Passed through to the fragment parser.
	 * @returns {String}
	 */
	toHtml : function( data, fixForBody )
	{
		// The source data is already HTML, but we need to clean
		// it up and apply the filter.

		data = protectSource( data, this.editor );

		// Before anything, we must protect the URL attributes as the
		// browser may changing them when setting the innerHTML later in
		// the code.
		data = protectAttributes( data );

		// Protect elements than can't be set inside a DIV. E.g. IE removes
		// style tags from innerHTML. (#3710)
		data = protectElements( data );

		// Certain elements has problem to go through DOM operation, protect
		// them by prefixing 'cke' namespace. (#3591)
		data = protectElementsNames( data );

		// All none-IE browsers ignore self-closed custom elements,
		// protecting them into open-close. (#3591)
		data = protectSelfClosingElements( data );

		// Compensate one leading line break after <pre> open as browsers
		// eat it up. (#5789)
		data = protectPreFormatted( data );

		// Call the browser to help us fixing a possibly invalid HTML
		// structure.
		var div = new CKEDITOR.dom.element( 'div' );
		// Add fake character to workaround IE comments bug. (#3801)
		div.setHtml( 'a' + data );
		data = div.getHtml().substr( 1 );

		// Unprotect "some" of the protected elements at this point.
		data = unprotectElementNames( data );

		data = unprotectElements( data );

		// Restore the comments that have been protected, in this way they
		// can be properly filtered.
		data = unprotectRealComments( data );

		// Now use our parser to make further fixes to the structure, as
		// well as apply the filter.
		var fragment = CKEDITOR.htmlParser.fragment.fromHtml( data, fixForBody ),
			writer = new CKEDITOR.htmlParser.basicWriter();

		fragment.writeHtml( writer, this.dataFilter );
		data = writer.getHtml( true );

		// Protect the real comments again.
		data = protectRealComments( data );

		return data;
	},

	/**
	 * Convert editing-area HTML into output data: parse it, write it through
	 * the HTML filter, then restore the protected source.
	 * @param {String} html The HTML to convert.
	 * @param {String} [fixForBody] Passed through to the fragment parser.
	 * @returns {String}
	 */
	toDataFormat : function( html, fixForBody )
	{
		var writer = this.writer,
			fragment = CKEDITOR.htmlParser.fragment.fromHtml( html, fixForBody );

		// NOTE(review): reconstructed step - the shared writer is assumed to
		// be reset before each run; confirm against the pristine file.
		writer.reset();

		fragment.writeHtml( writer, this.htmlFilter );

		var data = writer.getHtml( true );

		// Restore those non-HTML protected source. (#4475,#4880)
		data = unprotectRealComments( data );
		data = unprotectSource( data, this.editor );

		return data;
	}
};
\r
573 * Whether to force using "&" instead of "&amp;" in elements attributes
\r
574 * values, it's not recommended to change this setting for compliance with the
\r
575 * W3C XHTML 1.0 standards (<a href="http://www.w3.org/TR/xhtml1/#C_12">C.12, XHTML 1.0</a>).
\r
576 * @name CKEDITOR.config.forceSimpleAmpersand
\r
577 * @name CKEDITOR.config.forceSimpleAmpersand
\r
581 * config.forceSimpleAmpersand = false;
\r
 * Whether a filler text (non-breaking space entity - &nbsp;) will be inserted into empty block elements in HTML output,
\r
586 * this is used to render block elements properly with line-height; When a function is instead specified,
\r
587 * it'll be passed a {@link CKEDITOR.htmlParser.element} to decide whether adding the filler text
\r
588 * by expecting a boolean return value.
\r
589 * @name CKEDITOR.config.fillEmptyBlocks
\r
594 * config.fillEmptyBlocks = false; // Prevent filler nodes in all empty blocks.
\r
596 * // Prevent filler node only in float cleaners.
\r
597 * config.fillEmptyBlocks = function( element )
\r
599 * if ( element.attributes[ 'class' ].indexOf ( 'clear-both' ) != -1 )
\r