2 Copyright (c) 2003-2011, CKSource - Frederico Knabben. All rights reserved.
\r
3 For licensing, see LICENSE.html or http://ckeditor.com/license
\r
8 var fragmentPrototype = CKEDITOR.htmlParser.fragment.prototype,
\r
9 elementPrototype = CKEDITOR.htmlParser.element.prototype;
\r
11 fragmentPrototype.onlyChild = elementPrototype.onlyChild = function()
\r
13 var children = this.children,
\r
14 count = children.length,
\r
15 firstChild = ( count == 1 ) && children[ 0 ];
\r
16 return firstChild || null;
\r
19 elementPrototype.removeAnyChildWithName = function( tagName )
\r
21 var children = this.children,
\r
25 for ( var i = 0; i < children.length; i++ )
\r
27 child = children[ i ];
\r
31 if ( child.name == tagName )
\r
33 childs.push( child );
\r
34 children.splice( i--, 1 );
\r
36 childs = childs.concat( child.removeAnyChildWithName( tagName ) );
\r
41 elementPrototype.getAncestor = function( tagNameRegex )
\r
43 var parent = this.parent;
\r
44 while ( parent && !( parent.name && parent.name.match( tagNameRegex ) ) )
\r
45 parent = parent.parent;
\r
49 fragmentPrototype.firstChild = elementPrototype.firstChild = function( evaluator )
\r
53 for ( var i = 0 ; i < this.children.length ; i++ )
\r
55 child = this.children[ i ];
\r
56 if ( evaluator( child ) )
\r
58 else if ( child.name )
\r
60 child = child.firstChild( evaluator );
\r
69 // Adding a (set) of styles to the element's 'style' attributes.
\r
70 elementPrototype.addStyle = function( name, value, isPrepend )
\r
72 var styleText, addingStyleText = '';
\r
74 if ( typeof value == 'string' )
\r
75 addingStyleText += name + ':' + value + ';';
\r
79 if ( typeof name == 'object' )
\r
81 for ( var style in name )
\r
83 if ( name.hasOwnProperty( style ) )
\r
84 addingStyleText += style + ':' + name[ style ] + ';';
\r
87 // raw style text form.
\r
89 addingStyleText += name;
\r
94 if ( !this.attributes )
\r
95 this.attributes = {};
\r
97 styleText = this.attributes.style || '';
\r
99 styleText = ( isPrepend ?
\r
100 [ addingStyleText, styleText ]
\r
101 : [ styleText, addingStyleText ] ).join( ';' );
\r
103 this.attributes.style = styleText.replace( /^;|;(?=;)/, '' );
\r
107 * Return the DTD-valid parent tag names of the specified one.
\r
110 CKEDITOR.dtd.parentOf = function( tagName )
\r
113 for ( var tag in this )
\r
115 if ( tag.indexOf( '$' ) == -1 && this[ tag ][ tagName ] )
\r
121 // 1. move consistent list item styles up to list root.
\r
122 // 2. clear out unnecessary list item numbering.
\r
123 function postProcessList( list )
\r
125 var children = list.children,
\r
128 count = list.children.length,
\r
131 styleTypeRegexp = /list-style-type:(.*?)(?:;|$)/,
\r
132 stylesFilter = CKEDITOR.plugins.pastefromword.filters.stylesFilter;
\r
134 attrs = list.attributes;
\r
135 if ( styleTypeRegexp.exec( attrs.style ) )
\r
138 for ( var i = 0; i < count; i++ )
\r
140 child = children[ i ];
\r
142 if ( child.attributes.value && Number( child.attributes.value ) == i + 1 )
\r
143 delete child.attributes.value;
\r
145 match = styleTypeRegexp.exec( child.attributes.style );
\r
149 if ( match[ 1 ] == mergeStyle || !mergeStyle )
\r
150 mergeStyle = match[ 1 ];
\r
161 for ( i = 0; i < count; i++ )
\r
163 attrs = children[ i ].attributes;
\r
164 attrs.style && ( attrs.style = stylesFilter( [ [ 'list-style-type'] ] )( attrs.style ) || '' );
\r
167 list.addStyle( 'list-style-type', mergeStyle );
\r
171 var cssLengthRelativeUnit = /^([.\d]*)+(em|ex|px|gd|rem|vw|vh|vm|ch|mm|cm|in|pt|pc|deg|rad|ms|s|hz|khz){1}?/i;
\r
172 var emptyMarginRegex = /^(?:\b0[^\s]*\s*){1,4}$/; // e.g. 0px 0pt 0px
\r
173 var romanLiternalPattern = '^m{0,4}(cm|cd|d?c{0,3})(xc|xl|l?x{0,3})(ix|iv|v?i{0,3})$',
\r
174 lowerRomanLiteralRegex = new RegExp( romanLiternalPattern ),
\r
175 upperRomanLiteralRegex = new RegExp( romanLiternalPattern.toUpperCase() );
\r
177 var orderedPatterns = { 'decimal' : /\d+/, 'lower-roman': lowerRomanLiteralRegex, 'upper-roman': upperRomanLiteralRegex, 'lower-alpha' : /^[a-z]+$/, 'upper-alpha': /^[A-Z]+$/ },
\r
178 unorderedPatterns = { 'disc' : /[l\u00B7\u2002]/, 'circle' : /[\u006F\u00D8]/,'square' : /[\u006E\u25C6]/},
\r
179 listMarkerPatterns = { 'ol' : orderedPatterns, 'ul' : unorderedPatterns },
\r
180 romans = [ [1000, 'M'], [900, 'CM'], [500, 'D'], [400, 'CD'], [100, 'C'], [90, 'XC'], [50, 'L'], [40, 'XL'], [10, 'X'], [9, 'IX'], [5, 'V'], [4, 'IV'], [1, 'I'] ],
\r
181 alpahbets = "ABCDEFGHIJKLMNOPQRSTUVWXYZ";
\r
183 // Convert roman numbering back to decimal.
\r
184 function fromRoman( str )
\r
186 str = str.toUpperCase();
\r
187 var l = romans.length, retVal = 0;
\r
188 for ( var i = 0; i < l; ++i )
\r
190 for ( var j = romans[i], k = j[1].length; str.substr( 0, k ) == j[1]; str = str.substr( k ) )
\r
196 // Convert alphabet numbering back to decimal.
\r
197 function fromAlphabet( str )
\r
199 str = str.toUpperCase();
\r
200 var l = alpahbets.length, retVal = 1;
\r
201 for ( var x = 1; str.length > 0; x *= l )
\r
203 retVal += alpahbets.indexOf( str.charAt( str.length - 1 ) ) * x;
\r
204 str = str.substr( 0, str.length - 1 );
\r
209 var listBaseIndent = 0,
\r
210 previousListItemMargin = null,
\r
213 var plugin = ( CKEDITOR.plugins.pastefromword =
\r
217 // Create a <cke:listbullet> which indicate an list item type.
\r
218 createListBulletMarker : function ( bullet, bulletText )
\r
220 var marker = new CKEDITOR.htmlParser.element( 'cke:listbullet' );
\r
221 marker.attributes = { 'cke:listsymbol' : bullet[ 0 ] };
\r
222 marker.add( new CKEDITOR.htmlParser.text( bulletText ) );
\r
226 isListBulletIndicator : function( element )
\r
228 var styleText = element.attributes && element.attributes.style;
\r
229 if ( /mso-list\s*:\s*Ignore/i.test( styleText ) )
\r
233 isContainingOnlySpaces : function( element )
\r
236 return ( ( text = element.onlyChild() )
\r
237 && ( /^(:?\s| )+$/ ).test( text.value ) );
\r
240 resolveList : function( element )
\r
242 // <cke:listbullet> indicate a list item.
\r
243 var attrs = element.attributes,
\r
246 if ( ( listMarker = element.removeAnyChildWithName( 'cke:listbullet' ) )
\r
247 && listMarker.length
\r
248 && ( listMarker = listMarker[ 0 ] ) )
\r
250 element.name = 'cke:li';
\r
254 attrs.style = plugin.filters.stylesFilter(
\r
256 // Text-indent is not representing list item level any more.
\r
259 // First attempt is to resolve indent level from on a constant margin increment.
\r
260 [ ( /^margin(:?-left)?$/ ), null, function( margin )
\r
262 // Deal with component/short-hand form.
\r
263 var values = margin.split( ' ' );
\r
264 margin = plugin.utils.convertToPx( values[ 3 ] || values[ 1 ] || values [ 0 ] );
\r
265 margin = parseInt( margin, 10 );
\r
267 // Figure out the indent unit by checking the first time of incrementation.
\r
268 if ( !listBaseIndent && previousListItemMargin !== null && margin > previousListItemMargin )
\r
269 listBaseIndent = margin - previousListItemMargin;
\r
271 previousListItemMargin = margin;
\r
273 attrs[ 'cke:indent' ] = listBaseIndent && ( Math.ceil( margin / listBaseIndent ) + 1 ) || 1;
\r
275 // The best situation: "mso-list:l0 level1 lfo2" tells the belonged list root, list item indentation, etc.
\r
276 [ ( /^mso-list$/ ), null, function( val )
\r
278 val = val.split( ' ' );
\r
279 var listId = Number( val[ 0 ].match( /\d+/ ) ),
\r
280 indent = Number( val[ 1 ].match( /\d+/ ) );
\r
282 listId !== previousListId && ( attrs[ 'cke:reset' ] = 1 );
\r
283 previousListId = listId;
\r
284 attrs[ 'cke:indent' ] = indent;
\r
286 ] )( attrs.style, element ) || '';
\r
289 // First level list item might be presented without a margin.
\r
292 // In case all above doesn't apply.
\r
293 if ( !attrs[ 'cke:indent' ] )
\r
295 previousListItemMargin = 0;
\r
296 attrs[ 'cke:indent' ] = 1;
\r
299 // Inherit attributes from bullet.
\r
300 CKEDITOR.tools.extend( attrs, listMarker.attributes );
\r
303 // Current list disconnected.
\r
305 previousListId = previousListItemMargin = listBaseIndent = null;
\r
310 // Convert various length units to 'px' in ignorance of DPI.
\r
311 convertToPx : ( function ()
\r
313 var calculator = CKEDITOR.dom.element.createFromHtml(
\r
314 '<div style="position:absolute;left:-9999px;' +
\r
315 'top:-9999px;margin:0px;padding:0px;border:0px;"' +
\r
316 '></div>', CKEDITOR.document );
\r
317 CKEDITOR.document.getBody().append( calculator );
\r
319 return function( cssLength )
\r
321 if ( cssLengthRelativeUnit.test( cssLength ) )
\r
323 calculator.setStyle( 'width', cssLength );
\r
324 return calculator.$.clientWidth + 'px';
\r
331 // Providing a shorthand style then retrieve one or more style component values.
\r
332 getStyleComponents : ( function()
\r
334 var calculator = CKEDITOR.dom.element.createFromHtml(
\r
335 '<div style="position:absolute;left:-9999px;top:-9999px;"></div>',
\r
336 CKEDITOR.document );
\r
337 CKEDITOR.document.getBody().append( calculator );
\r
339 return function( name, styleValue, fetchList )
\r
341 calculator.setStyle( name, styleValue );
\r
343 count = fetchList.length;
\r
344 for ( var i = 0; i < count; i++ )
\r
345 styles[ fetchList[ i ] ] = calculator.getStyle( fetchList[ i ] );
\r
351 listDtdParents : CKEDITOR.dtd.parentOf( 'ol' )
\r
356 // Transform a normal list into flat list items only presentation.
\r
357 // E.g. <ul><li>level1<ol><li>level2</li></ol></li> =>
\r
358 // <cke:li cke:listtype="ul" cke:indent="1">level1</cke:li>
\r
359 // <cke:li cke:listtype="ol" cke:indent="2">level2</cke:li>
\r
360 flattenList : function( element )
\r
362 var attrs = element.attributes,
\r
363 parent = element.parent;
\r
368 // Resolve how many level nested.
\r
371 parent.attributes && parent.attributes[ 'cke:list' ] && indentLevel++;
\r
372 parent = parent.parent;
\r
375 // All list items are of the same type.
\r
376 switch ( attrs.type )
\r
379 listStyleType = 'lower-alpha';
\r
381 // TODO: Support more list style type from MS-Word.
\r
384 var children = element.children,
\r
387 for ( var i = 0; i < children.length; i++ )
\r
389 child = children[ i ];
\r
390 var attributes = child.attributes;
\r
392 if ( child.name in CKEDITOR.dtd.$listItem )
\r
394 var listItemChildren = child.children,
\r
395 count = listItemChildren.length,
\r
396 last = listItemChildren[ count - 1 ];
\r
398 // Move out nested list.
\r
399 if ( last.name in CKEDITOR.dtd.$list )
\r
401 children.splice( i + 1, 0, last );
\r
402 last.parent = element;
\r
404 // Remove the parent list item if it's just a holder.
\r
405 if ( !--listItemChildren.length )
\r
406 children.splice( i, 1 );
\r
409 child.name = 'cke:li';
\r
411 // Inherit numbering from list root on the first list item.
\r
412 attrs.start && !i && ( attributes.value = attrs.start );
\r
414 plugin.filters.stylesFilter(
\r
416 [ 'tab-stops', null, function( val )
\r
418 var margin = val.split( ' ' )[ 1 ].match( cssLengthRelativeUnit );
\r
419 margin && ( previousListItemMargin = parseInt( plugin.utils.convertToPx( margin[ 0 ] ), 10 ) );
\r
421 [ 'mso-list', null, function( val )
\r
423 val = val.split( ' ' );
\r
424 var listId = Number( val[ 0 ].match( /\d+/ ) );
\r
425 listId !== previousListId && ( attributes[ 'cke:reset' ] = 1 );
\r
426 previousListId = listId;
\r
428 ] )( attributes.style );
\r
430 attributes[ 'cke:indent' ] = indentLevel;
\r
431 attributes[ 'cke:listtype' ] = element.name;
\r
432 attributes[ 'cke:list-style-type' ] = listStyleType;
\r
436 delete element.name;
\r
438 // We're loosing tag name here, signalize this element as a list.
\r
439 attrs[ 'cke:list' ] = 1;
\r
443 * Try to collect all list items among the children and establish one
\r
444 * or more HTML list structures for them.
\r
447 assembleList : function( element )
\r
449 var children = element.children, child,
\r
450 listItem, // The current processing cke:li element.
\r
452 listItemIndent, // Indent level of current list item.
\r
454 lastListItem, // The previous one just been added to the list.
\r
455 list, // Current staging list and it's parent list if any.
\r
457 previousListStyleType,
\r
460 // Properties of the list item are to be resolved from the list bullet.
\r
466 for ( var i = 0; i < children.length; i++ )
\r
468 child = children[ i ];
\r
470 if ( 'cke:li' == child.name )
\r
474 listItemAttrs = listItem.attributes;
\r
475 bullet = listItemAttrs[ 'cke:listsymbol' ];
\r
476 bullet = bullet && bullet.match( /^(?:[(]?)([^\s]+?)([.)]?)$/ );
\r
477 listType = listStyleType = itemNumeric = null;
\r
479 if ( listItemAttrs[ 'cke:ignored' ] )
\r
481 children.splice( i--, 1 );
\r
486 // This's from a new list root.
\r
487 listItemAttrs[ 'cke:reset' ] && ( list = lastIndent = lastListItem = null );
\r
489 // List item indent level might come from a real list indentation or
\r
490 // been resolved from a pseudo list item's margin value, even get
\r
491 // no indentation at all.
\r
492 listItemIndent = Number( listItemAttrs[ 'cke:indent' ] );
\r
494 // We're moving out of the current list, cleaning up.
\r
495 if ( listItemIndent != lastIndent )
\r
496 previousListType = previousListStyleType = null;
\r
498 // List type and item style are already resolved.
\r
501 listType = listItemAttrs[ 'cke:listtype' ] || 'ol';
\r
502 listStyleType = listItemAttrs[ 'cke:list-style-type' ];
\r
506 // Probably share the same list style type with previous list item,
\r
507 // give it priority to avoid ambiguous between C(Alpha) and C.(Roman).
\r
508 if ( previousListType && listMarkerPatterns[ previousListType ] [ previousListStyleType ].test( bullet[ 1 ] ) )
\r
510 listType = previousListType;
\r
511 listStyleType = previousListStyleType;
\r
515 for ( var type in listMarkerPatterns )
\r
517 for ( var style in listMarkerPatterns[ type ] )
\r
519 if ( listMarkerPatterns[ type ][ style ].test( bullet[ 1 ] ) )
\r
521 // Small numbering has higher priority, when dealing with ambiguous
\r
522 // between C(Alpha) and C.(Roman).
\r
523 if ( type == 'ol' && ( /alpha|roman/ ).test( style ) )
\r
525 var num = /roman/.test( style ) ? fromRoman( bullet[ 1 ] ) : fromAlphabet( bullet[ 1 ] );
\r
526 if ( !itemNumeric || num < itemNumeric )
\r
530 listStyleType = style;
\r
536 listStyleType = style;
\r
544 // Simply use decimal/disc for the rest forms of unrepresentable
\r
545 // numerals, e.g. Chinese..., but as long as there a second part
\r
546 // included, it has a bigger chance of being a order list ;)
\r
547 !listType && ( listType = bullet[ 2 ] ? 'ol' : 'ul' );
\r
550 previousListType = listType;
\r
551 previousListStyleType = listStyleType || ( listType == 'ol' ? 'decimal' : 'disc' );
\r
552 if ( listStyleType && listStyleType != ( listType == 'ol' ? 'decimal' : 'disc' ) )
\r
553 listItem.addStyle( 'list-style-type', listStyleType );
\r
555 // Figure out start numbering.
\r
556 if ( listType == 'ol' && bullet )
\r
558 switch ( listStyleType )
\r
561 itemNumeric = Number( bullet[ 1 ] );
\r
563 case 'lower-roman':
\r
564 case 'upper-roman':
\r
565 itemNumeric = fromRoman( bullet[ 1 ] );
\r
567 case 'lower-alpha':
\r
568 case 'upper-alpha':
\r
569 itemNumeric = fromAlphabet( bullet[ 1 ] );
\r
573 // Always create the numbering, swipe out unnecessary ones later.
\r
574 listItem.attributes.value = itemNumeric;
\r
577 // Start the list construction.
\r
580 openedLists.push( list = new CKEDITOR.htmlParser.element( listType ) );
\r
581 list.add( listItem );
\r
582 children[ i ] = list;
\r
586 if ( listItemIndent > lastIndent )
\r
588 openedLists.push( list = new CKEDITOR.htmlParser.element( listType ) );
\r
589 list.add( listItem );
\r
590 lastListItem.add( list );
\r
592 else if ( listItemIndent < lastIndent )
\r
594 // There might be a negative gap between two list levels. (#4944)
\r
595 var diff = lastIndent - listItemIndent,
\r
597 while ( diff-- && ( parent = list.parent ) )
\r
598 list = parent.parent;
\r
600 list.add( listItem );
\r
603 list.add( listItem );
\r
605 children.splice( i--, 1 );
\r
608 lastListItem = listItem;
\r
609 lastIndent = listItemIndent;
\r
612 list = lastIndent = lastListItem = null;
\r
615 for ( i = 0; i < openedLists.length; i++ )
\r
616 postProcessList( openedLists[ i ] );
\r
618 list = lastIndent = lastListItem = previousListId = previousListItemMargin = listBaseIndent = null;
\r
622 * A simple filter which always rejecting.
\r
624 falsyFilter : function( value )
\r
630 * A filter dedicated on the 'style' attribute filtering, e.g. dropping/replacing style properties.
\r
631 * @param styles {Array} in form of [ styleNameRegexp, styleValueRegexp,
\r
632 * newStyleValue/newStyleGenerator, newStyleName ] where only the first
\r
633 * parameter is mandatory.
\r
634 * @param whitelist {Boolean} Whether the {@param styles} will be considered as a white-list.
\r
636 stylesFilter : function( styles, whitelist )
\r
638 return function( styleText, element )
\r
641 // html-encoded quote might be introduced by 'font-family'
\r
642 // from MS-Word which confused the following regexp. e.g.
\r
643 //'font-family: "Lucida, Console"'
\r
644 ( styleText || '' )
\r
645 .replace( /"/g, '"' )
\r
646 .replace( /\s*([^ :;]+)\s*:\s*([^;]+)\s*(?=;|$)/g,
\r
647 function( match, name, value )
\r
649 name = name.toLowerCase();
\r
650 name == 'font-family' && ( value = value.replace( /["']/g, '' ) );
\r
656 for ( var i = 0 ; i < styles.length; i++ )
\r
660 namePattern = styles[ i ][ 0 ];
\r
661 valuePattern = styles[ i ][ 1 ];
\r
662 newValue = styles[ i ][ 2 ];
\r
663 newName = styles[ i ][ 3 ];
\r
665 if ( name.match( namePattern )
\r
666 && ( !valuePattern || value.match( valuePattern ) ) )
\r
668 name = newName || name;
\r
669 whitelist && ( newValue = newValue || value );
\r
671 if ( typeof newValue == 'function' )
\r
672 newValue = newValue( value, element, name );
\r
674 // Return an couple indicate both name and value
\r
676 if ( newValue && newValue.push )
\r
677 name = newValue[ 0 ], newValue = newValue[ 1 ];
\r
679 if ( typeof newValue == 'string' )
\r
680 rules.push( [ name, newValue ] );
\r
686 !whitelist && rules.push( [ name, value ] );
\r
690 for ( var i = 0 ; i < rules.length ; i++ )
\r
691 rules[ i ] = rules[ i ].join( ':' );
\r
692 return rules.length ?
\r
693 ( rules.join( ';' ) + ';' ) : false;
\r
698 * Migrate the element by decorate styles on it.
\r
699 * @param styleDefiniton
\r
702 elementMigrateFilter : function ( styleDefiniton, variables )
\r
704 return function( element )
\r
708 new CKEDITOR.style( styleDefiniton, variables )._.definition
\r
710 element.name = styleDef.element;
\r
711 CKEDITOR.tools.extend( element.attributes, CKEDITOR.tools.clone( styleDef.attributes ) );
\r
712 element.addStyle( CKEDITOR.style.getStyleText( styleDef ) );
\r
717 * Migrate styles by creating a new nested stylish element.
\r
718 * @param styleDefinition
\r
720 styleMigrateFilter : function( styleDefinition, variableName )
\r
723 var elementMigrateFilter = this.elementMigrateFilter;
\r
724 return function( value, element )
\r
726 // Build an stylish element first.
\r
727 var styleElement = new CKEDITOR.htmlParser.element( null ),
\r
730 variables[ variableName ] = value;
\r
731 elementMigrateFilter( styleDefinition, variables )( styleElement );
\r
732 // Place the new element inside the existing span.
\r
733 styleElement.children = element.children;
\r
734 element.children = [ styleElement ];
\r
739 * A filter which remove cke-namespaced-attribute on
\r
740 * all none-cke-namespaced elements.
\r
744 bogusAttrFilter : function( value, element )
\r
746 if ( element.name.indexOf( 'cke:' ) == -1 )
\r
751 * A filter which will be used to apply inline css style according the stylesheet
\r
752 * definition rules, is generated lazily when filtering.
\r
754 applyStyleFilter : null
\r
758 getRules : function( editor )
\r
760 var dtd = CKEDITOR.dtd,
\r
761 blockLike = CKEDITOR.tools.extend( {}, dtd.$block, dtd.$listItem, dtd.$tableContent ),
\r
762 config = editor.config,
\r
763 filters = this.filters,
\r
764 falsyFilter = filters.falsyFilter,
\r
765 stylesFilter = filters.stylesFilter,
\r
766 elementMigrateFilter = filters.elementMigrateFilter,
\r
767 styleMigrateFilter = CKEDITOR.tools.bind( this.filters.styleMigrateFilter, this.filters ),
\r
768 createListBulletMarker = this.utils.createListBulletMarker,
\r
769 flattenList = filters.flattenList,
\r
770 assembleList = filters.assembleList,
\r
771 isListBulletIndicator = this.utils.isListBulletIndicator,
\r
772 containsNothingButSpaces = this.utils.isContainingOnlySpaces,
\r
773 resolveListItem = this.utils.resolveList,
\r
774 convertToPx = this.utils.convertToPx,
\r
775 getStyleComponents = this.utils.getStyleComponents,
\r
776 listDtdParents = this.utils.listDtdParents,
\r
777 removeFontStyles = config.pasteFromWordRemoveFontStyles !== false,
\r
778 removeStyles = config.pasteFromWordRemoveStyles !== false;
\r
784 // Remove script, meta and link elements.
\r
785 [ ( /meta|link|script/ ), '' ]
\r
788 root : function( element )
\r
790 element.filterChildren();
\r
791 assembleList( element );
\r
796 '^' : function( element )
\r
798 // Transform CSS style declaration to inline style.
\r
799 var applyStyleFilter;
\r
800 if ( CKEDITOR.env.gecko && ( applyStyleFilter = filters.applyStyleFilter ) )
\r
801 applyStyleFilter( element );
\r
804 $ : function( element )
\r
806 var tagName = element.name || '',
\r
807 attrs = element.attributes;
\r
809 // Convert length unit of width/height on blocks to
\r
810 // a more editor-friendly way (px).
\r
811 if ( tagName in blockLike
\r
814 attrs.style = stylesFilter(
\r
815 [ [ ( /^(:?width|height)$/ ), null, convertToPx ] ] )( attrs.style ) || '';
\r
818 // Processing headings.
\r
819 if ( tagName.match( /h\d/ ) )
\r
821 element.filterChildren();
\r
822 // Is the heading actually a list item?
\r
823 if ( resolveListItem( element ) )
\r
826 // Adapt heading styles to editor's convention.
\r
827 elementMigrateFilter( config[ 'format_' + tagName ] )( element );
\r
829 // Remove inline elements which contain only empty spaces.
\r
830 else if ( tagName in dtd.$inline )
\r
832 element.filterChildren();
\r
833 if ( containsNothingButSpaces( element ) )
\r
834 delete element.name;
\r
836 // Remove element with ms-office namespace,
\r
837 // with it's content preserved, e.g. 'o:p'.
\r
838 else if ( tagName.indexOf( ':' ) != -1
\r
839 && tagName.indexOf( 'cke' ) == -1 )
\r
841 element.filterChildren();
\r
843 // Restore image real link from vml.
\r
844 if ( tagName == 'v:imagedata' )
\r
846 var href = element.attributes[ 'o:href' ];
\r
848 element.attributes.src = href;
\r
849 element.name = 'img';
\r
852 delete element.name;
\r
855 // Assembling list items into a whole list.
\r
856 if ( tagName in listDtdParents )
\r
858 element.filterChildren();
\r
859 assembleList( element );
\r
863 // We'll drop any style sheet, but Firefox conclude
\r
864 // certain styles in a single style element, which are
\r
865 // required to be changed into inline ones.
\r
866 'style' : function( element )
\r
868 if ( CKEDITOR.env.gecko )
\r
870 // Grab only the style definition section.
\r
871 var styleDefSection = element.onlyChild().value.match( /\/\* Style Definitions \*\/([\s\S]*?)\/\*/ ),
\r
872 styleDefText = styleDefSection && styleDefSection[ 1 ],
\r
873 rules = {}; // Storing the parsed result.
\r
875 if ( styleDefText )
\r
878 // Remove line-breaks.
\r
879 .replace(/[\n\r]/g,'')
\r
880 // Extract selectors and style properties.
\r
881 .replace( /(.+?)\{(.+?)\}/g,
\r
882 function( rule, selectors, styleBlock )
\r
884 selectors = selectors.split( ',' );
\r
885 var length = selectors.length, selector;
\r
886 for ( var i = 0; i < length; i++ )
\r
888 // Assume MS-Word mostly generate only simple
\r
889 // selector( [Type selector][Class selector]).
\r
890 CKEDITOR.tools.trim( selectors[ i ] )
\r
891 .replace( /^(\w+)(\.[\w-]+)?$/g,
\r
892 function( match, tagName, className )
\r
894 tagName = tagName || '*';
\r
895 className = className.substring( 1, className.length );
\r
897 // Reject MS-Word Normal styles.
\r
898 if ( className.match( /MsoNormal/ ) )
\r
901 if ( !rules[ tagName ] )
\r
902 rules[ tagName ] = {};
\r
904 rules[ tagName ][ className ] = styleBlock;
\r
906 rules[ tagName ] = styleBlock;
\r
911 filters.applyStyleFilter = function( element )
\r
913 var name = rules[ '*' ] ? '*' : element.name,
\r
914 className = element.attributes && element.attributes[ 'class' ],
\r
916 if ( name in rules )
\r
918 style = rules[ name ];
\r
919 if ( typeof style == 'object' )
\r
920 style = style[ className ];
\r
921 // Maintain style rules priorities.
\r
922 style && element.addStyle( style, true );
\r
930 'p' : function( element )
\r
932 // This's a fall-back approach to recognize list item in FF3.6,
\r
933 // as it's not perfect as not all list style (e.g. "heading list") is shipped
\r
934 // with this pattern. (#6662)
\r
935 if ( /MsoListParagraph/.exec( element.attributes[ 'class' ] ) )
\r
937 var bulletText = element.firstChild( function( node )
\r
939 return node.type == CKEDITOR.NODE_TEXT && !containsNothingButSpaces( node.parent );
\r
941 var bullet = bulletText && bulletText.parent,
\r
942 bulletAttrs = bullet && bullet.attributes;
\r
943 bulletAttrs && !bulletAttrs.style && ( bulletAttrs.style = 'mso-list: Ignore;' );
\r
946 element.filterChildren();
\r
948 // Is the paragraph actually a list item?
\r
949 if ( resolveListItem( element ) )
\r
952 // Adapt paragraph formatting to editor's convention
\r
953 // according to enter-mode.
\r
954 if ( config.enterMode == CKEDITOR.ENTER_BR )
\r
956 // We suffer from attribute/style lost in this situation.
\r
957 delete element.name;
\r
958 element.add( new CKEDITOR.htmlParser.element( 'br' ) );
\r
961 elementMigrateFilter( config[ 'format_' + ( config.enterMode == CKEDITOR.ENTER_P ? 'p' : 'div' ) ] )( element );
\r
964 'div' : function( element )
\r
966 // Aligned table with no text surrounded is represented by a wrapper div, from which
\r
967 // table cells inherit as text-align styles, which is wrong.
\r
968 // Instead we use a clear-float div after the table to properly achieve the same layout.
\r
969 var singleChild = element.onlyChild();
\r
970 if ( singleChild && singleChild.name == 'table' )
\r
972 var attrs = element.attributes;
\r
973 singleChild.attributes = CKEDITOR.tools.extend( singleChild.attributes, attrs );
\r
974 attrs.style && singleChild.addStyle( attrs.style );
\r
976 var clearFloatDiv = new CKEDITOR.htmlParser.element( 'div' );
\r
977 clearFloatDiv.addStyle( 'clear' ,'both' );
\r
978 element.add( clearFloatDiv );
\r
979 delete element.name;
\r
983 'td' : function ( element )
\r
985 // 'td' in 'thead' is actually <th>.
\r
986 if ( element.getAncestor( 'thead') )
\r
987 element.name = 'th';
\r
990 // MS-Word sometimes present list as a mixing of normal list
\r
991 // and pseudo-list, normalize the previous ones into pseudo form.
\r
992 'ol' : flattenList,
\r
993 'ul' : flattenList,
\r
994 'dl' : flattenList,
\r
996 'font' : function( element )
\r
998 // Drop the font tag if it comes from list bullet text.
\r
999 if ( isListBulletIndicator( element.parent ) )
\r
1001 delete element.name;
\r
1005 element.filterChildren();
\r
1007 var attrs = element.attributes,
\r
1008 styleText = attrs.style,
\r
1009 parent = element.parent;
\r
1011 if ( 'font' == parent.name ) // Merge nested <font> tags.
\r
1013 CKEDITOR.tools.extend( parent.attributes,
\r
1014 element.attributes );
\r
1015 styleText && parent.addStyle( styleText );
\r
1016 delete element.name;
\r
1018 // Convert the merged into a span with all attributes preserved.
\r
1021 styleText = styleText || '';
\r
1022 // IE's having those deprecated attributes, normalize them.
\r
1023 if ( attrs.color )
\r
1025 attrs.color != '#000000' && ( styleText += 'color:' + attrs.color + ';' );
\r
1026 delete attrs.color;
\r
1030 styleText += 'font-family:' + attrs.face + ';';
\r
1031 delete attrs.face;
\r
1033 // TODO: Mapping size in ranges of xx-small,
\r
1034 // x-small, small, medium, large, x-large, xx-large.
\r
1037 styleText += 'font-size:' +
\r
1038 ( attrs.size > 3 ? 'large'
\r
1039 : ( attrs.size < 3 ? 'small' : 'medium' ) ) + ';';
\r
1040 delete attrs.size;
\r
1043 element.name = 'span';
\r
1044 element.addStyle( styleText );
\r
1048 'span' : function( element )
\r
1050 // Remove the span if it comes from list bullet text.
\r
1051 if ( isListBulletIndicator( element.parent ) )
\r
1054 element.filterChildren();
\r
1055 if ( containsNothingButSpaces( element ) )
\r
1057 delete element.name;
\r
1061 // List item bullet type is supposed to be indicated by
\r
1062 // the text of a span with style 'mso-list : Ignore' or an image.
\r
1063 if ( isListBulletIndicator( element ) )
\r
1065 var listSymbolNode = element.firstChild( function( node )
\r
1067 return node.value || node.name == 'img';
\r
1070 var listSymbol = listSymbolNode && ( listSymbolNode.value || 'l.' ),
\r
1071 listType = listSymbol && listSymbol.match( /^(?:[(]?)([^\s]+?)([.)]?)$/ );
\r
1075 var marker = createListBulletMarker( listType, listSymbol );
\r
1076 // Some non-existed list items might be carried by an inconsequential list, indicate by "mso-hide:all/display:none",
\r
1077 // those are to be removed later, now mark it with "cke:ignored".
\r
1078 var ancestor = element.getAncestor( 'span' );
\r
1079 if ( ancestor && (/ mso-hide:\s*all|display:\s*none /).test( ancestor.attributes.style ) )
\r
1080 marker.attributes[ 'cke:ignored' ] = 1;
\r
1085 // Update the src attribute of image element with href.
\r
1086 var children = element.children,
\r
1087 attrs = element.attributes,
\r
1088 styleText = attrs && attrs.style,
\r
1089 firstChild = children && children[ 0 ];
\r
1091 // Assume MS-Word mostly carry font related styles on <span>,
\r
1092 // adapting them to editor's convention.
\r
1095 attrs.style = stylesFilter(
\r
1097 // Drop 'inline-height' style which make lines overlapping.
\r
1098 [ 'line-height' ],
\r
1099 [ ( /^font-family$/ ), null, !removeFontStyles ? styleMigrateFilter( config[ 'font_style' ], 'family' ) : null ] ,
\r
1100 [ ( /^font-size$/ ), null, !removeFontStyles ? styleMigrateFilter( config[ 'fontSize_style' ], 'size' ) : null ] ,
\r
1101 [ ( /^color$/ ), null, !removeFontStyles ? styleMigrateFilter( config[ 'colorButton_foreStyle' ], 'color' ) : null ] ,
\r
1102 [ ( /^background-color$/ ), null, !removeFontStyles ? styleMigrateFilter( config[ 'colorButton_backStyle' ], 'color' ) : null ]
\r
1103 ] )( styleText, element ) || '';
\r
1109 // Migrate basic style formats to editor configured ones.
\r
1110 'b' : elementMigrateFilter( config[ 'coreStyles_bold' ] ),
\r
1111 'i' : elementMigrateFilter( config[ 'coreStyles_italic' ] ),
\r
1112 'u' : elementMigrateFilter( config[ 'coreStyles_underline' ] ),
\r
1113 's' : elementMigrateFilter( config[ 'coreStyles_strike' ] ),
\r
1114 'sup' : elementMigrateFilter( config[ 'coreStyles_superscript' ] ),
\r
1115 'sub' : elementMigrateFilter( config[ 'coreStyles_subscript' ] ),
\r
1116 // Editor doesn't support anchor with content currently (#3582),
\r
1117 // drop such anchors with content preserved.
\r
1118 'a' : function( element )
\r
1120 var attrs = element.attributes;
\r
1121 if ( attrs && !attrs.href && attrs.name )
\r
1122 delete element.name;
\r
1124 'cke:listbullet' : function( element )
\r
1126 if ( element.getAncestor( /h\d/ ) && !config.pasteFromWordNumberedHeadingToList )
\r
1127 delete element.name;
\r
1133 // Remove onmouseover and onmouseout events (from MS Word comments effect)
\r
1134 [ ( /^onmouse(:?out|over)/ ), '' ],
\r
1135 // Onload on image element.
\r
1136 [ ( /^onload$/ ), '' ],
\r
1137 // Remove office and vml attribute from elements.
\r
1138 [ ( /(?:v|o):\w+/ ), '' ],
\r
1139 // Remove lang/language attributes.
\r
1140 [ ( /^lang/ ), '' ]
\r
1145 'style' : stylesFilter(
\r
1147 // Provide a white-list of styles that we preserve, those should
\r
1148 // be the ones that could later be altered with editor tools.
\r
1150 // Leave list-style-type
\r
1151 [ ( /^list-style-type$/ ), null ],
\r
1153 // Preserve margin-left/right which used as default indent style in the editor.
\r
1154 [ ( /^margin$|^margin-(?!bottom|top)/ ), null, function( value, element, name )
\r
1156 if ( element.name in { p : 1, div : 1 } )
\r
1158 var indentStyleName = config.contentsLangDirection == 'ltr' ?
\r
1159 'margin-left' : 'margin-right';
\r
1161 // Extract component value from 'margin' shorthand.
\r
1162 if ( name == 'margin' )
\r
1164 value = getStyleComponents( name, value,
\r
1165 [ indentStyleName ] )[ indentStyleName ];
\r
1167 else if ( name != indentStyleName )
\r
1170 if ( value && !emptyMarginRegex.test( value ) )
\r
1171 return [ indentStyleName, value ];
\r
1177 // Preserve clear float style.
\r
1178 [ ( /^clear$/ ) ],
\r
1180 [ ( /^border.*|margin.*|vertical-align|float$/ ), null,
\r
1181 function( value, element )
\r
1183 if ( element.name == 'img' )
\r
1187 [ (/^width|height$/ ), null,
\r
1188 function( value, element )
\r
1190 if ( element.name in { table : 1, td : 1, th : 1, img : 1 } )
\r
1194 // Otherwise provide a black-list of styles that we remove.
\r
1197 // Fixing color values.
\r
1198 [ ( /-color$/ ), null, function( value )
\r
1200 if ( value == 'transparent' )
\r
1202 if ( CKEDITOR.env.gecko )
\r
1203 return value.replace( /-moz-use-text-color/g, 'transparent' );
\r
1205 // Remove empty margin values, e.g. 0.00001pt 0em 0pt
\r
1206 [ ( /^margin$/ ), emptyMarginRegex ],
\r
1207 [ 'text-indent', '0cm' ],
\r
1208 [ 'page-break-before' ],
\r
1210 [ 'display', 'none' ],
\r
1211 removeFontStyles ? [ ( /font-?/ ) ] : null
\r
1212 ], removeStyles ),
\r
1214 // Prefer width styles over 'width' attributes.
\r
1215 'width' : function( value, element )
\r
1217 if ( element.name in dtd.$tableContent )
\r
1220 // Prefer border styles over table 'border' attributes.
\r
1221 'border' : function( value, element )
\r
1223 if ( element.name in dtd.$tableContent )
\r
1227 // Only Firefox carry style sheet from MS-Word, which
\r
1228 // will be applied by us manually. For other browsers
\r
1229 // the css className is useless.
\r
1230 'class' : falsyFilter,
\r
1232 // MS-Word always generate 'background-color' along with 'bgcolor',
\r
1233 // simply drop the deprecated attributes.
\r
1234 'bgcolor' : falsyFilter,
\r
1236 // Deprecate 'valign' attribute in favor of 'vertical-align'.
\r
1237 'valign' : removeStyles ? falsyFilter : function( value, element )
\r
1239 element.addStyle( 'vertical-align', value );
\r
1244 // Fore none-IE, some useful data might be buried under these IE-conditional
\r
1245 // comments where RegExp were the right approach to dig them out where usual approach
\r
1246 // is transform it into a fake element node which hold the desired data.
\r
1248 !CKEDITOR.env.ie ?
\r
1249 function( value, node )
\r
1251 var imageInfo = value.match( /<img.*?>/ ),
\r
1252 listInfo = value.match( /^\[if !supportLists\]([\s\S]*?)\[endif\]$/ );
\r
1254 // Seek for list bullet indicator.
\r
1257 // Bullet symbol could be either text or an image.
\r
1258 var listSymbol = listInfo[ 1 ] || ( imageInfo && 'l.' ),
\r
1259 listType = listSymbol && listSymbol.match( />(?:[(]?)([^\s]+?)([.)]?)</ );
\r
1260 return createListBulletMarker( listType, listSymbol );
\r
1263 // Reveal the <img> element in conditional comments for Firefox.
\r
1264 if ( CKEDITOR.env.gecko && imageInfo )
\r
1266 var img = CKEDITOR.htmlParser.fragment.fromHtml( imageInfo[ 0 ] ).children[ 0 ],
\r
1267 previousComment = node.previous,
\r
1268 // Try to dig the real image link from vml markup from previous comment text.
\r
1269 imgSrcInfo = previousComment && previousComment.value.match( /<v:imagedata[^>]*o:href=['"](.*?)['"]/ ),
\r
1270 imgSrc = imgSrcInfo && imgSrcInfo[ 1 ];
\r
1272 // Is there a real 'src' url to be used?
\r
1273 imgSrc && ( img.attributes.src = imgSrc );
\r
1284 // The paste processor here is just a reduced copy of html data processor.
\r
1285 var pasteProcessor = function()
\r
1287 this.dataFilter = new CKEDITOR.htmlParser.filter();
\r
1290 pasteProcessor.prototype =
\r
1292 toHtml : function( data )
\r
1294 var fragment = CKEDITOR.htmlParser.fragment.fromHtml( data, false ),
\r
1295 writer = new CKEDITOR.htmlParser.basicWriter();
\r
1297 fragment.writeHtml( writer, this.dataFilter );
\r
1298 return writer.getHtml( true );
\r
1302 CKEDITOR.cleanWord = function( data, editor )
\r
1304 // Firefox will be confused by those downlevel-revealed IE conditional
\r
1305 // comments, fixing them first( convert it to upperlevel-revealed one ).
\r
1306 // e.g. <![if !vml]>...<![endif]>
\r
1307 if ( CKEDITOR.env.gecko )
\r
1308 data = data.replace( /(<!--\[if[^<]*?\])-->([\S\s]*?)<!--(\[endif\]-->)/gi, '$1$2$3' );
\r
1310 var dataProcessor = new pasteProcessor(),
\r
1311 dataFilter = dataProcessor.dataFilter;
\r
1313 // These rules will have higher priorities than default ones.
\r
1314 dataFilter.addRules( CKEDITOR.plugins.pastefromword.getRules( editor ) );
\r
1316 // Allow extending data filter rules.
\r
1317 editor.fire( 'beforeCleanWord', { filter : dataFilter } );
\r
1321 data = dataProcessor.toHtml( data, false );
\r
1325 alert( editor.lang.pastefromword.error );
\r
1328 /* Below post processing those things that are unable to delivered by filter rules. */
\r
1330 // Remove 'cke' namespaced attribute used in filter rules as marker.
\r
1331 data = data.replace( /cke:.*?".*?"/g, '' );
\r
1333 // Remove empty style attribute.
\r
1334 data = data.replace( /style=""/g, '' );
\r
1336 // Remove the dummy spans ( having no inline style ).
\r
1337 data = data.replace( /<span>/g, '' );
\r
1344 * Whether to ignore all font related formatting styles, including:
\r
1345 * <ul> <li>font size;</li>
\r
1346 * <li>font family;</li>
\r
1347 * <li>font foreground/background color.</li></ul>
\r
1348 * @name CKEDITOR.config.pasteFromWordRemoveFontStyles
\r
1353 * config.pasteFromWordRemoveFontStyles = false;
\r
1357 * Whether to transform MS Word outline numbered headings into lists.
\r
1358 * @name CKEDITOR.config.pasteFromWordNumberedHeadingToList
\r
1363 * config.pasteFromWordNumberedHeadingToList = true;
\r
1367 * Whether to remove element styles that can't be managed with the editor. Note
\r
1368 * that this doesn't handle the font specific styles, which depends on the
\r
1369 * {@link CKEDITOR.config.pasteFromWordRemoveFontStyles} setting instead.
\r
1370 * @name CKEDITOR.config.pasteFromWordRemoveStyles
\r
1375 * config.pasteFromWordRemoveStyles = false;
\r