JasonWoof Got questions, comments, patches, etc.? Contact Jason Woofenden
vanilla ckeditor-3.5.3
[ckeditor.git] / _source / plugins / pastefromword / filter / default.js
1 /*\r
2 Copyright (c) 2003-2011, CKSource - Frederico Knabben. All rights reserved.\r
3 For licensing, see LICENSE.html or http://ckeditor.com/license\r
4 */\r
5 \r
6 (function()\r
7 {\r
8         var fragmentPrototype = CKEDITOR.htmlParser.fragment.prototype,\r
9                 elementPrototype = CKEDITOR.htmlParser.element.prototype;\r
10 \r
11         fragmentPrototype.onlyChild = elementPrototype.onlyChild = function()\r
12         {\r
13                 var children = this.children,\r
14                         count = children.length,\r
15                         firstChild = ( count == 1 ) && children[ 0 ];\r
16                 return firstChild || null;\r
17         };\r
18 \r
19         elementPrototype.removeAnyChildWithName = function( tagName )\r
20         {\r
21                 var children = this.children,\r
22                         childs = [],\r
23                         child;\r
24 \r
25                 for ( var i = 0; i < children.length; i++ )\r
26                 {\r
27                         child = children[ i ];\r
28                         if ( !child.name )\r
29                                 continue;\r
30 \r
31                         if ( child.name == tagName )\r
32                         {\r
33                                 childs.push( child );\r
34                                 children.splice( i--, 1 );\r
35                         }\r
36                         childs = childs.concat( child.removeAnyChildWithName( tagName ) );\r
37                 }\r
38                 return childs;\r
39         };\r
40 \r
41         elementPrototype.getAncestor = function( tagNameRegex )\r
42         {\r
43                 var parent = this.parent;\r
44                 while ( parent && !( parent.name && parent.name.match( tagNameRegex ) ) )\r
45                         parent = parent.parent;\r
46                 return parent;\r
47         };\r
48 \r
49         fragmentPrototype.firstChild = elementPrototype.firstChild = function( evaluator )\r
50         {\r
51                 var child;\r
52 \r
53                 for ( var i = 0 ; i < this.children.length ; i++ )\r
54                 {\r
55                         child = this.children[ i ];\r
56                         if ( evaluator( child ) )\r
57                                 return child;\r
58                         else if ( child.name )\r
59                         {\r
60                                 child = child.firstChild( evaluator );\r
61                                 if ( child )\r
62                                         return child;\r
63                         }\r
64                 }\r
65 \r
66                 return null;\r
67         };\r
68 \r
69         // Adding a (set) of styles to the element's 'style' attributes.\r
70         elementPrototype.addStyle = function( name, value, isPrepend )\r
71         {\r
72                 var styleText, addingStyleText = '';\r
73                 // name/value pair.\r
74                 if ( typeof value == 'string' )\r
75                         addingStyleText += name + ':' + value + ';';\r
76                 else\r
77                 {\r
78                         // style literal.\r
79                         if ( typeof name == 'object' )\r
80                         {\r
81                                 for ( var style in name )\r
82                                 {\r
83                                         if ( name.hasOwnProperty( style ) )\r
84                                                 addingStyleText += style + ':' + name[ style ] + ';';\r
85                                 }\r
86                         }\r
87                         // raw style text form.\r
88                         else\r
89                                 addingStyleText += name;\r
90 \r
91                         isPrepend = value;\r
92                 }\r
93 \r
94                 if ( !this.attributes )\r
95                         this.attributes = {};\r
96 \r
97                 styleText = this.attributes.style || '';\r
98 \r
99                 styleText = ( isPrepend ?\r
100                               [ addingStyleText, styleText ]\r
101                                           : [ styleText, addingStyleText ] ).join( ';' );\r
102 \r
103                 this.attributes.style = styleText.replace( /^;|;(?=;)/, '' );\r
104         };\r
105 \r
106         /**\r
107          * Return the DTD-valid parent tag names of the specified one.\r
108          * @param tagName\r
109          */\r
110         CKEDITOR.dtd.parentOf = function( tagName )\r
111         {\r
112                 var result = {};\r
113                 for ( var tag in this )\r
114                 {\r
115                         if ( tag.indexOf( '$' ) == -1 && this[ tag ][ tagName ] )\r
116                                 result[ tag ] = 1;\r
117                 }\r
118                 return result;\r
119         };\r
120 \r
121         // 1. move consistent list item styles up to list root.\r
122         // 2. clear out unnecessary list item numbering.\r
123         function postProcessList( list )\r
124         {\r
125                 var children = list.children,\r
126                         child,\r
127                         attrs,\r
128                         count = list.children.length,\r
129                         match,\r
130                         mergeStyle,\r
131                         styleTypeRegexp = /list-style-type:(.*?)(?:;|$)/,\r
132                         stylesFilter = CKEDITOR.plugins.pastefromword.filters.stylesFilter;\r
133 \r
134                 attrs = list.attributes;\r
135                 if ( styleTypeRegexp.exec( attrs.style ) )\r
136                         return;\r
137 \r
138                 for ( var i = 0; i < count; i++ )\r
139                 {\r
140                         child = children[ i ];\r
141 \r
142                         if ( child.attributes.value && Number( child.attributes.value ) == i + 1 )\r
143                                 delete child.attributes.value;\r
144 \r
145                         match = styleTypeRegexp.exec( child.attributes.style );\r
146 \r
147                         if ( match )\r
148                         {\r
149                                 if ( match[ 1 ] == mergeStyle || !mergeStyle )\r
150                                         mergeStyle = match[ 1 ];\r
151                                 else\r
152                                 {\r
153                                         mergeStyle = null;\r
154                                         break;\r
155                                 }\r
156                         }\r
157                 }\r
158 \r
159                 if ( mergeStyle )\r
160                 {\r
161                         for ( i = 0; i < count; i++ )\r
162                         {\r
163                                 attrs = children[ i ].attributes;\r
164                                 attrs.style && ( attrs.style = stylesFilter( [ [ 'list-style-type'] ] )( attrs.style ) || '' );\r
165                         }\r
166 \r
167                         list.addStyle( 'list-style-type', mergeStyle );\r
168                 }\r
169         }\r
170 \r
171         var cssLengthRelativeUnit = /^([.\d]*)+(em|ex|px|gd|rem|vw|vh|vm|ch|mm|cm|in|pt|pc|deg|rad|ms|s|hz|khz){1}?/i;\r
172         var emptyMarginRegex = /^(?:\b0[^\s]*\s*){1,4}$/;               // e.g. 0px 0pt 0px\r
173         var romanLiternalPattern = '^m{0,4}(cm|cd|d?c{0,3})(xc|xl|l?x{0,3})(ix|iv|v?i{0,3})$',\r
174                 lowerRomanLiteralRegex = new RegExp( romanLiternalPattern ),\r
175                 upperRomanLiteralRegex = new RegExp( romanLiternalPattern.toUpperCase() );\r
176 \r
177         var orderedPatterns = { 'decimal' : /\d+/, 'lower-roman': lowerRomanLiteralRegex, 'upper-roman': upperRomanLiteralRegex, 'lower-alpha' : /^[a-z]+$/, 'upper-alpha': /^[A-Z]+$/ },\r
178                 unorderedPatterns = { 'disc' : /[l\u00B7\u2002]/, 'circle' : /[\u006F\u00D8]/,'square' : /[\u006E\u25C6]/},\r
179                 listMarkerPatterns = { 'ol' : orderedPatterns, 'ul' : unorderedPatterns },\r
180                 romans = [ [1000, 'M'], [900, 'CM'], [500, 'D'], [400, 'CD'], [100, 'C'], [90, 'XC'], [50, 'L'], [40, 'XL'], [10, 'X'], [9, 'IX'], [5, 'V'], [4, 'IV'], [1, 'I'] ],\r
181                 alpahbets = "ABCDEFGHIJKLMNOPQRSTUVWXYZ";\r
182 \r
183         // Convert roman numbering back to decimal.\r
184         function fromRoman( str )\r
185          {\r
186                  str = str.toUpperCase();\r
187                  var l = romans.length, retVal = 0;\r
188                  for ( var i = 0; i < l; ++i )\r
189                  {\r
190                          for ( var j = romans[i], k = j[1].length; str.substr( 0, k ) == j[1]; str = str.substr( k ) )\r
191                                  retVal += j[ 0 ];\r
192                  }\r
193                  return retVal;\r
194          }\r
195 \r
196         // Convert alphabet numbering back to decimal.\r
197         function fromAlphabet( str )\r
198         {\r
199                 str = str.toUpperCase();\r
200                 var l = alpahbets.length, retVal = 1;\r
201                 for ( var x = 1; str.length > 0; x *= l )\r
202                 {\r
203                         retVal += alpahbets.indexOf( str.charAt( str.length - 1 ) ) * x;\r
204                         str = str.substr( 0, str.length - 1 );\r
205                 }\r
206                 return retVal;\r
207         }\r
208 \r
209         var listBaseIndent = 0,\r
210                 previousListItemMargin = null,\r
211                 previousListId;\r
212 \r
213         var plugin = ( CKEDITOR.plugins.pastefromword =\r
214         {\r
215                 utils :\r
216                 {\r
217                         // Create a <cke:listbullet> which indicate an list item type.\r
218                         createListBulletMarker : function ( bullet, bulletText )\r
219                         {\r
220                                 var marker = new CKEDITOR.htmlParser.element( 'cke:listbullet' );\r
221                                 marker.attributes = { 'cke:listsymbol' : bullet[ 0 ] };\r
222                                 marker.add( new CKEDITOR.htmlParser.text( bulletText ) );\r
223                                 return marker;\r
224                         },\r
225 \r
226                         isListBulletIndicator : function( element )\r
227                         {\r
228                                 var styleText = element.attributes && element.attributes.style;\r
229                                 if ( /mso-list\s*:\s*Ignore/i.test( styleText ) )\r
230                                         return true;\r
231                         },\r
232 \r
233                         isContainingOnlySpaces : function( element )\r
234                         {\r
235                                 var text;\r
236                                 return ( ( text = element.onlyChild() )\r
237                                             && ( /^(:?\s|&nbsp;)+$/ ).test( text.value ) );\r
238                         },\r
239 \r
240                         resolveList : function( element )\r
241                         {\r
242                                 // <cke:listbullet> indicate a list item.\r
243                                 var attrs = element.attributes,\r
244                                         listMarker;\r
245 \r
246                                 if ( ( listMarker = element.removeAnyChildWithName( 'cke:listbullet' ) )\r
247                                                 && listMarker.length\r
248                                                 && ( listMarker = listMarker[ 0 ] ) )\r
249                                 {\r
250                                         element.name = 'cke:li';\r
251 \r
252                                         if ( attrs.style )\r
253                                         {\r
254                                                 attrs.style = plugin.filters.stylesFilter(\r
255                                                                 [\r
256                                                                         // Text-indent is not representing list item level any more.\r
257                                                                         [ 'text-indent' ],\r
258                                                                         [ 'line-height' ],\r
259                                                                         // First attempt is to resolve indent level from on a constant margin increment.\r
260                                                                         [ ( /^margin(:?-left)?$/ ), null, function( margin )\r
261                                                                         {\r
262                                                                                 // Deal with component/short-hand form.\r
263                                                                                 var values = margin.split( ' ' );\r
264                                                                                 margin = plugin.utils.convertToPx( values[ 3 ] || values[ 1 ] || values [ 0 ] );\r
265                                                                                 margin = parseInt( margin, 10 );\r
266 \r
267                                                                                 // Figure out the indent unit by checking the first time of incrementation.\r
268                                                                                 if ( !listBaseIndent && previousListItemMargin !== null && margin > previousListItemMargin )\r
269                                                                                         listBaseIndent = margin - previousListItemMargin;\r
270 \r
271                                                                                 previousListItemMargin = margin;\r
272 \r
273                                                                                 attrs[ 'cke:indent' ] = listBaseIndent && ( Math.ceil( margin / listBaseIndent ) + 1 ) || 1;\r
274                                                                         } ],\r
275                                                                         // The best situation: "mso-list:l0 level1 lfo2" tells the belonged list root, list item indentation, etc.\r
276                                                                         [ ( /^mso-list$/ ), null, function( val )\r
277                                                                         {\r
278                                                                                 val = val.split( ' ' );\r
279                                                                                 var listId = Number( val[ 0 ].match( /\d+/ ) ),\r
280                                                                                         indent = Number( val[ 1 ].match( /\d+/ ) );\r
281 \r
282                                                                                 listId !== previousListId && ( attrs[ 'cke:reset' ] = 1 );\r
283                                                                                 previousListId = listId;\r
284                                                                                 attrs[ 'cke:indent' ] = indent;\r
285                                                                         } ]\r
286                                                                 ] )( attrs.style, element ) || '';\r
287                                         }\r
288 \r
289                                         // First level list item might be presented without a margin.\r
290 \r
291 \r
292                                         // In case all above doesn't apply.\r
293                                         if ( !attrs[ 'cke:indent' ] )\r
294                                         {\r
295                                                 previousListItemMargin = 0;\r
296                                                 attrs[ 'cke:indent' ] = 1;\r
297                                         }\r
298 \r
299                                         // Inherit attributes from bullet.\r
300                                         CKEDITOR.tools.extend( attrs, listMarker.attributes );\r
301                                         return true;\r
302                                 }\r
303                                 // Current list disconnected.\r
304                                 else\r
305                                         previousListId = previousListItemMargin = listBaseIndent = null;\r
306 \r
307                                 return false;\r
308                         },\r
309 \r
310                         // Convert various length units to 'px' in ignorance of DPI.\r
311                         convertToPx : ( function ()\r
312                         {\r
313                                 var calculator = CKEDITOR.dom.element.createFromHtml(\r
314                                                                 '<div style="position:absolute;left:-9999px;' +\r
315                                                                 'top:-9999px;margin:0px;padding:0px;border:0px;"' +\r
316                                                                 '></div>', CKEDITOR.document );\r
317                                 CKEDITOR.document.getBody().append( calculator );\r
318 \r
319                                 return function( cssLength )\r
320                                 {\r
321                                         if ( cssLengthRelativeUnit.test( cssLength ) )\r
322                                         {\r
323                                                 calculator.setStyle( 'width', cssLength );\r
324                                                 return calculator.$.clientWidth + 'px';\r
325                                         }\r
326 \r
327                                         return cssLength;\r
328                                 };\r
329                         } )(),\r
330 \r
331                         // Providing a shorthand style then retrieve one or more style component values.\r
332                         getStyleComponents : ( function()\r
333                         {\r
334                                 var calculator = CKEDITOR.dom.element.createFromHtml(\r
335                                                                 '<div style="position:absolute;left:-9999px;top:-9999px;"></div>',\r
336                                                                 CKEDITOR.document );\r
337                                 CKEDITOR.document.getBody().append( calculator );\r
338 \r
339                                 return function( name, styleValue, fetchList )\r
340                                 {\r
341                                         calculator.setStyle( name, styleValue );\r
342                                         var styles = {},\r
343                                                 count = fetchList.length;\r
344                                         for ( var i = 0; i < count; i++ )\r
345                                                 styles[ fetchList[ i ] ]  = calculator.getStyle( fetchList[ i ] );\r
346 \r
347                                         return styles;\r
348                                 };\r
349                         } )(),\r
350 \r
351                         listDtdParents : CKEDITOR.dtd.parentOf( 'ol' )\r
352                 },\r
353 \r
354                 filters :\r
355                 {\r
356                                 // Transform a normal list into flat list items only presentation.\r
357                                 // E.g. <ul><li>level1<ol><li>level2</li></ol></li> =>\r
358                                 // <cke:li cke:listtype="ul" cke:indent="1">level1</cke:li>\r
359                                 // <cke:li cke:listtype="ol" cke:indent="2">level2</cke:li>\r
360                                 flattenList : function( element )\r
361                                 {\r
362                                         var     attrs = element.attributes,\r
363                                                 parent = element.parent;\r
364 \r
365                                         var listStyleType,\r
366                                                 indentLevel = 1;\r
367 \r
368                                         // Resolve how many level nested.\r
369                                         while ( parent )\r
370                                         {\r
371                                                 parent.attributes && parent.attributes[ 'cke:list' ] && indentLevel++;\r
372                                                 parent = parent.parent;\r
373                                         }\r
374 \r
375                                         // All list items are of the same type.\r
376                                         switch ( attrs.type )\r
377                                         {\r
378                                                 case 'a' :\r
379                                                         listStyleType = 'lower-alpha';\r
380                                                         break;\r
381                                                 // TODO: Support more list style type from MS-Word.\r
382                                         }\r
383 \r
384                                         var children = element.children,\r
385                                                 child;\r
386 \r
387                                         for ( var i = 0; i < children.length; i++ )\r
388                                         {\r
389                                                 child = children[ i ];\r
390                                                 var attributes = child.attributes;\r
391 \r
392                                                 if ( child.name in CKEDITOR.dtd.$listItem )\r
393                                                 {\r
394                                                         var listItemChildren = child.children,\r
395                                                                 count = listItemChildren.length,\r
396                                                                 last = listItemChildren[ count - 1 ];\r
397 \r
398                                                         // Move out nested list.\r
399                                                         if ( last.name in CKEDITOR.dtd.$list )\r
400                                                         {\r
401                                                                 children.splice( i + 1, 0, last );\r
402                                                                 last.parent = element;\r
403 \r
404                                                                 // Remove the parent list item if it's just a holder.\r
405                                                                 if ( !--listItemChildren.length )\r
406                                                                         children.splice( i, 1 );\r
407                                                         }\r
408 \r
409                                                         child.name = 'cke:li';\r
410 \r
411                                                         // Inherit numbering from list root on the first list item.\r
412                                                         attrs.start && !i && ( attributes.value = attrs.start );\r
413 \r
414                                                         plugin.filters.stylesFilter(\r
415                                                                 [\r
416                                                                     [ 'tab-stops', null, function( val )\r
417                                                                         {\r
418                                                                                 var margin = val.split( ' ' )[ 1 ].match( cssLengthRelativeUnit );\r
419                                                                                 margin && ( previousListItemMargin = parseInt( plugin.utils.convertToPx( margin[ 0 ] ), 10 ) );\r
420                                                                         } ],\r
421                                                                         [ 'mso-list', null, function( val )\r
422                                                                         {\r
423                                                                                 val = val.split( ' ' );\r
424                                                                                 var listId = Number( val[ 0 ].match( /\d+/ ) );\r
425                                                                                 listId !== previousListId && ( attributes[ 'cke:reset' ] = 1 );\r
426                                                                                 previousListId = listId;\r
427                                                                         } ]\r
428                                                                 ] )( attributes.style );\r
429 \r
430                                                         attributes[ 'cke:indent' ] = indentLevel;\r
431                                                         attributes[ 'cke:listtype' ] = element.name;\r
432                                                         attributes[ 'cke:list-style-type' ] = listStyleType;\r
433                                                 }\r
434                                         }\r
435 \r
436                                         delete element.name;\r
437 \r
438                                         // We're loosing tag name here, signalize this element as a list.\r
439                                         attrs[ 'cke:list' ] = 1;\r
440                                 },\r
441 \r
442                                 /**\r
443                                  *  Try to collect all list items among the children and establish one\r
444                                  *  or more HTML list structures for them.\r
445                                  * @param element\r
446                                  */\r
447                                 assembleList : function( element )\r
448                                 {\r
449                                         var children = element.children, child,\r
450                                                         listItem,   // The current processing cke:li element.\r
451                                                         listItemAttrs,\r
452                                                         listItemIndent, // Indent level of current list item.\r
453                                                         lastIndent,\r
454                                                         lastListItem, // The previous one just been added to the list.\r
455                                                         list, // Current staging list and it's parent list if any.\r
456                                                         openedLists = [],\r
457                                                         previousListStyleType,\r
458                                                         previousListType;\r
459 \r
460                                         // Properties of the list item are to be resolved from the list bullet.\r
461                                         var bullet,\r
462                                                 listType,\r
463                                                 listStyleType,\r
464                                                 itemNumeric;\r
465 \r
466                                         for ( var i = 0; i < children.length; i++ )\r
467                                         {\r
468                                                 child = children[ i ];\r
469 \r
470                                                 if ( 'cke:li' == child.name )\r
471                                                 {\r
472                                                         child.name = 'li';\r
473                                                         listItem = child;\r
474                                                         listItemAttrs = listItem.attributes;\r
475                                                         bullet = listItemAttrs[ 'cke:listsymbol' ];\r
476                                                         bullet = bullet && bullet.match( /^(?:[(]?)([^\s]+?)([.)]?)$/ );\r
477                                                         listType = listStyleType = itemNumeric = null;\r
478 \r
479                                                         if ( listItemAttrs[ 'cke:ignored' ] )\r
480                                                         {\r
481                                                                 children.splice( i--, 1 );\r
482                                                                 continue;\r
483                                                         }\r
484 \r
485 \r
486                                                         // This's from a new list root.\r
487                                                         listItemAttrs[ 'cke:reset' ] && ( list = lastIndent = lastListItem = null );\r
488 \r
489                                                         // List item indent level might come from a real list indentation or\r
490                                                         // been resolved from a pseudo list item's margin value, even get\r
491                                                         // no indentation at all.\r
492                                                         listItemIndent = Number( listItemAttrs[ 'cke:indent' ] );\r
493 \r
494                                                         // We're moving out of the current list, cleaning up.\r
495                                                         if ( listItemIndent != lastIndent )\r
496                                                                 previousListType = previousListStyleType = null;\r
497 \r
498                                                         // List type and item style are already resolved.\r
499                                                         if ( !bullet )\r
500                                                         {\r
501                                                                 listType = listItemAttrs[ 'cke:listtype' ] || 'ol';\r
502                                                                 listStyleType = listItemAttrs[ 'cke:list-style-type' ];\r
503                                                         }\r
504                                                         else\r
505                                                         {\r
506                                                                 // Probably share the same list style type with previous list item,\r
507                                                                 // give it priority to avoid ambiguous between C(Alpha) and C.(Roman).\r
508                                                                 if ( previousListType && listMarkerPatterns[ previousListType ] [ previousListStyleType ].test( bullet[ 1 ] ) )\r
509                                                                 {\r
510                                                                         listType = previousListType;\r
511                                                                         listStyleType = previousListStyleType;\r
512                                                                 }\r
513                                                                 else\r
514                                                                 {\r
515                                                                         for ( var type in listMarkerPatterns )\r
516                                                                         {\r
517                                                                                 for ( var style in listMarkerPatterns[ type ] )\r
518                                                                                 {\r
519                                                                                         if ( listMarkerPatterns[ type ][ style ].test( bullet[ 1 ] ) )\r
520                                                                                         {\r
521                                                                                                 // Small numbering has higher priority, when dealing with ambiguous\r
522                                                                                                 // between C(Alpha) and C.(Roman).\r
523                                                                                                 if ( type == 'ol' && ( /alpha|roman/ ).test( style ) )\r
524                                                                                                 {\r
525                                                                                                         var num = /roman/.test( style ) ? fromRoman( bullet[ 1 ] ) : fromAlphabet( bullet[ 1 ] );\r
526                                                                                                         if ( !itemNumeric || num < itemNumeric )\r
527                                                                                                         {\r
528                                                                                                                 itemNumeric = num;\r
529                                                                                                                 listType = type;\r
530                                                                                                                 listStyleType = style;\r
531                                                                                                         }\r
532                                                                                                 }\r
533                                                                                                 else\r
534                                                                                                 {\r
535                                                                                                         listType = type;\r
536                                                                                                         listStyleType = style;\r
537                                                                                                         break;\r
538                                                                                                 }\r
539                                                                                         }\r
540                                                                                 }\r
541                                                                         }\r
542                                                                 }\r
543 \r
544                                                                 // Simply use decimal/disc for the rest forms of unrepresentable\r
545                                                                 // numerals, e.g. Chinese..., but as long as there a second part\r
546                                                                 // included, it has a bigger chance of being a order list ;)\r
547                                                                 !listType && ( listType = bullet[ 2 ] ? 'ol' : 'ul' );\r
548                                                         }\r
549 \r
550                                                         previousListType = listType;\r
551                                                         previousListStyleType = listStyleType || ( listType == 'ol' ? 'decimal' : 'disc' );\r
552                                                         if ( listStyleType && listStyleType != ( listType == 'ol' ? 'decimal' : 'disc' ) )\r
553                                                                 listItem.addStyle( 'list-style-type', listStyleType );\r
554 \r
555                                                         // Figure out start numbering.\r
556                                                         if ( listType == 'ol' && bullet )\r
557                                                         {\r
558                                                                 switch ( listStyleType )\r
559                                                                 {\r
560                                                                         case 'decimal' :\r
561                                                                                 itemNumeric = Number( bullet[ 1 ] );\r
562                                                                                 break;\r
563                                                                         case 'lower-roman':\r
564                                                                         case 'upper-roman':\r
565                                                                                 itemNumeric = fromRoman( bullet[ 1 ] );\r
566                                                                                 break;\r
567                                                                         case 'lower-alpha':\r
568                                                                         case 'upper-alpha':\r
569                                                                                 itemNumeric = fromAlphabet( bullet[ 1 ] );\r
570                                                                                 break;\r
571                                                                 }\r
572 \r
573                                                                 // Always create the numbering, swipe out unnecessary ones later.\r
574                                                                 listItem.attributes.value = itemNumeric;\r
575                                                         }\r
576 \r
577                                                         // Start the list construction.\r
578                                                         if ( !list )\r
579                                                         {\r
580                                                                 openedLists.push( list = new CKEDITOR.htmlParser.element( listType ) );\r
581                                                                 list.add( listItem );\r
582                                                                 children[ i ] = list;\r
583                                                         }\r
584                                                         else\r
585                                                         {\r
586                                                                 if ( listItemIndent > lastIndent )\r
587                                                                 {\r
588                                                                         openedLists.push( list = new CKEDITOR.htmlParser.element( listType ) );\r
589                                                                         list.add( listItem );\r
590                                                                         lastListItem.add( list );\r
591                                                                 }\r
592                                                                 else if ( listItemIndent < lastIndent )\r
593                                                                 {\r
594                                                                         // There might be a negative gap between two list levels. (#4944)\r
595                                                                         var diff = lastIndent - listItemIndent,\r
596                                                                                         parent;\r
597                                                                         while ( diff-- && ( parent = list.parent ) )\r
598                                                                                 list = parent.parent;\r
599 \r
600                                                                         list.add( listItem );\r
601                                                                 }\r
602                                                                 else\r
603                                                                         list.add( listItem );\r
604 \r
605                                                                 children.splice( i--, 1 );\r
606                                                         }\r
607 \r
608                                                         lastListItem = listItem;\r
609                                                         lastIndent = listItemIndent;\r
610                                                 }\r
611                                                 else if ( list )\r
612                                                         list = lastIndent = lastListItem = null;\r
613                                         }\r
614 \r
615                                         for ( i = 0; i < openedLists.length; i++ )\r
616                                                 postProcessList( openedLists[ i ] );\r
617 \r
618                                         list = lastIndent = lastListItem = previousListId = previousListItemMargin = listBaseIndent = null;\r
619                                 },\r
620 \r
621                                 /**\r
622                                  * A simple filter which always rejecting.\r
623                                  */\r
624                                 falsyFilter : function( value )\r
625                                 {\r
626                                         return false;\r
627                                 },\r
628 \r
629                                 /**\r
630                                  * A filter dedicated on the 'style' attribute filtering, e.g. dropping/replacing style properties.\r
631                                  * @param styles {Array} in form of [ styleNameRegexp, styleValueRegexp,\r
632                                  *  newStyleValue/newStyleGenerator, newStyleName ] where only the first\r
633                                  *  parameter is mandatory.\r
634                                  * @param whitelist {Boolean} Whether the {@param styles} will be considered as a white-list.\r
635                                  */\r
636                                 stylesFilter : function( styles, whitelist )\r
637                                 {\r
638                                         return function( styleText, element )\r
639                                         {\r
640                                                  var rules = [];\r
641                                                 // html-encoded quote might be introduced by 'font-family'\r
642                                                 // from MS-Word which confused the following regexp. e.g.\r
643                                                 //'font-family: &quot;Lucida, Console&quot;'\r
644                                                 ( styleText || '' )\r
645                                                         .replace( /&quot;/g, '"' )\r
646                                                         .replace( /\s*([^ :;]+)\s*:\s*([^;]+)\s*(?=;|$)/g,\r
647                                                                  function( match, name, value )\r
648                                                                  {\r
649                                                                          name = name.toLowerCase();\r
650                                                                          name == 'font-family' && ( value = value.replace( /["']/g, '' ) );\r
651 \r
652                                                                          var namePattern,\r
653                                                                                  valuePattern,\r
654                                                                                  newValue,\r
655                                                                                  newName;\r
656                                                                          for ( var i = 0 ; i < styles.length; i++ )\r
657                                                                          {\r
658                                                                                 if ( styles[ i ] )\r
659                                                                                 {\r
660                                                                                         namePattern = styles[ i ][ 0 ];\r
661                                                                                         valuePattern = styles[ i ][ 1 ];\r
662                                                                                         newValue = styles[ i ][ 2 ];\r
663                                                                                         newName = styles[ i ][ 3 ];\r
664 \r
665                                                                                         if ( name.match( namePattern )\r
666                                                                                                  && ( !valuePattern || value.match( valuePattern ) ) )\r
667                                                                                         {\r
668                                                                                                 name = newName || name;\r
669                                                                                                 whitelist && ( newValue = newValue || value );\r
670 \r
671                                                                                                 if ( typeof newValue == 'function' )\r
672                                                                                                         newValue = newValue( value, element, name );\r
673 \r
674                                                                                                 // Return an couple indicate both name and value\r
675                                                                                                 // changed.\r
676                                                                                                 if ( newValue && newValue.push )\r
677                                                                                                         name = newValue[ 0 ], newValue = newValue[ 1 ];\r
678 \r
679                                                                                                 if ( typeof newValue == 'string' )\r
680                                                                                                         rules.push( [ name, newValue ] );\r
681                                                                                                 return;\r
682                                                                                         }\r
683                                                                                 }\r
684                                                                          }\r
685 \r
686                                                                          !whitelist && rules.push( [ name, value ] );\r
687 \r
688                                                                  });\r
689 \r
690                                                 for ( var i = 0 ; i < rules.length ; i++ )\r
691                                                          rules[ i ] = rules[ i ].join( ':' );\r
692                                                 return rules.length ?\r
693                                                          ( rules.join( ';' ) + ';' ) : false;\r
694                                          };\r
695                                 },\r
696 \r
697                                 /**\r
698                                  * Migrate the element by decorate styles on it.\r
699                                  * @param styleDefiniton\r
700                                  * @param variables\r
701                                  */\r
702                                 elementMigrateFilter : function ( styleDefiniton, variables )\r
703                                 {\r
704                                         return function( element )\r
705                                                 {\r
706                                                         var styleDef =\r
707                                                                         variables ?\r
708                                                                                 new CKEDITOR.style( styleDefiniton, variables )._.definition\r
709                                                                                 : styleDefiniton;\r
710                                                         element.name = styleDef.element;\r
711                                                         CKEDITOR.tools.extend( element.attributes, CKEDITOR.tools.clone( styleDef.attributes ) );\r
712                                                         element.addStyle( CKEDITOR.style.getStyleText( styleDef ) );\r
713                                                 };\r
714                                 },\r
715 \r
716                                 /**\r
717                                  * Migrate styles by creating a new nested stylish element.\r
718                                  * @param styleDefinition\r
719                                  */\r
720                                 styleMigrateFilter : function( styleDefinition, variableName )\r
721                                 {\r
722 \r
723                                         var elementMigrateFilter = this.elementMigrateFilter;\r
724                                         return function( value, element )\r
725                                         {\r
726                                                 // Build an stylish element first.\r
727                                                 var styleElement = new CKEDITOR.htmlParser.element( null ),\r
728                                                         variables = {};\r
729 \r
730                                                 variables[ variableName ] = value;\r
731                                                 elementMigrateFilter( styleDefinition, variables )( styleElement );\r
732                                                 // Place the new element inside the existing span.\r
733                                                 styleElement.children = element.children;\r
734                                                 element.children = [ styleElement ];\r
735                                         };\r
736                                 },\r
737 \r
738                                 /**\r
739                                  * A filter which remove cke-namespaced-attribute on\r
740                                  * all none-cke-namespaced elements.\r
741                                  * @param value\r
742                                  * @param element\r
743                                  */\r
744                                 bogusAttrFilter : function( value, element )\r
745                                 {\r
746                                         if ( element.name.indexOf( 'cke:' ) == -1 )\r
747                                                 return false;\r
748                                 },\r
749 \r
750                                 /**\r
751                                  * A filter which will be used to apply inline css style according the stylesheet\r
752                                  * definition rules, is generated lazily when filtering.\r
753                                  */\r
754                                 applyStyleFilter : null\r
755 \r
756                         },\r
757 \r
758                 getRules : function( editor )\r
759                 {\r
760                         var dtd = CKEDITOR.dtd,\r
761                                 blockLike = CKEDITOR.tools.extend( {}, dtd.$block, dtd.$listItem, dtd.$tableContent ),\r
762                                 config = editor.config,\r
763                                 filters = this.filters,\r
764                                 falsyFilter = filters.falsyFilter,\r
765                                 stylesFilter = filters.stylesFilter,\r
766                                 elementMigrateFilter = filters.elementMigrateFilter,\r
767                                 styleMigrateFilter = CKEDITOR.tools.bind( this.filters.styleMigrateFilter, this.filters ),\r
768                                 createListBulletMarker = this.utils.createListBulletMarker,\r
769                                 flattenList = filters.flattenList,\r
770                                 assembleList = filters.assembleList,\r
771                                 isListBulletIndicator = this.utils.isListBulletIndicator,\r
772                                 containsNothingButSpaces = this.utils.isContainingOnlySpaces,\r
773                                 resolveListItem = this.utils.resolveList,\r
774                                 convertToPx = this.utils.convertToPx,\r
775                                 getStyleComponents = this.utils.getStyleComponents,\r
776                                 listDtdParents = this.utils.listDtdParents,\r
777                                 removeFontStyles = config.pasteFromWordRemoveFontStyles !== false,\r
778                                 removeStyles = config.pasteFromWordRemoveStyles !== false;\r
779 \r
780                         return {\r
781 \r
782                                 elementNames :\r
783                                 [\r
784                                         // Remove script, meta and link elements.\r
785                                         [ ( /meta|link|script/ ), '' ]\r
786                                 ],\r
787 \r
788                                 root : function( element )\r
789                                 {\r
790                                         element.filterChildren();\r
791                                         assembleList( element );\r
792                                 },\r
793 \r
794                                 elements :\r
795                                 {\r
796                                         '^' : function( element )\r
797                                         {\r
798                                                 // Transform CSS style declaration to inline style.\r
799                                                 var applyStyleFilter;\r
800                                                 if ( CKEDITOR.env.gecko && ( applyStyleFilter = filters.applyStyleFilter ) )\r
801                                                         applyStyleFilter( element );\r
802                                         },\r
803 \r
804                                         $ : function( element )\r
805                                         {\r
806                                                 var tagName = element.name || '',\r
807                                                         attrs = element.attributes;\r
808 \r
809                                                 // Convert length unit of width/height on blocks to\r
810                                                 // a more editor-friendly way (px).\r
811                                                 if ( tagName in blockLike\r
812                                                         && attrs.style )\r
813                                                 {\r
814                                                         attrs.style = stylesFilter(\r
815                                                                                 [ [ ( /^(:?width|height)$/ ), null, convertToPx ] ] )( attrs.style ) || '';\r
816                                                 }\r
817 \r
818                                                 // Processing headings.\r
819                                                 if ( tagName.match( /h\d/ ) )\r
820                                                 {\r
821                                                         element.filterChildren();\r
822                                                         // Is the heading actually a list item?\r
823                                                         if ( resolveListItem( element ) )\r
824                                                                 return;\r
825 \r
826                                                         // Adapt heading styles to editor's convention.\r
827                                                         elementMigrateFilter( config[ 'format_' + tagName ] )( element );\r
828                                                 }\r
829                                                 // Remove inline elements which contain only empty spaces.\r
830                                                 else if ( tagName in dtd.$inline )\r
831                                                 {\r
832                                                         element.filterChildren();\r
833                                                         if ( containsNothingButSpaces( element ) )\r
834                                                                 delete element.name;\r
835                                                 }\r
836                                                 // Remove element with ms-office namespace,\r
837                                                 // with it's content preserved, e.g. 'o:p'.\r
838                                                 else if ( tagName.indexOf( ':' ) != -1\r
839                                                                  && tagName.indexOf( 'cke' ) == -1 )\r
840                                                 {\r
841                                                         element.filterChildren();\r
842 \r
843                                                         // Restore image real link from vml.\r
844                                                         if ( tagName == 'v:imagedata' )\r
845                                                         {\r
846                                                                 var href = element.attributes[ 'o:href' ];\r
847                                                                 if ( href )\r
848                                                                         element.attributes.src = href;\r
849                                                                 element.name = 'img';\r
850                                                                 return;\r
851                                                         }\r
852                                                         delete element.name;\r
853                                                 }\r
854 \r
855                                                 // Assembling list items into a whole list.\r
856                                                 if ( tagName in listDtdParents )\r
857                                                 {\r
858                                                         element.filterChildren();\r
859                                                         assembleList( element );\r
860                                                 }\r
861                                         },\r
862 \r
863                                         // We'll drop any style sheet, but Firefox conclude\r
864                                         // certain styles in a single style element, which are\r
865                                         // required to be changed into inline ones.\r
866                                         'style' : function( element )\r
867                                         {\r
868                                                 if ( CKEDITOR.env.gecko )\r
869                                                 {\r
870                                                         // Grab only the style definition section.\r
871                                                         var styleDefSection = element.onlyChild().value.match( /\/\* Style Definitions \*\/([\s\S]*?)\/\*/ ),\r
872                                                                 styleDefText = styleDefSection && styleDefSection[ 1 ],\r
873                                                                 rules = {}; // Storing the parsed result.\r
874 \r
875                                                         if ( styleDefText )\r
876                                                         {\r
877                                                                 styleDefText\r
878                                                                         // Remove line-breaks.\r
879                                                                         .replace(/[\n\r]/g,'')\r
880                                                                         // Extract selectors and style properties.\r
881                                                                         .replace( /(.+?)\{(.+?)\}/g,\r
882                                                                                 function( rule, selectors, styleBlock )\r
883                                                                                 {\r
884                                                                                         selectors = selectors.split( ',' );\r
885                                                                                         var length = selectors.length, selector;\r
886                                                                                         for ( var i = 0; i < length; i++ )\r
887                                                                                         {\r
888                                                                                                 // Assume MS-Word mostly generate only simple\r
889                                                                                                 // selector( [Type selector][Class selector]).\r
890                                                                                                 CKEDITOR.tools.trim( selectors[ i ] )\r
891                                                                                                                           .replace( /^(\w+)(\.[\w-]+)?$/g,\r
892                                                                                                 function( match, tagName, className )\r
893                                                                                                 {\r
894                                                                                                         tagName = tagName || '*';\r
895                                                                                                         className = className.substring( 1, className.length );\r
896 \r
897                                                                                                         // Reject MS-Word Normal styles.\r
898                                                                                                         if ( className.match( /MsoNormal/ ) )\r
899                                                                                                                 return;\r
900 \r
901                                                                                                         if ( !rules[ tagName ] )\r
902                                                                                                                 rules[ tagName ] = {};\r
903                                                                                                         if ( className )\r
904                                                                                                                 rules[ tagName ][ className ] = styleBlock;\r
905                                                                                                         else\r
906                                                                                                                 rules[ tagName ] = styleBlock;\r
907                                                                                                 } );\r
908                                                                                         }\r
909                                                                                 });\r
910 \r
911                                                                 filters.applyStyleFilter = function( element )\r
912                                                                 {\r
913                                                                         var name = rules[ '*' ] ? '*' : element.name,\r
914                                                                                 className = element.attributes && element.attributes[ 'class' ],\r
915                                                                                 style;\r
916                                                                         if ( name in rules )\r
917                                                                         {\r
918                                                                                 style = rules[ name ];\r
919                                                                                 if ( typeof style == 'object' )\r
920                                                                                         style = style[ className ];\r
921                                                                                 // Maintain style rules priorities.\r
922                                                                                 style && element.addStyle( style, true );\r
923                                                                         }\r
924                                                                 };\r
925                                                         }\r
926                                                 }\r
927                                                 return false;\r
928                                         },\r
929 \r
930                                         'p' : function( element )\r
931                                         {\r
932                                                 // This's a fall-back approach to recognize list item in FF3.6,\r
933                                                 // as it's not perfect as not all list style (e.g. "heading list") is shipped\r
934                                                 // with this pattern. (#6662)\r
935                                                 if ( /MsoListParagraph/.exec( element.attributes[ 'class' ] ) )\r
936                                                 {\r
937                                                         var bulletText = element.firstChild( function( node )\r
938                                                         {\r
939                                                                 return node.type == CKEDITOR.NODE_TEXT && !containsNothingButSpaces( node.parent );\r
940                                                         });\r
941                                                         var bullet = bulletText && bulletText.parent,\r
942                                                                 bulletAttrs = bullet && bullet.attributes;\r
943                                                         bulletAttrs && !bulletAttrs.style && ( bulletAttrs.style = 'mso-list: Ignore;' );\r
944                                                 }\r
945 \r
946                                                 element.filterChildren();\r
947 \r
948                                                 // Is the paragraph actually a list item?\r
949                                                 if ( resolveListItem( element ) )\r
950                                                         return;\r
951 \r
952                                                 // Adapt paragraph formatting to editor's convention\r
953                                                 // according to enter-mode.\r
954                                                 if ( config.enterMode == CKEDITOR.ENTER_BR )\r
955                                                 {\r
956                                                         // We suffer from attribute/style lost in this situation.\r
957                                                         delete element.name;\r
958                                                         element.add( new CKEDITOR.htmlParser.element( 'br' ) );\r
959                                                 }\r
960                                                 else\r
961                                                         elementMigrateFilter( config[ 'format_' + ( config.enterMode == CKEDITOR.ENTER_P ? 'p' : 'div' ) ] )( element );\r
962                                         },\r
963 \r
964                                         'div' : function( element )\r
965                                         {\r
966                                                 // Aligned table with no text surrounded is represented by a wrapper div, from which\r
967                                                 // table cells inherit as text-align styles, which is wrong.\r
968                                                 // Instead we use a clear-float div after the table to properly achieve the same layout.\r
969                                                 var singleChild = element.onlyChild();\r
970                                                 if ( singleChild && singleChild.name == 'table' )\r
971                                                 {\r
972                                                         var attrs = element.attributes;\r
973                                                         singleChild.attributes = CKEDITOR.tools.extend( singleChild.attributes, attrs );\r
974                                                         attrs.style && singleChild.addStyle( attrs.style );\r
975 \r
976                                                         var clearFloatDiv = new CKEDITOR.htmlParser.element( 'div' );\r
977                                                         clearFloatDiv.addStyle( 'clear' ,'both' );\r
978                                                         element.add( clearFloatDiv );\r
979                                                         delete element.name;\r
980                                                 }\r
981                                         },\r
982 \r
983                                         'td' : function ( element )\r
984                                         {\r
985                                                 // 'td' in 'thead' is actually <th>.\r
986                                                 if ( element.getAncestor( 'thead') )\r
987                                                         element.name = 'th';\r
988                                         },\r
989 \r
990                                         // MS-Word sometimes present list as a mixing of normal list\r
991                                         // and pseudo-list, normalize the previous ones into pseudo form.\r
992                                         'ol' : flattenList,\r
993                                         'ul' : flattenList,\r
994                                         'dl' : flattenList,\r
995 \r
996                                         'font' : function( element )\r
997                                         {\r
998                                                 // Drop the font tag if it comes from list bullet text.\r
999                                                 if ( isListBulletIndicator( element.parent ) )\r
1000                                                 {\r
1001                                                         delete element.name;\r
1002                                                         return;\r
1003                                                 }\r
1004 \r
1005                                                 element.filterChildren();\r
1006 \r
1007                                                 var attrs = element.attributes,\r
1008                                                         styleText = attrs.style,\r
1009                                                         parent = element.parent;\r
1010 \r
1011                                                 if ( 'font' == parent.name )     // Merge nested <font> tags.\r
1012                                                 {\r
1013                                                         CKEDITOR.tools.extend( parent.attributes,\r
1014                                                                         element.attributes );\r
1015                                                         styleText && parent.addStyle( styleText );\r
1016                                                         delete element.name;\r
1017                                                 }\r
1018                                                 // Convert the merged into a span with all attributes preserved.\r
1019                                                 else\r
1020                                                 {\r
1021                                                         styleText = styleText || '';\r
1022                                                         // IE's having those deprecated attributes, normalize them.\r
1023                                                         if ( attrs.color )\r
1024                                                         {\r
1025                                                                 attrs.color != '#000000' && ( styleText += 'color:' + attrs.color + ';' );\r
1026                                                                 delete attrs.color;\r
1027                                                         }\r
1028                                                         if ( attrs.face )\r
1029                                                         {\r
1030                                                                 styleText += 'font-family:' + attrs.face + ';';\r
1031                                                                 delete attrs.face;\r
1032                                                         }\r
1033                                                         // TODO: Mapping size in ranges of xx-small,\r
1034                                                         // x-small, small, medium, large, x-large, xx-large.\r
1035                                                         if ( attrs.size )\r
1036                                                         {\r
1037                                                                 styleText += 'font-size:' +\r
1038                                                                              ( attrs.size > 3 ? 'large'\r
1039                                                                                              : ( attrs.size < 3 ? 'small' : 'medium' ) ) + ';';\r
1040                                                                 delete attrs.size;\r
1041                                                         }\r
1042 \r
1043                                                         element.name = 'span';\r
1044                                                         element.addStyle( styleText );\r
1045                                                 }\r
1046                                         },\r
1047 \r
1048                                         'span' : function( element )\r
1049                                         {\r
1050                                                 // Remove the span if it comes from list bullet text.\r
1051                                                 if ( isListBulletIndicator( element.parent ) )\r
1052                                                         return false;\r
1053 \r
1054                                                 element.filterChildren();\r
1055                                                 if ( containsNothingButSpaces( element ) )\r
1056                                                 {\r
1057                                                         delete element.name;\r
1058                                                         return null;\r
1059                                                 }\r
1060 \r
1061                                                 // List item bullet type is supposed to be indicated by\r
1062                                                 // the text of a span with style 'mso-list : Ignore' or an image.\r
1063                                                 if ( isListBulletIndicator( element ) )\r
1064                                                 {\r
1065                                                         var listSymbolNode = element.firstChild( function( node )\r
1066                                                         {\r
1067                                                                 return node.value || node.name == 'img';\r
1068                                                         });\r
1069 \r
1070                                                         var listSymbol =  listSymbolNode && ( listSymbolNode.value || 'l.' ),\r
1071                                                                 listType = listSymbol && listSymbol.match( /^(?:[(]?)([^\s]+?)([.)]?)$/ );\r
1072 \r
1073                                                         if ( listType )\r
1074                                                         {\r
1075                                                                 var marker = createListBulletMarker( listType, listSymbol );\r
1076                                                                 // Some non-existed list items might be carried by an inconsequential list, indicate by "mso-hide:all/display:none",\r
1077                                                                 // those are to be removed later, now mark it with "cke:ignored".\r
1078                                                                 var ancestor = element.getAncestor( 'span' );\r
1079                                                                 if ( ancestor && (/ mso-hide:\s*all|display:\s*none /).test( ancestor.attributes.style ) )\r
1080                                                                         marker.attributes[ 'cke:ignored' ] = 1;\r
1081                                                                 return marker;\r
1082                                                         }\r
1083                                                 }\r
1084 \r
1085                                                 // Update the src attribute of image element with href.\r
1086                                                 var children = element.children,\r
1087                                                         attrs = element.attributes,\r
1088                                                         styleText = attrs && attrs.style,\r
1089                                                         firstChild = children && children[ 0 ];\r
1090 \r
1091                                                 // Assume MS-Word mostly carry font related styles on <span>,\r
1092                                                 // adapting them to editor's convention.\r
1093                                                 if ( styleText )\r
1094                                                 {\r
1095                                                         attrs.style = stylesFilter(\r
1096                                                                         [\r
1097                                                                                 // Drop 'inline-height' style which make lines overlapping.\r
1098                                                                                 [ 'line-height' ],\r
1099                                                                                 [ ( /^font-family$/ ), null, !removeFontStyles ? styleMigrateFilter( config[ 'font_style' ], 'family' ) : null ] ,\r
1100                                                                                 [ ( /^font-size$/ ), null, !removeFontStyles ? styleMigrateFilter( config[ 'fontSize_style' ], 'size' ) : null ] ,\r
1101                                                                                 [ ( /^color$/ ), null, !removeFontStyles ? styleMigrateFilter( config[ 'colorButton_foreStyle' ], 'color' ) : null ] ,\r
1102                                                                                 [ ( /^background-color$/ ), null, !removeFontStyles ? styleMigrateFilter( config[ 'colorButton_backStyle' ], 'color' ) : null ]\r
1103                                                                         ] )( styleText, element ) || '';\r
1104                                                 }\r
1105 \r
1106                                                 return null;\r
1107                                         },\r
1108 \r
1109                                         // Migrate basic style formats to editor configured ones.\r
1110                                         'b' : elementMigrateFilter( config[ 'coreStyles_bold' ] ),\r
1111                                         'i' : elementMigrateFilter( config[ 'coreStyles_italic' ] ),\r
1112                                         'u' : elementMigrateFilter( config[ 'coreStyles_underline' ] ),\r
1113                                         's' : elementMigrateFilter( config[ 'coreStyles_strike' ] ),\r
1114                                         'sup' : elementMigrateFilter( config[ 'coreStyles_superscript' ] ),\r
1115                                         'sub' : elementMigrateFilter( config[ 'coreStyles_subscript' ] ),\r
1116                                         // Editor doesn't support anchor with content currently (#3582),\r
1117                                         // drop such anchors with content preserved.\r
1118                                         'a' : function( element )\r
1119                                         {\r
1120                                                 var attrs = element.attributes;\r
1121                                                 if ( attrs && !attrs.href && attrs.name )\r
1122                                                         delete element.name;\r
1123                                         },\r
1124                                         'cke:listbullet' : function( element )\r
1125                                         {\r
1126                                                 if ( element.getAncestor( /h\d/ ) && !config.pasteFromWordNumberedHeadingToList )\r
1127                                                         delete element.name;\r
1128                                         }\r
1129                                 },\r
1130 \r
1131                                 attributeNames :\r
1132                                 [\r
1133                                         // Remove onmouseover and onmouseout events (from MS Word comments effect)\r
1134                                         [ ( /^onmouse(:?out|over)/ ), '' ],\r
1135                                         // Onload on image element.\r
1136                                         [ ( /^onload$/ ), '' ],\r
1137                                         // Remove office and vml attribute from elements.\r
1138                                         [ ( /(?:v|o):\w+/ ), '' ],\r
1139                                         // Remove lang/language attributes.\r
1140                                         [ ( /^lang/ ), '' ]\r
1141                                 ],\r
1142 \r
1143                                 attributes :\r
1144                                 {\r
1145                                         'style' : stylesFilter(\r
1146                                         removeStyles ?\r
1147                                         // Provide a white-list of styles that we preserve, those should\r
1148                                         // be the ones that could later be altered with editor tools.\r
1149                                         [\r
1150                                                 // Leave list-style-type\r
1151                                                 [ ( /^list-style-type$/ ), null ],\r
1152 \r
1153                                                 // Preserve margin-left/right which used as default indent style in the editor.\r
1154                                                 [ ( /^margin$|^margin-(?!bottom|top)/ ), null, function( value, element, name )\r
1155                                                         {\r
1156                                                                 if ( element.name in { p : 1, div : 1 } )\r
1157                                                                 {\r
1158                                                                         var indentStyleName = config.contentsLangDirection == 'ltr' ?\r
1159                                                                                         'margin-left' : 'margin-right';\r
1160 \r
1161                                                                         // Extract component value from 'margin' shorthand.\r
1162                                                                         if ( name == 'margin' )\r
1163                                                                         {\r
1164                                                                                 value = getStyleComponents( name, value,\r
1165                                                                                                 [ indentStyleName ] )[ indentStyleName ];\r
1166                                                                         }\r
1167                                                                         else if ( name != indentStyleName )\r
1168                                                                                 return null;\r
1169 \r
1170                                                                         if ( value && !emptyMarginRegex.test( value ) )\r
1171                                                                                 return [ indentStyleName, value ];\r
1172                                                                 }\r
1173 \r
1174                                                                 return null;\r
1175                                                         } ],\r
1176 \r
1177                                                 // Preserve clear float style.\r
1178                                                 [ ( /^clear$/ ) ],\r
1179 \r
1180                                                 [ ( /^border.*|margin.*|vertical-align|float$/ ), null,\r
1181                                                         function( value, element )\r
1182                                                         {\r
1183                                                                 if ( element.name == 'img' )\r
1184                                                                         return value;\r
1185                                                         } ],\r
1186 \r
1187                                                 [ (/^width|height$/ ), null,\r
1188                                                         function( value, element )\r
1189                                                         {\r
1190                                                                 if ( element.name in { table : 1, td : 1, th : 1, img : 1 } )\r
1191                                                                         return value;\r
1192                                                         } ]\r
1193                                         ] :\r
1194                                         // Otherwise provide a black-list of styles that we remove.\r
1195                                         [\r
1196                                                 [ ( /^mso-/ ) ],\r
1197                                                 // Fixing color values.\r
1198                                                 [ ( /-color$/ ), null, function( value )\r
1199                                                 {\r
1200                                                         if ( value == 'transparent' )\r
1201                                                                 return false;\r
1202                                                         if ( CKEDITOR.env.gecko )\r
1203                                                                 return value.replace( /-moz-use-text-color/g, 'transparent' );\r
1204                                                 } ],\r
1205                                                 // Remove empty margin values, e.g. 0.00001pt 0em 0pt\r
1206                                                 [ ( /^margin$/ ), emptyMarginRegex ],\r
1207                                                 [ 'text-indent', '0cm' ],\r
1208                                                 [ 'page-break-before' ],\r
1209                                                 [ 'tab-stops' ],\r
1210                                                 [ 'display', 'none' ],\r
1211                                                 removeFontStyles ? [ ( /font-?/ ) ] : null\r
1212                                         ], removeStyles ),\r
1213 \r
1214                                         // Prefer width styles over 'width' attributes.\r
1215                                         'width' : function( value, element )\r
1216                                         {\r
1217                                                 if ( element.name in dtd.$tableContent )\r
1218                                                         return false;\r
1219                                         },\r
1220                                         // Prefer border styles over table 'border' attributes.\r
1221                                         'border' : function( value, element )\r
1222                                         {\r
1223                                                 if ( element.name in dtd.$tableContent )\r
1224                                                         return false;\r
1225                                         },\r
1226 \r
1227                                         // Only Firefox carry style sheet from MS-Word, which\r
1228                                         // will be applied by us manually. For other browsers\r
1229                                         // the css className is useless.\r
1230                                         'class' : falsyFilter,\r
1231 \r
1232                                         // MS-Word always generate 'background-color' along with 'bgcolor',\r
1233                                         // simply drop the deprecated attributes.\r
1234                                         'bgcolor' : falsyFilter,\r
1235 \r
1236                                         // Deprecate 'valign' attribute in favor of 'vertical-align'.\r
1237                                         'valign' : removeStyles ? falsyFilter : function( value, element )\r
1238                                         {\r
1239                                                 element.addStyle( 'vertical-align', value );\r
1240                                                 return false;\r
1241                                         }\r
1242                                 },\r
1243 \r
1244                                 // Fore none-IE, some useful data might be buried under these IE-conditional\r
1245                                 // comments where RegExp were the right approach to dig them out where usual approach\r
1246                                 // is transform it into a fake element node which hold the desired data.\r
1247                                 comment :\r
1248                                         !CKEDITOR.env.ie ?\r
1249                                                 function( value, node )\r
1250                                                 {\r
1251                                                         var imageInfo = value.match( /<img.*?>/ ),\r
1252                                                                 listInfo = value.match( /^\[if !supportLists\]([\s\S]*?)\[endif\]$/ );\r
1253 \r
1254                                                         // Seek for list bullet indicator.\r
1255                                                         if ( listInfo )\r
1256                                                         {\r
1257                                                                 // Bullet symbol could be either text or an image.\r
1258                                                                 var listSymbol = listInfo[ 1 ] || ( imageInfo && 'l.' ),\r
1259                                                                         listType = listSymbol && listSymbol.match( />(?:[(]?)([^\s]+?)([.)]?)</ );\r
1260                                                                 return createListBulletMarker( listType, listSymbol );\r
1261                                                         }\r
1262 \r
1263                                                         // Reveal the <img> element in conditional comments for Firefox.\r
1264                                                         if ( CKEDITOR.env.gecko && imageInfo )\r
1265                                                         {\r
1266                                                                 var img = CKEDITOR.htmlParser.fragment.fromHtml( imageInfo[ 0 ] ).children[ 0 ],\r
1267                                                                         previousComment = node.previous,\r
1268                                                                         // Try to dig the real image link from vml markup from previous comment text.\r
1269                                                                         imgSrcInfo = previousComment && previousComment.value.match( /<v:imagedata[^>]*o:href=['"](.*?)['"]/ ),\r
1270                                                                         imgSrc = imgSrcInfo && imgSrcInfo[ 1 ];\r
1271 \r
1272                                                                 // Is there a real 'src' url to be used?\r
1273                                                                 imgSrc && ( img.attributes.src = imgSrc );\r
1274                                                                 return img;\r
1275                                                         }\r
1276 \r
1277                                                         return false;\r
1278                                                 }\r
1279                                         : falsyFilter\r
1280                         };\r
1281                 }\r
1282         });\r
1283 \r
1284         // The paste processor here is just a reduced copy of html data processor.\r
1285         var pasteProcessor = function()\r
1286         {\r
1287                 this.dataFilter = new CKEDITOR.htmlParser.filter();\r
1288         };\r
1289 \r
1290         pasteProcessor.prototype =\r
1291         {\r
1292                 toHtml : function( data )\r
1293                 {\r
1294                         var fragment = CKEDITOR.htmlParser.fragment.fromHtml( data, false ),\r
1295                                 writer = new CKEDITOR.htmlParser.basicWriter();\r
1296 \r
1297                         fragment.writeHtml( writer, this.dataFilter );\r
1298                         return writer.getHtml( true );\r
1299                 }\r
1300         };\r
1301 \r
1302         CKEDITOR.cleanWord = function( data, editor )\r
1303         {\r
1304                 // Firefox will be confused by those downlevel-revealed IE conditional\r
1305                 // comments, fixing them first( convert it to upperlevel-revealed one ).\r
1306                 // e.g. <![if !vml]>...<![endif]>\r
1307                 if ( CKEDITOR.env.gecko )\r
1308                         data = data.replace( /(<!--\[if[^<]*?\])-->([\S\s]*?)<!--(\[endif\]-->)/gi, '$1$2$3' );\r
1309 \r
1310                 var dataProcessor = new pasteProcessor(),\r
1311                         dataFilter = dataProcessor.dataFilter;\r
1312 \r
1313                 // These rules will have higher priorities than default ones.\r
1314                 dataFilter.addRules( CKEDITOR.plugins.pastefromword.getRules( editor ) );\r
1315 \r
1316                 // Allow extending data filter rules.\r
1317                 editor.fire( 'beforeCleanWord', { filter : dataFilter } );\r
1318 \r
1319                 try\r
1320                 {\r
1321                         data = dataProcessor.toHtml( data, false );\r
1322                 }\r
1323                 catch ( e )\r
1324                 {\r
1325                         alert( editor.lang.pastefromword.error );\r
1326                 }\r
1327 \r
1328                 /* Below post processing those things that are unable to delivered by filter rules. */\r
1329 \r
1330                 // Remove 'cke' namespaced attribute used in filter rules as marker.\r
1331                 data = data.replace( /cke:.*?".*?"/g, '' );\r
1332 \r
1333                 // Remove empty style attribute.\r
1334                 data = data.replace( /style=""/g, '' );\r
1335 \r
1336                 // Remove the dummy spans ( having no inline style ).\r
1337                 data = data.replace( /<span>/g, '' );\r
1338 \r
1339                 return data;\r
1340         };\r
1341 })();\r
1342 \r
1343 /**\r
1344  * Whether to ignore all font related formatting styles, including:\r
1345  * <ul> <li>font size;</li>\r
1346  *              <li>font family;</li>\r
1347  *              <li>font foreground/background color.</li></ul>\r
1348  * @name CKEDITOR.config.pasteFromWordRemoveFontStyles\r
1349  * @since 3.1\r
1350  * @type Boolean\r
1351  * @default true\r
1352  * @example\r
1353  * config.pasteFromWordRemoveFontStyles = false;\r
1354  */\r
1355 \r
1356 /**\r
1357  * Whether to transform MS Word outline numbered headings into lists.\r
1358  * @name CKEDITOR.config.pasteFromWordNumberedHeadingToList\r
1359  * @since 3.1\r
1360  * @type Boolean\r
1361  * @default false\r
1362  * @example\r
1363  * config.pasteFromWordNumberedHeadingToList = true;\r
1364  */\r
1365 \r
1366 /**\r
1367  * Whether to remove element styles that can't be managed with the editor. Note\r
1368  * that this doesn't handle the font specific styles, which depends on the\r
1369  * {@link CKEDITOR.config.pasteFromWordRemoveFontStyles} setting instead.\r
1370  * @name CKEDITOR.config.pasteFromWordRemoveStyles\r
1371  * @since 3.1\r
1372  * @type Boolean\r
1373  * @default true\r
1374  * @example\r
1375  * config.pasteFromWordRemoveStyles = false;\r
1376  */\r