JasonWoof Got questions, comments, patches, etc.? Contact Jason Woofenden
vanilla ckeditor-3.6.1
[ckeditor.git] / _source / plugins / pastefromword / filter / default.js
1 /*\r
2 Copyright (c) 2003-2011, CKSource - Frederico Knabben. All rights reserved.\r
3 For licensing, see LICENSE.html or http://ckeditor.com/license\r
4 */\r
5 \r
6 (function()\r
7 {\r
8         var fragmentPrototype = CKEDITOR.htmlParser.fragment.prototype,\r
9                 elementPrototype = CKEDITOR.htmlParser.element.prototype;\r
10 \r
// Return the sole child of this node. Yields null when the node has no
// children, more than one child, or a falsy single entry.
fragmentPrototype.onlyChild = elementPrototype.onlyChild = function()
{
    var nodes = this.children;

    if ( nodes.length != 1 )
        return null;

    return nodes[ 0 ] || null;
};
18 \r
// Detach every descendant element named `tagName` and return the detached
// elements as an array. Direct children are spliced out of this.children;
// deeper matches are removed by the recursive call on each element child
// (the recursion also visits a child that has just been detached).
// Children without a `name` are skipped.
elementPrototype.removeAnyChildWithName = function( tagName )
{
    var nodes = this.children,
        removed = [],
        index = 0,
        node;

    while ( index < nodes.length )
    {
        node = nodes[ index ];

        if ( node.name )
        {
            if ( node.name == tagName )
            {
                removed.push( node );
                // Step back so the element that slides into this slot is
                // examined on the next pass.
                nodes.splice( index, 1 );
                index--;
            }

            removed = removed.concat( node.removeAnyChildWithName( tagName ) );
        }

        index++;
    }

    return removed;
};
40 \r
// Walk up the `parent` chain and return the closest ancestor whose name
// matches `tagNameRegex`. When the chain is exhausted the falsy value that
// ended it is returned.
elementPrototype.getAncestor = function( tagNameRegex )
{
    var node = this.parent;

    for ( ; node; node = node.parent )
    {
        if ( node.name && node.name.match( tagNameRegex ) )
            break;
    }

    return node;
};
48 \r
// Depth-first, document-order search: return the first descendant for
// which `evaluator( node )` is truthy, or null when none qualifies.
// Only children that have a `name` are searched recursively.
fragmentPrototype.firstChild = elementPrototype.firstChild = function( evaluator )
{
    var index = 0,
        node,
        found;

    while ( index < this.children.length )
    {
        node = this.children[ index++ ];

        if ( evaluator( node ) )
            return node;

        if ( node.name )
        {
            found = node.firstChild( evaluator );
            if ( found )
                return found;
        }
    }

    return null;
};
68 \r
// Add one or more style declarations to the element's 'style' attribute.
//
// Supported call forms:
//   addStyle( name, value [, isPrepend] )  - a single name/value pair
//                                            (value must be a string);
//   addStyle( stylesObject [, isPrepend] ) - an object literal of pairs;
//   addStyle( styleText [, isPrepend] )    - raw style text.
//
// When isPrepend is truthy the new declarations are placed before the
// existing ones, otherwise after them. The 'attributes' object is created
// when the element does not have one yet.
elementPrototype.addStyle = function( name, value, isPrepend )
{
    var styleText, addingStyleText = '';

    // name/value pair.
    if ( typeof value == 'string' )
        addingStyleText += name + ':' + value + ';';
    else
    {
        // style literal.
        if ( typeof name == 'object' )
        {
            for ( var style in name )
            {
                if ( Object.prototype.hasOwnProperty.call( name, style ) )
                    addingStyleText += style + ':' + name[ style ] + ';';
            }
        }
        // raw style text form.
        else
            addingStyleText += name;

        // In the two-argument forms the second argument is the prepend flag.
        isPrepend = value;
    }

    if ( !this.attributes )
        this.attributes = {};

    styleText = this.attributes.style || '';

    styleText = ( isPrepend ?
            [ addingStyleText, styleText ]
            : [ styleText, addingStyleText ] ).join( ';' );

    // Joining can leave leading or doubled separators. The pattern must be
    // global: a non-global replace fixes only the first occurrence and
    // leaves empty declarations behind (e.g. ';' or 'a:b;;c:d;;').
    this.attributes.style = styleText.replace( /^;+|;(?=;)/g, '' );
};
105 \r
/**
 * Collect the names of the DTD entries that list the given tag as an
 * allowed child.
 * @param tagName Tag name to look up inside every DTD entry.
 * @returns Object whose keys are the matching entry names (each value is 1).
 *          Entries whose name contains '$' are ignored.
 */
CKEDITOR.dtd.parentOf = function( tagName )
{
    var parents = {},
        name;

    for ( name in this )
    {
        if ( name.indexOf( '$' ) != -1 )
            continue;

        if ( this[ name ][ tagName ] )
            parents[ name ] = 1;
    }

    return parents;
};
120 \r
// Tidy up an assembled list element:
// 1. drop a list item's 'value' attribute when it equals the item's
//    1-based position;
// 2. when every item that declares a list-style-type declares the same
//    one, strip it from the items and set it once on the list itself.
// Nothing is touched when the list already carries a list-style-type.
function postProcessList( list )
{
    var items = list.children,
        total = list.children.length,
        listStylePattern = /list-style-type:(.*?)(?:;|$)/,
        stylesFilter = CKEDITOR.plugins.pastefromword.filters.stylesFilter,
        sharedType,
        item,
        itemAttrs,
        found,
        index;

    if ( listStylePattern.exec( list.attributes.style ) )
        return;

    for ( index = 0; index < total; index++ )
    {
        item = items[ index ];

        if ( item.attributes.value && Number( item.attributes.value ) == index + 1 )
            delete item.attributes.value;

        found = listStylePattern.exec( item.attributes.style );
        if ( !found )
            continue;

        // Two different types among the items: nothing can be merged, and
        // the remaining items are left unprocessed.
        if ( sharedType && found[ 1 ] != sharedType )
        {
            sharedType = null;
            break;
        }

        sharedType = found[ 1 ];
    }

    if ( !sharedType )
        return;

    for ( index = 0; index < total; index++ )
    {
        itemAttrs = items[ index ].attributes;
        if ( itemAttrs.style )
            itemAttrs.style = stylesFilter( [ [ 'list-style-type'] ] )( itemAttrs.style ) || '';
    }

    list.addStyle( 'list-style-type', sharedType );
}
170 \r
// Leading "<number><unit>" of a CSS value: group 1 is the numeric part
// (digits and dots, possibly empty), group 2 the unit, case-insensitive.
// The numeric group is deliberately NOT wrapped in a second quantifier:
// '([.\d]*)+' backtracks exponentially on a long run of digits that is not
// followed by a unit, which pasted (untrusted) content can trigger.
var cssLengthRelativeUnit = /^([.\d]*)(em|ex|px|gd|rem|vw|vh|vm|ch|mm|cm|in|pt|pc|deg|rad|ms|s|hz|khz)/i;
var emptyMarginRegex = /^(?:\b0[^\s]*\s*){1,4}$/;               // e.g. 0px 0pt 0px
// Roman numeral literal; the upper-case variant is derived from the
// lower-case pattern source.
var romanLiternalPattern = '^m{0,4}(cm|cd|d?c{0,3})(xc|xl|l?x{0,3})(ix|iv|v?i{0,3})$',
    lowerRomanLiteralRegex = new RegExp( romanLiternalPattern ),
    upperRomanLiteralRegex = new RegExp( romanLiternalPattern.toUpperCase() );

// Bullet-text patterns keyed by list-style-type, grouped by list tag name.
var orderedPatterns = { 'decimal' : /\d+/, 'lower-roman': lowerRomanLiteralRegex, 'upper-roman': upperRomanLiteralRegex, 'lower-alpha' : /^[a-z]+$/, 'upper-alpha': /^[A-Z]+$/ },
    unorderedPatterns = { 'disc' : /[l\u00B7\u2002]/, 'circle' : /[\u006F\u00D8]/,'square' : /[\u006E\u25C6]/},
    listMarkerPatterns = { 'ol' : orderedPatterns, 'ul' : unorderedPatterns },
    // [ value, symbol ] pairs in descending value order, consumed by fromRoman().
    romans = [ [1000, 'M'], [900, 'CM'], [500, 'D'], [400, 'CD'], [100, 'C'], [90, 'XC'], [50, 'L'], [40, 'XL'], [10, 'X'], [9, 'IX'], [5, 'V'], [4, 'IV'], [1, 'I'] ],
    // Letter table consumed by fromAlphabet().
    alpahbets = "ABCDEFGHIJKLMNOPQRSTUVWXYZ";
182 \r
// Convert a roman numeral (any letter case) to its decimal value by
// repeatedly stripping the largest matching symbol from the front of the
// text. Characters that match no symbol are ignored, so text without any
// leading roman symbol yields 0.
function fromRoman( str )
{
    var rest = str.toUpperCase(),
        total = 0,
        index,
        entry,
        symbol;

    for ( index = 0; index < romans.length; index++ )
    {
        entry = romans[ index ];
        symbol = entry[ 1 ];

        while ( rest.substr( 0, symbol.length ) == symbol )
        {
            total += entry[ 0 ];
            rest = rest.substr( symbol.length );
        }
    }

    return total;
}
195 \r
// Convert alphabetic numbering (any letter case) back to decimal using
// bijective base-26: A=1 ... Z=26, AA=27, AB=28, ... ZZ=702.
// Every letter contributes ( position in the alphabet + 1 ); the previous
// implementation added the +1 only once for the whole string, so
// multi-letter markers collapsed (e.g. "AA" became 1).
// Characters outside A-Z count as 0; an empty string yields 0.
function fromAlphabet( str )
{
    str = str.toUpperCase();
    var base = alpahbets.length,
        retVal = 0;

    for ( var i = 0; i < str.length; i++ )
        retVal = retVal * base + ( alpahbets.indexOf( str.charAt( i ) ) + 1 );

    return retVal;
}
208 \r
// State shared between the list filters while walking consecutive list
// items; all three are reset to null by resolveList() when an element
// turns out not to be a list item.

// Margin increment taken as one indent level (0 until it has been measured).
var listBaseIndent = 0;

// Margin of the previously seen list item, null before the first one.
var previousListItemMargin = null;

// List id from the previous item's 'mso-list' style (initially undefined).
var previousListId;
212 \r
213         var plugin = ( CKEDITOR.plugins.pastefromword =\r
214         {\r
215                 utils :\r
216                 {\r
217                         // Create a <cke:listbullet> which indicate an list item type.\r
218                         createListBulletMarker : function ( bullet, bulletText )\r
219                         {\r
220                                 var marker = new CKEDITOR.htmlParser.element( 'cke:listbullet' );\r
221                                 marker.attributes = { 'cke:listsymbol' : bullet[ 0 ] };\r
222                                 marker.add( new CKEDITOR.htmlParser.text( bulletText ) );\r
223                                 return marker;\r
224                         },\r
225 \r
226                         isListBulletIndicator : function( element )\r
227                         {\r
228                                 var styleText = element.attributes && element.attributes.style;\r
229                                 if ( /mso-list\s*:\s*Ignore/i.test( styleText ) )\r
230                                         return true;\r
231                         },\r
232 \r
233                         isContainingOnlySpaces : function( element )\r
234                         {\r
235                                 var text;\r
236                                 return ( ( text = element.onlyChild() )\r
237                                             && ( /^(:?\s|&nbsp;)+$/ ).test( text.value ) );\r
238                         },\r
239 \r
240                         resolveList : function( element )\r
241                         {\r
242                                 // <cke:listbullet> indicate a list item.\r
243                                 var attrs = element.attributes,\r
244                                         listMarker;\r
245 \r
246                                 if ( ( listMarker = element.removeAnyChildWithName( 'cke:listbullet' ) )\r
247                                                 && listMarker.length\r
248                                                 && ( listMarker = listMarker[ 0 ] ) )\r
249                                 {\r
250                                         element.name = 'cke:li';\r
251 \r
252                                         if ( attrs.style )\r
253                                         {\r
254                                                 attrs.style = plugin.filters.stylesFilter(\r
255                                                                 [\r
256                                                                         // Text-indent is not representing list item level any more.\r
257                                                                         [ 'text-indent' ],\r
258                                                                         [ 'line-height' ],\r
259                                                                         // First attempt is to resolve indent level from on a constant margin increment.\r
260                                                                         [ ( /^margin(:?-left)?$/ ), null, function( margin )\r
261                                                                         {\r
262                                                                                 // Deal with component/short-hand form.\r
263                                                                                 var values = margin.split( ' ' );\r
264                                                                                 margin = CKEDITOR.tools.convertToPx( values[ 3 ] || values[ 1 ] || values [ 0 ] );\r
265 \r
266                                                                                 // Figure out the indent unit by checking the first time of incrementation.\r
267                                                                                 if ( !listBaseIndent && previousListItemMargin !== null && margin > previousListItemMargin )\r
268                                                                                         listBaseIndent = margin - previousListItemMargin;\r
269 \r
270                                                                                 previousListItemMargin = margin;\r
271 \r
272                                                                                 attrs[ 'cke:indent' ] = listBaseIndent && ( Math.ceil( margin / listBaseIndent ) + 1 ) || 1;\r
273                                                                         } ],\r
274                                                                         // The best situation: "mso-list:l0 level1 lfo2" tells the belonged list root, list item indentation, etc.\r
275                                                                         [ ( /^mso-list$/ ), null, function( val )\r
276                                                                         {\r
277                                                                                 val = val.split( ' ' );\r
278                                                                                 var listId = Number( val[ 0 ].match( /\d+/ ) ),\r
279                                                                                         indent = Number( val[ 1 ].match( /\d+/ ) );\r
280 \r
281                                                                                 if ( indent == 1 )\r
282                                                                                 {\r
283                                                                                         listId !== previousListId && ( attrs[ 'cke:reset' ] = 1 );\r
284                                                                                         previousListId = listId;\r
285                                                                                 }\r
286                                                                                 attrs[ 'cke:indent' ] = indent;\r
287                                                                         } ]\r
288                                                                 ] )( attrs.style, element ) || '';\r
289                                         }\r
290 \r
291                                         // First level list item might be presented without a margin.\r
292 \r
293 \r
294                                         // In case all above doesn't apply.\r
295                                         if ( !attrs[ 'cke:indent' ] )\r
296                                         {\r
297                                                 previousListItemMargin = 0;\r
298                                                 attrs[ 'cke:indent' ] = 1;\r
299                                         }\r
300 \r
301                                         // Inherit attributes from bullet.\r
302                                         CKEDITOR.tools.extend( attrs, listMarker.attributes );\r
303                                         return true;\r
304                                 }\r
305                                 // Current list disconnected.\r
306                                 else\r
307                                         previousListId = previousListItemMargin = listBaseIndent = null;\r
308 \r
309                                 return false;\r
310                         },\r
311 \r
312                         // Providing a shorthand style then retrieve one or more style component values.\r
313                         getStyleComponents : ( function()\r
314                         {\r
315                                 var calculator = CKEDITOR.dom.element.createFromHtml(\r
316                                                                 '<div style="position:absolute;left:-9999px;top:-9999px;"></div>',\r
317                                                                 CKEDITOR.document );\r
318                                 CKEDITOR.document.getBody().append( calculator );\r
319 \r
320                                 return function( name, styleValue, fetchList )\r
321                                 {\r
322                                         calculator.setStyle( name, styleValue );\r
323                                         var styles = {},\r
324                                                 count = fetchList.length;\r
325                                         for ( var i = 0; i < count; i++ )\r
326                                                 styles[ fetchList[ i ] ]  = calculator.getStyle( fetchList[ i ] );\r
327 \r
328                                         return styles;\r
329                                 };\r
330                         } )(),\r
331 \r
332                         listDtdParents : CKEDITOR.dtd.parentOf( 'ol' )\r
333                 },\r
334 \r
335                 filters :\r
336                 {\r
337                                 // Transform a normal list into flat list items only presentation.\r
338                                 // E.g. <ul><li>level1<ol><li>level2</li></ol></li> =>\r
339                                 // <cke:li cke:listtype="ul" cke:indent="1">level1</cke:li>\r
340                                 // <cke:li cke:listtype="ol" cke:indent="2">level2</cke:li>\r
341                                 flattenList : function( element, level )\r
342                                 {\r
343                                         level = typeof level == 'number' ? level : 1;\r
344 \r
345                                         var     attrs = element.attributes,\r
346                                                 listStyleType;\r
347 \r
348                                         // All list items are of the same type.\r
349                                         switch ( attrs.type )\r
350                                         {\r
351                                                 case 'a' :\r
352                                                         listStyleType = 'lower-alpha';\r
353                                                         break;\r
354                                                 case '1' :\r
355                                                         listStyleType = 'decimal';\r
356                                                         break;\r
357                                                 // TODO: Support more list style type from MS-Word.\r
358                                         }\r
359 \r
360                                         var children = element.children,\r
361                                                 child;\r
362 \r
363                                         for ( var i = 0; i < children.length; i++ )\r
364                                         {\r
365                                                 child = children[ i ];\r
366 \r
367                                                 if ( child.name in CKEDITOR.dtd.$listItem )\r
368                                                 {\r
369                                                         var attributes = child.attributes,\r
370                                                                 listItemChildren = child.children,\r
371                                                                 count = listItemChildren.length,\r
372                                                                 last = listItemChildren[ count - 1 ];\r
373 \r
374                                                         // Move out nested list.\r
375                                                         if ( last.name in CKEDITOR.dtd.$list )\r
376                                                         {\r
377                                                                 element.add( last, i + 1 );\r
378 \r
379                                                                 // Remove the parent list item if it's just a holder.\r
380                                                                 if ( !--listItemChildren.length )\r
381                                                                         children.splice( i--, 1 );\r
382                                                         }\r
383 \r
384                                                         child.name = 'cke:li';\r
385 \r
386                                                         // Inherit numbering from list root on the first list item.\r
387                                                         attrs.start && !i && ( attributes.value = attrs.start );\r
388 \r
389                                                         plugin.filters.stylesFilter(\r
390                                                                 [\r
391                                                                         [ 'tab-stops', null, function( val )\r
392                                                                         {\r
393                                                                                 var margin = val.split( ' ' )[ 1 ].match( cssLengthRelativeUnit );\r
394                                                                                 margin && ( previousListItemMargin = CKEDITOR.tools.convertToPx( margin[ 0 ] ) );\r
395                                                                         } ],\r
396                                                                         ( level == 1 ? [ 'mso-list', null, function( val )\r
397                                                                         {\r
398                                                                                 val = val.split( ' ' );\r
399                                                                                 var listId = Number( val[ 0 ].match( /\d+/ ) );\r
400                                                                                 listId !== previousListId && ( attributes[ 'cke:reset' ] = 1 );\r
401                                                                                 previousListId = listId;\r
402                                                                          } ] : null )\r
403                                                                 ] )( attributes.style );\r
404 \r
405                                                         attributes[ 'cke:indent' ] = level;\r
406                                                         attributes[ 'cke:listtype' ] = element.name;\r
407                                                         attributes[ 'cke:list-style-type' ] = listStyleType;\r
408                                                 }\r
409                                                 // Flatten sub list.\r
410                                                 else if ( child.name in CKEDITOR.dtd.$list )\r
411                                                 {\r
412                                                         // Absorb sub list children.\r
413                                                         arguments.callee.apply( this, [ child, level + 1 ] );\r
414                                                         children = children.slice( 0, i ).concat( child.children ).concat( children.slice( i + 1 ) );\r
415                                                         element.children = [];\r
416                                                         for ( var j = 0, num = children.length; j < num ; j++ )\r
417                                                                 element.add( children[ j ] );\r
418                                                 }\r
419                                         }\r
420 \r
421                                         delete element.name;\r
422 \r
423                                         // We're loosing tag name here, signalize this element as a list.\r
424                                         attrs[ 'cke:list' ] = 1;\r
425                                 },\r
426 \r
427                                 /**\r
428                                  *  Try to collect all list items among the children and establish one\r
429                                  *  or more HTML list structures for them.\r
430                                  * @param element\r
431                                  */\r
432                                 assembleList : function( element )\r
433                                 {\r
434                                         var children = element.children, child,\r
435                                                         listItem,   // The current processing cke:li element.\r
436                                                         listItemAttrs,\r
437                                                         listItemIndent, // Indent level of current list item.\r
438                                                         lastIndent,\r
439                                                         lastListItem, // The previous one just been added to the list.\r
440                                                         list, // Current staging list and it's parent list if any.\r
441                                                         openedLists = [],\r
442                                                         previousListStyleType,\r
443                                                         previousListType;\r
444 \r
445                                         // Properties of the list item are to be resolved from the list bullet.\r
446                                         var bullet,\r
447                                                 listType,\r
448                                                 listStyleType,\r
449                                                 itemNumeric;\r
450 \r
451                                         for ( var i = 0; i < children.length; i++ )\r
452                                         {\r
453                                                 child = children[ i ];\r
454 \r
455                                                 if ( 'cke:li' == child.name )\r
456                                                 {\r
457                                                         child.name = 'li';\r
458                                                         listItem = child;\r
459                                                         listItemAttrs = listItem.attributes;\r
460                                                         bullet = listItemAttrs[ 'cke:listsymbol' ];\r
461                                                         bullet = bullet && bullet.match( /^(?:[(]?)([^\s]+?)([.)]?)$/ );\r
462                                                         listType = listStyleType = itemNumeric = null;\r
463 \r
464                                                         if ( listItemAttrs[ 'cke:ignored' ] )\r
465                                                         {\r
466                                                                 children.splice( i--, 1 );\r
467                                                                 continue;\r
468                                                         }\r
469 \r
470 \r
471                                                         // This's from a new list root.\r
472                                                         listItemAttrs[ 'cke:reset' ] && ( list = lastIndent = lastListItem = null );\r
473 \r
474                                                         // List item indent level might come from a real list indentation or\r
475                                                         // been resolved from a pseudo list item's margin value, even get\r
476                                                         // no indentation at all.\r
477                                                         listItemIndent = Number( listItemAttrs[ 'cke:indent' ] );\r
478 \r
479                                                         // We're moving out of the current list, cleaning up.\r
480                                                         if ( listItemIndent != lastIndent )\r
481                                                                 previousListType = previousListStyleType = null;\r
482 \r
483                                                         // List type and item style are already resolved.\r
484                                                         if ( !bullet )\r
485                                                         {\r
486                                                                 listType = listItemAttrs[ 'cke:listtype' ] || 'ol';\r
487                                                                 listStyleType = listItemAttrs[ 'cke:list-style-type' ];\r
488                                                         }\r
489                                                         else\r
490                                                         {\r
491                                                                 // Probably share the same list style type with previous list item,\r
492                                                                 // give it priority to avoid ambiguous between C(Alpha) and C.(Roman).\r
493                                                                 if ( previousListType && listMarkerPatterns[ previousListType ] [ previousListStyleType ].test( bullet[ 1 ] ) )\r
494                                                                 {\r
495                                                                         listType = previousListType;\r
496                                                                         listStyleType = previousListStyleType;\r
497                                                                 }\r
498                                                                 else\r
499                                                                 {\r
500                                                                         for ( var type in listMarkerPatterns )\r
501                                                                         {\r
502                                                                                 for ( var style in listMarkerPatterns[ type ] )\r
503                                                                                 {\r
504                                                                                         if ( listMarkerPatterns[ type ][ style ].test( bullet[ 1 ] ) )\r
505                                                                                         {\r
506                                                                                                 // Small numbering has higher priority, when dealing with ambiguous\r
507                                                                                                 // between C(Alpha) and C.(Roman).\r
508                                                                                                 if ( type == 'ol' && ( /alpha|roman/ ).test( style ) )\r
509                                                                                                 {\r
510                                                                                                         var num = /roman/.test( style ) ? fromRoman( bullet[ 1 ] ) : fromAlphabet( bullet[ 1 ] );\r
511                                                                                                         if ( !itemNumeric || num < itemNumeric )\r
512                                                                                                         {\r
513                                                                                                                 itemNumeric = num;\r
514                                                                                                                 listType = type;\r
515                                                                                                                 listStyleType = style;\r
516                                                                                                         }\r
517                                                                                                 }\r
518                                                                                                 else\r
519                                                                                                 {\r
520                                                                                                         listType = type;\r
521                                                                                                         listStyleType = style;\r
522                                                                                                         break;\r
523                                                                                                 }\r
524                                                                                         }\r
525                                                                                 }\r
526                                                                         }\r
527                                                                 }\r
528 \r
529                                                                 // Simply use decimal/disc for the rest forms of unrepresentable\r
530                                                                 // numerals, e.g. Chinese..., but as long as there a second part\r
531                                                                 // included, it has a bigger chance of being a order list ;)\r
532                                                                 !listType && ( listType = bullet[ 2 ] ? 'ol' : 'ul' );\r
533                                                         }\r
534 \r
535                                                         previousListType = listType;\r
536                                                         previousListStyleType = listStyleType || ( listType == 'ol' ? 'decimal' : 'disc' );\r
537                                                         if ( listStyleType && listStyleType != ( listType == 'ol' ? 'decimal' : 'disc' ) )\r
538                                                                 listItem.addStyle( 'list-style-type', listStyleType );\r
539 \r
540                                                         // Figure out start numbering.\r
541                                                         if ( listType == 'ol' && bullet )\r
542                                                         {\r
543                                                                 switch ( listStyleType )\r
544                                                                 {\r
545                                                                         case 'decimal' :\r
546                                                                                 itemNumeric = Number( bullet[ 1 ] );\r
547                                                                                 break;\r
548                                                                         case 'lower-roman':\r
549                                                                         case 'upper-roman':\r
550                                                                                 itemNumeric = fromRoman( bullet[ 1 ] );\r
551                                                                                 break;\r
552                                                                         case 'lower-alpha':\r
553                                                                         case 'upper-alpha':\r
554                                                                                 itemNumeric = fromAlphabet( bullet[ 1 ] );\r
555                                                                                 break;\r
556                                                                 }\r
557 \r
558                                                                 // Always create the numbering, swipe out unnecessary ones later.\r
559                                                                 listItem.attributes.value = itemNumeric;\r
560                                                         }\r
561 \r
562                                                         // Start the list construction.\r
563                                                         if ( !list )\r
564                                                         {\r
565                                                                 openedLists.push( list = new CKEDITOR.htmlParser.element( listType ) );\r
566                                                                 list.add( listItem );\r
567                                                                 children[ i ] = list;\r
568                                                         }\r
569                                                         else\r
570                                                         {\r
571                                                                 if ( listItemIndent > lastIndent )\r
572                                                                 {\r
573                                                                         openedLists.push( list = new CKEDITOR.htmlParser.element( listType ) );\r
574                                                                         list.add( listItem );\r
575                                                                         lastListItem.add( list );\r
576                                                                 }\r
577                                                                 else if ( listItemIndent < lastIndent )\r
578                                                                 {\r
579                                                                         // There might be a negative gap between two list levels. (#4944)\r
580                                                                         var diff = lastIndent - listItemIndent,\r
581                                                                                         parent;\r
582                                                                         while ( diff-- && ( parent = list.parent ) )\r
583                                                                                 list = parent.parent;\r
584 \r
585                                                                         list.add( listItem );\r
586                                                                 }\r
587                                                                 else\r
588                                                                         list.add( listItem );\r
589 \r
590                                                                 children.splice( i--, 1 );\r
591                                                         }\r
592 \r
593                                                         lastListItem = listItem;\r
594                                                         lastIndent = listItemIndent;\r
595                                                 }\r
596                                                 else if ( list )\r
597                                                         list = lastIndent = lastListItem = null;\r
598                                         }\r
599 \r
600                                         for ( i = 0; i < openedLists.length; i++ )\r
601                                                 postProcessList( openedLists[ i ] );\r
602 \r
603                                         list = lastIndent = lastListItem = previousListId = previousListItemMargin = listBaseIndent = null;\r
604                                 },\r
605 \r
606                                 /**\r
607                                  * A simple filter which always rejecting.\r
608                                  */\r
609                                 falsyFilter : function( value )\r
610                                 {\r
611                                         return false;\r
612                                 },\r
613 \r
614                                 /**\r
615                                  * A filter dedicated on the 'style' attribute filtering, e.g. dropping/replacing style properties.\r
616                                  * @param styles {Array} in form of [ styleNameRegexp, styleValueRegexp,\r
617                                  *  newStyleValue/newStyleGenerator, newStyleName ] where only the first\r
618                                  *  parameter is mandatory.\r
619                                  * @param whitelist {Boolean} Whether the {@param styles} will be considered as a white-list.\r
620                                  */\r
621                                 stylesFilter : function( styles, whitelist )\r
622                                 {\r
623                                         return function( styleText, element )\r
624                                         {\r
625                                                  var rules = [];\r
626                                                 // html-encoded quote might be introduced by 'font-family'\r
627                                                 // from MS-Word which confused the following regexp. e.g.\r
628                                                 //'font-family: &quot;Lucida, Console&quot;'\r
629                                                 ( styleText || '' )\r
630                                                         .replace( /&quot;/g, '"' )\r
631                                                         .replace( /\s*([^ :;]+)\s*:\s*([^;]+)\s*(?=;|$)/g,\r
632                                                                  function( match, name, value )\r
633                                                                  {\r
634                                                                          name = name.toLowerCase();\r
635                                                                          name == 'font-family' && ( value = value.replace( /["']/g, '' ) );\r
636 \r
637                                                                          var namePattern,\r
638                                                                                  valuePattern,\r
639                                                                                  newValue,\r
640                                                                                  newName;\r
641                                                                          for ( var i = 0 ; i < styles.length; i++ )\r
642                                                                          {\r
643                                                                                 if ( styles[ i ] )\r
644                                                                                 {\r
645                                                                                         namePattern = styles[ i ][ 0 ];\r
646                                                                                         valuePattern = styles[ i ][ 1 ];\r
647                                                                                         newValue = styles[ i ][ 2 ];\r
648                                                                                         newName = styles[ i ][ 3 ];\r
649 \r
650                                                                                         if ( name.match( namePattern )\r
651                                                                                                  && ( !valuePattern || value.match( valuePattern ) ) )\r
652                                                                                         {\r
653                                                                                                 name = newName || name;\r
654                                                                                                 whitelist && ( newValue = newValue || value );\r
655 \r
656                                                                                                 if ( typeof newValue == 'function' )\r
657                                                                                                         newValue = newValue( value, element, name );\r
658 \r
659                                                                                                 // Return an couple indicate both name and value\r
660                                                                                                 // changed.\r
661                                                                                                 if ( newValue && newValue.push )\r
662                                                                                                         name = newValue[ 0 ], newValue = newValue[ 1 ];\r
663 \r
664                                                                                                 if ( typeof newValue == 'string' )\r
665                                                                                                         rules.push( [ name, newValue ] );\r
666                                                                                                 return;\r
667                                                                                         }\r
668                                                                                 }\r
669                                                                          }\r
670 \r
671                                                                          !whitelist && rules.push( [ name, value ] );\r
672 \r
673                                                                  });\r
674 \r
675                                                 for ( var i = 0 ; i < rules.length ; i++ )\r
676                                                          rules[ i ] = rules[ i ].join( ':' );\r
677                                                 return rules.length ?\r
678                                                          ( rules.join( ';' ) + ';' ) : false;\r
679                                          };\r
680                                 },\r
681 \r
682                                 /**\r
683                                  * Migrate the element by decorate styles on it.\r
684                                  * @param styleDefiniton\r
685                                  * @param variables\r
686                                  */\r
687                                 elementMigrateFilter : function ( styleDefiniton, variables )\r
688                                 {\r
689                                         return function( element )\r
690                                                 {\r
691                                                         var styleDef =\r
692                                                                         variables ?\r
693                                                                                 new CKEDITOR.style( styleDefiniton, variables )._.definition\r
694                                                                                 : styleDefiniton;\r
695                                                         element.name = styleDef.element;\r
696                                                         CKEDITOR.tools.extend( element.attributes, CKEDITOR.tools.clone( styleDef.attributes ) );\r
697                                                         element.addStyle( CKEDITOR.style.getStyleText( styleDef ) );\r
698                                                 };\r
699                                 },\r
700 \r
701                                 /**\r
702                                  * Migrate styles by creating a new nested stylish element.\r
703                                  * @param styleDefinition\r
704                                  */\r
705                                 styleMigrateFilter : function( styleDefinition, variableName )\r
706                                 {\r
707 \r
708                                         var elementMigrateFilter = this.elementMigrateFilter;\r
709                                         return function( value, element )\r
710                                         {\r
711                                                 // Build an stylish element first.\r
712                                                 var styleElement = new CKEDITOR.htmlParser.element( null ),\r
713                                                         variables = {};\r
714 \r
715                                                 variables[ variableName ] = value;\r
716                                                 elementMigrateFilter( styleDefinition, variables )( styleElement );\r
717                                                 // Place the new element inside the existing span.\r
718                                                 styleElement.children = element.children;\r
719                                                 element.children = [ styleElement ];\r
720                                         };\r
721                                 },\r
722 \r
723                                 /**\r
724                                  * A filter which remove cke-namespaced-attribute on\r
725                                  * all none-cke-namespaced elements.\r
726                                  * @param value\r
727                                  * @param element\r
728                                  */\r
729                                 bogusAttrFilter : function( value, element )\r
730                                 {\r
731                                         if ( element.name.indexOf( 'cke:' ) == -1 )\r
732                                                 return false;\r
733                                 },\r
734 \r
735                                 /**\r
736                                  * A filter used to apply inline CSS styles according to the stylesheet\r
737                                  * definition rules; it is generated lazily while filtering.\r
738                                  */\r
739                                 applyStyleFilter : null\r
740 \r
741                         },\r
742 \r
743                 getRules : function( editor )\r
744                 {\r
745                         var dtd = CKEDITOR.dtd,\r
746                                 blockLike = CKEDITOR.tools.extend( {}, dtd.$block, dtd.$listItem, dtd.$tableContent ),\r
747                                 config = editor.config,\r
748                                 filters = this.filters,\r
749                                 falsyFilter = filters.falsyFilter,\r
750                                 stylesFilter = filters.stylesFilter,\r
751                                 elementMigrateFilter = filters.elementMigrateFilter,\r
752                                 styleMigrateFilter = CKEDITOR.tools.bind( this.filters.styleMigrateFilter, this.filters ),\r
753                                 createListBulletMarker = this.utils.createListBulletMarker,\r
754                                 flattenList = filters.flattenList,\r
755                                 assembleList = filters.assembleList,\r
756                                 isListBulletIndicator = this.utils.isListBulletIndicator,\r
757                                 containsNothingButSpaces = this.utils.isContainingOnlySpaces,\r
758                                 resolveListItem = this.utils.resolveList,\r
759                                 convertToPx = function( value )\r
760                                         {\r
761                                                 value = CKEDITOR.tools.convertToPx( value );\r
762                                                 return isNaN( value ) ? value : value + 'px';\r
763                                         },\r
764                                 getStyleComponents = this.utils.getStyleComponents,\r
765                                 listDtdParents = this.utils.listDtdParents,\r
766                                 removeFontStyles = config.pasteFromWordRemoveFontStyles !== false,\r
767                                 removeStyles = config.pasteFromWordRemoveStyles !== false;\r
768 \r
769                         return {\r
770 \r
771                                 elementNames :\r
772                                 [\r
773                                         // Remove script, meta and link elements.\r
774                                         [ ( /meta|link|script/ ), '' ]\r
775                                 ],\r
776 \r
777                                 root : function( element )\r
778                                 {\r
779                                         element.filterChildren();\r
780                                         assembleList( element );\r
781                                 },\r
782 \r
783                                 elements :\r
784                                 {\r
785                                         '^' : function( element )\r
786                                         {\r
787                                                 // Transform CSS style declaration to inline style.\r
788                                                 var applyStyleFilter;\r
789                                                 if ( CKEDITOR.env.gecko && ( applyStyleFilter = filters.applyStyleFilter ) )\r
790                                                         applyStyleFilter( element );\r
791                                         },\r
792 \r
793                                         $ : function( element )\r
794                                         {\r
795                                                 var tagName = element.name || '',\r
796                                                         attrs = element.attributes;\r
797 \r
798                                                 // Convert length unit of width/height on blocks to\r
799                                                 // a more editor-friendly way (px).\r
800                                                 if ( tagName in blockLike\r
801                                                         && attrs.style )\r
802                                                 {\r
803                                                         attrs.style = stylesFilter(\r
804                                                                                 [ [ ( /^(:?width|height)$/ ), null, convertToPx ] ] )( attrs.style ) || '';\r
805                                                 }\r
806 \r
807                                                 // Processing headings.\r
808                                                 if ( tagName.match( /h\d/ ) )\r
809                                                 {\r
810                                                         element.filterChildren();\r
811                                                         // Is the heading actually a list item?\r
812                                                         if ( resolveListItem( element ) )\r
813                                                                 return;\r
814 \r
815                                                         // Adapt heading styles to editor's convention.\r
816                                                         elementMigrateFilter( config[ 'format_' + tagName ] )( element );\r
817                                                 }\r
818                                                 // Remove inline elements which contain only empty spaces.\r
819                                                 else if ( tagName in dtd.$inline )\r
820                                                 {\r
821                                                         element.filterChildren();\r
822                                                         if ( containsNothingButSpaces( element ) )\r
823                                                                 delete element.name;\r
824                                                 }\r
825                                                 // Remove element with ms-office namespace,\r
826                                                 // with it's content preserved, e.g. 'o:p'.\r
827                                                 else if ( tagName.indexOf( ':' ) != -1\r
828                                                                  && tagName.indexOf( 'cke' ) == -1 )\r
829                                                 {\r
830                                                         element.filterChildren();\r
831 \r
832                                                         // Restore image real link from vml.\r
833                                                         if ( tagName == 'v:imagedata' )\r
834                                                         {\r
835                                                                 var href = element.attributes[ 'o:href' ];\r
836                                                                 if ( href )\r
837                                                                         element.attributes.src = href;\r
838                                                                 element.name = 'img';\r
839                                                                 return;\r
840                                                         }\r
841                                                         delete element.name;\r
842                                                 }\r
843 \r
844                                                 // Assembling list items into a whole list.\r
845                                                 if ( tagName in listDtdParents )\r
846                                                 {\r
847                                                         element.filterChildren();\r
848                                                         assembleList( element );\r
849                                                 }\r
850                                         },\r
851 \r
852                                         // We'll drop any style sheet, but Firefox conclude\r
853                                         // certain styles in a single style element, which are\r
854                                         // required to be changed into inline ones.\r
855                                         'style' : function( element )\r
856                                         {\r
857                                                 if ( CKEDITOR.env.gecko )\r
858                                                 {\r
859                                                         // Grab only the style definition section.\r
860                                                         var styleDefSection = element.onlyChild().value.match( /\/\* Style Definitions \*\/([\s\S]*?)\/\*/ ),\r
861                                                                 styleDefText = styleDefSection && styleDefSection[ 1 ],\r
862                                                                 rules = {}; // Storing the parsed result.\r
863 \r
864                                                         if ( styleDefText )\r
865                                                         {\r
866                                                                 styleDefText\r
867                                                                         // Remove line-breaks.\r
868                                                                         .replace(/[\n\r]/g,'')\r
869                                                                         // Extract selectors and style properties.\r
870                                                                         .replace( /(.+?)\{(.+?)\}/g,\r
871                                                                                 function( rule, selectors, styleBlock )\r
872                                                                                 {\r
873                                                                                         selectors = selectors.split( ',' );\r
874                                                                                         var length = selectors.length, selector;\r
875                                                                                         for ( var i = 0; i < length; i++ )\r
876                                                                                         {\r
877                                                                                                 // Assume MS-Word mostly generate only simple\r
878                                                                                                 // selector( [Type selector][Class selector]).\r
879                                                                                                 CKEDITOR.tools.trim( selectors[ i ] )\r
880                                                                                                                           .replace( /^(\w+)(\.[\w-]+)?$/g,\r
881                                                                                                 function( match, tagName, className )\r
882                                                                                                 {\r
883                                                                                                         tagName = tagName || '*';\r
884                                                                                                         className = className.substring( 1, className.length );\r
885 \r
886                                                                                                         // Reject MS-Word Normal styles.\r
887                                                                                                         if ( className.match( /MsoNormal/ ) )\r
888                                                                                                                 return;\r
889 \r
890                                                                                                         if ( !rules[ tagName ] )\r
891                                                                                                                 rules[ tagName ] = {};\r
892                                                                                                         if ( className )\r
893                                                                                                                 rules[ tagName ][ className ] = styleBlock;\r
894                                                                                                         else\r
895                                                                                                                 rules[ tagName ] = styleBlock;\r
896                                                                                                 } );\r
897                                                                                         }\r
898                                                                                 });\r
899 \r
900                                                                 filters.applyStyleFilter = function( element )\r
901                                                                 {\r
902                                                                         var name = rules[ '*' ] ? '*' : element.name,\r
903                                                                                 className = element.attributes && element.attributes[ 'class' ],\r
904                                                                                 style;\r
905                                                                         if ( name in rules )\r
906                                                                         {\r
907                                                                                 style = rules[ name ];\r
908                                                                                 if ( typeof style == 'object' )\r
909                                                                                         style = style[ className ];\r
910                                                                                 // Maintain style rules priorities.\r
911                                                                                 style && element.addStyle( style, true );\r
912                                                                         }\r
913                                                                 };\r
914                                                         }\r
915                                                 }\r
916                                                 return false;\r
917                                         },\r
918 \r
919                                         'p' : function( element )\r
920                                         {\r
921                                                 // This's a fall-back approach to recognize list item in FF3.6,\r
922                                                 // as it's not perfect as not all list style (e.g. "heading list") is shipped\r
923                                                 // with this pattern. (#6662)\r
924                                                 if ( /MsoListParagraph/.exec( element.attributes[ 'class' ] ) )\r
925                                                 {\r
926                                                         var bulletText = element.firstChild( function( node )\r
927                                                         {\r
928                                                                 return node.type == CKEDITOR.NODE_TEXT && !containsNothingButSpaces( node.parent );\r
929                                                         });\r
930                                                         var bullet = bulletText && bulletText.parent,\r
931                                                                 bulletAttrs = bullet && bullet.attributes;\r
932                                                         bulletAttrs && !bulletAttrs.style && ( bulletAttrs.style = 'mso-list: Ignore;' );\r
933                                                 }\r
934 \r
935                                                 element.filterChildren();\r
936 \r
937                                                 // Is the paragraph actually a list item?\r
938                                                 if ( resolveListItem( element ) )\r
939                                                         return;\r
940 \r
941                                                 // Adapt paragraph formatting to editor's convention\r
942                                                 // according to enter-mode.\r
943                                                 if ( config.enterMode == CKEDITOR.ENTER_BR )\r
944                                                 {\r
945                                                         // We suffer from attribute/style lost in this situation.\r
946                                                         delete element.name;\r
947                                                         element.add( new CKEDITOR.htmlParser.element( 'br' ) );\r
948                                                 }\r
949                                                 else\r
950                                                         elementMigrateFilter( config[ 'format_' + ( config.enterMode == CKEDITOR.ENTER_P ? 'p' : 'div' ) ] )( element );\r
951                                         },\r
952 \r
953                                         'div' : function( element )\r
954                                         {\r
955                                                 // Aligned table with no text surrounded is represented by a wrapper div, from which\r
956                                                 // table cells inherit as text-align styles, which is wrong.\r
957                                                 // Instead we use a clear-float div after the table to properly achieve the same layout.\r
958                                                 var singleChild = element.onlyChild();\r
959                                                 if ( singleChild && singleChild.name == 'table' )\r
960                                                 {\r
961                                                         var attrs = element.attributes;\r
962                                                         singleChild.attributes = CKEDITOR.tools.extend( singleChild.attributes, attrs );\r
963                                                         attrs.style && singleChild.addStyle( attrs.style );\r
964 \r
965                                                         var clearFloatDiv = new CKEDITOR.htmlParser.element( 'div' );\r
966                                                         clearFloatDiv.addStyle( 'clear' ,'both' );\r
967                                                         element.add( clearFloatDiv );\r
968                                                         delete element.name;\r
969                                                 }\r
970                                         },\r
971 \r
972                                         'td' : function ( element )\r
973                                         {\r
974                                                 // 'td' in 'thead' is actually <th>.\r
975                                                 if ( element.getAncestor( 'thead') )\r
976                                                         element.name = 'th';\r
977                                         },\r
978 \r
                                        // MS-Word sometimes presents a list as a mix of real list markup
                                        // and pseudo-lists; normalize the real lists into the pseudo form.
981                                         'ol' : flattenList,\r
982                                         'ul' : flattenList,\r
983                                         'dl' : flattenList,\r
984 \r
985                                         'font' : function( element )\r
986                                         {\r
987                                                 // Drop the font tag if it comes from list bullet text.\r
988                                                 if ( isListBulletIndicator( element.parent ) )\r
989                                                 {\r
990                                                         delete element.name;\r
991                                                         return;\r
992                                                 }\r
993 \r
994                                                 element.filterChildren();\r
995 \r
996                                                 var attrs = element.attributes,\r
997                                                         styleText = attrs.style,\r
998                                                         parent = element.parent;\r
999 \r
1000                                                 if ( 'font' == parent.name )     // Merge nested <font> tags.\r
1001                                                 {\r
1002                                                         CKEDITOR.tools.extend( parent.attributes,\r
1003                                                                         element.attributes );\r
1004                                                         styleText && parent.addStyle( styleText );\r
1005                                                         delete element.name;\r
1006                                                 }\r
1007                                                 // Convert the merged into a span with all attributes preserved.\r
1008                                                 else\r
1009                                                 {\r
1010                                                         styleText = styleText || '';\r
1011                                                         // IE's having those deprecated attributes, normalize them.\r
1012                                                         if ( attrs.color )\r
1013                                                         {\r
1014                                                                 attrs.color != '#000000' && ( styleText += 'color:' + attrs.color + ';' );\r
1015                                                                 delete attrs.color;\r
1016                                                         }\r
1017                                                         if ( attrs.face )\r
1018                                                         {\r
1019                                                                 styleText += 'font-family:' + attrs.face + ';';\r
1020                                                                 delete attrs.face;\r
1021                                                         }\r
1022                                                         // TODO: Mapping size in ranges of xx-small,\r
1023                                                         // x-small, small, medium, large, x-large, xx-large.\r
1024                                                         if ( attrs.size )\r
1025                                                         {\r
1026                                                                 styleText += 'font-size:' +\r
1027                                                                              ( attrs.size > 3 ? 'large'\r
1028                                                                                              : ( attrs.size < 3 ? 'small' : 'medium' ) ) + ';';\r
1029                                                                 delete attrs.size;\r
1030                                                         }\r
1031 \r
1032                                                         element.name = 'span';\r
1033                                                         element.addStyle( styleText );\r
1034                                                 }\r
1035                                         },\r
1036 \r
1037                                         'span' : function( element )\r
1038                                         {\r
1039                                                 // Remove the span if it comes from list bullet text.\r
1040                                                 if ( isListBulletIndicator( element.parent ) )\r
1041                                                         return false;\r
1042 \r
1043                                                 element.filterChildren();\r
1044                                                 if ( containsNothingButSpaces( element ) )\r
1045                                                 {\r
1046                                                         delete element.name;\r
1047                                                         return null;\r
1048                                                 }\r
1049 \r
1050                                                 // List item bullet type is supposed to be indicated by\r
1051                                                 // the text of a span with style 'mso-list : Ignore' or an image.\r
1052                                                 if ( isListBulletIndicator( element ) )\r
1053                                                 {\r
1054                                                         var listSymbolNode = element.firstChild( function( node )\r
1055                                                         {\r
1056                                                                 return node.value || node.name == 'img';\r
1057                                                         });\r
1058 \r
1059                                                         var listSymbol =  listSymbolNode && ( listSymbolNode.value || 'l.' ),\r
1060                                                                 listType = listSymbol && listSymbol.match( /^(?:[(]?)([^\s]+?)([.)]?)$/ );\r
1061 \r
1062                                                         if ( listType )\r
1063                                                         {\r
1064                                                                 var marker = createListBulletMarker( listType, listSymbol );\r
1065                                                                 // Some non-existed list items might be carried by an inconsequential list, indicate by "mso-hide:all/display:none",\r
1066                                                                 // those are to be removed later, now mark it with "cke:ignored".\r
1067                                                                 var ancestor = element.getAncestor( 'span' );\r
1068                                                                 if ( ancestor && (/ mso-hide:\s*all|display:\s*none /).test( ancestor.attributes.style ) )\r
1069                                                                         marker.attributes[ 'cke:ignored' ] = 1;\r
1070                                                                 return marker;\r
1071                                                         }\r
1072                                                 }\r
1073 \r
1074                                                 // Update the src attribute of image element with href.\r
1075                                                 var children = element.children,\r
1076                                                         attrs = element.attributes,\r
1077                                                         styleText = attrs && attrs.style,\r
1078                                                         firstChild = children && children[ 0 ];\r
1079 \r
1080                                                 // Assume MS-Word mostly carry font related styles on <span>,\r
1081                                                 // adapting them to editor's convention.\r
1082                                                 if ( styleText )\r
1083                                                 {\r
1084                                                         attrs.style = stylesFilter(\r
1085                                                                         [\r
1086                                                                                 // Drop 'inline-height' style which make lines overlapping.\r
1087                                                                                 [ 'line-height' ],\r
1088                                                                                 [ ( /^font-family$/ ), null, !removeFontStyles ? styleMigrateFilter( config[ 'font_style' ], 'family' ) : null ] ,\r
1089                                                                                 [ ( /^font-size$/ ), null, !removeFontStyles ? styleMigrateFilter( config[ 'fontSize_style' ], 'size' ) : null ] ,\r
1090                                                                                 [ ( /^color$/ ), null, !removeFontStyles ? styleMigrateFilter( config[ 'colorButton_foreStyle' ], 'color' ) : null ] ,\r
1091                                                                                 [ ( /^background-color$/ ), null, !removeFontStyles ? styleMigrateFilter( config[ 'colorButton_backStyle' ], 'color' ) : null ]\r
1092                                                                         ] )( styleText, element ) || '';\r
1093                                                 }\r
1094 \r
1095                                                 return null;\r
1096                                         },\r
1097 \r
1098                                         // Migrate basic style formats to editor configured ones.\r
1099                                         'b' : elementMigrateFilter( config[ 'coreStyles_bold' ] ),\r
1100                                         'i' : elementMigrateFilter( config[ 'coreStyles_italic' ] ),\r
1101                                         'u' : elementMigrateFilter( config[ 'coreStyles_underline' ] ),\r
1102                                         's' : elementMigrateFilter( config[ 'coreStyles_strike' ] ),\r
1103                                         'sup' : elementMigrateFilter( config[ 'coreStyles_superscript' ] ),\r
1104                                         'sub' : elementMigrateFilter( config[ 'coreStyles_subscript' ] ),\r
1105                                         // Editor doesn't support anchor with content currently (#3582),\r
1106                                         // drop such anchors with content preserved.\r
1107                                         'a' : function( element )\r
1108                                         {\r
1109                                                 var attrs = element.attributes;\r
1110                                                 if ( attrs && !attrs.href && attrs.name )\r
1111                                                         delete element.name;\r
1112                                                 else if ( CKEDITOR.env.webkit && attrs.href && attrs.href.match( /file:\/\/\/[\S]+#/i ) )\r
1113                                                         attrs.href = attrs.href.replace( /file:\/\/\/[^#]+/i,'' );\r
1114                                         },\r
1115                                         'cke:listbullet' : function( element )\r
1116                                         {\r
1117                                                 if ( element.getAncestor( /h\d/ ) && !config.pasteFromWordNumberedHeadingToList )\r
1118                                                         delete element.name;\r
1119                                         }\r
1120                                 },\r
1121 \r
1122                                 attributeNames :\r
1123                                 [\r
1124                                         // Remove onmouseover and onmouseout events (from MS Word comments effect)\r
1125                                         [ ( /^onmouse(:?out|over)/ ), '' ],\r
1126                                         // Onload on image element.\r
1127                                         [ ( /^onload$/ ), '' ],\r
1128                                         // Remove office and vml attribute from elements.\r
1129                                         [ ( /(?:v|o):\w+/ ), '' ],\r
1130                                         // Remove lang/language attributes.\r
1131                                         [ ( /^lang/ ), '' ]\r
1132                                 ],\r
1133 \r
1134                                 attributes :\r
1135                                 {\r
1136                                         'style' : stylesFilter(\r
1137                                         removeStyles ?\r
1138                                         // Provide a white-list of styles that we preserve, those should\r
1139                                         // be the ones that could later be altered with editor tools.\r
1140                                         [\r
1141                                                 // Leave list-style-type\r
1142                                                 [ ( /^list-style-type$/ ), null ],\r
1143 \r
1144                                                 // Preserve margin-left/right which used as default indent style in the editor.\r
1145                                                 [ ( /^margin$|^margin-(?!bottom|top)/ ), null, function( value, element, name )\r
1146                                                         {\r
1147                                                                 if ( element.name in { p : 1, div : 1 } )\r
1148                                                                 {\r
1149                                                                         var indentStyleName = config.contentsLangDirection == 'ltr' ?\r
1150                                                                                         'margin-left' : 'margin-right';\r
1151 \r
1152                                                                         // Extract component value from 'margin' shorthand.\r
1153                                                                         if ( name == 'margin' )\r
1154                                                                         {\r
1155                                                                                 value = getStyleComponents( name, value,\r
1156                                                                                                 [ indentStyleName ] )[ indentStyleName ];\r
1157                                                                         }\r
1158                                                                         else if ( name != indentStyleName )\r
1159                                                                                 return null;\r
1160 \r
1161                                                                         if ( value && !emptyMarginRegex.test( value ) )\r
1162                                                                                 return [ indentStyleName, value ];\r
1163                                                                 }\r
1164 \r
1165                                                                 return null;\r
1166                                                         } ],\r
1167 \r
1168                                                 // Preserve clear float style.\r
1169                                                 [ ( /^clear$/ ) ],\r
1170 \r
1171                                                 [ ( /^border.*|margin.*|vertical-align|float$/ ), null,\r
1172                                                         function( value, element )\r
1173                                                         {\r
1174                                                                 if ( element.name == 'img' )\r
1175                                                                         return value;\r
1176                                                         } ],\r
1177 \r
1178                                                 [ (/^width|height$/ ), null,\r
1179                                                         function( value, element )\r
1180                                                         {\r
1181                                                                 if ( element.name in { table : 1, td : 1, th : 1, img : 1 } )\r
1182                                                                         return value;\r
1183                                                         } ]\r
1184                                         ] :\r
1185                                         // Otherwise provide a black-list of styles that we remove.\r
1186                                         [\r
1187                                                 [ ( /^mso-/ ) ],\r
1188                                                 // Fixing color values.\r
1189                                                 [ ( /-color$/ ), null, function( value )\r
1190                                                 {\r
1191                                                         if ( value == 'transparent' )\r
1192                                                                 return false;\r
1193                                                         if ( CKEDITOR.env.gecko )\r
1194                                                                 return value.replace( /-moz-use-text-color/g, 'transparent' );\r
1195                                                 } ],\r
1196                                                 // Remove empty margin values, e.g. 0.00001pt 0em 0pt\r
1197                                                 [ ( /^margin$/ ), emptyMarginRegex ],\r
1198                                                 [ 'text-indent', '0cm' ],\r
1199                                                 [ 'page-break-before' ],\r
1200                                                 [ 'tab-stops' ],\r
1201                                                 [ 'display', 'none' ],\r
1202                                                 removeFontStyles ? [ ( /font-?/ ) ] : null\r
1203                                         ], removeStyles ),\r
1204 \r
1205                                         // Prefer width styles over 'width' attributes.\r
1206                                         'width' : function( value, element )\r
1207                                         {\r
1208                                                 if ( element.name in dtd.$tableContent )\r
1209                                                         return false;\r
1210                                         },\r
1211                                         // Prefer border styles over table 'border' attributes.\r
1212                                         'border' : function( value, element )\r
1213                                         {\r
1214                                                 if ( element.name in dtd.$tableContent )\r
1215                                                         return false;\r
1216                                         },\r
1217 \r
1218                                         // Only Firefox carry style sheet from MS-Word, which\r
1219                                         // will be applied by us manually. For other browsers\r
1220                                         // the css className is useless.\r
1221                                         'class' : falsyFilter,\r
1222 \r
1223                                         // MS-Word always generate 'background-color' along with 'bgcolor',\r
1224                                         // simply drop the deprecated attributes.\r
1225                                         'bgcolor' : falsyFilter,\r
1226 \r
1227                                         // Deprecate 'valign' attribute in favor of 'vertical-align'.\r
1228                                         'valign' : removeStyles ? falsyFilter : function( value, element )\r
1229                                         {\r
1230                                                 element.addStyle( 'vertical-align', value );\r
1231                                                 return false;\r
1232                                         }\r
1233                                 },\r
1234 \r
1235                                 // Fore none-IE, some useful data might be buried under these IE-conditional\r
1236                                 // comments where RegExp were the right approach to dig them out where usual approach\r
1237                                 // is transform it into a fake element node which hold the desired data.\r
1238                                 comment :\r
1239                                         !CKEDITOR.env.ie ?\r
1240                                                 function( value, node )\r
1241                                                 {\r
1242                                                         var imageInfo = value.match( /<img.*?>/ ),\r
1243                                                                 listInfo = value.match( /^\[if !supportLists\]([\s\S]*?)\[endif\]$/ );\r
1244 \r
1245                                                         // Seek for list bullet indicator.\r
1246                                                         if ( listInfo )\r
1247                                                         {\r
1248                                                                 // Bullet symbol could be either text or an image.\r
1249                                                                 var listSymbol = listInfo[ 1 ] || ( imageInfo && 'l.' ),\r
1250                                                                         listType = listSymbol && listSymbol.match( />(?:[(]?)([^\s]+?)([.)]?)</ );\r
1251                                                                 return createListBulletMarker( listType, listSymbol );\r
1252                                                         }\r
1253 \r
1254                                                         // Reveal the <img> element in conditional comments for Firefox.\r
1255                                                         if ( CKEDITOR.env.gecko && imageInfo )\r
1256                                                         {\r
1257                                                                 var img = CKEDITOR.htmlParser.fragment.fromHtml( imageInfo[ 0 ] ).children[ 0 ],\r
1258                                                                         previousComment = node.previous,\r
1259                                                                         // Try to dig the real image link from vml markup from previous comment text.\r
1260                                                                         imgSrcInfo = previousComment && previousComment.value.match( /<v:imagedata[^>]*o:href=['"](.*?)['"]/ ),\r
1261                                                                         imgSrc = imgSrcInfo && imgSrcInfo[ 1 ];\r
1262 \r
1263                                                                 // Is there a real 'src' url to be used?\r
1264                                                                 imgSrc && ( img.attributes.src = imgSrc );\r
1265                                                                 return img;\r
1266                                                         }\r
1267 \r
1268                                                         return false;\r
1269                                                 }\r
1270                                         : falsyFilter\r
1271                         };\r
1272                 }\r
1273         });\r
1274 \r
1275         // The paste processor here is just a reduced copy of html data processor.\r
1276         var pasteProcessor = function()\r
1277         {\r
1278                 this.dataFilter = new CKEDITOR.htmlParser.filter();\r
1279         };\r
1280 \r
1281         pasteProcessor.prototype =\r
1282         {\r
1283                 toHtml : function( data )\r
1284                 {\r
1285                         var fragment = CKEDITOR.htmlParser.fragment.fromHtml( data, false ),\r
1286                                 writer = new CKEDITOR.htmlParser.basicWriter();\r
1287 \r
1288                         fragment.writeHtml( writer, this.dataFilter );\r
1289                         return writer.getHtml( true );\r
1290                 }\r
1291         };\r
1292 \r
1293         CKEDITOR.cleanWord = function( data, editor )\r
1294         {\r
1295                 // Firefox will be confused by those downlevel-revealed IE conditional\r
1296                 // comments, fixing them first( convert it to upperlevel-revealed one ).\r
1297                 // e.g. <![if !vml]>...<![endif]>\r
1298                 if ( CKEDITOR.env.gecko )\r
1299                         data = data.replace( /(<!--\[if[^<]*?\])-->([\S\s]*?)<!--(\[endif\]-->)/gi, '$1$2$3' );\r
1300 \r
1301                 var dataProcessor = new pasteProcessor(),\r
1302                         dataFilter = dataProcessor.dataFilter;\r
1303 \r
1304                 // These rules will have higher priorities than default ones.\r
1305                 dataFilter.addRules( CKEDITOR.plugins.pastefromword.getRules( editor ) );\r
1306 \r
1307                 // Allow extending data filter rules.\r
1308                 editor.fire( 'beforeCleanWord', { filter : dataFilter } );\r
1309 \r
1310                 try\r
1311                 {\r
1312                         data = dataProcessor.toHtml( data, false );\r
1313                 }\r
1314                 catch ( e )\r
1315                 {\r
1316                         alert( editor.lang.pastefromword.error );\r
1317                 }\r
1318 \r
1319                 /* Below post processing those things that are unable to delivered by filter rules. */\r
1320 \r
1321                 // Remove 'cke' namespaced attribute used in filter rules as marker.\r
1322                 data = data.replace( /cke:.*?".*?"/g, '' );\r
1323 \r
1324                 // Remove empty style attribute.\r
1325                 data = data.replace( /style=""/g, '' );\r
1326 \r
1327                 // Remove the dummy spans ( having no inline style ).\r
1328                 data = data.replace( /<span>/g, '' );\r
1329 \r
1330                 return data;\r
1331         };\r
1332 })();\r
1333 \r
1334 /**\r
1335  * Whether to ignore all font related formatting styles, including:\r
1336  * <ul> <li>font size;</li>\r
1337  *              <li>font family;</li>\r
1338  *              <li>font foreground/background color.</li></ul>\r
1339  * @name CKEDITOR.config.pasteFromWordRemoveFontStyles\r
1340  * @since 3.1\r
1341  * @type Boolean\r
1342  * @default true\r
1343  * @example\r
1344  * config.pasteFromWordRemoveFontStyles = false;\r
1345  */\r
1346 \r
1347 /**\r
1348  * Whether to transform MS Word outline numbered headings into lists.\r
1349  * @name CKEDITOR.config.pasteFromWordNumberedHeadingToList\r
1350  * @since 3.1\r
1351  * @type Boolean\r
1352  * @default false\r
1353  * @example\r
1354  * config.pasteFromWordNumberedHeadingToList = true;\r
1355  */\r
1356 \r
1357 /**\r
1358  * Whether to remove element styles that can't be managed with the editor. Note\r
1359  * that this doesn't handle the font-specific styles, which depend on the\r
1360  * {@link CKEDITOR.config.pasteFromWordRemoveFontStyles} setting instead.\r
1361  * @name CKEDITOR.config.pasteFromWordRemoveStyles\r
1362  * @since 3.1\r
1363  * @type Boolean\r
1364  * @default true\r
1365  * @example\r
1366  * config.pasteFromWordRemoveStyles = false;\r
1367  */\r