js清理word生成的HTML冗余代码

上一篇 / 下一篇  2007-05-26 14:40:01 / 精华(2)

<script language="javascript">
<!--
/**
 * Strips the redundant markup that Microsoft Word emits when content is
 * saved or pasted as HTML.
 *
 * The following clean-up passes run in order:
 *   1. remove every <span> / </span> tag (the content is kept);
 *   2. remove one class=, one double-quoted style="..." and one lang=
 *      attribute from each tag;
 *   3. remove <xml ...> / <?xml ...> tags;
 *   4. remove namespaced tags such as <o:p> and </o:p>;
 *   5. replace every &nbsp; entity with a plain space;
 *   6. turn <p ...>...</p> into <div ...>...</div>, keeping the attributes.
 *
 * @param {string} html - HTML fragment to clean; null/undefined yields "".
 * @returns {string} The cleaned HTML.
 */
function cleanWordHtml(html){
    if (html == null) {
        return "";
    }
    var cleaned = String(html);

    // Remove all SPAN tags (opening and closing).
    cleaned = cleaned.replace(/<\/?SPAN[^>]*>/gi, "");

    // Remove Class attributes. The greedy first group means the last
    // " class=" inside a tag is the one that is dropped.
    cleaned = cleaned.replace(/<(\w[^>]*) class=([^ |>]*)([^>]*)/gi, "<$1$3");

    // Remove Style attributes (double-quoted values only).
    cleaned = cleaned.replace(/<(\w[^>]*) style="([^"]*)"([^>]*)/gi, "<$1$3");

    // Remove Lang attributes.
    cleaned = cleaned.replace(/<(\w[^>]*) lang=([^ |>]*)([^>]*)/gi, "<$1$3");

    // Remove XML elements and declarations.
    cleaned = cleaned.replace(/<\??xml[^>]*>/gi, "");

    // Remove tags with XML namespace prefixes: <o:p></o:p>
    cleaned = cleaned.replace(/<\/?\w+:[^>]*>/gi, "");

    // Replace every &nbsp; (the "g" flag is required, otherwise only the
    // first occurrence is replaced).
    cleaned = cleaned.replace(/&nbsp;/g, " ");

    // Transform <P> to <DIV>.
    //  - "(\s[^>]*)?" requires whitespace or ">" right after "<P", so tags
    //    such as <PRE> or <PARAM> are left untouched.
    //  - "[\s\S]*?" is used instead of ".*?" so that paragraphs spanning
    //    several lines are converted as well.
    cleaned = cleaned.replace(/<P(\s[^>]*)?>([\s\S]*?)<\/P>/gi, "<div$1>$2</div>");

    return cleaned;
}
//-->
</script>

TAG: 清理word html冗余代码

 

评分:0

我来说两句

显示全部

:loveliness: :handshake :victory: :funk: :time: :kiss: :call: :hug: :lol :'( :Q :L ;P :$ :P :o :@ :D :( :)

关于作者