日期:2014-05-17  浏览次数:22593 次

这个HTML过滤该怎么调用呢?
下面是源代码,我现在的内容字段是content,应该怎么调用才能有效去除HTML标记呢?谢谢。我是asp新手。

'去除HTML标记
Function HTMLFilter(sHTML, sFilters)  
  If sHTML & "" = "" Then Exit Function 
  If sFilters & "" = "" Then sFilters = "SCRIPT,OBJECT" 
  Dim aFilters  
  aFilters = Split(UCase(sFilters), ",")  
  For i = 0 To UBound(aFilters)  
  Select Case UCase(Trim(aFilters(i)))  
  Case "JORKIN" 
  Do While InStr(sHTML, " ") >0  
  sHTML = Replace(sHTML, " ", " ")  
  Loop 
  Case "SCRIPT" 
  '// 去除脚本<scr ipt></scr ipt>及 onload 等  
  sHTML = RegReplace(sHTML, "<SCRIPT[\s\S]*?</SCRIPT>", "")  
  sHTML = RegReplace(sHTML, "\s[on].+?=\s+?([\""|\'])(.*?)\1", "")  
  sHTML = RegReplace(sHTML, "(JAVASCRIPT|JSCRIPT|VBSCRIPT|VBS):", "$1:") 
  Case "FIXIMG" 
  sHTML = RegReplace(sHTML, "<IMG.*?\sSRC=([^\""\'\s][^\""\'\s>]*).*?>", "<img src=$2 border=0>")  
  sHTML = RegReplace(sHTML, "<IMG.*SRC=([\""\']?)(.\1\S+).*?>", "<img src=$2 border=0>")  
  Case "TABLE" 
  '// 去除表格<table><tr><td><th> 
  sHTML = RegReplace(sHTML, "</?TABLE[^>]*>", "") 
  sHTML = RegReplace(sHTML, "</?TBODY[^>]*>", "") 
  sHTML = RegReplace(sHTML, "<(/?)TR[^>]*>", "<$1p>") 
  sHTML = RegReplace(sHTML, "</?TH[^>]*>", " ") 
  sHTML = RegReplace(sHTML, "</?TD[^>]*>", " ") 
  Case "CLASS" 
  '// 去除样式类class="" 
  sHTML = RegReplace(sHTML, "(<[^>]+) CLASS=[^ |^>]+([^>]*>)", "$1 $2") 
  sHTML = RegReplace(sHTML, "\sCLASS\s*?=\s*?([\""|\'])(.*?)\1", "")  
  Case "STYLE" 
  '// 去除样式style="" 
  sHTML = RegReplace(sHTML, "(<[^>]+) STYLE=[^ |^>]+([^>]*>)", "$1 $2") 
  sHTML = RegReplace(sHTML, "\sSTYLE\s*?=\s*?([\""|\'])(.*?)\1", "")  
  Case "XML" 
  '// 去除XML<?xml> 
  sHTML = RegReplace(sHTML, "<?XML[^>]*>", "") 
  Case "NAMESPACE" 
  '// 去除命名空间<o:p></o:p> 
  sHTML = RegReplace(sHTML, "<\/?[a-z]+:[^>]*>", "") 
  Case "FONT" 
  '// 去除字体<font></font> 
  sHTML = RegReplace(sHTML, "</?FONT[^>]*>", "") 
  Case "MARQUEE" 
  '/