過濾超級鏈接
復制代碼 代碼如下:
' Removes hyperlink markup from an HTML string but keeps the link text.
'
' Parameters:
'   HTMLstr - the HTML text to process; Null is treated as an empty string.
' Returns:
'   HTMLstr with every <a ...>...</a> pair replaced by its inner content.
'   Matching is case-insensitive and applies to all occurrences.
Function RegRemoveHref(HTMLstr)
    Dim ra

    ' RegExp.Replace cannot work on Null (e.g. an empty database field).
    If IsNull(HTMLstr) Then
        RegRemoveHref = ""
        Exit Function
    End If

    Set ra = New RegExp
    ra.IgnoreCase = True
    ra.Global = True
    ' \b keeps tags such as <abbr> or <address> from being mistaken for <a>.
    ' [\s\S]*? is used instead of .+? because "." does not match line breaks,
    ' and "*" also lets anchors with an empty body be removed.
    ra.Pattern = "<a\b[^>]*>([\s\S]*?)</a\s*>"
    RegRemoveHref = ra.Replace(HTMLstr, "$1")
    Set ra = Nothing
End Function
過濾所有HTML代碼
復制代碼 代碼如下:
' Removes every HTML tag from a string and keeps the text between tags.
'
' Parameters:
'   strHTML - the HTML text to process; Null is treated as an empty string.
' Returns:
'   strHTML with every "<...>" sequence deleted.
Function RemoveHTML(strHTML)
    Dim objRegExp

    ' RegExp.Replace cannot work on Null (e.g. an empty database field).
    If IsNull(strHTML) Then
        RemoveHTML = ""
        Exit Function
    End If

    Set objRegExp = New RegExp
    objRegExp.IgnoreCase = True
    objRegExp.Global = True
    ' Match a closed <...> pair. [^>]+ is used instead of .+? because "."
    ' does not match line breaks, so tags spread over several lines would
    ' otherwise be left in the output.
    objRegExp.Pattern = "<[^>]+>"
    ' One global Replace does the work of collecting the matches and
    ' replacing each of them in turn.
    RemoveHTML = objRegExp.Replace(strHTML, "")
    Set objRegExp = Nothing
End Function
過濾所有HTML代碼 和空格換行
復制代碼 代碼如下:
' Removes every HTML tag and all spaces, tabs and line breaks from a string.
'
' Parameters:
'   strHTML - the HTML text to process; Null is treated as an empty string.
' Returns:
'   strHTML without "<...>" sequences and without space, tab, CR or LF
'   characters.
Function RemoveHTML(strHTML)
    Dim objRegExp, strResult

    ' RegExp.Replace cannot work on Null (e.g. an empty database field).
    If IsNull(strHTML) Then
        RemoveHTML = ""
        Exit Function
    End If

    Set objRegExp = New RegExp
    objRegExp.IgnoreCase = True
    objRegExp.Global = True

    ' Pass 1: drop the tags. [^>]+ also covers tags that span several lines,
    ' which ".+?" cannot because "." does not match line breaks.
    objRegExp.Pattern = "<[^>]+>"
    strResult = objRegExp.Replace(strHTML, "")

    ' Pass 2: drop whitespace. The backslashes are required: without them the
    ' pattern matches the letters r, n and t instead of CR, LF and TAB.
    ' NOTE(review): the published pattern listed a sixth alternative that is
    ' indistinguishable from a plain space in this copy (possibly a full-width
    ' space or &nbsp;) - confirm against the original article.
    objRegExp.Pattern = "[ \t\r\n]+"
    strResult = objRegExp.Replace(strResult, "")

    RemoveHTML = strResult
    Set objRegExp = Nothing
End Function
asp使用正則表達式去除script代碼和HTML代碼
一、清除內容中的 JavaScript 代碼。這段代碼的作用是去掉用 <script>…</script> 標記包含的所有部分。
根據實際需要,它也許不能滿足要求。如果用在屏蔽客戶提交代碼的地方,應保證這一步在最后執行。
很多人還會拼湊這樣的標記,應小心。
復制代碼 代碼如下:
' Removes <script>...</script> elements, including their content.
'
' Parameters:
'   originCode - the HTML text to process; Null is treated as an empty string.
' Returns:
'   originCode with every complete <script ...>...</script> element deleted.
'
' NOTE(review): this is a best-effort text filter, not a sanitizer. Input that
' assembles a script tag from fragments, leaves it unclosed, or uses event
' handler attributes is not covered. If it is used on user-submitted content,
' run it as the last filtering step and HTML-encode the result on output.
Function ClearJSCode(originCode)
    Dim reg

    ' RegExp.Replace cannot work on Null (e.g. an empty database field).
    If IsNull(originCode) Then
        ClearJSCode = ""
        Exit Function
    End If

    Set reg = New RegExp
    ' [\s\S]*? (any character, as few as possible) is used for the script body
    ' because the body commonly contains "<" (comparisons, markup in strings)
    ' and line breaks; [^<]* stops at the first "<" and then fails to match.
    reg.Pattern = "<script\b[^>]*>[\s\S]*?</script\s*>"
    reg.IgnoreCase = True
    reg.Global = True
    ClearJSCode = reg.Replace(originCode, "")
    Set reg = Nothing
End Function
二、清除內容中的HTML代碼
復制代碼 代碼如下:
' Removes every HTML tag from a string and keeps the text between tags.
'
' Parameters:
'   originCode - the HTML text to process; Null is treated as an empty string.
' Returns:
'   originCode with every "<...>" sequence (including "<>") deleted.
Function ClearHTMLCode(originCode)
    Dim reg

    ' RegExp.Replace cannot work on Null (e.g. an empty database field).
    If IsNull(originCode) Then
        ClearHTMLCode = ""
        Exit Function
    End If

    Set reg = New RegExp
    ' [^>]* also matches line breaks, so tags spread over lines are covered.
    reg.Pattern = "<[^>]*>"
    reg.IgnoreCase = True
    reg.Global = True
    ClearHTMLCode = reg.Replace(originCode, "")
    Set reg = Nothing
End Function
復制代碼 代碼如下:
<js jsid=”1″ jsname=”去除內(nèi)容頁里干擾信息”><![CDATA[
var sourcehtml=function(){/*%s*/}.toString().slice(13, -3);
parser9527=function()
{
var ss=sourcehtml;
ss=ss.replace(/<.*?>/ig,””);
ss=ss.replace(/(r|n|rn| |t| )/ig,””);
ss=ss.replace(/(</a>)/ig,””);
ss=ss.replace(/<a((.|n)*?)>/ig,””);
ss=ss.replace(“_網(wǎng)易新聞中心”,””);
/*
ss=ss.replace(/<iframe((.|n)*?)</iframe>/ig,””);
ss=ss.replace(/<script((.|n)*?)</script>/ig,””);
ss=ss.replace(/<address((.|n)*?)</address>/ig,””);
ss=ss.replace(/(</a>)/ig,””);
ss=ss.replace(/<a((.|n)*?)>/ig,””);
ss=ss.replace(/<SELECT((.|n)*?)</SELECT>/ig,””);
ss=ss.replace(/<TABLE((.|n)*?)</TABLE>/ig,””);
ss=ss.replace(/<img((.|n)*?)>/ig,””);
ss=ss.replace(/<TABLE((.|n)*?)>/ig,””);
ss=ss.replace(/(</TABLE>)/ig,””);
ss=ss.replace(/<TR((.|n)*?)>/ig,”<BR>”);
ss=ss.replace(/(</TR>)/ig,””);
ss=ss.replace(/<nobr((.|n)*?)>/ig,”<BR>”);
ss=ss.replace(/<nobr((.|n)*?)>/ig,””);
ss=ss.replace(/(</nobr>)/ig,””);
ss=ss.replace(/<TD((.|n)*?)>/ig,” “);
ss=ss.replace(/(</TD>)/ig,””);
ss=ss.replace(/<span id=((.|n)*?)</small>/ig,””);
ss=ss.replace(/<div((.|n)*?)>/ig,””);
ss=ss.replace(/(</div>)/ig,””);
*/
return ss;
}
parser9527();
]]></js>
var sourcehtml=function(){/*%s*/}.toString().slice(13, -3);
parser9527=function()
{
var ss=sourcehtml;
ss=ss.replace(/<.*?>/ig,””);
ss=ss.replace(/(r|n|rn| |t| )/ig,””);
ss=ss.replace(/(</a>)/ig,””);
ss=ss.replace(/<a((.|n)*?)>/ig,””);
ss=ss.replace(“_網(wǎng)易新聞中心”,””);
/*
ss=ss.replace(/<iframe((.|n)*?)</iframe>/ig,””);
ss=ss.replace(/<script((.|n)*?)</script>/ig,””);
ss=ss.replace(/<address((.|n)*?)</address>/ig,””);
ss=ss.replace(/(</a>)/ig,””);
ss=ss.replace(/<a((.|n)*?)>/ig,””);
ss=ss.replace(/<SELECT((.|n)*?)</SELECT>/ig,””);
ss=ss.replace(/<TABLE((.|n)*?)</TABLE>/ig,””);
ss=ss.replace(/<img((.|n)*?)>/ig,””);
ss=ss.replace(/<TABLE((.|n)*?)>/ig,””);
ss=ss.replace(/(</TABLE>)/ig,””);
ss=ss.replace(/<TR((.|n)*?)>/ig,”<BR>”);
ss=ss.replace(/(</TR>)/ig,””);
ss=ss.replace(/<nobr((.|n)*?)>/ig,”<BR>”);
ss=ss.replace(/<nobr((.|n)*?)>/ig,””);
ss=ss.replace(/(</nobr>)/ig,””);
ss=ss.replace(/<TD((.|n)*?)>/ig,” “);
ss=ss.replace(/(</TD>)/ig,””);
ss=ss.replace(/<span id=((.|n)*?)</small>/ig,””);
ss=ss.replace(/<div((.|n)*?)>/ig,””);
ss=ss.replace(/(</div>)/ig,””);
*/
return ss;
}
parser9527();
]]></js>
ASP常用的正則過濾函數 可過濾html js style div font
開發程序時,經常要用正則表達式過濾一些不需要的東西,比如html js style div font。有時候需要過濾極個別的,有時候需要過濾好幾種,不管怎么過濾,萬變不離其宗。
這是我收藏的一些過濾函數,可以用來過濾您不需要的代碼。如果需要過濾多種,可以嵌套使用,也可以自己整合代碼。不過不建議嵌套使用,因為那樣效率太低。
Asp 正則表達式 過濾 所有 html 標記 :
復制代碼 代碼如下:
' Removes every HTML tag from a value and returns the remaining text.
'
' Parameters:
'   ContentStr - the value to process; it is converted to a string first.
'                Null is treated as an empty string.
' Returns:
'   The string form of ContentStr with every "<...>" sequence that contains
'   no nested "<" or ">" deleted.
Function LoseHtml(ContentStr)
    Dim ClsTempLoseStr, regEx

    ' CStr raises a run-time error on Null (e.g. an empty database field).
    If IsNull(ContentStr) Then
        LoseHtml = ""
        Exit Function
    End If

    ClsTempLoseStr = CStr(ContentStr)
    Set regEx = New RegExp
    ' Same matches as the published "</*[^<>]*>": the optional leading
    ' slashes are already covered by [^<>]*.
    regEx.Pattern = "<[^<>]*>"
    regEx.IgnoreCase = True
    regEx.Global = True
    LoseHtml = regEx.Replace(ClsTempLoseStr, "")
    Set regEx = Nothing
End Function
Asp 正則表達式 過濾 style 標記 :
regEx.Pattern = “(<style)+[^<>]*>[^