/// <summary>
/// Removes HTML markup from a string and decodes a small set of common entities.
/// </summary>
/// <remarks>
/// The rules are applied in table order, case-insensitively. After the table has
/// been applied, any remaining angle brackets and CR/LF pairs are deleted, so the
/// result never contains either; this also removes brackets produced by decoding
/// the lt / gt entities.
/// NOTE(review): this is a regex-based best-effort cleaner, not an HTML parser or
/// sanitizer. Script bodies and comments that span several lines are not matched
/// by the first and last rules because '.' does not match a line feed here.
/// </remarks>
/// <param name="strhtml">Source text that may contain HTML markup.</param>
/// <returns>
/// The text with markup removed, or an empty string when the input is null or empty.
/// </returns>
public static string Strip(string strhtml)
{
    // Regex.Replace throws on null input; treat "nothing in" as "nothing out".
    if (string.IsNullOrEmpty(strhtml))
    {
        return string.Empty;
    }

    // Each row is { pattern, replacement }. Keeping both in one table prevents
    // the two lists from drifting out of sync.
    string[,] rules =
    {
        // Single-line script elements, including their content.
        { @"<script[^>]*?>.*?</script>", "" },
        // Any opening, closing or self-closing tag, with optional attributes.
        // \7 refers back to the quote character that opened an attribute value.
        { @"<(\/\s*)?!?((\w+:)?\w+)(\w+(\s*=?\s*(([""'])(\\[""'tbnr]|[^\7])*?\7|\w+)|.{0})|\s)*?(\/\s*)?>", "" },
        // A line break together with the whitespace that follows it.
        { @"([\r\n])[\s]+", "" },
        // Named / numeric entities that are decoded to their character.
        { @"&(quot|#34);", "\"" },
        { @"&(amp|#38);", "&" },
        { @"&(lt|#60);", "<" },
        { @"&(gt|#62);", ">" },
        // A non-breaking space becomes a plain space so adjacent words stay apart.
        { @"&(nbsp|#160);", " " },
        { @"&(iexcl|#161);", "\u00a1" }, // inverted exclamation mark, chr(161)
        { @"&(cent|#162);", "\u00a2" },  // cent sign, chr(162)
        { @"&(pound|#163);", "\u00a3" }, // pound sign, chr(163)
        { @"&(copy|#169);", "\u00a9" },  // copyright sign, chr(169)
        // Every other numeric entity is dropped.
        { @"&#(\d+);", "" },
        // Turn a comment terminator into a line break so that the next rule,
        // which runs up to a line feed, can consume the comment.
        { @"-->", "\r\n" },
        { @"<!--.*\n", "" }
    };

    string output = strhtml;
    for (int i = 0; i < rules.GetLength(0); i++)
    {
        // The static overload reuses compiled patterns from the Regex cache.
        output = Regex.Replace(output, rules[i, 0], rules[i, 1], RegexOptions.IgnoreCase);
    }

    // string.Replace returns a new string; the result has to be kept,
    // otherwise these clean-up steps have no effect.
    output = output.Replace("<", "");
    output = output.Replace(">", "");
    output = output.Replace("\r\n", "");
    return output;
}