C# 使用正则表达式去除 HTML 标记：
using System;
using System.Text.RegularExpressions;
// Demonstrates removing HTML tags from a string with a regular expression
// and then converting the "&nbsp;" entity into an ordinary space.

// Sample input; substitute the HTML text that should be cleaned.
string strHtml = @"
带有HTML标记的字符";

// Matches one complete tag: '<', one or more characters that are not '>', then '>'.
// The negated class [^>] also matches line breaks, so tags spanning several lines
// are removed as well. The pattern has no letters, so no case option is required.
Regex regex = new Regex("<[^>]+>");

// Remove every tag from the input text (the input is strHtml, not the result variable).
string str = regex.Replace(strHtml, "");

// Replace the non-breaking-space entity with a plain space and print the result.
Console.WriteLine(str.Replace("&nbsp;", " "));