#region License
// Copyright (c) 2007 James Newton-King
//
// Permission is hereby granted, free of charge, to any person
// obtaining a copy of this software and associated documentation
// files (the "Software"), to deal in the Software without
// restriction, including without limitation the rights to use,
// copy, modify, merge, publish, distribute, sublicense, and/or sell
// copies of the Software, and to permit persons to whom the
// Software is furnished to do so, subject to the following
// conditions:
//
// The above copyright notice and this permission notice shall be
// included in all copies or substantial portions of the Software.
//
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
// EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
// OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
// NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
// HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
// WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
// FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
// OTHER DEALINGS IN THE SOFTWARE.
#endregion

using System;
using System.Collections.Generic;
using System.IO;
using System.Linq;
using System.Text;
using System.Text.RegularExpressions;

namespace Newtonsoft.Utilities.Text
{
    /// <summary>
    /// String extension methods for stripping markup tags out of text.
    /// </summary>
    /// <remarks>
    /// Tag detection is done with a regular expression, not an HTML parser.
    /// Only the tags themselves are removed; text between an opening and a
    /// closing tag is left in place.
    /// </remarks>
    public static class StringExtensions
    {
        // Matches one opening, closing or self-closing tag:
        //   <  optional '/'  optional whitespace  tag name (captured as "tag")
        //   optional name='value' / name="value" attributes (captured as "attr")
        //   optional whitespace  optional '/'  >
        // Built once and shared: constructing a Compiled regex on every call
        // is expensive, and Regex instances are safe to reuse.
        private static readonly Regex AnyTag = new Regex(
            @"<[/]{0,1}\s*(?<tag>\w*)\s*(?<attr>.*?=['""].*?[""'])*?\s*[/]{0,1}>",
            RegexOptions.Compiled);

        /// <summary>
        /// Removes every tag from the string.
        /// </summary>
        /// <param name="s">The text to strip tags from.</param>
        /// <returns><paramref name="s"/> with all matched tags removed.</returns>
        /// <exception cref="ArgumentNullException"><paramref name="s"/> is null.</exception>
        public static string RemoveHtml(this string s)
        {
            return RemoveHtmlInternal(s, null);
        }

        /// <summary>
        /// Removes only the tags whose name appears in <paramref name="removeTags"/>;
        /// every other tag is left untouched.
        /// </summary>
        /// <param name="s">The text to strip tags from.</param>
        /// <param name="removeTags">
        /// Names of the tags to remove (for example "b" or "script"), compared
        /// case-insensitively against the tag names found in <paramref name="s"/>.
        /// </param>
        /// <returns><paramref name="s"/> with the listed tags removed.</returns>
        /// <exception cref="ArgumentNullException">
        /// <paramref name="removeTags"/> or <paramref name="s"/> is null.
        /// </exception>
        public static string RemoveHtml(this string s, IList<string> removeTags)
        {
            if (removeTags == null)
            {
                throw new ArgumentNullException("removeTags");
            }

            return RemoveHtmlInternal(s, removeTags);
        }

        // Shared implementation: a null removeTags means "remove every tag".
        private static string RemoveHtmlInternal(string s, IList<string> removeTags)
        {
            if (s == null)
            {
                throw new ArgumentNullException("s");
            }

            if (removeTags == null)
            {
                return AnyTag.Replace(s, string.Empty);
            }

            // Case-insensitive set so that "B", "b" and "<B>" all agree, with
            // constant-time lookups for each tag found in the input.
            HashSet<string> tagsToRemove = new HashSet<string>(removeTags, StringComparer.OrdinalIgnoreCase);

            return AnyTag.Replace(s, delegate(Match match)
            {
                string tag = match.Groups["tag"].Value;

                // Listed tags are dropped; anything else is echoed back unchanged.
                return tagsToRemove.Contains(tag) ? string.Empty : match.Value;
            });
        }
    }
}