Im using the following method to extract text form html:
    public string getAllText(string _html)
    {
        string _allText = "";
        try
        {
            HtmlAgilityPack.HtmlDocument document = new HtmlAgilityPack.HtmlDocument();
            document.LoadHtml(_html);
            var root = document.DocumentNode;
            var sb = new StringBuilder();
            foreach (var node in root.DescendantNodesAndSelf())
            {
                if (!node.HasChildNodes)
                {
                    string text = node.InnerText;
                    if (!string.IsNullOrEmpty(text))
                        sb.AppendLine(text.Trim());
                }
            }
            _allText = sb.ToString();
        }
        catch (Exception)
        {
        }
        _allText = System.Web.HttpUtility.HtmlDecode(_allText);
        return _allText;
    }
Problem is that i also get script and style tags.
How could i exclude them?
 
     
     
     
     
    
? I see it in OuterHtml but would like to strip out all inline styles too.
– Jeremy Jun 03 '16 at 17:51