Example #1
0
        /// <summary>
        /// Evaluates <c>XPath</c> against <paramref name="content"/>. Content that is neither
        /// exactly <c>XmlContent</c> nor exactly <c>XHtmlContent</c> is first re-loaded into a
        /// new <c>XHtmlContent</c> from its string representation.
        /// </summary>
        /// <param name="content">The content to query; may be null.</param>
        /// <param name="asList">When true <c>CrawlList</c> is used, otherwise <c>Crawl</c>.</param>
        /// <returns>
        /// The crawl result, or the value of <c>GetDefault</c> when the input or the crawl
        /// result is null.
        /// </returns>
        internal override IContentSource Crawl(IContentSource content, bool asList)
        {
            const string nullContentMessage = "Null content";

            if (content == null)
            {
                return GetDefault(nullContentMessage);
            }

            var isXml = content.GetType() == typeof(XmlContent);
            var isXHtml = content.GetType() == typeof(XHtmlContent);

            if (!isXml && !isXHtml)
            {
                // Anything else is treated as markup text and wrapped as XHTML.
                var rawText = content.ToString();
                IContentSource converted = new XHtmlContent();
                converted.LoadRaw(rawText);
                content = converted;
                isXHtml = true;
            }

            IContentSource result;
            if (isXHtml)
            {
                var xhtml = (XHtmlContent)content;
                result = asList ? xhtml.CrawlList(XPath) : xhtml.Crawl(XPath);
            }
            else
            {
                // Only XmlContent can reach this branch.
                var xml = (XmlContent)content;
                result = asList ? xml.CrawlList(XPath) : xml.Crawl(XPath);
            }

            return result ?? GetDefault(nullContentMessage);
        }
        /// <summary>
        /// Applies <c>Pattern</c> (single-line, case-insensitive) to the string form of
        /// <paramref name="content"/> and wraps the text captured by group
        /// <c>MatchGroup</c> in a <c>PlainContent</c>.
        /// </summary>
        /// <param name="content">Source whose <c>ToString()</c> output is searched.</param>
        /// <returns>
        /// A <c>PlainContent</c> whose list holds the captured value, or the result of
        /// <c>GetDefault</c> when the pattern does not match or the requested group does
        /// not exist.
        /// </returns>
        IContentSource CrawlObject(IContentSource content)
        {
            var match = Regex.Match(content.ToString(), Pattern, RegexOptions.Singleline | RegexOptions.IgnoreCase);

            // Regex.Match never returns null; failure is reported through Success.
            // A failed match still exposes group 0, so the count check alone would let
            // MatchGroup == 0 through and add an empty string instead of the default.
            if (!match.Success || match.Groups.Count <= MatchGroup)
            {
                return GetDefault(string.Format("Could not match pattern {0}", Pattern));
            }

            var plainContent = new PlainContent();
            plainContent.ContentList.Add(match.Groups[MatchGroup].Value);
            return plainContent;
        }
Example #3
0
        /// <summary>
        /// Searches the string form of <paramref name="content"/> with <c>Pattern</c>
        /// (single-line, case-insensitive) and returns the value of capture group
        /// <c>MatchGroup</c> inside a <c>PlainContent</c>.
        /// </summary>
        /// <param name="content">Source whose <c>ToString()</c> output is searched.</param>
        /// <returns>
        /// A <c>PlainContent</c> containing the captured text, or the result of
        /// <c>GetDefault</c> when there is no match or the group index is out of range.
        /// </returns>
        IContentSource CrawlObject(IContentSource content)
        {
            var match = Regex.Match(content.ToString(), Pattern, RegexOptions.Singleline | RegexOptions.IgnoreCase);

            // Success is the only reliable failure signal: Regex.Match never returns null,
            // and an unsuccessful match still reports one group (index 0), which would
            // otherwise pass the count check when MatchGroup is 0.
            if (!match.Success || match.Groups.Count <= MatchGroup)
            {
                return(GetDefault(string.Format("Could not match pattern {0}", Pattern)));
            }

            var plainContent = new PlainContent();

            plainContent.ContentList.Add(match.Groups[MatchGroup].Value);
            return(plainContent);
        }
        /// <summary>
        /// Runs the <c>XPath</c> query over <paramref name="content"/>. Input whose runtime
        /// type is not exactly <c>XmlContent</c> or <c>XHtmlContent</c> is converted by loading
        /// its string representation into a fresh <c>XHtmlContent</c>.
        /// </summary>
        /// <param name="content">The content to query; may be null.</param>
        /// <param name="asList">Selects <c>CrawlList</c> (true) or <c>Crawl</c> (false).</param>
        /// <returns>
        /// The query result, or the value of <c>GetDefault</c> if the input or the query
        /// result is null.
        /// </returns>
        internal override IContentSource Crawl(IContentSource content, bool asList)
        {
            const string nullContentMessage = "Null content";

            if (content == null) {
                return GetDefault(nullContentMessage);
            }

            var treatAsXHtml = content.GetType() == typeof(XHtmlContent);
            if (!treatAsXHtml && content.GetType() != typeof(XmlContent)) {
                // Unknown content kinds are re-parsed as XHTML from their text form.
                var rawText = content.ToString();
                IContentSource wrapped = new XHtmlContent();
                wrapped.LoadRaw(rawText);
                content = wrapped;
                treatAsXHtml = true;
            }

            IContentSource crawled;
            if (treatAsXHtml) {
                var xhtml = (XHtmlContent)content;
                crawled = asList ? xhtml.CrawlList(XPath) : xhtml.Crawl(XPath);
            } else {
                // The only remaining possibility is XmlContent.
                var xml = (XmlContent)content;
                crawled = asList ? xml.CrawlList(XPath) : xml.Crawl(XPath);
            }

            if (crawled != null) {
                return crawled;
            }

            return GetDefault(nullContentMessage);
        }
Example #5
0
 /// <summary>
 /// Records the string form of <paramref name="node"/>, indented by two spaces per
 /// current level, and then increases the level by one.
 /// </summary>
 /// <param name="node">The node whose <c>ToString()</c> text is recorded.</param>
 public void Push(IContentSource node)
 {
     var indentWidth = _level * 2;
     var indent = string.Empty.PadRight(indentWidth);
     var text = node.ToString();

     _descriptions.Add(indent + text);
     _level += 1;
 }
Example #6
0
 /// <summary>
 /// Appends a description line for <paramref name="node"/> (its <c>ToString()</c> text
 /// prefixed with two spaces per current level) and then moves one level deeper.
 /// </summary>
 /// <param name="node">The node being entered.</param>
 public void Push(IContentSource node)
 {
     var padding = string.Empty.PadRight(2 * _level);
     var line = string.Concat(padding, node.ToString());

     _descriptions.Add(line);
     ++_level;
 }