Beispiel #1
0
        /// <summary>
        /// 详情
        /// </summary>
        public void RunArticleDetail()
        {
            var rule = new SpliderRule()
            {
                ContentXPath = "//div[@id='post_detail']",
                EachXPath    = "",
                Url          = " https://www.cnblogs.com/fancunwei/p/9581168.html",
                RuleFields   = new List <RuleField>()
                {
                    new RuleField()
                    {
                        DisplayName = "标题", XPath = "*//div[@class='post']//a[@id='cb_post_title_url']", IsFirstInnerText = true
                    },
                    new RuleField()
                    {
                        DisplayName = "详情", XPath = "*//div[@class='postBody']//div[@class='blogpost-body']", Attribute = "", IsFirstInnerText = false
                    }
                }
            };
            var splider = new ArticleSplider();
            var list    = splider.GetByRule(rule);

            foreach (var item in list)
            {
                var msg = string.Empty;
                item.Fields.ForEach(M =>
                {
                    Console.WriteLine($"{M.DisplayName}:{M.Value}");
                });
                Console.WriteLine(msg);
            }
        }
Beispiel #2
0
        /// <summary>
        /// 天气预报 - 15 days
        /// </summary>
        public void RunWeather15Days()
        {
            var rule = new SpliderRule()
            {
                ContentXPath = "//div[@id='15d']",
                EachXPath    = "*//li",
                Url          = "http://www.weather.com.cn/weather15d/101020100.shtml",
                RuleFields   = new List <RuleField>()
                {
                    new RuleField()
                    {
                        DisplayName = "日期", XPath = "span[@class='time']", IsFirstInnerText = true
                    },
                    new RuleField()
                    {
                        DisplayName = "天气", XPath = "span[@class='wea']", Attribute = "", IsFirstInnerText = false
                    },
                    new RuleField()
                    {
                        DisplayName = "区间", XPath = "span[@class='tem']", Attribute = "", IsFirstInnerText = false
                    },
                    new RuleField()
                    {
                        DisplayName = "风向", XPath = "span[@class='wind']", Attribute = "", IsFirstInnerText = false
                    },
                    new RuleField()
                    {
                        DisplayName = "风力", XPath = "span[@class='wind1']", Attribute = "", IsFirstInnerText = false
                    },
                }
            };
            var splider = new ArticleSplider();
            var list    = splider.GetByRule(rule);

            foreach (var item in list)
            {
                var msg = string.Empty;
                item.Fields.ForEach(M =>
                {
                    msg += $"{M.DisplayName}:{M.Value} ";
                });
                Console.WriteLine(msg);
            }
        }
Beispiel #3
0
        /// <summary>
        /// 天气预报 - 7 days
        /// </summary>
        public void RunWeather7Days()
        {
            var rule = new SpliderRule()
            {
                //ContentXPath = "//div[@id='7d']",
                ContentXPath = "//ul[@class='t clearfix']",
                EachXPath    = "li[@class]",
                Url          = "http://www.weather.com.cn/weather/101250101.shtml", //长沙7天天气
                RuleFields   = new List <RuleField>()
                {
                    new RuleField()
                    {
                        DisplayName = "日期", XPath = "h1", IsFirstInnerText = true
                    },
                    new RuleField()
                    {
                        DisplayName = "天气", XPath = "p[@class='wea']", Attribute = "", IsFirstInnerText = true
                    },
                    new RuleField()
                    {
                        DisplayName = "高", XPath = "p[@class='tem']/span", Attribute = "", IsFirstInnerText = true
                    },
                    new RuleField()
                    {
                        DisplayName = "低", XPath = "p[@class='tem']/i", Attribute = "", IsFirstInnerText = true
                    },
                    //new RuleField(){ DisplayName="风向",XPath="p[@class='win']",Attribute="", IsFirstInnerText=false },
                    //new RuleField(){ DisplayName="风力",XPath="p[@class='win']",Attribute="", IsFirstInnerText=false },
                }
            };
            var splider = new ArticleSplider();
            var list    = splider.GetByRule(rule);

            foreach (var item in list)
            {
                var msg = string.Empty;
                item.Fields.ForEach(M =>
                {
                    msg += $"{M.DisplayName}:{M.Value} ";
                });
                Console.WriteLine(msg);
            }
        }
Beispiel #4
0
        /// <summary>
        ///
        /// </summary>
        public void RunArticleRule()
        {
            var postitembodyXPath     = "div[@class='post_item_body']//";
            var postitembodyFootXPath = postitembodyXPath + "div[@class='post_item_foot']//";
            var rule = new SpliderRule()
            {
                ContentXPath = "//div[@id='post_list']",
                EachXPath    = "div[@class='post_item']",
                Url          = "https://www.cnblogs.com",
                RuleFields   = new List <RuleField>()
                {
                    new RuleField()
                    {
                        DisplayName = "推荐", XPath = "*//span[@class='diggnum']", IsFirstInnerText = true
                    },
                    new RuleField()
                    {
                        DisplayName = "标题", XPath = postitembodyXPath + "a[@class='titlelnk']", IsFirstInnerText = true
                    },
                    new RuleField()
                    {
                        DisplayName = "URL", XPath = postitembodyXPath + "a[@class='titlelnk']", Attribute = "href", IsFirstInnerText = true
                    },
                    new RuleField()
                    {
                        DisplayName = "简要", XPath = postitembodyXPath + "p[@class='post_item_summary']", IsFirstInnerText = true
                    },
                    new RuleField()
                    {
                        DisplayName = "作者", XPath = postitembodyFootXPath + "a[@class='lightblue']", IsFirstInnerText = true
                    },
                    new RuleField()
                    {
                        DisplayName = "作者URL", XPath = postitembodyFootXPath + "a[@class='lightblue']", Attribute = "href", IsFirstInnerText = true
                    },
                    new RuleField()
                    {
                        DisplayName = "讨论数", XPath = "span[@class='article_comment']", IsFirstInnerText = true, InnerTextRegex = @"[^0-9]+"
                    },
                    new RuleField()
                    {
                        DisplayName = "阅读数", XPath = postitembodyFootXPath + "span[@class='article_view']", IsFirstInnerText = true, InnerTextRegex = @"[^0-9]+"
                    },
                }
            };
            var splider = new ArticleSplider();
            var list    = splider.GetByRule(rule);

            foreach (var item in list)
            {
                var msg = string.Empty;
                item.Fields.ForEach(M =>
                {
                    if (M.DisplayName != "简要" && !M.DisplayName.Contains("URL"))
                    {
                        msg += $"{M.DisplayName}:{M.Value}";
                    }
                });
                Console.WriteLine(msg);
            }
        }