コード例 #1
0
        /// <summary>
        /// Verifies that the page instance handed to the <c>PageCrawlStartingArgs</c>
        /// constructor is the same instance exposed by its <c>PageToCrawl</c> property.
        /// </summary>
        public void Constructor_ValidArg_SetsPublicProperty()
        {
            // Arrange
            Uri pageUri = new Uri("http://aaa.com/");
            PageToCrawl expectedPage = new CrawledPage(pageUri);
            CrawlContext crawlContext = new CrawlContext();

            // Act
            PageCrawlStartingArgs startingArgs = new PageCrawlStartingArgs(crawlContext, expectedPage);

            // Assert: reference equality, not just value equality.
            Assert.AreSame(expectedPage, startingArgs.PageToCrawl);
        }
コード例 #2
0
ファイル: WebCrawlerTest.cs プロジェクト: obender/abot
 /// <summary>
 /// Handler that unconditionally throws an <see cref="Exception"/> with the message "no!!!".
 /// Neither <paramref name="sender"/> nor <paramref name="e"/> is read.
 /// </summary>
 /// <exception cref="Exception">Always thrown.</exception>
 private void ThrowExceptionWhen_PageCrawlStarting(object sender, PageCrawlStartingArgs e)
 {
     Exception failure = new Exception("no!!!");
     throw failure;
 }
コード例 #3
0
 /// <summary>
 /// Writes a console line naming the link about to be crawled and the page it was found on.
 /// </summary>
 /// <param name="sender">Not used.</param>
 /// <param name="e">Supplies the <c>PageToCrawl</c> whose <c>Uri</c> and <c>ParentUri</c> are printed.</param>
 void crawler_ProcessPageCrawlStarting(object sender, PageCrawlStartingArgs e)
 {
     PageToCrawl page = e.PageToCrawl;
     string linkUri = page.Uri.AbsoluteUri;
     string foundOnUri = page.ParentUri.AbsoluteUri;

     Console.WriteLine("About to crawl link {0} which was found on page {1}", linkUri, foundOnUri);
 }
コード例 #4
0
ファイル: Crawler.cs プロジェクト: VAmaral/SRS
        /// <summary>
        /// Handler run before a page is crawled. When the page's absolute URI is already a key
        /// in <c>_crawledPages</c> and <c>ReVisit.ShouldReVisit</c> returns false for it,
        /// <c>PageCrawlDisallowed</c> is invoked with the page and a null second argument.
        /// </summary>
        /// <param name="sender">Not used.</param>
        /// <param name="e">Supplies the <c>PageToCrawl</c> being considered.</param>
        public static void ProcessPageCrawlStarting(object sender, PageCrawlStartingArgs e)
        {
            PageToCrawl candidate = e.PageToCrawl;
            string uri = e.PageToCrawl.Uri.AbsoluteUri;

            // Pages never seen before, or pages that should be revisited, proceed untouched.
            // NOTE(review): presumably ShouldReVisit decides whether the page changed since
            // the last crawl - confirm against ReVisit.
            if (!_crawledPages.ContainsKey(uri) || ReVisit.ShouldReVisit(_crawledPages, uri))
            {
                return;
            }

            PageCrawlDisallowed(candidate, null);
        }
コード例 #5
0
ファイル: Program.cs プロジェクト: krishnakanthms/abot
 /// <summary>
 /// Placeholder handler with the (sender, PageCrawlStartingArgs) signature.
 /// The body contains no statements; it marks where per-page processing would go.
 /// </summary>
 /// <param name="sender">Not used.</param>
 /// <param name="e">Not used.</param>
 static void crawler_ProcessPageCrawlStarting(object sender, PageCrawlStartingArgs e)
 {
     //Process data
 }
コード例 #6
0
ファイル: MainWindow.xaml.cs プロジェクト: rhjv55/Utilities
 /// <summary>
 /// Reads the page about to be crawled from the event arguments. The value is not
 /// used further; the debug trace that consumed it is disabled.
 /// </summary>
 /// <param name="sender">Not used.</param>
 /// <param name="e">Supplies the <c>PageToCrawl</c>.</param>
 static void crawler_ProcessPageCrawlStarting(object sender, PageCrawlStartingArgs e)
 {
     PageToCrawl page = e.PageToCrawl;
     // Disabled trace: previously wrote the parent page URI and the discovered link URI
     // (page.ParentUri.AbsoluteUri, page.Uri.AbsoluteUri) via Debug.WriteLine.
 }
コード例 #7
0
ファイル: CrawlDaddy.cs プロジェクト: BgRva/ThrongBot
        /// <summary>
        /// Tags the page about to be crawled with this instance's <c>SessionId</c> and
        /// <c>CrawlerId</c> (stored on its <c>PageBag</c>) and writes a debug log entry
        /// naming the page and its parent page.
        /// </summary>
        /// <param name="sender">Not used.</param>
        /// <param name="e">Supplies the <c>CrawlContext</c> and the <c>PageToCrawl</c>.</param>
        private void crawler_ProcessPageCrawlStarting(object sender, PageCrawlStartingArgs e)
        {
            // Read but not used further in this handler.
            CrawlContext crawlContext = e.CrawlContext;

            // Add id info to the page to crawl; per the original note these values
            // are passed along to the crawled page.
            e.PageToCrawl.PageBag.SessionId = SessionId;
            e.PageToCrawl.PageBag.CrawlerId = CrawlerId;

            PageToCrawl page = e.PageToCrawl;
            string pageUri = page.Uri.AbsoluteUri;
            string parentUri = page.ParentUri.AbsoluteUri;
            _logger.DebugFormat("Page Crawl Starting {0} which was found on page {1}", pageUri, parentUri);
        }
コード例 #8
0
 /// <summary>
 /// Handler with the (sender, PageCrawlStartingArgs) signature that intentionally does nothing.
 /// </summary>
 /// <param name="sender">Not used.</param>
 /// <param name="e">Not used.</param>
 private void PageCrawlStartingEvent(object sender, PageCrawlStartingArgs e)
 {
 }