Beispiel #1
0
 /// <summary>
 /// Ends the crawl: quits the browser driver, calls <c>SaveSitemap</c> and
 /// <c>Save404Pages</c>, exports <c>pagesErrorList</c> to
 /// "PageNonValidateList.xlsx" inside the configured folder, then stops the
 /// stopwatch and logs the elapsed time.
 /// </summary>
 private void Finish()
 {
     _driver.Quit();
     SaveSitemap();
     Save404Pages();

     // Path.Combine adds a separator only when one is missing and uses the
     // platform's separator, unlike concatenating a hard-coded "\\".
     var errorReportPath = System.IO.Path.Combine(_options.FolderPath, "PageNonValidateList.xlsx");
     ExcelHandler.DataTableToExcel(errorReportPath, pagesErrorList);

     _watch.Stop();
     logger.Info("Finish all task in {0}", _watch.Elapsed);
 }
Beispiel #2
0
        private Dictionary <string, string> pageParentURLMapping;  // Maps a page (key) to its parent page (value).
        /// <summary>
        /// Creates a crawler: stores the options, initializes the empty tracking
        /// collections, the error table, the stopwatch and the logger, and starts
        /// a Chrome driver whose user agent is taken from <paramref name="options"/>.
        /// </summary>
        /// <param name="options">Crawler settings; its <c>UserAgent</c> is passed to Chrome.</param>
        /// <exception cref="ArgumentNullException"><paramref name="options"/> is null.</exception>
        public Crawler(CrawlerOptions options)
        {
            // Fail fast with a descriptive exception instead of a NullReferenceException
            // further down, and before a browser process is launched.
            if (options == null)
            {
                throw new ArgumentNullException(nameof(options));
            }

            _options             = options;
            pagesVisited         = new HashSet <Uri>();
            pagesNotFound        = new HashSet <Uri>();
            pagesToVisit         = new List <Uri>();
            _watch               = new Stopwatch();
            // InitTable receives a fresh table and its return value is what gets stored.
            pagesErrorList       = ExcelHandler.InitTable(new DataTable());
            logger               = LogManager.GetCurrentClassLogger();
            pageParentURLMapping = new Dictionary <string, string>();

            var chromeOptions = new ChromeOptions();
            chromeOptions.AddArgument("--user-agent=" + _options.UserAgent);
            _driver = new ChromeDriver(chromeOptions);
        }