/// <summary>
/// Feeds a single anchor tag to <c>HtmlAgilityBasedUrlExtractor.ExtractUrls</c>
/// and checks that exactly one URL comes back and that it equals the
/// tag's <c>href</c> value.
/// </summary>
public void Extract_Url()
        {
            // Arrange: markup containing one anchor that points at the expected URL.
            const string markup = @"<a href=""https://github.com"">";
            var sut = new HtmlAgilityBasedUrlExtractor();

            // Act
            var extracted = sut.ExtractUrls(markup);

            // Assert: one result only, and it is the href of the anchor.
            Assert.Single(extracted);
            Assert.Equal("https://github.com", extracted[0]);
        }
示例#2
0
        /// <summary>
        /// Downloads the page at <paramref name="url"/>, extracts the links from
        /// its raw content and writes them to the console, one per line, each
        /// prefixed with its zero-based position.
        /// </summary>
        /// <param name="url">Address handed to the downloader.</param>
        private static void ListLinksForUrl(string url)
        {
            IDownloadAWebpage pageDownloader = new DownloadAWebpage();
            IUrlExtractor     linkExtractor  = new HtmlAgilityBasedUrlExtractor();

            // NOTE(review): `.Result` presumably blocks on a task returned by
            // Download — confirm, and consider an async path if callers allow it.
            var download   = pageDownloader.Download(url);
            var rawContent = download.Result.RawContent;
            var found      = linkExtractor.ExtractUrls(rawContent);

            // The position is right-aligned in a 4-character column.
            for (var position = 0; position < found.Length; position++)
            {
                Console.WriteLine($"{position,4}. {found[position]}");
            }
        }