Beispiel #1
0
        /// <summary>
        /// Retrieves the page at <paramref name="baseUrl"/>, gathers the image URLs found in the
        /// footer's <c>div</c> child, then fetches each image and saves it under <c>../../images/</c>.
        /// </summary>
        /// <param name="baseUrl">
        /// Address of the page to crawl. It is also prepended verbatim to every image URL
        /// before that image is requested.
        /// </param>
        public void Process(string baseUrl)
        {
            var page = pageRetriever.GetPage(baseUrl);

            Logger.Log("crawling data");

            var pageBody   = this.GetBody(page);
            var pageFooter = this.GetFooter(pageBody);

            // Single(...) demands exactly one direct child named "div"; anything else throws.
            var footerDiv = pageFooter.ChildNodes.Single(child => child.Name == "div");

            foreach (var imageUrl in this.GetImagesUrls(footerDiv))
            {
                // Image URL is appended directly to the base URL, with no separator added.
                var content = pageRetriever.GetImage($"{baseUrl}{imageUrl}");

                // The text after the last '/' in the URL becomes the saved file's name.
                var pathSegments = imageUrl.Split('/');
                var targetPath   = $"../../images/{pathSegments.Last()}";

                fileManager.SaveImage(content, targetPath);
            }

            Logger.Log("done!");
        }