/// <summary>
/// Prefixes the configured site with "&lt;httpValue&gt;://www.", records the result as the
/// current URL, derives the site root (scheme and authority plus a trailing slash),
/// adds that root to <c>UrlToDo</c> and then calls <c>StartCrawlerAsync</c>.
/// </summary>
private void StartWebCrawler()
{
    // Expand the stored site name into an absolute address; the field is overwritten in place.
    string addressPrefix = httpValue + "://www.";
    websitelToCrawler = addressPrefix + websitelToCrawler;
    CurrentUrl = websitelToCrawler;

    // Parsing happens only after the two assignments above, so they remain in
    // effect even when the Uri constructor rejects the address.
    Uri siteUri = new Uri(websitelToCrawler);
    fullUriWebsite = siteUri;

    // Scheme + authority only (no path or query), with a trailing slash appended.
    string siteRoot = siteUri.GetLeftPart(UriPartial.Authority) + "/";
    fullUrlWebsite = siteRoot;

    // The root page is the first entry to be added to the work list.
    UrlToDo.Add(fullUrlWebsite);

    StartCrawlerAsync();
}
/// <summary>
/// Scans a downloaded page for links. Every <c>a</c> element that carries an <c>href</c>
/// attribute has its value passed to <c>IsValidLink</c>; each non-null result is
/// lower-cased, trimmed and added to <c>UrlToDo</c>, followed by a
/// <c>NotifyPropertyChanged("UrlDone")</c> call. <c>NotifyPropertyChanged()</c> is called
/// once more after the last link has been processed.
/// </summary>
/// <param name="replay">Response whose <c>document</c> is scanned for anchors.</param>
/// <returns>
/// <c>true</c> when the page contained at least one anchor with an <c>href</c> and the scan
/// ran to completion; <c>false</c> when there is no document, the page has no such
/// anchors, or an exception was raised while scanning.
/// </returns>
private bool AnalizePage(HtmlResponseData replay)
{
    try
    {
        if (replay == null || replay.document == null)
        {
            return false;
        }

        HtmlNodeCollection anchors = replay.document.DocumentNode.SelectNodes("//a[@href]");

        // SelectNodes yields null (not an empty collection) when nothing matches,
        // so both cases have to be treated as "no links on this page".
        if (anchors == null || anchors.Count == 0)
        {
            return false;
        }

        foreach (HtmlNode anchor in anchors)
        {
            // The attribute indexer returns null for a missing attribute.
            HtmlAttribute href = anchor.Attributes["href"];
            if (href == null)
            {
                continue;
            }

            string linkToAdd = IsValidLink(href.Value);
            if (linkToAdd == null)
            {
                continue;
            }

            UrlToDo.Add(linkToAdd.ToLower().Trim());
            NotifyPropertyChanged("UrlDone");
        }

        NotifyPropertyChanged();
        return true;
    }
    catch (Exception err)
    {
        // Best effort: a page that cannot be analysed is reported as a failure to
        // the caller instead of aborting the crawl, but the cause is no longer discarded.
        System.Diagnostics.Debug.WriteLine("AnalizePage failed: " + err);
        return false;
    }
}