public void Process(urldetail url)
{
    try
    {
        WebClient webClient = new WebClient();
        webClient.Encoding = Encoding.UTF8;
        string html = webClient.DownloadString(url.url);

        // Save the page to a file named after the shared page counter.
        string fileName = count.ToString();
        File.WriteAllText(fileName, html, Encoding.UTF8);

        url.html = html;
        PageDownloaded(this, url);
        Parse(html, url.url); // Parse the page and queue any newly found links.
    }
    catch (Exception)
    {
        // Swallow download/parse failures so one bad URL does not stop the crawl.
    }
}
public void Crawl()
{
    urldetail surl = new urldetail() { url = startUrl, processing = false, html = "" };
    urls.Add(surl);

    // Extract the host prefix of the start URL so that parsed links can later
    // be restricted to the same site.
    string str = @"(www\.){0,1}.*?\..*?/";
    Regex r = new Regex(str);
    Match m = r.Match(startUrl);
    startWith = m.Value;

    // Keep scanning the frontier until enough pages have been dispatched.
    while (count <= 20)
    {
        // Index-based loop: worker threads append new links to urls via Parse(),
        // and a foreach enumerator would throw if the list changed while it was
        // being enumerated.
        for (int i = 0; i < urls.Count; i++)
        {
            var current = urls[i];
            if (current.processing)
            {
                continue;
            }
            if (count > 20)
            {
                break;
            }

            current.processing = true;
            // current is declared inside the loop, so the closure captures the
            // URL this thread was started for rather than a shared loop variable.
            var t = new Thread(() => Process(current));
            t.Start();
            count++;
        }
    }
}
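// The two methods above rely on namespaces and class members that are not shown
// in this section. The following is a minimal sketch of what the surrounding
// code might look like; the class name, field names, and exact types are
// assumptions made for illustration, not taken from the original source.
using System;
using System.Collections.Generic;
using System.IO;
using System.Net;
using System.Text;
using System.Text.RegularExpressions;
using System.Threading;

public class urldetail
{
    public string url;        // Address of the page to fetch.
    public string html;       // Raw HTML filled in by Process().
    public bool processing;   // True once a worker thread has claimed the page.
}

public class Crawler
{
    private readonly List<urldetail> urls = new List<urldetail>(); // Crawl frontier.
    private string startUrl;   // Seed address the crawl begins from.
    private string startWith;  // Host prefix extracted in Crawl().
    private int count;         // Pages dispatched so far; also used as the file name.

    // Raised by Process() after a page has been fetched and saved.
    public event EventHandler<urldetail> PageDownloaded;

    // Extracts links from the HTML and appends new urldetail entries to urls
    // (implementation not shown in this section).
    private void Parse(string html, string pageUrl) { /* ... */ }
}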