Пример #1
0
        /// <summary>
        /// Queues an asynchronous download of the samair checker page through
        /// <paramref name="proxy"/>; <c>EndCheckAnonimous</c> is handed to the
        /// download object as its callback.
        /// </summary>
        /// <param name="proxy">Proxy the request is routed through.</param>
        void BeginCheckAnonymous(RatedProxy proxy)
        {
            // The trailing 3 is presumably the attempt count - confirm against DownloaderObj.
            Downloader.Queue(
                new DownloaderObj(
                    new Uri("http://checker.samair.ru/"),
                    EndCheckAnonimous,
                    true,
                    proxy,
                    CookieOptions.NoCookies,
                    3));
        }
Пример #2
0
        /// <summary>
        /// Queries every RBL entry from <c>GlobalResourceCache.RBLList</c> for the proxy host
        /// and stores the mean ban rate of the entries that produced a result in
        /// <c>proxy.RBLBanRate</c>. The property is left untouched when no entry answered.
        /// </summary>
        /// <param name="proxy">Proxy whose host is looked up and whose rate is updated.</param>
        void CheckRBL(RatedProxy proxy)
        {
            DateTime startedAt = DateTime.Now; //DEBUG

            List <string[]> entries = GlobalResourceCache.RBLList;
            double          rateSum  = 0;
            int             answered = 0;

            foreach (string[] entry in entries)
            {
                // entry[0] = URL template containing *IP*, entry[1] = "positive" pattern,
                // entry[2] = "negative" pattern (as consumed by GetRblBanRate).
                Uri   lookupUri = new Uri(entry[0].Replace("*IP*", proxy.Address.Host));
                Regex positive  = new Regex(entry[1]);
                Regex negative  = new Regex(entry[2]);

                double rate = GetRblBanRate(lookupUri, positive, negative, proxy);
                if (!(rate > -1))
                {
                    // -1 marks "no usable answer" and is excluded from the mean.
                    continue;
                }

                answered++;
                rateSum += rate;
            }

            // Floating-point division: yields NaN (not an exception) when nothing answered.
            double meanRate = rateSum / answered;

            if (answered > 0)
            {
                proxy.RBLBanRate = meanRate;
            }
            Console.WriteLine("CheckRBL - elapsed {0}s, rate {1}", (DateTime.Now - startedAt).TotalSeconds, meanRate); //DEBUG
        }
Пример #3
0
        /// <summary>
        /// Probes <paramref name="uri"/> through <paramref name="proxy"/> up to
        /// <paramref name="attempts"/> times and averages the elapsed time of the probes
        /// for which <c>Downloader.HaveResponce</c> returned true.
        /// </summary>
        /// <returns>
        /// Mean elapsed milliseconds (integer division) over the successful probes,
        /// or null when none succeeded.
        /// </returns>
        int? GetAvgLatency(Uri uri, RatedProxy proxy, int attempts)
        {
            int       succeeded  = 0;
            int       elapsedSum = 0;
            Stopwatch watch      = new Stopwatch();

            for (int left = attempts; left > 0; left--)
            {
                DownloaderObj probe = new DownloaderObj(uri, null, false, proxy, CookieOptions.Empty, 1);

                watch.Restart();
                bool answered = Downloader.HaveResponce(probe);
                watch.Stop();

                if (!answered)
                {
                    continue;
                }

                succeeded++;
                elapsedSum += (int)watch.ElapsedMilliseconds;
            }

            return succeeded == 0 ? (int?)null : elapsedSum / succeeded;
        }
Пример #4
0
        /// <summary>
        /// Schedules one thread-pool work item per proxy. Each item first checks the proxy host
        /// with <c>HostReply</c>; unreachable proxies are finished immediately via
        /// <c>EndTest(proxy, true)</c>, reachable ones get every non-null test invoked in order.
        /// </summary>
        /// <param name="proxies">Proxies to test; nothing happens for an empty list.</param>
        /// <param name="tests">Test actions to run against each reachable proxy.</param>
        void TestByActions(List <RatedProxy> proxies, List <Action <RatedProxy> > tests)
        {
            int total = proxies.Count;
            if (total == 0)
            {
                return;
            }

            // Counter of proxies still under test; EndTest decrements it.
            _proxiesTesting = total;

            foreach (RatedProxy current in proxies)
            {
                // Per-iteration copy so each closure captures its own proxy.
                RatedProxy captured = current;

                WaitCallback work = delegate(object state)
                {
                    if (HostReply(captured.Address.Host, 5))
                    {
                        foreach (Action <RatedProxy> test in tests)
                        {
                            if (test != null)
                            {
                                test(captured);
                            }
                        }
                    }
                    else
                    {
                        EndTest(captured, true);
                    }
                };

                ThreadPool.QueueUserWorkItem(work);
            }
        }
Пример #5
0
        /// <summary>
        /// Loads the stored proxies, keeps a single entry per <c>Address.OriginalString</c>
        /// (the one with the highest <c>CheckTimes</c>; the first seen wins a tie) and saves
        /// the de-duplicated list back via <c>SaveProxies</c>.
        /// </summary>
        /// <remarks>
        /// Uses a typed dictionary instead of a non-generic Hashtable, which removes the
        /// unchecked <c>as</c> cast and the repeated key lookups. The order of the saved list
        /// follows dictionary enumeration; it was never a documented order with Hashtable either.
        /// </remarks>
        public static void RemoveDuplicates()
        {
            List <RatedProxy> proxies = LoadProxies();
            Dictionary <string, RatedProxy> bestByAddress = new Dictionary <string, RatedProxy>();

            foreach (RatedProxy proxy in proxies)
            {
                string     key = proxy.Address.OriginalString;
                RatedProxy known;

                // Store when the address is new or this entry has been checked more often.
                if (!bestByAddress.TryGetValue(key, out known) || proxy.CheckTimes > known.CheckTimes)
                {
                    bestByAddress[key] = proxy;
                }
            }

            SaveProxies(new List <RatedProxy>(bestByAddress.Values), false);
        }
Пример #6
0
        //ASYNC(NOT TESTED)
        #region Async RBL
        //void BeginRBLCheck(RatedProxy proxy)
        //{
        //    List<string[]> rblList = GlobalResourceCache.RBLList;
        //    int indx = 0;
        //    double rblBanRate = 0;
        //    int rblChecks = rblList.Count;

        //    BeginRBLCheck(indx, rblBanRate, rblChecks, proxy);
        //}
        //void EndRBLCheck(DownloaderObj obj)
        //{
        //    object[] args = obj.Arg as object[];
        //    int indx = (int)args[0];
        //    double rblBanRate = (double)args[1];
        //    int rblChecks = (int)args[2];

        //    List<string[]> rblList = GlobalResourceCache.RBLList;
        //    string[] rblSet = rblList[indx];
        //    Regex positiveRx = new Regex(rblSet[1]);
        //    Regex negativeRx = new Regex(rblSet[2]);

        //    double rate = GetRblBanRate(obj.DataStr, positiveRx, negativeRx);
        //    if (rate > -1)
        //    {
        //        rblBanRate += rate;
        //    }
        //    else
        //        rblChecks--;

        //    indx++;
        //    if (indx < rblList.Count)
        //    {
        //        BeginRBLCheck(indx, rblBanRate, rblChecks, obj.PrxContainer);
        //    }
        //    else if (rblChecks > 0)
        //    {
        //        obj.PrxContainer.RBLBanRate = rblBanRate / rblChecks;
        //    }
        //}
        //double GetRblBanRate(string data, Regex positiveRx, Regex negativeRx)
        //{
        //    if (data == null)
        //        return -1;
        //    double blocked = negativeRx.Matches(data).Count;
        //    double ok = positiveRx.Matches(data).Count;

        //    bool noResults = blocked == 0 && ok == 0;

        //    if (noResults)
        //        return -1;
        //    if (blocked == 0)
        //        return 0;
        //    if (ok == 0)
        //        return 1;

        //    return blocked / ok;
        //}
        //void BeginRBLCheck(int indx, double rblBanRate, int rblChecks, RatedProxy proxy)
        //{
        //    List<string[]> rblList = GlobalResourceCache.RBLList;

        //    if (indx < rblList.Count)
        //    {
        //        string[] rblSet = rblList[indx];
        //        DownloaderObj obj = new DownloaderObj(new Uri(rblSet[0]), EndRBLCheck, true, proxy, CookieOptions.NoCookies, 3, new object[] { indx, rblBanRate, rblChecks });
        //        Downloader.Queue(obj);
        //    }
        //}
        #endregion
        #endregion

        #region DownloadsCheck
        /// <summary>
        /// Loads the site patterns from <c>PATH.TagClassPatterns</c> and queues one asynchronous
        /// download per pattern through <paramref name="proxy"/>, with <c>EndDownload</c> as callback.
        /// </summary>
        /// <param name="proxy">Proxy every queued download is routed through.</param>
        void BeginDownloads(RatedProxy proxy)
        {
            List <PatternsContainer> patterns = PagePatternGrabber.LoadPatterns(PATH.TagClassPatterns);

            // A single waiter instance is shared by all downloads queued in this call.
            SyncWaitObj sharedWaiter = new SyncWaitObj(0);

            foreach (PatternsContainer pattern in patterns)
            {
                // Callback payload: the pattern, the shared waiter and the total pattern count.
                object[] payload = new object[] { pattern, sharedWaiter, patterns.Count };

                Downloader.Queue(
                    new DownloaderObj(pattern.Uri, EndDownload, true, proxy, CookieOptions.NoCookies, DownloadsAttempts, payload));
            }
        }
Пример #7
0
        /// <summary>
        /// Wraps each proxy in a <c>ProxyContainer</c> and places it into <c>_proxies</c> in front
        /// of the first existing entry it beats on speed, site rate or latency; proxies that beat
        /// nothing are appended. When <c>_useLocalhost</c> is set, a container with a null proxy
        /// and rating 999 is finally inserted at index 0.
        /// </summary>
        /// <param name="proxies">Proxies to add to the rated list.</param>
        void FillProxyList(List <RatedProxy> proxies)
        {
            foreach (RatedProxy candidate in proxies)
            {
                ProxyContainer candidateBox = new ProxyContainer(candidate, _maxOccupiedTimes, _prxLifes);

                // Index of the first entry the candidate outperforms, or -1 if there is none.
                int            insertAt = -1;
                ProxyContainer beaten   = null;

                for (int slot = 0; slot < _proxies.Count; slot++)
                {
                    ProxyContainer occupantBox = _proxies[slot];
                    RatedProxy     occupant    = occupantBox.Proxy;

                    bool faster       = candidate.AvgSpeed > occupant.AvgSpeed;
                    bool betterSites  = candidate.SitesRate > occupant.SitesRate;
                    bool lowerLatency = (candidate.AvgLatency != RatedProxy.DefaultVal && candidate.AvgLatency < occupant.AvgLatency);

                    if (faster || betterSites || lowerLatency)
                    {
                        insertAt = slot;
                        beaten   = occupantBox;
                        break;
                    }
                }

                if (insertAt >= 0)
                {
                    // Better proxies go nearer the top; the beaten entry's rating is bumped
                    // and the newcomer takes that bumped value.
                    candidateBox.Rating = ++beaten.Rating;
                    _proxies.Insert(insertAt, candidateBox);
                }
                else
                {
                    if (_proxies.Count != 0)
                    {
                        // Appended entries inherit the rating of the current last entry.
                        candidateBox.Rating = _proxies.Last().Rating;
                    }
                    _proxies.Add(candidateBox);
                }
            }

            if (!_useLocalhost)
            {
                return;
            }

            ProxyContainer localhost = new ProxyContainer(null, _localhost_occupation, _localhost_lives);
            _proxies.Insert(0, localhost);

            localhost.Rating = 999;
        }
Пример #8
0
 /// <summary>
 /// Sorts <paramref name="proxies"/> in place by <c>AvgSpeed</c>, fastest first, and returns
 /// the same list instance.
 /// </summary>
 /// <remarks>
 /// Replaces a hand-written bubble sort that always ran n full passes. The LINQ ordering is
 /// stable, so proxies with equal speed keep their relative order exactly as before.
 /// NOTE(review): assumes AvgSpeed is a double; a NaN speed would now be placed by the default
 /// comparer instead of acting as a barrier in the pairwise swaps - confirm NaN cannot occur.
 /// </remarks>
 /// <param name="proxies">List to reorder; it is mutated.</param>
 /// <returns>The reordered <paramref name="proxies"/> instance.</returns>
 static List <RatedProxy> SortBySpeed(List <RatedProxy> proxies)
 {
     // Materialise the ordered sequence before touching the source list.
     List <RatedProxy> ordered = new List <RatedProxy>(
         System.Linq.Enumerable.OrderByDescending(proxies, p => p.AvgSpeed));

     proxies.Clear();
     proxies.AddRange(ordered);
     return(proxies);
 }
Пример #9
0
 /// <summary>
 /// Sorts <paramref name="proxies"/> in place by <c>RBLBanRate</c>, lowest ban rate first,
 /// and returns the same list instance.
 /// </summary>
 /// <remarks>
 /// Replaces a hand-written bubble sort that always ran n full passes. The LINQ ordering is
 /// stable, so proxies with equal ban rate keep their relative order exactly as before.
 /// NOTE(review): assumes RBLBanRate is a double; a NaN rate would now be placed by the default
 /// comparer instead of acting as a barrier in the pairwise swaps - confirm NaN cannot occur.
 /// </remarks>
 /// <param name="proxies">List to reorder; it is mutated.</param>
 /// <returns>The reordered <paramref name="proxies"/> instance.</returns>
 static List <RatedProxy> SortByRBL(List <RatedProxy> proxies)
 {
     // Materialise the ordered sequence before touching the source list.
     List <RatedProxy> ordered = new List <RatedProxy>(
         System.Linq.Enumerable.OrderBy(proxies, p => p.RBLBanRate));

     proxies.Clear();
     proxies.AddRange(ordered);
     return(proxies);
 }
Пример #10
0
        /// <summary>
        /// Marks one proxy test as finished: atomically decrements <c>_proxiesTesting</c>,
        /// notifies the progress and per-proxy completion handlers when present, and calls
        /// <c>OnTestsComplete</c> once the counter reaches zero.
        /// </summary>
        /// <param name="proxy">Proxy whose test has ended.</param>
        /// <param name="unpingable">Forwarded to the progress handler.</param>
        private void EndTest(RatedProxy proxy, bool unpingable = false)
        {
            int remaining = Interlocked.Decrement(ref _proxiesTesting);

            // This method runs on thread-pool threads. Snapshot each delegate before the null
            // check so a concurrent unsubscribe cannot null it between check and invocation.
            var progressHandler = OnProgressChanged;
            if (progressHandler != null)
            {
                progressHandler(remaining, unpingable);
            }

            var completeHandler = OnProxyTestComplete;
            if (completeHandler != null)
            {
                completeHandler(proxy);
            }

            if (remaining == 0)
            {
                // NOTE(review): invoked without a null check as in the original; if this is a
                // delegate/event rather than a method it needs the same guard - confirm.
                OnTestsComplete();
            }
        }
Пример #11
0
        /// <summary>
        /// Checks that a Google search URL answers through <paramref name="proxy"/>; on success
        /// the same download object is queued (callback <c>CheckGooglePage</c>), otherwise an
        /// error is logged when <c>_logging</c> is enabled.
        /// </summary>
        /// <param name="proxy">Proxy the request is routed through.</param>
        void DownloadGooglePage(RatedProxy proxy)
        {
            Uri           googleUri = new Uri("http://www.google.com/search?q=flowers&sourceid=opera&ie=utf-8&oe=utf-8");
            DownloaderObj obj       = new DownloaderObj(googleUri, CheckGooglePage, true, proxy, CookieOptions.Empty, 2);

            if (Downloader.HaveResponce(obj))
            {
                // Attempts is set back to 2 before queuing, as in the original
                // (presumably the probe consumes attempts - confirm).
                obj.Attempts = 2;
                Downloader.Queue(obj);
            }
            else
            {
                if (_logging)
                {
                    // Fixed copy-paste from the Yandex check: the message blamed the "ya host"
                    // although the failing host here is Google.
                    GlobalLog.Err("Cant get responce from http://google.com, perhaps proxy or google host is down, p:" + obj.Proxy.Address.Host);
                }
            }
        }
Пример #12
0
        /// <summary>
        /// Runs the download-speed and latency checks for every site pattern loaded from
        /// <c>PATH.TagClassPatterns</c> and stores the averages on <paramref name="proxy"/>
        /// (<c>AvgLatency</c>, <c>SitesRate</c>, <c>AvgSpeed</c>). A property is only updated
        /// when at least one corresponding check succeeded. <c>CheckTimes</c> is always incremented.
        /// </summary>
        /// <remarks>
        /// The debug line used to compute <c>totalLatency / latencyCheked</c> unconditionally;
        /// that is an integer division and threw DivideByZeroException whenever no latency
        /// probe succeeded, which also skipped the <c>CheckTimes</c> increment. Averages are now
        /// computed once, only when their counter is non-zero, and reported as "n/a" otherwise.
        /// </remarks>
        /// <param name="proxy">Proxy to test and update.</param>
        void VerifySites(RatedProxy proxy)
        {
            //DEBUG
            Stopwatch elapsed = Stopwatch.StartNew();

            int    downloadChecked = 0;
            int    latencyChecked  = 0;
            double totalSiteRate   = 0;
            double totalSpeed      = 0;
            long   totalLatency    = 0;

            List <PatternsContainer> siteChecks = PagePatternGrabber.LoadPatterns(PATH.TagClassPatterns);

            foreach (var siteCheck in siteChecks)
            {
                double siteRate      = 0;
                double downloadSpeed = 0;
                if (TryCheckDownloadSpeed(proxy, siteCheck.Uri, siteCheck.Validation, ref siteRate, ref downloadSpeed))
                {
                    totalSiteRate += siteRate;
                    totalSpeed    += downloadSpeed;
                    downloadChecked++;
                }

                int? latency = GetAvgLatency(siteCheck.Uri, proxy, 4);
                if (latency.HasValue)
                {
                    latencyChecked++;
                    totalLatency += latency.Value;
                }
            }

            // Values for the debug line; "n/a" stays when the matching check never succeeded.
            object latencyInfo  = "n/a";
            object siteRateInfo = "n/a";
            object speedInfo    = "n/a";

            if (latencyChecked > 0)
            {
                int avgLatency = (int)(totalLatency / latencyChecked);
                proxy.AvgLatency = avgLatency;
                latencyInfo      = avgLatency;
            }
            if (downloadChecked > 0)
            {
                double avgSiteRate = totalSiteRate / downloadChecked;
                double avgSpeed    = totalSpeed / downloadChecked;
                proxy.SitesRate = avgSiteRate;
                proxy.AvgSpeed  = avgSpeed;
                siteRateInfo    = avgSiteRate;
                speedInfo       = avgSpeed;
            }
            //DEBUG
            Console.WriteLine("VerifySites - elapsed {0}s, latency {1}, sites rate {2}, speed {3} ", elapsed.Elapsed.TotalSeconds, latencyInfo, siteRateInfo, speedInfo); //DEBUG
            proxy.CheckTimes++;
        }
Пример #13
0
        /// <summary>
        /// Checks that http://kiks.yandex.ru/su/ answers through <paramref name="proxy"/>; on
        /// success the download object is retargeted to http://wordstat.yandex.ru/ and queued
        /// (callback <c>CheckYaPage</c>), otherwise an error is logged when <c>_logging</c> is enabled.
        /// </summary>
        /// <param name="proxy">Proxy the requests are routed through.</param>
        void DownloadYaPage(RatedProxy proxy)
        {
            DownloaderObj request = new DownloaderObj(new Uri("http://kiks.yandex.ru/su/"), CheckYaPage, true, proxy, CookieOptions.Take, 2);

            if (!Downloader.HaveResponce(request))
            {
                if (_logging)
                {
                    GlobalLog.Err("Cant get responce from http://kiks.yandex.ru, perhaps proxy or ya host is down, p:" + request.Proxy.Address.Host);
                }
                return;
            }

            // The probe answered: reuse the same object for the real page.
            request.Uri      = new Uri("http://wordstat.yandex.ru/");
            request.Attempts = 2;
            Downloader.Queue(request);
        }
Пример #14
0
        /// <summary>
        /// Downloads <paramref name="rblUri"/> synchronously through <paramref name="proxy"/> and
        /// computes the share of <paramref name="negativeRx"/> matches among all matches of both
        /// patterns in the response text.
        /// </summary>
        /// <returns>
        /// A value in [0, 1], or -1 when there is no response text or neither pattern matched.
        /// </returns>
        double GetRblBanRate(Uri rblUri, Regex positiveRx, Regex negativeRx, RatedProxy proxy)
        {
            DownloaderObj request = new DownloaderObj(rblUri, null, true, proxy, CookieOptions.NoCookies, 4, null, null, false, 1000, new TimingParams(TimingPattern.BigWait));

            Downloader.DownloadSync(request);

            if (request.DataStr == null)
            {
                return -1;
            }

            int listedHits = negativeRx.Matches(request.DataStr).Count;
            int cleanHits  = positiveRx.Matches(request.DataStr).Count;

            if (listedHits != 0 || cleanHits != 0)
            {
                return (double)listedHits / (cleanHits + listedHits);
            }

            // Neither pattern matched: the page gave no verdict.
            return -1;
        }
Пример #15
0
        /// <summary>
        /// Tries up to three times to download <paramref name="uri"/> synchronously through
        /// <paramref name="proxy"/> and to validate the page with <paramref name="validator"/>.
        /// </summary>
        /// <param name="proxy">Proxy the download is routed through.</param>
        /// <param name="uri">Page to download.</param>
        /// <param name="validator">Decides whether the downloaded text is acceptable.</param>
        /// <param name="siteRate">
        /// On success set to 1 - attemptIndex / 3 (1 for a first-try success); unchanged on failure.
        /// </param>
        /// <param name="downloadSpeed">
        /// On success set to UTF-8 byte count / elapsed milliseconds (bytes per ms, roughly KB/s);
        /// unchanged on failure.
        /// </param>
        /// <returns>True as soon as one attempt yields a validated page, otherwise false.</returns>
        private bool TryCheckDownloadSpeed(RatedProxy proxy, Uri uri, IPageValidator validator, ref double siteRate, ref double downloadSpeed)
        {
            const int maxAttempts = 3;
            Stopwatch timer       = new Stopwatch();

            for (int attempt = 0; attempt < maxAttempts; attempt++)
            {
                DownloaderObj obj = new DownloaderObj(uri, null, true, proxy, CookieOptions.Empty, 1);
                timer.Restart();
                Downloader.DownloadSync(obj);
                timer.Stop();

                string data = obj.DataStr;
                if (data == null || !validator.Validate(data))
                {
                    continue;
                }

                siteRate = (1 - attempt / (double)maxAttempts);

                // Clamp to 1 ms: a 0 ms reading would otherwise produce Infinity/NaN and
                // poison the averages built from this value.
                long elapsedMs = Math.Max(1L, timer.ElapsedMilliseconds);

                // GetByteCount measures the payload without allocating the byte array
                // (the original encoded the text twice and kept an unused local).
                downloadSpeed = Encoding.UTF8.GetByteCount(data) / (double)elapsedMs; //KB-sec
                return(true);
            }
            return(false);
        }
Пример #16
0
 /// <summary>
 /// Queues an asynchronous download of the samair checker page through
 /// <paramref name="proxy"/>; <c>EndCheckAnonimous</c> is handed to the
 /// download object as its callback.
 /// </summary>
 /// <param name="proxy">Proxy the request is routed through.</param>
 void BeginCheckAnonymous(RatedProxy proxy)
 {
     // The trailing 3 is presumably the attempt count - confirm against DownloaderObj.
     Downloader.Queue(
         new DownloaderObj(
             new Uri("http://checker.samair.ru/"),
             EndCheckAnonimous,
             true,
             proxy,
             CookieOptions.NoCookies,
             3));
 }
Пример #17
0
        /// <summary>
        /// Loads the site patterns from <c>PATH.TagClassPatterns</c> and queues one asynchronous
        /// download per pattern through <paramref name="proxy"/>, with <c>EndDownload</c> as callback.
        /// </summary>
        /// <param name="proxy">Proxy every queued download is routed through.</param>
        void BeginDownloads(RatedProxy proxy)
        {
            List<PatternsContainer> patterns = PagePatternGrabber.LoadPatterns(PATH.TagClassPatterns);

            // A single waiter instance is shared by all downloads queued in this call.
            SyncWaitObj sharedWaiter = new SyncWaitObj(0);

            foreach (PatternsContainer pattern in patterns)
            {
                // Callback payload: the pattern, the shared waiter and the total pattern count.
                object[] payload = new object[] { pattern, sharedWaiter, patterns.Count };

                Downloader.Queue(
                    new DownloaderObj(pattern.Uri, EndDownload, true, proxy, CookieOptions.NoCookies, DownloadsAttempts, payload));
            }
        }
Пример #18
0
        /// <summary>
        /// Queries every RBL entry from <c>GlobalResourceCache.RBLList</c> for the proxy host
        /// and stores the mean ban rate of the entries that produced a result in
        /// <c>proxy.RBLBanRate</c>. The property is left untouched when no entry answered.
        /// </summary>
        /// <param name="proxy">Proxy whose host is looked up and whose rate is updated.</param>
        void CheckRBL(RatedProxy proxy)
        {
            DateTime startedAt = DateTime.Now; //DEBUG

            List<string[]> entries = GlobalResourceCache.RBLList;
            double rateSum = 0;
            int answered = 0;

            foreach (string[] entry in entries)
            {
                // entry[0] = URL template containing *IP*, entry[1] = "positive" pattern,
                // entry[2] = "negative" pattern (as consumed by GetRblBanRate).
                Uri lookupUri = new Uri(entry[0].Replace("*IP*", proxy.Address.Host));
                Regex positive = new Regex(entry[1]);
                Regex negative = new Regex(entry[2]);

                double rate = GetRblBanRate(lookupUri, positive, negative, proxy);
                if (!(rate > -1))
                {
                    // -1 marks "no usable answer" and is excluded from the mean.
                    continue;
                }

                answered++;
                rateSum += rate;
            }

            // Floating-point division: yields NaN (not an exception) when nothing answered.
            double meanRate = rateSum / answered;

            if (answered > 0)
            {
                proxy.RBLBanRate = meanRate;
            }
            Console.WriteLine("CheckRBL - elapsed {0}s, rate {1}", (DateTime.Now - startedAt).TotalSeconds, meanRate); //DEBUG
        }
Пример #19
0
 /// <summary>
 /// Checks that a Google search URL answers through <paramref name="proxy"/>; on success
 /// the same download object is queued (callback <c>CheckGooglePage</c>), otherwise an
 /// error is logged when <c>_logging</c> is enabled.
 /// </summary>
 /// <param name="proxy">Proxy the request is routed through.</param>
 void DownloadGooglePage(RatedProxy proxy)
 {
     Uri googleUri = new Uri("http://www.google.com/search?q=flowers&sourceid=opera&ie=utf-8&oe=utf-8");
     DownloaderObj obj = new DownloaderObj(googleUri, CheckGooglePage, true, proxy, CookieOptions.Empty, 2);
     if (Downloader.HaveResponce(obj))
     {
         // Attempts is set back to 2 before queuing, as in the original
         // (presumably the probe consumes attempts - confirm).
         obj.Attempts = 2;
         Downloader.Queue(obj);
     }
     else
     {
         if (_logging)
         {
             // Fixed copy-paste from the Yandex check: the message blamed the "ya host"
             // although the failing host here is Google.
             GlobalLog.Err("Cant get responce from http://google.com, perhaps proxy or google host is down, p:" + obj.Proxy.Address.Host);
         }
     }
 }
Пример #20
0
 /// <summary>
 /// Checks that http://kiks.yandex.ru/su/ answers through <paramref name="proxy"/>; on
 /// success the download object is retargeted to http://wordstat.yandex.ru/ and queued
 /// (callback <c>CheckYaPage</c>), otherwise an error is logged when <c>_logging</c> is enabled.
 /// </summary>
 /// <param name="proxy">Proxy the requests are routed through.</param>
 void DownloadYaPage(RatedProxy proxy)
 {
     DownloaderObj request = new DownloaderObj(new Uri("http://kiks.yandex.ru/su/"), CheckYaPage, true, proxy, CookieOptions.Take, 2);

     if (!Downloader.HaveResponce(request))
     {
         if (_logging)
         {
             GlobalLog.Err("Cant get responce from http://kiks.yandex.ru, perhaps proxy or ya host is down, p:" + request.Proxy.Address.Host);
         }
         return;
     }

     // The probe answered: reuse the same object for the real page.
     request.Uri = new Uri("http://wordstat.yandex.ru/");
     request.Attempts = 2;
     Downloader.Queue(request);
 }
Пример #21
0
        /// <summary>
        /// Runs the download-speed and latency checks for every site pattern loaded from
        /// <c>PATH.TagClassPatterns</c> and stores the averages on <paramref name="proxy"/>
        /// (<c>AvgLatency</c>, <c>SitesRate</c>, <c>AvgSpeed</c>). A property is only updated
        /// when at least one corresponding check succeeded. <c>CheckTimes</c> is always incremented.
        /// </summary>
        /// <remarks>
        /// The debug line used to compute <c>totalLatency / latencyCheked</c> unconditionally;
        /// that is an integer division and threw DivideByZeroException whenever no latency
        /// probe succeeded, which also skipped the <c>CheckTimes</c> increment. Averages are now
        /// computed once, only when their counter is non-zero, and reported as "n/a" otherwise.
        /// </remarks>
        /// <param name="proxy">Proxy to test and update.</param>
        void VerifySites(RatedProxy proxy)
        {
            //DEBUG
            Stopwatch elapsed = Stopwatch.StartNew();

            int downloadChecked = 0;
            int latencyChecked = 0;
            double totalSiteRate = 0;
            double totalSpeed = 0;
            long totalLatency = 0;

            List<PatternsContainer> siteChecks = PagePatternGrabber.LoadPatterns(PATH.TagClassPatterns);

            foreach (var siteCheck in siteChecks)
            {
                double siteRate = 0;
                double downloadSpeed = 0;
                if (TryCheckDownloadSpeed(proxy, siteCheck.Uri, siteCheck.Validation, ref siteRate, ref downloadSpeed))
                {
                    totalSiteRate += siteRate;
                    totalSpeed += downloadSpeed;
                    downloadChecked++;
                }

                int? latency = GetAvgLatency(siteCheck.Uri, proxy, 4);
                if (latency.HasValue)
                {
                    latencyChecked++;
                    totalLatency += latency.Value;
                }
            }

            // Values for the debug line; "n/a" stays when the matching check never succeeded.
            object latencyInfo = "n/a";
            object siteRateInfo = "n/a";
            object speedInfo = "n/a";

            if (latencyChecked > 0)
            {
                int avgLatency = (int)(totalLatency / latencyChecked);
                proxy.AvgLatency = avgLatency;
                latencyInfo = avgLatency;
            }
            if (downloadChecked > 0)
            {
                double avgSiteRate = totalSiteRate / downloadChecked;
                double avgSpeed = totalSpeed / downloadChecked;
                proxy.SitesRate = avgSiteRate;
                proxy.AvgSpeed = avgSpeed;
                siteRateInfo = avgSiteRate;
                speedInfo = avgSpeed;
            }
            //DEBUG
            Console.WriteLine("VerifySites - elapsed {0}s, latency {1}, sites rate {2}, speed {3} ", elapsed.Elapsed.TotalSeconds, latencyInfo, siteRateInfo, speedInfo); //DEBUG
            proxy.CheckTimes++;
        }
Пример #22
0
        /// <summary>
        /// Probes <paramref name="uri"/> through <paramref name="proxy"/> up to
        /// <paramref name="attempts"/> times and averages the elapsed time of the probes
        /// for which <c>Downloader.HaveResponce</c> returned true.
        /// </summary>
        /// <returns>
        /// Mean elapsed milliseconds (integer division) over the successful probes,
        /// or null when none succeeded.
        /// </returns>
        int? GetAvgLatency(Uri uri, RatedProxy proxy, int attempts)
        {
            int succeeded = 0;
            int elapsedSum = 0;
            Stopwatch watch = new Stopwatch();

            for (int left = attempts; left > 0; left--)
            {
                DownloaderObj probe = new DownloaderObj(uri, null, false, proxy, CookieOptions.Empty, 1);

                watch.Restart();
                bool answered = Downloader.HaveResponce(probe);
                watch.Stop();

                if (!answered)
                {
                    continue;
                }

                succeeded++;
                elapsedSum += (int)watch.ElapsedMilliseconds;
            }

            return succeeded == 0 ? (int?)null : elapsedSum / succeeded;
        }
Пример #23
0
        /// <summary>
        /// Downloads <paramref name="rblUri"/> synchronously through <paramref name="proxy"/> and
        /// computes the share of <paramref name="negativeRx"/> matches among all matches of both
        /// patterns in the response text.
        /// </summary>
        /// <returns>
        /// A value in [0, 1], or -1 when there is no response text or neither pattern matched.
        /// </returns>
        double GetRblBanRate(Uri rblUri, Regex positiveRx, Regex negativeRx, RatedProxy proxy)
        {
            DownloaderObj request = new DownloaderObj(rblUri, null, true, proxy, CookieOptions.NoCookies, 4, null, null, false, 1000, new TimingParams(TimingPattern.BigWait));
            Downloader.DownloadSync(request);

            if (request.DataStr == null)
            {
                return -1;
            }

            int listedHits = negativeRx.Matches(request.DataStr).Count;
            int cleanHits = positiveRx.Matches(request.DataStr).Count;

            if (listedHits != 0 || cleanHits != 0)
            {
                return (double)listedHits / (cleanHits + listedHits);
            }

            // Neither pattern matched: the page gave no verdict.
            return -1;
        }
Пример #24
0
        /// <summary>
        /// Loads the stored proxies, keeps a single entry per <c>Address.OriginalString</c>
        /// (the one with the highest <c>CheckTimes</c>; the first seen wins a tie) and saves
        /// the de-duplicated list back via <c>SaveProxies</c>.
        /// </summary>
        /// <remarks>
        /// Uses a typed dictionary instead of a non-generic Hashtable, which removes the
        /// unchecked <c>as</c> cast and the repeated key lookups. The order of the saved list
        /// follows dictionary enumeration; it was never a documented order with Hashtable either.
        /// </remarks>
        public static void RemoveDuplicates()
        {
            List<RatedProxy> proxies = LoadProxies();
            Dictionary<string, RatedProxy> bestByAddress = new Dictionary<string, RatedProxy>();
            foreach (RatedProxy proxy in proxies)
            {
                string key = proxy.Address.OriginalString;
                RatedProxy known;

                // Store when the address is new or this entry has been checked more often.
                if (!bestByAddress.TryGetValue(key, out known) || proxy.CheckTimes > known.CheckTimes)
                {
                    bestByAddress[key] = proxy;
                }
            }

            SaveProxies(new List<RatedProxy>(bestByAddress.Values), false);
        }
Пример #25
0
 /// <summary>
 /// Creates a container that stores the given proxy together with its occupation
 /// limit and its number of lives.
 /// </summary>
 /// <param name="proxy">Proxy to wrap (stored in <c>_proxy</c>).</param>
 /// <param name="maxOccupied">Stored in <c>_maxOccups</c>.</param>
 /// <param name="maxLifes">Stored in <c>_lifes</c>.</param>
 public ProxyContainer(RatedProxy proxy, int maxOccupied, int maxLifes)
 {
     _lifes     = maxLifes;
     _maxOccups = maxOccupied;
     _proxy     = proxy;
 }
Пример #26
0
 /// <summary>
 /// Marks one proxy test as finished: atomically decrements <c>_proxiesTesting</c>,
 /// notifies the progress and per-proxy completion handlers when present, and calls
 /// <c>OnTestsComplete</c> once the counter reaches zero.
 /// </summary>
 /// <param name="proxy">Proxy whose test has ended.</param>
 /// <param name="unpingable">Forwarded to the progress handler.</param>
 private void EndTest(RatedProxy proxy, bool unpingable = false)
 {
     int remaining = Interlocked.Decrement(ref _proxiesTesting);

     // The counter is shared across threads (hence Interlocked). Snapshot each delegate
     // before the null check so a concurrent unsubscribe cannot null it between check
     // and invocation.
     var progressHandler = OnProgressChanged;
     if (progressHandler != null)
     {
         progressHandler(remaining, unpingable);
     }

     var completeHandler = OnProxyTestComplete;
     if (completeHandler != null)
     {
         completeHandler(proxy);
     }

     if (remaining == 0)
     {
         // NOTE(review): invoked without a null check as in the original; if this is a
         // delegate/event rather than a method it needs the same guard - confirm.
         OnTestsComplete();
     }
 }
Пример #27
0
 /// <summary>
 /// Creates a container that stores the given proxy together with its occupation
 /// limit and its number of lives.
 /// </summary>
 /// <param name="proxy">Proxy to wrap (stored in <c>_proxy</c>).</param>
 /// <param name="maxOccupied">Stored in <c>_maxOccups</c>.</param>
 /// <param name="maxLifes">Stored in <c>_lifes</c>.</param>
 public ProxyContainer(RatedProxy proxy, int maxOccupied, int maxLifes)
 {
     _lifes = maxLifes;
     _maxOccups = maxOccupied;
     _proxy = proxy;
 }
Пример #28
0
 /// <summary>
 /// Tries up to three times to download <paramref name="uri"/> synchronously through
 /// <paramref name="proxy"/> and to validate the page with <paramref name="validator"/>.
 /// </summary>
 /// <param name="proxy">Proxy the download is routed through.</param>
 /// <param name="uri">Page to download.</param>
 /// <param name="validator">Decides whether the downloaded text is acceptable.</param>
 /// <param name="siteRate">
 /// On success set to 1 - attemptIndex / 3 (1 for a first-try success); unchanged on failure.
 /// </param>
 /// <param name="downloadSpeed">
 /// On success set to UTF-8 byte count / elapsed milliseconds (bytes per ms, roughly KB/s);
 /// unchanged on failure.
 /// </param>
 /// <returns>True as soon as one attempt yields a validated page, otherwise false.</returns>
 private bool TryCheckDownloadSpeed(RatedProxy proxy, Uri uri, IPageValidator validator, ref double siteRate, ref double downloadSpeed)
 {
     const int maxAttempts = 3;
     Stopwatch timer = new Stopwatch();
     for (int attempt = 0; attempt < maxAttempts; attempt++)
     {
         DownloaderObj obj = new DownloaderObj(uri, null, true, proxy, CookieOptions.Empty, 1);
         timer.Restart();
         Downloader.DownloadSync(obj);
         timer.Stop();

         string data = obj.DataStr;
         if (data == null || !validator.Validate(data))
         {
             continue;
         }

         siteRate = (1 - attempt / (double)maxAttempts);

         // Clamp to 1 ms: a 0 ms reading would otherwise produce Infinity/NaN and
         // poison the averages built from this value.
         long elapsedMs = Math.Max(1L, timer.ElapsedMilliseconds);

         // GetByteCount measures the payload without allocating the byte array
         // (the original encoded the text twice and kept an unused local).
         downloadSpeed = Encoding.UTF8.GetByteCount(data) / (double)elapsedMs; //KB-sec
         return true;
     }
     return false;
 }