/// <summary>
/// Sample entry point. Performs platform-specific start-up, then runs every sample
/// spider in sequence, waiting for console input between the interactive samples.
/// </summary>
/// <param name="args">Command-line arguments; not read by this method.</param>
public static void Main(string[] args)
{
    // The version-less NETCOREAPP symbol is accepted in addition to NETCOREAPP2_0 so that
    // any .NET Core target takes this branch, not only netcoreapp2.0.
#if NETCOREAPP2_0 || NETCOREAPP
    // Register the code-pages encoding provider.
    Encoding.RegisterProvider(CodePagesEncodingProvider.Instance);
#else
    // Raise the thread-pool minimums (worker threads, completion-port threads).
    ThreadPool.SetMinThreads(200, 200);
    OcrDemo.Process();
#endif

    MyTest();

    // Spiders launched through Startup with command-line style arguments.
    Startup.Run(new string[] { "-s:BaiduSearch", "-tid:BaiduSearch", "-i:guid", "-a:" });
    Startup.Run(new string[] { "-s:CustomSpider1", "-tid:CustomSpider1", "-i:CustomSpider1" });
    Startup.Run(new string[] { "-s:DefaultMySqlPipeline", "-tid:DefaultMySqlPipeline", "-i:guid", "-a:" });

    //ConfigurableSpider.Run();

    // Fully customized page processor and data pipeline.
    BaseUsage.CustmizeProcessorAndPipeline();
    WaitForKeyPress();

    // Crawl the specified pages without traversing links.
    BaseUsage.CrawlerPagesWithoutTraverse();
    WaitForKeyPress();

    // Traverse the whole site.
    BaseUsage.CrawlerPagesTraversal();
    WaitForKeyPress();

    DDengEntitySpider dDengEntitySpider = new DDengEntitySpider();
    dDengEntitySpider.Run();
    WaitForKeyPress();

    Cnblogs.Run();
    WaitForKeyPress();

    CasSpider casSpider = new CasSpider();
    casSpider.Run();
    WaitForKeyPress();

    BaiduSearchSpider baiduSearchSpider = new BaiduSearchSpider();
    baiduSearchSpider.Run();
    WaitForKeyPress();

    JdSkuSampleSpider jdSkuSampleSpider = new JdSkuSampleSpider();
    jdSkuSampleSpider.Run();
    WaitForKeyPress();

    Situoli.Run();
}

/// <summary>
/// Prints the "Press any key to continue..." prompt and then reads one character
/// from standard input before returning.
/// </summary>
private static void WaitForKeyPress()
{
    Console.WriteLine("Press any key to continue...");
    Console.Read();
}
/// <summary>
/// Sample entry point: performs platform-specific start-up and then runs
/// <c>DataHandlerSpider</c>.
/// </summary>
/// <param name="args">Command-line arguments; not read by this method.</param>
public static void Main(string[] args)
{
#if NETCOREAPP
    // .NET Core builds: register the code-pages encoding provider.
    Encoding.RegisterProvider(CodePagesEncodingProvider.Instance);
#else
    // Other builds: raise the thread-pool minimums (worker threads, completion-port
    // threads), then run the OCR demo.
    ThreadPool.SetMinThreads(200, 200);
    OcrDemo.Process();
#endif

    DataHandlerSpider.Run();
}
/// <summary>
/// Sample entry point: performs platform-specific start-up, runs
/// <c>AutoIncrementTargetUrlsExtractor</c>, and finally calls <c>MyTest</c>.
/// </summary>
/// <param name="args">Command-line arguments; not read by this method.</param>
public static void Main(string[] args)
{
#if NETCOREAPP
    // .NET Core builds: register the code-pages encoding provider.
    Encoding.RegisterProvider(CodePagesEncodingProvider.Instance);
#else
    // Other builds: raise the thread-pool minimums (worker threads, completion-port
    // threads), then run the OCR demo.
    ThreadPool.SetMinThreads(200, 200);
    OcrDemo.Process();
#endif

    AutoIncrementTargetUrlsExtractor.Run();
    MyTest();
}
/// <summary>
/// Sample entry point. Performs platform-specific start-up and then runs
/// <c>ZhiPinSpider</c>; the other samples are kept below as commented-out code so
/// they can be re-enabled by hand.
/// </summary>
/// <param name="args">Command-line arguments; not read by this method.</param>
public static void Main(string[] args)
{
    // The version-less NETCOREAPP symbol is accepted in addition to NETCOREAPP2_0 so that
    // any .NET Core target takes this branch, not only netcoreapp2.0.
#if NETCOREAPP2_0 || NETCOREAPP
    // Original note (translated): once the CodePages provider is registered, the encoding is UTF-8.
    Encoding.RegisterProvider(CodePagesEncodingProvider.Instance);
#else
    // Raise the thread-pool minimums (worker threads, completion-port threads).
    ThreadPool.SetMinThreads(200, 200);
    OcrDemo.Process();
#endif

    //MyTest();

    //Startup.Run("-s:BaiduSearchSpider", "-tid:1", "-i:guid");
    //Startup.Run("-s:DotnetSpider.Sample.CustomSpider1", "-tid:CustomSpider1", "-i:CustomSpider1");
    //Startup.Run("-s:DotnetSpider.Sample.DefaultMySqlPipelineSpider", "-tid:DefaultMySqlPipeline", "-i:guid", "-a:");

    ////ConfigurableSpider.Run();

    // Fully customized page processor and data pipeline.
    //BaseUsage.CustmizeProcessorAndPipeline();
    //Console.WriteLine("Press any key to continue...");
    //Console.Read();

    //// Crawl the specified pages without traversing links.
    //BaseUsage.CrawlerPagesWithoutTraverse();
    //Console.WriteLine("Press any key to continue...");
    //Console.Read();

    // Traverse the whole site.
    //BaseUsage.CrawlerPagesTraversal();
    //Console.WriteLine("Press any key to continue...");
    //Console.Read();

    //DDengEntitySpider dDengEntitySpider = new DDengEntitySpider();
    //dDengEntitySpider.Run();
    //Console.WriteLine("Press any key to continue...");
    //Console.Read();

    //Cnblogs.Run();
    //Console.WriteLine("Press any key to continue...");
    //Console.Read();

    ////CasSpider casSpider = new CasSpider();
    ////casSpider.Run();
    ////Console.WriteLine("Press any key to continue...");
    ////Console.Read();

    //BaiduSearchSpider baiduSearchSpider = new BaiduSearchSpider();
    //baiduSearchSpider.Run();
    //Console.WriteLine("Press any key to continue...");
    //Console.Read();

    //JdSkuSampleSpider jdSkuSampleSpider = new JdSkuSampleSpider();
    //jdSkuSampleSpider.Run();
    //Console.WriteLine("Press any key to continue...");
    //Console.Read();

    //LyProductSpider lyProductSpider = new LyProductSpider();
    //lyProductSpider.Run();
    //Console.WriteLine("Press any key to continue...");
    //Console.Read();

    // The sample currently enabled.
    ZhiPinSpider spider = new ZhiPinSpider();
    spider.Run();

    // Keep the console open until a character is read from standard input.
    Console.WriteLine("Press any key to continue...");
    Console.Read();

    //Situoli.Run();
}