/// <summary>
/// Loads the replacements HTML and extracts its table rows into a two-dimensional array.
/// </summary>
/// <param name="cfg">
/// Parser configuration; the value returned by its <c>GetRequest()</c> is handed to
/// <c>HTMLLoader.Load</c> together with the module's <c>ReplacementsString</c>.
/// </param>
/// <returns>
/// An array with one row per <c>&lt;tr&gt;…&lt;/tr&gt;</c> pair found in the HTML and six columns
/// holding the text between <c>&lt;td&gt;</c> and <c>&lt;/td&gt;</c>. Cells that are missing from a
/// row are returned as empty strings. When the loader yields no HTML the array has zero rows.
/// </returns>
public static string[,] Parse(ReplParserCfg cfg)
{
    const int ColumnCount = 6;

    var moduleCfg = ReplacementsModuleConfig.Get();
    string html = HTMLLoader.Load(cfg.GetRequest(), moduleCfg.ReplacementsString);
    if (string.IsNullOrEmpty(html))
    {
        return new string[0, ColumnCount];
    }

    List<string> rows = ExtractBetween(html, "<tr>", "</tr>", int.MaxValue);

    string[,] data = new string[rows.Count, ColumnCount];
    for (int i = 0; i < rows.Count; i++)
    {
        List<string> cells = ExtractBetween(rows[i], "<td>", "</td>", ColumnCount);
        for (int j = 0; j < ColumnCount; j++)
        {
            // Rows with fewer than six cells are padded instead of failing on a -1 index.
            data[i, j] = j < cells.Count ? cells[j] : string.Empty;
        }
    }

    return data;
}

/// <summary>
/// Collects, in document order, the text enclosed by successive <paramref name="open"/> /
/// <paramref name="close"/> marker pairs, stopping after <paramref name="limit"/> matches or
/// at the first unmatched marker.
/// </summary>
private static List<string> ExtractBetween(string text, string open, string close, int limit)
{
    List<string> found = new List<string>();
    int cursor = 0;
    while (found.Count < limit)
    {
        int start = text.IndexOf(open, cursor, StringComparison.Ordinal);
        if (start == -1)
        {
            break;
        }

        // Look for the closing marker only after the opening one, and pass Substring a
        // length (finish - contentStart) rather than an absolute index.
        int contentStart = start + open.Length;
        int finish = text.IndexOf(close, contentStart, StringComparison.Ordinal);
        if (finish == -1)
        {
            break;
        }

        found.Add(text.Substring(contentStart, finish - contentStart));
        cursor = finish + close.Length;
    }

    return found;
}
/// <summary>
/// Loads the group list markup and extracts the text of each entry.
/// </summary>
/// <returns>
/// The substrings found between each <c>"&gt;</c> marker and the next <c>&lt;/</c> that follows it,
/// in document order, with the first occurrence of the placeholder entry "Будь-яка" removed.
/// Returns an empty array when the loader yields no markup.
/// </returns>
public static string[] Parse()
{
    const string OpenMarker = "\">";
    const string CloseMarker = "</";

    var moduleCfg = ReplacementsModuleConfig.Get();
    string response = HTMLLoader.Load(moduleCfg.GroupString);

    List<string> groups = new List<string>();
    if (!string.IsNullOrEmpty(response))
    {
        int cursor = 0;
        while (true)
        {
            int start = response.IndexOf(OpenMarker, cursor, System.StringComparison.Ordinal);
            if (start == -1)
            {
                break;
            }

            // Search for the terminator after the opening marker; a "</" that appears earlier
            // in the markup (or none at all) must not produce a negative Substring length.
            int contentStart = start + OpenMarker.Length;
            int finish = response.IndexOf(CloseMarker, contentStart, System.StringComparison.Ordinal);
            if (finish == -1)
            {
                break;
            }

            groups.Add(response.Substring(contentStart, finish - contentStart));
            cursor = finish + CloseMarker.Length;
        }
    }

    // Drop the placeholder entry; List.Remove deletes only its first occurrence.
    groups.Remove("Будь-яка");
    return groups.ToArray();
}
/// <summary>
/// Gathers the ranks reported for every page in <c>engine.searchPages</c>.
/// </summary>
/// <param name="engine">Search engine whose pages are loaded; when null, nothing is loaded.</param>
/// <param name="parameter">Forwarded unchanged to <c>ExtractURLRankOnCurrentPage</c>.</param>
/// <returns>
/// All ranks in the range 1..50 (inclusive) returned by <c>ExtractURLRankOnCurrentPage</c>,
/// in page order; an empty list when <paramref name="engine"/> is null.
/// </returns>
public List<int> ExtractUrlRank(SearchEngine engine, SearchParameter parameter)
{
    var ranks = new List<int>();
    if (engine == null)
    {
        return ranks;
    }

    // Visit each page of the engine in turn.
    foreach (var pageUrl in engine.searchPages)
    {
        var pageHtml = HTMLLoader.LoadUrl(pageUrl);

        // Keep only the ranks of this page that fall inside 1..50.
        foreach (var candidate in ExtractURLRankOnCurrentPage(pageHtml, parameter, engine))
        {
            if (candidate <= 0 || candidate > 50)
            {
                continue;
            }

            ranks.Add(candidate);
        }
    }

    return ranks;
}
/// <summary>
/// Checks that <c>HTMLLoader.LoadUrl</c> returns null for the URL produced by
/// <c>_generator.GenerateInvalidURL()</c>.
/// </summary>
public void InValidHTMLPageLoaderTest()
{
    var invalidUrl = _generator.GenerateInvalidURL();

    var loaded = HTMLLoader.LoadUrl(invalidUrl);

    Assert.IsNull(loaded);
}