/// <summary>
/// Runs the full parse pipeline over a list of text parts: tokenizes them with
/// <c>options.Tokenizer</c>, then applies the prepare steps, the filters in
/// <c>options.Filters</c>, the analyzers, and finally the filters in
/// <c>options.AfterAnalyzeFilters</c>.
/// </summary>
/// <param name="texts">The text parts handed to the tokenizer.</param>
/// <param name="options">Supplies the tokenizer, prepare steps, filters and analyzers.</param>
/// <returns>A <see cref="TextParseResult"/> constructed from the processed token parts.</returns>
public static TextParseResult Parse(List<TextPartInfo> texts, TextParseOptions options)
{
    // The same token list instance is handed to every stage, in this fixed order.
    var tokens = options.Tokenizer.GetTokens(texts);

    PrepareTokens(options, tokens);
    FilterTokens(options.Filters, tokens);

    AnalyzeTokens(options, tokens);
    FilterTokens(options.AfterAnalyzeFilters, tokens);

    return new TextParseResult(tokens);
}
/// <summary>
/// Convenience overload for a single string: wraps <paramref name="text"/> in one
/// <see cref="TextPartInfo"/> with <c>PartNumber</c> set to 1 and delegates to the
/// list-based <c>Parse</c> overload.
/// </summary>
/// <param name="text">The text to parse; stored as the <c>Text</c> of the single part.</param>
/// <param name="options">Parse options forwarded unchanged to the list-based overload.</param>
/// <returns>The result of the list-based <c>Parse</c> overload for the one-element list.</returns>
public static TextParseResult Parse(string text, TextParseOptions options)
{
    var singlePart = new List<TextPartInfo>
    {
        new TextPartInfo
        {
            Text = text,
            PartNumber = 1
        }
    };

    return Parse(singlePart, options);
}
/// <summary>
/// Applies every entry of <c>options.Prepares</c> to the token parts, in order,
/// by passing each entry to <c>PreparePagesTokens</c>.
/// </summary>
/// <param name="options">Options whose <c>Prepares</c> collection is iterated.</param>
/// <param name="tokenParts">The token parts handed to each prepare step.</param>
private static void PrepareTokens(TextParseOptions options, List<TextTokenPartInfo> tokenParts)
{
    foreach (var prepare in options.Prepares)
    {
        PreparePagesTokens(prepare, tokenParts);
    }
}
/// <summary>
/// Applies every entry of <c>options.Analyzers</c> to the token parts, in order,
/// by passing each entry to <c>AnalyzePartsTokens</c>.
/// </summary>
/// <param name="options">Options whose <c>Analyzers</c> collection is iterated.</param>
/// <param name="tokenParts">The token parts handed to each analyzer.</param>
private static void AnalyzeTokens(TextParseOptions options, List<TextTokenPartInfo> tokenParts)
{
    foreach (var analyzer in options.Analyzers)
    {
        AnalyzePartsTokens(analyzer, tokenParts);
    }
}