Esempio n. 1
0
        /// <summary>
        /// Collects every word on an OCR page whose lower-cased text is present in
        /// <paramref name="EnglishWords"/> and absent from <paramref name="BannedWords"/>.
        /// </summary>
        /// <param name="MyPage">Page whose paragraphs, lines and words are scanned in order.</param>
        /// <param name="BannedWords">Words to reject; looked up with the lower-cased word text.</param>
        /// <param name="EnglishWords">Words to accept; looked up with the lower-cased word text.</param>
        /// <returns>The accepted words, in the order they are encountered on the page.</returns>
        /// <remarks>
        /// Lookups rely on each set's own comparer; this method only lower-cases the OCR text.
        /// NOTE(review): presumably both sets hold lower-case entries - confirm against the caller.
        /// </remarks>
        public static List <OcrResult.OcrWord> CompareWordsToListPerPage(OcrResult.OcrPage MyPage, HashSet <String> BannedWords, HashSet <String> EnglishWords)
        {
            List <OcrResult.OcrWord> MyWords = new List <OcrResult.OcrWord>();

            foreach (var paragraph in MyPage.Paragraphs)
            {
                foreach (var line in paragraph.Lines)
                {
                    foreach (var word in line.Words)
                    {
                        // Lower-case once, culture-invariantly, so the result does not depend on the
                        // current thread culture (e.g. Turkish dotless-i casing) and no extra string
                        // is allocated for the second lookup.
                        string normalized = word.Text.ToLowerInvariant();

                        if (BannedWords.Contains(normalized))
                        {
                            continue;
                        }

                        if (EnglishWords.Contains(normalized))
                        {
                            MyWords.Add(word);
                        }
                    }
                }
            }

            return MyWords;
        }
Esempio n. 2
0
        /// <summary>
        /// Extracts name pairs from the page's text lines, starting at index <paramref name="lineNo"/>.
        /// </summary>
        /// <param name="page">Page whose <c>LinesOfText</c> are scanned.</param>
        /// <param name="lineNo">Zero-based index of the first line to examine.</param>
        /// <returns>
        /// A list holding the second name of every successfully parsed line, followed by
        /// the first name of every successfully parsed line.
        /// </returns>
        private static List <string> ParseNameList(OcrResult.OcrPage page, int lineNo)
        {
            var textLines = page.LinesOfText;
            int total     = textLines.Length;

            List <string> redTeam  = new List <string>();
            List <string> blueTeam = new List <string>();

            int index = lineNo;
            while (index < total)
            {
                string first, second;
                bool   parsed = GetNamesFromLine(textLines[index], out first, out second);
                index++;

                // Lines that do not yield a name pair contribute nothing.
                if (!parsed)
                {
                    continue;
                }

                // The second name on a line goes to the red list, the first to the blue list.
                redTeam.Add(second);
                blueTeam.Add(first);
            }

            // Red names come first in the result, then blue names.
            List <string> combined = new List <string>();
            combined.AddRange(redTeam);
            combined.AddRange(blueTeam);
            return combined;
        }