Exemplo n.º 1
0
 /// <summary>
 /// Checks that supplying a user-words list for the language "eng1" is rejected.
 /// </summary>
 /// <remarks>
 /// The assertion passes only when the delegate throws a <c>Tesseract4OcrException</c>
 /// (or a type derived from it) whose message equals
 /// <c>Tesseract4OcrException.LANGUAGE_IS_NOT_IN_THE_LIST</c> formatted with "eng1".
 /// </remarks>
 public virtual void TestIncorrectLanguageForUserWordsAsList()
 {
     String expectedMessage = MessageFormatUtil.Format(Tesseract4OcrException.LANGUAGE_IS_NOT_IN_THE_LIST, "eng1");

     NUnit.Framework.Assert.That(
         () =>
         {
             Tesseract4OcrEngineProperties engineProperties = tesseractReader.GetTesseract4OcrEngineProperties();

             engineProperties.SetUserWords("eng1", JavaUtil.ArraysAsList("word1", "word2"));
             // NOTE(review): presumably never reached because the call above throws - confirm.
             engineProperties.SetLanguages(new List<String>());
         },
         NUnit.Framework.Throws.InstanceOf<Tesseract4OcrException>().With.Message.EqualTo(expectedMessage));
 }
Exemplo n.º 2
0
 /// <summary>
 /// Checks that supplying a user-words stream for the language "spa" is rejected.
 /// </summary>
 /// <remarks>
 /// The assertion passes only when the delegate throws a <c>Tesseract4OcrException</c>
 /// (or a type derived from it) whose message equals
 /// <c>Tesseract4OcrException.LANGUAGE_IS_NOT_IN_THE_LIST</c> formatted with "spa".
 /// The user-words file is read from <c>TEST_DOCUMENTS_DIRECTORY + "userwords.txt"</c>.
 /// </remarks>
 public virtual void TestUserWordsWithLanguageNotInList()
 {
     NUnit.Framework.Assert.That(() => {
         String userWords = TEST_DOCUMENTS_DIRECTORY + "userwords.txt";
         Tesseract4OcrEngineProperties properties = tesseractReader.GetTesseract4OcrEngineProperties();
         // The call under test is expected to throw, so the stream must be released by a
         // using block; otherwise the file handle leaks on every run of this test.
         using (FileStream userWordsStream = new FileStream(userWords, FileMode.Open, FileAccess.Read))
         {
             properties.SetUserWords("spa", userWordsStream);
             properties.SetLanguages(new List <String>());
         }
     }
                                 , NUnit.Framework.Throws.InstanceOf <Tesseract4OcrException>().With.Message.EqualTo(MessageFormatUtil.Format(Tesseract4OcrException.LANGUAGE_IS_NOT_IN_THE_LIST, "spa")))
     ;
 }
Exemplo n.º 3
0
        /// <summary>
        /// Checks that a user-words stream for the language "eng" is accepted and that
        /// recognition of <c>numbers_01.jpg</c> yields text starting with "619121".
        /// </summary>
        /// <remarks>
        /// After the user words are set, the language list is replaced with an empty list
        /// and the properties are applied to <c>tesseractReader</c> before recognition runs.
        /// </remarks>
        public virtual void TestUserWordsWithDefaultLanguageNotInList()
        {
            String userWords = TEST_DOCUMENTS_DIRECTORY + "userwords.txt";
            Tesseract4OcrEngineProperties properties = tesseractReader.GetTesseract4OcrEngineProperties();
            String imgPath        = TEST_IMAGES_DIRECTORY + "numbers_01.jpg";
            String expectedOutput = "619121";
            String result;

            // Dispose the stream deterministically instead of leaking the file handle.
            // It is kept open until recognition has finished because this block does not
            // show whether SetUserWords consumes the stream eagerly.
            using (FileStream userWordsStream = new FileStream(userWords, FileMode.Open, FileAccess.Read))
            {
                properties.SetUserWords("eng", userWordsStream);
                properties.SetLanguages(new List <String>());
                tesseractReader.SetTesseract4OcrEngineProperties(properties);
                result = GetRecognizedTextFromTextFile(tesseractReader, imgPath);
            }

            NUnit.Framework.Assert.IsTrue(result.StartsWith(expectedOutput));
        }
Exemplo n.º 4
0
        /// <summary>
        /// Checks recognition of <c>wierdwords.png</c> with custom user words registered for "fra".
        /// </summary>
        /// <remarks>
        /// Passes when the recognized text contains at least one of the two custom words and
        /// the user-words file path reported by the engine properties ends with ".user-words".
        /// </remarks>
        public virtual void TestCustomUserWords()
        {
            String imagePath = TEST_IMAGES_DIRECTORY + "wierdwords.png";
            IList<String> customWords = JavaUtil.ArraysAsList("he23llo", "qwetyrtyqpwe-rty");

            Tesseract4OcrEngineProperties engineProperties = tesseractReader.GetTesseract4OcrEngineProperties();
            engineProperties.SetLanguages(JavaUtil.ArraysAsList("fra"));
            engineProperties.SetUserWords("fra", customWords);
            tesseractReader.SetTesseract4OcrEngineProperties(engineProperties);

            String recognized = GetRecognizedTextFromTextFile(tesseractReader, imagePath);

            // Either custom word appearing in the output is sufficient.
            bool containsCustomWord = recognized.Contains(customWords[0]) || recognized.Contains(customWords[1]);
            NUnit.Framework.Assert.IsTrue(containsCustomWord);

            String userWordsFilePath = tesseractReader.GetTesseract4OcrEngineProperties().GetPathToUserWordsFile();
            NUnit.Framework.Assert.IsTrue(userWordsFilePath.EndsWith(".user-words"));
        }
Exemplo n.º 5
0
        /// <summary>
        /// Checks recognition of <c>bogusText.jpg</c> with languages "fra" and "eng" and a
        /// custom user word registered for "eng".
        /// </summary>
        /// <remarks>
        /// Passes when the cleaned-up recognized text starts with "B1adeb1ab1a" and the
        /// user-words file path reported by the engine properties ends with ".user-words".
        /// </remarks>
        public virtual void TestCustomUserWordsWithListOfLanguages()
        {
            String imagePath = TEST_IMAGES_DIRECTORY + "bogusText.jpg";
            String expectedPrefix = "B1adeb1ab1a";

            Tesseract4OcrEngineProperties engineProperties = tesseractReader.GetTesseract4OcrEngineProperties();
            engineProperties.SetLanguages(JavaUtil.ArraysAsList("fra", "eng"));
            engineProperties.SetUserWords("eng", JavaUtil.ArraysAsList("b1adeb1ab1a"));
            tesseractReader.SetTesseract4OcrEngineProperties(engineProperties);

            String recognized = GetRecognizedTextFromTextFile(tesseractReader, imagePath);

            // Drop line feeds and form feeds first, then apply the negated character-class
            // pattern (tab, LF, CR and U+0020..U+007E are the characters it lists as kept).
            String withoutLineFeeds = recognized.Replace("\n", "");
            String withoutFormFeeds = withoutLineFeeds.Replace("\f", "");
            String cleaned = iText.IO.Util.StringUtil.ReplaceAll(withoutFormFeeds, "[^\\u0009\\u000A\\u000D\\u0020-\\u007E]", "");

            NUnit.Framework.Assert.IsTrue(cleaned.StartsWith(expectedPrefix));

            String userWordsFilePath = tesseractReader.GetTesseract4OcrEngineProperties().GetPathToUserWordsFile();
            NUnit.Framework.Assert.IsTrue(userWordsFilePath.EndsWith(".user-words"));
        }