Beispiel #1
0
        // Quick-start example: tokenizes a short Latvian text with LatvianTokenizer,
        // groups the resulting tokens into sentences via BreakSentences, and verifies
        // both the number of sentences and the number of items in each one.
        public void QuickStart_BreakSentences()
        {
            // Roughly: "Hello, world! I am doing well. Today's date is 2014-01-01".
            // The last sentence deliberately has no terminating punctuation.
            string text = "Sveika, pasaule! Man iet labi. Šodienas datums ir 2014-01-01";

            LatvianTokenizer tokenizer = new LatvianTokenizer();

            // Materialize both sequences once so they can be indexed below.
            Token[] tokens = tokenizer.Tokenize(text).ToArray();
            Sentence[] sentences = tokenizer.BreakSentences(tokens).ToArray();

            // sentences is an array, so use Length rather than the LINQ Count() extension.
            Assert.AreEqual(3, sentences.Length);

            // Each sentence is expected to hold 4 items (presumably tokens, with punctuation
            // counted separately and the date kept as one item - confirm against Sentence).
            Assert.AreEqual(4, sentences[0].Count());
            Assert.AreEqual(4, sentences[1].Count());
            Assert.AreEqual(4, sentences[2].Count());
        }