/// <summary>
/// Verifies that a character listed only in the Other section of the valid
/// characters XML ('#') is reported as punctuation and not as word-forming.
/// </summary>
public void SymbolPunctuationOnly()
{
    // In the literal below the individual entries are separated by U+FFFC;
    // '#' appears in <Other> and nowhere in <WordForming>.
    string validCharsXml = ksXmlHeader +
        "<ValidCharacters><WordForming>a\uFFFCb\uFFFCc\uFFFCd\uFFFCe</WordForming>" +
        "<Numeric>1\uFFFC2\uFFFC3\uFFFC4\uFFFC5</Numeric>" +
        "<Other>'\uFFFC-\uFFFC#</Other>" +
        "</ValidCharacters>";
    ValidCharacters validSet = ValidCharacters.Load(validCharsXml, "Test WS", null);

    // Character property engine for the English writing system of the test cache.
    ILgCharacterPropertyEngine englishEngine =
        (ILgCharacterPropertyEngine)m_cache.Cache.LanguageWritingSystemFactoryAccessor
            .get_CharPropEngine(InMemoryFdoCache.s_wsHvos.En);

    FwCharacterCategorizer sut = new FwCharacterCategorizer(validSet, englishEngine);

    Assert.IsTrue(sut.IsPunctuation('#'));
    Assert.IsFalse(sut.IsWordFormingCharacter('#'));
}
/// <summary>
/// Verifies that when '.' is listed in the WordForming section of the valid
/// characters XML, the text "abc.de" is returned by WordAndPuncts as a single
/// word rather than being split at the period.
/// </summary>
public void WordAndPuncs_OverridePunc()
{
    // Note the trailing '.' entry in <WordForming>: the period is declared
    // word-forming here. Entries in the literal are separated by U+FFFC.
    ValidCharacters validChars = ValidCharacters.Load(ksXmlHeader +
        "<ValidCharacters><WordForming>a\uFFFCb\uFFFCc\uFFFCd\uFFFCe\uFFFC.</WordForming>" +
        "<Numeric>1\uFFFC2\uFFFC3\uFFFC4\uFFFC5</Numeric>" +
        "<Other>'\uFFFC-\uFFFC#</Other>" +
        "</ValidCharacters>", "Test WS", null);

    // Character property engine for the English writing system of the test cache.
    ILgCharacterPropertyEngine lgCharPropEngineEn = (ILgCharacterPropertyEngine)
        m_cache.Cache.LanguageWritingSystemFactoryAccessor.get_CharPropEngine(
            InMemoryFdoCache.s_wsHvos.En);

    FwCharacterCategorizer categorizer = new FwCharacterCategorizer(validChars, lgCharPropEngineEn);

    List<WordAndPunct> wordsAndPunc = categorizer.WordAndPuncts("abc.de");

    // We expect one word to be returned.
    // (The comment must stay on its own line: a trailing "//" on the same line
    // as the assertions would comment them out along with the closing brace.)
    Assert.AreEqual(1, wordsAndPunc.Count);
    Assert.AreEqual("abc.de", wordsAndPunc[0].Word);
}
/// <summary>
/// Verifies that WordAndPuncts returns an empty list for input consisting
/// only of a space, with the space character declared in the Other section
/// (written as "U+0020" in the XML).
/// </summary>
public void WordAndPuncs_Spaces()
{
    // Entries in the literal are separated by U+FFFC.
    string validCharsXml = ksXmlHeader +
        "<ValidCharacters><WordForming>a\uFFFCb\uFFFCc</WordForming>" +
        "<Numeric>1\uFFFC2\uFFFC3\uFFFC4\uFFFC5</Numeric>" +
        "<Other>-\uFFFCU+0020</Other>" +
        "</ValidCharacters>";
    ValidCharacters validSet = ValidCharacters.Load(validCharsXml, "Test WS", null);

    // Character property engine for the English writing system of the test cache.
    ILgCharacterPropertyEngine englishEngine =
        (ILgCharacterPropertyEngine)m_cache.Cache.LanguageWritingSystemFactoryAccessor
            .get_CharPropEngine(InMemoryFdoCache.s_wsHvos.En);

    FwCharacterCategorizer sut = new FwCharacterCategorizer(validSet, englishEngine);

    List<WordAndPunct> tokens = sut.WordAndPuncts(" ");
    Assert.AreEqual(0, tokens.Count);

    // NOTE(review): this repeats the same single-space input as the call above;
    // presumably it was meant to exercise a run of several spaces - confirm
    // against the upstream test before changing the literal.
    tokens = sut.WordAndPuncts(" ");
    Assert.AreEqual(0, tokens.Count);
}