/// <summary>
/// Loads a valid-characters set in which '#' appears only in the Other element, then
/// asserts that the categorizer reports '#' as punctuation and not as word-forming.
/// </summary>
public void SymbolPunctuationOnly()
{
    // Build the valid-characters XML up front so the Load call stays readable.
    string validCharsXml = ksXmlHeader +
        "<ValidCharacters><WordForming>a\uFFFCb\uFFFCc\uFFFCd\uFFFCe</WordForming>" +
        "<Numeric>1\uFFFC2\uFFFC3\uFFFC4\uFFFC5</Numeric>" +
        "<Other>'\uFFFC-\uFFFC#</Other>" +
        "</ValidCharacters>";
    var charInventory = ValidCharacters.Load(validCharsXml, "Test WS", null, null,
        FwDirectoryFinder.LegacyWordformingCharOverridesFile);

    ILgCharacterPropertyEngine englishCharProps =
        Cache.WritingSystemFactory.get_CharPropEngine(m_wsEn);
    var sut = new FwCharacterCategorizer(charInventory, englishCharProps);

    Assert.IsTrue(sut.IsPunctuation('#'));
    Assert.IsFalse(sut.IsWordFormingCharacter('#'));
}
/// <summary>
/// Loads a valid-characters set in which '#' appears only in the Other element, then
/// asserts that the categorizer reports '#' as punctuation and not as word-forming.
/// </summary>
public void SymbolPunctuationOnly()
{
    // Build the valid-characters XML up front so the Load call stays readable.
    string validCharsXml = ksXmlHeader +
        "<ValidCharacters><WordForming>a\uFFFCb\uFFFCc\uFFFCd\uFFFCe</WordForming>" +
        "<Numeric>1\uFFFC2\uFFFC3\uFFFC4\uFFFC5</Numeric>" +
        "<Other>'\uFFFC-\uFFFC#</Other>" +
        "</ValidCharacters>";
    var charInventory = ValidCharacters.Load(validCharsXml, "Test WS", null, null,
        FwDirectoryFinder.LegacyWordformingCharOverridesFile);

    ILgCharacterPropertyEngine englishCharProps =
        Cache.WritingSystemFactory.get_CharPropEngine(m_wsEn);
    var sut = new FwCharacterCategorizer(charInventory, englishCharProps);

    Assert.IsTrue(sut.IsPunctuation('#'));
    Assert.IsFalse(sut.IsWordFormingCharacter('#'));
}
/// <summary>
/// Loads a valid-characters set in which '#' appears only in the Other element, then
/// asserts that the categorizer reports '#' as punctuation and not as word-forming.
/// This variant obtains the English character property engine from the in-memory cache.
/// </summary>
public void SymbolPunctuationOnly()
{
    // Build the valid-characters XML up front so the Load call stays readable.
    string validCharsXml = ksXmlHeader +
        "<ValidCharacters><WordForming>a\uFFFCb\uFFFCc\uFFFCd\uFFFCe</WordForming>" +
        "<Numeric>1\uFFFC2\uFFFC3\uFFFC4\uFFFC5</Numeric>" +
        "<Other>'\uFFFC-\uFFFC#</Other>" +
        "</ValidCharacters>";
    ValidCharacters charInventory = ValidCharacters.Load(validCharsXml, "Test WS", null);

    ILgCharacterPropertyEngine englishCharProps = (ILgCharacterPropertyEngine)
        m_cache.Cache.LanguageWritingSystemFactoryAccessor.get_CharPropEngine(
            InMemoryFdoCache.s_wsHvos.En);
    FwCharacterCategorizer sut = new FwCharacterCategorizer(charInventory, englishCharProps);

    Assert.IsTrue(sut.IsPunctuation('#'));
    Assert.IsFalse(sut.IsWordFormingCharacter('#'));
}
/// <summary>
/// Loads a valid-characters set whose WordForming element includes '.', then asserts
/// that splitting "abc.de" yields a single word, "abc.de".
/// </summary>
public void WordAndPuncs_OverridePunc()
{
    // '.' is deliberately listed among the word-forming characters here.
    string validCharsXml = ksXmlHeader +
        "<ValidCharacters><WordForming>a\uFFFCb\uFFFCc\uFFFCd\uFFFCe\uFFFC.</WordForming>" +
        "<Numeric>1\uFFFC2\uFFFC3\uFFFC4\uFFFC5</Numeric>" +
        "<Other>'\uFFFC-\uFFFC#</Other>" +
        "</ValidCharacters>";
    var validChars = ValidCharacters.Load(validCharsXml, "Test WS", null, null,
        FwDirectoryFinder.LegacyWordformingCharOverridesFile);

    ILgCharacterPropertyEngine lgCharPropEngineEn =
        Cache.WritingSystemFactory.get_CharPropEngine(m_wsEn);
    FwCharacterCategorizer categorizer = new FwCharacterCategorizer(validChars, lgCharPropEngineEn);

    List<WordAndPunct> wordsAndPunc = categorizer.WordAndPuncts("abc.de");

    // We expect one word to be returned.
    // (The comment is kept on its own line so it cannot swallow the assertions below.)
    Assert.AreEqual(1, wordsAndPunc.Count);
    Assert.AreEqual("abc.de", wordsAndPunc[0].Word);
}
/// <summary>
/// Asserts that splitting an empty string into words and punctuation yields an
/// empty list.
/// </summary>
public void WordAndPuncs_EmptyString()
{
    string validCharsXml = ksXmlHeader +
        "<ValidCharacters><WordForming>a\uFFFCb\uFFFCc</WordForming>" +
        "<Numeric>1\uFFFC2\uFFFC3\uFFFC4\uFFFC5</Numeric>" +
        "<Other>-\uFFFCU+0020</Other>" +
        "</ValidCharacters>";
    var validChars = ValidCharacters.Load(validCharsXml, "Test WS", null, null,
        FwDirectoryFinder.LegacyWordformingCharOverridesFile);

    // Look up the English writing system by its "en" identifier to get its handle.
    var english = Cache.ServiceLocator.WritingSystemManager.Get("en");
    var lgCharPropEngineEn = Cache.WritingSystemFactory.get_CharPropEngine(english.Handle);
    FwCharacterCategorizer categorizer = new FwCharacterCategorizer(validChars, lgCharPropEngineEn);

    List<WordAndPunct> wordsAndPunc = categorizer.WordAndPuncts("");

    // We expect no words to be returned for empty input.
    Assert.AreEqual(0, wordsAndPunc.Count);
}
/// <summary>
/// Loads a valid-characters set whose WordForming element includes '.', then asserts
/// that splitting "abc.de" yields a single word, "abc.de".
/// </summary>
public void WordAndPuncs_OverridePunc()
{
    // '.' is deliberately listed among the word-forming characters here.
    string validCharsXml = ksXmlHeader +
        "<ValidCharacters><WordForming>a\uFFFCb\uFFFCc\uFFFCd\uFFFCe\uFFFC.</WordForming>" +
        "<Numeric>1\uFFFC2\uFFFC3\uFFFC4\uFFFC5</Numeric>" +
        "<Other>'\uFFFC-\uFFFC#</Other>" +
        "</ValidCharacters>";
    var validChars = ValidCharacters.Load(validCharsXml, "Test WS", null, null,
        FwDirectoryFinder.LegacyWordformingCharOverridesFile);

    ILgCharacterPropertyEngine lgCharPropEngineEn =
        Cache.WritingSystemFactory.get_CharPropEngine(m_wsEn);
    FwCharacterCategorizer categorizer = new FwCharacterCategorizer(validChars, lgCharPropEngineEn);

    List<WordAndPunct> wordsAndPunc = categorizer.WordAndPuncts("abc.de");

    // We expect one word to be returned.
    // (The comment is kept on its own line so it cannot swallow the assertions below.)
    Assert.AreEqual(1, wordsAndPunc.Count);
    Assert.AreEqual("abc.de", wordsAndPunc[0].Word);
}
/// <summary>
/// Asserts that splitting an empty string into words and punctuation yields an
/// empty list. This variant obtains the English character property engine from the
/// in-memory cache.
/// </summary>
public void WordAndPuncs_EmptyString()
{
    string validCharsXml = ksXmlHeader +
        "<ValidCharacters><WordForming>a\uFFFCb\uFFFCc</WordForming>" +
        "<Numeric>1\uFFFC2\uFFFC3\uFFFC4\uFFFC5</Numeric>" +
        "<Other>-\uFFFCU+0020</Other>" +
        "</ValidCharacters>";
    ValidCharacters validChars = ValidCharacters.Load(validCharsXml, "Test WS", null);

    ILgCharacterPropertyEngine lgCharPropEngineEn = (ILgCharacterPropertyEngine)
        m_cache.Cache.LanguageWritingSystemFactoryAccessor.get_CharPropEngine(
            InMemoryFdoCache.s_wsHvos.En);
    FwCharacterCategorizer categorizer = new FwCharacterCategorizer(validChars, lgCharPropEngineEn);

    List<WordAndPunct> wordsAndPunc = categorizer.WordAndPuncts("");

    // We expect no words to be returned for empty input.
    Assert.AreEqual(0, wordsAndPunc.Count);
}
/// <summary>
/// Asserts that splitting a string consisting of a space yields no words. The space
/// is listed in the Other element of the valid-characters XML as U+0020.
/// </summary>
public void WordAndPuncs_Spaces()
{
    string validCharsXml = ksXmlHeader +
        "<ValidCharacters><WordForming>a\uFFFCb\uFFFCc</WordForming>" +
        "<Numeric>1\uFFFC2\uFFFC3\uFFFC4\uFFFC5</Numeric>" +
        "<Other>-\uFFFCU+0020</Other>" +
        "</ValidCharacters>";
    var charInventory = ValidCharacters.Load(validCharsXml, "Test WS", null, null);

    // Look up the English writing system by its "en" identifier to get its handle.
    var enWs = Cache.ServiceLocator.WritingSystemManager.Get("en");
    var englishCharProps = Cache.WritingSystemFactory.get_CharPropEngine(enWs.Handle);
    var sut = new FwCharacterCategorizer(charInventory, englishCharProps);

    List<WordAndPunct> tokens = sut.WordAndPuncts(" ");
    Assert.AreEqual(0, tokens.Count);

    // NOTE(review): this second call passes the same single-space string as the first;
    // confirm whether it was meant to exercise a longer run of spaces.
    tokens = sut.WordAndPuncts(" ");
    Assert.AreEqual(0, tokens.Count);
}
/// <summary>
/// Loads a valid-characters set whose WordForming element does not include '.', then
/// asserts that splitting "abc.de" yields two words, "abc" and "de".
/// </summary>
public void WordAndPuncs_NoOverridePunc()
{
    string validCharsXml = ksXmlHeader +
        "<ValidCharacters><WordForming>a\uFFFCb\uFFFCc\uFFFCd\uFFFCe</WordForming>" +
        "<Numeric>1\uFFFC2\uFFFC3\uFFFC4\uFFFC5</Numeric>" +
        "<Other>'\uFFFC-\uFFFC#</Other>" +
        "</ValidCharacters>";
    ValidCharacters validChars = ValidCharacters.Load(validCharsXml, "Test WS", null);

    ILgCharacterPropertyEngine lgCharPropEngineEn = (ILgCharacterPropertyEngine)
        m_cache.Cache.LanguageWritingSystemFactoryAccessor.get_CharPropEngine(
            InMemoryFdoCache.s_wsHvos.En);
    FwCharacterCategorizer categorizer = new FwCharacterCategorizer(validChars, lgCharPropEngineEn);

    List<WordAndPunct> wordsAndPunc = categorizer.WordAndPuncts("abc.de");

    // We expect two words to be returned.
    // (The comment is kept on its own line so it cannot swallow the assertions below.)
    Assert.AreEqual(2, wordsAndPunc.Count);
    Assert.AreEqual("abc", wordsAndPunc[0].Word);
    Assert.AreEqual("de", wordsAndPunc[1].Word);
}
/// <summary>
/// Asserts that splitting an empty string into words and punctuation yields an
/// empty list.
/// </summary>
public void WordAndPuncs_EmptyString()
{
    string validCharsXml = ksXmlHeader +
        "<ValidCharacters><WordForming>a\uFFFCb\uFFFCc</WordForming>" +
        "<Numeric>1\uFFFC2\uFFFC3\uFFFC4\uFFFC5</Numeric>" +
        "<Other>-\uFFFCU+0020</Other>" +
        "</ValidCharacters>";
    var validChars = ValidCharacters.Load(validCharsXml, "Test WS", null, null,
        FwDirectoryFinder.LegacyWordformingCharOverridesFile);

    // Look up the English writing system by its "en" identifier to get its handle.
    var english = Cache.ServiceLocator.WritingSystemManager.Get("en");
    var lgCharPropEngineEn = Cache.WritingSystemFactory.get_CharPropEngine(english.Handle);
    FwCharacterCategorizer categorizer = new FwCharacterCategorizer(validChars, lgCharPropEngineEn);

    List<WordAndPunct> wordsAndPunc = categorizer.WordAndPuncts("");

    // We expect no words to be returned for empty input.
    Assert.AreEqual(0, wordsAndPunc.Count);
}