예제 #1
0
 /// <summary>
 /// Runs a single token through the NLP processing steps in a fixed order:
 /// punctuation marking, stemming, stopword marking, then irregular marking.
 /// </summary>
 /// <remarks>
 /// No return values are used here, so each step presumably records its
 /// result on the token itself (TODO confirm against the helper classes).
 /// </remarks>
 /// <param name="tk">The token passed to every processing step.</param>
 private void ProcessToken(Token tk)
 {
     PunctuationMarker.Mark(tk);
     Stemmer.Stem(tk); // convert to root form
     // NOTE(review): stopword marking runs after stemming, so it presumably
     // compares against the stemmed form of the token; keep this order.
     StopwordMarker.Mark(tk);
     IrregularMarker.Mark(tk);
 }
예제 #2
0
        /// <summary>
        /// Loads the stopword list from the text file at <c>FilePath.StopWords</c>
        /// inside the application's installed package location.
        /// </summary>
        /// <remarks>
        /// Each line of the file is trimmed and passed through
        /// <c>Stemmer.Stem</c> before being stored. Blank or whitespace-only
        /// lines are skipped so that no empty entry ends up in the list.
        /// The result is also cached in the static <c>stopwords</c> field.
        /// </remarks>
        /// <returns>
        /// A task whose result is the array of stemmed stopwords, in file order.
        /// </returns>
        internal static async Task <string[]> Load()
        {
            StorageFolder folder = Windows.ApplicationModel.Package.Current.InstalledLocation;
            StorageFile   file   = await folder.GetFileAsync(FilePath.StopWords);

            var lines = await FileIO.ReadLinesAsync(file);

            // Pre-size the list: there is at most one stopword per line.
            List <string> stopwordlist = new List <string>(lines.Count);

            foreach (string line in lines)
            {
                string word = line.Trim();

                // A blank line is not a word; stemming it would add an
                // empty-string entry to the stopword list.
                if (word.Length == 0)
                {
                    continue;
                }

                stopwordlist.Add(Stemmer.Stem(word));
            }

            stopwords = stopwordlist.ToArray();
            return(stopwords);
        }