Esempio n. 1
0
 private static void test_floresta_reader()
 {
     var floresta = new FlorestaCorpusReader(Path.Combine(
       Environment.GetFolderPath(Environment.SpecialFolder.MyDocuments), @"Data/floresta"));
       foreach ( var word in floresta.words().Select((x)=>TextTools.trim_punctuation(x)).Freqs().Generate().OrderBy((x)=>x.Value))
       {
     Console.WriteLine("{0}: {1}", word.Key, word.Value);
       }
 }
Esempio n. 2
0
        private static void portuguese_word_frequency()
        {
            var floresta = new FlorestaCorpusReader(Path.Combine(
              Environment.GetFolderPath(Environment.SpecialFolder.MyDocuments), @"Data/floresta"));
              var mac_morpho = new Mac_morphoCorpusReader(Path.Combine(
              Environment.GetFolderPath(Environment.SpecialFolder.MyDocuments), @"Data/mac_morpho"));

              using (StreamWriter outfile = new StreamWriter(Path.Combine(
            Environment.GetFolderPath(Environment.SpecialFolder.Desktop), "portuguese_words.txt"), false, Encoding.UTF8))
              {
            foreach (var word in mac_morpho.words().Where((x) => !TextTools.is_puctuation(x))
              .Concat(floresta.words().Select((x) => TextTools.trim_punctuation(x)))
              .Freqs().Generate().OrderBy((x) => x.Value).Reverse())
            {
              outfile.WriteLine("{0}: {1}", word.Key, word.Value);
            }
              }
        }