示例#1
0
 /// <summary>
 /// Writes one line per term in <paramref name="result"/> to the file at <paramref name="path"/>.
 /// Each line has the form: concept, " |", the term's variants rendered by
 /// <c>WriteToString</c>, three tab characters, then the term's confidence.
 /// </summary>
 /// <param name="result">Terms to write, in iteration order.</param>
 /// <param name="path">Path handed to <see cref="System.IO.StreamWriter"/>.</param>
 public void Output(List <Term> result, string path)
 {
     using (var writer = new System.IO.StreamWriter(path))
     {
         foreach (Term entry in result)
         {
             // Variants recorded in the index for this term's concept.
             ISet<string> variants = index.RetrieveVariantsOfCanonicalTerm(entry.GetConcept());

             // Assemble the full line first, then emit it with a single write.
             var line = entry.GetConcept()
                        + " |"
                        + WriteToString(variants)
                        + "\t\t\t"
                        + entry.GetConfidence();

             writer.WriteLine(line);
         }
     }
 }
示例#2
0
        /// <summary>
        /// For every document in <paramref name="index"/>, counts each canonical term retrieved
        /// for that document against the document's cleaned content and adds the count to
        /// <paramref name="featureCorpusTermFrequency"/>.
        /// </summary>
        /// <param name="index">Source of documents, canonical terms per document, and term variants.</param>
        /// <param name="featureCorpusTermFrequency">Receives a frequency contribution per (document, term) pair.</param>
        private void Count(GlobalIndex index, FeatureCorpusTermFrequency featureCorpusTermFrequency)
        {
            var counter = new TermFrequencyCounter();

            foreach (Document doc in index.GetDocuments())
            {
                // Content is passed through the TERM_CLEAN_PATTERN replacement before counting.
                string cleanedContent = WordUtil.ApplyCharacterReplacement(
                    doc.GetContent(),
                    RuntimeProperties.TERM_CLEAN_PATTERN);

                ISet<string> canonicalTerms = index.RetrieveCanonicalTermsInDoc(doc);

                foreach (string canonicalTerm in canonicalTerms)
                {
                    // The counter is given all variants of the canonical term, not just the term itself.
                    var variants = index.RetrieveVariantsOfCanonicalTerm(canonicalTerm);
                    int occurrences = counter.Count(cleanedContent, variants);

                    featureCorpusTermFrequency.AddToTermFrequency(canonicalTerm, occurrences);
                }
            }
        }