/**
 * <summary>Train method for the Dummy pos tagger. Stores every tag in the tag list of the corpus
 * in <c>_tagList</c>.</summary>
 *
 * <param name="corpus">Training data for the tagger.</param>
 */
public void Train(PosTaggedCorpus corpus)
{
    // ToArray() allocates the result array itself, so no separate pre-allocation is needed.
    _tagList = corpus.GetTagList().ToArray();
}
/**
 * <summary>Train method for the Hmm pos tagger. Collects the tag sequence of every sentence in the corpus and
 * builds an <c>Hmm1</c> from the tag list of the corpus, those per-sentence tag sequences and the words of
 * the corpus.</summary>
 *
 * <param name="corpus">Training data for the tagger. Every word in it is cast to <c>PosTaggedWord</c>.</param>
 */
public void Train(PosTaggedCorpus corpus)
{
    // One tag sequence per sentence, in corpus order.
    var tagSequences = new List<string>[corpus.SentenceCount()];
    for (var i = 0; i < tagSequences.Length; i++)
    {
        // Look the sentence and its length up once instead of on every inner-loop step.
        var sentence = corpus.GetSentence(i);
        var wordCount = sentence.WordCount();
        var tags = new List<string>();
        for (var j = 0; j < wordCount; j++)
        {
            var word = (PosTaggedWord)sentence.GetWord(j);
            tags.Add(word.GetTag());
        }

        tagSequences[i] = tags;
    }

    _hmm = new Hmm1<string, Word>(corpus.GetTagList(), tagSequences, corpus.GetAllWordsAsArray());
}