// Round-trip smoke test: generates 1000 sentences, then for each one prints
//   1. its normalized text,
//   2. its "b"-formatted string,
//   3. the gloss of the normalized text,
//   4. the normalized text of the re-parsed sentence,
//   5. the gloss of that re-parsed, re-normalized text.
// Nothing is asserted; the output is written to the console for inspection.
public void GenerateObjectAndStringifyParseGloss()
{
    const int sentenceCount = 1000;

    // Important: create the dialect only once and share it with every
    // collaborator below; mixing dialects is bad business.
    Dialect dialect = Dialect.LooseyGoosey;
    dialect.IncludeApocrypha = false;

    List<Sentence> generated = new List<Sentence>();
    TextGenerator generator = new TextGenerator(dialect);
    for (int n = 0; n < sentenceCount; n++)
    {
        Sentence next = generator.GenerateSentence();
        generated.Add(next);
    }

    ParserUtils parser = new ParserUtils(dialect);
    GlossMaker glosser = new GlossMaker();

    foreach (Sentence original in generated)
    {
        string originalText = original.ToString();

        // A fresh normalizer per sentence, used for both the original and
        // the re-parsed text of that sentence.
        NormalizeExplicit normalizer = new NormalizeExplicit(dialect);
        string normalizedOriginal = normalizer.NormalizeText(originalText);

        Console.WriteLine(normalizedOriginal);
        Console.WriteLine(original.ToString("b"));
        Console.WriteLine(glosser.Gloss(normalizedOriginal, originalText, dialect));

        // Parse the normalized text back into a Sentence and run the same
        // stringify -> normalize -> gloss pipeline on the result.
        Sentence roundTripped = parser.ParsedSentenceFactory(normalizedOriginal, originalText);
        string normalizedRoundTrip = normalizer.NormalizeText(roundTripped.ToString());

        Console.WriteLine(normalizedRoundTrip);
        Console.WriteLine(glosser.Gloss(normalizedRoundTrip, originalText, dialect));
    }
}
// Builds a CorpusKnowledge over CorpusTexts.UnpaText, asks it for its parsed
// sentences, and reports every parsed sentence whose ToString() output does
// not equal any trimmed entry of ck.Setences. Nothing is asserted; mismatches
// are only written to the console.
public void IdentifyDiscourses_CanItEvenParseTheSentences()
{
    string corpusText = CorpusTexts.UnpaText;

    Dialect dialect = Dialect.LooseyGoosey;
    dialect.TargetGloss = "en";

    CorpusKnowledge ck = new CorpusKnowledge(corpusText, dialect);

    // NOTE(review): this normalizer is never used below. It is kept in case
    // constructing it has side effects -- confirm, then remove if it does not.
    NormalizeExplicit norm = new NormalizeExplicit(dialect);

    List<Sentence>[] parsedGroups = ck.MakeSentences();

    for (int groupIndex = 0; groupIndex < parsedGroups.Length; groupIndex++)
    {
        List<Sentence> group = parsedGroups[groupIndex];

        foreach (Sentence parsed in group)
        {
            string roundTripped = parsed.ToString();
            bool found = ck.Setences.Any(raw => raw.Trim() == roundTripped);
            if (found)
            {
                continue;
            }

            // "O:" prints the ck.Setences entry at the outer index and "R:"
            // prints the parsed sentence in "b" format.
            // NOTE(review): presumably parsedGroups[k] was built from
            // ck.Setences[k] -- verify against CorpusKnowledge.
            Console.WriteLine(found + " O:" + ck.Setences[groupIndex]);
            Console.WriteLine(found + " R:" + parsed.ToString("b"));
        }
    }
}