Example #1
0
        public static SharpEntropy.GisModel TrainModel(string trainingFile, EventType modelType, string headRulesFile, int iterations, int cutoff)
        {
            var rules = new EnglishHeadRules(headRulesFile);

            SharpEntropy.ITrainingEventReader eventReader = new ParserEventReader(new SharpEntropy.PlainTextByLineDataReader(new StreamReader(trainingFile)), rules, modelType);
            return(Train(eventReader, iterations, cutoff));
        }
        public EnglishTreebankParser(string dataDirectory, bool useTagDictionary, bool useCaseSensitiveTagDictionary, int beamSize, double advancePercentage)
        {
            SharpEntropy.IO.BinaryGisModelReader buildModelReader = new SharpEntropy.IO.BinaryGisModelReader(dataDirectory + "parser\\build.nbin");
            SharpEntropy.GisModel buildModel = new SharpEntropy.GisModel(buildModelReader);

            SharpEntropy.IO.BinaryGisModelReader checkModelReader = new SharpEntropy.IO.BinaryGisModelReader(dataDirectory + "parser\\check.nbin");
            SharpEntropy.IMaximumEntropyModel checkModel = new SharpEntropy.GisModel(checkModelReader);

            EnglishTreebankPosTagger posTagger;

            if (useTagDictionary)
            {
                posTagger = new EnglishTreebankPosTagger(dataDirectory + "parser\\tag.nbin", dataDirectory + "parser\\tagdict", useCaseSensitiveTagDictionary);
            }
            else
            {
                posTagger = new EnglishTreebankPosTagger(dataDirectory + "parser\\tag.nbin");
            }

            EnglishTreebankParserChunker chunker = new EnglishTreebankParserChunker(dataDirectory + "parser\\chunk.nbin");
            EnglishHeadRules headRules = new EnglishHeadRules(dataDirectory + "parser\\head_rules");

            mParser = new MaximumEntropyParser(buildModel, checkModel, posTagger, chunker, headRules, beamSize, advancePercentage);

            mTokenizer = new OpenNLP.Tools.Tokenize.EnglishMaximumEntropyTokenizer(dataDirectory + "EnglishTok.nbin");
        }
        public EnglishTreebankParser(string dataDirectory, bool useTagDictionary, bool useCaseSensitiveTagDictionary, int beamSize, double advancePercentage)
        {
            SharpEntropy.IO.BinaryGisModelReader buildModelReader = new SharpEntropy.IO.BinaryGisModelReader(dataDirectory + "parser\\build.nbin");
            SharpEntropy.GisModel buildModel = new SharpEntropy.GisModel(buildModelReader);

            SharpEntropy.IO.BinaryGisModelReader checkModelReader = new SharpEntropy.IO.BinaryGisModelReader(dataDirectory + "parser\\check.nbin");
            SharpEntropy.IMaximumEntropyModel    checkModel       = new SharpEntropy.GisModel(checkModelReader);

            EnglishTreebankPosTagger posTagger;

            if (useTagDictionary)
            {
                posTagger = new EnglishTreebankPosTagger(dataDirectory + "parser\\tag.nbin", dataDirectory + "parser\\tagdict", useCaseSensitiveTagDictionary);
            }
            else
            {
                posTagger = new EnglishTreebankPosTagger(dataDirectory + "parser\\tag.nbin");
            }

            EnglishTreebankParserChunker chunker   = new EnglishTreebankParserChunker(dataDirectory + "parser\\chunk.nbin");
            EnglishHeadRules             headRules = new EnglishHeadRules(dataDirectory + "parser\\head_rules");

            mParser = new MaximumEntropyParser(buildModel, checkModel, posTagger, chunker, headRules, beamSize, advancePercentage);

            mTokenizer = new OpenNLP.Tools.Tokenize.EnglishMaximumEntropyTokenizer(dataDirectory + "EnglishTok.nbin");
        }
Example #4
0
        public static SharpEntropy.GisModel TrainModel(string trainingFile, EventType modelType, string headRulesFile, int iterations, int cutoff)
        {
            var rules = new EnglishHeadRules(headRulesFile);

#if DNF
            SharpEntropy.ITrainingEventReader eventReader = new ParserEventReader(new SharpEntropy.PlainTextByLineDataReader(new StreamReader(trainingFile)), rules, modelType);
#else
            SharpEntropy.ITrainingEventReader eventReader =
                new ParserEventReader(
                    new SharpEntropy.PlainTextByLineDataReader(
                        new StreamReader(new FileStream(trainingFile, FileMode.OpenOrCreate, FileAccess.Read))), rules, modelType);
#endif
            return(Train(eventReader, iterations, cutoff));
        }
Example #5
0
        // Constructors ---------------------

        public EnglishTreebankParser(string dataDirectory, bool useTagDictionary, bool useCaseSensitiveTagDictionary, int beamSize, double advancePercentage)
        {
            var buildModelReader = new SharpEntropy.IO.BinaryGisModelReader(dataDirectory + Path.Combine("parser", "build.nbin"));
            var buildModel       = new SharpEntropy.GisModel(buildModelReader);

            var checkModelReader = new SharpEntropy.IO.BinaryGisModelReader(dataDirectory + Path.Combine("parser", "check.nbin"));

            SharpEntropy.IMaximumEntropyModel checkModel = new SharpEntropy.GisModel(checkModelReader);

            EnglishTreebankPosTagger posTagger = useTagDictionary ?
                                                 new EnglishTreebankPosTagger(dataDirectory + Path.Combine("parser", "tag.nbin"), dataDirectory + Path.Combine("parser", "tagdict"), useCaseSensitiveTagDictionary)
                : new EnglishTreebankPosTagger(dataDirectory + Path.Combine("parser", "tag.nbin"));

            var chunker   = new EnglishTreebankParserChunker(dataDirectory + Path.Combine("parser", "chunk.nbin"));
            var headRules = new EnglishHeadRules(dataDirectory + Path.Combine("parser", "head_rules"));

            _parser = new MaximumEntropyParser(buildModel, checkModel, posTagger, chunker, headRules, beamSize, advancePercentage);

            _tokenizer = new Tokenize.EnglishMaximumEntropyTokenizer(dataDirectory + "EnglishTok.nbin");
        }
Example #6
0
		public static SharpEntropy.GisModel TrainModel(string trainingFile, EventType modelType, string headRulesFile, int iterations, int cutoff)
		{
			var rules = new EnglishHeadRules(headRulesFile);
			SharpEntropy.ITrainingEventReader eventReader = new ParserEventReader(new SharpEntropy.PlainTextByLineDataReader(new StreamReader(trainingFile)), rules, modelType);
			return Train(eventReader, iterations, cutoff);
		}