/// <summary>
/// Creates an ObjectBank from a collection of inputs by pairing a
/// <c>ReaderIteratorFactory</c> built over those inputs with the factory
/// that <c>LineIterator.GetFactory</c> returns for <paramref name="op"/>.
/// </summary>
/// <typeparam name="X">Element type produced by <paramref name="op"/> and held by the returned ObjectBank.</typeparam>
/// <typeparam name="_T1">Element type of the input collection.</typeparam>
/// <param name="filesStringsAndReaders">Inputs passed unchanged to the <c>ReaderIteratorFactory</c> constructor.</param>
/// <param name="op">Function passed to <c>LineIterator.GetFactory</c>; presumably applied to each line read (confirm against LineIterator).</param>
/// <param name="encoding">Encoding name passed to the <c>ReaderIteratorFactory</c> constructor.</param>
/// <returns>A new ObjectBank wrapping the two factories.</returns>
public static Edu.Stanford.Nlp.Objectbank.ObjectBank <X> GetLineIterator <X, _T1>(ICollection <_T1> filesStringsAndReaders, IFunction <string, X> op, string encoding)
        {
            // Source of readers: built first, exactly as before.
            ReaderIteratorFactory readerSource = new ReaderIteratorFactory(filesStringsAndReaders, encoding);

            // Factory obtained from LineIterator for the supplied function.
            IIteratorFromReaderFactory <X> lineFactory = LineIterator.GetFactory(op);

            return new Edu.Stanford.Nlp.Objectbank.ObjectBank <X>(readerSource, lineFactory);
        }
Exemplo n.º 2
0
        /// <summary>
        /// Creates an ObjectBank for a single file by pairing a
        /// <c>ReaderIteratorFactory</c> built over that file with the factory
        /// that <c>LineIterator.GetFactory</c> returns for <paramref name="op"/>.
        /// </summary>
        /// <typeparam name="X">Element type produced by <paramref name="op"/> and held by the returned ObjectBank.</typeparam>
        /// <param name="file">File passed unchanged to the <c>ReaderIteratorFactory</c> constructor.</param>
        /// <param name="op">Function passed to <c>LineIterator.GetFactory</c>; presumably applied to each line read (confirm against LineIterator).</param>
        /// <param name="encoding">Encoding name passed to the <c>ReaderIteratorFactory</c> constructor.</param>
        /// <returns>A new ObjectBank wrapping the two factories.</returns>
        public static Edu.Stanford.Nlp.Objectbank.ObjectBank <X> GetLineIterator <X>(File file, Func <string, X> op, string encoding)
        {
            // Source of readers: built first, exactly as before.
            ReaderIteratorFactory readerSource = new ReaderIteratorFactory(file, encoding);

            // Factory obtained from LineIterator for the supplied function.
            IIteratorFromReaderFactory <X> lineFactory = LineIterator.GetFactory(op);

            return new Edu.Stanford.Nlp.Objectbank.ObjectBank <X>(readerSource, lineFactory);
        }
        /// <summary>
        /// Creates an ObjectBank for an already-open reader by pairing a
        /// <c>ReaderIteratorFactory</c> built over that reader with the factory
        /// that <c>LineIterator.GetFactory</c> returns for <paramref name="op"/>.
        /// </summary>
        /// <typeparam name="X">Element type produced by <paramref name="op"/> and held by the returned ObjectBank.</typeparam>
        /// <param name="reader">Reader passed unchanged to the <c>ReaderIteratorFactory</c> constructor.</param>
        /// <param name="op">Function passed to <c>LineIterator.GetFactory</c>; presumably applied to each line read (confirm against LineIterator).</param>
        /// <returns>A new ObjectBank wrapping the two factories.</returns>
        public static Edu.Stanford.Nlp.Objectbank.ObjectBank <X> GetLineIterator <X>(Reader reader, IFunction <string, X> op)
        {
            // Source of readers: built first, exactly as before.
            ReaderIteratorFactory readerSource = new ReaderIteratorFactory(reader);

            // Factory obtained from LineIterator for the supplied function.
            IIteratorFromReaderFactory <X> lineFactory = LineIterator.GetFactory(op);

            return new Edu.Stanford.Nlp.Objectbank.ObjectBank <X>(readerSource, lineFactory);
        }
Exemplo n.º 4
0
 /// <summary>
 /// Creates a reader/writer configured by the given input-format switches,
 /// domain and tokenizer factory, and installs a line-based iterator factory.
 /// </summary>
 /// <param name="hasSegMarkers">
 /// if true, input has segmentation markers; the segmentation marker is then
 /// set to <c>DefaultSegMarker</c>, otherwise it is left null
 /// </param>
 /// <param name="hasTags">if true, input has morphological analyses separated by tagDelimiter.</param>
 /// <param name="hasDomainLabels">
 /// if true, input has a whitespace-terminated domain at the beginning
 /// of each line of text
 /// </param>
 /// <param name="domain">
 /// value stored as the input domain (NOTE(review): presumably used when
 /// lines carry no domain label of their own; confirm against the parser)
 /// </param>
 /// <param name="stripRewrites">
 /// if true, erase orthographical rewrites from the gold labels (for
 /// comparison purposes)
 /// </param>
 /// <param name="tokFactory">a TokenizerFactory for the input</param>
 public ArabicDocumentReaderAndWriter(bool hasSegMarkers, bool hasTags, bool hasDomainLabels, string domain, bool stripRewrites, ITokenizerFactory <CoreLabel> tokFactory)
 {
     // Input-format switches.
     inputHasTags = hasTags;
     inputHasDomainLabels = hasDomainLabels;
     shouldStripRewrites = stripRewrites;

     // Segmentation marker is only set when the input actually carries markers.
     if (hasSegMarkers)
     {
         segMarker = DefaultSegMarker;
     }
     else
     {
         segMarker = null;
     }

     inputDomain = domain;
     tf = tokFactory;

     // Created last, after every configuration field above has been assigned,
     // because the function object receives a reference to this instance.
     factory = LineIterator.GetFactory(new _ISerializableFunction_131(this));
 }
 /// <summary>
 /// Stores the flags, installs a line-based iterator factory backed by a
 /// <c>CTBDocumentParser</c>, creates the document-to-sentence processor and
 /// builds whichever dictionaries the flags specify.
 /// </summary>
 /// <param name="flags">
 /// Classifier flags. <c>dictionary</c> and <c>dictionary2</c> are split on
 /// commas; <c>serializedDictionary</c> is used as a single value and, when
 /// set, replaces any dictionary built from <c>dictionary</c>.
 /// </param>
 public virtual void Init(SeqClassifierFlags flags)
 {
     this.flags = flags;

     var lineParser = new Sighan2005DocumentReaderAndWriter.CTBDocumentParser(this);
     factory = LineIterator.GetFactory(lineParser);

     // Note carried over from the original author (pichuan, Thu Apr 24 11:10:42 2008):
     // flags.normalizationTable is null here; believed to have been replaced by some Java class.
     cdtos = new ChineseDocumentToSentenceProcessor(flags.normalizationTable);

     // Primary dictionary, given as a comma-separated list.
     if (flags.dictionary != null)
     {
         string[] primaryEntries = flags.dictionary.Split(",");
         cdict = new ChineseDictionary(primaryEntries, cdtos, flags.expandMidDot);
     }

     // A serialized dictionary, when present, overrides the one built above.
     if (flags.serializedDictionary != null)
     {
         string serialized = flags.serializedDictionary;
         cdict = new ChineseDictionary(serialized, cdtos, flags.expandMidDot);
     }

     // Secondary dictionary, also given as a comma-separated list.
     if (flags.dictionary2 != null)
     {
         string[] secondaryEntries = flags.dictionary2.Split(",");
         cdict2 = new ChineseDictionary(secondaryEntries, cdtos, flags.expandMidDot);
     }
 }
 /// <summary>
 /// Stores the flags and installs an <c>XMLBeginEndIterator</c> factory for
 /// the "DOC" tag, backed by a new <c>MUCDocumentParser</c>.
 /// </summary>
 /// <param name="flags">Classifier flags kept on this instance.</param>
 public virtual void Init(SeqClassifierFlags flags)
 {
     this.flags = flags;

     var docParser = new MUCDocumentReaderAndWriter.MUCDocumentParser();
     // NOTE(review): the meaning of the two boolean arguments is defined by
     // XMLBeginEndIterator.GetFactory and is not visible here.
     factory = XMLBeginEndIterator.GetFactory("DOC", docParser, true, true);
 }
 /// <summary>
 /// Creates a new ObjectBank from a reader source and an
 /// iterator-from-reader factory. Both arguments are stored as given.
 /// </summary>
 /// <param name="rif">
 /// The <see cref="ReaderIteratorFactory"/> from which to get Readers.
 /// </param>
 /// <param name="ifrf">
 /// The <see cref="IIteratorFromReaderFactory{T}"/> which turns Readers
 /// into Iterators of Objects.
 /// </param>
 public ObjectBank(ReaderIteratorFactory rif, IIteratorFromReaderFactory <E> ifrf)
 {
     // The two assignments are independent of each other.
     this.ifrf = ifrf;
     this.rif = rif;
 }
Exemplo n.º 8
0
 /// <summary>
 /// Creates a reader whose iterator factory comes from
 /// <c>DelimitRegExIterator.GetFactory</c>, using a delimiter pattern that
 /// matches a newline followed by one or more whitespace-only lines, and a
 /// new <c>SentenceProcessor</c>.
 /// </summary>
 public CoNLLUDocumentReader()
 {
     var sentenceProcessor = new CoNLLUDocumentReader.SentenceProcessor();
     this.ifrf = DelimitRegExIterator.GetFactory("\n(\\s*\n)+", sentenceProcessor);
 }
 //TODO: repair this so it works with the feature label/coreLabel change
 /// <summary>
 /// Stores the flags and installs an iterator factory from
 /// <c>DelimitRegExIterator.GetFactory</c>, using a delimiter pattern that
 /// matches a newline followed by one or more whitespace-only lines, and a
 /// <c>ColumnDocParser</c> bound to this instance.
 /// </summary>
 /// <param name="flags">Classifier flags kept on this instance.</param>
 public virtual void Init(SeqClassifierFlags flags)
 {
     this.flags = flags;

     var columnParser = new LibSVMReaderAndWriter.ColumnDocParser(this);
     factory = DelimitRegExIterator.GetFactory("\n(\\s*\n)+", columnParser);
 }
 /// <summary>
 /// Copies the verbosity setting from the flags and installs a line-based
 /// iterator factory backed by a new <c>LineToTrueCasesParser</c>.
 /// </summary>
 /// <param name="flags">
 /// Classifier flags; only <c>verboseForTrueCasing</c> is read here, and the
 /// flags object itself is not stored by this method.
 /// </param>
 public virtual void Init(SeqClassifierFlags flags)
 {
     verboseForTrueCasing = flags.verboseForTrueCasing;

     var lineParser = new TrueCasingForNISTDocumentReaderAndWriter.LineToTrueCasesParser();
     factory = LineIterator.GetFactory(lineParser);
 }
 /// <summary>
 /// Initializes this reader from a map string: the string is converted with
 /// <c>StringUtils.MapStringToArray</c>, the result is passed through
 /// <c>CoreLabel.ParseStringKeys</c> and stored, and an iterator factory is
 /// installed from <c>DelimitRegExIterator.GetFactory</c> with a
 /// <c>ColumnDocParser</c> bound to this instance.
 /// </summary>
 /// <param name="map">Map string handed to <c>StringUtils.MapStringToArray</c>.</param>
 public virtual void Init(string map)
 {
     // Note: this overload does not assign this.flags.
     var columnNames = StringUtils.MapStringToArray(map);
     this.map = CoreLabel.ParseStringKeys(columnNames);

     // The delimiter pattern matches a newline followed by one or more whitespace-only lines.
     var columnParser = new ColumnDocumentReaderAndWriter.ColumnDocParser(this);
     factory = DelimitRegExIterator.GetFactory("\n(?:\\s*\n)+", columnParser);
 }
Exemplo n.º 12
0
 /// <summary>
 /// Stores the flags, converts <c>flags.map</c> with
 /// <c>StringUtils.MapStringToArray</c> and stores the result, then installs
 /// an iterator factory from <c>DelimitRegExIterator.GetFactory</c> with a
 /// <c>MalletDocParser</c> bound to this instance.
 /// </summary>
 /// <param name="flags">Classifier flags kept on this instance; <c>flags.map</c> supplies the map string.</param>
 public virtual void Init(SeqClassifierFlags flags)
 {
     this.flags = flags;
     this.map = StringUtils.MapStringToArray(flags.map);

     // The delimiter pattern matches a newline followed by one or more whitespace-only lines.
     var malletParser = new MalletReaderAndWriter.MalletDocParser(this);
     factory = DelimitRegExIterator.GetFactory("\n(\\s*\n)+", malletParser);
 }