/// <summary>
/// Creates an ObjectBank over a collection of input sources, using a
/// factory obtained from <c>LineIterator.GetFactory(op)</c> to turn
/// readers into iterators.
/// </summary>
/// <param name="filesStringsAndReaders">
/// The input sources, handed unchanged to the <see cref="ReaderIteratorFactory"/>.
/// </param>
/// <param name="op">The function from string to <typeparamref name="X"/> passed to the line-iterator factory.</param>
/// <param name="encoding">The encoding handed to the <see cref="ReaderIteratorFactory"/>.</param>
/// <returns>A new ObjectBank built from the two factories.</returns>
public static Edu.Stanford.Nlp.Objectbank.ObjectBank<X> GetLineIterator<X, _T1>(ICollection<_T1> filesStringsAndReaders, IFunction<string, X> op, string encoding)
{
    // Source side: produces the readers.
    ReaderIteratorFactory readerSource = new ReaderIteratorFactory(filesStringsAndReaders, encoding);

    // Element side: converts each reader into an iterator of X.
    IIteratorFromReaderFactory<X> lineFactory = LineIterator.GetFactory(op);

    return new Edu.Stanford.Nlp.Objectbank.ObjectBank<X>(readerSource, lineFactory);
}
/// <summary>
/// Creates an ObjectBank over a single file, using a factory obtained
/// from <c>LineIterator.GetFactory(op)</c> to turn readers into iterators.
/// </summary>
/// <param name="file">The file handed to the <see cref="ReaderIteratorFactory"/>.</param>
/// <param name="op">The function from string to <typeparamref name="X"/> passed to the line-iterator factory.</param>
/// <param name="encoding">The encoding handed to the <see cref="ReaderIteratorFactory"/>.</param>
/// <returns>A new ObjectBank built from the two factories.</returns>
public static Edu.Stanford.Nlp.Objectbank.ObjectBank<X> GetLineIterator<X>(File file, Func<string, X> op, string encoding)
{
    // Source side: produces the reader(s) for the file.
    ReaderIteratorFactory fileSource = new ReaderIteratorFactory(file, encoding);

    // Element side: converts each reader into an iterator of X.
    IIteratorFromReaderFactory<X> lineFactory = LineIterator.GetFactory(op);

    return new Edu.Stanford.Nlp.Objectbank.ObjectBank<X>(fileSource, lineFactory);
}
/// <summary>
/// Creates an ObjectBank over a single reader, using a factory obtained
/// from <c>LineIterator.GetFactory(op)</c> to turn readers into iterators.
/// </summary>
/// <param name="reader">The reader wrapped in a <see cref="ReaderIteratorFactory"/>.</param>
/// <param name="op">The function from string to <typeparamref name="X"/> passed to the line-iterator factory.</param>
/// <returns>A new ObjectBank built from the two factories.</returns>
public static Edu.Stanford.Nlp.Objectbank.ObjectBank<X> GetLineIterator<X>(Reader reader, IFunction<string, X> op)
{
    // The line factory is needed second; declare its slot first so the
    // reader factory can be created inline while keeping creation order.
    IIteratorFromReaderFactory<X> lineFactory;
    ReaderIteratorFactory readerSource = new ReaderIteratorFactory(reader);
    lineFactory = LineIterator.GetFactory(op);

    return new Edu.Stanford.Nlp.Objectbank.ObjectBank<X>(readerSource, lineFactory);
}
/// <summary>
/// Configures the reader/writer from the supplied options and installs a
/// line-based iterator factory.
/// </summary>
/// <param name="hasSegMarkers">
/// if true, input has segmentation markers; the segment marker is then set
/// to <c>DefaultSegMarker</c>, otherwise it is set to null
/// </param>
/// <param name="hasTags">if true, input has morphological analyses separated by tagDelimiter.</param>
/// <param name="hasDomainLabels">
/// if true, input has a whitespace-terminated domain at the beginning
/// of each line of text
/// </param>
/// <param name="domain">
/// value stored as the input domain
/// (NOTE(review): presumably the domain used when lines carry no label — confirm)
/// </param>
/// <param name="stripRewrites">
/// if true, erase orthographical rewrites from the gold labels (for
/// comparison purposes)
/// </param>
/// <param name="tokFactory">a TokenizerFactory for the input</param>
public ArabicDocumentReaderAndWriter(bool hasSegMarkers, bool hasTags, bool hasDomainLabels, string domain, bool stripRewrites, ITokenizerFactory<CoreLabel> tokFactory)
{
    // Input-format switches.
    inputHasTags = hasTags;
    inputHasDomainLabels = hasDomainLabels;
    inputDomain = domain;
    shouldStripRewrites = stripRewrites;

    // Segmentation marker is only set when the input actually uses one.
    if (hasSegMarkers)
    {
        segMarker = DefaultSegMarker;
    }
    else
    {
        segMarker = null;
    }

    tf = tokFactory;

    // Assigned last, after all configuration fields are in place, because
    // the function object receives a reference to this instance.
    factory = LineIterator.GetFactory(new _ISerializableFunction_131(this));
}
/// <summary>
/// Stores the flags, installs a line-based iterator factory backed by a
/// CTB document parser, creates the document-to-sentence processor, and
/// loads whichever dictionaries the flags name.
/// </summary>
/// <param name="flags">
/// Classifier flags; reads <c>normalizationTable</c>, <c>dictionary</c>,
/// <c>serializedDictionary</c>, <c>dictionary2</c> and <c>expandMidDot</c>.
/// </param>
public virtual void Init(SeqClassifierFlags flags)
{
    this.flags = flags;
    factory = LineIterator.GetFactory(new Sighan2005DocumentReaderAndWriter.CTBDocumentParser(this));

    // Historical note (pichuan, Thu Apr 24 11:10:42 2008):
    // flags.normalizationTable is null here; this was believed to have been
    // replaced by some Java class.
    cdtos = new ChineseDocumentToSentenceProcessor(flags.normalizationTable);

    // Primary dictionary: a comma-separated list of dictionary sources.
    if (flags.dictionary != null)
    {
        string[] primaryDictionaries = flags.dictionary.Split(",");
        cdict = new ChineseDictionary(primaryDictionaries, cdtos, flags.expandMidDot);
    }

    // A serialized dictionary is checked second, so when both flags are set
    // it replaces the dictionary built just above.
    if (flags.serializedDictionary != null)
    {
        cdict = new ChineseDictionary(flags.serializedDictionary, cdtos, flags.expandMidDot);
    }

    // Secondary dictionary: same comma-separated format as the primary one.
    if (flags.dictionary2 != null)
    {
        string[] secondaryDictionaries = flags.dictionary2.Split(",");
        cdict2 = new ChineseDictionary(secondaryDictionaries, cdtos, flags.expandMidDot);
    }
}
/// <summary>
/// Stores the flags and installs an XML begin/end iterator factory for the
/// <c>DOC</c> tag, backed by a new MUC document parser.
/// </summary>
/// <param name="flags">Classifier flags kept on this instance.</param>
public virtual void Init(SeqClassifierFlags flags)
{
    this.flags = flags;

    // NOTE(review): the meaning of the two trailing 'true' arguments is not
    // visible from here — see XMLBeginEndIterator.GetFactory.
    factory = XMLBeginEndIterator.GetFactory(
        "DOC",
        new MUCDocumentReaderAndWriter.MUCDocumentParser(),
        true,
        true);
}
/// <summary>
/// Constructs an ObjectBank from a source of readers and a factory that
/// converts each reader into an iterator of objects.
/// </summary>
/// <param name="rif">
/// The <see cref="ReaderIteratorFactory"/> that supplies the readers.
/// </param>
/// <param name="ifrf">
/// The <see cref="IIteratorFromReaderFactory{T}"/> that turns a reader
/// into an iterator of objects.
/// </param>
public ObjectBank(ReaderIteratorFactory rif, IIteratorFromReaderFactory<E> ifrf)
{
    // Both collaborators are stored as-is; nothing is read at construction time here.
    this.rif = rif;
    this.ifrf = ifrf;
}
/// <summary>
/// Creates a reader whose iterator factory splits input on a
/// regular-expression delimiter and hands each piece to a new
/// sentence processor.
/// </summary>
public CoNLLUDocumentReader()
{
    // A newline followed by one or more (optional whitespace + newline) runs.
    const string sentenceDelimiter = "\n(\\s*\n)+";

    this.ifrf = DelimitRegExIterator.GetFactory(sentenceDelimiter, new CoNLLUDocumentReader.SentenceProcessor());
}
//TODO: repair this so it works with the feature label/coreLabel change
/// <summary>
/// Stores the flags and installs a regex-delimited iterator factory backed
/// by a column document parser bound to this instance.
/// </summary>
/// <param name="flags">Classifier flags kept on this instance.</param>
public virtual void Init(SeqClassifierFlags flags)
{
    this.flags = flags;

    // A newline followed by one or more (optional whitespace + newline) runs.
    const string documentDelimiter = "\n(\\s*\n)+";

    factory = DelimitRegExIterator.GetFactory(documentDelimiter, new LibSVMReaderAndWriter.ColumnDocParser(this));
}
/// <summary>
/// Copies the true-casing verbosity setting from the flags and installs a
/// line-based iterator factory backed by a new line-to-true-cases parser.
/// </summary>
/// <param name="flags">
/// Classifier flags; only <c>verboseForTrueCasing</c> is read here, and
/// the flags object itself is not stored by this method.
/// </param>
public virtual void Init(SeqClassifierFlags flags)
{
    verboseForTrueCasing = flags.verboseForTrueCasing;

    var lineParser = new TrueCasingForNISTDocumentReaderAndWriter.LineToTrueCasesParser();
    factory = LineIterator.GetFactory(lineParser);
}
/// <summary>
/// Initializes the column map from its string form and installs a
/// regex-delimited iterator factory backed by a column document parser
/// bound to this instance.
/// </summary>
/// <param name="map">
/// The map specification; converted with <c>StringUtils.MapStringToArray</c>
/// and then <c>CoreLabel.ParseStringKeys</c>.
/// </param>
public virtual void Init(string map)
{
    // Note: this overload does not assign the flags field.
    var columnNames = StringUtils.MapStringToArray(map);
    this.map = CoreLabel.ParseStringKeys(columnNames);

    // A newline followed by one or more (optional whitespace + newline) runs.
    const string documentDelimiter = "\n(?:\\s*\n)+";

    factory = DelimitRegExIterator.GetFactory(documentDelimiter, new ColumnDocumentReaderAndWriter.ColumnDocParser(this));
}
/// <summary>
/// Stores the flags, derives the column map from <c>flags.map</c>, and
/// installs a regex-delimited iterator factory backed by a Mallet document
/// parser bound to this instance.
/// </summary>
/// <param name="flags">Classifier flags kept on this instance; <c>map</c> is read from them.</param>
public virtual void Init(SeqClassifierFlags flags)
{
    this.flags = flags;
    this.map = StringUtils.MapStringToArray(flags.map);

    // A newline followed by one or more (optional whitespace + newline) runs.
    const string documentDelimiter = "\n(\\s*\n)+";

    factory = DelimitRegExIterator.GetFactory(documentDelimiter, new MalletReaderAndWriter.MalletDocParser(this));
}