/// <summary>
/// Pulls this field's text out of <paramref name="line"/>, starting at the line's
/// current position, and unwraps it from the configured quote character when present.
/// </summary>
/// <param name="line">Line reader state holding the record being parsed</param>
/// <returns>
/// The empty result for an optional field at end of line; otherwise the result of the
/// plain extraction (no quote char configured, or quotes optional and absent) or of the
/// quoted-string extraction.
/// </returns>
/// <exception cref="BadUsageException">
/// The quoted value is not followed by the separator or end of line (and the field is not
/// the last one), or quotes are mandatory and the field does not start with the quote char.
/// </exception>
public override ExtractedInfo ExtractFieldString(LineInfo line)
{
    // Optional field with nothing left on the line: nothing to extract.
    if (IsOptional && line.IsEOL())
    {
        return Visyn.Windows.Io.FileHelper.Core.ExtractedInfo.Empty;
    }

    // '\0' as quote char means the field is not quoted at all.
    if (QuoteChar == '\0')
    {
        return BasicExtractString(line);
    }

    var trimLeading = TrimMode == TrimMode.Both || TrimMode == TrimMode.Left;
    if (trimLeading)
    {
        line.TrimStart(TrimChars);
    }

    var quoteText = QuoteChar.ToString();

    if (!line.StartsWith(quoteText))
    {
        // No opening quote: acceptable only when quoting is optional on read.
        var quotesOptional = QuoteMode == QuoteMode.OptionalForBoth || QuoteMode == QuoteMode.OptionalForRead;
        if (quotesOptional)
        {
            return BasicExtractString(line);
        }

        // Distinguish "quote present but preceded by trimmable text" from "no quote at all"
        // so the error message can point at the right remedy.
        if (line.StartsWithTrim(quoteText))
        {
            throw new BadUsageException(
                $"The field '{FieldInfo.Name}' has spaces before the QuotedChar at line {line.mReader.LineNumber}. Use the TrimAttribute to by pass this error. Field String: {line.CurrentString}");
        }

        throw new BadUsageException(
            $"The field '{FieldInfo.Name}' does not begin with the QuotedChar at line {line.mReader.LineNumber}. You can use FieldQuoted(QuoteMode.OptionalForRead) to allow optional quoted field. Field String: {line.CurrentString}");
    }

    var allowMultiline = QuoteMultiline == MultilineMode.AllowForBoth || QuoteMultiline == MultilineMode.AllowForRead;
    var extracted = StringHelper.ExtractQuotedString(line, QuoteChar, allowMultiline);

    // Right-hand trimming is applied to whatever remains on the line after the quoted value.
    var trimTrailing = TrimMode == TrimMode.Both || TrimMode == TrimMode.Right;
    if (trimTrailing)
    {
        line.TrimStart(TrimChars);
    }

    // After the quoted value we must be at the last field, a separator, or end of line.
    var properlyTerminated = IsLast || line.StartsWith(Separator) || line.IsEOL();
    if (!properlyTerminated)
    {
        throw new BadUsageException(line,
            "The field " + FieldInfo.Name + " is quoted but the quoted char: " + quoteText + " not is just before the separator (You can use [FieldTrim] to avoid this error)");
    }

    return extracted;
}
/// <summary>
/// Reads a quoted value starting at the current position of <paramref name="line"/>.
/// A doubled quote inside the value stands for one literal quote, e.g. 'o''clock'.
/// </summary>
/// <param name="line">Line state; its current position must be on the opening quote</param>
/// <param name="quoteChar">Character that opens and closes the value</param>
/// <param name="allowMultiline">
/// When true, an unclosed value continues onto the next line that is read
/// </param>
/// <returns>The unquoted text; the line position is left just past the closing quote</returns>
/// <exception cref="BadUsageException">
/// The line is at its end, the current character is not the quote char,
/// or the value is never closed.
/// </exception>
internal static ExtractedInfo ExtractQuotedString(LineInfo line, char quoteChar, bool allowMultiline)
{
    if (line.IsEOL())
    {
        throw new BadUsageException(
            "An empty String found. This can not be parsed like a QuotedString try to use SafeExtractQuotedString");
    }

    if (line.mLineStr[line.mCurrentPos] != quoteChar)
    {
        throw new BadUsageException("The source string does not begin with the quote char: " + quoteChar);
    }

    var buffer = new StringBuilder(32);

    // True when the previous character was a quote whose meaning is still undecided:
    // it is either the closing quote or the first half of a doubled (escaped) quote.
    var quotePending = false;

    // Start scanning right after the opening quote.
    var pos = line.mCurrentPos + 1;

    while (line.mLineStr != null)
    {
        for (; pos < line.mLineStr.Length; pos++)
        {
            var current = line.mLineStr[pos];

            if (current != quoteChar)
            {
                if (quotePending)
                {
                    // The pending quote was the closing one; stop on the character after it.
                    line.mCurrentPos = pos;
                    return new ExtractedInfo(buffer.ToString());
                }

                buffer.Append(current);
            }
            else if (quotePending)
            {
                // Second quote of a doubled pair: emit a single literal quote.
                buffer.Append(quoteChar);
                quotePending = false;
            }
            else
            {
                quotePending = true;
            }
        }

        // Ran off the end of the line: a pending quote there is the closing quote.
        if (quotePending)
        {
            line.mCurrentPos = pos;
            return new ExtractedInfo(buffer.ToString());
        }

        if (!allowMultiline)
        {
            throw new BadUsageException("The current field has an unclosed quoted string. Complete line: " + buffer.ToString());
        }

        // The value continues on the next line; keep the line break as part of the value.
        line.ReadNextLine();
        buffer.Append(NewLine);
        pos = 0;
    }

    // No more lines (mLineStr became null) and the value was never closed.
    throw new BadUsageException("The current field has an unclosed quoted string. Complete Filed String: " + buffer.ToString());
}
/// <summary>
/// Extracts this field's text from <paramref name="line"/>, unwrapping it from the
/// configured quote character when the field starts with one.
/// </summary>
/// <param name="line">Line state positioned at the start of the field</param>
/// <returns>
/// The empty result for an optional field at end of line; otherwise the plain or
/// quoted extraction result.
/// </returns>
/// <exception cref="BadUsageException">
/// Quotes are mandatory on read and the field does not start with the quote char.
/// </exception>
protected override ExtractedInfo ExtractFieldString(LineInfo line)
{
    if (mIsOptional && line.IsEOL())
    {
        return ExtractedInfo.Empty;
    }

    // '\0' as quote char means the field is not quoted.
    if (mQuoteChar == '\0')
    {
        return BasicExtractString(line);
    }

    // TODO (carried over from the original): the legacy code tracked how many characters
    // trimming removed; that bookkeeping was commented out and never restored.
    switch (mTrimMode)
    {
        case TrimMode.Both:
        case TrimMode.Left:
            line.TrimStart(mTrimChars);
            break;
    }

    string quoteText = mQuoteChar.ToString();

    if (line.StartsWith(quoteText))
    {
        bool multilineOnRead = mQuoteMultiline == MultilineMode.AllowForBoth
                               || mQuoteMultiline == MultilineMode.AllowForRead;
        return StringHelper.ExtractQuotedString(line, mQuoteChar, multilineOnRead);
    }

    // No opening quote from here on.
    bool quotesOptionalOnRead = mQuoteMode == QuoteMode.OptionalForBoth
                                || mQuoteMode == QuoteMode.OptionalForRead;
    if (quotesOptionalOnRead)
    {
        return BasicExtractString(line);
    }

    // Quote exists but only after trimmable text: suggest trimming.
    if (line.StartsWithTrim(quoteText))
    {
        throw new BadUsageException("The field '" + mFieldInfo.Name + "' has spaces before the QuotedChar at line " + line.mReader.LineNumber.ToString() + ". Use the TrimAttribute to by pass this error. Field String: " + line.CurrentString);
    }

    throw new BadUsageException("The field '" + mFieldInfo.Name + "' not begin with the QuotedChar at line " + line.mReader.LineNumber.ToString() + ". You can use FieldQuoted(QuoteMode.OptionalForRead) to allow optional quoted field.. Field String: " + line.CurrentString);
}
/// <summary>
/// Extracts this field's value from the current position of <paramref name="line"/>,
/// either as a single value or, for array fields, as an array of values read until the
/// line is exhausted or <c>ArrayMaxLength</c> elements have been read.
/// </summary>
/// <param name="line">Line handler containing the text being parsed; its position is advanced</param>
/// <returns>
/// For a non-array field: the discarded-null value when the field is discarded, otherwise
/// the value produced by <c>AssignFromString</c>. For an array field: <c>null</c> when the
/// field is discarded, otherwise the collected values converted to an array of <c>ArrayType</c>.
/// </returns>
/// <exception cref="BadUsageException">
/// The field is marked as starting on a new line but text remains on the current line,
/// or the stream ends before that new line can be read.
/// </exception>
/// <exception cref="InvalidOperationException">
/// The array holds fewer than <c>ArrayMinLength</c> values, or this is the last field and
/// text remains on the line after the array was read.
/// </exception>
public object ExtractFieldValue(LineInfo line)
{
    //-> extract only what I need
    if (InNewLine)
    {
        // Any trailing characters on the current line are an error for a new-line field.
        if (line.EmptyFromPos() == false)
        {
            throw new BadUsageException(line,
                $"Text '{line.CurrentString}' found before the new line of the field: {FieldInfo.Name} (this is not allowed when you use [FieldInNewLine])");
        }

        line.ReLoad(line.mReader.ReadNextLine());

        if (line.mLineStr == null)
        {
            throw new BadUsageException(line,
                $"End of stream found parsing the field {FieldInfo.Name}. Please check the class record.");
        }
    }

    if (IsArray == false)
    {
        var info = ExtractFieldString(line);

        // Without a custom extracted string, move to one past the extracted range.
        if (info.mCustomExtractedString == null)
        {
            line.mCurrentPos = info.ExtractedTo + 1;
        }

        line.mCurrentPos += CharsToDiscard; //total;

        return Discarded ? GetDiscardedNullValue() : AssignFromString(info, line).Value;
    }

    // Normalise a negative minimum to zero.
    if (ArrayMinLength <= 0)
    {
        ArrayMinLength = 0;
    }

    var i = 0;
    var res = new ArrayList(Math.Max(ArrayMinLength, 10));

    // CharsToDiscard is added after every element, so it is subtracted again here
    // before comparing the position with the line length.
    while (line.mCurrentPos - CharsToDiscard < line.mLineStr.Length && i < ArrayMaxLength)
    {
        var info = ExtractFieldString(line);

        if (info.mCustomExtractedString == null)
        {
            line.mCurrentPos = info.ExtractedTo + 1;
        }

        line.mCurrentPos += CharsToDiscard;

        try
        {
            var value = AssignFromString(info, line);

            // A null-substituted first element at end of line leaves the array empty.
            if (value.NullValueUsed && i == 0 && line.IsEOL())
            {
                break;
            }

            res.Add(value.Value);
        }
        catch (NullValueNotFoundException)
        {
            // Only tolerated for the first element (array left empty); otherwise rethrown.
            if (i == 0)
            {
                break;
            }

            throw;
        }

        i++;
    }

    if (res.Count < ArrayMinLength)
    {
        throw new InvalidOperationException(
            $"Line: {line.mReader.LineNumber} Column: {line.mCurrentPos} Field: {FieldInfo.Name}. The array has only {res.Count} values, less than the minimum length of {ArrayMinLength}");
    }

    if (IsLast && line.IsEOL() == false)
    {
        // The message must stay on one line: a raw line break inside a regular
        // interpolated string literal does not compile.
        throw new InvalidOperationException(
            $"Line: {line.mReader.LineNumber} Column: {line.mCurrentPos} Field: {FieldInfo.Name}. The array has more values than the maximum length of {ArrayMaxLength}");
    }

    // TODO: is there a reason we go through all the array processing then discard it
    // NOTE(review): the loop above advances line.mCurrentPos, which may be why parsing
    // still runs for discarded fields - confirm before short-circuiting.
    return Discarded ? null : res.ToArray(ArrayType);
}