C# (CSharp) Microsoft.ML.Auto TextFileSample Examples

Programming Language: C# (CSharp)

Namespace/Package Name: Microsoft.ML.Auto

Class/Type: TextFileSample

Examples at hotexamples.com: 6

C# (CSharp) Microsoft.ML.Auto TextFileSample - 6 examples found. These are the top-rated real-world C# (CSharp) examples of Microsoft.ML.Auto.TextFileSample, extracted from open source projects. You can rate the examples to help us improve their quality.

Frequently Used Methods

Show Hide

CreateFromFullFile(1)

CreateFromFullStream(1)

Example #1

Show file

File: ColumnInferenceApi.cs Project: daholste/AutoMLDotNet

        /// <summary>
        /// Runs the column inference steps over a text sample: split inference, column type
        /// inference, purpose inference and column grouping, then packages the outcome.
        /// </summary>
        /// <param name="context">ML context handed to each inference step and used to create the text reader.</param>
        /// <param name="sample">Text sample passed to split inference and column type inference.</param>
        /// <param name="createDataView">Callback that turns the configured <c>TextLoader</c> into the data view used for purpose inference.</param>
        /// <param name="label">Label value forwarded to purpose inference.</param>
        /// <param name="hasHeader">Header flag applied to the loader, forwarded to grouping and stored in the result.</param>
        /// <param name="separator">Separator forwarded to split inference.</param>
        /// <param name="isQuoted">Optional quoting setting forwarded to split inference.</param>
        /// <param name="isSparse">Optional sparse setting forwarded to split inference.</param>
        /// <returns>The inferred columns with their purposes, plus the split settings and header flag.</returns>
        private static ColumnInferenceResult InferColumns(MLContext context,
                                                          TextFileSample sample, Func<TextLoader, IDataView> createDataView, string label,
                                                          bool hasHeader, string separator, bool? isQuoted, bool? isSparse)
        {
            // Work out the column split first; type inference depends on its result.
            var split = InferSplit(sample, separator, isQuoted, isSparse);
            var types = InferColumnTypes(context, sample, split);

            // Configure a loader from the inferred split and types, then let the caller
            // produce the data view from it.
            var loaderArgs = new TextLoader.Arguments
            {
                Column = ColumnTypeInference.GenerateLoaderColumns(types.Columns),
                Separator = split.Separator,
                AllowSparse = split.AllowSparse,
                AllowQuoting = split.AllowQuote,
                HasHeader = hasHeader
            };
            var data = createDataView(context.Data.CreateTextReader(loaderArgs));

            var purposes = PurposeInference.InferPurposes(context, data, label);

            // Group the columns and generate their names.
            var groups = ColumnGroupingInference.InferGroupingAndNames(context, hasHeader, types.Columns, purposes);

            // Pair each generated loader column with its purpose for the result object.
            var columnsWithPurpose = groups
                .Select(group => (group.GenerateTextLoaderColumn(), group.Purpose))
                .ToArray();

            return new ColumnInferenceResult(columnsWithPurpose, split.AllowQuote, split.AllowSparse, split.Separator, hasHeader);
        }

Example #2

Show file

 /// <summary>
 /// Infers columns for the text file at <paramref name="path"/>: builds a sample from the
 /// file and delegates to the sample-based <c>InferColumns</c> overload.
 /// </summary>
 /// <param name="context">ML context forwarded to the inference overload.</param>
 /// <param name="path">File path used both to create the sample and to read the data view.</param>
 /// <param name="label">Label value forwarded to the inference overload.</param>
 /// <param name="hasHeader">Header flag forwarded to the inference overload.</param>
 /// <param name="separator">Separator forwarded to the inference overload.</param>
 /// <returns>The result produced by the sample-based overload.</returns>
 public static ColumnInferenceResult InferColumns(MLContext context, string path, string label,
     bool hasHeader = false, string separator = null)
 {
     var fileSample = TextFileSample.CreateFromFullFile(path);

     // The data view is read from the same path once the loader has been configured.
     Func<TextLoader, IDataView> readFromPath = loader => loader.Read(path);

     return InferColumns(context, fileSample, readFromPath, label, hasHeader, separator);
 }

Example #3

Show file

        /// <summary>
        /// Attempts to split the sample into columns, trying either the given separator or
        /// <c>TextFileContents.DefaultSeparators</c> when none is given.
        /// </summary>
        /// <param name="sample">Text sample to split.</param>
        /// <param name="separator">Separator to try; <c>null</c> means the default candidates are used.</param>
        /// <returns>The successful split result.</returns>
        /// <exception cref="InferenceException">Thrown when the split result does not report success.</exception>
        private static TextFileContents.ColumnSplitResult InferSplit(TextFileSample sample, string separator)
        {
            var candidates = separator != null
                ? new string[] { separator }
                : TextFileContents.DefaultSeparators;

            var split = TextFileContents.TrySplitColumns(sample, candidates);
            if (split.IsSuccess)
            {
                return split;
            }

            throw new InferenceException(InferenceType.ColumnSplit, "Unable to split the file provided into multiple, consistent columns.");
        }

Example #4

Show file

File: ColumnInferenceApi.cs Project: daholste/AutoMLDotNet

        /// <summary>
        /// Infers columns for a multi-stream source by sampling its first stream and delegating
        /// to the sample-based <c>InferColumns</c> overload.
        /// </summary>
        /// <param name="context">ML context forwarded to the inference overload.</param>
        /// <param name="multiStreamSource">Source whose stream at index 0 is sampled and which is read in full for the data view.</param>
        /// <param name="label">Label value forwarded to the inference overload.</param>
        /// <param name="hasHeader">Header flag forwarded to the inference overload.</param>
        /// <param name="separator">Separator forwarded to the inference overload.</param>
        /// <param name="isQuoted">Optional quoting setting forwarded to the inference overload.</param>
        /// <param name="isSparse">Optional sparse setting forwarded to the inference overload.</param>
        /// <returns>The result produced by the sample-based overload.</returns>
        public static ColumnInferenceResult InferColumns(MLContext context, IMultiStreamSource multiStreamSource,
                                                         string label, bool hasHeader, string separator, bool?isQuoted, bool?isSparse)
        {
            // heuristic: use first stream in multi-stream source to infer column types & split
            TextFileSample sample;

            // Dispose the opened stream once the sample has been built so the handle is not leaked.
            // NOTE(review): assumes CreateFromFullStream finishes reading the stream before it
            // returns and the sample keeps no reference to it - confirm against TextFileSample.
            using (var stream = multiStreamSource.Open(0))
            {
                sample = TextFileSample.CreateFromFullStream(stream);
            }

            // The data view itself is read from the whole multi-stream source, not just the sampled stream.
            Func<TextLoader, IDataView> createDataView = (textLoader) =>
            {
                return textLoader.Read(multiStreamSource);
            };

            return InferColumns(context, sample, createDataView, label, hasHeader, separator, isQuoted, isSparse);
        }

Example #5

Show file

File: ColumnInferenceApi.cs Project: daholste/AutoMLDotNet

        /// <summary>
        /// Attempts to split the sample into columns, trying either the given separator or
        /// <c>TextFileContents.DefaultSeparators</c>, then applies any caller-supplied
        /// quoting/sparse settings to the result.
        /// </summary>
        /// <param name="sample">Text sample to split.</param>
        /// <param name="separator">Separator to try; <c>null</c> means the default candidates are used.</param>
        /// <param name="isQuoted">When set, overwrites <c>AllowQuote</c> on the split result.</param>
        /// <param name="isSparse">When set, overwrites <c>AllowSparse</c> on the split result.</param>
        /// <returns>The successful split result, with overrides applied.</returns>
        /// <exception cref="InferenceException">Thrown when the split result does not report success.</exception>
        private static TextFileContents.ColumnSplitResult InferSplit(TextFileSample sample, string separator, bool? isQuoted, bool? isSparse)
        {
            var candidates = separator != null
                ? new string[] { separator }
                : TextFileContents.DefaultSeparators;
            var split = TextFileContents.TrySplitColumns(sample, candidates);

            // Explicit caller settings take precedence over whatever was inferred.
            if (isQuoted.HasValue)
            {
                split.AllowQuote = isQuoted.Value;
            }

            if (isSparse.HasValue)
            {
                split.AllowSparse = isSparse.Value;
            }

            if (split.IsSuccess)
            {
                return split;
            }

            throw new InferenceException(InferenceType.ColumnSplit, "Unable to split the file provided into multiple, consistent columns.");
        }

Example #6

Show file

File: ColumnInferenceApi.cs Project: daholste/AutoMLDotNet

        /// <summary>
        /// Infers the column types of the sample, using the column count, separator and
        /// quoting/sparse settings taken from a prior split inference.
        /// </summary>
        /// <param name="context">ML context forwarded to the type inference call.</param>
        /// <param name="sample">Text sample whose column types are inferred.</param>
        /// <param name="splitInference">Split result supplying the settings for type inference.</param>
        /// <returns>The successful type inference result.</returns>
        /// <exception cref="InferenceException">Thrown when the type inference result does not report success.</exception>
        private static ColumnTypeInference.InferenceResult InferColumnTypes(MLContext context, TextFileSample sample,
                                                                            TextFileContents.ColumnSplitResult splitInference)
        {
            // Carry the split settings over into the type inference arguments.
            var inferenceArgs = new ColumnTypeInference.Arguments
            {
                ColumnCount = splitInference.ColumnCount,
                Separator = splitInference.Separator,
                AllowSparse = splitInference.AllowSparse,
                AllowQuote = splitInference.AllowQuote,
            };

            var inferredTypes = ColumnTypeInference.InferTextFileColumnTypes(context, sample, inferenceArgs);
            if (inferredTypes.IsSuccess)
            {
                return inferredTypes;
            }

            throw new InferenceException(InferenceType.ColumnDataKind, "Unable to infer column types of the file provided.");
        }