/// <summary>
/// Starts a structured-streaming job that reads CSV files from
/// <paramref name="streamInputPath"/> and feeds each row to a
/// <see cref="TestForeachWriter"/>. Blocks until the query terminates.
/// </summary>
/// <param name="streamInputPath">Directory monitored for incoming CSV files.</param>
public static void RunSparkStream(string streamInputPath)
{
    var writer = new TestForeachWriter();

    SparkSession spark = SparkSession
        .Builder()
        .AppName("itur")
        .GetOrCreate();

    // All columns are read as strings; parsing happens downstream in the writer.
    var schema = new Microsoft.Spark.Sql.Types.StructType(new[]
    {
        new StructField("IturCode", new Microsoft.Spark.Sql.Types.StringType()),
        new StructField("IturERP", new Microsoft.Spark.Sql.Types.StringType()),
        new StructField("QuantityEdit", new Microsoft.Spark.Sql.Types.StringType()),
        new StructField("PartialQuantity", new Microsoft.Spark.Sql.Types.StringType())
    });

    DataFrame streamDf = spark
        .ReadStream()
        .Schema(schema)
        .Csv(streamInputPath);

    // Micro-batch every 5 seconds; the query handle is kept in s_query so
    // other members of this class can stop/inspect it.
    s_query = streamDf
        .WriteStream()
        .Foreach(writer)
        .Trigger(Trigger.ProcessingTime(5000))
        .Start();

    // Blocks the calling thread for the lifetime of the streaming query.
    s_query.AwaitTermination();
}
/// <summary>
/// Smoke-test endpoint: reads the bundled <c>data/itur.csv</c> with Spark and
/// writes it back out as JSON next to the executing assembly.
/// </summary>
/// <param name="awsSettings">Injected AWS credentials (currently only used by the
/// commented-out S3 write below).</param>
/// <returns>"ok" on success, otherwise the exception message.</returns>
public string SparkTest([FromServices] IAWSSettings awsSettings)
{
    string result = "ok";
    try
    {
        SparkSession spark = SparkSession
            .Builder()
            .AppName("itur")
            .GetOrCreate();
        try
        {
            // All columns are read as strings; no typed parsing is needed here.
            var mySchema = new Microsoft.Spark.Sql.Types.StructType(new[]
            {
                new StructField("IturCode", new Microsoft.Spark.Sql.Types.StringType()),
                new StructField("IturERP", new Microsoft.Spark.Sql.Types.StringType()),
                new StructField("QuantityEdit", new Microsoft.Spark.Sql.Types.StringType()),
                new StructField("PartialQuantity", new Microsoft.Spark.Sql.Types.StringType())
            });

            string assemblyLocation = Path.GetDirectoryName(Assembly.GetExecutingAssembly().Location);
            string iturInputPath = Path.Combine(assemblyLocation, "data", "itur.csv");

            DataFrame df = spark.Read()
                .Format("csv")
                .Schema(mySchema)
                .Option("delimiter", ",")
                .Option("header", true)
                //.Option("dateFormat", "dd/MM/yyyy")
                .Load(iturInputPath);

            // FIX: use "HH" (24-hour clock) instead of "hh" (12-hour, no AM/PM
            // designator) so morning and evening runs cannot produce the same
            // output file name.
            string dt = DateTime.Now.ToString("MMddHHmmss");
            string outputfile = Path.Combine(assemblyLocation, "outputData", $"itur_out{dt}.json");
            df.Write().Json(outputfile);

            //string toPath = $"s3n://{awsSettings.AccessKey}:{awsSettings.SecretKey}@{_bucketName}/{path}";
            //spark.Range(100).Repartition(5).Write().Mode("overwrite").Text(toPath) ;
        }
        finally
        {
            // FIX: previously Stop() was only reached on the success path; now the
            // session is shut down even when the read/write above throws.
            spark.Stop();
        }
    }
    catch (Exception ex)
    {
        // Deliberate best-effort: surface the failure reason to the caller
        // instead of propagating.
        result = ex.Message;
    }
    return result;
}
/// <summary>
/// Entry point for the Vector (grouped-map) UDF example: loads a people JSON
/// file, prints its schema and contents, then applies a grouped-map UDF that
/// counts name characters per age group.
/// </summary>
/// <param name="args">Single element: path to SPARK_HOME/examples/src/main/resources/people.json.</param>
public void Run(string[] args)
{
    // Guard: exactly one argument (the JSON path) is required.
    if (args.Length != 1)
    {
        Console.Error.WriteLine(
            "Usage: Sql.VectorDataFrameUdfs <path to SPARK_HOME/examples/src/main/resources/people.json>");
        Environment.Exit(1);
    }

    SparkSession spark = SparkSession
        .Builder()
        // Lower the shuffle partitions to speed up groupBy() operations.
        .Config("spark.sql.shuffle.partitions", "3")
        .AppName("SQL VectorUdfs example using .NET for Apache Spark")
        .GetOrCreate();

    string peoplePath = args[0];
    DataFrame people = spark.Read().Schema("age INT, name STRING").Json(peoplePath);

    StructType peopleSchema = people.Schema();
    Console.WriteLine(peopleSchema.SimpleString);

    people.Show();
    people.PrintSchema();

    // Grouped Map Vector UDF
    // able to return different shapes and record lengths
    StructType resultSchema = new StructType(new[]
    {
        new StructField("age", new IntegerType()),
        new StructField("nameCharCount", new IntegerType())
    });

    people.GroupBy("age")
        .Apply(resultSchema, batch => CountCharacters(batch))
        .Show();

    spark.Stop();
}