/*
         * Cloud Functions entry point, this is where we get Storage events and respond to it.
         * In this case, we will collect all Document AI result files (they are placed in the Storage Bucket we specified)
         */
        public Task HandleAsync(CloudEvent cloudEvent, StorageObjectData data, CancellationToken cancellationToken)
        {
            dynamic configuration = ConfigHelper.ReadAppSettings();

            if (cloudEvent.Type == "google.cloud.storage.object.v1.finalized" &&
                data.Id.StartsWith($"{configuration.integration.DocumentAI.gcs}/completed/"))
            {
                var     gen         = "/" + data.Generation;
                var     url         = $"gs://{data.Id.Replace(gen, "")}";
                var     operationId = data.Id.Split('/')[2];
                dynamic result      = DocumentAI.GetOperationStatusAsync(operationId).GetAwaiter().GetResult();

                if (result.State == "SUCCEEDED")
                {
                    foreach (var o in result.Files)
                    {
                        var source = o.InputFile;
                        var sb     = new System.Text.StringBuilder();
                        var p      = $"gs://{configuration.integration.DocumentAI.gcs}/";
                        var fields = new List <KeyValuePair <string, string> >();
                        foreach (var outputPath in o.Output)
                        {
                            var ocrText = StorageAPI.GetDocumentAIResultsAsync(outputPath.Replace(p, "")).GetAwaiter().GetResult();
                            sb.Append(ocrText).Append(Environment.NewLine);
                            //===
                            var items = StorageAPI.GetFormFieldsResultsAsync(outputPath.Replace(p, "")).GetAwaiter().GetResult();
                            fields.AddRange(items);
                            //===
                        }

                        Console.WriteLine(JsonConvert.SerializeObject(fields.ToArray()));
                        string text = sb.ToString();
                        //  Upload CSC
                        string csv = StorageAPI.CreateCSV(fields.ToArray());
                        StorageAPI.UploadAsync($"{DateTime.Now.Ticks}.csv", System.Text.Encoding.UTF8.GetBytes(csv)).GetAwaiter().GetResult();
                        //
                        var     metaDataText = StorageAPI.DownloadAsync(source.Replace("gs://", ""), true).GetAwaiter().GetResult();
                        dynamic metaData     = JObject.Parse(metaDataText);
                        var     itemId       = MD5Hash.Calculate($"{metaData.name}");
                        CloudSearchAPI.IndexSmallMediaFileAsync(itemId,
                                                                $"{metaData.name}",
                                                                new string[] { $"{metaData.name}" },
                                                                $"{metaData.metadata.original_path}",
                                                                "TEXT",
                                                                DateTime.Parse($"{metaData.updated}"),
                                                                DateTime.Parse($"{metaData.timeCreated}"),
                                                                "TEXT",
                                                                DateTime.UtcNow.Ticks.ToString(),
                                                                text).GetAwaiter().GetResult();
                    }
                }
            }
            return(Task.CompletedTask);
        }
Example #2
0
        static void Test()
        {
            dynamic configuration = ConfigHelper.ReadAppSettings();
            dynamic result        = DocumentAI.GetOperationStatusAsync("13566904154644279726").GetAwaiter().GetResult();

            if (result.State == "SUCCEEDED")
            {
                foreach (var o in result.Files)
                {
                    var source = o.InputFile;
                    var sb     = new System.Text.StringBuilder();
                    var p      = $"gs://{configuration.integration.DocumentAI.gcs}/";
                    foreach (var outputPath in o.Output)
                    {
                        var ocrText = StorageAPI.GetDocumentAIResultsAsync(outputPath.Replace(p, "")).GetAwaiter().GetResult();
                        sb.Append(ocrText).Append(Environment.NewLine);
                    }
                    string text = sb.ToString();

                    var     metaDataText = StorageAPI.DownloadAsync(source.Replace("gs://", ""), true).GetAwaiter().GetResult();
                    dynamic metaData     = JObject.Parse(metaDataText);
                    var     itemId       = MD5Hash.Calculate($"{metaData.name}");

                    CloudSearchAPI.IndexSmallMediaFileAsync(itemId,
                                                            $"{metaData.name}",
                                                            new string[] { $"{metaData.name}" },
                                                            $"{metaData.metadata.original_path}",
                                                            "TEXT",
                                                            DateTime.Parse($"{metaData.updated}"),
                                                            DateTime.Parse($"{metaData.timeCreated}"),
                                                            "TEXT",
                                                            DateTime.UtcNow.Ticks.ToString(),
                                                            sb.ToString()).GetAwaiter().GetResult();
                }
            }
        }