/// <summary>
/// Takes the context's <c>TextSegment</c> pipeline text, converts it with
/// <c>CreateTreeSegments</c>, passes it through one <c>ShowPdf</c> step and three
/// <c>Log</c> steps, stores the result back on the context, and registers the
/// "titles" and "tree" outputs.
/// </summary>
public void Process()
        {
            var segments = _context.GetPipelineText<TextSegment>();

            // Each step consumes the result of the previous one, in the same
            // order as the equivalent fluent chain.
            var treeSegments = segments.ConvertText<CreateTreeSegments, TextSegment>(true);
            var afterTitlesPdf = treeSegments.ShowPdf<ShowTitleSegment>($"{_context.OutputFilePrefix}-titles.pdf");
            var afterTitlesLog = afterTitlesPdf.Log<AnalyzeSegmentTitles>($"{_context.OutputFilePrefix}-analyze-segment-titles.txt");
            var afterFontSizeLog = afterTitlesLog.Log<AnalyzeTreeStructureFontSize2>($"{_context.OutputFilePrefix}-tree-fontsize.txt");
            var resultPipeline = afterFontSizeLog.Log<AnalyzeTreeStructure2>($"{_context.OutputFilePrefix}-tree.txt");

            _context.SetPipelineText<TextSegment>(resultPipeline);

            // Only the titles PDF and the tree log are registered as outputs;
            // the other two log files are not.
            _context.AddOutput("titles", $"{_context.OutputFilePrefix}-titles.pdf");
            _context.AddOutput("tree", $"{_context.OutputFilePrefix}-tree.txt");
        }
示例#2
0
        /// <summary>
        /// Sets the <c>InjectFilename</c> global instance's <c>Filename</c> to the context's
        /// base name, runs the <c>TextSegment</c> pipeline text through the tagged-segment,
        /// <c>Conteudo</c> and <c>Artigo</c> conversions with two <c>LogFiles</c> steps, and
        /// registers the "artigosGN" and "artigosGN4" outputs.
        /// </summary>
        public void Process()
        {
            var pipelineText = _context.GetPipelineText<TextSegment>();

            var filename = _context.CreateGlobalInstance<InjectFilename>();
            filename.Filename = _context.Basename;

            // Build each path template once so the value handed to LogFiles and the
            // value registered with AddOutput cannot drift apart. "{{0}}" leaves a
            // literal "{0}" placeholder in the template.
            // NOTE(review): presumably LogFiles fills "{0}" per generated file - confirm.
            string artigoTemplate = $"{_context.OutputFolder}/{_context.Basename}/artigos/{_context.Basename}-artigo{{0}}.xml";
            string artigoGn4Template = $"{_context.OutputFolder}/{_context.Basename}/artigosGN4/{_context.Basename}-artigo{{0}}.xml";

            // The materialized list itself is not needed here, so it is not stored.
            // NOTE(review): ToList() is kept because it presumably forces the pipeline
            // to execute - confirm before removing.
            pipelineText
                .ConvertText<CreateTaggedSegments, TextTaggedSegment>()
                .ConvertText<TransformConteudo4, Conteudo>()
                .ConvertText<TransformArtigo2, Artigo>()
                .LogFiles<GenerateArtigoTmp>(artigoTemplate)
                .LogFiles<GenerateArtigoGN4>(artigoGn4Template)
                .ToList();

            _context.AddOutput("artigosGN", artigoTemplate);
            _context.AddOutput("artigosGN4", artigoGn4Template);
        }
示例#3
0
        /// <summary>
        /// Runs the <c>InitialCache</c> stage over <c>{InputFilePrefix}.pdf</c> with
        /// <c>{OutputFilePrefix}-stage0-input.pdf</c> as the configured output, then
        /// registers that same path as the "stage0-input" output.
        /// </summary>
        public void Process()
        {
            Pipeline pipeline = _context.GetPipeline();

            // Computed once so the path given to Output() and the one registered
            // with AddOutput() are guaranteed to match.
            string outputPath = $"{_context.OutputFilePrefix}-stage0-input.pdf";

            pipeline.Input($"{_context.InputFilePrefix}.pdf")
                    .Output(outputPath)
                    .StageProcess(InitialCache);

            _context.AddOutput("stage0-input", outputPath);
        }
        /// <summary>
        /// Runs the <c>RetrieveBlocks</c> stage over <c>{InputFilePrefix}.pdf</c> with the
        /// <c>BasicFirstPageStats</c> global attached and
        /// <c>{OutputFilePrefix}-stage3-retrieve.pdf</c> as the configured output, then
        /// registers that same path as the "stage3" output.
        /// </summary>
        public void Process()
        {
            Pipeline pipeline = _context.GetPipeline();

            // Computed once so the path given to Output() and the one registered
            // with AddOutput() are guaranteed to match.
            string outputPath = $"{_context.OutputFilePrefix}-stage3-retrieve.pdf";

            pipeline.Input($"{_context.InputFilePrefix}.pdf")
                    .Output(outputPath)
                    .Global<BasicFirstPageStats>()
                    .StageProcess(RetrieveBlocks);

            _context.AddOutput("stage3", outputPath);
        }
示例#5
0
        /// <summary>
        /// Processes <c>{InputFilePrefix}.pdf</c> twice on the context's pipeline: first with
        /// the <c>FindBlocksets</c> stage and no output configured, then with the
        /// <c>ShowColors</c> stage writing to <c>{OutputFilePrefix}-stage2-blocksets.pdf</c>.
        /// The second file is registered as the "stage2-blocksets" output.
        /// </summary>
        public void Process()
        {
            Pipeline pipeline = _context.GetPipeline();

            // First pass: no Output() is configured for this stage.
            var firstPass = pipeline.Input($"{_context.InputFilePrefix}.pdf");
            firstPass.StageProcess(FindBlocksets);

            // Second pass: same input file, this time with an output PDF.
            var secondPass = pipeline.Input($"{_context.InputFilePrefix}.pdf");
            var secondPassWithOutput = secondPass.Output($"{_context.OutputFilePrefix}-stage2-blocksets.pdf");
            secondPassWithOutput.StageProcess(ShowColors);

            _context.AddOutput("stage2-blocksets", $"{_context.OutputFilePrefix}-stage2-blocksets.pdf");
        }
示例#6
0
        /// <summary>
        /// Takes the context's <c>TextSegment</c> pipeline text, converts it with
        /// <c>CreateTreeSegments</c>, passes it through two <c>Log</c> steps, stores the
        /// result back on the context, and registers the "tree" output.
        /// </summary>
        public void Process()
        {
            var segments = _context.GetPipelineText<TextSegment>();

            var treeSegments = segments.ConvertText<CreateTreeSegments, TextSegment>(true);

            // A MergeTreeSegments conversion used to sit here; it is currently disabled.

            var afterTitlesLog = treeSegments.Log<AnalyzeSegmentTitles>($"{_context.OutputFilePrefix}-analyze-segment-titles.txt");
            var resultPipeline = afterTitlesLog.Log<AnalyzeTreeStructure>($"{_context.OutputFilePrefix}-tree.txt");

            _context.SetPipelineText<TextSegment>(resultPipeline);

            // Only the tree log is registered as an output.
            _context.AddOutput("tree", $"{_context.OutputFilePrefix}-tree.txt");
        }
        /// <summary>
        /// Converts the context's <c>TextSegment</c> pipeline text to a list of
        /// <c>Conteudo</c>, hands that list to <c>TransformArtigo.Create</c>, passes the
        /// result to <c>CreateXML</c> together with the <c>artigos</c> folder and the base
        /// name, and registers the "artigosGN" output.
        /// </summary>
        public void Process()
        {
            var segments = _context.GetPipelineText<TextSegment>();
            var conteudo = segments.ConvertText<TransformConteudo2, Conteudo>().ToList();

            var articleBuilder = new TransformArtigo();
            var artigos = articleBuilder.Create(conteudo);

            articleBuilder.CreateXML(
                artigos,
                $"{_context.OutputFolder}/{_context.Basename}/artigos",
                _context.Basename);

            // "{{0}}" leaves a literal "{0}" placeholder in the registered path.
            _context.AddOutput(
                "artigosGN",
                $"{_context.OutputFolder}/{_context.Basename}/artigos/{_context.Basename}-artigo{{0}}.xml");
        }
        /// <summary>
        /// Reads <c>{InputFilePrefix}.pdf</c> through the context's pipeline, runs the
        /// text-line and structure conversions, passes the result through one
        /// <c>ShowPdf</c> step and two <c>Log</c> steps, stores it on the context as
        /// <c>TextStructure</c> pipeline text, and registers the "show-central" output.
        /// </summary>
        public void Process()
        {
            Pipeline pipeline = _context.GetPipeline();

            // Phase 1: per-page text lines, then the line index conversion.
            var textLines = pipeline.Input($"{_context.InputFilePrefix}.pdf")
                                    .AllPages<CreateTextLines>(GetLines)
                                    .ConvertText<CreateTextLineIndex, TextLine>(true);

            // Phase 2: conversions from text lines to aggregated structures.
            var structures = textLines.ConvertText<PreCreateStructures, TextLine2>()
                                      .ConvertText<CreateStructures3, TextStructure>()
                                      .ConvertText<PreCreateTextSegments, TextStructureAgg>()
                                      .ConvertText<AggregateStructures, TextStructure>(true);

            // Phase 3: PDF and log steps applied to the aggregated structures.
            var result = structures.ShowPdf<ShowStructureCentral>($"{_context.OutputFilePrefix}-show-central.pdf")
                                   .Log<AnalyzeStructures>($"{_context.OutputFilePrefix}-analyze-structures.txt")
                                   .Log<AnalyzeStructuresCentral>($"{_context.OutputFilePrefix}-analyze-structures-central.txt");

            _context.SetPipelineText<TextStructure>(result);

            // Only the PDF is registered as an output; the two log files are not.
            _context.AddOutput("show-central", $"{_context.OutputFilePrefix}-show-central.pdf");
        }