/// <summary>
/// Runs the tree-segment stage: takes the context's <c>TextSegment</c> pipeline,
/// converts it with <c>CreateTreeSegments</c>, chains the titles PDF step and three
/// analysis log steps, stores the resulting pipeline back on the context and
/// registers the "titles" and "tree" outputs.
/// </summary>
public void Process()
{
    var segments = _context.GetPipelineText<TextSegment>();

    // NOTE(review): the meaning of the boolean flag passed to ConvertText is not visible here.
    var treeSegments = segments.ConvertText<CreateTreeSegments, TextSegment>(true);

    // PDF step targeting "<prefix>-titles.pdf".
    var withTitlesPdf = treeSegments
        .ShowPdf<ShowTitleSegment>($"{_context.OutputFilePrefix}-titles.pdf");

    // Analysis log steps; only the last one ("-tree.txt") is registered as an output below.
    var analyzed = withTitlesPdf
        .Log<AnalyzeSegmentTitles>($"{_context.OutputFilePrefix}-analyze-segment-titles.txt")
        .Log<AnalyzeTreeStructureFontSize2>($"{_context.OutputFilePrefix}-tree-fontsize.txt")
        .Log<AnalyzeTreeStructure2>($"{_context.OutputFilePrefix}-tree.txt");

    _context.SetPipelineText<TextSegment>(analyzed);

    _context.AddOutput("titles", $"{_context.OutputFilePrefix}-titles.pdf");
    _context.AddOutput("tree", $"{_context.OutputFilePrefix}-tree.txt");
}
/// <summary>
/// Runs the article-generation stage: sets the <c>InjectFilename</c> global instance's
/// <c>Filename</c> to the context's basename, converts the <c>TextSegment</c> pipeline
/// through tagged segments, <c>Conteudo</c> and <c>Artigo</c>, chains the two
/// <c>LogFiles</c> steps (<c>GenerateArtigoTmp</c> and <c>GenerateArtigoGN4</c>) and
/// registers the "artigosGN" and "artigosGN4" outputs.
/// </summary>
/// <remarks>
/// The path templates keep a literal <c>{0}</c> placeholder (written as <c>{{0}}</c>
/// inside the interpolated strings).
/// NOTE(review): presumably <c>LogFiles</c> fills it with a per-article index — confirm.
/// </remarks>
public void Process()
{
    var pipelineText = _context.GetPipelineText<TextSegment>();

    var filename = _context.CreateGlobalInstance<InjectFilename>();
    filename.Filename = _context.Basename;

    // The materialized list itself is never read, so it is no longer bound to a local.
    // NOTE(review): ToList() is kept because it presumably drives the pipeline
    // (and therefore the LogFiles steps) to completion — confirm before removing.
    pipelineText
        .ConvertText<CreateTaggedSegments, TextTaggedSegment>()
        .ConvertText<TransformConteudo4, Conteudo>()
        .ConvertText<TransformArtigo2, Artigo>()
        .LogFiles<GenerateArtigoTmp>($"{_context.OutputFolder}/{_context.Basename}/artigos/{_context.Basename}-artigo{{0}}.xml")
        .LogFiles<GenerateArtigoGN4>($"{_context.OutputFolder}/{_context.Basename}/artigosGN4/{_context.Basename}-artigo{{0}}.xml")
        .ToList();

    // "artigosGN" points at the artigos/ folder, "artigosGN4" at the artigosGN4/ folder.
    _context.AddOutput("artigosGN", $"{_context.OutputFolder}/{_context.Basename}/artigos/{_context.Basename}-artigo{{0}}.xml");
    _context.AddOutput("artigosGN4", $"{_context.OutputFolder}/{_context.Basename}/artigosGN4/{_context.Basename}-artigo{{0}}.xml");
}
/// <summary>
/// Runs stage 0: feeds "<c>{InputFilePrefix}.pdf</c>" into the context's pipeline,
/// directs the output to "<c>{OutputFilePrefix}-stage0-input.pdf</c>", runs the
/// <c>InitialCache</c> stage process and registers the result as the "stage0-input" output.
/// </summary>
public void Process()
{
    // The previously declared local `basename` was never read and has been removed.
    Pipeline pipeline = _context.GetPipeline();

    pipeline.Input($"{_context.InputFilePrefix}.pdf")
            .Output($"{_context.OutputFilePrefix}-stage0-input.pdf")
            .StageProcess(InitialCache);

    _context.AddOutput("stage0-input", $"{_context.OutputFilePrefix}-stage0-input.pdf");
}
/// <summary>
/// Runs stage 3: feeds "<c>{InputFilePrefix}.pdf</c>" into the context's pipeline,
/// directs the output to "<c>{OutputFilePrefix}-stage3-retrieve.pdf</c>", adds the
/// <c>BasicFirstPageStats</c> global, runs the <c>RetrieveBlocks</c> stage process and
/// registers the result as the "stage3" output.
/// </summary>
public void Process()
{
    // The previously declared local `basename` was never read and has been removed.
    Pipeline pipeline = _context.GetPipeline();

    pipeline.Input($"{_context.InputFilePrefix}.pdf")
            .Output($"{_context.OutputFilePrefix}-stage3-retrieve.pdf")
            .Global<BasicFirstPageStats>()
            .StageProcess(RetrieveBlocks);

    _context.AddOutput("stage3", $"{_context.OutputFilePrefix}-stage3-retrieve.pdf");
}
/// <summary>
/// Runs stage 2 in two passes over "<c>{InputFilePrefix}.pdf</c>": first the
/// <c>FindBlocksets</c> stage process with no output file, then the <c>ShowColors</c>
/// stage process writing to "<c>{OutputFilePrefix}-stage2-blocksets.pdf</c>", which is
/// registered as the "stage2-blocksets" output.
/// </summary>
public void Process()
{
    Pipeline pdfPipeline = _context.GetPipeline();

    // Pass 1: no Output(...) is configured for this pass.
    var blocksetPass = pdfPipeline.Input($"{_context.InputFilePrefix}.pdf");
    blocksetPass.StageProcess(FindBlocksets);

    // Pass 2: same input file, this time with an output PDF.
    var colorPass = pdfPipeline.Input($"{_context.InputFilePrefix}.pdf");
    var colorPassWithOutput = colorPass.Output($"{_context.OutputFilePrefix}-stage2-blocksets.pdf");
    colorPassWithOutput.StageProcess(ShowColors);

    _context.AddOutput("stage2-blocksets", $"{_context.OutputFilePrefix}-stage2-blocksets.pdf");
}
/// <summary>
/// Runs the tree-segment stage: takes the context's <c>TextSegment</c> pipeline,
/// converts it with <c>CreateTreeSegments</c>, chains the segment-title and
/// tree-structure log steps, stores the resulting pipeline back on the context and
/// registers the "tree" output.
/// </summary>
public void Process()
{
    var pipelineText = _context.GetPipelineText<TextSegment>();

    // The disabled MergeTreeSegments step is kept on its own comment line so that the
    // line comment cannot swallow the rest of the chain or the statements after it.
    // NOTE(review): the meaning of the boolean flag passed to ConvertText is not visible here.
    var resultPipeline = pipelineText
        .ConvertText<CreateTreeSegments, TextSegment>(true)
        // Disabled step: .ConvertText<MergeTreeSegments, TextSegment>(true)
        .Log<AnalyzeSegmentTitles>($"{_context.OutputFilePrefix}-analyze-segment-titles.txt")
        .Log<AnalyzeTreeStructure>($"{_context.OutputFilePrefix}-tree.txt");

    _context.SetPipelineText<TextSegment>(resultPipeline);

    _context.AddOutput("tree", $"{_context.OutputFilePrefix}-tree.txt");
}
/// <summary>
/// Runs the article-generation stage: converts the context's <c>TextSegment</c>
/// pipeline to a list of <c>Conteudo</c> via <c>TransformConteudo2</c>, passes that
/// list to <c>TransformArtigo.Create</c>, hands the result to
/// <c>TransformArtigo.CreateXML</c> together with the "artigos" folder under
/// <c>{OutputFolder}/{Basename}</c> and the basename, and registers the "artigosGN" output.
/// </summary>
/// <remarks>
/// The registered output path keeps a literal <c>{0}</c> placeholder (written as
/// <c>{{0}}</c> inside the interpolated string).
/// </remarks>
public void Process()
{
    var segments = _context.GetPipelineText<TextSegment>();

    var contents = segments
        .ConvertText<TransformConteudo2, Conteudo>()
        .ToList();

    var articleBuilder = new TransformArtigo();
    var articles = articleBuilder.Create(contents);

    articleBuilder.CreateXML(
        articles,
        $"{_context.OutputFolder}/{_context.Basename}/artigos",
        _context.Basename);

    _context.AddOutput(
        "artigosGN",
        $"{_context.OutputFolder}/{_context.Basename}/artigos/{_context.Basename}-artigo{{0}}.xml");
}
/// <summary>
/// Runs the structure stage: feeds "<c>{InputFilePrefix}.pdf</c>" into the context's
/// pipeline, creates and indexes text lines, converts them step by step into aggregated
/// <c>TextStructure</c> items, chains the "show-central" PDF step and two analysis log
/// steps, stores the resulting pipeline on the context as the <c>TextStructure</c>
/// pipeline and registers the "show-central" output.
/// </summary>
public void Process()
{
    Pipeline pdfPipeline = _context.GetPipeline();

    // Stage A: text lines from every page, then the line index.
    // NOTE(review): the meaning of the boolean flag passed to ConvertText is not visible here.
    var indexedLines = pdfPipeline
        .Input($"{_context.InputFilePrefix}.pdf")
        .AllPages<CreateTextLines>(GetLines)
        .ConvertText<CreateTextLineIndex, TextLine>(true);

    // Stage B: TextLine -> TextLine2 -> TextStructure -> TextStructureAgg -> TextStructure.
    var aggregatedStructures = indexedLines
        .ConvertText<PreCreateStructures, TextLine2>()
        .ConvertText<CreateStructures3, TextStructure>()
        .ConvertText<PreCreateTextSegments, TextStructureAgg>()
        .ConvertText<AggregateStructures, TextStructure>(true);

    // Stage C: PDF and log steps; only the PDF is registered as an output below.
    var reported = aggregatedStructures
        .ShowPdf<ShowStructureCentral>($"{_context.OutputFilePrefix}-show-central.pdf")
        .Log<AnalyzeStructures>($"{_context.OutputFilePrefix}-analyze-structures.txt")
        .Log<AnalyzeStructuresCentral>($"{_context.OutputFilePrefix}-analyze-structures-central.txt");

    _context.SetPipelineText<TextStructure>(reported);

    _context.AddOutput("show-central", $"{_context.OutputFilePrefix}-show-central.pdf");
}