add content order text extractor and example of use

This commit is contained in:
Eliot Jones
2020-04-19 17:06:34 +01:00
parent f18bc0766a
commit 407ee5ca51
8 changed files with 202 additions and 3 deletions

View File

@@ -0,0 +1,22 @@
namespace UglyToad.Examples
{
using System;
using PdfPig;
using PdfPig.DocumentLayoutAnalysis.TextExtractor;
/// <summary>
/// Example that prints the text of every page of a PDF document to the console,
/// using <see cref="ContentOrderTextExtractor"/> to obtain each page's text.
/// </summary>
internal static class ExtractTextWithNewlines
{
    /// <summary>
    /// Opens the PDF at <paramref name="filePath"/>, walks its pages in the order
    /// returned by <c>GetPages()</c>, and writes the extracted text of each page
    /// to the console with one <c>Console.WriteLine</c> call per page.
    /// </summary>
    /// <param name="filePath">Path handed unchanged to <c>PdfDocument.Open</c>.</param>
    public static void Run(string filePath)
    {
        // The using block disposes the document once every page has been printed
        // (or if an exception escapes the loop).
        using (var pdf = PdfDocument.Open(filePath))
        {
            foreach (var currentPage in pdf.GetPages())
            {
                // NOTE(review): the second argument (true) presumably switches on
                // newline handling in the extractor, going by this class's name;
                // confirm against ContentOrderTextExtractor.GetText.
                Console.WriteLine(ContentOrderTextExtractor.GetText(currentPage, true));
            }
        }
    }
}
}