Add content-order text extractor and a usage example

2025-12-21 19:29:51 +08:00 · 2020-04-19 17:06:34 +01:00
parent f18bc0766a
commit 407ee5ca51
8 changed files with 202 additions and 3 deletions
--- a/examples/Program.cs
+++ b/examples/Program.cs
@@ -17,12 +17,16 @@
            var examples = new Dictionary<int, (string name, Action action)>
            {
                {1,
-                    ("Extract Words with newline detection",
+                    ("Extract Words with newline detection (example with algorithm)",
                    () => OpenDocumentAndExtractWords.Run(Path.Combine(filesDirectory, "Two Page Text Only - from libre office.pdf")))
                },
                {2,
                    ("Extract images",
                    () => ExtractImages.Run(Path.Combine(filesDirectory, "2006_Swedish_Touring_Car_Championship.pdf")))
+                },
+                {3,
+                    ("Extract Text with newlines (using built-in content extractor)",
+                    () => ExtractTextWithNewlines.Run(Path.Combine(filesDirectory, "Two Page Text Only - from libre office.pdf")))
                }
            };