namespace UglyToad.PdfPig.Writer
{
    using Content;
    using Core;
    using Fonts;
    using Graphics.Colors;
    using Graphics.Operations;
    using Graphics.Operations.General;
    using Graphics.Operations.PathConstruction;
    using Graphics.Operations.SpecialGraphicsState;
    using Graphics.Operations.TextObjects;
    using Graphics.Operations.TextPositioning;
    using Graphics.Operations.TextShowing;
    using Graphics.Operations.TextState;
    using Images;
    using System;
    using System.Collections.Generic;
    using System.Diagnostics;
    using System.IO;
    using System.Linq;
    using PdfFonts;
    using Tokens;
    using Graphics.Operations.PathPainting;
    using Images.Png;

    /// <summary>
    /// A builder used to construct a page in a PDF document.
    /// </summary>
    public class PdfPageBuilder
    {
        // The document builder this page belongs to.
        private readonly PdfDocumentBuilder documentBuilder;

        // All page data other than content streams.
        internal readonly Dictionary pageDictionary = new Dictionary();

        // The content streams of the page and the stream new operations are currently appended to.
        internal readonly List contentStreams;
        private IPageContentStream currentStream;

        // Maps fonts added using PdfDocumentBuilder to page font names.
        private readonly Dictionary documentFonts = new Dictionary();
        internal int nextFontId = 1;

        // A sequence number of the ShowText operation used to determine whether letters belong to the same
        // operation or not (letters that belong to different operations have less chance of belonging to the same word).
        private int textSequence;

        // The numeric suffix of the next generated image XObject name ("I1", "I2", ...).
        private int imageKey = 1;

        // The resources dictionary of this page, created on first access.
        internal IReadOnlyDictionary Resources => pageDictionary.GetOrCreateDict(NameToken.Resources);

        /// <summary>
        /// The number of this page, 1-indexed.
        /// </summary>
        public int PageNumber { get; }

        /// <summary>
        /// The current size of the page.
        /// </summary>
        public PdfRectangle PageSize { get; set; }

        /// <summary>
        /// Access to the underlying data structures for advanced use cases.
        /// </summary>
        public IContentStream CurrentStream => currentStream;

        /// <summary>
        /// Access to the content streams which make up this page.
        /// </summary>
        public IReadOnlyList ContentStreams => contentStreams;

        internal PdfPageBuilder(int number, PdfDocumentBuilder documentBuilder)
        {
            this.documentBuilder = documentBuilder ?? throw new ArgumentNullException(nameof(documentBuilder));
            PageNumber = number;

            currentStream = new DefaultContentStream();
            contentStreams = new List() {currentStream};
        }

        internal PdfPageBuilder(int number, PdfDocumentBuilder documentBuilder, IEnumerable copied, Dictionary pageDict)
        {
            this.documentBuilder = documentBuilder ?? throw new ArgumentNullException(nameof(documentBuilder));
            PageNumber = number;
            pageDictionary = pageDict;

            // The copied streams come first, followed by a fresh, writable stream which becomes the current one.
            contentStreams = new List();
            contentStreams.AddRange(copied);
            currentStream = new DefaultContentStream();
            contentStreams.Add(currentStream);
        }

        /// <summary>
        /// Inserts a new content stream directly before the current one and selects it.
        /// </summary>
        public void NewContentStreamBefore()
        {
            // Inserting at the current stream's own index shifts the current stream one slot later,
            // leaving the new stream immediately in front of it.
            var index = Math.Max(contentStreams.IndexOf(currentStream), 0);

            currentStream = new DefaultContentStream();
            contentStreams.Insert(index, currentStream);
        }

        /// <summary>
        /// Inserts a new content stream directly after the current one and selects it.
        /// </summary>
        public void NewContentStreamAfter()
        {
            var index = Math.Min(contentStreams.IndexOf(currentStream) + 1, contentStreams.Count);

            currentStream = new DefaultContentStream();
            contentStreams.Insert(index, currentStream);
        }

        /// <summary>
        /// Selects a content stream from the list by its index.
        /// </summary>
        /// <param name="index">The index of the content stream to be selected.</param>
        /// <exception cref="IndexOutOfRangeException">The index is negative or not less than the number of content streams.</exception>
        public void SelectContentStream(int index)
        {
            if (index < 0 || index >= contentStreams.Count)
            {
                throw new IndexOutOfRangeException(nameof(index));
            }

            currentStream = contentStreams[index];
        }

        /// <summary>
        /// Draws a line on the current page between two points with the specified line width.
        /// </summary>
        /// <param name="from">The first point on the line.</param>
        /// <param name="to">The last point on the line.</param>
        /// <param name="lineWidth">The width of the line in user space units.</param>
        public void DrawLine(PdfPoint from, PdfPoint to, decimal lineWidth = 1)
        {
            if (lineWidth != 1)
            {
                currentStream.Add(new SetLineWidth(lineWidth));
            }

            currentStream.Add(new BeginNewSubpath((decimal)from.X, (decimal)from.Y));
            currentStream.Add(new AppendStraightLineSegment((decimal)to.X, (decimal)to.Y));
            currentStream.Add(StrokePath.Value);

            // Put the line width back to 1 so later drawing is unaffected.
            if (lineWidth != 1)
            {
                currentStream.Add(new SetLineWidth(1));
            }
        }

        /// <summary>
        /// Draws a rectangle on the current page starting at the specified point with the given width, height and line width.
        /// </summary>
        /// <param name="position">The position of the rectangle, for positive width and height this is the bottom-left corner.</param>
        /// <param name="width">The width of the rectangle.</param>
        /// <param name="height">The height of the rectangle.</param>
        /// <param name="lineWidth">The width of the line border of the rectangle.</param>
        /// <param name="fill">Whether to fill with the color set by <see cref="SetTextAndFillColor"/>.</param>
        public void DrawRectangle(PdfPoint position, decimal width, decimal height, decimal lineWidth = 1, bool fill = false)
        {
            if (lineWidth != 1)
            {
                currentStream.Add(new SetLineWidth(lineWidth));
            }

            currentStream.Add(new AppendRectangle((decimal)position.X, (decimal)position.Y, width, height));

            if (fill)
            {
                currentStream.Add(FillPathEvenOddRuleAndStroke.Value);
            }
            else
            {
                currentStream.Add(StrokePath.Value);
            }

            // Put the line width back to 1, matching DrawLine, so later drawing is unaffected.
            if (lineWidth != 1)
            {
                currentStream.Add(new SetLineWidth(1));
            }
        }

        /// <summary>
        /// Sets the stroke color for any following operations to the RGB value. Use <see cref="ResetColor"/> to reset.
        /// </summary>
        /// <param name="r">Red - 0 to 255</param>
        /// <param name="g">Green - 0 to 255</param>
        /// <param name="b">Blue - 0 to 255</param>
        public void SetStrokeColor(byte r, byte g, byte b)
        {
            // The graphics state is pushed first so that ResetColor can pop back to the previous color.
            currentStream.Add(Push.Value);
            currentStream.Add(new SetStrokeColorDeviceRgb(RgbToDecimal(r), RgbToDecimal(g), RgbToDecimal(b)));
        }

        /// <summary>
        /// Sets the stroke color with the exact decimal value between 0 and 1 for any following operations to the RGB value.
        /// Use <see cref="ResetColor"/> to reset.
        /// </summary>
        /// <param name="r">Red - 0 to 1</param>
        /// <param name="g">Green - 0 to 1</param>
        /// <param name="b">Blue - 0 to 1</param>
        internal void SetStrokeColorExact(decimal r, decimal g, decimal b)
        {
            currentStream.Add(Push.Value);
            currentStream.Add(new SetStrokeColorDeviceRgb(
                CheckRgbDecimal(r, nameof(r)),
                CheckRgbDecimal(g, nameof(g)),
                CheckRgbDecimal(b, nameof(b))));
        }

        /// <summary>
        /// Sets the fill and text color for any following operations to the RGB value. Use <see cref="ResetColor"/> to reset.
        /// </summary>
        /// <param name="r">Red - 0 to 255</param>
        /// <param name="g">Green - 0 to 255</param>
        /// <param name="b">Blue - 0 to 255</param>
        public void SetTextAndFillColor(byte r, byte g, byte b)
        {
            currentStream.Add(Push.Value);
            currentStream.Add(new SetNonStrokeColorDeviceRgb(RgbToDecimal(r), RgbToDecimal(g), RgbToDecimal(b)));
        }

        /// <summary>
        /// Restores the stroke, text and fill color by popping the graphics state pushed by the last
        /// set color call, for a single preceding set color call this is the default (black).
        /// </summary>
        public void ResetColor()
        {
            currentStream.Add(Pop.Value);
        }

        /// <summary>
        /// Calculates the size and position of each letter in a given string in the provided font without adding
        /// any operations to the page.
        /// </summary>
        /// <param name="text">The text to measure each letter of.</param>
        /// <param name="fontSize">The size of the font in user space units.</param>
        /// <param name="position">The position of the baseline (lower-left corner) to start drawing the text from.</param>
        /// <param name="font">
        /// A font added to the document using <see cref="PdfDocumentBuilder.AddTrueTypeFont"/>
        /// or another font registration method of the document builder.
        /// </param>
        /// <returns>The letters from the input text with their corresponding size and position.</returns>
        public IReadOnlyList MeasureText(string text, decimal fontSize, PdfPoint position, PdfDocumentBuilder.AddedFont font)
        {
            if (font == null)
            {
                throw new ArgumentNullException(nameof(font));
            }

            if (text == null)
            {
                throw new ArgumentNullException(nameof(text));
            }

            if (!documentBuilder.Fonts.TryGetValue(font.Id, out var fontStore))
            {
                throw new ArgumentException($"No font has been added to the PdfDocumentBuilder with Id: {font.Id}. " +
                                            $"Use {nameof(documentBuilder.AddTrueTypeFont)} to register a font.", nameof(font));
            }

            if (fontSize <= 0)
            {
                throw new ArgumentOutOfRangeException(nameof(fontSize), "Font size must be greater than 0");
            }

            var fontProgram = fontStore.FontProgram;

            var fm = fontProgram.GetFontMatrix();

            var textMatrix = TransformationMatrix.FromValues(1, 0, 0, 1, position.X, position.Y);

            // No font name is registered on the page when only measuring.
            var letters = DrawLetters(null, text, fontProgram, fm, fontSize, textMatrix);

            return letters;
        }

        /// <summary>
        /// Draws the text in the provided font at the specified position and returns the letters which will be drawn.
        /// </summary>
        /// <param name="text">The text to draw to the page.</param>
        /// <param name="fontSize">The size of the font in user space units.</param>
        /// <param name="position">The position of the baseline (lower-left corner) to start drawing the text from.</param>
        /// <param name="font">
        /// A font added to the document using <see cref="PdfDocumentBuilder.AddTrueTypeFont"/>
        /// or another font registration method of the document builder.
        /// </param>
        /// <returns>The letters from the input text with their corresponding size and position.</returns>
        public IReadOnlyList AddText(string text, decimal fontSize, PdfPoint position, PdfDocumentBuilder.AddedFont font)
        {
            if (font == null)
            {
                throw new ArgumentNullException(nameof(font));
            }

            if (text == null)
            {
                throw new ArgumentNullException(nameof(text));
            }

            if (!documentBuilder.Fonts.TryGetValue(font.Id, out var fontStore))
            {
                throw new ArgumentException($"No font has been added to the PdfDocumentBuilder with Id: {font.Id}. " +
                                            $"Use {nameof(documentBuilder.AddTrueTypeFont)} to register a font.", nameof(font));
            }

            if (fontSize <= 0)
            {
                throw new ArgumentOutOfRangeException(nameof(fontSize), "Font size must be greater than 0");
            }

            var fontName = GetAddedFont(font);

            var fontProgram = fontStore.FontProgram;

            var fm = fontProgram.GetFontMatrix();

            var textMatrix = TransformationMatrix.FromValues(1, 0, 0, 1, position.X, position.Y);

            var letters = DrawLetters(fontName, text, fontProgram, fm, fontSize, textMatrix);

            currentStream.Add(BeginText.Value);
            currentStream.Add(new SetFontAndSize(fontName, fontSize));
            currentStream.Add(new MoveToNextLineWithOffset((decimal)position.X, (decimal)position.Y));

            // A new ShowText operation is started at every whitespace character, the whitespace itself
            // becomes the first byte of the following operation.
            var bytesPerShow = new List();
            foreach (var letter in text)
            {
                if (char.IsWhiteSpace(letter))
                {
                    currentStream.Add(new ShowText(bytesPerShow.ToArray()));
                    bytesPerShow.Clear();
                }

                var b = fontProgram.GetValueForCharacter(letter);
                bytesPerShow.Add(b);
            }

            if (bytesPerShow.Count > 0)
            {
                currentStream.Add(new ShowText(bytesPerShow.ToArray()));
            }

            currentStream.Add(EndText.Value);

            return letters;
        }

        // Gets the page-level name for a document font, registering it in the page's font resources
        // under the next unused "F{n}" name the first time the font is used on this page.
        private NameToken GetAddedFont(PdfDocumentBuilder.AddedFont font)
        {
            if (!documentFonts.TryGetValue(font.Id, out NameToken value))
            {
                value = NameToken.Create($"F{nextFontId++}");
                var resources = pageDictionary.GetOrCreateDict(NameToken.Resources);
                var fonts = resources.GetOrCreateDict(NameToken.Font);
                while (fonts.ContainsKey(value))
                {
                    value = NameToken.Create($"F{nextFontId++}");
                }

                documentFonts[font.Id] = value;
                fonts[value] = font.Reference;
            }

            return value;
        }

        /// <summary>
        /// Adds the JPEG image represented by the input bytes at the specified location.
        /// </summary>
        public AddedImage AddJpeg(byte[] fileBytes, PdfRectangle placementRectangle)
        {
            using (var stream = new MemoryStream(fileBytes))
            {
                return AddJpeg(stream, placementRectangle);
            }
        }

        /// <summary>
        /// Adds the JPEG image represented by the input stream at the specified location.
        /// </summary>
        public AddedImage AddJpeg(Stream fileStream, PdfRectangle placementRectangle)
        {
            if (fileStream == null)
            {
                throw new ArgumentNullException(nameof(fileStream));
            }

            // Reading the JPEG information advances the stream, so remember where the image starts
            // in order to copy the complete file afterwards.
            var startFrom = fileStream.Position;
            var info = JpegHandler.GetInformation(fileStream);

            byte[] data;
            using (var memory = new MemoryStream())
            {
                fileStream.Seek(startFrom, SeekOrigin.Begin);
                fileStream.CopyTo(memory);
                data = memory.ToArray();
            }

            var imgDictionary = new Dictionary
            {
                {NameToken.Type, NameToken.Xobject },
                {NameToken.Subtype, NameToken.Image },
                {NameToken.Width, new NumericToken(info.Width) },
                {NameToken.Height, new NumericToken(info.Height) },
                {NameToken.BitsPerComponent, new NumericToken(info.BitsPerComponent)},
                {NameToken.ColorSpace, NameToken.Devicergb},
                {NameToken.Filter, NameToken.DctDecode},
                {NameToken.Length, new NumericToken(data.Length)}
            };

            var reference = documentBuilder.AddImage(new DictionaryToken(imgDictionary), data);

            var key = ReserveImageKey();
            var xObjects = pageDictionary.GetOrCreateDict(NameToken.Resources).GetOrCreateDict(NameToken.Xobject);
            xObjects[key] = reference;

            DrawImageXObject(key, placementRectangle);

            return new AddedImage(reference.Data, info.Width, info.Height);
        }

        /// <summary>
        /// Adds the JPEG image previously added using <see cref="AddJpeg(byte[],PdfRectangle)"/>,
        /// this will share the same image data to prevent duplication.
        /// </summary>
        /// <param name="image">An image previously added to this page or another page.</param>
        /// <param name="placementRectangle">The size and location to draw the image on this page.</param>
        public void AddJpeg(AddedImage image, PdfRectangle placementRectangle) => AddImage(image, placementRectangle);

        /// <summary>
        /// Adds the image previously added using <see cref="AddJpeg(byte[],PdfRectangle)"/>
        /// or <see cref="AddPng(byte[],PdfRectangle)"/> sharing the same image to prevent duplication.
        /// </summary>
        public void AddImage(AddedImage image, PdfRectangle placementRectangle)
        {
            // Validate before reserving a key so a bad argument leaves the page untouched.
            if (image == null)
            {
                throw new ArgumentNullException(nameof(image));
            }

            var key = ReserveImageKey();
            var xObjects = pageDictionary.GetOrCreateDict(NameToken.Resources).GetOrCreateDict(NameToken.Xobject);
            xObjects[key] = new IndirectReferenceToken(image.Reference);

            DrawImageXObject(key, placementRectangle);
        }

        /// <summary>
        /// Adds the PNG image represented by the input bytes at the specified location.
        /// </summary>
        public AddedImage AddPng(byte[] pngBytes, PdfRectangle placementRectangle)
        {
            using (var memoryStream = new MemoryStream(pngBytes))
            {
                return AddPng(memoryStream, placementRectangle);
            }
        }

        /// <summary>
        /// Adds the PNG image represented by the input stream at the specified location.
        /// </summary>
        public AddedImage AddPng(Stream pngStream, PdfRectangle placementRectangle)
        {
            var png = Png.Open(pngStream);

            // The image is stored as raw RGB, one byte per color component, row by row from the top.
            var data = new byte[checked(png.Width * png.Height * 3)];
            var offset = 0;
            for (var rowIndex = 0; rowIndex < png.Height; rowIndex++)
            {
                for (var colIndex = 0; colIndex < png.Width; colIndex++)
                {
                    var pixel = png.GetPixel(colIndex, rowIndex);

                    data[offset++] = pixel.R;
                    data[offset++] = pixel.G;
                    data[offset++] = pixel.B;
                }
            }

            var compressed = DataCompresser.CompressBytes(data);

            var imgDictionary = new Dictionary
            {
                {NameToken.Type, NameToken.Xobject },
                {NameToken.Subtype, NameToken.Image },
                {NameToken.Width, new NumericToken(png.Width) },
                {NameToken.Height, new NumericToken(png.Height) },
                // Every sample written above is exactly one byte, whatever bit depth the PNG header declares.
                {NameToken.BitsPerComponent, new NumericToken(8)},
                {NameToken.ColorSpace, NameToken.Devicergb},
                {NameToken.Filter, NameToken.FlateDecode},
                {NameToken.Length, new NumericToken(compressed.Length)}
            };

            var reference = documentBuilder.AddImage(new DictionaryToken(imgDictionary), compressed);

            var key = ReserveImageKey();
            var xObjects = pageDictionary.GetOrCreateDict(NameToken.Resources).GetOrCreateDict(NameToken.Xobject);
            xObjects[key] = reference;

            DrawImageXObject(key, placementRectangle);

            return new AddedImage(reference.Data, png.Width, png.Height);
        }

        // Returns the next "I{n}" name which is not yet present in the page's XObject resources.
        private NameToken ReserveImageKey()
        {
            var xObjects = pageDictionary.GetOrCreateDict(NameToken.Resources).GetOrCreateDict(NameToken.Xobject);

            var key = NameToken.Create($"I{imageKey++}");

            // XObjects copied from another page may already occupy a generated name.
            while (xObjects.ContainsKey(key))
            {
                key = NameToken.Create($"I{imageKey++}");
            }

            return key;
        }

        // Appends the operations which paint the named XObject into the placement rectangle, wrapped in a
        // push/pop pair so the change to the transformation matrix does not leak into later operations.
        private void DrawImageXObject(NameToken key, PdfRectangle placementRectangle)
        {
            currentStream.Add(Push.Value);

            // This needs to be the placement rectangle: scale by its size and translate to its bottom-left corner.
            currentStream.Add(new ModifyCurrentTransformationMatrix(new[]
            {
                (decimal)placementRectangle.Width, 0,
                0, (decimal)placementRectangle.Height,
                (decimal)placementRectangle.BottomLeft.X, (decimal)placementRectangle.BottomLeft.Y
            }));
            currentStream.Add(new InvokeNamedXObject(key));
            currentStream.Add(Pop.Value);
        }

        /// <summary>
        /// Copy a page from unknown source to this page
        /// </summary>
        /// <param name="srcPage">Page to be copied</param>
        public void CopyFrom(Page srcPage)
        {
            // Validate before a new content stream is created so a bad argument leaves the page untouched.
            if (srcPage == null)
            {
                throw new ArgumentNullException(nameof(srcPage));
            }

            if (currentStream.Operations.Count > 0)
            {
                NewContentStreamAfter();
            }

            var destinationStream = currentStream;

            if (!srcPage.Dictionary.TryGet(NameToken.Resources, srcPage.pdfScanner, out DictionaryToken srcResourceDictionary))
            {
                // If the page doesn't have resources, then we copy the entire content stream, since no operation would collide
                // with the ones already written
                destinationStream.Operations.AddRange(srcPage.Operations);
                return;
            }

            // TODO: How should we handle any other token in the page dictionary (Eg. LastModified, MediaBox, CropBox, BleedBox, TrimBox, ArtBox,
            //      BoxColorInfo, Rotate, Group, Thumb, B, Dur, Trans, Annots, AA, Metadata, PieceInfo, StructParents, ID, PZ, SeparationInfo, Tabs,
            //      TemplateInstantiated, PresSteps, UserUnit, VP)

            var operations = new List(srcPage.Operations);

            // We need to relocate the resources, and we have to make sure that none of the resources collide with
            // the already written operation's resources
            var resources = pageDictionary.GetOrCreateDict(NameToken.Resources);

            foreach (var set in srcResourceDictionary.Data)
            {
                var nameToken = NameToken.Create(set.Key);
                if (nameToken == NameToken.Font || nameToken == NameToken.Xobject)
                {
                    // We have to skip these two because they are merged entry by entry below
                    continue;
                }

                if (!resources.ContainsKey(nameToken))
                {
                    // It means that this type of resources doesn't currently exist in the page, so we can copy it
                    // with no problem
                    resources[nameToken] = documentBuilder.CopyToken(srcPage.pdfScanner, set.Value);
                    continue;
                }

                // TODO: I need to find a test case
                // It would have ExtendedGraphics or colorspaces, etc...
            }

            // Special cases
            // Since we don't directly add fonts to the page's resources, we have to go look at the document's fonts
            if (srcResourceDictionary.TryGet(NameToken.Font, srcPage.pdfScanner, out DictionaryToken fontsDictionary))
            {
                var pageFontsDictionary = resources.GetOrCreateDict(NameToken.Font);

                // Replacement names must avoid every source name too, otherwise a later source font sharing the
                // replacement name would cause the already renamed operations to be renamed a second time.
                var sourceFontNames = new HashSet<string>(fontsDictionary.Data.Select(pair => pair.Key));

                foreach (var fontSet in fontsDictionary.Data)
                {
                    if (!(fontSet.Value is IndirectReferenceToken fontReferenceToken))
                    {
                        throw new PdfDocumentFormatException($"Expected a IndirectReferenceToken for the font, got a {fontSet.Value.GetType().Name}");
                    }

                    var fontName = NameToken.Create(fontSet.Key);
                    if (pageFontsDictionary.ContainsKey(fontName))
                    {
                        // This would mean that the imported font collides with one of the added fonts, so we have to rename it
                        string candidate;
                        do
                        {
                            candidate = $"F{nextFontId++}";
                        }
                        while (sourceFontNames.Contains(candidate) || pageFontsDictionary.ContainsKey(NameToken.Create(candidate)));

                        var newName = NameToken.Create(candidate);
                        var oldName = fontName;

                        // Set all the pertinent SetFontAndSize operations with the new name
                        operations = operations.Select(op =>
                        {
                            if (!(op is SetFontAndSize fontAndSizeOperation))
                            {
                                return op;
                            }

                            if (fontAndSizeOperation.Font.Data == oldName)
                            {
                                return new SetFontAndSize(newName, fontAndSizeOperation.Size);
                            }

                            return op;
                        }).ToList();

                        fontName = newName;
                    }

                    pageFontsDictionary.Add(fontName, documentBuilder.CopyToken(srcPage.pdfScanner, fontReferenceToken));
                }
            }

            // Since we don't directly add xobjects to the page's resources, we have to go look at the document's xobjects
            if (srcResourceDictionary.TryGet(NameToken.Xobject, srcPage.pdfScanner, out DictionaryToken xobjectsDictionary))
            {
                var pageXobjectsDictionary = resources.GetOrCreateDict(NameToken.Xobject);

                // Every name the image counter has passed so far, whether or not it is still in the dictionary.
                var generatedImageNames = new HashSet<string>(Enumerable.Range(0, imageKey).Select(i => $"I{i}"));

                // As for fonts, replacement names must not clash with any name used by the source page.
                var sourceXobjectNames = new HashSet<string>(xobjectsDictionary.Data.Select(pair => pair.Key));

                foreach (var xobjectSet in xobjectsDictionary.Data)
                {
                    if (!(xobjectSet.Value is IndirectReferenceToken xobjectReferenceToken))
                    {
                        throw new PdfDocumentFormatException($"Expected a IndirectReferenceToken for the XObject, got a {xobjectSet.Value.GetType().Name}");
                    }

                    var xobjectName = xobjectSet.Key;
                    if (generatedImageNames.Contains(xobjectName) || pageXobjectsDictionary.ContainsKey(xobjectName))
                    {
                        // This would mean that the imported xobject collides with an image or xobject
                        // already on the page, so we have to rename it
                        string newName;
                        do
                        {
                            newName = $"I{imageKey++}";
                        }
                        while (sourceXobjectNames.Contains(newName) || pageXobjectsDictionary.ContainsKey(newName));

                        var oldName = xobjectName;

                        // Set all the pertinent InvokeNamedXObject operations with the new name
                        operations = operations.Select(op =>
                        {
                            if (!(op is InvokeNamedXObject invokeNamedOperation))
                            {
                                return op;
                            }

                            if (invokeNamedOperation.Name.Data == oldName)
                            {
                                return new InvokeNamedXObject(NameToken.Create(newName));
                            }

                            return op;
                        }).ToList();

                        xobjectName = newName;
                    }

                    pageXobjectsDictionary[xobjectName] = documentBuilder.CopyToken(srcPage.pdfScanner, xobjectReferenceToken);
                }
            }

            destinationStream.Operations.AddRange(operations);
        }

        // Lays out each character of the text from the position given by the text matrix, advancing by the
        // width of each character, and returns the resulting letters. Nothing is written to the content stream.
        private List DrawLetters(NameToken name, string text, IWritingFont font, TransformationMatrix fontMatrix, decimal fontSize, TransformationMatrix textMatrix)
        {
            var horizontalScaling = 1;
            var rise = 0;
            var letters = new List();

            var renderingMatrix =
                TransformationMatrix.FromValues((double)fontSize * horizontalScaling, 0, 0, (double)fontSize, 0, rise);

            var width = 0.0;

            // All letters produced by one call share a sequence number.
            textSequence++;

            for (var i = 0; i < text.Length; i++)
            {
                var c = text[i];

                if (!font.TryGetBoundingBox(c, out var rect))
                {
                    throw new InvalidOperationException($"The font does not contain a character: {c}.");
                }

                if (!font.TryGetAdvanceWidth(c, out var charWidth))
                {
                    throw new InvalidOperationException($"The font does not contain a character: {c}.");
                }

                // The advance rectangle has zero height, only its start and end points on the baseline are used.
                var advanceRect = new PdfRectangle(0, 0, charWidth, 0);
                advanceRect = textMatrix.Transform(renderingMatrix.Transform(fontMatrix.Transform(advanceRect)));

                var documentSpace = textMatrix.Transform(renderingMatrix.Transform(fontMatrix.Transform(rect)));

                var letter = new Letter(c.ToString(), documentSpace, advanceRect.BottomLeft, advanceRect.BottomRight, width, (double)fontSize, FontDetails.GetDefault(name),
                    GrayColor.Black,
                    (double)fontSize,
                    textSequence);

                letters.Add(letter);

                var tx = advanceRect.Width * horizontalScaling;
                var ty = 0;

                var translate = TransformationMatrix.GetTranslationMatrix(tx, ty);

                width += tx;

                // Move the text matrix along by the advance so the next character starts where this one ends.
                textMatrix = translate.Multiply(textMatrix);
            }

            return letters;
        }

        // Converts a 0 - 255 color component to the 0 - 1 range, rounded to 4 decimal places.
        private static decimal RgbToDecimal(byte value)
        {
            var res = Math.Max(0, value / (decimal)byte.MaxValue);
            res = Math.Round(Math.Min(1, res), 4);

            return res;
        }

        // Returns the value unchanged if it lies in the 0 - 1 range, otherwise throws naming the offending argument.
        private static decimal CheckRgbDecimal(decimal value, string argument)
        {
            if (value < 0)
            {
                throw new ArgumentOutOfRangeException(argument, $"Provided decimal for RGB color was less than zero: {value}.");
            }

            if (value > 1)
            {
                throw new ArgumentOutOfRangeException(argument, $"Provided decimal for RGB color was greater than one: {value}.");
            }

            return value;
        }

        /// <summary>
        /// Provides access to the raw page data structures for advanced editing use cases.
        /// </summary>
        public interface IContentStream
        {
            /// <summary>
            /// The operations making up the page content stream.
            /// </summary>
            List Operations { get; }
        }

        // A content stream of a page which can be written to the output document.
        internal interface IPageContentStream : IContentStream
        {
            bool ReadOnly { get; }

            bool HasContent { get; }

            void Add(IGraphicsStateOperation operation);

            IndirectReferenceToken Write(IPdfStreamWriter writer);
        }

        // A writable content stream backed by an in-memory list of operations.
        internal class DefaultContentStream : IPageContentStream
        {
            private readonly List operations;

            public DefaultContentStream() : this(new List())
            {
            }

            public DefaultContentStream(List operations)
            {
                this.operations = operations;
            }

            public bool ReadOnly => false;

            public bool HasContent => operations.Count > 0;

            public void Add(IGraphicsStateOperation operation)
            {
                operations.Add(operation);
            }

            public List Operations => operations;

            // Serializes every operation, compresses the result and writes it as a stream token.
            public IndirectReferenceToken Write(IPdfStreamWriter writer)
            {
                using (var memoryStream = new MemoryStream())
                {
                    foreach (var operation in operations)
                    {
                        operation.Write(memoryStream);
                    }

                    var bytes = memoryStream.ToArray();

                    var stream = DataCompresser.CompressToStream(bytes);

                    return writer.WriteToken(stream);
                }
            }
        }

        // A read-only content stream which refers to an already existing stream object by reference.
        internal class CopiedContentStream : IPageContentStream
        {
            private readonly IndirectReferenceToken token;

            public bool ReadOnly => true;

            public bool HasContent => true;

            public CopiedContentStream(IndirectReferenceToken indirectReferenceToken)
            {
                token = indirectReferenceToken;
            }

            // Nothing is written, the stored reference is returned as is.
            public IndirectReferenceToken Write(IPdfStreamWriter writer)
            {
                return token;
            }

            public void Add(IGraphicsStateOperation operation)
            {
                throw new NotSupportedException("Writing to a copied content stream is not supported.");
            }

            public List Operations =>
                throw new NotSupportedException("Reading raw operations is not supported from a copied content stream.");
        }

        /// <summary>
        /// A key representing an image available to use for the current document builder.
        /// Create it by adding an image to a page using <see cref="AddJpeg(byte[],PdfRectangle)"/>.
        /// </summary>
        public class AddedImage
        {
            /// <summary>
            /// The Id uniquely identifying this image on the builder.
            /// </summary>
            internal Guid Id { get; }

            /// <summary>
            /// The reference to the stored image XObject.
            /// </summary>
            internal IndirectReference Reference { get; }

            /// <summary>
            /// The width of the raw image in pixels.
            /// </summary>
            public int Width { get; }

            /// <summary>
            /// The height of the raw image in pixels.
            /// </summary>
            public int Height { get; }

            /// <summary>
            /// Create a new <see cref="AddedImage"/>.
            /// </summary>
            internal AddedImage(IndirectReference reference, int width, int height)
            {
                Id = Guid.NewGuid();
                Reference = reference;
                Width = width;
                Height = height;
            }
        }
    }
}