16

I would like to create dynamic PDF documents using HTML and dynamic images. My code works fine with standard HTML and full paths for the images, but when I try to embed the image inline in the document I get the error

Exception Details: System.IO.IOException: The document has no pages.

Is there a way to embed the images without an HTTP call per image? I don't want that because I think it will cause scalability issues and the images are sensitive.

Here is my code that gives the IOException:

 public ActionResult MakePdf() { string html = @"<?xml version=""1.0"" encoding=""UTF-8""?> <!DOCTYPE html PUBLIC ""-//W3C//DTD XHTML 1.0 Strict//EN"" ""http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd""> <html xmlns=""http://www.w3.org/1999/xhtml"" xml:lang=""en"" lang=""en""> <head> <title>Minimal XHTML 1.0 Document with W3C DTD</title> </head> <body><img src='' width='62' height='80' style='float: left; margin-right: 28px;' /></body></html>"; var bytes = Encoding.UTF8.GetBytes(html); using (MemoryStream input = new MemoryStream(bytes)) { MemoryStream output = new MemoryStream(); using (Document document = new Document(PageSize.LETTER, 50, 50, 50, 50)) { using (PdfWriter writer = PdfWriter.GetInstance(document, output)) { writer.CloseStream = false; document.Open(); XMLWorkerHelper xmlWorker = XMLWorkerHelper.GetInstance(); xmlWorker.ParseXHtml(writer, document, input, null); document.Close(); output.Position = 0; return new FileStreamResult(output, "application/pdf"); } } } } 

2 Answers 2

33

We need to write our own ImageTagProcessor to support processing of base 64 images:

public class CustomImageTagProcessor : iTextSharp.tool.xml.html.Image { public override IList<IElement> End(IWorkerContext ctx, Tag tag, IList<IElement> currentContent) { IDictionary<string, string> attributes = tag.Attributes; string src; if (!attributes.TryGetValue(HTML.Attribute.SRC, out src)) return new List<IElement>(1); if (string.IsNullOrEmpty(src)) return new List<IElement>(1); if (src.StartsWith("data:image/", StringComparison.InvariantCultureIgnoreCase)) { // data:[<MIME-type>][;charset=<encoding>][;base64],<data> var base64Data = src.Substring(src.IndexOf(",") + 1); var imagedata = Convert.FromBase64String(base64Data); var image = iTextSharp.text.Image.GetInstance(imagedata); var list = new List<IElement>(); var htmlPipelineContext = GetHtmlPipelineContext(ctx); list.Add(GetCssAppliers().Apply(new Chunk((iTextSharp.text.Image)GetCssAppliers().Apply(image, tag, htmlPipelineContext), 0, 0, true), tag, htmlPipelineContext)); return list; } else { return base.End(ctx, tag, currentContent); } } } 

Then we can inject this new processor into the HtmlPipelineContext:

 using (var doc = new Document(PageSize.A4)) { var writer = PdfWriter.GetInstance(doc, new FileStream("test.pdf", FileMode.Create)); doc.Open(); var html = @"<img src='' width='62' height='80' style='float: left; margin-right: 28px;' />"; var tagProcessors = (DefaultTagProcessorFactory)Tags.GetHtmlTagProcessorFactory(); tagProcessors.RemoveProcessor(HTML.Tag.IMG); // remove the default processor tagProcessors.AddProcessor(HTML.Tag.IMG, new CustomImageTagProcessor()); // use our new processor CssFilesImpl cssFiles = new CssFilesImpl(); cssFiles.Add(XMLWorkerHelper.GetInstance().GetDefaultCSS()); var cssResolver = new StyleAttrCSSResolver(cssFiles); cssResolver.AddCss(@"code { padding: 2px 4px; }", "utf-8", true); var charset = Encoding.UTF8; var hpc = new HtmlPipelineContext(new CssAppliersImpl(new XMLWorkerFontProvider())); hpc.SetAcceptUnknown(true).AutoBookmark(true).SetTagFactory(tagProcessors); // inject the tagProcessors var htmlPipeline = new HtmlPipeline(hpc, new PdfWriterPipeline(doc, writer)); var pipeline = new CssResolverPipeline(cssResolver, htmlPipeline); var worker = new XMLWorker(pipeline, true); var xmlParser = new XMLParser(true, worker, charset); xmlParser.Parse(new StringReader(html)); } Process.Start("test.pdf"); 
Sign up to request clarification or add additional context in comments.

6 Comments

Nice job! I was trying to get a custom IImageProvider to work but never thought to try a custom img tag!
Awesome! I read about that this morning demo.itextsupport.com/xmlworker/itextdoc/flatsite.html but hadn't started implementation yet. Thanks for the quick response!
Gread example. But the code works great but in Acrobat Reader, the first page is not rendered correctely. Text is not shown. Is there any known issue with this?
How to use this in XMLWorkerHelper.ParseToElementList? I need to add paragraphs in HTML to the PDF.... not to perform a whole HTML to PDF conversion.
it worked if i have one page string but my string is too long so it is showing error: document has no pages. thank you.
|
0
 string originalFile = "Original1.pdf"; string copyOfOriginal = "Re-copia.pdf"; byte[] bytes = Convert.FromBase64String(archivo); System.IO.FileStream stream = new FileStream(originalFile, FileMode.CreateNew); System.IO.BinaryWriter writer = new BinaryWriter(stream); writer.Write(bytes, 0, bytes.Length); writer.Close(); PdfReader reader1 = new PdfReader(originalFile); using (FileStream fs = new FileStream(copyOfOriginal, FileMode.Create, FileAccess.Write, FileShare.None)) // Creating iTextSharp.text.pdf.PdfStamper object to write // Data from iTextSharp.text.pdf.PdfReader object to FileStream object using (PdfStamper stamper = new PdfStamper(reader1, fs)) { int pageCount = reader1.NumberOfPages; // Create New Layer for Watermark PdfLayer layer = new PdfLayer("WatermarkLayer", stamper.Writer); // Loop through each Page for (int i = pageCount; i <= pageCount; i++) { // Getting the Page Size Rectangle rect = reader1.GetPageSize(i); // Get the ContentByte object PdfContentByte cb = stamper.GetUnderContent(i); // Tell the cb that the next commands should be "bound" to this new layer cb.BeginLayer(layer); cb.SetFontAndSize(BaseFont.CreateFont(BaseFont.HELVETICA, BaseFont.CP1252, BaseFont.NOT_EMBEDDED), 50); PdfGState gState = new PdfGState(); cb.SetGState(gState); string codbartest = codBarras; BarcodePDF417 bcpdf417 = new BarcodePDF417(); //Asigna el código de barras en base64 a la propiedad text del objeto.. bcpdf417.Text = ASCIIEncoding.ASCII.GetBytes(codbartest); Image imgpdf417 = bcpdf417.GetImage(); imgpdf417.SetAbsolutePosition(50, 50); imgpdf417.ScalePercent(100); cb.AddImage(imgpdf417); // Close the layer cb.EndLayer(); }[enter image description here][1] 

3 Comments

your answer completely ignores that the op is asking about this in a html-to-pdf use case...
Fue implemetado en web services para ser consumido por html, este es sólo parte del código basado en un ejemplo.
Please use English here.

Start asking to get answers

Find the answer to your question by asking.

Ask question

Explore related questions

See similar questions with these tags.