2013-10-15 62 views
11

我想创建使用HTML和动态图像的动态PDF文档。我的代码工作正常标准的HTML和图像的完整路径,但是当我尝试嵌入图像嵌入文档我得到的错误itextsharp.xmlworker可以呈现嵌入图像吗?

异常详细信息的信息:System.IO.IOException:该文件有没有页面。

有没有一种方法可以在没有每个图像的HTTP调用的情况下嵌入图像?我不希望这样,因为我认为这会导致可伸缩性问题,并且图像很敏感。

这里是我的代码,让IOException异常:

public ActionResult MakePdf() 
    { 
     string html = @"<?xml version=""1.0"" encoding=""UTF-8""?> 
      <!DOCTYPE html 
       PUBLIC ""-//W3C//DTD XHTML 1.0 Strict//EN"" 
       ""http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd""> 
      <html xmlns=""http://www.w3.org/1999/xhtml"" xml:lang=""en"" lang=""en""> 
       <head> 
        <title>Minimal XHTML 1.0 Document with W3C DTD</title> 
       </head> 
       <body><img src='' width='62' height='80' style='float: left; margin-right: 28px;' /></body></html>"; 

     var bytes = Encoding.UTF8.GetBytes(html); 

     using (MemoryStream input = new MemoryStream(bytes)) 
     { 
      MemoryStream output = new MemoryStream(); 
      using (Document document = new Document(PageSize.LETTER, 50, 50, 50, 50)) 
      { 
       using (PdfWriter writer = PdfWriter.GetInstance(document, output)) 
       { 
        writer.CloseStream = false; 
        document.Open(); 

        XMLWorkerHelper xmlWorker = XMLWorkerHelper.GetInstance(); 
        xmlWorker.ParseXHtml(writer, document, input, null); 
        document.Close(); 
        output.Position = 0; 

        return new FileStreamResult(output, "application/pdf"); 
       } 
      } 
     } 
    } 

回答

21

我们需要写我们自己的ImageTagProcessor支持基地的加工64张图片:

public class CustomImageTagProcessor : iTextSharp.tool.xml.html.Image 
{ 
    public override IList<IElement> End(IWorkerContext ctx, Tag tag, IList<IElement> currentContent) 
    { 
     IDictionary<string, string> attributes = tag.Attributes; 
     string src; 
     if (!attributes.TryGetValue(HTML.Attribute.SRC, out src)) 
      return new List<IElement>(1); 

     if (string.IsNullOrEmpty(src)) 
      return new List<IElement>(1); 

     if (src.StartsWith("data:image/", StringComparison.InvariantCultureIgnoreCase)) 
     { 
      // data:[<MIME-type>][;charset=<encoding>][;base64],<data> 
      var base64Data = src.Substring(src.IndexOf(",") + 1); 
      var imagedata = Convert.FromBase64String(base64Data); 
      var image = iTextSharp.text.Image.GetInstance(imagedata); 

      var list = new List<IElement>(); 
      var htmlPipelineContext = GetHtmlPipelineContext(ctx); 
      list.Add(GetCssAppliers().Apply(new Chunk((iTextSharp.text.Image)GetCssAppliers().Apply(image, tag, htmlPipelineContext), 0, 0, true), tag, htmlPipelineContext)); 
      return list; 
     } 
     else 
     { 
      return base.End(ctx, tag, currentContent); 
     } 
    } 
} 

然后我们可以注入这个新的处理器进入在HtmlPipelineContext:

 using (var doc = new Document(PageSize.A4)) 
     { 
      var writer = PdfWriter.GetInstance(doc, new FileStream("test.pdf", FileMode.Create)); 
      doc.Open(); 
      var html = @"<img src='' width='62' height='80' style='float: left; margin-right: 28px;' />"; 

      var tagProcessors = (DefaultTagProcessorFactory)Tags.GetHtmlTagProcessorFactory(); 
      tagProcessors.RemoveProcessor(HTML.Tag.IMG); // remove the default processor 
      tagProcessors.AddProcessor(HTML.Tag.IMG, new CustomImageTagProcessor()); // use our new processor 

      CssFilesImpl cssFiles = new CssFilesImpl(); 
      cssFiles.Add(XMLWorkerHelper.GetInstance().GetDefaultCSS()); 
      var cssResolver = new StyleAttrCSSResolver(cssFiles); 
      cssResolver.AddCss(@"code { padding: 2px 4px; }", "utf-8", true); 
      var charset = Encoding.UTF8; 
      var hpc = new HtmlPipelineContext(new CssAppliersImpl(new XMLWorkerFontProvider())); 
      hpc.SetAcceptUnknown(true).AutoBookmark(true).SetTagFactory(tagProcessors); // inject the tagProcessors 
      var htmlPipeline = new HtmlPipeline(hpc, new PdfWriterPipeline(doc, writer)); 
      var pipeline = new CssResolverPipeline(cssResolver, htmlPipeline); 
      var worker = new XMLWorker(pipeline, true); 
      var xmlParser = new XMLParser(true, worker, charset); 
      xmlParser.Parse(new StringReader(html)); 
     } 
     Process.Start("test.pdf"); 
+2

干得好!我试图让一个自定义的'IImageProvider'工作,但从来没有想过尝试一个自定义的'img'标签! –

+1

太棒了!我今天早上阅读了http://demo.itextsupport.com/xmlworker/itextdoc/flatsite.html,但尚未开始实施。感谢您及时的回复! –

+0

Gread示例。但代码工作得很好,但在Acrobat Reader中,第一页不能正确渲染。文字未显示。有没有什么已知的问题呢? – dixus

0
  string originalFile = "Original1.pdf"; 
      string copyOfOriginal = "Re-copia.pdf"; 

      byte[] bytes = Convert.FromBase64String(archivo); 

      System.IO.FileStream stream = new FileStream(originalFile, FileMode.CreateNew); 
      System.IO.BinaryWriter writer = new BinaryWriter(stream); 
      writer.Write(bytes, 0, bytes.Length); 
      writer.Close(); 

      PdfReader reader1 = new PdfReader(originalFile); 
      using (FileStream fs = new FileStream(copyOfOriginal, FileMode.Create, FileAccess.Write, FileShare.None)) 
      // Creating iTextSharp.text.pdf.PdfStamper object to write 
      // Data from iTextSharp.text.pdf.PdfReader object to FileStream object 
      using (PdfStamper stamper = new PdfStamper(reader1, fs)) 
      { 

       int pageCount = reader1.NumberOfPages; 

       // Create New Layer for Watermark 
       PdfLayer layer = new PdfLayer("WatermarkLayer", stamper.Writer); 
       // Loop through each Page 
       for (int i = pageCount; i <= pageCount; i++) 
       { 
        // Getting the Page Size 
        Rectangle rect = reader1.GetPageSize(i); 



        // Get the ContentByte object 
        PdfContentByte cb = stamper.GetUnderContent(i); 

        // Tell the cb that the next commands should be "bound" to this new layer 
        cb.BeginLayer(layer); 
        cb.SetFontAndSize(BaseFont.CreateFont(BaseFont.HELVETICA, BaseFont.CP1252, BaseFont.NOT_EMBEDDED), 50); 

        PdfGState gState = new PdfGState(); 
        cb.SetGState(gState); 


        string codbartest = codBarras; 
        BarcodePDF417 bcpdf417 = new BarcodePDF417(); 
        //Asigna el código de barras en base64 a la propiedad text del objeto.. 
        bcpdf417.Text = ASCIIEncoding.ASCII.GetBytes(codbartest); 
        Image imgpdf417 = bcpdf417.GetImage(); 
        imgpdf417.SetAbsolutePosition(50, 50); 
        imgpdf417.ScalePercent(100); 
        cb.AddImage(imgpdf417); 
        // Close the layer 
        cb.EndLayer(); 
       }[enter image description here][1] 
+0

你的回答完全忽略了这个操作是在html-to-pdf用例中询问这个问题...... – mkl