Java 使用iText将html转换为pdf

Java 使用iText将html转换为pdf,java,itext,Java,Itext,我想使用iText将带有图像的html文件转换为pdf。我在这里提供我的来源 这是我的HTML文件 <html> <body> <img src='

我想使用iText将带有图像的html文件转换为pdf。我在这里提供我的来源

这是我的HTML文件

 <html>

 <body>
 <img src='' width='62' height='80' style='float: left; margin-right: 28px;' alt="" /> 
<!-- <img src="add.png" alt="" /> -->  
</body>
</html>
我收到以下错误

Exception in thread "main" ExceptionConverter: java.io.IOException: The document has no pages.
at com.itextpdf.text.pdf.PdfPages.writePageTree(PdfPages.java:113)
at com.itextpdf.text.pdf.PdfWriter.close(PdfWriter.java:1243)
at com.itextpdf.text.pdf.PdfDocument.close(PdfDocument.java:849)
at com.itextpdf.text.Document.close(Document.java:416)
at App.main(App.java:64)

请帮助我如何使用itext将带有图像的html文件转换为pdf。如果我没有图像,或者如果我硬编码图像路径,我可以转换html文件。提前感谢

如果您的
pdf
页面中没有内容,则会发生此异常。 试着像这样传递您的
InputStream

String str="<html>

 <body>
 <img src='' width='62' height='80' style='float: left; margin-right: 28px;' alt="" /> 
<!-- <img src="add.png" alt="" /> -->  
</body>
</html>"

InputStream is = new ByteArrayInputStream(str.getBytes());
XMLWorkerHelper.getInstance().parseXHtml(writer, document, is);
String str=”
"
InputStream is=newbytearrayinputstream(str.getBytes());
XMLWorkerHelper.getInstance().parseXHtml(编写器、文档、is);

您需要实现一个自定义图像标记处理器来处理嵌入html中的图像:

package com.example.itext.processor;

import java.util.ArrayList;
import java.util.List;
import java.util.Map;

import com.itextpdf.text.Chunk;
import com.itextpdf.text.Element;
import com.itextpdf.text.Image;
import com.itextpdf.text.log.Level;
import com.itextpdf.text.log.Logger;
import com.itextpdf.text.log.LoggerFactory;
import com.itextpdf.text.pdf.codec.Base64;
import com.itextpdf.tool.xml.NoCustomContextException;
import com.itextpdf.tool.xml.Tag;
import com.itextpdf.tool.xml.WorkerContext;
import com.itextpdf.tool.xml.exceptions.LocaleMessages;
import com.itextpdf.tool.xml.exceptions.RuntimeWorkerException;
import com.itextpdf.tool.xml.html.HTML;
import com.itextpdf.tool.xml.pipeline.html.HtmlPipelineContext;

public class ImageTagProcessor extends com.itextpdf.tool.xml.html.Image {

private final Logger logger = LoggerFactory.getLogger(getClass());

/*
 * (non-Javadoc)
 * 
 * @see com.itextpdf.tool.xml.TagProcessor#endElement(com.itextpdf.tool.xml.Tag, java.util.List, com.itextpdf.text.Document)
 */
@Override
public List<Element> end(final WorkerContext ctx, final Tag tag, final List<Element> currentContent) {
    final Map<String, String> attributes = tag.getAttributes();
    String src = attributes.get(HTML.Attribute.SRC);
    List<Element> elements = new ArrayList<Element>(1);
    if (null != src && src.length() > 0) {
        Image img = null;
        if (src.startsWith("data:image/")) {
            final String base64Data = src.substring(src.indexOf(",") + 1);
            try {
                img = Image.getInstance(Base64.decode(base64Data));
            } catch (Exception e) {
                if (logger.isLogging(Level.ERROR)) {
                    logger.error(String.format(LocaleMessages.getInstance().getMessage(LocaleMessages.HTML_IMG_RETRIEVE_FAIL), src), e);
                }
            }
            if (img != null) {
                try {
                    final HtmlPipelineContext htmlPipelineContext = getHtmlPipelineContext(ctx);
                    elements.add(getCssAppliers().apply(new Chunk((com.itextpdf.text.Image) getCssAppliers().apply(img, tag, htmlPipelineContext), 0, 0, true), tag,
                        htmlPipelineContext));
                } catch (NoCustomContextException e) {
                    throw new RuntimeWorkerException(e);
                }
            }
        }

        if (img == null) {
            elements = super.end(ctx, tag, currentContent);
        }
    }
    return elements;
}
}
package com.example.itext.processor;
导入java.util.ArrayList;
导入java.util.List;
导入java.util.Map;
导入com.itextpdf.text.Chunk;
导入com.itextpdf.text.Element;
导入com.itextpdf.text.Image;
导入com.itextpdf.text.log.Level;
导入com.itextpdf.text.log.Logger;
导入com.itextpdf.text.log.LoggerFactory;
导入com.itextpdf.text.pdf.codec.Base64;
导入com.itextpdf.tool.xml.NoCustomContextException;
导入com.itextpdf.tool.xml.Tag;
导入com.itextpdf.tool.xml.WorkerContext;
导入com.itextpdf.tool.xml.exceptions.LocaleMessages;
导入com.itextpdf.tool.xml.exceptions.RuntimeWorkerException;
导入com.itextpdf.tool.xml.html.html;
导入com.itextpdf.tool.xml.pipeline.html.HtmlPipelineContext;
公共类ImageTagProcessor扩展com.itextpdf.tool.xml.html.Image{
私有最终记录器Logger=LoggerFactory.getLogger(getClass());
/*
*(非Javadoc)
* 
*@请参阅com.itextpdf.tool.xml.TagProcessor#endElement(com.itextpdf.tool.xml.Tag、java.util.List、com.itextpdf.text.Document)
*/
@凌驾
公共列表结束(最终WorkerContext ctx、最终标记标签、最终列表内容){
最终映射属性=tag.getAttributes();
字符串src=attributes.get(HTML.Attribute.src);
列表元素=新的ArrayList(1);
if(null!=src&&src.length()>0){
图像img=null;
if(src.startsWith(“数据:image/”){
最终字符串base64Data=src.substring(src.indexOf(“,”)+1);
试一试{
img=Image.getInstance(Base64.decode(base64Data));
}捕获(例外e){
if(记录器isLogging(级别错误)){
错误(String.format(LocaleMessages.getInstance().getMessage(LocaleMessages.HTML\u IMG\u RETRIEVE\u FAIL),src),e);
}
}
如果(img!=null){
试一试{
最终HtmlPipelineContext HtmlPipelineContext=getHtmlPipelineContext(ctx);
elements.add(getCssAppliers().apply(新块((com.itextpdf.text.Image)getCssAppliers().apply(img,tag,htmlPipelineContext),0,0,true),tag,
htmlPipelineContext);
}捕获(NoCustomContextException e){
抛出新的RuntimeWorkerException(e);
}
}
}
如果(img==null){
elements=super.end(ctx、tag、currentContent);
}
}
返回元素;
}
}
下面的代码片段注册自定义图像标记处理器,并将HTML文档转换为PDF

public static void main(String[] args) {
    convertHtmlToPdf();

}

private static void convertHtmlToPdf() {
    try {
        final OutputStream file = new FileOutputStream(new File("C:\\Test.pdf"));
        final Document document = new Document();
        final PdfWriter writer = PdfWriter.getInstance(document, file);
        document.open();
        final TagProcessorFactory tagProcessorFactory = Tags.getHtmlTagProcessorFactory();
        tagProcessorFactory.removeProcessor(HTML.Tag.IMG);
        tagProcessorFactory.addProcessor(new ImageTagProcessor(), HTML.Tag.IMG);

        final CssFilesImpl cssFiles = new CssFilesImpl();
        cssFiles.add(XMLWorkerHelper.getInstance().getDefaultCSS());
        final StyleAttrCSSResolver cssResolver = new StyleAttrCSSResolver(cssFiles);
        final HtmlPipelineContext hpc = new HtmlPipelineContext(new CssAppliersImpl(new XMLWorkerFontProvider()));
        hpc.setAcceptUnknown(true).autoBookmark(true).setTagFactory(tagProcessorFactory);
        final HtmlPipeline htmlPipeline = new HtmlPipeline(hpc, new PdfWriterPipeline(document, writer));
        final Pipeline<?> pipeline = new CssResolverPipeline(cssResolver, htmlPipeline);
        final XMLWorker worker = new XMLWorker(pipeline, true);
        final Charset charset = Charset.forName("UTF-8");
        final XMLParser xmlParser = new XMLParser(true, worker, charset);
        final InputStream is = new FileInputStream("C:\\test.html");
        xmlParser.parse(is, charset);

        is.close();
        document.close();
        file.close();
    } catch (Exception e) {
        e.printStackTrace();
        // TODO
    }
}
publicstaticvoidmain(字符串[]args){
convertHtmlToPdf();
}
私有静态void convertHtmlToPdf(){
试一试{
最终输出流文件=新文件输出流(新文件(“C:\\Test.pdf”);
最终文件=新文件();
final PdfWriter writer=PdfWriter.getInstance(文档、文件);
document.open();
final TagProcessorFactory TagProcessorFactory=Tags.getHtmlTagProcessorFactory();
tagProcessorFactory.removeProcessor(HTML.Tag.IMG);
tagProcessorFactory.addProcessor(新的ImageTagProcessor(),HTML.Tag.IMG);
final cssfilesiml cssFiles=新的cssfilesiml();
添加(XMLWorkerHelper.getInstance().getDefaultCSS());
最终样式AttrCSSresolver cssResolver=新样式AttrCSSresolver(cssFiles);
final HtmlPipelineContext hpc=新的HtmlPipelineContext(新的CssAppliersImpl(新的XMLWorkerFontProvider());
hpc.setAcceptUnknown(true).autoBookmark(true).setTagFactory(tagProcessorFactory);
最终HtmlPipeline HtmlPipeline=新HtmlPipeline(hpc、新PdfWriterPipeline(文档、编写器));
最终管道=新的cssResolver管道(cssResolver,htmlPipeline);
最终XMLWorker=新XMLWorker(管道,true);
最终字符集Charset=Charset.forName(“UTF-8”);
final XMLParser=new XMLParser(true,worker,charset);
最终输入流为=新文件输入流(“C:\\test.html”);
parse(is,charset);
is.close();
document.close();
file.close();
}捕获(例外e){
e、 printStackTrace();
//待办事项
}
}
public static void main(String[] args) {
    convertHtmlToPdf();

}

private static void convertHtmlToPdf() {
    try {
        final OutputStream file = new FileOutputStream(new File("C:\\Test.pdf"));
        final Document document = new Document();
        final PdfWriter writer = PdfWriter.getInstance(document, file);
        document.open();
        final TagProcessorFactory tagProcessorFactory = Tags.getHtmlTagProcessorFactory();
        tagProcessorFactory.removeProcessor(HTML.Tag.IMG);
        tagProcessorFactory.addProcessor(new ImageTagProcessor(), HTML.Tag.IMG);

        final CssFilesImpl cssFiles = new CssFilesImpl();
        cssFiles.add(XMLWorkerHelper.getInstance().getDefaultCSS());
        final StyleAttrCSSResolver cssResolver = new StyleAttrCSSResolver(cssFiles);
        final HtmlPipelineContext hpc = new HtmlPipelineContext(new CssAppliersImpl(new XMLWorkerFontProvider()));
        hpc.setAcceptUnknown(true).autoBookmark(true).setTagFactory(tagProcessorFactory);
        final HtmlPipeline htmlPipeline = new HtmlPipeline(hpc, new PdfWriterPipeline(document, writer));
        final Pipeline<?> pipeline = new CssResolverPipeline(cssResolver, htmlPipeline);
        final XMLWorker worker = new XMLWorker(pipeline, true);
        final Charset charset = Charset.forName("UTF-8");
        final XMLParser xmlParser = new XMLParser(true, worker, charset);
        final InputStream is = new FileInputStream("C:\\test.html");
        xmlParser.parse(is, charset);

        is.close();
        document.close();
        file.close();
    } catch (Exception e) {
        e.printStackTrace();
        // TODO
    }
}