PDF转图片,拼接图片

一、导入PDF处理的包

  阿里云仓库搜索icepdf-core依赖,找到合适的版本,导入pom.xml文件。

<dependency>
        <groupId>org.icepdf.os</groupId>
        <artifactId>icepdf-core</artifactId>
        <version>6.1.2</version>
</dependency>

二、PDF转图片存储

  1、读取目标PDF文件;

  2、创建Document对象,通过getNumberOfPages方法获取PDF页数;

  3、循环创建BufferedImage对象,读取每页PDF,并以图片流的方式输出,将图片写入指定路径。

import org.icepdf.core.pobjects.Document;
import org.icepdf.core.pobjects.Page;
import org.icepdf.core.util.GraphicsRenderingHints;

import javax.imageio.ImageIO;
import java.awt.image.BufferedImage;
import java.io.File;
import java.io.IOException;
import java.util.ArrayList;
import java.util.Date;
import java.util.List;

public class PDFToImageUtil {

    /*获取pdf文件名*/
    public String getPDFName(String filePath){
        File fileOrigin = new File(filePath);
        String fileName = fileOrigin.getName();
        fileName = fileName.substring(0,fileName.lastIndexOf("."));
        return fileName;
    }
    /*pdf转图片*/
    public List<String> Pdf2Img(String filePath,String imagePath) throws Exception {
        String fileName = getPDFName(filePath);
        File dir = new File(imagePath);
        if(!dir.exists()){
            boolean b = dir.mkdir();
            if(!b){
                return null;
            }
        }
        Document document = new Document();
        document.setFile(filePath);
        float scale = 2.5f;//缩放比例
        float rotation = 0f;//旋转角度
        List<String> filePaths = new ArrayList<String>();
        for(int i = 0; i<document.getNumberOfPages();i++){
            BufferedImage bufferedImage = (BufferedImage) document.getPageImage(i, GraphicsRenderingHints.SCREEN, Page.BOUNDARY_CROPBOX,rotation,scale);
            try {
                File file = new File(imagePath+"/"+fileName+new Date().getTime() +".png");
                filePaths.add(file.getPath());
                ImageIO.write(bufferedImage,"png",file);
            }catch (IOException e){
                e.printStackTrace();
            }
            bufferedImage.flush();
        }
        document.dispose();
        return  filePaths;
    }
}

  4、生成图片后,方法会将图片的全路径存入List并返回。

三、拼接图片

  1、获取所有图片路径,循环遍历图片,用BufferedImage对象存储;

  2、获取每张图片的RGB,用数组存储;

  3、以每张图片的左上角为起始坐标,根据纵向坐标不断累加的原理,将RGB拼接;

  4、循环完成后,对最终拼接完成的BufferedImage对象写入指定位置生成拼接后的图片。

import java.awt.image.BufferedImage;
import java.io.File;
import java.io.IOException;
import java.util.List;

import javax.imageio.ImageIO;


public class PDFToMergeImageUtil {
    public String Pdf2MergeImg(String filePath,String imagePath) throws Exception {
        PDFToImageUtil pdfToImageUtil = new PDFToImageUtil();
        List<String> filePaths = pdfToImageUtil.Pdf2Img(filePath, imagePath);
        String fileName = pdfToImageUtil.getPDFName(filePath);
        BufferedImage destImage = null;
        for(int i =0 ; i < filePaths.size() - 1;i++){
            BufferedImage img1 = null;
            BufferedImage img2 = null;
            if(i == 0){
                img1 = getBufferedImage(filePaths.get(i));
                img2 = getBufferedImage(filePaths.get(i+1));
            }else{
                img1 = destImage;
                img2 = getBufferedImage(filePaths.get(i+1));
            }

            // 从图片中读取RGB
            int[] imageArrayOne = new int[img1.getWidth() * img1.getHeight()];
            imageArrayOne = img1.getRGB(0, 0, img1.getWidth(), img1.getHeight(), imageArrayOne, 0, img1.getWidth()); // 逐行扫描图像中各个像素的RGB到数组中
            int[] imageArrayTwo = new int[img2.getWidth() * img2.getHeight()];
            imageArrayTwo = img2.getRGB(0, 0, img2.getWidth(), img2.getHeight(), imageArrayTwo, 0, img2.getWidth());
            destImage = new BufferedImage(img1.getWidth(), img1.getHeight()+img2.getHeight(), BufferedImage.TYPE_INT_RGB);
            destImage.setRGB(0, 0, img1.getWidth(), img1.getHeight(), imageArrayOne, 0, img1.getWidth()); // 设置上半部分或左半部分的RGB
            destImage.setRGB(0, img1.getHeight(), img2.getWidth(), img2.getHeight(), imageArrayTwo, 0, img2.getWidth()); // 设置下半部分的RGB
        }
        File fileAll = new File(imagePath+"/"+fileName+".jpg");
        ImageIO.write(destImage,"png",fileAll);
        destImage.flush();
        return  fileAll.getPath();
    }
    /**
     * @param fileUrl
     *            文件绝对路径或相对路径
     * @return 读取到的缓存图像
     * @throws IOException
     *             路径错误或者不存在该文件时抛出IO异常
     */
    private BufferedImage getBufferedImage(String fileUrl)
            throws IOException {
        File f = new File(fileUrl);
        return ImageIO.read(f);
    }
}

四、测试

import org.jeecg.business.utils.PDFToMergeImageUtil;
import org.junit.Test;
import org.junit.runner.RunWith;
import org.springframework.beans.factory.annotation.Value;
import org.springframework.boot.test.context.SpringBootTest;
import org.springframework.test.context.junit4.SpringRunner;
import java.io.IOException;
import java.util.List;

@RunWith(SpringRunner.class)
@SpringBootTest(webEnvironment = SpringBootTest.WebEnvironment.RANDOM_PORT)
public class Pdf2Image {

    @Value(value = "${path.imagePath}")
    private String imagePath;
    @Test
    public void test1() throws Exception {
        PDFToMergeImageUtil pdf = new PDFToMergeImageUtil();
        String listImg = pdf.Pdf2MergeImg("D://java//maven.pdf",imagePath);
        System.out.println(listImg);
    }
}

五、总结

  总的来说就是通过BufferedImage的读写及RGB渲染实现,如果PDF文件的页数较多时,可能会出现堆内存不够的情况。

上一篇:javaCV 视频处理技术 ->提取人像视频 | 百度AI


下一篇:java poi 填充word(合并单元格,添加图片,设置字号)