使用PDFBOX添加PDAnnotationLink后文件大小翻了一倍

时间:2016-03-23 10:05:48

标签: java pdf pdfbox

我正在研究Java项目,我有以下情况:

  1. 我有一个用apache FOP生成的现有PDF文件。文件里有书签,我可以用下面的代码把它们取出来:

    // Collect the action of every top-level bookmark, keyed by the bookmark title.
    Map<String, PDAction> actionsMap = new HashMap<String, PDAction>();
    PDDocumentOutline bookmarks = doc1.getDocumentCatalog().getDocumentOutline();
    for (PDOutlineItem item = bookmarks.getFirstChild(); item != null; item = item.getNextSibling()) {
       actionsMap.put(item.getTitle(), item.getAction());
    }
    
  2. 我用PDFBOX 2.0.0打开第二个文件(同样由FOP生成),并在文本的特定位置添加3个PDAnnotationLink。该文件只有一页,包含几个图表。然后我把第1点中取得的动作设置到这些链接上:

    // The links are added to the first page of the diagram document.
    PDPage page = (PDPage) diagramDocument.getDocumentCatalog().getPages().get(0);
    // objCoordinates is retrieved from another class with PDFTextStripper
    for (Object rawEntry : objCoordinates.entrySet()) {
      Entry coordinateEntry = (Entry) rawEntry;
      String itemName = (String) coordinateEntry.getKey();

      // Link annotation with a zero-width border.
      PDAnnotationLink link = new PDAnnotationLink();
      PDBorderStyleDictionary noBorder = new PDBorderStyleDictionary();
      noBorder.setWidth(0);
      link.setBorderStyle(noBorder);

      // Reuse the action of the bookmark whose title equals the entry key.
      PDActionGoTo bookmarkAction = (PDActionGoTo) actionsMap.get(itemName);
      link.setAction(bookmarkAction);

      // Build the link rectangle from the coordinate array of this entry.
      final float[] corners = (float[]) coordinateEntry.getValue();
      PDRectangle clickArea = new PDRectangle();
      clickArea.setLowerLeftX(corners[0]);
      clickArea.setLowerLeftY(corners[5]);
      clickArea.setUpperRightX(corners[2]);
      clickArea.setUpperRightY(corners[1]);
      link.setRectangle(clickArea);

      page.getAnnotations().add(link);
    }
    
  3. 保存第二个文件后,链接工作正常,但文件大小翻了一倍。PDF版本是1.6,文件已经使用了FlateDecode过滤器。我试过用在线工具比较PDF文件(初始文件和带链接的结果文件),但结果显示两个文件没有区别。用文本编辑器打开文件时可以看到:原始文件中有1处 /Type /Page,而结果文件中有18处 /Type /Page。我的猜测是PDFBOX添加了一些额外的(重复的?)信息。

    如果有人遇到过这个问题我会很感激。

    谢谢

1 个答案:

答案 0 :(得分:1)

我只是想知道该怎么把功劳归给你,Tilman…… :-) 好的,我已经重写并简化了代码,这样就可以贴在这里了。希望代码足够清楚。

    import java.io.File;
    import java.util.ArrayList;
    import java.util.HashMap;
    import java.util.Iterator;
    import java.util.List;
    import java.util.Map;
    import java.util.Map.Entry;

    import org.apache.pdfbox.pdmodel.PDDocument;
    import org.apache.pdfbox.pdmodel.PDPage;
    import org.apache.pdfbox.pdmodel.common.PDRectangle;
    import org.apache.pdfbox.pdmodel.interactive.action.PDAction;
    import org.apache.pdfbox.pdmodel.interactive.action.PDActionGoTo;
    import org.apache.pdfbox.pdmodel.interactive.annotation.PDAnnotationLink;
    import org.apache.pdfbox.pdmodel.interactive.annotation.PDBorderStyleDictionary;
    import org.apache.pdfbox.pdmodel.interactive.documentnavigation.outline.PDDocumentOutline;
    import org.apache.pdfbox.pdmodel.interactive.documentnavigation.outline.PDOutlineItem;
    import org.apache.pdfbox.text.PDFTextStripper;

    /**
     * @author micky
     *
     * The class merges PDF files
     *  - one file with item details info
     *  - one or more files with items diagrams
     *  
     *   Purpose is to merge diagram files into item details file and create links 
     *   from the items in diagrams to item details
     */
    public class PDFReportHyperlinks {

        /**
         * Appends the first page of each diagram PDF to the item-details report,
         * adds link annotations on the imported pages that reuse the actions of
         * the report's existing top-level bookmarks, adds one bookmark per
         * imported page, and saves the report back to the file it was loaded from.
         *
         * Any exception is printed to standard output; all opened documents are
         * closed before the method returns.
         *
         * @param args not used
         */
        public static void main(String[] args) {

            String reportFileName = "D:/ItemsDetails.pdf";

            // Diagram files, they have single page
            List<String> diagramFiles = new ArrayList<String>();
            diagramFiles.add("D:/Diagram_1.pdf");
            diagramFiles.add("D:/Diagram_2.pdf");
            diagramFiles.add("D:/Diagram_3.pdf");

            PDDocument reportDocument = null;
            // Imported pages still reference objects of their source document, so
            // every source document has to stay open until the report is saved.
            // They are collected here and closed in the finally block.
            List<PDDocument> sourceDocuments = new ArrayList<PDDocument>();
            try {
                reportDocument = PDDocument.load(new File(reportFileName));

                PDDocumentOutline bookmarks = reportDocument.getDocumentCatalog().getDocumentOutline();
                if (bookmarks == null) {
                    throw new IllegalStateException("No bookmarks found in " + reportFileName);
                }
                Map<String, PDAction> actionsMap = collectBookmarkActions(bookmarks);

                for (String diagramName : diagramFiles) {

                    //--<Import diagram>---------------------------------
                    PDDocument sourceDocument = PDDocument.load(new File(diagramName));
                    sourceDocuments.add(sourceDocument);
                    PDPage sourcePage = sourceDocument.getDocumentCatalog().getPages().get(0);
                    PDPage page = reportDocument.importPage(sourcePage);

                    //--<Create links from diagrams to objects>---------------------------------

                    // TextStripper is separate class extending PDFTextStripper
                    // It is searching for items names and returning Map with their coordinates
                    TextStripper stripper = new TextStripper(sourceDocument, newItemNames());
                    Map<String, float[]> objCoordinates = stripper.getObjCoordinates();
                    addLinks(page, objCoordinates, actionsMap);

                    //--<Create bookmarks for new pages (diagrams)>---------------------------------
                    PDOutlineItem menuItem = new PDOutlineItem();
                    menuItem.setTitle(diagramName);
                    menuItem.setDestination(page);
                    bookmarks.addLast(menuItem);
                    menuItem.openNode();
                    bookmarks.openNode();
                }

                reportDocument.save(new File(reportFileName));

                // Alternative: merging the documents with PDFMergerUtility
                // (addSource / setDestinationFileName / mergeDocuments) was
                // not feasible in this case.

                System.out.println("COMPLETED");

            } catch (Exception e) {
                System.out.println(e);
            } finally {
                // Close the sources only now, after the report has been written.
                for (PDDocument sourceDocument : sourceDocuments) {
                    closeQuietly(sourceDocument);
                }
                closeQuietly(reportDocument);
            }
        }

        /** Maps the title of every top-level bookmark to its action (existing GoTo actions). */
        private static Map<String, PDAction> collectBookmarkActions(PDDocumentOutline bookmarks) {
            Map<String, PDAction> actionsMap = new HashMap<String, PDAction>();
            for (PDOutlineItem item = bookmarks.getFirstChild(); item != null; item = item.getNextSibling()) {
                actionsMap.put(item.getTitle(), item.getAction());
            }
            return actionsMap;
        }

        /**
         * Builds a fresh list of the item names to search for in a diagram.
         * The concrete ArrayList type is kept because the TextStripper
         * constructor signature is not visible here.
         */
        private static ArrayList<String> newItemNames() {
            ArrayList<String> itemNames = new ArrayList<String>();
            itemNames.add("Item1_Name");
            itemNames.add("Item2_Name");
            itemNames.add("Item3_Name");
            itemNames.add("Item4_Name");
            itemNames.add("Item5_Name");
            return itemNames;
        }

        /** Adds one borderless link per found item that has a bookmark action of the same title. */
        private static void addLinks(PDPage page, Map<String, float[]> objCoordinates,
                Map<String, PDAction> actionsMap) throws Exception {
            for (Entry<String, float[]> entry : objCoordinates.entrySet()) {
                PDAction action = actionsMap.get(entry.getKey());
                if (action == null) {
                    // No bookmark action for this item: a link without an action
                    // would do nothing, so none is created.
                    continue;
                }

                PDAnnotationLink txtLink = new PDAnnotationLink();
                PDBorderStyleDictionary borderULine = new PDBorderStyleDictionary();
                borderULine.setWidth(0);
                txtLink.setBorderStyle(borderULine);
                txtLink.setAction(action);

                final float[] quads = entry.getValue();
                PDRectangle rect = new PDRectangle();
                rect.setLowerLeftX(quads[0]);
                rect.setLowerLeftY(quads[5]);
                rect.setUpperRightX(quads[2]);
                rect.setUpperRightY(quads[1]);
                txtLink.setRectangle(rect);

                page.getAnnotations().add(txtLink);
            }
        }

        /** Closes the document if it was opened; a failure to close is only reported. */
        private static void closeQuietly(PDDocument document) {
            if (document == null) {
                return;
            }
            try {
                document.close();
            } catch (Exception e) {
                System.out.println(e);
            }
        }
    }