Search in sources :

Example 6 with PDPageDestination

use of com.tom_roush.pdfbox.pdmodel.interactive.documentnavigation.destination.PDPageDestination in project PdfBox-Android by TomRoush.

the class PDFMergerUtility method appendDocument.

/**
 * append all pages from source to destination.
 *
 * @param destination the document to receive the pages
 * @param source the document originating the new pages
 *
 * @throws IOException If there is an error accessing data from either
 * document.
 */
public void appendDocument(PDDocument destination, PDDocument source) throws IOException {
    if (source.getDocument().isClosed()) {
        throw new IOException("Error: source PDF is closed.");
    }
    if (destination.getDocument().isClosed()) {
        throw new IOException("Error: destination PDF is closed.");
    }
    PDDocumentCatalog destCatalog = destination.getDocumentCatalog();
    PDDocumentCatalog srcCatalog = source.getDocumentCatalog();
    if (isDynamicXfa(srcCatalog.getAcroForm())) {
        throw new IOException("Error: can't merge source document containing dynamic XFA form content.");
    }
    PDDocumentInformation destInfo = destination.getDocumentInformation();
    PDDocumentInformation srcInfo = source.getDocumentInformation();
    mergeInto(srcInfo.getCOSObject(), destInfo.getCOSObject(), Collections.<COSName>emptySet());
    // use the highest version number for the resulting pdf
    float destVersion = destination.getVersion();
    float srcVersion = source.getVersion();
    if (destVersion < srcVersion) {
        destination.setVersion(srcVersion);
    }
    int pageIndexOpenActionDest = -1;
    if (destCatalog.getOpenAction() == null) {
        // PDFBOX-3972: get local dest page index, it must be reassigned after the page cloning
        PDDestinationOrAction openAction = null;
        try {
            openAction = srcCatalog.getOpenAction();
        } catch (IOException ex) {
            // PDFBOX-4223
            Log.e("PdfBox-Android", "Invalid OpenAction ignored", ex);
        }
        PDDestination openActionDestination = null;
        if (openAction instanceof PDActionGoTo) {
            openActionDestination = ((PDActionGoTo) openAction).getDestination();
        } else if (openAction instanceof PDDestination) {
            openActionDestination = (PDDestination) openAction;
        }
        if (openActionDestination instanceof PDPageDestination) {
            PDPage page = ((PDPageDestination) openActionDestination).getPage();
            if (page != null) {
                pageIndexOpenActionDest = srcCatalog.getPages().indexOf(page);
            }
        }
        destCatalog.setOpenAction(openAction);
    }
    PDFCloneUtility cloner = new PDFCloneUtility(destination);
    mergeAcroForm(cloner, destCatalog, srcCatalog);
    COSArray destThreads = (COSArray) destCatalog.getCOSObject().getDictionaryObject(COSName.THREADS);
    COSArray srcThreads = (COSArray) cloner.cloneForNewDocument(destCatalog.getCOSObject().getDictionaryObject(COSName.THREADS));
    if (destThreads == null) {
        destCatalog.getCOSObject().setItem(COSName.THREADS, srcThreads);
    } else {
        destThreads.addAll(srcThreads);
    }
    PDDocumentNameDictionary destNames = destCatalog.getNames();
    PDDocumentNameDictionary srcNames = srcCatalog.getNames();
    if (srcNames != null) {
        if (destNames == null) {
            destCatalog.getCOSObject().setItem(COSName.NAMES, cloner.cloneForNewDocument(srcNames));
        } else {
            cloner.cloneMerge(srcNames, destNames);
        }
    }
    if (destNames != null) {
        // found in 054080.pdf from PDFBOX-4417 and doesn't belong there
        destNames.getCOSObject().removeItem(COSName.ID_TREE);
        Log.w("PdfBox-Android", "Removed /IDTree from /Names dictionary, doesn't belong there");
    }
    PDDocumentNameDestinationDictionary destDests = destCatalog.getDests();
    PDDocumentNameDestinationDictionary srcDests = srcCatalog.getDests();
    if (srcDests != null) {
        if (destDests == null) {
            destCatalog.getCOSObject().setItem(COSName.DESTS, cloner.cloneForNewDocument(srcDests));
        } else {
            cloner.cloneMerge(srcDests, destDests);
        }
    }
    PDDocumentOutline destOutline = destCatalog.getDocumentOutline();
    PDDocumentOutline srcOutline = srcCatalog.getDocumentOutline();
    if (srcOutline != null) {
        if (destOutline == null || destOutline.getFirstChild() == null) {
            PDDocumentOutline cloned = new PDDocumentOutline((COSDictionary) cloner.cloneForNewDocument(srcOutline));
            destCatalog.setDocumentOutline(cloned);
        } else {
            // search last sibling for dest, because /Last entry is sometimes wrong
            PDOutlineItem destLastOutlineItem = destOutline.getFirstChild();
            while (destLastOutlineItem.getNextSibling() != null) {
                destLastOutlineItem = destLastOutlineItem.getNextSibling();
            }
            for (PDOutlineItem item : srcOutline.children()) {
                // get each child, clone its dictionary, remove siblings info,
                // append outline item created from there
                COSDictionary clonedDict = (COSDictionary) cloner.cloneForNewDocument(item);
                clonedDict.removeItem(COSName.PREV);
                clonedDict.removeItem(COSName.NEXT);
                PDOutlineItem clonedItem = new PDOutlineItem(clonedDict);
                destLastOutlineItem.insertSiblingAfter(clonedItem);
                destLastOutlineItem = destLastOutlineItem.getNextSibling();
            }
        }
    }
    PageMode destPageMode = destCatalog.getPageMode();
    PageMode srcPageMode = srcCatalog.getPageMode();
    if (destPageMode == null) {
        destCatalog.setPageMode(srcPageMode);
    }
    COSDictionary destLabels = destCatalog.getCOSObject().getCOSDictionary(COSName.PAGE_LABELS);
    COSDictionary srcLabels = srcCatalog.getCOSObject().getCOSDictionary(COSName.PAGE_LABELS);
    if (srcLabels != null) {
        int destPageCount = destination.getNumberOfPages();
        COSArray destNums;
        if (destLabels == null) {
            destLabels = new COSDictionary();
            destNums = new COSArray();
            destLabels.setItem(COSName.NUMS, destNums);
            destCatalog.getCOSObject().setItem(COSName.PAGE_LABELS, destLabels);
        } else {
            destNums = (COSArray) destLabels.getDictionaryObject(COSName.NUMS);
        }
        COSArray srcNums = (COSArray) srcLabels.getDictionaryObject(COSName.NUMS);
        if (srcNums != null) {
            int startSize = destNums.size();
            for (int i = 0; i < srcNums.size(); i += 2) {
                COSBase base = srcNums.getObject(i);
                if (!(base instanceof COSNumber)) {
                    Log.e("PdfBox-Android", "page labels ignored, index " + i + " should be a number, but is " + base);
                    // remove what we added
                    while (destNums.size() > startSize) {
                        destNums.remove(startSize);
                    }
                    break;
                }
                COSNumber labelIndex = (COSNumber) base;
                long labelIndexValue = labelIndex.intValue();
                destNums.add(COSInteger.get(labelIndexValue + destPageCount));
                destNums.add(cloner.cloneForNewDocument(srcNums.getObject(i + 1)));
            }
        }
    }
    COSStream destMetadata = destCatalog.getCOSObject().getCOSStream(COSName.METADATA);
    COSStream srcMetadata = srcCatalog.getCOSObject().getCOSStream(COSName.METADATA);
    if (destMetadata == null && srcMetadata != null) {
        try {
            PDStream newStream = new PDStream(destination, srcMetadata.createInputStream(), (COSName) null);
            mergeInto(srcMetadata, newStream.getCOSObject(), new HashSet<COSName>(Arrays.asList(COSName.FILTER, COSName.LENGTH)));
            destCatalog.getCOSObject().setItem(COSName.METADATA, newStream);
        } catch (IOException ex) {
            // PDFBOX-4227 cleartext XMP stream with /Flate
            Log.e("PdfBox-Android", "Metadata skipped because it could not be read", ex);
        }
    }
    COSDictionary destOCP = destCatalog.getCOSObject().getCOSDictionary(COSName.OCPROPERTIES);
    COSDictionary srcOCP = srcCatalog.getCOSObject().getCOSDictionary(COSName.OCPROPERTIES);
    if (destOCP == null && srcOCP != null) {
        destCatalog.getCOSObject().setItem(COSName.OCPROPERTIES, cloner.cloneForNewDocument(srcOCP));
    } else if (destOCP != null && srcOCP != null) {
        cloner.cloneMerge(srcOCP, destOCP);
    }
    mergeOutputIntents(cloner, srcCatalog, destCatalog);
    // merge logical structure hierarchy
    boolean mergeStructTree = false;
    int destParentTreeNextKey = -1;
    Map<Integer, COSObjectable> srcNumberTreeAsMap = null;
    Map<Integer, COSObjectable> destNumberTreeAsMap = null;
    PDStructureTreeRoot srcStructTree = srcCatalog.getStructureTreeRoot();
    PDStructureTreeRoot destStructTree = destCatalog.getStructureTreeRoot();
    if (destStructTree == null && srcStructTree != null) {
        // create a dummy structure tree in the destination, so that the source
        // tree is cloned. (We can't just copy the tree reference due to PDFBOX-3999)
        destStructTree = new PDStructureTreeRoot();
        destCatalog.setStructureTreeRoot(destStructTree);
        destStructTree.setParentTree(new PDNumberTreeNode(PDParentTreeValue.class));
        // PDFBOX-4429: remove bogus StructParent(s)
        for (PDPage page : destCatalog.getPages()) {
            page.getCOSObject().removeItem(COSName.STRUCT_PARENTS);
            for (PDAnnotation ann : page.getAnnotations()) {
                ann.getCOSObject().removeItem(COSName.STRUCT_PARENT);
            }
        }
    }
    if (destStructTree != null) {
        PDNumberTreeNode destParentTree = destStructTree.getParentTree();
        destParentTreeNextKey = destStructTree.getParentTreeNextKey();
        if (destParentTree != null) {
            destNumberTreeAsMap = getNumberTreeAsMap(destParentTree);
            if (destParentTreeNextKey < 0) {
                if (destNumberTreeAsMap.isEmpty()) {
                    destParentTreeNextKey = 0;
                } else {
                    destParentTreeNextKey = Collections.max(destNumberTreeAsMap.keySet()) + 1;
                }
            }
            if (destParentTreeNextKey >= 0 && srcStructTree != null) {
                PDNumberTreeNode srcParentTree = srcStructTree.getParentTree();
                if (srcParentTree != null) {
                    srcNumberTreeAsMap = getNumberTreeAsMap(srcParentTree);
                    if (!srcNumberTreeAsMap.isEmpty()) {
                        mergeStructTree = true;
                    }
                }
            }
        }
    }
    Map<COSDictionary, COSDictionary> objMapping = new HashMap<COSDictionary, COSDictionary>();
    int pageIndex = 0;
    for (PDPage page : srcCatalog.getPages()) {
        PDPage newPage = new PDPage((COSDictionary) cloner.cloneForNewDocument(page.getCOSObject()));
        if (!mergeStructTree) {
            // PDFBOX-4429: remove bogus StructParent(s)
            newPage.getCOSObject().removeItem(COSName.STRUCT_PARENTS);
            for (PDAnnotation ann : newPage.getAnnotations()) {
                ann.getCOSObject().removeItem(COSName.STRUCT_PARENT);
            }
        }
        newPage.setCropBox(page.getCropBox());
        newPage.setMediaBox(page.getMediaBox());
        newPage.setRotation(page.getRotation());
        PDResources resources = page.getResources();
        if (resources != null) {
            // this is smart enough to just create references for resources that are used on multiple pages
            newPage.setResources(new PDResources((COSDictionary) cloner.cloneForNewDocument(resources)));
        } else {
            newPage.setResources(new PDResources());
        }
        if (mergeStructTree) {
            // add the value of the destination ParentTreeNextKey to every source element
            // StructParent(s) value so that these don't overlap with the existing values
            updateStructParentEntries(newPage, destParentTreeNextKey);
            objMapping.put(page.getCOSObject(), newPage.getCOSObject());
            List<PDAnnotation> oldAnnots = page.getAnnotations();
            List<PDAnnotation> newAnnots = newPage.getAnnotations();
            for (int i = 0; i < oldAnnots.size(); i++) {
                objMapping.put(oldAnnots.get(i).getCOSObject(), newAnnots.get(i).getCOSObject());
            }
        // TODO update mapping for XObjects
        }
        destination.addPage(newPage);
        if (pageIndex == pageIndexOpenActionDest) {
            // PDFBOX-3972: reassign the page.
            // The openAction is either a PDActionGoTo or a PDPageDestination
            PDDestinationOrAction openAction = destCatalog.getOpenAction();
            PDPageDestination pageDestination;
            if (openAction instanceof PDActionGoTo) {
                pageDestination = (PDPageDestination) ((PDActionGoTo) openAction).getDestination();
            } else {
                pageDestination = (PDPageDestination) openAction;
            }
            pageDestination.setPage(newPage);
        }
        ++pageIndex;
    }
    if (mergeStructTree) {
        updatePageReferences(cloner, srcNumberTreeAsMap, objMapping);
        int maxSrcKey = -1;
        for (Map.Entry<Integer, COSObjectable> entry : srcNumberTreeAsMap.entrySet()) {
            int srcKey = entry.getKey();
            maxSrcKey = Math.max(srcKey, maxSrcKey);
            destNumberTreeAsMap.put(destParentTreeNextKey + srcKey, cloner.cloneForNewDocument(entry.getValue()));
        }
        destParentTreeNextKey += maxSrcKey + 1;
        PDNumberTreeNode newParentTreeNode = new PDNumberTreeNode(PDParentTreeValue.class);
        // Note that all elements are stored flatly. This could become a problem for large files
        // when these are opened in a viewer that uses the tagging information.
        // If this happens, then ​PDNumberTreeNode should be improved with a convenience method that
        // stores the map into a B+Tree, see https://en.wikipedia.org/wiki/B+_tree
        newParentTreeNode.setNumbers(destNumberTreeAsMap);
        destStructTree.setParentTree(newParentTreeNode);
        destStructTree.setParentTreeNextKey(destParentTreeNextKey);
        mergeKEntries(cloner, srcStructTree, destStructTree);
        mergeRoleMap(srcStructTree, destStructTree);
        mergeIDTree(cloner, srcStructTree, destStructTree);
        mergeMarkInfo(destCatalog, srcCatalog);
        mergeLanguage(destCatalog, srcCatalog);
        mergeViewerPreferences(destCatalog, srcCatalog);
    }
}
Also used : COSStream(com.tom_roush.pdfbox.cos.COSStream) PDPage(com.tom_roush.pdfbox.pdmodel.PDPage) HashMap(java.util.HashMap) LinkedHashMap(java.util.LinkedHashMap) PDDestinationOrAction(com.tom_roush.pdfbox.pdmodel.common.PDDestinationOrAction) PDStructureTreeRoot(com.tom_roush.pdfbox.pdmodel.documentinterchange.logicalstructure.PDStructureTreeRoot) PDPageDestination(com.tom_roush.pdfbox.pdmodel.interactive.documentnavigation.destination.PDPageDestination) COSObjectable(com.tom_roush.pdfbox.pdmodel.common.COSObjectable) PDNumberTreeNode(com.tom_roush.pdfbox.pdmodel.common.PDNumberTreeNode) COSArray(com.tom_roush.pdfbox.cos.COSArray) COSName(com.tom_roush.pdfbox.cos.COSName) COSNumber(com.tom_roush.pdfbox.cos.COSNumber) COSBase(com.tom_roush.pdfbox.cos.COSBase) PDDocumentInformation(com.tom_roush.pdfbox.pdmodel.PDDocumentInformation) PDActionGoTo(com.tom_roush.pdfbox.pdmodel.interactive.action.PDActionGoTo) PDDocumentNameDestinationDictionary(com.tom_roush.pdfbox.pdmodel.PDDocumentNameDestinationDictionary) PageMode(com.tom_roush.pdfbox.pdmodel.PageMode) COSDictionary(com.tom_roush.pdfbox.cos.COSDictionary) PDDocumentOutline(com.tom_roush.pdfbox.pdmodel.interactive.documentnavigation.outline.PDDocumentOutline) PDAnnotation(com.tom_roush.pdfbox.pdmodel.interactive.annotation.PDAnnotation) PDParentTreeValue(com.tom_roush.pdfbox.pdmodel.documentinterchange.logicalstructure.PDParentTreeValue) PDResources(com.tom_roush.pdfbox.pdmodel.PDResources) IOException(java.io.IOException) PDDestination(com.tom_roush.pdfbox.pdmodel.interactive.documentnavigation.destination.PDDestination) PDStream(com.tom_roush.pdfbox.pdmodel.common.PDStream) PDDocumentCatalog(com.tom_roush.pdfbox.pdmodel.PDDocumentCatalog) PDDocumentNameDictionary(com.tom_roush.pdfbox.pdmodel.PDDocumentNameDictionary) COSInteger(com.tom_roush.pdfbox.cos.COSInteger) PDOutlineItem(com.tom_roush.pdfbox.pdmodel.interactive.documentnavigation.outline.PDOutlineItem) Map(java.util.Map) HashMap(java.util.HashMap) LinkedHashMap(java.util.LinkedHashMap)

Example 7 with PDPageDestination

use of com.tom_roush.pdfbox.pdmodel.interactive.documentnavigation.destination.PDPageDestination in project PdfBox-Android by TomRoush.

the class PDFMergerUtilityTest method testPDFMergerOpenAction.

/**
 * PDFBOX-3972: Test that OpenAction page destination isn't lost after merge.
 *
 * @throws IOException
 */
@Test
public void testPDFMergerOpenAction() throws IOException {
    PDDocument doc1 = new PDDocument();
    doc1.addPage(new PDPage());
    doc1.addPage(new PDPage());
    doc1.addPage(new PDPage());
    doc1.save(new File(TARGETTESTDIR, "MergerOpenActionTest1.pdf"));
    doc1.close();
    PDDocument doc2 = new PDDocument();
    doc2.addPage(new PDPage());
    doc2.addPage(new PDPage());
    doc2.addPage(new PDPage());
    PDPageDestination dest = new PDPageFitDestination();
    dest.setPage(doc2.getPage(1));
    doc2.getDocumentCatalog().setOpenAction(dest);
    doc2.save(new File(TARGETTESTDIR, "MergerOpenActionTest2.pdf"));
    doc2.close();
    PDFMergerUtility pdfMergerUtility = new PDFMergerUtility();
    pdfMergerUtility.addSource(new File(TARGETTESTDIR, "MergerOpenActionTest1.pdf"));
    pdfMergerUtility.addSource(new File(TARGETTESTDIR, "MergerOpenActionTest2.pdf"));
    pdfMergerUtility.setDestinationFileName(TARGETTESTDIR + "MergerOpenActionTestResult.pdf");
    pdfMergerUtility.mergeDocuments(MemoryUsageSetting.setupMainMemoryOnly());
    PDDocument mergedDoc = PDDocument.load(new File(TARGETTESTDIR, "MergerOpenActionTestResult.pdf"));
    PDDocumentCatalog documentCatalog = mergedDoc.getDocumentCatalog();
    dest = (PDPageDestination) documentCatalog.getOpenAction();
    assertEquals(4, documentCatalog.getPages().indexOf(dest.getPage()));
    mergedDoc.close();
}
Also used : PDPage(com.tom_roush.pdfbox.pdmodel.PDPage) PDDocument(com.tom_roush.pdfbox.pdmodel.PDDocument) PDPageDestination(com.tom_roush.pdfbox.pdmodel.interactive.documentnavigation.destination.PDPageDestination) PDPageFitDestination(com.tom_roush.pdfbox.pdmodel.interactive.documentnavigation.destination.PDPageFitDestination) File(java.io.File) PDDocumentCatalog(com.tom_roush.pdfbox.pdmodel.PDDocumentCatalog) Test(org.junit.Test)

Example 8 with PDPageDestination

use of com.tom_roush.pdfbox.pdmodel.interactive.documentnavigation.destination.PDPageDestination in project PdfBox-Android by TomRoush.

the class PDActionEmbeddedGoTo method setDestination.

/**
 * This will set the destination to jump to.
 *
 * @param d The destination.
 *
 * @throws IllegalArgumentException if the destination is not a page dictionary object.
 */
public void setDestination(PDDestination d) {
    if (d instanceof PDPageDestination) {
        PDPageDestination pageDest = (PDPageDestination) d;
        COSArray destArray = pageDest.getCOSObject();
        if (destArray.size() >= 1) {
            COSBase page = destArray.getObject(0);
            if (!(page instanceof COSDictionary)) {
                throw new IllegalArgumentException("Destination of a GoToE action must be " + "a page dictionary object");
            }
        }
    }
    getCOSObject().setItem(COSName.D, d);
}
Also used : COSArray(com.tom_roush.pdfbox.cos.COSArray) COSDictionary(com.tom_roush.pdfbox.cos.COSDictionary) PDPageDestination(com.tom_roush.pdfbox.pdmodel.interactive.documentnavigation.destination.PDPageDestination) COSBase(com.tom_roush.pdfbox.cos.COSBase)

Aggregations

PDPageDestination (com.tom_roush.pdfbox.pdmodel.interactive.documentnavigation.destination.PDPageDestination)8 COSArray (com.tom_roush.pdfbox.cos.COSArray)3 COSBase (com.tom_roush.pdfbox.cos.COSBase)3 COSDictionary (com.tom_roush.pdfbox.cos.COSDictionary)3 PDPage (com.tom_roush.pdfbox.pdmodel.PDPage)3 PDActionGoTo (com.tom_roush.pdfbox.pdmodel.interactive.action.PDActionGoTo)3 PDDestination (com.tom_roush.pdfbox.pdmodel.interactive.documentnavigation.destination.PDDestination)3 PDDocumentCatalog (com.tom_roush.pdfbox.pdmodel.PDDocumentCatalog)2 PDAction (com.tom_roush.pdfbox.pdmodel.interactive.action.PDAction)2 PDAnnotation (com.tom_roush.pdfbox.pdmodel.interactive.annotation.PDAnnotation)2 IOException (java.io.IOException)2 COSInteger (com.tom_roush.pdfbox.cos.COSInteger)1 COSName (com.tom_roush.pdfbox.cos.COSName)1 COSNumber (com.tom_roush.pdfbox.cos.COSNumber)1 COSStream (com.tom_roush.pdfbox.cos.COSStream)1 PDDocument (com.tom_roush.pdfbox.pdmodel.PDDocument)1 PDDocumentInformation (com.tom_roush.pdfbox.pdmodel.PDDocumentInformation)1 PDDocumentNameDestinationDictionary (com.tom_roush.pdfbox.pdmodel.PDDocumentNameDestinationDictionary)1 PDDocumentNameDictionary (com.tom_roush.pdfbox.pdmodel.PDDocumentNameDictionary)1 PDResources (com.tom_roush.pdfbox.pdmodel.PDResources)1