blob: ec2517c580b33bd7a3d0deec550b4e3077b60628 [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.pdfbox.pdmodel;
import java.io.ByteArrayInputStream;
import java.io.IOException;
import java.io.InputStream;
import java.io.SequenceInputStream;
import java.util.ArrayList;
import java.util.Collections;
import java.util.Iterator;
import java.util.List;
import org.apache.commons.logging.Log;
import org.apache.commons.logging.LogFactory;
import org.apache.pdfbox.contentstream.PDContentStream;
import org.apache.pdfbox.cos.COSArray;
import org.apache.pdfbox.cos.COSBase;
import org.apache.pdfbox.cos.COSDictionary;
import org.apache.pdfbox.cos.COSFloat;
import org.apache.pdfbox.cos.COSName;
import org.apache.pdfbox.cos.COSNumber;
import org.apache.pdfbox.cos.COSStream;
import org.apache.pdfbox.io.RandomAccessRead;
import org.apache.pdfbox.io.RandomAccessReadBuffer;
import org.apache.pdfbox.io.SequenceRandomAccessRead;
import org.apache.pdfbox.pdmodel.common.COSArrayList;
import org.apache.pdfbox.pdmodel.common.COSObjectable;
import org.apache.pdfbox.pdmodel.common.PDMetadata;
import org.apache.pdfbox.pdmodel.common.PDRectangle;
import org.apache.pdfbox.pdmodel.common.PDStream;
import org.apache.pdfbox.pdmodel.interactive.action.PDPageAdditionalActions;
import org.apache.pdfbox.pdmodel.interactive.annotation.AnnotationFilter;
import org.apache.pdfbox.pdmodel.interactive.annotation.PDAnnotation;
import org.apache.pdfbox.pdmodel.interactive.measurement.PDViewportDictionary;
import org.apache.pdfbox.pdmodel.interactive.pagenavigation.PDThreadBead;
import org.apache.pdfbox.pdmodel.interactive.pagenavigation.PDTransition;
import org.apache.pdfbox.util.Matrix;
/**
* A page in a PDF document.
*
* @author Ben Litchfield
*/
public class PDPage implements COSObjectable, PDContentStream
{
/**
* Log instance
*/
private static final Log LOG = LogFactory.getLog(PDPage.class);
private final COSDictionary page;
private PDResources pageResources;
private ResourceCache resourceCache;
private PDRectangle mediaBox;
/**
* Creates a new PDPage instance for embedding, with a size of U.S. Letter (8.5 x 11 inches).
*/
public PDPage()
{
this(PDRectangle.LETTER);
}
/**
* Creates a new instance of PDPage for embedding.
*
* @param mediaBox The MediaBox of the page.
*/
public PDPage(PDRectangle mediaBox)
{
page = new COSDictionary();
page.setItem(COSName.TYPE, COSName.PAGE);
page.setItem(COSName.MEDIA_BOX, mediaBox);
}
/**
* Creates a new instance of PDPage for reading.
*
* @param pageDictionary A page dictionary in a PDF document.
*/
public PDPage(COSDictionary pageDictionary)
{
page = pageDictionary;
}
/**
* Creates a new instance of PDPage for reading.
*
* @param pageDictionary A page dictionary in a PDF document.
*/
PDPage(COSDictionary pageDictionary, ResourceCache resourceCache)
{
page = pageDictionary;
this.resourceCache = resourceCache;
}
/**
* Convert this standard java object to a COS object.
*
* @return The cos object that matches this Java object.
*/
@Override
public COSDictionary getCOSObject()
{
return page;
}
/**
* Returns the content streams which make up this page.
*
* @return content stream iterator
*/
public Iterator<PDStream> getContentStreams()
{
List<PDStream> streams = new ArrayList<>();
COSBase base = page.getDictionaryObject(COSName.CONTENTS);
if (base instanceof COSStream)
{
streams.add(new PDStream((COSStream) base));
}
else if (base instanceof COSArray)
{
COSArray array = (COSArray)base;
for (int i = 0; i < array.size(); i++)
{
COSStream stream = (COSStream) array.getObject(i);
streams.add(new PDStream(stream));
}
}
return streams.iterator();
}
/**
* Returns the content stream(s) of this page as a single input stream.
*
* @return An InputStream, never null. Multiple content streams are concatenated and separated
* with a newline. An empty stream is returned if the page doesn't have any content stream.
* @throws IOException If the stream could not be read
*/
@Override
public InputStream getContents() throws IOException
{
COSBase base = page.getDictionaryObject(COSName.CONTENTS);
if (base instanceof COSStream)
{
return ((COSStream)base).createInputStream();
}
else if (base instanceof COSArray && ((COSArray) base).size() > 0)
{
COSArray streams = (COSArray)base;
byte[] delimiter = new byte[] { '\n' };
List<InputStream> inputStreams = new ArrayList<>();
for (int i = 0; i < streams.size(); i++)
{
COSBase strm = streams.getObject(i);
if (strm instanceof COSStream)
{
COSStream stream = (COSStream) strm;
inputStreams.add(stream.createInputStream());
inputStreams.add(new ByteArrayInputStream(delimiter));
}
}
return new SequenceInputStream(Collections.enumeration(inputStreams));
}
return new ByteArrayInputStream(new byte[0]);
}
@Override
public RandomAccessRead getContentsForRandomAccess() throws IOException
{
COSBase base = page.getDictionaryObject(COSName.CONTENTS);
if (base instanceof COSStream)
{
return ((COSStream) base).createView();
}
else if (base instanceof COSArray && ((COSArray) base).size() > 0)
{
byte[] delimiter = new byte[] { '\n' };
COSArray streams = (COSArray) base;
List<RandomAccessRead> inputStreams = new ArrayList<>();
for (int i = 0; i < streams.size(); i++)
{
COSBase strm = streams.getObject(i);
if (strm instanceof COSStream)
{
inputStreams.add(((COSStream) strm).createView());
inputStreams.add(new RandomAccessReadBuffer(delimiter));
}
}
if (!inputStreams.isEmpty())
{
return new SequenceRandomAccessRead(inputStreams);
}
}
return new RandomAccessReadBuffer(new byte[0]);
}
/**
* Returns true if this page has one or more content streams.
*/
public boolean hasContents()
{
COSBase contents = page.getDictionaryObject(COSName.CONTENTS);
if (contents instanceof COSStream)
{
return ((COSStream) contents).size() > 0;
}
else if (contents instanceof COSArray)
{
return ((COSArray) contents).size() > 0;
}
return false;
}
/**
* A dictionary containing any resources required by the page.
*/
@Override
public PDResources getResources()
{
if (pageResources == null)
{
COSBase base = PDPageTree.getInheritableAttribute(page, COSName.RESOURCES);
// note: it's an error for resources to not be present
if (base instanceof COSDictionary)
{
pageResources = new PDResources((COSDictionary) base, resourceCache);
}
}
return pageResources;
}
/**
* This will set the resources for this page.
*
* @param resources The new resources for this page.
*/
public void setResources(PDResources resources)
{
pageResources = resources;
if (resources != null)
{
page.setItem(COSName.RESOURCES, resources);
}
else
{
page.removeItem(COSName.RESOURCES);
}
}
/**
* This will get the key of this Page in the structural parent tree.
*
* @return the integer key of the page's entry in the structural parent tree or -1 if
* there isn't any.
*/
public int getStructParents()
{
return page.getInt(COSName.STRUCT_PARENTS);
}
/**
* This will set the key for this page in the structural parent tree.
*
* @param structParents The new key for this page.
*/
public void setStructParents(int structParents)
{
page.setInt(COSName.STRUCT_PARENTS, structParents);
}
@Override
public PDRectangle getBBox()
{
return getCropBox();
}
@Override
public Matrix getMatrix()
{
// todo: take into account user-space unit redefinition as scale?
return new Matrix();
}
/**
* A rectangle, expressed in default user space units, defining the boundaries of the physical
* medium on which the page is intended to be displayed or printed.
*/
public PDRectangle getMediaBox()
{
if (mediaBox == null)
{
COSBase base = PDPageTree.getInheritableAttribute(page, COSName.MEDIA_BOX);
if (base instanceof COSArray)
{
mediaBox = new PDRectangle((COSArray) base);
}
else
{
LOG.debug("Can't find MediaBox, will use U.S. Letter");
mediaBox = PDRectangle.LETTER;
}
}
return mediaBox;
}
/**
* This will set the mediaBox for this page.
*
* @param mediaBox The new mediaBox for this page.
*/
public void setMediaBox(PDRectangle mediaBox)
{
this.mediaBox = mediaBox;
if (mediaBox == null)
{
page.removeItem(COSName.MEDIA_BOX);
}
else
{
page.setItem(COSName.MEDIA_BOX, mediaBox);
}
}
/**
* A rectangle, expressed in default user space units, defining the visible region of default
* user space. When the page is displayed or printed, its contents are to be clipped (cropped)
* to this rectangle.
*/
public PDRectangle getCropBox()
{
COSBase base = PDPageTree.getInheritableAttribute(page, COSName.CROP_BOX);
if (base instanceof COSArray)
{
return clipToMediaBox(new PDRectangle((COSArray) base));
}
else
{
return getMediaBox();
}
}
/**
* This will set the CropBox for this page.
*
* @param cropBox The new CropBox for this page.
*/
public void setCropBox(PDRectangle cropBox)
{
if (cropBox == null)
{
page.removeItem(COSName.CROP_BOX);
}
else
{
page.setItem(COSName.CROP_BOX, cropBox.getCOSArray());
}
}
/**
* A rectangle, expressed in default user space units, defining the region to which the contents
* of the page should be clipped when output in a production environment. The default is the
* CropBox.
*
* @return The BleedBox attribute.
*/
public PDRectangle getBleedBox()
{
COSArray bleedBox = page.getCOSArray(COSName.BLEED_BOX);
return bleedBox != null ? clipToMediaBox(new PDRectangle(bleedBox)) : getCropBox();
}
/**
* This will set the BleedBox for this page.
*
* @param bleedBox The new BleedBox for this page.
*/
public void setBleedBox(PDRectangle bleedBox)
{
if (bleedBox == null)
{
page.removeItem(COSName.BLEED_BOX);
}
else
{
page.setItem(COSName.BLEED_BOX, bleedBox);
}
}
/**
* A rectangle, expressed in default user space units, defining the intended dimensions of the
* finished page after trimming. The default is the CropBox.
*
* @return The TrimBox attribute.
*/
public PDRectangle getTrimBox()
{
COSArray trimBox = page.getCOSArray(COSName.TRIM_BOX);
return trimBox != null ? clipToMediaBox(new PDRectangle(trimBox)) : null;
}
/**
* This will set the TrimBox for this page.
*
* @param trimBox The new TrimBox for this page.
*/
public void setTrimBox(PDRectangle trimBox)
{
if (trimBox == null)
{
page.removeItem(COSName.TRIM_BOX);
}
else
{
page.setItem(COSName.TRIM_BOX, trimBox);
}
}
/**
* A rectangle, expressed in default user space units, defining the extent of the page's
* meaningful content (including potential white space) as intended by the page's creator The
* default is the CropBox.
*
* @return The ArtBox attribute.
*/
public PDRectangle getArtBox()
{
COSArray artBox = page.getCOSArray(COSName.ART_BOX);
return artBox != null ? clipToMediaBox(new PDRectangle(artBox)) : getCropBox();
}
/**
* This will set the ArtBox for this page.
*
* @param artBox The new ArtBox for this page.
*/
public void setArtBox(PDRectangle artBox)
{
if (artBox == null)
{
page.removeItem(COSName.ART_BOX);
}
else
{
page.setItem(COSName.ART_BOX, artBox);
}
}
/**
* Clips the given box to the bounds of the media box.
*/
private PDRectangle clipToMediaBox(PDRectangle box)
{
PDRectangle mediaBox = getMediaBox();
PDRectangle result = new PDRectangle();
result.setLowerLeftX(Math.max(mediaBox.getLowerLeftX(), box.getLowerLeftX()));
result.setLowerLeftY(Math.max(mediaBox.getLowerLeftY(), box.getLowerLeftY()));
result.setUpperRightX(Math.min(mediaBox.getUpperRightX(), box.getUpperRightX()));
result.setUpperRightY(Math.min(mediaBox.getUpperRightY(), box.getUpperRightY()));
return result;
}
/**
* Returns the rotation angle in degrees by which the page should be rotated
* clockwise when displayed or printed. Valid values in a PDF must be a
* multiple of 90.
*
* @return The rotation angle in degrees in normalized form (0, 90, 180 or
* 270) or 0 if invalid or not set at this level.
*/
public int getRotation()
{
COSBase obj = PDPageTree.getInheritableAttribute(page, COSName.ROTATE);
if (obj instanceof COSNumber)
{
int rotationAngle = ((COSNumber) obj).intValue();
if (rotationAngle % 90 == 0)
{
return (rotationAngle % 360 + 360) % 360;
}
}
return 0;
}
/**
* This will set the rotation for this page.
*
* @param rotation The new rotation for this page in degrees.
*/
public void setRotation(int rotation)
{
page.setInt(COSName.ROTATE, rotation);
}
/**
* This will set the contents of this page.
*
* @param contents The new contents of the page.
*/
public void setContents(PDStream contents)
{
page.setItem(COSName.CONTENTS, contents);
}
/**
* This will set the contents of this page.
*
* @param contents Array of new contents of the page.
*/
public void setContents(List<PDStream> contents)
{
page.setItem(COSName.CONTENTS, new COSArray(contents));
}
/**
* This will get a list of PDThreadBead objects, which are article threads in the document. This
* will return an empty list if there are no thread beads.
*
* @return A list of article threads on this page, never null. The returned list is backed by
* the beads COSArray, so any adding or deleting in this list will change the document too.
*/
public List<PDThreadBead> getThreadBeads()
{
COSArray beads = page.getCOSArray(COSName.B);
if (beads == null)
{
beads = new COSArray();
}
List<PDThreadBead> pdObjects = new ArrayList<>(beads.size());
for (int i = 0; i < beads.size(); i++)
{
COSBase base = beads.getObject(i);
PDThreadBead bead = null;
// in some cases the bead is null
if (base instanceof COSDictionary)
{
bead = new PDThreadBead((COSDictionary) base);
}
pdObjects.add(bead);
}
return new COSArrayList<>(pdObjects, beads);
}
/**
* This will set the list of thread beads.
*
* @param beads A list of PDThreadBead objects or null.
*/
public void setThreadBeads(List<PDThreadBead> beads)
{
page.setItem(COSName.B, new COSArray(beads));
}
/**
* Get the metadata that is part of the document catalog. This will return null if there is
* no meta data for this object.
*
* @return The metadata for this object.
*/
public PDMetadata getMetadata()
{
COSStream metadata = page.getCOSStream(COSName.METADATA);
return metadata != null ? new PDMetadata(metadata) : null;
}
/**
* Set the metadata for this object. This can be null.
*
* @param meta The meta data for this object.
*/
public void setMetadata(PDMetadata meta)
{
page.setItem(COSName.METADATA, meta);
}
/**
* Get the page actions.
*
* @return The Actions for this Page
*/
public PDPageAdditionalActions getActions()
{
COSDictionary addAct = page.getCOSDictionary(COSName.AA);
if (addAct == null)
{
addAct = new COSDictionary();
page.setItem(COSName.AA, addAct);
}
return new PDPageAdditionalActions(addAct);
}
/**
* Set the page actions.
*
* @param actions The actions for the page.
*/
public void setActions(PDPageAdditionalActions actions)
{
page.setItem(COSName.AA, actions);
}
/**
* @return The page transition associated with this page or null if no transition is defined
*/
public PDTransition getTransition()
{
COSDictionary transition = page.getCOSDictionary(COSName.TRANS);
return transition != null ? new PDTransition(transition) : null;
}
/**
* @param transition The new transition to set on this page.
*/
public void setTransition(PDTransition transition)
{
page.setItem(COSName.TRANS, transition);
}
/**
* Convenient method to set a transition and the display duration
*
* @param transition The new transition to set on this page.
* @param duration The maximum length of time, in seconds, that the page shall be displayed during presentations
* before the viewer application shall automatically advance to the next page.
*/
public void setTransition(PDTransition transition, float duration)
{
page.setItem(COSName.TRANS, transition);
page.setItem(COSName.DUR, new COSFloat(duration));
}
/**
* This will return a list of the annotations for this page.
*
* @return List of the PDAnnotation objects, never null. The returned list is backed by the
* annotations COSArray, so any adding or deleting in this list will change the document too.
*
* @throws IOException If there is an error while creating the annotation list.
*/
public List<PDAnnotation> getAnnotations() throws IOException
{
return getAnnotations(annotation -> true);
}
/**
* This will return a list of the annotations for this page.
*
* @param annotationFilter the annotation filter provided allowing to filter out specific annotations
* @return List of the PDAnnotation objects, never null. The returned list is backed by the
* annotations COSArray, so any adding or deleting in this list will change the document too.
*
* @throws IOException If there is an error while creating the annotation list.
*/
public List<PDAnnotation> getAnnotations(AnnotationFilter annotationFilter) throws IOException
{
COSArray annots = page.getCOSArray(COSName.ANNOTS);
if (annots == null)
{
return new COSArrayList<>(page, COSName.ANNOTS);
}
List<PDAnnotation> actuals = new ArrayList<>();
for (int i = 0; i < annots.size(); i++)
{
COSBase item = annots.getObject(i);
if (item == null)
{
continue;
}
PDAnnotation createdAnnotation = PDAnnotation.createAnnotation(item);
if (annotationFilter.accept(createdAnnotation))
{
actuals.add(createdAnnotation);
}
}
return new COSArrayList<>(actuals, annots);
}
/**
* This will set the list of annotations.
*
* @param annotations The new list of annotations.
*/
public void setAnnotations(List<PDAnnotation> annotations)
{
page.setItem(COSName.ANNOTS, new COSArray(annotations));
}
@Override
public boolean equals(Object other)
{
return other instanceof PDPage && ((PDPage) other).getCOSObject() == this.getCOSObject();
}
@Override
public int hashCode()
{
return page.hashCode();
}
/**
* Returns the resource cache associated with this page, or null if there is none.
*/
public ResourceCache getResourceCache()
{
return resourceCache;
}
/**
* Get the viewports.
*
* @return a list of viewports or null if there is no /VP entry.
*/
public List<PDViewportDictionary> getViewports()
{
COSArray array = page.getCOSArray(COSName.VP);
if (array == null)
{
return null;
}
List<PDViewportDictionary> viewports = new ArrayList<>();
for (int i = 0; i < array.size(); ++i)
{
COSBase base2 = array.getObject(i);
if (base2 instanceof COSDictionary)
{
viewports.add(new PDViewportDictionary((COSDictionary) base2));
}
else
{
LOG.warn("Array element " + base2 + " is skipped, must be a (viewport) dictionary");
}
}
return viewports;
}
/**
* Set the viewports.
*
* @param viewports A list of viewports, or null if the entry is to be deleted.
*/
public void setViewports(List<PDViewportDictionary> viewports)
{
if (viewports == null)
{
page.removeItem(COSName.VP);
return;
}
page.setItem(COSName.VP, new COSArray(viewports));
}
/**
* Get the user unit. This is a positive number that shall give the size of default user space
* units, in multiples of 1/72 inch, or 1 if it hasn't been set. This is supported by PDF 1.6
* and higher.
*
* @return the user unit.
*/
public float getUserUnit()
{
float userUnit = page.getFloat(COSName.USER_UNIT, 1.0f);
return userUnit > 0 ? userUnit : 1.0f;
}
/**
* Get the user unit. This is a positive number that shall give the size of default user space
* units, in multiples of 1/72 inch. This is supported by PDF 1.6 and higher.
*
* @param userUnit
* throws IllegalArgumentException if the parameter is not positive.
*/
public void setUserUnit(float userUnit)
{
if (userUnit <= 0)
{
throw new IllegalArgumentException("User unit must be positive");
}
page.setFloat(COSName.USER_UNIT, userUnit);
}
}