blob: 19ebf19aa9a87394d0aca9af573bd0a863b5db8e [file] [log] [blame]
/**************************************************************
*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*
*************************************************************/
#ifndef INCLUDED_PDFI_PDFPARSE_HXX
#define INCLUDED_PDFI_PDFPARSE_HXX
#include <sal/types.h>
#include <rtl/ustring.hxx>
#include <rtl/string.hxx>
#include <vector>
#include <hash_map>
namespace pdfparse
{
struct EmitImplData;
struct PDFContainer;
class EmitContext
{
public:
virtual bool write( const void* pBuf, unsigned int nLen ) = 0;
virtual unsigned int getCurPos() = 0;
virtual bool copyOrigBytes( unsigned int nOrigOffset, unsigned int nLen ) = 0;
virtual unsigned int readOrigBytes( unsigned int nOrigOffset, unsigned int nLen, void* pBuf ) = 0;
EmitContext( const PDFContainer* pTop = NULL );
virtual ~EmitContext();
// set this to deflate contained streams
bool m_bDeflate;
// set this to decrypt the PDF file
bool m_bDecrypt;
private:
friend struct PDFEntry;
EmitImplData* m_pImplData;
};
struct PDFEntry
{
PDFEntry() {}
virtual ~PDFEntry();
virtual bool emit( EmitContext& rWriteContext ) const = 0;
virtual PDFEntry* clone() const = 0;
protected:
EmitImplData* getEmitData( EmitContext& rContext ) const;
void setEmitData( EmitContext& rContext, EmitImplData* pNewEmitData ) const;
};
struct PDFComment : public PDFEntry
{
rtl::OString m_aComment;
PDFComment( const rtl::OString& rComment )
: PDFEntry(), m_aComment( rComment ) {}
virtual ~PDFComment();
virtual bool emit( EmitContext& rWriteContext ) const;
virtual PDFEntry* clone() const;
};
struct PDFValue : public PDFEntry
{
// abstract base class for simple values
PDFValue() : PDFEntry() {}
virtual ~PDFValue();
};
struct PDFName : public PDFValue
{
rtl::OString m_aName;
PDFName( const rtl::OString& rName )
: PDFValue(), m_aName( rName ) {}
virtual ~PDFName();
virtual bool emit( EmitContext& rWriteContext ) const;
virtual PDFEntry* clone() const;
rtl::OUString getFilteredName() const;
};
struct PDFString : public PDFValue
{
rtl::OString m_aString;
PDFString( const rtl::OString& rString )
: PDFValue(), m_aString( rString ) {}
virtual ~PDFString();
virtual bool emit( EmitContext& rWriteContext ) const;
virtual PDFEntry* clone() const;
rtl::OString getFilteredString() const;
};
struct PDFNumber : public PDFValue
{
double m_fValue;
PDFNumber( double fVal )
: PDFValue(), m_fValue( fVal ) {}
virtual ~PDFNumber();
virtual bool emit( EmitContext& rWriteContext ) const;
virtual PDFEntry* clone() const;
};
struct PDFBool : public PDFValue
{
bool m_bValue;
PDFBool( bool bVal )
: PDFValue(), m_bValue( bVal ) {}
virtual ~PDFBool();
virtual bool emit( EmitContext& rWriteContext ) const;
virtual PDFEntry* clone() const;
};
struct PDFObjectRef : public PDFValue
{
unsigned int m_nNumber;
unsigned int m_nGeneration;
PDFObjectRef( unsigned int nNr, unsigned int nGen )
: PDFValue(), m_nNumber( nNr ), m_nGeneration( nGen ) {}
virtual ~PDFObjectRef();
virtual bool emit( EmitContext& rWriteContext ) const;
virtual PDFEntry* clone() const;
};
struct PDFNull : public PDFValue
{
PDFNull() {}
virtual ~PDFNull();
virtual bool emit( EmitContext& rWriteContext ) const;
virtual PDFEntry* clone() const;
};
struct PDFObject;
struct PDFContainer : public PDFEntry
{
sal_Int32 m_nOffset;
std::vector<PDFEntry*> m_aSubElements;
// this is an abstract base class for identifying
// entries that can contain sub elements besides comments
PDFContainer() : PDFEntry(), m_nOffset( 0 ) {}
virtual ~PDFContainer();
virtual bool emitSubElements( EmitContext& rWriteContext ) const;
virtual void cloneSubElements( std::vector<PDFEntry*>& rNewSubElements ) const;
PDFObject* findObject( unsigned int nNumber, unsigned int nGeneration ) const;
PDFObject* findObject( PDFObjectRef* pRef ) const
{ return findObject( pRef->m_nNumber, pRef->m_nGeneration ); }
};
struct PDFArray : public PDFContainer
{
PDFArray() {}
virtual ~PDFArray();
virtual bool emit( EmitContext& rWriteContext ) const;
virtual PDFEntry* clone() const;
};
struct PDFDict : public PDFContainer
{
typedef std::hash_map<rtl::OString,PDFEntry*,rtl::OStringHash> Map;
Map m_aMap;
PDFDict() {}
virtual ~PDFDict();
virtual bool emit( EmitContext& rWriteContext ) const;
virtual PDFEntry* clone() const;
// inserting a value of NULL will remove rName and the previous value
// from the dictionary
void insertValue( const rtl::OString& rName, PDFEntry* pValue );
// removes a name/value pair from the dict
void eraseValue( const rtl::OString& rName );
// builds new map as of sub elements
// returns NULL if successfull, else the first offending element
PDFEntry* buildMap();
};
struct PDFStream : public PDFEntry
{
unsigned int m_nBeginOffset;
unsigned int m_nEndOffset; // offset of the byte after the stream
PDFDict* m_pDict;
PDFStream( unsigned int nBegin, unsigned int nEnd, PDFDict* pStreamDict )
: PDFEntry(), m_nBeginOffset( nBegin ), m_nEndOffset( nEnd ), m_pDict( pStreamDict ) {}
virtual ~PDFStream();
virtual bool emit( EmitContext& rWriteContext ) const;
virtual PDFEntry* clone() const;
unsigned int getDictLength( const PDFContainer* pObjectContainer = NULL ) const; // get contents of the "Length" entry of the dict
};
struct PDFTrailer : public PDFContainer
{
PDFDict* m_pDict;
PDFTrailer() : PDFContainer(), m_pDict( NULL ) {}
virtual ~PDFTrailer();
virtual bool emit( EmitContext& rWriteContext ) const;
virtual PDFEntry* clone() const;
};
struct PDFFileImplData;
struct PDFFile : public PDFContainer
{
private:
mutable PDFFileImplData* m_pData;
PDFFileImplData* impl_getData() const;
public:
unsigned int m_nMajor; // PDF major
unsigned int m_nMinor; // PDF minor
PDFFile()
: PDFContainer(),
m_pData( NULL ),
m_nMajor( 0 ), m_nMinor( 0 )
{}
virtual ~PDFFile();
virtual bool emit( EmitContext& rWriteContext ) const;
virtual PDFEntry* clone() const;
bool isEncrypted() const;
// this method checks whether rPwd is compatible with
// either user or owner password and sets up decrypt data in that case
// returns true if decryption can be done
bool setupDecryptionData( const rtl::OString& rPwd ) const;
bool decrypt( const sal_uInt8* pInBuffer, sal_uInt32 nLen,
sal_uInt8* pOutBuffer,
unsigned int nObject, unsigned int nGeneration ) const;
rtl::OUString getDecryptionKey() const;
};
struct PDFObject : public PDFContainer
{
PDFEntry* m_pObject;
PDFStream* m_pStream;
unsigned int m_nNumber;
unsigned int m_nGeneration;
PDFObject( unsigned int nNr, unsigned int nGen )
: m_pObject( NULL ), m_pStream( NULL ), m_nNumber( nNr ), m_nGeneration( nGen ) {}
virtual ~PDFObject();
virtual bool emit( EmitContext& rWriteContext ) const;
virtual PDFEntry* clone() const;
// writes only the contained stream, deflated if necessary
bool writeStream( EmitContext& rContext, const PDFFile* pPDFFile ) const;
private:
// returns true if stream is deflated
// fills *ppStream and *pBytes with start of stream and count of bytes
// memory returned in *ppStream must be freed with rtl_freeMemory afterwards
// fills in NULL and 0 in case of error
bool getDeflatedStream( char** ppStream, unsigned int* pBytes, const PDFContainer* pObjectContainer, EmitContext& rContext ) const;
};
struct PDFPart : public PDFContainer
{
PDFPart() : PDFContainer() {}
virtual ~PDFPart();
virtual bool emit( EmitContext& rWriteContext ) const;
virtual PDFEntry* clone() const;
};
class PDFReader
{
public:
PDFReader() {}
~PDFReader() {}
PDFEntry* read( const char* pFileName );
PDFEntry* read( const char* pBuffer, unsigned int nLen );
};
} // namespace
#endif