mirror of
https://github.com/qpdf/qpdf.git
synced 2024-11-16 17:45:09 +00:00
398354b6f0
git-svn-id: svn+q:///qpdf/trunk@830 71b93d88-0707-0410-a8cf-f5a4172ac649
801 lines
24 KiB
C++
801 lines
24 KiB
C++
// Copyright (c) 2005-2009 Jay Berkenbilt
|
|
//
|
|
// This file is part of qpdf. This software may be distributed under
|
|
// the terms of version 2 of the Artistic License which may be found
|
|
// in the source distribution. It is provided "as is" without express
|
|
// or implied warranty.
|
|
|
|
#ifndef __QPDF_HH__
|
|
#define __QPDF_HH__
|
|
|
|
#include <stdio.h>
|
|
#include <string>
|
|
#include <map>
|
|
#include <list>
|
|
|
|
#include <qpdf/DLL.h>
|
|
|
|
#include <qpdf/QPDFXRefEntry.hh>
|
|
#include <qpdf/QPDFObjectHandle.hh>
|
|
#include <qpdf/QPDFTokenizer.hh>
|
|
#include <qpdf/Buffer.hh>
|
|
|
|
class QPDF_Stream;
|
|
class BitStream;
|
|
class BitWriter;
|
|
class QPDFExc;
|
|
|
|
class DLL_EXPORT QPDF
|
|
{
|
|
public:
|
|
QPDF();
|
|
~QPDF();
|
|
|
|
// Associate a file with a QPDF object and do initial parsing of
|
|
// the file. PDF objects are not read until they are needed. A
|
|
// QPDF object may be associated with only one file in its
|
|
// lifetime. This method must be called before any methods that
|
|
// potentially ask for information about the PDF file are called.
|
|
// Prior to calling this, the only methods that are allowed are
|
|
// those that set parameters. If the input file is not
|
|
// encrypted,either a null password or an empty password can be
|
|
// used. If the file is encrypted, either the user password or
|
|
// the owner password may be supplied.
|
|
void processFile(char const* filename, char const* password = 0);
|
|
|
|
// Parameter settings
|
|
|
|
// If true, ignore any cross-reference streams in a hybrid file
|
|
// (one that contains both cross-reference streams and
|
|
// cross-reference tables). This can be useful for testing to
|
|
// ensure that a hybrid file would work with an older reader.
|
|
void setIgnoreXRefStreams(bool);
|
|
|
|
// By default, any warnings are issued to stderr as they are
|
|
// encountered. If this is called with a true value, reporting of
|
|
// warnings is suppressed. You may still retrieve warnings by
|
|
// calling getWarnings.
|
|
void setSuppressWarnings(bool);
|
|
|
|
// By default, QPDF will try to recover if it finds certain types
|
|
// of errors in PDF files. If turned off, it will throw an
|
|
// exception on the first such problem it finds without attempting
|
|
// recovery.
|
|
void setAttemptRecovery(bool);
|
|
|
|
// Other public methods
|
|
|
|
// Return the list of warnings that have been issued so far and
|
|
// clear the list. This method may be called even if processFile
|
|
// throws an exception. Note that if setSuppressWarnings was not
|
|
// called or was called with a false value, any warnings retrieved
|
|
// here will have already been issued to stderr.
|
|
std::vector<QPDFExc> getWarnings();
|
|
|
|
std::string getFilename() const;
|
|
std::string getPDFVersion() const;
|
|
QPDFObjectHandle getTrailer();
|
|
QPDFObjectHandle getRoot();
|
|
|
|
// Install this object handle as an indirect object and return an
|
|
// indirect reference to it.
|
|
QPDFObjectHandle makeIndirectObject(QPDFObjectHandle);
|
|
|
|
// Retrieve an object by object ID and generation. Returns an
|
|
// indirect reference to it.
|
|
QPDFObjectHandle getObjectByID(int objid, int generation);
|
|
|
|
// Encryption support
|
|
|
|
enum encryption_method_e { e_none, e_unknown, e_rc4, e_aes };
|
|
struct EncryptionData
|
|
{
|
|
// This class holds data read from the encryption dictionary.
|
|
EncryptionData(int V, int R, int Length_bytes, int P,
|
|
std::string const& O, std::string const& U,
|
|
std::string const& id1, bool encrypt_metadata) :
|
|
V(V),
|
|
R(R),
|
|
Length_bytes(Length_bytes),
|
|
P(P),
|
|
O(O),
|
|
U(U),
|
|
id1(id1),
|
|
encrypt_metadata(encrypt_metadata)
|
|
{
|
|
}
|
|
|
|
int V;
|
|
int R;
|
|
int Length_bytes;
|
|
int P;
|
|
std::string O;
|
|
std::string U;
|
|
std::string id1;
|
|
bool encrypt_metadata;
|
|
};
|
|
|
|
bool isEncrypted() const;
|
|
|
|
bool isEncrypted(int& R, int& P);
|
|
|
|
// Encryption permissions -- not enforced by QPDF
|
|
bool allowAccessibility();
|
|
bool allowExtractAll();
|
|
bool allowPrintLowRes();
|
|
bool allowPrintHighRes();
|
|
bool allowModifyAssembly();
|
|
bool allowModifyForm();
|
|
bool allowModifyAnnotation();
|
|
bool allowModifyOther();
|
|
bool allowModifyAll();
|
|
|
|
// Helper function to trim padding from user password. Calling
|
|
// trim_user_password on the result of getPaddedUserPassword gives
|
|
// getTrimmedUserPassword's result.
|
|
static void trim_user_password(std::string& user_password);
|
|
static std::string compute_data_key(
|
|
std::string const& encryption_key, int objid, int generation,
|
|
bool use_aes);
|
|
static std::string compute_encryption_key(
|
|
std::string const& password, EncryptionData const& data);
|
|
|
|
static void compute_encryption_O_U(
|
|
char const* user_password, char const* owner_password,
|
|
int V, int R, int key_len, int P, bool encrypt_metadata,
|
|
std::string const& id1,
|
|
std::string& O, std::string& U);
|
|
// Return the full user password as stored in the PDF file. If
|
|
// you are attempting to recover the user password in a
|
|
// user-presentable form, call getTrimmedUserPassword() instead.
|
|
std::string const& getPaddedUserPassword() const;
|
|
// Return human-readable form of user password.
|
|
std::string getTrimmedUserPassword() const;
|
|
|
|
// Linearization support
|
|
|
|
// Returns true iff the file starts with a linearization parameter
|
|
// dictionary. Does no additional validation.
|
|
bool isLinearized();
|
|
|
|
// Performs various sanity checks on a linearized file. Return
|
|
// true if no errors or warnings. Otherwise, return false and
|
|
// output errors and warnings to stdout.
|
|
bool checkLinearization();
|
|
|
|
// Calls checkLinearization() and, if possible, prints normalized
|
|
// contents of some of the hints tables to stdout. Normalization
|
|
// includes adding min values to delta values and adjusting
|
|
// offsets based on the location and size of the primary hint
|
|
// stream.
|
|
void showLinearizationData();
|
|
|
|
// Shows the contents of the cross-reference table
|
|
void showXRefTable();
|
|
|
|
// Optimization support -- see doc/optimization. Implemented in
|
|
// QPDF_optimization.cc
|
|
|
|
// The object_stream_data map maps from a "compressed" object to
|
|
// the object stream that contains it. This enables optimize to
|
|
// populate the object <-> user maps with only uncompressed
|
|
// objects. If allow_changes is false, an exception will be
|
|
// thrown if any changes are made during the optimization process.
|
|
// This is available so that the test suite can make sure that a
|
|
// linearized file is already optimized. When called in this way,
|
|
// optimize() still populates the object <-> user maps
|
|
void optimize(std::map<int, int> const& object_stream_data,
|
|
bool allow_changes = true);
|
|
|
|
// Replace all references to indirect objects that are "scalars"
|
|
// (i.e., things that don't have children: not arrays, streams, or
|
|
// dictionaries) with direct objects.
|
|
void flattenScalarReferences();
|
|
|
|
// Decode all streams, discarding the output. Used to check
|
|
// correctness of stream encoding.
|
|
void decodeStreams();
|
|
|
|
// For QPDFWriter:
|
|
|
|
// Remove /ID, /Encrypt, and /Prev keys from the trailer
|
|
// dictionary since these are regenerated during write.
|
|
void trimTrailerForWrite();
|
|
|
|
// Get lists of all objects in order according to the part of a
|
|
// linearized file that they belong to.
|
|
void getLinearizedParts(
|
|
std::map<int, int> const& object_stream_data,
|
|
std::vector<QPDFObjectHandle>& part4,
|
|
std::vector<QPDFObjectHandle>& part6,
|
|
std::vector<QPDFObjectHandle>& part7,
|
|
std::vector<QPDFObjectHandle>& part8,
|
|
std::vector<QPDFObjectHandle>& part9);
|
|
|
|
void generateHintStream(std::map<int, QPDFXRefEntry> const& xref,
|
|
std::map<int, size_t> const& lengths,
|
|
std::map<int, int> const& obj_renumber,
|
|
PointerHolder<Buffer>& hint_stream,
|
|
int& S, int& O);
|
|
|
|
// Map object to object stream that contains it
|
|
void getObjectStreamData(std::map<int, int>&);
|
|
// Get a list of objects that would be permitted in an object
|
|
// stream
|
|
std::vector<int> getCompressibleObjects();
|
|
|
|
// Convenience routines for common functions. See also
|
|
// QPDFObjectHandle.hh for additional convenience routines.
|
|
|
|
// Traverse page tree return all /Page objects.
|
|
std::vector<QPDFObjectHandle> const& getAllPages();
|
|
|
|
// Resolver class is restricted to QPDFObjectHandle so that only
|
|
// it can resolve indirect references.
|
|
class Resolver
|
|
{
|
|
friend class QPDFObjectHandle;
|
|
private:
|
|
static PointerHolder<QPDFObject> resolve(
|
|
QPDF* qpdf, int objid, int generation)
|
|
{
|
|
return qpdf->resolve(objid, generation);
|
|
}
|
|
};
|
|
friend class Resolver;
|
|
|
|
// Pipe class is restricted to QPDF_Stream
|
|
class Pipe
|
|
{
|
|
friend class QPDF_Stream;
|
|
private:
|
|
static void pipeStreamData(QPDF* qpdf, int objid, int generation,
|
|
off_t offset, size_t length,
|
|
QPDFObjectHandle dict,
|
|
Pipeline* pipeline)
|
|
{
|
|
qpdf->pipeStreamData(
|
|
objid, generation, offset, length, dict, pipeline);
|
|
}
|
|
};
|
|
friend class Pipe;
|
|
|
|
private:
|
|
class InputSource
|
|
{
|
|
public:
|
|
InputSource() :
|
|
last_offset(0)
|
|
{
|
|
}
|
|
virtual ~InputSource()
|
|
{
|
|
}
|
|
|
|
void setLastOffset(off_t);
|
|
off_t getLastOffset() const;
|
|
std::string readLine();
|
|
|
|
virtual std::string const& getName() const = 0;
|
|
virtual off_t tell() = 0;
|
|
virtual void seek(off_t offset, int whence) = 0;
|
|
virtual void rewind() = 0;
|
|
virtual size_t read(char* buffer, int length) = 0;
|
|
virtual void unreadCh(char ch) = 0;
|
|
|
|
protected:
|
|
off_t last_offset;
|
|
};
|
|
|
|
class FileInputSource: public InputSource
|
|
{
|
|
public:
|
|
FileInputSource();
|
|
void setFilename(char const* filename);
|
|
virtual ~FileInputSource();
|
|
virtual std::string const& getName() const;
|
|
virtual off_t tell();
|
|
virtual void seek(off_t offset, int whence);
|
|
virtual void rewind();
|
|
virtual size_t read(char* buffer, int length);
|
|
virtual void unreadCh(char ch);
|
|
|
|
private:
|
|
FileInputSource(FileInputSource const&);
|
|
FileInputSource& operator=(FileInputSource const&);
|
|
|
|
void destroy();
|
|
|
|
std::string filename;
|
|
FILE* file;
|
|
};
|
|
|
|
class BufferInputSource: public InputSource
|
|
{
|
|
public:
|
|
BufferInputSource(std::string const& description, Buffer* buf);
|
|
virtual ~BufferInputSource();
|
|
virtual std::string const& getName() const;
|
|
virtual off_t tell();
|
|
virtual void seek(off_t offset, int whence);
|
|
virtual void rewind();
|
|
virtual size_t read(char* buffer, int length);
|
|
virtual void unreadCh(char ch);
|
|
|
|
private:
|
|
std::string description;
|
|
Buffer* buf;
|
|
off_t cur_offset;
|
|
};
|
|
|
|
class ObjGen
|
|
{
|
|
public:
|
|
ObjGen();
|
|
ObjGen(int obj, int gen);
|
|
bool operator<(ObjGen const&) const;
|
|
|
|
int obj;
|
|
int gen;
|
|
};
|
|
|
|
class ObjCache
|
|
{
|
|
public:
|
|
ObjCache() :
|
|
end_before_space(0),
|
|
end_after_space(0)
|
|
{
|
|
}
|
|
ObjCache(PointerHolder<QPDFObject> object,
|
|
off_t end_before_space,
|
|
off_t end_after_space) :
|
|
object(object),
|
|
end_before_space(end_before_space),
|
|
end_after_space(end_after_space)
|
|
{
|
|
}
|
|
|
|
PointerHolder<QPDFObject> object;
|
|
off_t end_before_space;
|
|
off_t end_after_space;
|
|
};
|
|
|
|
void parse();
|
|
void warn(QPDFExc const& e);
|
|
void setTrailer(QPDFObjectHandle obj);
|
|
void read_xref(off_t offset);
|
|
void reconstruct_xref(QPDFExc& e);
|
|
int read_xrefTable(off_t offset);
|
|
int read_xrefStream(off_t offset);
|
|
int processXRefStream(off_t offset, QPDFObjectHandle& xref_stream);
|
|
void insertXrefEntry(int obj, int f0, int f1, int f2,
|
|
bool overwrite = false);
|
|
void setLastObjectDescription(std::string const& description,
|
|
int objid, int generation);
|
|
QPDFObjectHandle readObject(
|
|
InputSource*, std::string const& description,
|
|
int objid, int generation, bool in_object_stream);
|
|
QPDFObjectHandle readObjectInternal(
|
|
InputSource* input, int objid, int generation,
|
|
bool in_object_stream,
|
|
bool in_array, bool in_dictionary);
|
|
int recoverStreamLength(
|
|
InputSource* input, int objid, int generation, off_t stream_offset);
|
|
QPDFTokenizer::Token readToken(InputSource*);
|
|
|
|
QPDFObjectHandle readObjectAtOffset(
|
|
bool attempt_recovery,
|
|
off_t offset, std::string const& description,
|
|
int exp_objid, int exp_generation,
|
|
int& act_objid, int& act_generation);
|
|
PointerHolder<QPDFObject> resolve(int objid, int generation);
|
|
void resolveObjectsInStream(int obj_stream_number);
|
|
|
|
// Calls finish() on the pipeline when done but does not delete it
|
|
void pipeStreamData(int objid, int generation,
|
|
off_t offset, size_t length,
|
|
QPDFObjectHandle dict,
|
|
Pipeline* pipeline);
|
|
void getAllPagesInternal(QPDFObjectHandle cur_pages,
|
|
std::vector<QPDFObjectHandle>& result);
|
|
|
|
// methods to support encryption -- implemented in QPDF_encryption.cc
|
|
encryption_method_e interpretCF(QPDFObjectHandle);
|
|
void initializeEncryption();
|
|
std::string getKeyForObject(int objid, int generation, bool use_aes);
|
|
void decryptString(std::string&, int objid, int generation);
|
|
void decryptStream(
|
|
Pipeline*& pipeline, int objid, int generation,
|
|
QPDFObjectHandle& stream_dict,
|
|
std::vector<PointerHolder<Pipeline> >& heap);
|
|
|
|
// Linearization Hint table structures.
|
|
// Naming conventions:
|
|
|
|
// HSomething is the Something Hint Table or table header
|
|
// HSomethingEntry is an entry in the Something table
|
|
|
|
// delta_something + min_something = something
|
|
// nbits_something = number of bits required for something
|
|
|
|
// something_offset is the pre-adjusted offset in the file. If >=
|
|
// H0_offset, H0_length must be added to get an actual file
|
|
// offset.
|
|
|
|
// PDF 1.4: Table F.4
|
|
struct HPageOffsetEntry
|
|
{
|
|
HPageOffsetEntry() :
|
|
delta_nobjects(0),
|
|
delta_page_length(0),
|
|
nshared_objects(0),
|
|
delta_content_offset(0),
|
|
delta_content_length(0)
|
|
{
|
|
}
|
|
|
|
int delta_nobjects; // 1
|
|
int delta_page_length; // 2
|
|
int nshared_objects; // 3
|
|
// vectors' sizes = nshared_objects
|
|
std::vector<int> shared_identifiers; // 4
|
|
std::vector<int> shared_numerators; // 5
|
|
int delta_content_offset; // 6
|
|
int delta_content_length; // 7
|
|
};
|
|
|
|
// PDF 1.4: Table F.3
|
|
struct HPageOffset
|
|
{
|
|
HPageOffset() :
|
|
min_nobjects(0),
|
|
first_page_offset(0),
|
|
nbits_delta_nobjects(0),
|
|
min_page_length(0),
|
|
nbits_delta_page_length(0),
|
|
min_content_offset(0),
|
|
nbits_delta_content_offset(0),
|
|
min_content_length(0),
|
|
nbits_delta_content_length(0),
|
|
nbits_nshared_objects(0),
|
|
nbits_shared_identifier(0),
|
|
nbits_shared_numerator(0),
|
|
shared_denominator(0)
|
|
{
|
|
}
|
|
|
|
int min_nobjects; // 1
|
|
int first_page_offset; // 2
|
|
int nbits_delta_nobjects; // 3
|
|
int min_page_length; // 4
|
|
int nbits_delta_page_length; // 5
|
|
int min_content_offset; // 6
|
|
int nbits_delta_content_offset; // 7
|
|
int min_content_length; // 8
|
|
int nbits_delta_content_length; // 9
|
|
int nbits_nshared_objects; // 10
|
|
int nbits_shared_identifier; // 11
|
|
int nbits_shared_numerator; // 12
|
|
int shared_denominator; // 13
|
|
// vector size is npages
|
|
std::vector<HPageOffsetEntry> entries;
|
|
};
|
|
|
|
// PDF 1.4: Table F.6
|
|
struct HSharedObjectEntry
|
|
{
|
|
HSharedObjectEntry() :
|
|
delta_group_length(0),
|
|
signature_present(0),
|
|
nobjects_minus_one(0)
|
|
{
|
|
}
|
|
|
|
// Item 3 is a 128-bit signature (unsupported by Acrobat)
|
|
int delta_group_length; // 1
|
|
int signature_present; // 2 -- always 0
|
|
int nobjects_minus_one; // 4 -- always 0
|
|
};
|
|
|
|
// PDF 1.4: Table F.5
|
|
struct HSharedObject
|
|
{
|
|
HSharedObject() :
|
|
first_shared_obj(0),
|
|
first_shared_offset(0),
|
|
nshared_first_page(0),
|
|
nshared_total(0),
|
|
nbits_nobjects(0),
|
|
min_group_length(0),
|
|
nbits_delta_group_length(0)
|
|
{
|
|
}
|
|
|
|
int first_shared_obj; // 1
|
|
int first_shared_offset; // 2
|
|
int nshared_first_page; // 3
|
|
int nshared_total; // 4
|
|
int nbits_nobjects; // 5
|
|
int min_group_length; // 6
|
|
int nbits_delta_group_length; // 7
|
|
// vector size is nshared_total
|
|
std::vector<HSharedObjectEntry> entries;
|
|
};
|
|
|
|
// PDF 1.4: Table F.9
|
|
struct HGeneric
|
|
{
|
|
HGeneric() :
|
|
first_object(0),
|
|
first_object_offset(0),
|
|
nobjects(0),
|
|
group_length(0)
|
|
{
|
|
}
|
|
|
|
int first_object; // 1
|
|
int first_object_offset; // 2
|
|
int nobjects; // 3
|
|
int group_length; // 4
|
|
};
|
|
|
|
// Other linearization data structures
|
|
|
|
// Initialized from Linearization Parameter dictionary
|
|
struct LinParameters
|
|
{
|
|
LinParameters() :
|
|
file_size(0),
|
|
first_page_object(0),
|
|
first_page_end(0),
|
|
npages(0),
|
|
xref_zero_offset(0),
|
|
first_page(0),
|
|
H_offset(0),
|
|
H_length(0)
|
|
{
|
|
}
|
|
|
|
int file_size; // /L
|
|
int first_page_object; // /O
|
|
int first_page_end; // /E
|
|
int npages; // /N
|
|
int xref_zero_offset; // /T
|
|
int first_page; // /P
|
|
int H_offset; // offset of primary hint stream
|
|
int H_length; // length of primary hint stream
|
|
};
|
|
|
|
// Computed hint table value data structures. These tables
|
|
// contain the computed values on which the hint table values are
|
|
// based. They exclude things like number of bits and store
|
|
// actual values instead of mins and deltas. File offsets are
|
|
// also absolute rather than being offset by the size of the
|
|
// primary hint table. We populate the hint table structures from
|
|
// these during writing and compare the hint table values with
|
|
// these during validation. We ignore some values for various
|
|
// reasons described in the code. Those values are omitted from
|
|
// these structures. Note also that object numbers are object
|
|
// numbers from the input file, not the output file.
|
|
|
|
// Naming convention: CHSomething is analogous to HSomething
|
|
// above. "CH" is computed hint.
|
|
|
|
struct CHPageOffsetEntry
|
|
{
|
|
CHPageOffsetEntry() :
|
|
nobjects(0),
|
|
nshared_objects(0)
|
|
{
|
|
}
|
|
|
|
int nobjects;
|
|
int nshared_objects;
|
|
// vectors' sizes = nshared_objects
|
|
std::vector<int> shared_identifiers;
|
|
};
|
|
|
|
struct CHPageOffset
|
|
{
|
|
// vector size is npages
|
|
std::vector<CHPageOffsetEntry> entries;
|
|
};
|
|
|
|
struct CHSharedObjectEntry
|
|
{
|
|
CHSharedObjectEntry(int object) :
|
|
object(object)
|
|
{
|
|
}
|
|
|
|
int object;
|
|
};
|
|
|
|
// PDF 1.4: Table F.5
|
|
struct CHSharedObject
|
|
{
|
|
CHSharedObject() :
|
|
first_shared_obj(0),
|
|
nshared_first_page(0),
|
|
nshared_total(0)
|
|
{
|
|
}
|
|
|
|
int first_shared_obj;
|
|
int nshared_first_page;
|
|
int nshared_total;
|
|
// vector size is nshared_total
|
|
std::vector<CHSharedObjectEntry> entries;
|
|
};
|
|
|
|
// No need for CHGeneric -- HGeneric is fine as is.
|
|
|
|
|
|
// Data structures to support optimization -- implemented in
|
|
// QPDF_optimization.cc
|
|
|
|
class ObjUser
|
|
{
|
|
public:
|
|
enum user_e
|
|
{
|
|
ou_bad,
|
|
ou_page,
|
|
ou_thumb,
|
|
ou_trailer_key,
|
|
ou_root_key,
|
|
ou_root
|
|
};
|
|
|
|
// type is set to ou_bad
|
|
ObjUser();
|
|
|
|
// type must be ou_root
|
|
ObjUser(user_e type);
|
|
|
|
// type must be one of ou_page or ou_thumb
|
|
ObjUser(user_e type, int pageno);
|
|
|
|
// type must be one of ou_trailer_key or ou_root_key
|
|
ObjUser(user_e type, std::string const& key);
|
|
|
|
bool operator<(ObjUser const&) const;
|
|
|
|
user_e ou_type;
|
|
int pageno; // if ou_page;
|
|
std::string key; // if ou_trailer_key or ou_root_key
|
|
};
|
|
|
|
// methods to support linearization checking -- implemented in
|
|
// QPDF_linearization.cc
|
|
void readLinearizationData();
|
|
bool checkLinearizationInternal();
|
|
void dumpLinearizationDataInternal();
|
|
QPDFObjectHandle readHintStream(Pipeline&, off_t offset, size_t length);
|
|
void readHPageOffset(BitStream);
|
|
void readHSharedObject(BitStream);
|
|
void readHGeneric(BitStream, HGeneric&);
|
|
int maxEnd(ObjUser const& ou);
|
|
int getLinearizationOffset(ObjGen const&);
|
|
QPDFObjectHandle getUncompressedObject(
|
|
QPDFObjectHandle&, std::map<int, int> const& object_stream_data);
|
|
int lengthNextN(int first_object, int n,
|
|
std::list<std::string>& errors);
|
|
void checkHPageOffset(std::list<std::string>& errors,
|
|
std::list<std::string>& warnings,
|
|
std::vector<QPDFObjectHandle> const& pages,
|
|
std::map<int, int>& idx_to_obj);
|
|
void checkHSharedObject(std::list<std::string>& warnings,
|
|
std::list<std::string>& errors,
|
|
std::vector<QPDFObjectHandle> const& pages,
|
|
std::map<int, int>& idx_to_obj);
|
|
void checkHOutlines(std::list<std::string>& warnings);
|
|
void dumpHPageOffset();
|
|
void dumpHSharedObject();
|
|
void dumpHGeneric(HGeneric&);
|
|
int adjusted_offset(int offset);
|
|
QPDFObjectHandle objGenToIndirect(ObjGen const&);
|
|
void calculateLinearizationData(
|
|
std::map<int, int> const& object_stream_data);
|
|
void pushOutlinesToPart(
|
|
std::vector<QPDFObjectHandle>& part,
|
|
std::set<ObjGen>& lc_outlines,
|
|
std::map<int, int> const& object_stream_data);
|
|
int outputLengthNextN(
|
|
int in_object, int n,
|
|
std::map<int, size_t> const& lengths,
|
|
std::map<int, int> const& obj_renumber);
|
|
void calculateHPageOffset(
|
|
std::map<int, QPDFXRefEntry> const& xref,
|
|
std::map<int, size_t> const& lengths,
|
|
std::map<int, int> const& obj_renumber);
|
|
void calculateHSharedObject(
|
|
std::map<int, QPDFXRefEntry> const& xref,
|
|
std::map<int, size_t> const& lengths,
|
|
std::map<int, int> const& obj_renumber);
|
|
void calculateHOutline(
|
|
std::map<int, QPDFXRefEntry> const& xref,
|
|
std::map<int, size_t> const& lengths,
|
|
std::map<int, int> const& obj_renumber);
|
|
void writeHPageOffset(BitWriter&);
|
|
void writeHSharedObject(BitWriter&);
|
|
void writeHGeneric(BitWriter&, HGeneric&);
|
|
|
|
|
|
// Methods to support optimization
|
|
|
|
void optimizePagesTree(
|
|
QPDFObjectHandle,
|
|
std::map<std::string, std::vector<QPDFObjectHandle> >&,
|
|
int& pageno, bool allow_changes);
|
|
void updateObjectMaps(ObjUser const& ou, QPDFObjectHandle oh);
|
|
void updateObjectMapsInternal(ObjUser const& ou, QPDFObjectHandle oh,
|
|
std::set<ObjGen>& visited, bool top);
|
|
void filterCompressedObjects(std::map<int, int> const& object_stream_data);
|
|
|
|
|
|
QPDFTokenizer tokenizer;
|
|
FileInputSource file;
|
|
std::string last_object_description;
|
|
bool encrypted;
|
|
bool encryption_initialized;
|
|
bool ignore_xref_streams;
|
|
bool suppress_warnings;
|
|
bool attempt_recovery;
|
|
int encryption_V;
|
|
bool encrypt_metadata;
|
|
std::map<std::string, encryption_method_e> crypt_filters;
|
|
encryption_method_e cf_stream;
|
|
encryption_method_e cf_string;
|
|
encryption_method_e cf_file;
|
|
std::string provided_password;
|
|
std::string user_password;
|
|
std::string encryption_key;
|
|
std::string cached_object_encryption_key;
|
|
int cached_key_objid;
|
|
int cached_key_generation;
|
|
std::string pdf_version;
|
|
std::map<ObjGen, QPDFXRefEntry> xref_table;
|
|
std::set<int> deleted_objects;
|
|
std::map<ObjGen, ObjCache> obj_cache;
|
|
QPDFObjectHandle trailer;
|
|
std::vector<QPDFObjectHandle> all_pages;
|
|
std::vector<QPDFExc> warnings;
|
|
|
|
// Linearization data
|
|
int first_xref_item_offset; // actual value from file
|
|
bool uncompressed_after_compressed;
|
|
|
|
// Linearization parameter dictionary and hint table data: may be
|
|
// read from file or computed prior to writing a linearized file
|
|
QPDFObjectHandle lindict;
|
|
LinParameters linp;
|
|
HPageOffset page_offset_hints;
|
|
HSharedObject shared_object_hints;
|
|
HGeneric outline_hints;
|
|
|
|
// Computed linearization data: used to populate above tables
|
|
// during writing and to compare with them during validation. c_
|
|
// means computed.
|
|
LinParameters c_linp;
|
|
CHPageOffset c_page_offset_data;
|
|
CHSharedObject c_shared_object_data;
|
|
HGeneric c_outline_data;
|
|
|
|
// Object ordering data for linearized files: initialized by
|
|
// calculateLinearizationData(). Part numbers refer to the PDF
|
|
// 1.4 specification.
|
|
std::vector<QPDFObjectHandle> part4;
|
|
std::vector<QPDFObjectHandle> part6;
|
|
std::vector<QPDFObjectHandle> part7;
|
|
std::vector<QPDFObjectHandle> part8;
|
|
std::vector<QPDFObjectHandle> part9;
|
|
|
|
// Optimization data
|
|
std::map<ObjUser, std::set<ObjGen> > obj_user_to_objects;
|
|
std::map<ObjGen, std::set<ObjUser> > object_to_obj_users;
|
|
};
|
|
|
|
#endif // __QPDF_HH__
|