2
1
mirror of https://github.com/qpdf/qpdf.git synced 2024-12-22 10:58:58 +00:00

Move QPDF::read_xrefEntry to QPDF::Xref_table

This commit is contained in:
m-holger 2024-08-10 11:47:02 +01:00
parent 3fbff84594
commit 253d3aee8f
3 changed files with 45 additions and 32 deletions

View File

@ -762,10 +762,6 @@ class QPDF
void setTrailer(QPDFObjectHandle obj); void setTrailer(QPDFObjectHandle obj);
void read_xref(qpdf_offset_t offset); void read_xref(qpdf_offset_t offset);
bool resolveXRefTable(); bool resolveXRefTable();
bool parse_xrefFirst(std::string const& line, int& obj, int& num, int& bytes);
bool read_xrefEntry(qpdf_offset_t& f1, int& f2, char& type);
bool read_bad_xrefEntry(qpdf_offset_t& f1, int& f2, char& type);
qpdf_offset_t read_xrefTable(qpdf_offset_t offset);
qpdf_offset_t read_xrefStream(qpdf_offset_t offset); qpdf_offset_t read_xrefStream(qpdf_offset_t offset);
qpdf_offset_t processXRefStream(qpdf_offset_t offset, QPDFObjectHandle& xref_stream); qpdf_offset_t processXRefStream(qpdf_offset_t offset, QPDFObjectHandle& xref_stream);
std::pair<int, std::array<int, 3>> std::pair<int, std::array<int, 3>>

View File

@ -723,7 +723,7 @@ QPDF::read_xref(qpdf_offset_t xref_offset)
while (QUtil::is_space(buf[skip])) { while (QUtil::is_space(buf[skip])) {
++skip; ++skip;
} }
xref_offset = read_xrefTable(xref_offset + skip); xref_offset = m->xref_table.read_table(xref_offset + skip);
} else { } else {
xref_offset = read_xrefStream(xref_offset); xref_offset = read_xrefStream(xref_offset);
} }
@ -769,7 +769,7 @@ QPDF::read_xref(qpdf_offset_t xref_offset)
} }
bool bool
QPDF::parse_xrefFirst(std::string const& line, int& obj, int& num, int& bytes) QPDF::Xref_table::parse_first(std::string const& line, int& obj, int& num, int& bytes)
{ {
// is_space and is_digit both return false on '\0', so this will not overrun the null-terminated // is_space and is_digit both return false on '\0', so this will not overrun the null-terminated
// buffer. // buffer.
@ -817,8 +817,10 @@ QPDF::parse_xrefFirst(std::string const& line, int& obj, int& num, int& bytes)
} }
bool bool
QPDF::read_bad_xrefEntry(qpdf_offset_t& f1, int& f2, char& type) QPDF::Xref_table::read_bad_entry(qpdf_offset_t& f1, int& f2, char& type)
{ {
auto* m = qpdf.m.get();
// Reposition after initial read attempt and reread. // Reposition after initial read attempt and reread.
m->file->seek(m->file->getLastOffset(), SEEK_SET); m->file->seek(m->file->getLastOffset(), SEEK_SET);
auto line = m->file->readLine(30); auto line = m->file->readLine(30);
@ -887,7 +889,7 @@ QPDF::read_bad_xrefEntry(qpdf_offset_t& f1, int& f2, char& type)
} }
if (invalid) { if (invalid) {
warn(damagedPDF("xref table", "accepting invalid xref table entry")); qpdf.warn(damaged_table("accepting invalid xref table entry"));
} }
f1 = QUtil::string_to_ll(f1_str.c_str()); f1 = QUtil::string_to_ll(f1_str.c_str());
@ -899,8 +901,10 @@ QPDF::read_bad_xrefEntry(qpdf_offset_t& f1, int& f2, char& type)
// Optimistically read and parse xref entry. If entry is bad, call read_bad_xrefEntry and return // Optimistically read and parse xref entry. If entry is bad, call read_bad_xrefEntry and return
// result. // result.
bool bool
QPDF::read_xrefEntry(qpdf_offset_t& f1, int& f2, char& type) QPDF::Xref_table::read_entry(qpdf_offset_t& f1, int& f2, char& type)
{ {
auto* m = qpdf.m.get();
std::array<char, 21> line; std::array<char, 21> line;
if (m->file->read(line.data(), 20) != 20) { if (m->file->read(line.data(), 20) != 20) {
// C++20: [[unlikely]] // C++20: [[unlikely]]
@ -948,13 +952,15 @@ QPDF::read_xrefEntry(qpdf_offset_t& f1, int& f2, char& type)
return true; return true;
} }
} }
return read_bad_xrefEntry(f1, f2, type); return read_bad_entry(f1, f2, type);
} }
// Read a single cross-reference table section and associated trailer. // Read a single cross-reference table section and associated trailer.
qpdf_offset_t qpdf_offset_t
QPDF::read_xrefTable(qpdf_offset_t xref_offset) QPDF::Xref_table::read_table(qpdf_offset_t xref_offset)
{ {
auto* m = qpdf.m.get();
m->file->seek(xref_offset, SEEK_SET); m->file->seek(xref_offset, SEEK_SET);
std::string line; std::string line;
while (true) { while (true) {
@ -963,33 +969,32 @@ QPDF::read_xrefTable(qpdf_offset_t xref_offset)
int obj = 0; int obj = 0;
int num = 0; int num = 0;
int bytes = 0; int bytes = 0;
if (!parse_xrefFirst(line, obj, num, bytes)) { if (!parse_first(line, obj, num, bytes)) {
QTC::TC("qpdf", "QPDF invalid xref"); QTC::TC("qpdf", "QPDF invalid xref");
throw damagedPDF("xref table", "xref syntax invalid"); throw damaged_table("xref syntax invalid");
} }
m->file->seek(m->file->getLastOffset() + bytes, SEEK_SET); m->file->seek(m->file->getLastOffset() + bytes, SEEK_SET);
for (qpdf_offset_t i = obj; i - num < obj; ++i) { for (qpdf_offset_t i = obj; i - num < obj; ++i) {
if (i == 0) { if (i == 0) {
// This is needed by checkLinearization() // This is needed by checkLinearization()
m->xref_table.first_item_offset = m->file->tell(); first_item_offset = m->file->tell();
} }
// For xref_table, these will always be small enough to be ints // For xref_table, these will always be small enough to be ints
qpdf_offset_t f1 = 0; qpdf_offset_t f1 = 0;
int f2 = 0; int f2 = 0;
char type = '\0'; char type = '\0';
if (!read_xrefEntry(f1, f2, type)) { if (!read_entry(f1, f2, type)) {
QTC::TC("qpdf", "QPDF invalid xref entry"); QTC::TC("qpdf", "QPDF invalid xref entry");
throw damagedPDF( throw damaged_table("invalid xref entry (obj=" + std::to_string(i) + ")");
"xref table", "invalid xref entry (obj=" + std::to_string(i) + ")");
} }
if (type == 'f') { if (type == 'f') {
m->xref_table.insert_free(QPDFObjGen(toI(i), f2)); insert_free(QPDFObjGen(toI(i), f2));
} else { } else {
m->xref_table.insert(toI(i), 1, f1, f2); insert(toI(i), 1, f1, f2);
} }
} }
qpdf_offset_t pos = m->file->tell(); qpdf_offset_t pos = m->file->tell();
if (readToken(*m->file).isWord("trailer")) { if (qpdf.readToken(*m->file).isWord("trailer")) {
break; break;
} else { } else {
m->file->seek(pos, SEEK_SET); m->file->seek(pos, SEEK_SET);
@ -997,35 +1002,35 @@ QPDF::read_xrefTable(qpdf_offset_t xref_offset)
} }
// Set offset to previous xref table if any // Set offset to previous xref table if any
QPDFObjectHandle cur_trailer = readTrailer(); auto cur_trailer = qpdf.readTrailer();
if (!cur_trailer.isDictionary()) { if (!cur_trailer.isDictionary()) {
QTC::TC("qpdf", "QPDF missing trailer"); QTC::TC("qpdf", "QPDF missing trailer");
throw damagedPDF("", "expected trailer dictionary"); throw qpdf.damagedPDF("", "expected trailer dictionary");
} }
if (!m->xref_table.trailer) { if (!trailer) {
setTrailer(cur_trailer); trailer = cur_trailer;
if (!m->xref_table.trailer.hasKey("/Size")) { if (!trailer.hasKey("/Size")) {
QTC::TC("qpdf", "QPDF trailer lacks size"); QTC::TC("qpdf", "QPDF trailer lacks size");
throw damagedPDF("trailer", "trailer dictionary lacks /Size key"); throw qpdf.damagedPDF("trailer", "trailer dictionary lacks /Size key");
} }
if (!m->xref_table.trailer.getKey("/Size").isInteger()) { if (!trailer.getKey("/Size").isInteger()) {
QTC::TC("qpdf", "QPDF trailer size not integer"); QTC::TC("qpdf", "QPDF trailer size not integer");
throw damagedPDF("trailer", "/Size key in trailer dictionary is not an integer"); throw qpdf.damagedPDF("trailer", "/Size key in trailer dictionary is not an integer");
} }
} }
if (cur_trailer.hasKey("/XRefStm")) { if (cur_trailer.hasKey("/XRefStm")) {
if (m->xref_table.ignore_streams) { if (ignore_streams) {
QTC::TC("qpdf", "QPDF ignoring XRefStm in trailer"); QTC::TC("qpdf", "QPDF ignoring XRefStm in trailer");
} else { } else {
if (cur_trailer.getKey("/XRefStm").isInteger()) { if (cur_trailer.getKey("/XRefStm").isInteger()) {
// Read the xref stream but disregard any return value -- we'll use our trailer's // Read the xref stream but disregard any return value -- we'll use our trailer's
// /Prev key instead of the xref stream's. // /Prev key instead of the xref stream's.
(void)read_xrefStream(cur_trailer.getKey("/XRefStm").getIntValue()); (void)qpdf.read_xrefStream(cur_trailer.getKey("/XRefStm").getIntValue());
} else { } else {
throw damagedPDF("xref stream", xref_offset, "invalid /XRefStm"); throw qpdf.damagedPDF("xref stream", xref_offset, "invalid /XRefStm");
} }
} }
} }
@ -1033,7 +1038,7 @@ QPDF::read_xrefTable(qpdf_offset_t xref_offset)
if (cur_trailer.hasKey("/Prev")) { if (cur_trailer.hasKey("/Prev")) {
if (!cur_trailer.getKey("/Prev").isInteger()) { if (!cur_trailer.getKey("/Prev").isInteger()) {
QTC::TC("qpdf", "QPDF trailer prev not integer"); QTC::TC("qpdf", "QPDF trailer prev not integer");
throw damagedPDF("trailer", "/Prev key in trailer dictionary is not an integer"); throw qpdf.damagedPDF("trailer", "/Prev key in trailer dictionary is not an integer");
} }
QTC::TC("qpdf", "QPDF prev key in trailer dictionary"); QTC::TC("qpdf", "QPDF prev key in trailer dictionary");
return cur_trailer.getKey("/Prev").getIntValue(); return cur_trailer.getKey("/Prev").getIntValue();

View File

@ -12,6 +12,8 @@ class QPDF::Xref_table: public std::map<QPDFObjGen, QPDFXRefEntry>
{ {
} }
qpdf_offset_t read_table(qpdf_offset_t offset);
void insert_reconstructed(int obj, qpdf_offset_t f1, int f2); void insert_reconstructed(int obj, qpdf_offset_t f1, int f2);
void insert(int obj, int f0, qpdf_offset_t f1, int f2); void insert(int obj, int f0, qpdf_offset_t f1, int f2);
void insert_free(QPDFObjGen); void insert_free(QPDFObjGen);
@ -33,12 +35,22 @@ class QPDF::Xref_table: public std::map<QPDFObjGen, QPDFXRefEntry>
qpdf_offset_t first_item_offset{0}; // actual value from file qpdf_offset_t first_item_offset{0}; // actual value from file
private: private:
bool parse_first(std::string const& line, int& obj, int& num, int& bytes);
bool read_entry(qpdf_offset_t& f1, int& f2, char& type);
bool read_bad_entry(qpdf_offset_t& f1, int& f2, char& type);
QPDFExc QPDFExc
damaged_pdf(std::string const& msg) damaged_pdf(std::string const& msg)
{ {
return qpdf.damagedPDF("", 0, msg); return qpdf.damagedPDF("", 0, msg);
} }
QPDFExc
damaged_table(std::string const& msg)
{
return qpdf.damagedPDF("xref table", msg);
}
void void
warn_damaged(std::string const& msg) warn_damaged(std::string const& msg)
{ {