2
1
mirror of https://github.com/qpdf/qpdf.git synced 2025-01-03 07:12:28 +00:00
qpdf/qpdf/test_renumber.cc
2023-05-21 13:35:09 -04:00

261 lines
7.7 KiB
C++

#include <qpdf/Constants.h>
#include <qpdf/QPDF.hh>
#include <qpdf/QPDFObjGen.hh>
#include <qpdf/QPDFObjectHandle.hh>
#include <qpdf/QPDFWriter.hh>
#include <qpdf/QPDFXRefEntry.hh>
#include <cstdlib>
#include <iostream>
#include <set>
#include <string>
#include <vector>
void
usage()
{
std::cerr << "Usage: test_renumber [OPTION] INPUT.pdf" << std::endl
<< "Option:" << std::endl
<< " --object-streams=preserve|disable|generate" << std::endl
<< " --linearize" << std::endl
<< " --preserve-unreferenced" << std::endl;
}
bool
compare(QPDFObjectHandle a, QPDFObjectHandle b)
{
static std::set<QPDFObjGen> visited;
if (a.isIndirect()) {
if (visited.count(a.getObjGen())) {
return true;
}
visited.insert(a.getObjGen());
}
if (a.getTypeCode() != b.getTypeCode()) {
std::cerr << "different type code" << std::endl;
return false;
}
switch (a.getTypeCode()) {
case ::ot_boolean:
if (a.getBoolValue() != b.getBoolValue()) {
std::cerr << "different boolean" << std::endl;
return false;
}
break;
case ::ot_integer:
if (a.getIntValue() != b.getIntValue()) {
std::cerr << "different integer" << std::endl;
return false;
}
break;
case ::ot_real:
if (a.getRealValue() != b.getRealValue()) {
std::cerr << "different real" << std::endl;
return false;
}
break;
case ::ot_string:
if (a.getStringValue() != b.getStringValue()) {
std::cerr << "different string" << std::endl;
return false;
}
break;
case ::ot_name:
if (a.getName() != b.getName()) {
std::cerr << "different name" << std::endl;
return false;
}
break;
case ::ot_array:
{
std::vector<QPDFObjectHandle> objs_a = a.getArrayAsVector();
std::vector<QPDFObjectHandle> objs_b = b.getArrayAsVector();
size_t items = objs_a.size();
if (items != objs_b.size()) {
std::cerr << "different array size" << std::endl;
return false;
}
for (size_t i = 0; i < items; ++i) {
if (!compare(objs_a[i], objs_b[i])) {
std::cerr << "different array item" << std::endl;
return false;
}
}
}
break;
case ::ot_dictionary:
{
std::set<std::string> keys_a = a.getKeys();
std::set<std::string> keys_b = b.getKeys();
if (keys_a != keys_b) {
std::cerr << "different dictionary keys" << std::endl;
return false;
}
for (auto const& key: keys_a) {
if (!compare(a.getKey(key), b.getKey(key))) {
std::cerr << "different dictionary item" << std::endl;
return false;
}
}
}
break;
case ::ot_null:
break;
case ::ot_stream:
std::cout << "stream objects are not compared" << std::endl;
break;
default:
std::cerr << "unknown object type" << std::endl;
std::exit(2);
}
return true;
}
bool
compare_xref_table(std::map<QPDFObjGen, QPDFXRefEntry> a, std::map<QPDFObjGen, QPDFXRefEntry> b)
{
if (a.size() != b.size()) {
std::cerr << "different size" << std::endl;
return false;
}
for (auto const& iter: a) {
std::cout << "xref entry for " << iter.first.getObj() << "/" << iter.first.getGen()
<< std::endl;
if (b.count(iter.first) == 0) {
std::cerr << "not found" << std::endl;
return false;
}
QPDFXRefEntry xref_a = iter.second;
QPDFXRefEntry xref_b = b[iter.first];
if (xref_a.getType() != xref_b.getType()) {
std::cerr << "different xref entry type" << std::endl;
return false;
}
switch (xref_a.getType()) {
case 0:
break;
case 1:
if (xref_a.getOffset() != xref_a.getOffset()) {
std::cerr << "different offset" << std::endl;
return false;
}
break;
case 2:
if (xref_a.getObjStreamNumber() != xref_a.getObjStreamNumber() ||
xref_a.getObjStreamIndex() != xref_a.getObjStreamIndex()) {
std::cerr << "different stream number or index" << std::endl;
return false;
}
break;
default:
std::cerr << "unknown xref entry type" << std::endl;
std::exit(2);
}
}
return true;
}
int
main(int argc, char* argv[])
{
if (argc < 2) {
usage();
std::exit(2);
}
qpdf_object_stream_e mode = qpdf_o_preserve;
bool blinearize = false;
bool bpreserve_unreferenced = false;
std::string filename_input;
for (int i = 1; i < argc; ++i) {
if (argv[i][0] == '-') {
std::string opt = argv[i];
if (opt == "--object-streams=preserve") {
mode = qpdf_o_preserve;
} else if (opt == "--object-streams=disable") {
mode = qpdf_o_disable;
} else if (opt == "--object-streams=generate") {
mode = qpdf_o_generate;
} else if (opt == "--linearize") {
blinearize = true;
} else if (opt == "--preserve-unreferenced") {
bpreserve_unreferenced = true;
} else {
usage();
std::exit(2);
}
} else if (argc == i + 1) {
filename_input = argv[i];
break;
} else {
usage();
std::exit(2);
}
}
try {
QPDF qpdf_in;
qpdf_in.processFile(filename_input.c_str());
std::vector<QPDFObjectHandle> objs_in = qpdf_in.getAllObjects();
QPDFWriter w(qpdf_in);
w.setOutputMemory();
w.setObjectStreamMode(mode);
w.setLinearization(blinearize);
w.setPreserveUnreferencedObjects(bpreserve_unreferenced);
w.write();
std::map<QPDFObjGen, QPDFXRefEntry> xrefs_w = w.getWrittenXRefTable();
auto buf = w.getBufferSharedPointer();
QPDF qpdf_ren;
qpdf_ren.processMemoryFile(
"renumbered", reinterpret_cast<char*>(buf->getBuffer()), buf->getSize());
std::map<QPDFObjGen, QPDFXRefEntry> xrefs_ren = qpdf_ren.getXRefTable();
std::cout << "--- compare between input and renumbered objects ---" << std::endl;
for (auto const& iter: objs_in) {
QPDFObjGen og_in = iter.getObjGen();
QPDFObjGen og_ren = w.getRenumberedObjGen(og_in);
std::cout << "input " << og_in.getObj() << "/" << og_in.getGen() << " -> renumbered "
<< og_ren.getObj() << "/" << og_ren.getGen() << std::endl;
if (og_ren.getObj() == 0) {
std::cout << "deleted" << std::endl;
continue;
}
if (!compare(iter, qpdf_ren.getObjectByObjGen(og_ren))) {
std::cerr << "different" << std::endl;
std::exit(2);
}
}
std::cout << "complete" << std::endl;
std::cout << "--- compare between written and reloaded xref tables ---" << std::endl;
if (!compare_xref_table(xrefs_w, xrefs_ren)) {
std::cerr << "different" << std::endl;
std::exit(2);
}
std::cout << "complete" << std::endl;
std::cout << "succeeded" << std::endl;
} catch (std::exception& e) {
std::cerr << e.what() << std::endl;
std::exit(2);
}
return 0;
}