2008-04-29 12:55:25 +00:00
|
|
|
#include <qpdf/Pl_LZWDecoder.hh>
|
|
|
|
|
2019-06-21 03:35:23 +00:00
|
|
|
#include <qpdf/QIntC.hh>
|
2008-04-29 12:55:25 +00:00
|
|
|
#include <qpdf/QTC.hh>
|
2013-10-05 20:37:27 +00:00
|
|
|
#include <qpdf/QUtil.hh>
|
2023-05-20 11:22:32 +00:00
|
|
|
#include <cstring>
|
2009-09-26 18:36:04 +00:00
|
|
|
#include <stdexcept>
|
2008-04-29 12:55:25 +00:00
|
|
|
|
|
|
|
Pl_LZWDecoder::Pl_LZWDecoder(char const* identifier, Pipeline* next, bool early_code_change) :
|
|
|
|
Pipeline(identifier, next),
|
2024-08-07 16:20:19 +00:00
|
|
|
code_change_delta(early_code_change)
|
2008-04-29 12:55:25 +00:00
|
|
|
{
|
2024-08-07 16:20:19 +00:00
|
|
|
if (!next) {
|
|
|
|
throw std::logic_error("Attempt to create Pl_LZWDecoder with nullptr as next");
|
|
|
|
}
|
2008-04-29 12:55:25 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
void
|
2022-05-03 21:43:07 +00:00
|
|
|
Pl_LZWDecoder::write(unsigned char const* bytes, size_t len)
|
2008-04-29 12:55:25 +00:00
|
|
|
{
|
2012-06-20 15:20:57 +00:00
|
|
|
for (size_t i = 0; i < len; ++i) {
|
2024-08-07 16:20:19 +00:00
|
|
|
buf[next_char_++] = bytes[i];
|
|
|
|
if (next_char_ == 3) {
|
|
|
|
next_char_ = 0;
|
2022-02-08 14:18:08 +00:00
|
|
|
}
|
|
|
|
this->bits_available += 8;
|
|
|
|
if (this->bits_available >= this->code_size) {
|
|
|
|
sendNextCode();
|
|
|
|
}
|
2008-04-29 12:55:25 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
void
|
|
|
|
Pl_LZWDecoder::finish()
|
|
|
|
{
|
2024-08-07 16:20:19 +00:00
|
|
|
next()->finish();
|
2008-04-29 12:55:25 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
void
|
|
|
|
Pl_LZWDecoder::sendNextCode()
|
|
|
|
{
|
2019-06-21 03:35:23 +00:00
|
|
|
unsigned int high = this->byte_pos;
|
|
|
|
unsigned int med = (this->byte_pos + 1) % 3;
|
|
|
|
unsigned int low = (this->byte_pos + 2) % 3;
|
2008-04-29 12:55:25 +00:00
|
|
|
|
2019-06-21 03:35:23 +00:00
|
|
|
unsigned int bits_from_high = 8 - this->bit_pos;
|
|
|
|
unsigned int bits_from_med = this->code_size - bits_from_high;
|
|
|
|
unsigned int bits_from_low = 0;
|
2008-04-29 12:55:25 +00:00
|
|
|
if (bits_from_med > 8) {
|
2022-02-08 14:18:08 +00:00
|
|
|
bits_from_low = bits_from_med - 8;
|
|
|
|
bits_from_med = 8;
|
2008-04-29 12:55:25 +00:00
|
|
|
}
|
2019-06-21 03:35:23 +00:00
|
|
|
unsigned int high_mask = (1U << bits_from_high) - 1U;
|
|
|
|
unsigned int med_mask = 0xff - ((1U << (8 - bits_from_med)) - 1U);
|
|
|
|
unsigned int low_mask = 0xff - ((1U << (8 - bits_from_low)) - 1U);
|
|
|
|
unsigned int code = 0;
|
2008-04-29 12:55:25 +00:00
|
|
|
code += (this->buf[high] & high_mask) << bits_from_med;
|
|
|
|
code += ((this->buf[med] & med_mask) >> (8 - bits_from_med));
|
|
|
|
if (bits_from_low) {
|
2022-02-08 14:18:08 +00:00
|
|
|
code <<= bits_from_low;
|
|
|
|
code += ((this->buf[low] & low_mask) >> (8 - bits_from_low));
|
|
|
|
this->byte_pos = low;
|
|
|
|
this->bit_pos = bits_from_low;
|
2008-04-29 12:55:25 +00:00
|
|
|
} else {
|
2022-02-08 14:18:08 +00:00
|
|
|
this->byte_pos = med;
|
|
|
|
this->bit_pos = bits_from_med;
|
2008-04-29 12:55:25 +00:00
|
|
|
}
|
|
|
|
if (this->bit_pos == 8) {
|
2022-02-08 14:18:08 +00:00
|
|
|
this->bit_pos = 0;
|
|
|
|
++this->byte_pos;
|
|
|
|
this->byte_pos %= 3;
|
2008-04-29 12:55:25 +00:00
|
|
|
}
|
|
|
|
this->bits_available -= this->code_size;
|
|
|
|
|
|
|
|
handleCode(code);
|
|
|
|
}
|
|
|
|
|
|
|
|
unsigned char
|
2019-06-21 03:35:23 +00:00
|
|
|
Pl_LZWDecoder::getFirstChar(unsigned int code)
|
2008-04-29 12:55:25 +00:00
|
|
|
{
|
|
|
|
unsigned char result = '\0';
|
|
|
|
if (code < 256) {
|
2022-02-08 14:18:08 +00:00
|
|
|
result = static_cast<unsigned char>(code);
|
2013-10-05 20:37:27 +00:00
|
|
|
} else if (code > 257) {
|
2022-02-08 14:18:08 +00:00
|
|
|
unsigned int idx = code - 258;
|
|
|
|
if (idx >= table.size()) {
|
2013-10-05 20:37:27 +00:00
|
|
|
throw std::runtime_error("Pl_LZWDecoder::getFirstChar: table overflow");
|
|
|
|
}
|
2022-02-08 14:18:08 +00:00
|
|
|
Buffer& b = table.at(idx);
|
|
|
|
result = b.getBuffer()[0];
|
2013-10-05 20:37:27 +00:00
|
|
|
} else {
|
2019-08-26 01:23:19 +00:00
|
|
|
throw std::runtime_error(
|
2013-10-05 20:37:27 +00:00
|
|
|
"Pl_LZWDecoder::getFirstChar called with invalid code (" + std::to_string(code) + ")");
|
|
|
|
}
|
2008-04-29 12:55:25 +00:00
|
|
|
return result;
|
|
|
|
}
|
|
|
|
|
|
|
|
void
|
2024-08-07 16:20:19 +00:00
|
|
|
Pl_LZWDecoder::addToTable(unsigned char c)
|
2008-04-29 12:55:25 +00:00
|
|
|
{
|
|
|
|
unsigned int last_size = 0;
|
2022-07-26 11:37:50 +00:00
|
|
|
unsigned char const* last_data = nullptr;
|
2008-04-29 12:55:25 +00:00
|
|
|
unsigned char tmp[1];
|
|
|
|
|
|
|
|
if (this->last_code < 256) {
|
2022-02-08 14:18:08 +00:00
|
|
|
tmp[0] = static_cast<unsigned char>(this->last_code);
|
|
|
|
last_data = tmp;
|
|
|
|
last_size = 1;
|
2013-10-05 20:37:27 +00:00
|
|
|
} else if (this->last_code > 257) {
|
2022-02-08 14:18:08 +00:00
|
|
|
unsigned int idx = this->last_code - 258;
|
|
|
|
if (idx >= table.size()) {
|
2013-10-05 20:37:27 +00:00
|
|
|
throw std::runtime_error("Pl_LZWDecoder::addToTable: table overflow");
|
|
|
|
}
|
2022-02-08 14:18:08 +00:00
|
|
|
Buffer& b = table.at(idx);
|
|
|
|
last_data = b.getBuffer();
|
|
|
|
last_size = QIntC::to_uint(b.getSize());
|
2013-10-05 20:37:27 +00:00
|
|
|
} else {
|
2019-08-26 01:23:19 +00:00
|
|
|
throw std::runtime_error(
|
2013-10-05 20:37:27 +00:00
|
|
|
"Pl_LZWDecoder::addToTable called with invalid code (" +
|
2022-09-21 16:49:21 +00:00
|
|
|
std::to_string(this->last_code) + ")");
|
2013-10-05 20:37:27 +00:00
|
|
|
}
|
2008-04-29 12:55:25 +00:00
|
|
|
|
|
|
|
Buffer entry(1 + last_size);
|
|
|
|
unsigned char* new_data = entry.getBuffer();
|
|
|
|
memcpy(new_data, last_data, last_size);
|
2024-08-07 16:20:19 +00:00
|
|
|
new_data[last_size] = c;
|
2023-05-25 13:10:47 +00:00
|
|
|
this->table.push_back(std::move(entry));
|
2008-04-29 12:55:25 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
void
|
2019-06-21 03:35:23 +00:00
|
|
|
Pl_LZWDecoder::handleCode(unsigned int code)
|
2008-04-29 12:55:25 +00:00
|
|
|
{
|
|
|
|
if (this->eod) {
|
2022-02-08 14:18:08 +00:00
|
|
|
return;
|
2008-04-29 12:55:25 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
if (code == 256) {
|
2022-02-08 14:18:08 +00:00
|
|
|
if (!this->table.empty()) {
|
|
|
|
QTC::TC("libtests", "Pl_LZWDecoder intermediate reset");
|
|
|
|
}
|
|
|
|
this->table.clear();
|
|
|
|
this->code_size = 9;
|
2008-04-29 12:55:25 +00:00
|
|
|
} else if (code == 257) {
|
2022-02-08 14:18:08 +00:00
|
|
|
this->eod = true;
|
2008-04-29 12:55:25 +00:00
|
|
|
} else {
|
2022-02-08 14:18:08 +00:00
|
|
|
if (this->last_code != 256) {
|
|
|
|
// Add to the table from last time. New table entry would be what we read last plus the
|
|
|
|
// first character of what we're reading now.
|
2024-08-07 16:20:19 +00:00
|
|
|
unsigned char next_c = '\0';
|
2022-02-08 14:18:08 +00:00
|
|
|
unsigned int table_size = QIntC::to_uint(table.size());
|
|
|
|
if (code < 256) {
|
2024-08-07 16:20:19 +00:00
|
|
|
// just read < 256; last time's next_c was code
|
|
|
|
next_c = static_cast<unsigned char>(code);
|
2022-02-08 14:18:08 +00:00
|
|
|
} else if (code > 257) {
|
|
|
|
size_t idx = code - 258;
|
|
|
|
if (idx > table_size) {
|
|
|
|
throw std::runtime_error("LZWDecoder: bad code received");
|
|
|
|
} else if (idx == table_size) {
|
|
|
|
// The encoder would have just created this entry, so the first character of
|
|
|
|
// this entry would have been the same as the first character of the last entry.
|
|
|
|
QTC::TC("libtests", "Pl_LZWDecoder last was table size");
|
2024-08-07 16:20:19 +00:00
|
|
|
next_c = getFirstChar(this->last_code);
|
2022-02-08 14:18:08 +00:00
|
|
|
} else {
|
2024-08-07 16:20:19 +00:00
|
|
|
next_c = getFirstChar(code);
|
2022-02-08 14:18:08 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
unsigned int new_idx = 258 + table_size;
|
|
|
|
if (new_idx == 4096) {
|
|
|
|
throw std::runtime_error("LZWDecoder: table full");
|
|
|
|
}
|
2024-08-07 16:20:19 +00:00
|
|
|
addToTable(next_c);
|
2022-02-08 14:18:08 +00:00
|
|
|
unsigned int change_idx = new_idx + code_change_delta;
|
|
|
|
if ((change_idx == 511) || (change_idx == 1023) || (change_idx == 2047)) {
|
|
|
|
++this->code_size;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (code < 256) {
|
2023-05-20 12:34:53 +00:00
|
|
|
auto ch = static_cast<unsigned char>(code);
|
2024-08-07 16:20:19 +00:00
|
|
|
next()->write(&ch, 1);
|
2022-02-08 14:18:08 +00:00
|
|
|
} else {
|
2019-08-26 01:23:19 +00:00
|
|
|
unsigned int idx = code - 258;
|
|
|
|
if (idx >= table.size()) {
|
|
|
|
throw std::runtime_error("Pl_LZWDecoder::handleCode: table overflow");
|
|
|
|
}
|
2022-02-08 14:18:08 +00:00
|
|
|
Buffer& b = table.at(idx);
|
2024-08-07 16:20:19 +00:00
|
|
|
next()->write(b.getBuffer(), b.getSize());
|
2022-02-08 14:18:08 +00:00
|
|
|
}
|
2008-04-29 12:55:25 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
this->last_code = code;
|
|
|
|
}
|