2008-04-29 12:55:25 +00:00
|
|
|
#include <qpdf/Pl_QPDFTokenizer.hh>
|
2022-02-04 21:31:31 +00:00
|
|
|
|
2022-04-02 21:14:10 +00:00
|
|
|
#include <qpdf/BufferInputSource.hh>
|
2011-04-30 18:20:35 +00:00
|
|
|
#include <qpdf/QTC.hh>
|
2019-01-30 19:20:56 +00:00
|
|
|
#include <qpdf/QUtil.hh>
|
2009-09-26 18:36:04 +00:00
|
|
|
#include <stdexcept>
|
2008-05-04 16:02:53 +00:00
|
|
|
#include <string.h>
|
2008-04-29 12:55:25 +00:00
|
|
|
|
2018-02-02 23:21:34 +00:00
|
|
|
// Initial private state for the pipeline: the token filter pointer starts
// out null (the owning Pl_QPDFTokenizer constructor assigns it), and the
// internal buffer is constructed with the identifier "tokenizer buffer".
Pl_QPDFTokenizer::Members::Members() :
    filter(nullptr),
    buf("tokenizer buffer")
{
    // Nothing else to do; all state is set in the initializer list.
}
|
|
|
|
|
2022-04-02 21:14:10 +00:00
|
|
|
// Construct a tokenizing pipeline.
//
//   identifier - name forwarded to the Pipeline base class
//   filter     - token filter that will receive every token produced in
//                finish(); it is dereferenced there without a null check
//   next       - downstream pipeline; forwarded to the Pipeline base class
//                and also registered with the filter
Pl_QPDFTokenizer::Pl_QPDFTokenizer(
    char const* identifier,
    QPDFObjectHandle::TokenFilter* filter,
    Pipeline* next) :
    Pipeline(identifier, next),
    m(new Members)
{
    using FilterAccess = QPDFObjectHandle::TokenFilter::PipelineAccessor;

    // Remember the filter and tell it which pipeline is downstream. The
    // registration is undone (set back to nullptr) at the end of finish().
    m->filter = filter;
    FilterAccess::setPipeline(m->filter, next);

    // finish() loops until it sees a tt_eof token, so the tokenizer has to
    // be allowed to reach EOF. NOTE(review): includeIgnorable() presumably
    // makes whitespace/comment tokens visible to the filter -- confirm
    // against QPDFTokenizer.
    auto& tokenizer = m->tokenizer;
    tokenizer.allowEOF();
    tokenizer.includeIgnorable();
}
|
|
|
|
|
2018-02-02 23:21:34 +00:00
|
|
|
// Intentionally empty. The destructor has to be defined explicitly in this
// translation unit rather than inline in the header -- see the discussion
// of QPDF_DLL_CLASS in README-maintainer.
Pl_QPDFTokenizer::~Pl_QPDFTokenizer()
{
}
|
|
|
|
|
|
|
|
void
|
2022-05-03 21:43:07 +00:00
|
|
|
Pl_QPDFTokenizer::write(unsigned char const* data, size_t len)
|
2008-04-29 12:55:25 +00:00
|
|
|
{
|
2019-01-30 19:20:56 +00:00
|
|
|
this->m->buf.write(data, len);
|
2008-04-29 12:55:25 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
void
|
|
|
|
Pl_QPDFTokenizer::finish()
|
|
|
|
{
|
2019-01-30 19:20:56 +00:00
|
|
|
this->m->buf.finish();
|
2022-04-09 18:35:56 +00:00
|
|
|
auto input = std::shared_ptr<InputSource>(
|
2022-04-03 20:10:27 +00:00
|
|
|
// line-break
|
|
|
|
new BufferInputSource(
|
|
|
|
"tokenizer data", this->m->buf.getBuffer(), true));
|
2022-04-02 21:14:10 +00:00
|
|
|
|
|
|
|
while (true) {
|
2019-01-30 19:20:56 +00:00
|
|
|
QPDFTokenizer::Token token = this->m->tokenizer.readToken(
|
2022-09-21 16:49:21 +00:00
|
|
|
input, "offset " + std::to_string(input->tell()), true);
|
2022-02-08 14:18:08 +00:00
|
|
|
this->m->filter->handleToken(token);
|
2022-04-02 21:14:10 +00:00
|
|
|
if (token.getType() == QPDFTokenizer::tt_eof) {
|
2019-01-30 19:20:56 +00:00
|
|
|
break;
|
2022-09-29 13:33:11 +00:00
|
|
|
} else if (token.isWord("ID")) {
|
2019-01-31 04:24:09 +00:00
|
|
|
// Read the space after the ID.
|
|
|
|
char ch = ' ';
|
|
|
|
input->read(&ch, 1);
|
2022-04-03 20:10:27 +00:00
|
|
|
this->m->filter->handleToken(
|
|
|
|
// line-break
|
|
|
|
QPDFTokenizer::Token(
|
|
|
|
QPDFTokenizer::tt_space, std::string(1, ch)));
|
2019-01-30 19:20:56 +00:00
|
|
|
QTC::TC("qpdf", "Pl_QPDFTokenizer found ID");
|
|
|
|
this->m->tokenizer.expectInlineImage(input);
|
|
|
|
}
|
2008-04-29 12:55:25 +00:00
|
|
|
}
|
2018-02-02 23:21:34 +00:00
|
|
|
this->m->filter->handleEOF();
|
2022-07-26 11:37:50 +00:00
|
|
|
QPDFObjectHandle::TokenFilter::PipelineAccessor::setPipeline(
|
|
|
|
m->filter, nullptr);
|
2018-02-16 01:45:19 +00:00
|
|
|
Pipeline* next = this->getNext(true);
|
2022-04-02 21:14:10 +00:00
|
|
|
if (next) {
|
2018-02-16 01:45:19 +00:00
|
|
|
next->finish();
|
|
|
|
}
|
2008-04-29 12:55:25 +00:00
|
|
|
}
|