2012-07-21 05:37:14 -04:00
|
|
|
#include <qpdf/FileInputSource.hh>
|
2022-02-04 16:31:31 -05:00
|
|
|
|
2012-07-21 05:37:14 -04:00
|
|
|
#include <qpdf/QPDFExc.hh>
|
2022-04-02 17:14:10 -04:00
|
|
|
#include <qpdf/QUtil.hh>
|
2013-11-29 10:20:50 -05:00
|
|
|
#include <algorithm>
|
2023-05-20 12:22:32 +01:00
|
|
|
#include <cstring>
|
2012-07-21 05:37:14 -04:00
|
|
|
|
2019-06-21 21:32:47 -04:00
|
|
|
// Build an input source that is not attached to any stream: the FILE* starts out null and
// close_file is cleared, so the destructor has nothing to close.
FileInputSource::FileInputSource() :
    close_file(false), file(nullptr)
{
}
|
|
|
|
|
2022-05-04 12:02:39 -04:00
|
|
|
// Open `filename` in binary read mode through QUtil::safe_fopen and remember its name. close_file
// is set, so the destructor closes the stream opened here.
FileInputSource::FileInputSource(char const* filename) :
    close_file(true), filename(filename), file(QUtil::safe_fopen(filename, "rb"))
{
}
|
|
|
|
|
2023-05-21 13:35:09 -04:00
|
|
|
// Wrap a stream supplied by the caller. `description` becomes the name returned by getName(), and
// the destructor closes `filep` only when `close_file` is true.
FileInputSource::FileInputSource(char const* description, FILE* filep, bool close_file) :
    close_file(close_file), filename(description), file(filep)
{
}
|
|
|
|
|
|
|
|
FileInputSource::~FileInputSource()
{
    // Must be explicit and not inline -- see QPDF_DLL_CLASS in README-maintainer

    // Close the stream only if one is attached and this object was asked to close it.
    bool const owns_open_stream = (file != nullptr) && close_file;
    if (owns_open_stream) {
        fclose(file);
    }
}
|
|
|
|
|
2012-07-21 05:37:14 -04:00
|
|
|
void
|
|
|
|
FileInputSource::setFilename(char const* filename)
|
|
|
|
{
|
2022-08-25 12:42:14 +01:00
|
|
|
this->close_file = true;
|
|
|
|
this->filename = filename;
|
|
|
|
this->file = QUtil::safe_fopen(filename, "rb");
|
2012-07-21 05:37:14 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
void
|
2022-04-02 17:14:10 -04:00
|
|
|
FileInputSource::setFile(char const* description, FILE* filep, bool close_file)
|
2012-07-21 05:37:14 -04:00
|
|
|
{
|
2022-08-25 12:42:14 +01:00
|
|
|
this->filename = description;
|
|
|
|
this->file = filep;
|
2012-07-21 05:37:14 -04:00
|
|
|
this->seek(0, SEEK_SET);
|
|
|
|
}
|
|
|
|
|
|
|
|
// Scan forward from the current position for the next '\r' or '\n'. Returns the offset of that
// character and leaves the stream positioned just past the whole run of '\r'/'\n' characters that
// starts there. If no such character is found before read() returns 0, returns the position
// reported by tell() at that point.
qpdf_offset_t
FileInputSource::findAndSkipNextEOL()
{
    char chunk[10240];
    for (;;) {
        qpdf_offset_t const chunk_start = QUtil::tell(this->file);
        size_t const n_read = this->read(chunk, sizeof(chunk));
        if (n_read == 0) {
            // Nothing more to read and no line terminator was seen.
            return this->tell();
        }

        char* cr = static_cast<char*>(memchr(chunk, '\r', n_read));
        char* lf = static_cast<char*>(memchr(chunk, '\n', n_read));
        char* eol = nullptr;
        if (cr && lf) {
            // Both occur in this chunk; the earlier one is the terminator we want.
            eol = std::min(cr, lf);
        } else {
            eol = cr ? cr : lf;
        }
        if (eol == nullptr) {
            // No terminator in this chunk; fetch the next one.
            continue;
        }

        qpdf_offset_t const eol_offset = chunk_start + (eol - chunk);
        // We found \r or \n. Keep reading until we get past \r and \n characters.
        this->seek(eol_offset + 1, SEEK_SET);
        char ch;
        while (this->read(&ch, 1) != 0) {
            if ((ch != '\r') && (ch != '\n')) {
                // First character of the next line: push it back and stop.
                this->unreadCh(ch);
                break;
            }
        }
        return eol_offset;
    }
}
|
|
|
|
|
|
|
|
std::string const&
|
|
|
|
FileInputSource::getName() const
|
|
|
|
{
|
2022-08-25 12:42:14 +01:00
|
|
|
return this->filename;
|
2012-07-21 05:37:14 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
// Report the current position of the underlying stream, as given by QUtil::tell.
qpdf_offset_t
FileInputSource::tell()
{
    qpdf_offset_t const position = QUtil::tell(file);
    return position;
}
|
|
|
|
|
|
|
|
void
|
|
|
|
FileInputSource::seek(qpdf_offset_t offset, int whence)
|
|
|
|
{
|
2022-08-25 14:05:36 +01:00
|
|
|
if (QUtil::seek(this->file, offset, whence) == -1) {
|
|
|
|
QUtil::throw_system_error(
|
2023-05-21 13:35:09 -04:00
|
|
|
std::string("seek to ") + this->filename + ", offset " + std::to_string(offset) + " (" +
|
|
|
|
std::to_string(whence) + ")");
|
2022-08-25 14:05:36 +01:00
|
|
|
}
|
2012-07-21 05:37:14 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
void
|
|
|
|
FileInputSource::rewind()
|
|
|
|
{
|
2022-08-25 12:42:14 +01:00
|
|
|
::rewind(this->file);
|
2012-07-21 05:37:14 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
size_t
|
|
|
|
FileInputSource::read(char* buffer, size_t length)
|
|
|
|
{
|
2022-08-25 15:08:03 +01:00
|
|
|
this->last_offset = QUtil::tell(this->file);
|
2022-08-25 12:42:14 +01:00
|
|
|
size_t len = fread(buffer, 1, length, this->file);
|
2022-04-02 17:14:10 -04:00
|
|
|
if (len == 0) {
|
2022-08-25 12:42:14 +01:00
|
|
|
if (ferror(this->file)) {
|
2022-04-02 17:14:10 -04:00
|
|
|
throw QPDFExc(
|
|
|
|
qpdf_e_system,
|
2022-08-25 12:42:14 +01:00
|
|
|
this->filename,
|
2022-04-02 17:14:10 -04:00
|
|
|
"",
|
|
|
|
this->last_offset,
|
2022-09-21 17:49:21 +01:00
|
|
|
(std::string("read ") + std::to_string(length) + " bytes"));
|
2022-04-02 17:14:10 -04:00
|
|
|
} else if (length > 0) {
|
2018-01-28 18:28:45 -05:00
|
|
|
this->seek(0, SEEK_END);
|
|
|
|
this->last_offset = this->tell();
|
|
|
|
}
|
2012-07-21 05:37:14 -04:00
|
|
|
}
|
|
|
|
return len;
|
|
|
|
}
|
|
|
|
|
|
|
|
void
|
|
|
|
FileInputSource::unreadCh(char ch)
|
|
|
|
{
|
2022-08-25 14:05:36 +01:00
|
|
|
if (ungetc(static_cast<unsigned char>(ch), this->file) == -1) {
|
|
|
|
QUtil::throw_system_error(this->filename + ": unread character");
|
|
|
|
}
|
2012-07-21 05:37:14 -04:00
|
|
|
}
|