Don't interpret word tokens in content streams (fixes #82)

2024-12-22 02:49:00 +00:00 · 2017-07-26 05:35:34 -04:00 · 2017-07-26 05:35:34 -04:00 · 12db09898e
commit 12db09898e
parent 701b518d5c
2 changed files with 8 additions and 5 deletions
--- a/3
+++ b/3
@ -1,5 +1,8 @@
 2017-07-26  Jay Berkenbilt  <ejb@ql.org>

+	* Don't attempt to interpret syntactic keywords (like R and
+	endobj) found while parsing content streams.
+
 	* Detect infinite loops while resolving objects. This could happen
 	if something inside an object that had to be resolved during
 	parsing, such as a stream length, recursively referenced the
--- a/libqpdf/QPDFObjectHandle.cc
+++ b/libqpdf/QPDFObjectHandle.cc
@ -964,7 +964,11 @@ QPDFObjectHandle::parseInternal(PointerHolder<InputSource> input,
 	  case QPDFTokenizer::tt_word:
 	    {
 		std::string const& value = token.getValue();
-		if ((value == "R") && (in_array || in_dictionary) &&
+                if (content_stream)
+                {
+                    object = QPDFObjectHandle::newOperator(value);
+                }
+		else if ((value == "R") && (in_array || in_dictionary) &&
 		    (olist.size() >= 2) &&
                    (! olist.at(olist.size() - 1).isIndirect()) &&
 		    (olist.at(olist.size() - 1).isInteger()) &&
@ -996,10 +1000,6 @@ QPDFObjectHandle::parseInternal(PointerHolder<InputSource> input,
 		    input->seek(input->getLastOffset(), SEEK_SET);
                    empty = true;
 		}
-		else if (content_stream)
-                {
-                    object = QPDFObjectHandle::newOperator(token.getValue());
-                }
 		else
 		{
 		    throw QPDFExc(qpdf_e_damaged_pdf, input->getName(),