Skip to content

Commit

Permalink
Merge pull request #187 from galkahana/parsing-corrections
Browse files Browse the repository at this point in the history
xref parsing corrections
  • Loading branch information
galkahana authored Dec 11, 2022
2 parents 24a9817 + a5a4862 commit f9e0631
Show file tree
Hide file tree
Showing 2 changed files with 25 additions and 30 deletions.
51 changes: 23 additions & 28 deletions PDFWriter/PDFParser.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -539,10 +539,6 @@ EStatusCode PDFParser::DetermineXrefSize()
else
{
mXrefSize = (ObjectIDType)aSize->GetValue();
if(mXrefSize > MAX_XREF_SIZE) {
TRACE_LOG("PDFParser::DetermineXrefSize, invalid value for xref size");
return PDFHummus::eFailure;
}
return PDFHummus::eSuccess;
}
}
Expand All @@ -558,10 +554,17 @@ typedef BoxingBaseWithRW<unsigned long> ULong;
typedef BoxingBaseWithRW<LongFilePositionType> LongFilePositionTypeBox;


void PDFParser::ExtendXrefToSize(XrefEntryInputVector& inXrefTable, ObjectIDType inXrefSize) {
if(inXrefTable.size() < inXrefSize) {
inXrefTable.insert(inXrefTable.end(), inXrefSize-inXrefTable.size(), scEmptyEntry);
EStatusCode PDFParser::ExtendXrefToSize(XrefEntryInputVector& inXrefTable, ObjectIDType inXrefSize) {
if (inXrefTable.size() >= inXrefSize)
return eSuccess;

if(inXrefSize > MAX_XREF_SIZE) {
TRACE_LOG("PDFParser::ExtendXrefToSize, invalid value for section length");
return eFailure;
}

inXrefTable.insert(inXrefTable.end(), inXrefSize-inXrefTable.size(), scEmptyEntry);
return eSuccess;
}

static const std::string scXref = "xref";
Expand Down Expand Up @@ -635,11 +638,6 @@ EStatusCode PDFParser::ParseXrefFromXrefTable(XrefEntryInputVector& inXrefTable,
if(ObjectIDTypeBox(token.second) == 0)
continue; // probably will never happen
firstNonSectionObject = currentObject + ObjectIDTypeBox(token.second);
if(firstNonSectionObject > MAX_XREF_SIZE) {
TRACE_LOG("PDFParser::ParseXref, invalid value for section length");
status = PDFHummus::eFailure;
break;
}

// if the segment declared objects above the xref size, consult policy on what to do
if(firstNonSectionObject > inXrefSize && mAllowExtendingSegments)
Expand All @@ -658,7 +656,9 @@ EStatusCode PDFParser::ParseXrefFromXrefTable(XrefEntryInputVector& inXrefTable,
if(currentObject < inXrefSize)
{
// make sure we have enough room
ExtendXrefToSize(inXrefTable, currentObject+1);
status = ExtendXrefToSize(inXrefTable, currentObject+1);
if (status != eSuccess)
break;

inXrefTable[currentObject].mObjectPosition = LongFilePositionTypeBox(std::string((const char*)entry, 10));
inXrefTable[currentObject].mRivision = ULong(std::string((const char*)(entry + 11), 5));
Expand Down Expand Up @@ -1093,7 +1093,7 @@ EStatusCode PDFParser::ParsePreviousXrefs(PDFDictionary* inTrailer)
break;
}

MergeXrefWithMainXref(aTable,readTableSize);
status = MergeXrefWithMainXref(aTable,readTableSize);
}
while(false);
return status;
Expand Down Expand Up @@ -1216,19 +1216,23 @@ EStatusCode PDFParser::ParsePreviousFileDirectory(LongFilePositionType inXrefPos
return status;
}

void PDFParser::MergeXrefWithMainXref(XrefEntryInputVector& inTableToMerge, ObjectIDType inMergedTableSize)
EStatusCode PDFParser::MergeXrefWithMainXref(XrefEntryInputVector& inTableToMerge, ObjectIDType inMergedTableSize)
{
if(inMergedTableSize > mXrefSize)
mXrefSize = inMergedTableSize;

// make sure we have enough room
ExtendXrefToSize(mXrefTable, inTableToMerge.size());
EStatusCode status = ExtendXrefToSize(mXrefTable, inTableToMerge.size());
if(status != eSuccess)
return status;

for(ObjectIDType i = 0; i < inTableToMerge.size(); ++i) // iterate by input table size which is what we actually want to read from (and not the logical size)
{
if(inTableToMerge[i].mType != eXrefEntryUndefined)
mXrefTable[i] = inTableToMerge[i];
}

return eSuccess;
}


Expand Down Expand Up @@ -1507,11 +1511,6 @@ EStatusCode PDFParser::ParseXrefFromXrefStream(XrefEntryInputVector& inXrefTable

// if reading objects past expected range interesting consult policy
ObjectIDType readXrefSize = (ObjectIDType)xrefSize->GetValue();
if(readXrefSize > MAX_XREF_SIZE) {
TRACE_LOG("PDFParser::ParseXrefFromXrefStream, invalid value for section length");
status = PDFHummus::eFailure;
break;
}

if(readXrefSize > inXrefSize)
{
Expand Down Expand Up @@ -1555,11 +1554,6 @@ EStatusCode PDFParser::ParseXrefFromXrefStream(XrefEntryInputVector& inXrefTable
}
ObjectIDType objectsCount = (ObjectIDType)segmentValue->GetValue();
ObjectIDType readXrefSize = startObject + objectsCount;
if(readXrefSize > MAX_XREF_SIZE) {
TRACE_LOG("PDFParser::ParseXrefFromXrefStream, invalid value for section length");
status = PDFHummus::eFailure;
break;
}

// if reading objects past expected range interesting consult policy
if(readXrefSize > inXrefSize)
Expand Down Expand Up @@ -1610,8 +1604,9 @@ EStatusCode PDFParser::ReadXrefStreamSegment(XrefEntryInputVector& inXrefTable,
long long entryType;

// make sure we have enough room
ExtendXrefToSize(inXrefTable, objectToRead+1);

status = ExtendXrefToSize(inXrefTable, objectToRead+1);
if(status != PDFHummus::eSuccess)
break;
status = ReadXrefSegmentValue(inReadFrom,inEntryWidths[0],entryType);
if(status != PDFHummus::eSuccess)
break;
Expand Down
4 changes: 2 additions & 2 deletions PDFWriter/PDFParser.h
Original file line number Diff line number Diff line change
Expand Up @@ -216,7 +216,7 @@ class PDFParser
PDFHummus::EStatusCode ParsePagesIDs(PDFDictionary* inPageNode,ObjectIDType inNodeObjectID);
PDFHummus::EStatusCode ParsePagesIDs(PDFDictionary* inPageNode,ObjectIDType inNodeObjectID,unsigned long& ioCurrentPageIndex);
PDFHummus::EStatusCode ParsePreviousXrefs(PDFDictionary* inTrailer);
void MergeXrefWithMainXref(XrefEntryInputVector& inTableToMerge,ObjectIDType inMergedTableSize);
PDFHummus::EStatusCode MergeXrefWithMainXref(XrefEntryInputVector& inTableToMerge,ObjectIDType inMergedTableSize);
PDFHummus::EStatusCode ParseFileDirectory();
PDFHummus::EStatusCode BuildXrefTableAndTrailerFromXrefStream(long long inXrefStreamObjectID);
// an overload for cases where the xref stream object is already parsed
Expand Down Expand Up @@ -263,5 +263,5 @@ class PDFParser
void GoBackTillLineStart();
bool IsPDFWhiteSpace(IOBasicTypes::Byte inCharacter);

void ExtendXrefToSize(XrefEntryInputVector& inXrefTable, ObjectIDType inXrefSize);
PDFHummus::EStatusCode ExtendXrefToSize(XrefEntryInputVector& inXrefTable, ObjectIDType inXrefSize);
};

0 comments on commit f9e0631

Please sign in to comment.