| Index: core/src/fpdfapi/fpdf_parser/cpdf_hint_tables.cpp
|
| diff --git a/core/src/fpdfapi/fpdf_parser/cpdf_hint_tables.cpp b/core/src/fpdfapi/fpdf_parser/cpdf_hint_tables.cpp
|
| new file mode 100644
|
| index 0000000000000000000000000000000000000000..09148ba76a617c581bde4c7c0b1aa5cad2e558a7
|
| --- /dev/null
|
| +++ b/core/src/fpdfapi/fpdf_parser/cpdf_hint_tables.cpp
|
| @@ -0,0 +1,467 @@
|
| +// Copyright 2016 PDFium Authors. All rights reserved.
|
| +// Use of this source code is governed by a BSD-style license that can be
|
| +// found in the LICENSE file.
|
| +
|
| +// Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com
|
| +
|
| +#include "core/src/fpdfapi/fpdf_parser/cpdf_hint_tables.h"
|
| +
|
| +#include "core/include/fxcrt/fx_safe_types.h"
|
| +#include "core/include/fpdfapi/fpdf_objects.h"
|
| +#include "core/src/fpdfapi/fpdf_parser/cpdf_data_avail.h"
|
| +
|
| +namespace {
|
| +
|
| +// Returns true when |num_bits| holds a valid value and |hStream| still has at
|
| +// least that many bits left to read.
|
| +bool CanReadFromBitStream(const CFX_BitStream* hStream,
|
| +                          const FX_SAFE_DWORD& num_bits) {
|
| +  if (!num_bits.IsValid())
|
| +    return false;
|
| +
|
| +  return hStream->BitsRemaining() >= num_bits.ValueOrDie();
|
| +}
|
| +
|
| +}  // namespace
|
| +
|
| +// Empties the four DWORD arrays that the hint table readers populate.
|
| +CPDF_HintTables::~CPDF_HintTables() {
|
| +  m_dwIdentifierArray.RemoveAll();
|
| +  m_dwSharedObjNumArray.RemoveAll();
|
| +  m_dwNSharedObjsArray.RemoveAll();
|
| +  m_dwDeltaNObjsArray.RemoveAll();
|
| +}
|
| +
|
| +// Returns the length of item |index|, i.e. the distance between
|
| +// szArray[index] and szArray[index + 1]. Returns 0 when |index| is negative,
|
| +// when |szArray| has no entry following |index|, or when the item's offset
|
| +// is greater than the offset that follows it.
|
| +FX_DWORD CPDF_HintTables::GetItemLength(
|
| +    int index,
|
| +    const std::vector<FX_FILESIZE>& szArray) {
|
| +  if (index < 0)
|
| +    return 0;
|
| +
|
| +  // An item needs both its own offset and the one after it.
|
| +  const size_t nCount = szArray.size();
|
| +  if (nCount < 2 || static_cast<size_t>(index) > nCount - 2)
|
| +    return 0;
|
| +
|
| +  const FX_FILESIZE szBegin = szArray[index];
|
| +  const FX_FILESIZE szEnd = szArray[index + 1];
|
| +  if (szBegin > szEnd)
|
| +    return 0;
|
| +
|
| +  return szEnd - szBegin;
|
| +}
|
| +
|
| +// Parses the page offset hint table starting at the current position of
|
| +// |hStream|. Fills m_szFirstPageObjOffset, m_dwDeltaNObjsArray,
|
| +// m_szPageOffsetArray, m_dwNSharedObjsArray and m_dwIdentifierArray.
|
| +//
|
| +// Returns FALSE when |hStream| is null, at EOF or too short for the data it
|
| +// declares, when a size computation overflows, when the linearization
|
| +// dictionary entries "H", "N" or "E" are missing or invalid, or when "P" does
|
| +// not name one of the "N" pages. Arrays filled before a failure is detected
|
| +// are left as they are.
|
| +FX_BOOL CPDF_HintTables::ReadPageHintTable(CFX_BitStream* hStream) {
|
| +  if (!hStream || hStream->IsEOF())
|
| +    return FALSE;
|
| +
|
| +  int nStreamOffset = ReadPrimaryHintStreamOffset();
|
| +  int nStreamLen = ReadPrimaryHintStreamLength();
|
| +  if (nStreamOffset < 0 || nStreamLen < 1)
|
| +    return FALSE;
|
| +
|
| +  // Items 1-13 read below add up to 288 bits.
|
| +  const FX_DWORD kHeaderSize = 288;
|
| +  if (hStream->BitsRemaining() < kHeaderSize)
|
| +    return FALSE;
|
| +
|
| +  // Item 1: The least number of objects in a page.
|
| +  FX_DWORD dwObjLeastNum = hStream->GetBits(32);
|
| +
|
| +  // Item 2: The location of the first page's page object.
|
| +  FX_DWORD dwFirstObjLoc = hStream->GetBits(32);
|
| +  // Locations past the hint stream's offset get the hint stream length
|
| +  // added. |nStreamOffset| is known to be non-negative here, so the cast
|
| +  // keeps its value.
|
| +  if (dwFirstObjLoc > static_cast<FX_DWORD>(nStreamOffset)) {
|
| +    FX_SAFE_DWORD safeLoc = pdfium::base::checked_cast<FX_DWORD>(nStreamLen);
|
| +    safeLoc += dwFirstObjLoc;
|
| +    if (!safeLoc.IsValid())
|
| +      return FALSE;
|
| +    m_szFirstPageObjOffset =
|
| +        pdfium::base::checked_cast<FX_FILESIZE>(safeLoc.ValueOrDie());
|
| +  } else {
|
| +    m_szFirstPageObjOffset =
|
| +        pdfium::base::checked_cast<FX_FILESIZE>(dwFirstObjLoc);
|
| +  }
|
| +
|
| +  // Item 3: The number of bits needed to represent the difference
|
| +  // between the greatest and least number of objects in a page.
|
| +  FX_DWORD dwDeltaObjectsBits = hStream->GetBits(16);
|
| +
|
| +  // Item 4: The least length of a page in bytes.
|
| +  FX_DWORD dwPageLeastLen = hStream->GetBits(32);
|
| +
|
| +  // Item 5: The number of bits needed to represent the difference
|
| +  // between the greatest and least length of a page, in bytes.
|
| +  FX_DWORD dwDeltaPageLenBits = hStream->GetBits(16);
|
| +
|
| +  // Skip Item 6, 7, 8, 9 total 96 bits.
|
| +  hStream->SkipBits(96);
|
| +
|
| +  // Item 10: The number of bits needed to represent the greatest
|
| +  // number of shared object references.
|
| +  FX_DWORD dwSharedObjBits = hStream->GetBits(16);
|
| +
|
| +  // Item 11: The number of bits needed to represent the numerically
|
| +  // greatest shared object identifier used by the pages.
|
| +  FX_DWORD dwSharedIdBits = hStream->GetBits(16);
|
| +
|
| +  // Item 12: The number of bits needed to represent the numerator of
|
| +  // the fractional position for each shared object reference. For each
|
| +  // shared object referenced from a page, there is an indication of
|
| +  // where in the page's content stream the object is first referenced.
|
| +  FX_DWORD dwSharedNumeratorBits = hStream->GetBits(16);
|
| +
|
| +  // Item 13: Skip Item 13 which has 16 bits.
|
| +  hStream->SkipBits(16);
|
| +
|
| +  CPDF_Object* pPageNum = m_pLinearizedDict->GetElementValue("N");
|
| +  int nPages = pPageNum ? pPageNum->GetInteger() : 0;
|
| +  if (nPages < 1)
|
| +    return FALSE;
|
| +
|
| +  // Per-page object counts: one |dwDeltaObjectsBits|-wide delta per page,
|
| +  // stored with the least count added back.
|
| +  FX_SAFE_DWORD required_bits = dwDeltaObjectsBits;
|
| +  required_bits *= pdfium::base::checked_cast<FX_DWORD>(nPages);
|
| +  if (!CanReadFromBitStream(hStream, required_bits))
|
| +    return FALSE;
|
| +
|
| +  for (int i = 0; i < nPages; ++i) {
|
| +    FX_SAFE_DWORD safeDeltaObj = hStream->GetBits(dwDeltaObjectsBits);
|
| +    safeDeltaObj += dwObjLeastNum;
|
| +    if (!safeDeltaObj.IsValid())
|
| +      return FALSE;
|
| +    m_dwDeltaNObjsArray.Add(safeDeltaObj.ValueOrDie());
|
| +  }
|
| +  hStream->ByteAlign();
|
| +
|
| +  // Per-page lengths: one |dwDeltaPageLenBits|-wide delta per page, stored
|
| +  // with the least length added back.
|
| +  required_bits = dwDeltaPageLenBits;
|
| +  required_bits *= pdfium::base::checked_cast<FX_DWORD>(nPages);
|
| +  if (!CanReadFromBitStream(hStream, required_bits))
|
| +    return FALSE;
|
| +
|
| +  CFX_DWordArray dwPageLenArray;
|
| +  for (int i = 0; i < nPages; ++i) {
|
| +    FX_SAFE_DWORD safePageLen = hStream->GetBits(dwDeltaPageLenBits);
|
| +    safePageLen += dwPageLeastLen;
|
| +    if (!safePageLen.IsValid())
|
| +      return FALSE;
|
| +    dwPageLenArray.Add(safePageLen.ValueOrDie());
|
| +  }
|
| +
|
| +  CPDF_Object* pOffsetE = m_pLinearizedDict->GetElementValue("E");
|
| +  int nOffsetE = pOffsetE ? pOffsetE->GetInteger() : -1;
|
| +  if (nOffsetE < 0)
|
| +    return FALSE;
|
| +
|
| +  CPDF_Object* pFirstPageNum = m_pLinearizedDict->GetElementValue("P");
|
| +  int nFirstPageNum = pFirstPageNum ? pFirstPageNum->GetInteger() : 0;
|
| +  // "P" comes from the file. A value outside [0, nPages) is rejected: with
|
| +  // P == -1 the loop below would take the "page after the first page" branch
|
| +  // at i == 0 and index the offset array at i - 2.
|
| +  if (nFirstPageNum < 0 || nFirstPageNum >= nPages)
|
| +    return FALSE;
|
| +
|
| +  // Build the page offsets. The first page sits at m_szFirstPageObjOffset;
|
| +  // the remaining pages are laid out back to back starting at "E", so the
|
| +  // page right after the first page continues from the page before the first
|
| +  // page (or starts at "E" when the first page is page 0).
|
| +  for (int i = 0; i < nPages; ++i) {
|
| +    if (i == nFirstPageNum) {
|
| +      m_szPageOffsetArray.push_back(m_szFirstPageObjOffset);
|
| +    } else if (i == nFirstPageNum + 1) {
|
| +      if (i == 1) {
|
| +        m_szPageOffsetArray.push_back(nOffsetE);
|
| +      } else {
|
| +        m_szPageOffsetArray.push_back(m_szPageOffsetArray[i - 2] +
|
| +                                      dwPageLenArray[i - 2]);
|
| +      }
|
| +    } else {
|
| +      if (i == 0) {
|
| +        m_szPageOffsetArray.push_back(nOffsetE);
|
| +      } else {
|
| +        m_szPageOffsetArray.push_back(m_szPageOffsetArray[i - 1] +
|
| +                                      dwPageLenArray[i - 1]);
|
| +      }
|
| +    }
|
| +  }
|
| +
|
| +  // Trailing entry marking the end of the last page, so that
|
| +  // GetItemLength() works for every page index. |nPages| is at least 1 here.
|
| +  m_szPageOffsetArray.push_back(m_szPageOffsetArray[nPages - 1] +
|
| +                                dwPageLenArray[nPages - 1]);
|
| +  hStream->ByteAlign();
|
| +
|
| +  // Number of shared objects.
|
| +  required_bits = dwSharedObjBits;
|
| +  required_bits *= pdfium::base::checked_cast<FX_DWORD>(nPages);
|
| +  if (!CanReadFromBitStream(hStream, required_bits))
|
| +    return FALSE;
|
| +
|
| +  for (int i = 0; i < nPages; i++)
|
| +    m_dwNSharedObjsArray.Add(hStream->GetBits(dwSharedObjBits));
|
| +  hStream->ByteAlign();
|
| +
|
| +  // Array of identifiers, size = nshared_objects.
|
| +  for (int i = 0; i < nPages; i++) {
|
| +    const FX_DWORD dwSharedObjCount = m_dwNSharedObjsArray[i];
|
| +    required_bits = dwSharedIdBits;
|
| +    required_bits *= dwSharedObjCount;
|
| +    if (!CanReadFromBitStream(hStream, required_bits))
|
| +      return FALSE;
|
| +
|
| +    // The count is an unsigned value read from the file, so the counter is
|
| +    // unsigned as well.
|
| +    for (FX_DWORD j = 0; j < dwSharedObjCount; j++)
|
| +      m_dwIdentifierArray.Add(hStream->GetBits(dwSharedIdBits));
|
| +  }
|
| +  hStream->ByteAlign();
|
| +
|
| +  // Skip the per-reference numerators (|dwSharedNumeratorBits| bits each).
|
| +  for (int i = 0; i < nPages; i++) {
|
| +    FX_SAFE_DWORD safeSize = m_dwNSharedObjsArray[i];
|
| +    safeSize *= dwSharedNumeratorBits;
|
| +    if (!CanReadFromBitStream(hStream, safeSize))
|
| +      return FALSE;
|
| +
|
| +    hStream->SkipBits(safeSize.ValueOrDie());
|
| +  }
|
| +  hStream->ByteAlign();
|
| +
|
| +  // Skip one more |dwDeltaPageLenBits|-wide entry per page.
|
| +  FX_SAFE_DWORD safeTotalPageLen = pdfium::base::checked_cast<FX_DWORD>(nPages);
|
| +  safeTotalPageLen *= dwDeltaPageLenBits;
|
| +  if (!CanReadFromBitStream(hStream, safeTotalPageLen))
|
| +    return FALSE;
|
| +
|
| +  hStream->SkipBits(safeTotalPageLen.ValueOrDie());
|
| +  hStream->ByteAlign();
|
| +  return TRUE;
|
| +}
|
| +
|
| +// Parses the shared object hint table located |offset| bytes into
|
| +// |hStream|. Fills m_nFirstPageSharedObjs, m_dwSharedObjNumArray and
|
| +// m_szSharedObjOffsetArray (one offset per shared object group plus a
|
| +// trailing end offset).
|
| +//
|
| +// Returns FALSE when |hStream| is null, at EOF, already positioned past
|
| +// |offset| or too short for the data it declares, when the linearization
|
| +// dictionary entries "H" or "O" are missing or invalid, or when any object
|
| +// number or offset computed from the table does not fit its type. Values
|
| +// read from the table are untrusted, so range problems are reported by
|
| +// returning FALSE rather than through checked_cast, which would abort.
|
| +FX_BOOL CPDF_HintTables::ReadSharedObjHintTable(CFX_BitStream* hStream,
|
| +                                                FX_DWORD offset) {
|
| +  if (!hStream || hStream->IsEOF())
|
| +    return FALSE;
|
| +
|
| +  int nStreamOffset = ReadPrimaryHintStreamOffset();
|
| +  int nStreamLen = ReadPrimaryHintStreamLength();
|
| +  if (nStreamOffset < 0 || nStreamLen < 1)
|
| +    return FALSE;
|
| +
|
| +  // Advance to the start of the table; the stream cannot be moved backwards.
|
| +  FX_SAFE_DWORD bit_offset = offset;
|
| +  bit_offset *= 8;
|
| +  if (!bit_offset.IsValid() || hStream->GetPos() > bit_offset.ValueOrDie())
|
| +    return FALSE;
|
| +  hStream->SkipBits(bit_offset.ValueOrDie() - hStream->GetPos());
|
| +
|
| +  // Items 1-7 read below add up to 192 bits.
|
| +  const FX_DWORD kHeaderSize = 192;
|
| +  if (hStream->BitsRemaining() < kHeaderSize)
|
| +    return FALSE;
|
| +
|
| +  // Item 1: The object number of the first object in the shared objects
|
| +  // section.
|
| +  FX_DWORD dwFirstSharedObjNum = hStream->GetBits(32);
|
| +
|
| +  // Item 2: The location of the first object in the shared objects section.
|
| +  FX_DWORD dwFirstSharedObjLoc = hStream->GetBits(32);
|
| +  // Locations past the hint stream's offset get the hint stream length
|
| +  // added; the addition is checked the same way ReadPageHintTable() does it.
|
| +  // |nStreamOffset| is non-negative and |nStreamLen| positive at this point.
|
| +  if (dwFirstSharedObjLoc > static_cast<FX_DWORD>(nStreamOffset)) {
|
| +    FX_SAFE_DWORD safeFirstLoc =
|
| +        pdfium::base::checked_cast<FX_DWORD>(nStreamLen);
|
| +    safeFirstLoc += dwFirstSharedObjLoc;
|
| +    if (!safeFirstLoc.IsValid())
|
| +      return FALSE;
|
| +    dwFirstSharedObjLoc = safeFirstLoc.ValueOrDie();
|
| +  }
|
| +
|
| +  // Item 3: The number of shared object entries for the first page.
|
| +  m_nFirstPageSharedObjs = hStream->GetBits(32);
|
| +  // Unsigned copy so every comparison against the unsigned loop index below
|
| +  // is well defined.
|
| +  const FX_DWORD dwFirstPageSharedObjs = m_nFirstPageSharedObjs;
|
| +
|
| +  // Item 4: The number of shared object entries for the shared objects
|
| +  // section, including the number of shared object entries for the first page.
|
| +  FX_DWORD dwSharedObjTotal = hStream->GetBits(32);
|
| +
|
| +  // Item 5: The number of bits needed to represent the greatest number of
|
| +  // objects in a shared object group. Skipped.
|
| +  hStream->SkipBits(16);
|
| +
|
| +  // Item 6: The least length of a shared object group in bytes.
|
| +  FX_DWORD dwGroupLeastLen = hStream->GetBits(32);
|
| +
|
| +  // Item 7: The number of bits needed to represent the difference between the
|
| +  // greatest and least length of a shared object group, in bytes.
|
| +  FX_DWORD dwDeltaGroupLen = hStream->GetBits(16);
|
| +  CPDF_Object* pFirstPageObj = m_pLinearizedDict->GetElementValue("O");
|
| +  int nFirstPageObjNum = pFirstPageObj ? pFirstPageObj->GetInteger() : -1;
|
| +  if (nFirstPageObjNum < 0)
|
| +    return FALSE;
|
| +
|
| +  FX_DWORD dwPrevObjLen = 0;
|
| +  FX_DWORD dwCurObjLen = 0;
|
| +  FX_SAFE_DWORD required_bits = dwSharedObjTotal;
|
| +  required_bits *= dwDeltaGroupLen;
|
| +  if (!CanReadFromBitStream(hStream, required_bits))
|
| +    return FALSE;
|
| +
|
| +  // One entry per shared object group. Entries below the first-page count
|
| +  // are numbered from "O" and start at the first page's offset; the
|
| +  // remaining ones are numbered from item 1 and start at item 2. Within each
|
| +  // run, a group begins where the previous one ended.
|
| +  for (FX_DWORD i = 0; i < dwSharedObjTotal; ++i) {
|
| +    dwPrevObjLen = dwCurObjLen;
|
| +    FX_SAFE_DWORD safeObjLen = hStream->GetBits(dwDeltaGroupLen);
|
| +    safeObjLen += dwGroupLeastLen;
|
| +    if (!safeObjLen.IsValid())
|
| +      return FALSE;
|
| +
|
| +    dwCurObjLen = safeObjLen.ValueOrDie();
|
| +    if (i < dwFirstPageSharedObjs) {
|
| +      m_dwSharedObjNumArray.Add(nFirstPageObjNum + i);
|
| +      if (i == 0)
|
| +        m_szSharedObjOffsetArray.push_back(m_szFirstPageObjOffset);
|
| +    } else {
|
| +      FX_SAFE_DWORD safeObjNum = dwFirstSharedObjNum;
|
| +      safeObjNum += i - dwFirstPageSharedObjs;
|
| +      if (!safeObjNum.IsValid())
|
| +        return FALSE;
|
| +
|
| +      m_dwSharedObjNumArray.Add(safeObjNum.ValueOrDie());
|
| +      if (i == dwFirstPageSharedObjs) {
|
| +        // Becomes invalid, instead of aborting, when the location does not
|
| +        // fit in an int32_t.
|
| +        FX_SAFE_INT32 safeStartLoc = dwFirstSharedObjLoc;
|
| +        if (!safeStartLoc.IsValid())
|
| +          return FALSE;
|
| +
|
| +        m_szSharedObjOffsetArray.push_back(safeStartLoc.ValueOrDie());
|
| +      }
|
| +    }
|
| +
|
| +    if (i != 0 && i != dwFirstPageSharedObjs) {
|
| +      FX_SAFE_INT32 safeLoc = dwPrevObjLen;
|
| +      safeLoc += m_szSharedObjOffsetArray[i - 1];
|
| +      if (!safeLoc.IsValid())
|
| +        return FALSE;
|
| +
|
| +      m_szSharedObjOffsetArray.push_back(safeLoc.ValueOrDie());
|
| +    }
|
| +  }
|
| +
|
| +  // Trailing entry marking the end of the last group, so that
|
| +  // GetItemLength() works for every group index.
|
| +  if (dwSharedObjTotal > 0) {
|
| +    FX_SAFE_INT32 safeLoc = dwCurObjLen;
|
| +    safeLoc += m_szSharedObjOffsetArray[dwSharedObjTotal - 1];
|
| +    if (!safeLoc.IsValid())
|
| +      return FALSE;
|
| +
|
| +    m_szSharedObjOffsetArray.push_back(safeLoc.ValueOrDie());
|
| +  }
|
| +
|
| +  // Skip one bit per shared object entry that follows the length array.
|
| +  hStream->ByteAlign();
|
| +  if (hStream->BitsRemaining() < dwSharedObjTotal)
|
| +    return FALSE;
|
| +
|
| +  hStream->SkipBits(dwSharedObjTotal);
|
| +  hStream->ByteAlign();
|
| +  return TRUE;
|
| +}
|
| +
|
| +// Reports where page |index| is stored.
|
| +//
|
| +// On success |szPageStartPos| receives the page's offset from
|
| +// m_szPageOffsetArray, |szPageLength| the value GetItemLength() derives for
|
| +// it (0 when no length can be derived), and |dwObjNum| the page's first
|
| +// object number: the "O" entry for the first page ("P", default 0), otherwise
|
| +// 1 plus the m_dwDeltaNObjsArray entries of all preceding pages except the
|
| +// first page.
|
| +//
|
| +// Returns FALSE when there is no linearization dictionary, when |index| has
|
| +// no entry in the page tables, or when the dictionary has no "O" entry.
|
| +// |szPageStartPos| and |szPageLength| may already have been written when
|
| +// FALSE is returned.
|
| +FX_BOOL CPDF_HintTables::GetPagePos(int index,
|
| +                                    FX_FILESIZE& szPageStartPos,
|
| +                                    FX_FILESIZE& szPageLength,
|
| +                                    FX_DWORD& dwObjNum) {
|
| +  if (!m_pLinearizedDict)
|
| +    return FALSE;
|
| +
|
| +  // |index| is caller supplied; never subscript the offset table with a
|
| +  // value it has no entry for.
|
| +  if (index < 0 ||
|
| +      static_cast<size_t>(index) >= m_szPageOffsetArray.size()) {
|
| +    return FALSE;
|
| +  }
|
| +
|
| +  szPageStartPos = m_szPageOffsetArray[index];
|
| +  szPageLength = GetItemLength(index, m_szPageOffsetArray);
|
| +
|
| +  CPDF_Object* pFirstPageNum = m_pLinearizedDict->GetElementValue("P");
|
| +  int nFirstPageNum = pFirstPageNum ? pFirstPageNum->GetInteger() : 0;
|
| +
|
| +  CPDF_Object* pFirstPageObjNum = m_pLinearizedDict->GetElementValue("O");
|
| +  if (!pFirstPageObjNum)
|
| +    return FALSE;
|
| +
|
| +  int nFirstPageObjNum = pFirstPageObjNum->GetInteger();
|
| +  if (index == nFirstPageNum) {
|
| +    dwObjNum = nFirstPageObjNum;
|
| +    return TRUE;
|
| +  }
|
| +
|
| +  // The loop below reads entries [0, index) of the per-page object counts.
|
| +  if (index > m_dwDeltaNObjsArray.GetSize())
|
| +    return FALSE;
|
| +
|
| +  // The object number of remaining pages starts from 1.
|
| +  dwObjNum = 1;
|
| +  for (int i = 0; i < index; ++i) {
|
| +    if (i == nFirstPageNum)
|
| +      continue;
|
| +    dwObjNum += m_dwDeltaNObjsArray[i];
|
| +  }
|
| +  return TRUE;
|
| +}
|
| +
|
| +// Checks whether the data for page |index| and for the shared objects it
|
| +// references is available, asking m_pDataAvail about each byte range and
|
| +// passing |pHints| along. The first page ("P", default 0) is reported as
|
| +// available without further checks. Returns DataError when the dictionary or
|
| +// |pHints| is missing, when a page or shared object length comes out as 0,
|
| +// or when "O" is missing or negative.
|
| +IPDF_DataAvail::DocAvailStatus CPDF_HintTables::CheckPage(
|
| +    int index,
|
| +    IPDF_DataAvail::DownloadHints* pHints) {
|
| +  if (!m_pLinearizedDict || !pHints)
|
| +    return IPDF_DataAvail::DataError;
|
| +
|
| +  CPDF_Object* pFirstPage = m_pLinearizedDict->GetElementValue("P");
|
| +  const int nFirstPage = pFirstPage ? pFirstPage->GetInteger() : 0;
|
| +  if (index == nFirstPage)
|
| +    return IPDF_DataAvail::DataAvailable;
|
| +
|
| +  // If two pages have the same offset, it should be treated as an error.
|
| +  FX_DWORD dwPageLen = GetItemLength(index, m_szPageOffsetArray);
|
| +  if (!dwPageLen)
|
| +    return IPDF_DataAvail::DataError;
|
| +
|
| +  if (!m_pDataAvail->IsDataAvail(m_szPageOffsetArray[index], dwPageLen,
|
| +                                 pHints)) {
|
| +    return IPDF_DataAvail::DataNotAvailable;
|
| +  }
|
| +
|
| +  // Download data of shared objects in the page. This page's identifiers
|
| +  // follow those of all preceding pages in m_dwIdentifierArray.
|
| +  FX_DWORD dwFirstIdentifier = 0;
|
| +  for (int nPage = 0; nPage < index; ++nPage)
|
| +    dwFirstIdentifier += m_dwNSharedObjsArray[nPage];
|
| +
|
| +  CPDF_Object* pFirstPageObj = m_pLinearizedDict->GetElementValue("O");
|
| +  int nFirstPageObjNum = pFirstPageObj ? pFirstPageObj->GetInteger() : -1;
|
| +  if (nFirstPageObjNum < 0)
|
| +    return IPDF_DataAvail::DataError;
|
| +
|
| +  for (int j = 0; j < m_dwNSharedObjsArray[index]; ++j) {
|
| +    FX_DWORD dwIndex = m_dwIdentifierArray[dwFirstIdentifier + j];
|
| +    if (dwIndex >= m_dwSharedObjNumArray.GetSize())
|
| +      return IPDF_DataAvail::DataNotAvailable;
|
| +
|
| +    // Objects numbered within the first page's shared object range are not
|
| +    // checked again.
|
| +    FX_DWORD dwObjNum = m_dwSharedObjNumArray[dwIndex];
|
| +    const bool bInFirstPage =
|
| +        dwObjNum >= nFirstPageObjNum &&
|
| +        dwObjNum < nFirstPageObjNum + m_nFirstPageSharedObjs;
|
| +    if (bInFirstPage)
|
| +      continue;
|
| +
|
| +    // If two objects have the same offset, it should be treated as an error.
|
| +    FX_DWORD dwObjLen = GetItemLength(dwIndex, m_szSharedObjOffsetArray);
|
| +    if (!dwObjLen)
|
| +      return IPDF_DataAvail::DataError;
|
| +
|
| +    if (!m_pDataAvail->IsDataAvail(m_szSharedObjOffsetArray[dwIndex], dwObjLen,
|
| +                                   pHints)) {
|
| +      return IPDF_DataAvail::DataNotAvailable;
|
| +    }
|
| +  }
|
| +  return IPDF_DataAvail::DataAvailable;
|
| +}
|
| +
|
| +// Loads |pHintStream| and parses the page offset hint table followed by the
|
| +// shared object hint table, whose byte offset inside the stream data comes
|
| +// from the stream dictionary's "S" entry. Returns FALSE when the stream or
|
| +// linearization dictionary is missing, when "S" is absent, not a number, not
|
| +// positive or beyond the stream data, when the data is shorter than the two
|
| +// table headers, or when either table fails to parse.
|
| +FX_BOOL CPDF_HintTables::LoadHintStream(CPDF_Stream* pHintStream) {
|
| +  if (!pHintStream || !m_pLinearizedDict)
|
| +    return FALSE;
|
| +
|
| +  CPDF_Dictionary* pDict = pHintStream->GetDict();
|
| +  if (!pDict)
|
| +    return FALSE;
|
| +
|
| +  CPDF_Object* pOffset = pDict->GetElement("S");
|
| +  if (!pOffset || !pOffset->IsNumber())
|
| +    return FALSE;
|
| +
|
| +  const int shared_hint_table_offset = pOffset->GetInteger();
|
| +
|
| +  CPDF_StreamAcc acc;
|
| +  acc.LoadAllData(pHintStream);
|
| +  const FX_DWORD size = acc.GetSize();
|
| +
|
| +  // The header section of page offset hint table is 36 bytes.
|
| +  // The header section of shared object hint table is 24 bytes.
|
| +  // Hint table has at least 60 bytes.
|
| +  const FX_DWORD MIN_STREAM_LEN = 60;
|
| +  if (size < MIN_STREAM_LEN)
|
| +    return FALSE;
|
| +
|
| +  if (shared_hint_table_offset <= 0)
|
| +    return FALSE;
|
| +
|
| +  if (size < shared_hint_table_offset)
|
| +    return FALSE;
|
| +
|
| +  // The offset is known to be positive here, so the cast cannot fail.
|
| +  const FX_DWORD dwSharedTableOffset =
|
| +      pdfium::base::checked_cast<FX_DWORD>(shared_hint_table_offset);
|
| +
|
| +  CFX_BitStream bs;
|
| +  bs.Init(acc.GetData(), size);
|
| +  return ReadPageHintTable(&bs) &&
|
| +         ReadSharedObjHintTable(&bs, dwSharedTableOffset);
|
| +}
|
| +
|
| +// Returns element 0 of the linearization dictionary's "H" array as an
|
| +// integer, or -1 when the dictionary, the array or the element is missing.
|
| +int CPDF_HintTables::ReadPrimaryHintStreamOffset() const {
|
| +  CPDF_Array* pRange =
|
| +      m_pLinearizedDict ? m_pLinearizedDict->GetArrayBy("H") : nullptr;
|
| +  CPDF_Object* pStreamOffset = pRange ? pRange->GetElementValue(0) : nullptr;
|
| +  return pStreamOffset ? pStreamOffset->GetInteger() : -1;
|
| +}
|
| +
|
| +// Returns element 1 of the linearization dictionary's "H" array as an
|
| +// integer, or -1 when the dictionary, the array or the element is missing.
|
| +int CPDF_HintTables::ReadPrimaryHintStreamLength() const {
|
| +  CPDF_Array* pRange =
|
| +      m_pLinearizedDict ? m_pLinearizedDict->GetArrayBy("H") : nullptr;
|
| +  CPDF_Object* pStreamLen = pRange ? pRange->GetElementValue(1) : nullptr;
|
| +  return pStreamLen ? pStreamLen->GetInteger() : -1;
|
| +}
|
|
|