| OLD | NEW |
| 1 // Copyright 2014 PDFium Authors. All rights reserved. | 1 // Copyright 2014 PDFium Authors. All rights reserved. |
| 2 // Use of this source code is governed by a BSD-style license that can be | 2 // Use of this source code is governed by a BSD-style license that can be |
| 3 // found in the LICENSE file. | 3 // found in the LICENSE file. |
| 4 | 4 |
| 5 // Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com | 5 // Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com |
| 6 | 6 |
| 7 #include "core/include/fpdfapi/fpdf_parser.h" | 7 #include "core/include/fpdfapi/fpdf_parser.h" |
| 8 | 8 |
| 9 #include <algorithm> | 9 #include <algorithm> |
| 10 #include <memory> | 10 #include <memory> |
| (...skipping 590 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 601 const FX_FILESIZE saved_pos = pos; | 601 const FX_FILESIZE saved_pos = pos; |
| 602 bool bOverFlow = false; | 602 bool bOverFlow = false; |
| 603 FX_DWORD size = std::min((FX_DWORD)(m_Syntax.m_FileLen - pos), kBufferSize); | 603 FX_DWORD size = std::min((FX_DWORD)(m_Syntax.m_FileLen - pos), kBufferSize); |
| 604 if (!m_Syntax.m_pFileAccess->ReadBlock(buffer.data(), pos, size)) | 604 if (!m_Syntax.m_pFileAccess->ReadBlock(buffer.data(), pos, size)) |
| 605 break; | 605 break; |
| 606 | 606 |
| 607 for (FX_DWORD i = 0; i < size; i++) { | 607 for (FX_DWORD i = 0; i < size; i++) { |
| 608 uint8_t byte = buffer[i]; | 608 uint8_t byte = buffer[i]; |
| 609 switch (state) { | 609 switch (state) { |
| 610 case ParserState::kDefault: | 610 case ParserState::kDefault: |
| 611 if (PDFCharIsWhitespace(byte)) | 611 if (PDFCharIsWhitespace(byte)) { |
| 612 state = ParserState::kWhitespace; | 612 state = ParserState::kWhitespace; |
| 613 | 613 } else if (std::isdigit(byte)) { |
| 614 if (std::isdigit(byte)) { | |
| 615 --i; | 614 --i; |
| 616 state = ParserState::kWhitespace; | 615 state = ParserState::kWhitespace; |
| 617 } | 616 } else if (byte == '%') { |
| 618 | |
| 619 if (byte == '%') { | |
| 620 inside_index = 0; | 617 inside_index = 0; |
| 621 state = ParserState::kComment; | 618 state = ParserState::kComment; |
| 622 } | 619 } else if (byte == '(') { |
| 623 | |
| 624 if (byte == '(') { | |
| 625 state = ParserState::kString; | 620 state = ParserState::kString; |
| 626 depth = 1; | 621 depth = 1; |
| 627 } | 622 } else if (byte == '<') { |
| 628 | |
| 629 if (byte == '<') { | |
| 630 inside_index = 1; | 623 inside_index = 1; |
| 631 state = ParserState::kHexString; | 624 state = ParserState::kHexString; |
| 632 } | 625 } else if (byte == '\\') { |
| 633 | |
| 634 if (byte == '\\') | |
| 635 state = ParserState::kEscapedString; | 626 state = ParserState::kEscapedString; |
| 636 | 627 } else if (byte == 't') { |
| 637 if (byte == 't') { | |
| 638 state = ParserState::kTrailer; | 628 state = ParserState::kTrailer; |
| 639 inside_index = 1; | 629 inside_index = 1; |
| 640 } | 630 } |
| 641 break; | 631 break; |
| 642 | 632 |
| 643 case ParserState::kWhitespace: | 633 case ParserState::kWhitespace: |
| 644 if (PDFCharIsWhitespace(byte)) { | 634 if (std::isdigit(byte)) { |
| 645 break; | |
| 646 } else if (std::isdigit(byte)) { | |
| 647 start_pos = pos + i; | 635 start_pos = pos + i; |
| 648 state = ParserState::kObjNum; | 636 state = ParserState::kObjNum; |
| 649 objnum = FXSYS_toDecimalDigit(byte); | 637 objnum = FXSYS_toDecimalDigit(byte); |
| 650 | |
| 651 } else if (byte == 't') { | 638 } else if (byte == 't') { |
| 652 state = ParserState::kTrailer; | 639 state = ParserState::kTrailer; |
| 653 inside_index = 1; | 640 inside_index = 1; |
| 654 | |
| 655 } else if (byte == 'x') { | 641 } else if (byte == 'x') { |
| 656 state = ParserState::kXref; | 642 state = ParserState::kXref; |
| 657 inside_index = 1; | 643 inside_index = 1; |
| 658 | 644 } else if (!PDFCharIsWhitespace(byte)) { |
| 659 } else { | |
| 660 --i; | 645 --i; |
| 661 state = ParserState::kDefault; | 646 state = ParserState::kDefault; |
| 662 } | 647 } |
| 663 break; | 648 break; |
| 664 | 649 |
| 665 case ParserState::kObjNum: | 650 case ParserState::kObjNum: |
| 666 if (std::isdigit(byte)) { | 651 if (std::isdigit(byte)) { |
| 667 objnum = objnum * 10 + FXSYS_toDecimalDigit(byte); | 652 objnum = objnum * 10 + FXSYS_toDecimalDigit(byte); |
| 668 break; | |
| 669 } else if (PDFCharIsWhitespace(byte)) { | 653 } else if (PDFCharIsWhitespace(byte)) { |
| 670 state = ParserState::kPostObjNum; | 654 state = ParserState::kPostObjNum; |
| 671 } else { | 655 } else { |
| 672 --i; | 656 --i; |
| 673 state = ParserState::kEndObj; | 657 state = ParserState::kEndObj; |
| 674 inside_index = 0; | 658 inside_index = 0; |
| 675 } | 659 } |
| 676 break; | 660 break; |
| 677 | 661 |
| 678 case ParserState::kPostObjNum: | 662 case ParserState::kPostObjNum: |
| 679 if (std::isdigit(byte)) { | 663 if (std::isdigit(byte)) { |
| 680 start_pos1 = pos + i; | 664 start_pos1 = pos + i; |
| 681 state = ParserState::kGenNum; | 665 state = ParserState::kGenNum; |
| 682 gennum = FXSYS_toDecimalDigit(byte); | 666 gennum = FXSYS_toDecimalDigit(byte); |
| 683 } else if (PDFCharIsWhitespace(byte)) { | |
| 684 break; | |
| 685 } else if (byte == 't') { | 667 } else if (byte == 't') { |
| 686 state = ParserState::kTrailer; | 668 state = ParserState::kTrailer; |
| 687 inside_index = 1; | 669 inside_index = 1; |
| 688 } else { | 670 } else if (!PDFCharIsWhitespace(byte)) { |
| 689 --i; | 671 --i; |
| 690 state = ParserState::kDefault; | 672 state = ParserState::kDefault; |
| 691 } | 673 } |
| 692 break; | 674 break; |
| 693 | 675 |
| 694 case ParserState::kGenNum: | 676 case ParserState::kGenNum: |
| 695 if (std::isdigit(byte)) { | 677 if (std::isdigit(byte)) { |
| 696 gennum = gennum * 10 + FXSYS_toDecimalDigit(byte); | 678 gennum = gennum * 10 + FXSYS_toDecimalDigit(byte); |
| 697 break; | |
| 698 } else if (PDFCharIsWhitespace(byte)) { | 679 } else if (PDFCharIsWhitespace(byte)) { |
| 699 state = ParserState::kPostGenNum; | 680 state = ParserState::kPostGenNum; |
| 700 } else { | 681 } else { |
| 701 --i; | 682 --i; |
| 702 state = ParserState::kDefault; | 683 state = ParserState::kDefault; |
| 703 } | 684 } |
| 704 break; | 685 break; |
| 705 | 686 |
| 706 case ParserState::kPostGenNum: | 687 case ParserState::kPostGenNum: |
| 707 if (byte == 'o') { | 688 if (byte == 'o') { |
| 708 state = ParserState::kBeginObj; | 689 state = ParserState::kBeginObj; |
| 709 inside_index = 1; | 690 inside_index = 1; |
| 710 } else if (PDFCharIsWhitespace(byte)) { | |
| 711 break; | |
| 712 } else if (std::isdigit(byte)) { | 691 } else if (std::isdigit(byte)) { |
| 713 objnum = gennum; | 692 objnum = gennum; |
| 714 gennum = FXSYS_toDecimalDigit(byte); | 693 gennum = FXSYS_toDecimalDigit(byte); |
| 715 start_pos = start_pos1; | 694 start_pos = start_pos1; |
| 716 start_pos1 = pos + i; | 695 start_pos1 = pos + i; |
| 717 state = ParserState::kGenNum; | 696 state = ParserState::kGenNum; |
| 718 } else if (byte == 't') { | 697 } else if (byte == 't') { |
| 719 state = ParserState::kTrailer; | 698 state = ParserState::kTrailer; |
| 720 inside_index = 1; | 699 inside_index = 1; |
| 721 } else { | 700 } else if (!PDFCharIsWhitespace(byte)) { |
| 722 --i; | 701 --i; |
| 723 state = ParserState::kDefault; | 702 state = ParserState::kDefault; |
| 724 } | 703 } |
| 725 break; | 704 break; |
| 726 | 705 |
| 727 case ParserState::kBeginObj: | 706 case ParserState::kBeginObj: |
| 728 switch (inside_index) { | 707 switch (inside_index) { |
| 729 case 1: | 708 case 1: |
| 730 if (byte != 'b') { | 709 if (byte != 'b') { |
| 731 --i; | 710 --i; |
| (...skipping 2277 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 3009 FX_BOOL* pExistInFile) { | 2988 FX_BOOL* pExistInFile) { |
| 3010 CPDF_Object* pRet = nullptr; | 2989 CPDF_Object* pRet = nullptr; |
| 3011 FX_DWORD size = 0; | 2990 FX_DWORD size = 0; |
| 3012 FX_FILESIZE offset = 0; | 2991 FX_FILESIZE offset = 0; |
| 3013 CPDF_Parser* pParser = nullptr; | 2992 CPDF_Parser* pParser = nullptr; |
| 3014 if (pExistInFile) | 2993 if (pExistInFile) |
| 3015 *pExistInFile = TRUE; | 2994 *pExistInFile = TRUE; |
| 3016 | 2995 |
| 3017 if (m_pDocument) { | 2996 if (m_pDocument) { |
| 3018 size = GetObjectSize(objnum, offset); | 2997 size = GetObjectSize(objnum, offset); |
| 3019 pParser = (CPDF_Parser*)(m_pDocument->GetParser()); | 2998 pParser = m_pDocument->GetParser(); |
| 3020 } else { | 2999 } else { |
| 3021 size = (FX_DWORD)m_parser.GetObjectSize(objnum); | 3000 size = (FX_DWORD)m_parser.GetObjectSize(objnum); |
| 3022 offset = m_parser.GetObjectOffset(objnum); | 3001 offset = m_parser.GetObjectOffset(objnum); |
| 3023 pParser = &m_parser; | 3002 pParser = &m_parser; |
| 3024 } | 3003 } |
| 3025 if (!IsDataAvail(offset, size, pHints)) { | 3004 if (!IsDataAvail(offset, size, pHints)) { |
| 3026 return nullptr; | 3005 return nullptr; |
| 3027 } | 3006 } |
| 3028 if (pParser) { | 3007 if (pParser) { |
| 3029 pRet = pParser->ParseIndirectObject(nullptr, objnum); | 3008 pRet = pParser->ParseIndirectObject(nullptr, objnum); |
| (...skipping 79 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 3109 FX_BOOL CPDF_DataAvail::PreparePageItem() { | 3088 FX_BOOL CPDF_DataAvail::PreparePageItem() { |
| 3110 CPDF_Dictionary* pRoot = m_pDocument->GetRoot(); | 3089 CPDF_Dictionary* pRoot = m_pDocument->GetRoot(); |
| 3111 CPDF_Reference* pRef = | 3090 CPDF_Reference* pRef = |
| 3112 ToReference(pRoot ? pRoot->GetElement("Pages") : nullptr); | 3091 ToReference(pRoot ? pRoot->GetElement("Pages") : nullptr); |
| 3113 if (!pRef) { | 3092 if (!pRef) { |
| 3114 m_docStatus = PDF_DATAAVAIL_ERROR; | 3093 m_docStatus = PDF_DATAAVAIL_ERROR; |
| 3115 return FALSE; | 3094 return FALSE; |
| 3116 } | 3095 } |
| 3117 | 3096 |
| 3118 m_PagesObjNum = pRef->GetRefObjNum(); | 3097 m_PagesObjNum = pRef->GetRefObjNum(); |
| 3119 m_pCurrentParser = (CPDF_Parser*)m_pDocument->GetParser(); | 3098 m_pCurrentParser = m_pDocument->GetParser(); |
| 3120 m_docStatus = PDF_DATAAVAIL_PAGETREE; | 3099 m_docStatus = PDF_DATAAVAIL_PAGETREE; |
| 3121 return TRUE; | 3100 return TRUE; |
| 3122 } | 3101 } |
| 3123 bool CPDF_DataAvail::IsFirstCheck(int iPage) { | 3102 bool CPDF_DataAvail::IsFirstCheck(int iPage) { |
| 3124 return m_pageMapCheckState.insert(iPage).second; | 3103 return m_pageMapCheckState.insert(iPage).second; |
| 3125 } | 3104 } |
| 3126 void CPDF_DataAvail::ResetFirstCheck(int iPage) { | 3105 void CPDF_DataAvail::ResetFirstCheck(int iPage) { |
| 3127 m_pageMapCheckState.erase(iPage); | 3106 m_pageMapCheckState.erase(iPage); |
| 3128 } | 3107 } |
| 3129 FX_BOOL CPDF_DataAvail::CheckPage(IFX_DownloadHints* pHints) { | 3108 FX_BOOL CPDF_DataAvail::CheckPage(IFX_DownloadHints* pHints) { |
| (...skipping 1050 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 4180 } | 4159 } |
| 4181 } else { | 4160 } else { |
| 4182 if (!m_bCurPageDictLoadOK && !CheckPage(iPage, pHints)) { | 4161 if (!m_bCurPageDictLoadOK && !CheckPage(iPage, pHints)) { |
| 4183 return DataNotAvailable; | 4162 return DataNotAvailable; |
| 4184 } | 4163 } |
| 4185 } | 4164 } |
| 4186 } else { | 4165 } else { |
| 4187 if (!LoadAllFile(pHints)) { | 4166 if (!LoadAllFile(pHints)) { |
| 4188 return DataNotAvailable; | 4167 return DataNotAvailable; |
| 4189 } | 4168 } |
| 4190 ((CPDF_Parser*)m_pDocument->GetParser())->RebuildCrossRef(); | 4169 m_pDocument->GetParser()->RebuildCrossRef(); |
| 4191 ResetFirstCheck(iPage); | 4170 ResetFirstCheck(iPage); |
| 4192 return DataAvailable; | 4171 return DataAvailable; |
| 4193 } | 4172 } |
| 4194 } else { | 4173 } else { |
| 4195 if (!m_bTotalLoadPageTree) { | 4174 if (!m_bTotalLoadPageTree) { |
| 4196 if (!m_bCurPageDictLoadOK && !CheckPage(iPage, pHints)) { | 4175 if (!m_bCurPageDictLoadOK && !CheckPage(iPage, pHints)) { |
| 4197 return DataNotAvailable; | 4176 return DataNotAvailable; |
| 4198 } | 4177 } |
| 4199 } | 4178 } |
| 4200 } | 4179 } |
| (...skipping 539 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 4740 if (!m_pLinearizedDict) | 4719 if (!m_pLinearizedDict) |
| 4741 return -1; | 4720 return -1; |
| 4742 CPDF_Array* pRange = m_pLinearizedDict->GetArrayBy("H"); | 4721 CPDF_Array* pRange = m_pLinearizedDict->GetArrayBy("H"); |
| 4743 if (!pRange) | 4722 if (!pRange) |
| 4744 return -1; | 4723 return -1; |
| 4745 CPDF_Object* pStreamLen = pRange->GetElementValue(1); | 4724 CPDF_Object* pStreamLen = pRange->GetElementValue(1); |
| 4746 if (!pStreamLen) | 4725 if (!pStreamLen) |
| 4747 return -1; | 4726 return -1; |
| 4748 return pStreamLen->GetInteger(); | 4727 return pStreamLen->GetInteger(); |
| 4749 } | 4728 } |
| OLD | NEW |