OLD | NEW |
1 // Copyright 2014 PDFium Authors. All rights reserved. | 1 // Copyright 2014 PDFium Authors. All rights reserved. |
2 // Use of this source code is governed by a BSD-style license that can be | 2 // Use of this source code is governed by a BSD-style license that can be |
3 // found in the LICENSE file. | 3 // found in the LICENSE file. |
4 | 4 |
5 // Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com | 5 // Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com |
6 | 6 |
7 #include "core/include/fpdfapi/fpdf_parser.h" | 7 #include "core/include/fpdfapi/fpdf_parser.h" |
8 | 8 |
9 #include <algorithm> | 9 #include <algorithm> |
10 #include <memory> | 10 #include <memory> |
(...skipping 590 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
601 const FX_FILESIZE saved_pos = pos; | 601 const FX_FILESIZE saved_pos = pos; |
602 bool bOverFlow = false; | 602 bool bOverFlow = false; |
603 FX_DWORD size = std::min((FX_DWORD)(m_Syntax.m_FileLen - pos), kBufferSize); | 603 FX_DWORD size = std::min((FX_DWORD)(m_Syntax.m_FileLen - pos), kBufferSize); |
604 if (!m_Syntax.m_pFileAccess->ReadBlock(buffer.data(), pos, size)) | 604 if (!m_Syntax.m_pFileAccess->ReadBlock(buffer.data(), pos, size)) |
605 break; | 605 break; |
606 | 606 |
607 for (FX_DWORD i = 0; i < size; i++) { | 607 for (FX_DWORD i = 0; i < size; i++) { |
608 uint8_t byte = buffer[i]; | 608 uint8_t byte = buffer[i]; |
609 switch (state) { | 609 switch (state) { |
610 case ParserState::kDefault: | 610 case ParserState::kDefault: |
611 if (PDFCharIsWhitespace(byte)) | 611 if (PDFCharIsWhitespace(byte)) { |
612 state = ParserState::kWhitespace; | 612 state = ParserState::kWhitespace; |
613 | 613 } else if (std::isdigit(byte)) { |
614 if (std::isdigit(byte)) { | |
615 --i; | 614 --i; |
616 state = ParserState::kWhitespace; | 615 state = ParserState::kWhitespace; |
617 } | 616 } else if (byte == '%') { |
618 | |
619 if (byte == '%') { | |
620 inside_index = 0; | 617 inside_index = 0; |
621 state = ParserState::kComment; | 618 state = ParserState::kComment; |
622 } | 619 } else if (byte == '(') { |
623 | |
624 if (byte == '(') { | |
625 state = ParserState::kString; | 620 state = ParserState::kString; |
626 depth = 1; | 621 depth = 1; |
627 } | 622 } else if (byte == '<') { |
628 | |
629 if (byte == '<') { | |
630 inside_index = 1; | 623 inside_index = 1; |
631 state = ParserState::kHexString; | 624 state = ParserState::kHexString; |
632 } | 625 } else if (byte == '\\') { |
633 | |
634 if (byte == '\\') | |
635 state = ParserState::kEscapedString; | 626 state = ParserState::kEscapedString; |
636 | 627 } else if (byte == 't') { |
637 if (byte == 't') { | |
638 state = ParserState::kTrailer; | 628 state = ParserState::kTrailer; |
639 inside_index = 1; | 629 inside_index = 1; |
640 } | 630 } |
641 break; | 631 break; |
642 | 632 |
643 case ParserState::kWhitespace: | 633 case ParserState::kWhitespace: |
644 if (PDFCharIsWhitespace(byte)) { | 634 if (std::isdigit(byte)) { |
645 break; | |
646 } else if (std::isdigit(byte)) { | |
647 start_pos = pos + i; | 635 start_pos = pos + i; |
648 state = ParserState::kObjNum; | 636 state = ParserState::kObjNum; |
649 objnum = FXSYS_toDecimalDigit(byte); | 637 objnum = FXSYS_toDecimalDigit(byte); |
650 | |
651 } else if (byte == 't') { | 638 } else if (byte == 't') { |
652 state = ParserState::kTrailer; | 639 state = ParserState::kTrailer; |
653 inside_index = 1; | 640 inside_index = 1; |
654 | |
655 } else if (byte == 'x') { | 641 } else if (byte == 'x') { |
656 state = ParserState::kXref; | 642 state = ParserState::kXref; |
657 inside_index = 1; | 643 inside_index = 1; |
658 | 644 } else if (!PDFCharIsWhitespace(byte)) { |
659 } else { | |
660 --i; | 645 --i; |
661 state = ParserState::kDefault; | 646 state = ParserState::kDefault; |
662 } | 647 } |
663 break; | 648 break; |
664 | 649 |
665 case ParserState::kObjNum: | 650 case ParserState::kObjNum: |
666 if (std::isdigit(byte)) { | 651 if (std::isdigit(byte)) { |
667 objnum = objnum * 10 + FXSYS_toDecimalDigit(byte); | 652 objnum = objnum * 10 + FXSYS_toDecimalDigit(byte); |
668 break; | |
669 } else if (PDFCharIsWhitespace(byte)) { | 653 } else if (PDFCharIsWhitespace(byte)) { |
670 state = ParserState::kPostObjNum; | 654 state = ParserState::kPostObjNum; |
671 } else { | 655 } else { |
672 --i; | 656 --i; |
673 state = ParserState::kEndObj; | 657 state = ParserState::kEndObj; |
674 inside_index = 0; | 658 inside_index = 0; |
675 } | 659 } |
676 break; | 660 break; |
677 | 661 |
678 case ParserState::kPostObjNum: | 662 case ParserState::kPostObjNum: |
679 if (std::isdigit(byte)) { | 663 if (std::isdigit(byte)) { |
680 start_pos1 = pos + i; | 664 start_pos1 = pos + i; |
681 state = ParserState::kGenNum; | 665 state = ParserState::kGenNum; |
682 gennum = FXSYS_toDecimalDigit(byte); | 666 gennum = FXSYS_toDecimalDigit(byte); |
683 } else if (PDFCharIsWhitespace(byte)) { | |
684 break; | |
685 } else if (byte == 't') { | 667 } else if (byte == 't') { |
686 state = ParserState::kTrailer; | 668 state = ParserState::kTrailer; |
687 inside_index = 1; | 669 inside_index = 1; |
688 } else { | 670 } else if (!PDFCharIsWhitespace(byte)) { |
689 --i; | 671 --i; |
690 state = ParserState::kDefault; | 672 state = ParserState::kDefault; |
691 } | 673 } |
692 break; | 674 break; |
693 | 675 |
694 case ParserState::kGenNum: | 676 case ParserState::kGenNum: |
695 if (std::isdigit(byte)) { | 677 if (std::isdigit(byte)) { |
696 gennum = gennum * 10 + FXSYS_toDecimalDigit(byte); | 678 gennum = gennum * 10 + FXSYS_toDecimalDigit(byte); |
697 break; | |
698 } else if (PDFCharIsWhitespace(byte)) { | 679 } else if (PDFCharIsWhitespace(byte)) { |
699 state = ParserState::kPostGenNum; | 680 state = ParserState::kPostGenNum; |
700 } else { | 681 } else { |
701 --i; | 682 --i; |
702 state = ParserState::kDefault; | 683 state = ParserState::kDefault; |
703 } | 684 } |
704 break; | 685 break; |
705 | 686 |
706 case ParserState::kPostGenNum: | 687 case ParserState::kPostGenNum: |
707 if (byte == 'o') { | 688 if (byte == 'o') { |
708 state = ParserState::kBeginObj; | 689 state = ParserState::kBeginObj; |
709 inside_index = 1; | 690 inside_index = 1; |
710 } else if (PDFCharIsWhitespace(byte)) { | |
711 break; | |
712 } else if (std::isdigit(byte)) { | 691 } else if (std::isdigit(byte)) { |
713 objnum = gennum; | 692 objnum = gennum; |
714 gennum = FXSYS_toDecimalDigit(byte); | 693 gennum = FXSYS_toDecimalDigit(byte); |
715 start_pos = start_pos1; | 694 start_pos = start_pos1; |
716 start_pos1 = pos + i; | 695 start_pos1 = pos + i; |
717 state = ParserState::kGenNum; | 696 state = ParserState::kGenNum; |
718 } else if (byte == 't') { | 697 } else if (byte == 't') { |
719 state = ParserState::kTrailer; | 698 state = ParserState::kTrailer; |
720 inside_index = 1; | 699 inside_index = 1; |
721 } else { | 700 } else if (!PDFCharIsWhitespace(byte)) { |
722 --i; | 701 --i; |
723 state = ParserState::kDefault; | 702 state = ParserState::kDefault; |
724 } | 703 } |
725 break; | 704 break; |
726 | 705 |
727 case ParserState::kBeginObj: | 706 case ParserState::kBeginObj: |
728 switch (inside_index) { | 707 switch (inside_index) { |
729 case 1: | 708 case 1: |
730 if (byte != 'b') { | 709 if (byte != 'b') { |
731 --i; | 710 --i; |
(...skipping 2277 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
3009 FX_BOOL* pExistInFile) { | 2988 FX_BOOL* pExistInFile) { |
3010 CPDF_Object* pRet = nullptr; | 2989 CPDF_Object* pRet = nullptr; |
3011 FX_DWORD size = 0; | 2990 FX_DWORD size = 0; |
3012 FX_FILESIZE offset = 0; | 2991 FX_FILESIZE offset = 0; |
3013 CPDF_Parser* pParser = nullptr; | 2992 CPDF_Parser* pParser = nullptr; |
3014 if (pExistInFile) | 2993 if (pExistInFile) |
3015 *pExistInFile = TRUE; | 2994 *pExistInFile = TRUE; |
3016 | 2995 |
3017 if (m_pDocument) { | 2996 if (m_pDocument) { |
3018 size = GetObjectSize(objnum, offset); | 2997 size = GetObjectSize(objnum, offset); |
3019 pParser = (CPDF_Parser*)(m_pDocument->GetParser()); | 2998 pParser = m_pDocument->GetParser(); |
3020 } else { | 2999 } else { |
3021 size = (FX_DWORD)m_parser.GetObjectSize(objnum); | 3000 size = (FX_DWORD)m_parser.GetObjectSize(objnum); |
3022 offset = m_parser.GetObjectOffset(objnum); | 3001 offset = m_parser.GetObjectOffset(objnum); |
3023 pParser = &m_parser; | 3002 pParser = &m_parser; |
3024 } | 3003 } |
3025 if (!IsDataAvail(offset, size, pHints)) { | 3004 if (!IsDataAvail(offset, size, pHints)) { |
3026 return nullptr; | 3005 return nullptr; |
3027 } | 3006 } |
3028 if (pParser) { | 3007 if (pParser) { |
3029 pRet = pParser->ParseIndirectObject(nullptr, objnum); | 3008 pRet = pParser->ParseIndirectObject(nullptr, objnum); |
(...skipping 79 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
3109 FX_BOOL CPDF_DataAvail::PreparePageItem() { | 3088 FX_BOOL CPDF_DataAvail::PreparePageItem() { |
3110 CPDF_Dictionary* pRoot = m_pDocument->GetRoot(); | 3089 CPDF_Dictionary* pRoot = m_pDocument->GetRoot(); |
3111 CPDF_Reference* pRef = | 3090 CPDF_Reference* pRef = |
3112 ToReference(pRoot ? pRoot->GetElement("Pages") : nullptr); | 3091 ToReference(pRoot ? pRoot->GetElement("Pages") : nullptr); |
3113 if (!pRef) { | 3092 if (!pRef) { |
3114 m_docStatus = PDF_DATAAVAIL_ERROR; | 3093 m_docStatus = PDF_DATAAVAIL_ERROR; |
3115 return FALSE; | 3094 return FALSE; |
3116 } | 3095 } |
3117 | 3096 |
3118 m_PagesObjNum = pRef->GetRefObjNum(); | 3097 m_PagesObjNum = pRef->GetRefObjNum(); |
3119 m_pCurrentParser = (CPDF_Parser*)m_pDocument->GetParser(); | 3098 m_pCurrentParser = m_pDocument->GetParser(); |
3120 m_docStatus = PDF_DATAAVAIL_PAGETREE; | 3099 m_docStatus = PDF_DATAAVAIL_PAGETREE; |
3121 return TRUE; | 3100 return TRUE; |
3122 } | 3101 } |
3123 bool CPDF_DataAvail::IsFirstCheck(int iPage) { | 3102 bool CPDF_DataAvail::IsFirstCheck(int iPage) { |
3124 return m_pageMapCheckState.insert(iPage).second; | 3103 return m_pageMapCheckState.insert(iPage).second; |
3125 } | 3104 } |
3126 void CPDF_DataAvail::ResetFirstCheck(int iPage) { | 3105 void CPDF_DataAvail::ResetFirstCheck(int iPage) { |
3127 m_pageMapCheckState.erase(iPage); | 3106 m_pageMapCheckState.erase(iPage); |
3128 } | 3107 } |
3129 FX_BOOL CPDF_DataAvail::CheckPage(IFX_DownloadHints* pHints) { | 3108 FX_BOOL CPDF_DataAvail::CheckPage(IFX_DownloadHints* pHints) { |
(...skipping 1050 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
4180 } | 4159 } |
4181 } else { | 4160 } else { |
4182 if (!m_bCurPageDictLoadOK && !CheckPage(iPage, pHints)) { | 4161 if (!m_bCurPageDictLoadOK && !CheckPage(iPage, pHints)) { |
4183 return DataNotAvailable; | 4162 return DataNotAvailable; |
4184 } | 4163 } |
4185 } | 4164 } |
4186 } else { | 4165 } else { |
4187 if (!LoadAllFile(pHints)) { | 4166 if (!LoadAllFile(pHints)) { |
4188 return DataNotAvailable; | 4167 return DataNotAvailable; |
4189 } | 4168 } |
4190 ((CPDF_Parser*)m_pDocument->GetParser())->RebuildCrossRef(); | 4169 m_pDocument->GetParser()->RebuildCrossRef(); |
4191 ResetFirstCheck(iPage); | 4170 ResetFirstCheck(iPage); |
4192 return DataAvailable; | 4171 return DataAvailable; |
4193 } | 4172 } |
4194 } else { | 4173 } else { |
4195 if (!m_bTotalLoadPageTree) { | 4174 if (!m_bTotalLoadPageTree) { |
4196 if (!m_bCurPageDictLoadOK && !CheckPage(iPage, pHints)) { | 4175 if (!m_bCurPageDictLoadOK && !CheckPage(iPage, pHints)) { |
4197 return DataNotAvailable; | 4176 return DataNotAvailable; |
4198 } | 4177 } |
4199 } | 4178 } |
4200 } | 4179 } |
(...skipping 539 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
4740 if (!m_pLinearizedDict) | 4719 if (!m_pLinearizedDict) |
4741 return -1; | 4720 return -1; |
4742 CPDF_Array* pRange = m_pLinearizedDict->GetArrayBy("H"); | 4721 CPDF_Array* pRange = m_pLinearizedDict->GetArrayBy("H"); |
4743 if (!pRange) | 4722 if (!pRange) |
4744 return -1; | 4723 return -1; |
4745 CPDF_Object* pStreamLen = pRange->GetElementValue(1); | 4724 CPDF_Object* pStreamLen = pRange->GetElementValue(1); |
4746 if (!pStreamLen) | 4725 if (!pStreamLen) |
4747 return -1; | 4726 return -1; |
4748 return pStreamLen->GetInteger(); | 4727 return pStreamLen->GetInteger(); |
4749 } | 4728 } |
OLD | NEW |