OLD | NEW |
| (Empty) |
1 /* | |
2 Copyright (C) 1999 Lars Knoll (knoll@mpi-hd.mpg.de) | |
3 Copyright (C) 2006 Alexey Proskuryakov (ap@nypop.com) | |
4 Copyright (C) 2006, 2008 Apple Inc. All rights reserved. | |
5 | |
6 This library is free software; you can redistribute it and/or | |
7 modify it under the terms of the GNU Library General Public | |
8 License as published by the Free Software Foundation; either | |
9 version 2 of the License, or (at your option) any later version. | |
10 | |
11 This library is distributed in the hope that it will be useful, | |
12 but WITHOUT ANY WARRANTY; without even the implied warranty of | |
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | |
14 Library General Public License for more details. | |
15 | |
16 You should have received a copy of the GNU Library General Public License | |
17 along with this library; see the file COPYING.LIB. If not, write to | |
18 the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, | |
19 Boston, MA 02110-1301, USA. | |
20 | |
21 */ | |
22 | |
23 #ifndef TextResourceDecoder_h | |
24 #define TextResourceDecoder_h | |
25 | |
26 #include "wtf/RefCounted.h" | |
27 #include "wtf/text/TextEncoding.h" | |
28 | |
29 namespace WebCore { | |
30 | |
31 class DocumentEncodingData; | |
32 class HTMLMetaCharsetParser; | |
33 | |
34 class TextResourceDecoder { | |
35 public: | |
36 enum EncodingSource { | |
37 DefaultEncoding, | |
38 AutoDetectedEncoding, | |
39 EncodingFromContentSniffing, | |
40 EncodingFromXMLHeader, | |
41 EncodingFromMetaTag, | |
42 EncodingFromCSSCharset, | |
43 EncodingFromHTTPHeader, | |
44 UserChosenEncoding, | |
45 EncodingFromParentFrame | |
46 }; | |
47 | |
48 static PassOwnPtr<TextResourceDecoder> create(const String& mimeType, const
WTF::TextEncoding& defaultEncoding = WTF::TextEncoding(), bool usesEncodingDetec
tor = false) | |
49 { | |
50 return adoptPtr(new TextResourceDecoder(mimeType, defaultEncoding, usesE
ncodingDetector)); | |
51 } | |
52 ~TextResourceDecoder(); | |
53 | |
54 void setEncoding(const WTF::TextEncoding&, EncodingSource); | |
55 const WTF::TextEncoding& encoding() const { return m_encoding; } | |
56 bool encodingWasDetectedHeuristically() const | |
57 { | |
58 return m_source == AutoDetectedEncoding | |
59 || m_source == EncodingFromContentSniffing; | |
60 } | |
61 | |
62 String decode(const char* data, size_t length); | |
63 String flush(); | |
64 | |
65 void setHintEncoding(const WTF::TextEncoding& encoding) | |
66 { | |
67 m_hintEncoding = encoding.name(); | |
68 } | |
69 | |
70 void useLenientXMLDecoding() { m_useLenientXMLDecoding = true; } | |
71 bool sawError() const { return m_sawError; } | |
72 | |
73 private: | |
74 TextResourceDecoder(const String& mimeType, const WTF::TextEncoding& default
Encoding, bool usesEncodingDetector); | |
75 | |
76 enum ContentType { PlainTextContent, HTMLContent, XMLContent, CSSContent };
// PlainText only checks for BOM. | |
77 static ContentType determineContentType(const String& mimeType); | |
78 static const WTF::TextEncoding& defaultEncoding(ContentType, const WTF::Text
Encoding& defaultEncoding); | |
79 | |
80 size_t checkForBOM(const char*, size_t); | |
81 bool checkForCSSCharset(const char*, size_t, bool& movedDataToBuffer); | |
82 bool checkForXMLCharset(const char*, size_t, bool& movedDataToBuffer); | |
83 void checkForMetaCharset(const char*, size_t); | |
84 void detectJapaneseEncoding(const char*, size_t); | |
85 bool shouldAutoDetect() const; | |
86 | |
87 ContentType m_contentType; | |
88 WTF::TextEncoding m_encoding; | |
89 OwnPtr<TextCodec> m_codec; | |
90 EncodingSource m_source; | |
91 const char* m_hintEncoding; | |
92 Vector<char> m_buffer; | |
93 bool m_checkedForBOM; | |
94 bool m_checkedForCSSCharset; | |
95 bool m_checkedForXMLCharset; | |
96 bool m_checkedForMetaCharset; | |
97 bool m_useLenientXMLDecoding; // Don't stop on XML decoding errors. | |
98 bool m_sawError; | |
99 bool m_usesEncodingDetector; | |
100 | |
101 OwnPtr<HTMLMetaCharsetParser> m_charsetParser; | |
102 }; | |
103 | |
104 } | |
105 | |
106 #endif | |
OLD | NEW |