Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(460)

Side by Side Diff: url/url_canon_internal.h

Issue 13998025: url: Build it as a static library. (Closed) Base URL: svn://svn.chromium.org/chrome/trunk/src
Patch Set: Created 7 years, 8 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View unified diff | Download patch | Annotate | Revision Log
« no previous file with comments | « url/url_canon_icu.cc ('k') | url/url_canon_internal.cc » ('j') | no next file with comments »
Toggle Intra-line Diffs ('i') | Expand Comments ('e') | Collapse Comments ('c') | Show Comments Hide Comments ('s')
OLDNEW
1 // Copyright 2011, Google Inc. 1 // Copyright 2011, Google Inc.
2 // All rights reserved. 2 // All rights reserved.
3 // 3 //
4 // Redistribution and use in source and binary forms, with or without 4 // Redistribution and use in source and binary forms, with or without
5 // modification, are permitted provided that the following conditions are 5 // modification, are permitted provided that the following conditions are
6 // met: 6 // met:
7 // 7 //
8 // * Redistributions of source code must retain the above copyright 8 // * Redistributions of source code must retain the above copyright
9 // notice, this list of conditions and the following disclaimer. 9 // notice, this list of conditions and the following disclaimer.
10 // * Redistributions in binary form must reproduce the above 10 // * Redistributions in binary form must reproduce the above
11 // copyright notice, this list of conditions and the following disclaimer 11 // copyright notice, this list of conditions and the following disclaimer
12 // in the documentation and/or other materials provided with the 12 // in the documentation and/or other materials provided with the
13 // distribution. 13 // distribution.
14 // * Neither the name of Google Inc. nor the names of its 14 // * Neither the name of Google Inc. nor the names of its
15 // contributors may be used to endorse or promote products derived from 15 // contributors may be used to endorse or promote products derived from
16 // this software without specific prior written permission. 16 // this software without specific prior written permission.
17 // 17 //
18 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 18 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
19 // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 19 // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
20 // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 20 // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
21 // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT 21 // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
22 // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 22 // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
23 // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT 23 // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
24 // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 24 // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
25 // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 25 // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
26 // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 26 // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
27 // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 27 // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
28 // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 28 // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
29 29
30 #ifndef URL_URL_CANON_INTERNAL_H_
31 #define URL_URL_CANON_INTERNAL_H_
32
30 // This file is intended to be included in another C++ file where the character 33 // This file is intended to be included in another C++ file where the character
31 // types are defined. This allows us to write mostly generic code, but not have 34 // types are defined. This allows us to write mostly generic code, but not have
32 // templace bloat because everything is inlined when anybody calls any of our 35 // templace bloat because everything is inlined when anybody calls any of our
33 // functions. 36 // functions.
34 37
35 #ifndef GOOGLEURL_SRC_URL_CANON_INTERNAL_H__
36 #define GOOGLEURL_SRC_URL_CANON_INTERNAL_H__
37
38 #include <stdlib.h> 38 #include <stdlib.h>
39 39
40 #include "base/logging.h" 40 #include "base/logging.h"
41 #include "googleurl/src/url_canon.h" 41 #include "url/url_canon.h"
42 42
43 namespace url_canon { 43 namespace url_canon {
44 44
45 // Character type handling ----------------------------------------------------- 45 // Character type handling -----------------------------------------------------
46 46
47 // Bits that identify different character types. These types identify different 47 // Bits that identify different character types. These types identify different
48 // bits that are set for each 8-bit character in the kSharedCharTypeTable. 48 // bits that are set for each 8-bit character in the kSharedCharTypeTable.
49 enum SharedCharTypes { 49 enum SharedCharTypes {
50 // Characters that do not require escaping in queries. Characters that do 50 // Characters that do not require escaping in queries. Characters that do
51 // not have this flag will be escaped; see url_canon_query.cc 51 // not have this flag will be escaped; see url_canon_query.cc
(...skipping 49 matching lines...) Expand 10 before | Expand all | Expand 10 after
101 // match the given |type| in SharedCharTypes. 101 // match the given |type| in SharedCharTypes.
102 void AppendStringOfType(const char* source, int length, 102 void AppendStringOfType(const char* source, int length,
103 SharedCharTypes type, 103 SharedCharTypes type,
104 CanonOutput* output); 104 CanonOutput* output);
105 void AppendStringOfType(const char16* source, int length, 105 void AppendStringOfType(const char16* source, int length,
106 SharedCharTypes type, 106 SharedCharTypes type,
107 CanonOutput* output); 107 CanonOutput* output);
108 108
109 // Maps the hex numerical values 0x0 to 0xf to the corresponding ASCII digit 109 // Maps the hex numerical values 0x0 to 0xf to the corresponding ASCII digit
110 // that will be used to represent it. 110 // that will be used to represent it.
111 GURL_API extern const char kHexCharLookup[0x10]; 111 extern const char kHexCharLookup[0x10];
112 112
113 // This lookup table allows fast conversion between ASCII hex letters and their 113 // This lookup table allows fast conversion between ASCII hex letters and their
114 // corresponding numerical value. The 8-bit range is divided up into 8 114 // corresponding numerical value. The 8-bit range is divided up into 8
115 // regions of 0x20 characters each. Each of the three character types (numbers, 115 // regions of 0x20 characters each. Each of the three character types (numbers,
116 // uppercase, lowercase) falls into different regions of this range. The table 116 // uppercase, lowercase) falls into different regions of this range. The table
117 // contains the amount to subtract from characters in that range to get at 117 // contains the amount to subtract from characters in that range to get at
118 // the corresponding numerical value. 118 // the corresponding numerical value.
119 // 119 //
120 // See HexDigitToValue for the lookup. 120 // See HexDigitToValue for the lookup.
121 extern const char kCharToHexLookup[8]; 121 extern const char kCharToHexLookup[8];
(...skipping 46 matching lines...) Expand 10 before | Expand all | Expand 10 after
168 // Reads one character in UTF-8 starting at |*begin| in |str| and places 168 // Reads one character in UTF-8 starting at |*begin| in |str| and places
169 // the decoded value into |*code_point|. If the character is valid, we will 169 // the decoded value into |*code_point|. If the character is valid, we will
170 // return true. If invalid, we'll return false and put the 170 // return true. If invalid, we'll return false and put the
171 // kUnicodeReplacementCharacter into |*code_point|. 171 // kUnicodeReplacementCharacter into |*code_point|.
172 // 172 //
173 // |*begin| will be updated to point to the last character consumed so it 173 // |*begin| will be updated to point to the last character consumed so it
174 // can be incremented in a loop and will be ready for the next character. 174 // can be incremented in a loop and will be ready for the next character.
175 // (for a single-byte ASCII character, it will not be changed). 175 // (for a single-byte ASCII character, it will not be changed).
176 // 176 //
177 // Implementation is in url_canon_icu.cc. 177 // Implementation is in url_canon_icu.cc.
178 GURL_API bool ReadUTFChar(const char* str, int* begin, int length, 178 bool ReadUTFChar(const char* str, int* begin, int length,
179 unsigned* code_point_out); 179 unsigned* code_point_out);
180 180
181 // Generic To-UTF-8 converter. This will call the given append method for each 181 // Generic To-UTF-8 converter. This will call the given append method for each
182 // character that should be appended, with the given output method. Wrappers 182 // character that should be appended, with the given output method. Wrappers
183 // are provided below for escaped and non-escaped versions of this. 183 // are provided below for escaped and non-escaped versions of this.
184 // 184 //
185 // The char_value must have already been checked that it's a valid Unicode 185 // The char_value must have already been checked that it's a valid Unicode
186 // character. 186 // character.
187 template<class Output, void Appender(unsigned char, Output*)> 187 template<class Output, void Appender(unsigned char, Output*)>
188 inline void DoAppendUTF8(unsigned char_value, Output* output) { 188 inline void DoAppendUTF8(unsigned char_value, Output* output) {
189 if (char_value <= 0x7f) { 189 if (char_value <= 0x7f) {
(...skipping 55 matching lines...) Expand 10 before | Expand all | Expand 10 after
245 // Reads one character in UTF-16 starting at |*begin| in |str| and places 245 // Reads one character in UTF-16 starting at |*begin| in |str| and places
246 // the decoded value into |*code_point|. If the character is valid, we will 246 // the decoded value into |*code_point|. If the character is valid, we will
247 // return true. If invalid, we'll return false and put the 247 // return true. If invalid, we'll return false and put the
248 // kUnicodeReplacementCharacter into |*code_point|. 248 // kUnicodeReplacementCharacter into |*code_point|.
249 // 249 //
250 // |*begin| will be updated to point to the last character consumed so it 250 // |*begin| will be updated to point to the last character consumed so it
251 // can be incremented in a loop and will be ready for the next character. 251 // can be incremented in a loop and will be ready for the next character.
252 // (for a single-16-bit-word character, it will not be changed). 252 // (for a single-16-bit-word character, it will not be changed).
253 // 253 //
254 // Implementation is in url_canon_icu.cc. 254 // Implementation is in url_canon_icu.cc.
255 GURL_API bool ReadUTFChar(const char16* str, int* begin, int length, 255 bool ReadUTFChar(const char16* str, int* begin, int length,
256 unsigned* code_point); 256 unsigned* code_point);
257 257
258 // Equivalent to U16_APPEND_UNSAFE in ICU but uses our output method. 258 // Equivalent to U16_APPEND_UNSAFE in ICU but uses our output method.
259 inline void AppendUTF16Value(unsigned code_point, 259 inline void AppendUTF16Value(unsigned code_point,
260 CanonOutputT<char16>* output) { 260 CanonOutputT<char16>* output) {
261 if (code_point > 0xffff) { 261 if (code_point > 0xffff) {
262 output->push_back(static_cast<char16>((code_point >> 10) + 0xd7c0)); 262 output->push_back(static_cast<char16>((code_point >> 10) + 0xd7c0));
263 output->push_back(static_cast<char16>((code_point & 0x3ff) | 0xdc00)); 263 output->push_back(static_cast<char16>((code_point & 0x3ff) | 0xdc00));
264 } else { 264 } else {
265 output->push_back(static_cast<char16>(code_point)); 265 output->push_back(static_cast<char16>(code_point));
266 } 266 }
(...skipping 97 matching lines...) Expand 10 before | Expand all | Expand 10 after
364 // Misc canonicalization helpers ---------------------------------------------- 364 // Misc canonicalization helpers ----------------------------------------------
365 365
366 // Converts between UTF-8 and UTF-16, returning true on successful conversion. 366 // Converts between UTF-8 and UTF-16, returning true on successful conversion.
367 // The output will be appended to the given canonicalizer output (so make sure 367 // The output will be appended to the given canonicalizer output (so make sure
368 // it's empty if you want to replace). 368 // it's empty if you want to replace).
369 // 369 //
370 // On invalid input, this will still write as much output as possible, 370 // On invalid input, this will still write as much output as possible,
371 // replacing the invalid characters with the "invalid character". It will 371 // replacing the invalid characters with the "invalid character". It will
372 // return false in the failure case, and the caller should not continue as 372 // return false in the failure case, and the caller should not continue as
373 // normal. 373 // normal.
374 GURL_API bool ConvertUTF16ToUTF8(const char16* input, int input_len, 374 bool ConvertUTF16ToUTF8(const char16* input, int input_len,
375 CanonOutput* output); 375 CanonOutput* output);
376 GURL_API bool ConvertUTF8ToUTF16(const char* input, int input_len, 376 bool ConvertUTF8ToUTF16(const char* input, int input_len,
377 CanonOutputT<char16>* output); 377 CanonOutputT<char16>* output);
378 378
379 // Converts from UTF-16 to 8-bit using the character set converter. If the 379 // Converts from UTF-16 to 8-bit using the character set converter. If the
380 // converter is NULL, this will use UTF-8. 380 // converter is NULL, this will use UTF-8.
381 void ConvertUTF16ToQueryEncoding(const char16* input, 381 void ConvertUTF16ToQueryEncoding(const char16* input,
382 const url_parse::Component& query, 382 const url_parse::Component& query,
383 CharsetConverter* converter, 383 CharsetConverter* converter,
384 CanonOutput* output); 384 CanonOutput* output);
385 385
386 // Applies the replacements to the given component source. The component source 386 // Applies the replacements to the given component source. The component source
387 // should be pre-initialized to the "old" base. That is, all pointers will 387 // should be pre-initialized to the "old" base. That is, all pointers will
(...skipping 38 matching lines...) Expand 10 before | Expand all | Expand 10 after
426 int path_begin_in_output, 426 int path_begin_in_output,
427 CanonOutput* output); 427 CanonOutput* output);
428 bool CanonicalizePartialPath(const char16* spec, 428 bool CanonicalizePartialPath(const char16* spec,
429 const url_parse::Component& path, 429 const url_parse::Component& path,
430 int path_begin_in_output, 430 int path_begin_in_output,
431 CanonOutput* output); 431 CanonOutput* output);
432 432
433 #ifndef WIN32 433 #ifndef WIN32
434 434
435 // Implementations of Windows' int-to-string conversions 435 // Implementations of Windows' int-to-string conversions
436 GURL_API int _itoa_s(int value, char* buffer, size_t size_in_chars, int radix); 436 int _itoa_s(int value, char* buffer, size_t size_in_chars, int radix);
437 GURL_API int _itow_s(int value, char16* buffer, size_t size_in_chars, 437 int _itow_s(int value, char16* buffer, size_t size_in_chars,
438 int radix); 438 int radix);
439 439
440 // Secure template overloads for these functions 440 // Secure template overloads for these functions
441 template<size_t N> 441 template<size_t N>
442 inline int _itoa_s(int value, char (&buffer)[N], int radix) { 442 inline int _itoa_s(int value, char (&buffer)[N], int radix) {
443 return _itoa_s(value, buffer, N, radix); 443 return _itoa_s(value, buffer, N, radix);
444 } 444 }
445 445
446 template<size_t N> 446 template<size_t N>
447 inline int _itow_s(int value, char16 (&buffer)[N], int radix) { 447 inline int _itow_s(int value, char16 (&buffer)[N], int radix) {
448 return _itow_s(value, buffer, N, radix); 448 return _itow_s(value, buffer, N, radix);
449 } 449 }
450 450
451 // _strtoui64 and strtoull behave the same 451 // _strtoui64 and strtoull behave the same
452 inline unsigned long long _strtoui64(const char* nptr, 452 inline unsigned long long _strtoui64(const char* nptr,
453 char** endptr, int base) { 453 char** endptr, int base) {
454 return strtoull(nptr, endptr, base); 454 return strtoull(nptr, endptr, base);
455 } 455 }
456 456
457 #endif // WIN32 457 #endif // WIN32
458 458
459 } // namespace url_canon 459 } // namespace url_canon
460 460
461 #endif // GOOGLEURL_SRC_URL_CANON_INTERNAL_H__ 461 #endif // URL_URL_CANON_INTERNAL_H_
OLDNEW
« no previous file with comments | « url/url_canon_icu.cc ('k') | url/url_canon_internal.cc » ('j') | no next file with comments »

Powered by Google App Engine
This is Rietveld 408576698