OLD | NEW |
1 // Copyright 2013 The Chromium Authors. All rights reserved. | 1 // Copyright 2013 The Chromium Authors. All rights reserved. |
2 // Use of this source code is governed by a BSD-style license that can be | 2 // Use of this source code is governed by a BSD-style license that can be |
3 // found in the LICENSE file. | 3 // found in the LICENSE file. |
4 | 4 |
5 #ifndef URL_URL_CANON_H_ | 5 #ifndef URL_URL_CANON_H_ |
6 #define URL_URL_CANON_H_ | 6 #define URL_URL_CANON_H_ |
7 | 7 |
8 #include <stdlib.h> | 8 #include <stdlib.h> |
9 #include <string.h> | 9 #include <string.h> |
10 | 10 |
(...skipping 361 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
372 // definition of CanonHostInfo above for details. | 372 // definition of CanonHostInfo above for details. |
373 URL_EXPORT void CanonicalizeHostVerbose(const char* spec, | 373 URL_EXPORT void CanonicalizeHostVerbose(const char* spec, |
374 const Component& host, | 374 const Component& host, |
375 CanonOutput* output, | 375 CanonOutput* output, |
376 CanonHostInfo* host_info); | 376 CanonHostInfo* host_info); |
377 URL_EXPORT void CanonicalizeHostVerbose(const base::char16* spec, | 377 URL_EXPORT void CanonicalizeHostVerbose(const base::char16* spec, |
378 const Component& host, | 378 const Component& host, |
379 CanonOutput* output, | 379 CanonOutput* output, |
380 CanonHostInfo* host_info); | 380 CanonHostInfo* host_info); |
381 | 381 |
| 382 // Canonicalizes a string according to the host canonicalization rules. Unlike |
| 383 // CanonicalizeHost, this will not check for IP addresses which can change the |
| 384 // meaning (and canonicalization) of the components. This means it is possible |
| 385 // to call this for sub-components of a host name without corruption. |
| 386 // |
| 387 // As an example, "01.02.03.04.com" is a canonical hostname. If you called |
| 388 // CanonicalizeHost on the substring "01.02.03.04" it will get "fixed" to |
| 389 // "1.2.3.4" which will produce an invalid host name when reassembled. This |
| 390 // can happen more than one might think because all numbers by themselves are |
| 391 // considered IP addresses; so "5" canonicalizes to "0.0.0.5". |
| 392 // |
| 393 // Be careful: Because Punycode works on each dot-separated substring as a |
| 394 // unit, you should only pass this function substrings that represent complete |
| 395 // dot-separated subcomponents of the original host. Even if you have ASCII |
| 396 // input, percent-escaped characters will have different meanings if split in |
| 397 // the middle. |
| 398 // |
| 399 // Returns true if the host was valid. This function will treat a 0-length |
| 400 // host as valid (because it's designed to be used for substrings) while the |
| 401 // full version above will mark empty hosts as broken. |
| 402 URL_EXPORT bool CanonicalizeHostSubstring(const char* spec, |
| 403 const Component& host, |
| 404 CanonOutput* output); |
| 405 URL_EXPORT bool CanonicalizeHostSubstring(const base::char16* spec, |
| 406 const Component& host, |
| 407 CanonOutput* output); |
| 408 |
382 // IP addresses. | 409 // IP addresses. |
383 // | 410 // |
384 // Tries to interpret the given host name as an IPv4 or IPv6 address. If it is | 411 // Tries to interpret the given host name as an IPv4 or IPv6 address. If it is |
385 // an IP address, it will canonicalize it as such, appending it to |output|. | 412 // an IP address, it will canonicalize it as such, appending it to |output|. |
386 // Additional status information is returned via the |*host_info| parameter. | 413 // Additional status information is returned via the |*host_info| parameter. |
387 // See the definition of CanonHostInfo above for details. | 414 // See the definition of CanonHostInfo above for details. |
388 // | 415 // |
389 // This is called AUTOMATICALLY from the host canonicalizer, which ensures that | 416 // This is called AUTOMATICALLY from the host canonicalizer, which ensures that |
390 // the input is unescaped and name-prepped, etc. It should not normally be | 417 // the input is unescaped and name-prepped, etc. It should not normally be |
391 // necessary or wise to call this directly. | 418 // necessary or wise to call this directly. |
(...skipping 491 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
883 bool base_is_file, | 910 bool base_is_file, |
884 const base::char16* relative_url, | 911 const base::char16* relative_url, |
885 const Component& relative_component, | 912 const Component& relative_component, |
886 CharsetConverter* query_converter, | 913 CharsetConverter* query_converter, |
887 CanonOutput* output, | 914 CanonOutput* output, |
888 Parsed* out_parsed); | 915 Parsed* out_parsed); |
889 | 916 |
890 } // namespace url | 917 } // namespace url |
891 | 918 |
892 #endif // URL_URL_CANON_H_ | 919 #endif // URL_URL_CANON_H_ |
OLD | NEW |