| Index: src/third_party/jscre/ucpinternal.h
 | 
| ===================================================================
 | 
| --- src/third_party/jscre/ucpinternal.h	(revision 1305)
 | 
| +++ src/third_party/jscre/ucpinternal.h	(working copy)
 | 
| @@ -1,126 +0,0 @@
 | 
| -/* This is JavaScriptCore's variant of the PCRE library. While this library
 | 
| -started out as a copy of PCRE, many of the features of PCRE have been
 | 
| -removed. This library now supports only the regular expression features
 | 
| -required by the JavaScript language specification, and has only the functions
 | 
| -needed by JavaScriptCore and the rest of WebKit.
 | 
| -
 | 
| -                 Originally written by Philip Hazel
 | 
| -           Copyright (c) 1997-2006 University of Cambridge
 | 
| -    Copyright (C) 2002, 2004, 2006, 2007 Apple Inc. All rights reserved.
 | 
| -
 | 
| ------------------------------------------------------------------------------
 | 
| -Redistribution and use in source and binary forms, with or without
 | 
| -modification, are permitted provided that the following conditions are met:
 | 
| -
 | 
| -    * Redistributions of source code must retain the above copyright notice,
 | 
| -      this list of conditions and the following disclaimer.
 | 
| -
 | 
| -    * Redistributions in binary form must reproduce the above copyright
 | 
| -      notice, this list of conditions and the following disclaimer in the
 | 
| -      documentation and/or other materials provided with the distribution.
 | 
| -
 | 
| -    * Neither the name of the University of Cambridge nor the names of its
 | 
| -      contributors may be used to endorse or promote products derived from
 | 
| -      this software without specific prior written permission.
 | 
| -
 | 
| -THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 | 
| -AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 | 
| -IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 | 
| -ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
 | 
| -LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 | 
| -CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 | 
| -SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 | 
| -INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 | 
| -CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 | 
| -ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 | 
| -POSSIBILITY OF SUCH DAMAGE.
 | 
| ------------------------------------------------------------------------------
 | 
| -*/
 | 
| -
 | 
| -/*************************************************
 | 
| -*           Unicode Property Table handler       *
 | 
| -*************************************************/
 | 
| -
 | 
| -/* Internal header file defining the layout of the bits in each pair of 32-bit
 | 
| -words that form a data item in the table. */
 | 
| -
 | 
| -typedef struct cnode {
 | 
| -  unsigned f0;
 | 
| -  unsigned f1;
 | 
| -} cnode;
 | 
| -
 | 
| -/* Things for the f0 field */
 | 
| -
 | 
| -#define f0_scriptmask   0xff000000  /* Mask for script field */
 | 
| -#define f0_scriptshift          24  /* Shift for script value */
 | 
| -#define f0_rangeflag    0x00f00000  /* Flag for a range item */
 | 
| -#define f0_charmask     0x001fffff  /* Mask for code point value */
 | 
| -
 | 
| -/* Things for the f1 field */
 | 
| -
 | 
| -#define f1_typemask     0xfc000000  /* Mask for char type field */
 | 
| -#define f1_typeshift            26  /* Shift for the type field */
 | 
| -#define f1_rangemask    0x0000ffff  /* Mask for a range offset */
 | 
| -#define f1_casemask     0x0000ffff  /* Mask for a case offset */
 | 
| -#define f1_caseneg      0xffff8000  /* Bits for negation */
 | 
| -
 | 
| -/* The data consists of a vector of structures of type cnode. The two unsigned
 | 
| -32-bit integers are used as follows:
 | 
| -
 | 
| -(f0) (1) The most significant byte holds the script number. The numbers are
 | 
| -         defined by the enum in ucp.h.
 | 
| -
 | 
| -     (2) The 0x00800000 bit is set if this entry defines a range of characters.
 | 
| -         It is not set if this entry defines a single character.
 | 
| -
 | 
| -     (3) The 0x00600000 bits are spare.
 | 
| -
 | 
| -     (4) The 0x001fffff bits contain the code point. No Unicode code point will
 | 
| -         ever be greater than 0x0010ffff, so this should be OK for ever.
 | 
| -
 | 
| -(f1) (1) The 0xfc000000 bits contain the character type number. The numbers are
 | 
| -         defined by an enum in ucp.h.
 | 
| -
 | 
| -     (2) The 0x03ff0000 bits are spare.
 | 
| -
 | 
| -     (3) The 0x0000ffff bits contain EITHER the unsigned offset to the top of
 | 
| -         range if this entry defines a range, OR the *signed* offset to the
 | 
| -         character's "other case" partner if this entry defines a single
 | 
| -         character. There is no partner if the value is zero.
 | 
| -
 | 
| --------------------------------------------------------------------------------
 | 
| -| script (8) |.|.|.| codepoint (21) || type (6) |.|.| spare (8) | offset (16) |
 | 
| --------------------------------------------------------------------------------
 | 
| -              | | |                              | |
 | 
| -              | | |-> spare                      | |-> spare
 | 
| -              | |                                |
 | 
| -              | |-> spare                        |-> spare
 | 
| -              |
 | 
| -              |-> range flag
 | 
| -
 | 
| -The upper/lower casing information is set only for characters that come in
 | 
| -pairs. The non-one-to-one mappings in the Unicode data are ignored.
 | 
| -
 | 
| -When searching the data, proceed as follows:
 | 
| -
 | 
| -(1) Set up for a binary chop search.
 | 
| -
 | 
| -(2) If the top is not greater than the bottom, the character is not in the
 | 
| -    table. Its type must therefore be "Cn" ("Undefined").
 | 
| -
 | 
| -(3) Find the middle vector element.
 | 
| -
 | 
| -(4) Extract the code point and compare. If equal, we are done.
 | 
| -
 | 
| -(5) If the test character is smaller, set the top to the current point, and
 | 
| -    goto (2).
 | 
| -
 | 
| -(6) If the current entry defines a range, compute the last character by adding
 | 
| -    the offset, and see if the test character is within the range. If it is,
 | 
| -    we are done.
 | 
| -
 | 
| -(7) Otherwise, set the bottom to one element past the current point and goto
 | 
| -    (2).
 | 
| -*/
 | 
| -
 | 
| -/* End of ucpinternal.h */
 | 
| 
 |