src/strtod.cc - Issue 3760013: Strtod fast-case that uses DiyFps and cached powers of ten.

Side by Side Diff: src/strtod.cc

Issue 3760013: Strtod fast-case that uses DiyFps and cached powers of ten. (Closed)

Patch Set: Addressed comments. Created 10 years, 2 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

OLD	NEW
1 // Copyright 2010 the V8 project authors. All rights reserved.	1 // Copyright 2010 the V8 project authors. All rights reserved.

2 // Redistribution and use in source and binary forms, with or without	2 // Redistribution and use in source and binary forms, with or without

3 // modification, are permitted provided that the following conditions are	3 // modification, are permitted provided that the following conditions are

4 // met:	4 // met:

5 //	5 //

6 // * Redistributions of source code must retain the above copyright	6 // * Redistributions of source code must retain the above copyright

7 // notice, this list of conditions and the following disclaimer.	7 // notice, this list of conditions and the following disclaimer.

8 // * Redistributions in binary form must reproduce the above	8 // * Redistributions in binary form must reproduce the above

9 // copyright notice, this list of conditions and the following	9 // copyright notice, this list of conditions and the following

10 // disclaimer in the documentation and/or other materials provided	10 // disclaimer in the documentation and/or other materials provided

(...skipping 13 matching lines...) Expand all Loading...
24 // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT	24 // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT

25 // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE	25 // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE

26 // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.	26 // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

27	27

28 #include <stdarg.h>	28 #include <stdarg.h>

29 #include <limits.h>	29 #include <limits.h>

30	30

31 #include "v8.h"	31 #include "v8.h"

32	32

33 #include "strtod.h"	33 #include "strtod.h"

34 // #include "cached-powers.h"	34 #include "cached-powers.h"

	35 #include "double.h"

35	36

36 namespace v8 {	37 namespace v8 {

37 namespace internal {	38 namespace internal {

38	39

39 // 2^53 = 9007199254740992.	40 // 2^53 = 9007199254740992.

40 // Any integer with at most 15 decimal digits will hence fit into a double	41 // Any integer with at most 15 decimal digits will hence fit into a double

41 // (which has a 53bit significand) without loss of precision.	42 // (which has a 53bit significand) without loss of precision.

42 static const int kMaxExactDoubleIntegerDecimalDigits = 15;	43 static const int kMaxExactDoubleIntegerDecimalDigits = 15;

43 // 2^64 = 18446744073709551616	44 // 2^64 = 18446744073709551616 > 10^19

44 // Any integer with at most 19 digits will hence fit into a 64bit datatype.

45 static const int kMaxUint64DecimalDigits = 19;	45 static const int kMaxUint64DecimalDigits = 19;

	46

46 // Max double: 1.7976931348623157 x 10^308	47 // Max double: 1.7976931348623157 x 10^308

47 // Min non-zero double: 4.9406564584124654 x 10^-324	48 // Min non-zero double: 4.9406564584124654 x 10^-324

48 // Any x >= 10^309 is interpreted as +infinity.	49 // Any x >= 10^309 is interpreted as +infinity.

49 // Any x <= 10^-324 is interpreted as 0.	50 // Any x <= 10^-324 is interpreted as 0.

50 // Note that 2.5e-324 (despite being smaller than the min double) will be read	51 // Note that 2.5e-324 (despite being smaller than the min double) will be read

51 // as non-zero (equal to the min non-zero double).	52 // as non-zero (equal to the min non-zero double).

52 static const int kMaxDecimalPower = 309;	53 static const int kMaxDecimalPower = 309;

53 static const int kMinDecimalPower = -324;	54 static const int kMinDecimalPower = -324;

54	55

	56 // 2^64 = 18446744073709551616

	57 static const uint64_t kMaxUint64 = V8_2PART_UINT64_C(0xFFFFFFFF, FFFFFFFF);

	58

	59

55 static const double exact_powers_of_ten[] = {	60 static const double exact_powers_of_ten[] = {

56 1.0, // 10^0	61 1.0, // 10^0

57 10.0,	62 10.0,

58 100.0,	63 100.0,

59 1000.0,	64 1000.0,

60 10000.0,	65 10000.0,

61 100000.0,	66 100000.0,

62 1000000.0,	67 1000000.0,

63 10000000.0,	68 10000000.0,

64 100000000.0,	69 100000000.0,

(...skipping 65 matching lines...) Expand 10 before \| Expand all \| Expand 10 after Loading...
130 static Vector<const char> TrimTrailingZeros(Vector<const char> buffer) {	135 static Vector<const char> TrimTrailingZeros(Vector<const char> buffer) {

131 for (int i = buffer.length() - 1; i >= 0; --i) {	136 for (int i = buffer.length() - 1; i >= 0; --i) {

132 if (buffer[i] != '0') {	137 if (buffer[i] != '0') {

133 return Vector<const char>(buffer.start(), i + 1);	138 return Vector<const char>(buffer.start(), i + 1);

134 }	139 }

135 }	140 }

136 return Vector<const char>(buffer.start(), 0);	141 return Vector<const char>(buffer.start(), 0);

137 }	142 }

138	143

139	144

140 uint64_t ReadUint64(Vector<const char> buffer) {	145 // Reads digits from the buffer and converts them to a uint64.

141 ASSERT(buffer.length() <= kMaxUint64DecimalDigits);	146 // Reads in as many digits as fit into a uint64.

	147 // When the string starts with "1844674407370955161" no further digit is read.

	148 // Since 2^64 = 18446744073709551616 it would still be possible read another

	149 // digit if it was less or equal than 6, but this would complicate the code.

	150 static uint64_t ReadUint64(Vector<const char> buffer,

	151 int* number_of_read_digits) {

142 uint64_t result = 0;	152 uint64_t result = 0;

143 for (int i = 0; i < buffer.length(); ++i) {	153 int i = 0;

144 int digit = buffer[i] - '0';	154 while (i < buffer.length() && result <= (kMaxUint64 / 10 - 1)) {

	155 int digit = buffer[i++] - '0';

145 ASSERT(0 <= digit && digit <= 9);	156 ASSERT(0 <= digit && digit <= 9);

146 result = 10 * result + digit;	157 result = 10 * result + digit;

147 }	158 }

	159 *number_of_read_digits = i;

148 return result;	160 return result;

149 }	161 }

150	162

151	163

	164 // Reads a DiyFp from the buffer.

	165 // The returned DiyFp is not necessarily normalized.

	166 // If remaining_decimals is zero then the returned DiyFp is accurate.

	167 // Otherwise it has been rounded and has error of at most 1/2 ulp.

	168 static void ReadDiyFp(Vector<const char> buffer,

	169 DiyFp* result,

	170 int* remaining_decimals) {

	171 int read_digits;

	172 uint64_t significand = ReadUint64(buffer, &read_digits);

	173 if (buffer.length() == read_digits) {

	174 *result = DiyFp(significand, 0);

	175 *remaining_decimals = 0;

	176 } else {

	177 // Round the significand.

	178 if (buffer[read_digits] >= '5') {

	179 significand++;

	180 }

	181 // Compute the binary exponent.

	182 int exponent = 0;

	183 *result = DiyFp(significand, exponent);

	184 *remaining_decimals = buffer.length() - read_digits;

	185 }

	186 }

	187

	188

152 static bool DoubleStrtod(Vector<const char> trimmed,	189 static bool DoubleStrtod(Vector<const char> trimmed,

153 int exponent,	190 int exponent,

154 double* result) {	191 double* result) {

155 #if (defined(V8_TARGET_ARCH_IA32) \|\| defined(USE_SIMULATOR)) && !defined(WIN32)	192 #if (defined(V8_TARGET_ARCH_IA32) \|\| defined(USE_SIMULATOR)) && !defined(WIN32)

156 // On x86 the floating-point stack can be 64 or 80 bits wide. If it is	193 // On x86 the floating-point stack can be 64 or 80 bits wide. If it is

157 // 80 bits wide (as is the case on Linux) then double-rounding occurs and the	194 // 80 bits wide (as is the case on Linux) then double-rounding occurs and the

158 // result is not accurate.	195 // result is not accurate.

159 // We know that Windows32 uses 64 bits and is therefore accurate.	196 // We know that Windows32 uses 64 bits and is therefore accurate.

160 // Note that the ARM simulator is compiled for 32bits. It therefore exhibits	197 // Note that the ARM simulator is compiled for 32bits. It therefore exhibits

161 // the same problem.	198 // the same problem.

162 return false;	199 return false;

163 #endif	200 #endif

164 if (trimmed.length() <= kMaxExactDoubleIntegerDecimalDigits) {	201 if (trimmed.length() <= kMaxExactDoubleIntegerDecimalDigits) {

	202 int read_digits;

165 // The trimmed input fits into a double.	203 // The trimmed input fits into a double.

166 // If the 10^exponent (resp. 10^-exponent) fits into a double too then we	204 // If the 10^exponent (resp. 10^-exponent) fits into a double too then we

167 // can compute the result-double simply by multiplying (resp. dividing) the	205 // can compute the result-double simply by multiplying (resp. dividing) the

168 // two numbers.	206 // two numbers.

169 // This is possible because IEEE guarantees that floating-point operations	207 // This is possible because IEEE guarantees that floating-point operations

170 // return the best possible approximation.	208 // return the best possible approximation.

171 if (exponent < 0 && -exponent < kExactPowersOfTenSize) {	209 if (exponent < 0 && -exponent < kExactPowersOfTenSize) {

172 // 10^-exponent fits into a double.	210 // 10^-exponent fits into a double.

173 *result = static_cast<double>(ReadUint64(trimmed));	211 *result = static_cast<double>(ReadUint64(trimmed, &read_digits));

	212 ASSERT(read_digits == trimmed.length());

174 *result /= exact_powers_of_ten[-exponent];	213 *result /= exact_powers_of_ten[-exponent];

175 return true;	214 return true;

176 }	215 }

177 if (0 <= exponent && exponent < kExactPowersOfTenSize) {	216 if (0 <= exponent && exponent < kExactPowersOfTenSize) {

178 // 10^exponent fits into a double.	217 // 10^exponent fits into a double.

179 *result = static_cast<double>(ReadUint64(trimmed));	218 *result = static_cast<double>(ReadUint64(trimmed, &read_digits));

	219 ASSERT(read_digits == trimmed.length());

180 result = exact_powers_of_ten[exponent];	220 result = exact_powers_of_ten[exponent];

181 return true;	221 return true;

182 }	222 }

183 int remaining_digits =	223 int remaining_digits =

184 kMaxExactDoubleIntegerDecimalDigits - trimmed.length();	224 kMaxExactDoubleIntegerDecimalDigits - trimmed.length();

185 if ((0 <= exponent) &&	225 if ((0 <= exponent) &&

186 (exponent - remaining_digits < kExactPowersOfTenSize)) {	226 (exponent - remaining_digits < kExactPowersOfTenSize)) {

187 // The trimmed string was short and we can multiply it with	227 // The trimmed string was short and we can multiply it with

188 // 10^remaining_digits. As a result the remaining exponent now fits	228 // 10^remaining_digits. As a result the remaining exponent now fits

189 // into a double too.	229 // into a double too.

190 *result = static_cast<double>(ReadUint64(trimmed));	230 *result = static_cast<double>(ReadUint64(trimmed, &read_digits));

	231 ASSERT(read_digits == trimmed.length());

191 result = exact_powers_of_ten[remaining_digits];	232 result = exact_powers_of_ten[remaining_digits];

192 result = exact_powers_of_ten[exponent - remaining_digits];	233 result = exact_powers_of_ten[exponent - remaining_digits];

193 return true;	234 return true;

194 }	235 }

195 }	236 }

196 return false;	237 return false;

197 }	238 }

198	239

199	240

	241 // Returns 10^exponent as an exact DiyFp.

	242 // The given exponent must be in the range [1; kDecimalExponentDistance[.

	243 static DiyFp AdjustmentPowerOfTen(int exponent) {

	244 ASSERT(0 < exponent);

	245 ASSERT(exponent < PowersOfTenCache::kDecimalExponentDistance);

	246 // Simply hardcode the remaining powers for the given decimal exponent

	247 // distance.

	248 ASSERT(PowersOfTenCache::kDecimalExponentDistance == 8);

	249 switch (exponent) {

	250 case 1: return DiyFp(V8_2PART_UINT64_C(0xa0000000, 00000000), -60);

	251 case 2: return DiyFp(V8_2PART_UINT64_C(0xc8000000, 00000000), -57);

	252 case 3: return DiyFp(V8_2PART_UINT64_C(0xfa000000, 00000000), -54);

	253 case 4: return DiyFp(V8_2PART_UINT64_C(0x9c400000, 00000000), -50);

	254 case 5: return DiyFp(V8_2PART_UINT64_C(0xc3500000, 00000000), -47);

	255 case 6: return DiyFp(V8_2PART_UINT64_C(0xf4240000, 00000000), -44);

	256 case 7: return DiyFp(V8_2PART_UINT64_C(0x98968000, 00000000), -40);

	257 default:

	258 UNREACHABLE();

	259 return DiyFp(0, 0);

	260 }

	261 }

	262

	263

	264 // If the function returns true then the result is the correct double.

	265 // Otherwise it is either the correct double or the double that is just below

	266 // the correct double.

	267 static bool DiyFpStrtod(Vector<const char> buffer,

	268 int exponent,

	269 double* result) {

	270 DiyFp input;

	271 int remaining_decimals;

	272 ReadDiyFp(buffer, &input, &remaining_decimals);

	273 // Since we may have dropped some digits the input is not accurate.

	274 // If remaining_decimals is different than 0 than the error is at most

	275 // .5 ulp (unit in the last place).

	276 // We don't want to deal with fractions and therefore keep a common

	277 // denominator.

	278 const int kDenominatorLog = 3;

	279 const int kDenominator = 1 << kDenominatorLog;

	280 // Move the remaining decimals into the exponent.

	281 exponent += remaining_decimals;

	282 int error = (remaining_decimals == 0 ? 0 : kDenominator / 2);

	283

	284 int old_e = input.e();

	285 input.Normalize();

	286 error <<= old_e - input.e();

	287

	288 ASSERT(exponent <= PowersOfTenCache::kMaxDecimalExponent);

	289 if (exponent < PowersOfTenCache::kMinDecimalExponent) {

	290 *result = 0.0;

	291 return true;

	292 }

	293 DiyFp cached_power;

	294 int cached_decimal_exponent;

	295 PowersOfTenCache::GetCachedPowerForDecimalExponent(exponent,

	296 &cached_power,

	297 &cached_decimal_exponent);

	298

	299 if (cached_decimal_exponent != exponent) {

	300 int adjustment_exponent = exponent - cached_decimal_exponent;

	301 DiyFp adjustment_power = AdjustmentPowerOfTen(adjustment_exponent);

	302 input.Multiply(adjustment_power);

	303 if (kMaxUint64DecimalDigits - buffer.length() >= adjustment_exponent) {

	304 // The product of input with the adjustment power fits into a 64 bit

	305 // integer.

	306 ASSERT(DiyFp::kSignificandSize == 64);

	307 } else {

	308 // The adjustment power is exact. There is hence only an error of 0.5.

	309 error += kDenominator / 2;

	310 }

	311 }

	312

	313 input.Multiply(cached_power);

	314 // The error introduced by a multiplication of a*b equals

	315 // error_a + error_b + error_a*error_b/2^64 + 0.5

	316 // Substituting a with 'input' and b with 'cached_power' we have

	317 // error_b = 0.5 (all cached powers have an error of less than 0.5 ulp),

	318 // error_ab = 0 or 1 / kDenominator > error_a*error_b/ 2^64

	319 int error_b = kDenominator / 2;

	320 int error_ab = (error == 0 ? 0 : 1); // We round up to 1.

	321 int fixed_error = kDenominator / 2;

	322 error += error_b + error_ab + fixed_error;

	323

	324 old_e = input.e();

	325 input.Normalize();

	326 error <<= old_e - input.e();

	327

	328 // See if the double's significand changes if we add/subtract the error.

	329 int order_of_magnitude = DiyFp::kSignificandSize + input.e();

	330 int effective_significand_size =

	331 Double::SignificandSizeForOrderOfMagnitude(order_of_magnitude);

	332 int precision_digits_count =

	333 DiyFp::kSignificandSize - effective_significand_size;

	334 if (precision_digits_count + kDenominatorLog >= DiyFp::kSignificandSize) {

	335 // This can only happen for very small denormals. In this case the

	336 // half-way multiplied by the denominator exceeds the range of an uint64.

	337 // Simply shift everything to the right.

	338 int shift_amount = (precision_digits_count + kDenominatorLog) -

	339 DiyFp::kSignificandSize + 1;

	340 input.set_f(input.f() >> shift_amount);

	341 input.set_e(input.e() + shift_amount);

	342 // We add 1 for the lost precision of error, and kDenominator for

	343 // the lost precision of input.f().

	344 error = (error >> shift_amount) + 1 + kDenominator;

	345 precision_digits_count -= shift_amount;

	346 }

	347 // We use uint64_ts now. This only works if the DiyFp uses uint64_ts too.

	348 ASSERT(DiyFp::kSignificandSize == 64);

	349 ASSERT(precision_digits_count < 64);

	350 uint64_t one64 = 1;

	351 uint64_t precision_bits_mask = (one64 << precision_digits_count) - 1;

	352 uint64_t precision_bits = input.f() & precision_bits_mask;

	353 uint64_t half_way = one64 << (precision_digits_count - 1);

	354 precision_bits *= kDenominator;

	355 half_way *= kDenominator;

	356 // If the last_bits are too close to the half-way case than we are too

	357 // inaccurate and round down. In this case we return false so that we can

	358 // fall back to a more precise algorithm.

	359 uint64_t significand = input.f();

	360 if (precision_bits >= half_way + error) {

	361 significand = (significand >> precision_digits_count) + 1;

	362 exponent = input.e() + precision_digits_count;

	363 } else {

	364 significand = (significand >> precision_digits_count);

	365 exponent = input.e() + precision_digits_count;

	366 }

	367 Double d = Double(significand, exponent);

	368 *result = d.value();

	369 if (half_way - error < precision_bits && precision_bits < half_way + error) {

	370 // Too imprecise. The caller will have to fall back to a slower version.

	371 // However the returned number is guaranteed to be either the correct

	372 // double, or the next-lower double.

	373 return false;

	374 } else {

	375 return true;

	376 }

	377 }

	378

	379

200 double Strtod(Vector<const char> buffer, int exponent) {	380 double Strtod(Vector<const char> buffer, int exponent) {

201 Vector<const char> left_trimmed = TrimLeadingZeros(buffer);	381 Vector<const char> left_trimmed = TrimLeadingZeros(buffer);

202 Vector<const char> trimmed = TrimTrailingZeros(left_trimmed);	382 Vector<const char> trimmed = TrimTrailingZeros(left_trimmed);

203 exponent += left_trimmed.length() - trimmed.length();	383 exponent += left_trimmed.length() - trimmed.length();

204 if (trimmed.length() == 0) return 0.0;	384 if (trimmed.length() == 0) return 0.0;

205 if (exponent + trimmed.length() - 1 >= kMaxDecimalPower) return V8_INFINITY;	385 if (exponent + trimmed.length() - 1 >= kMaxDecimalPower) return V8_INFINITY;

206 if (exponent + trimmed.length() <= kMinDecimalPower) return 0.0;	386 if (exponent + trimmed.length() <= kMinDecimalPower) return 0.0;

	387

207 double result;	388 double result;

208 if (DoubleStrtod(trimmed, exponent, &result)) {	389 if (DoubleStrtod(trimmed, exponent, &result) \|\|

	390 DiyFpStrtod(trimmed, exponent, &result)) {

209 return result;	391 return result;

210 }	392 }

211 return old_strtod(trimmed, exponent);	393 return old_strtod(trimmed, exponent);

212 }	394 }

213	395

214 } } // namespace v8::internal	396 } } // namespace v8::internal

OLD	NEW

« no previous file with comments | « src/fast-dtoa.cc ('k') | test/cctest/test-strtod.cc » ('j') | no next file with comments »