src/arm/codegen-arm.cc - Issue 2876011: Do integer mod via sum-of-digits technique. This benefits the date

Unified Diff: src/arm/codegen-arm.cc

Issue 2876011: Do integer mod via sum-of-digits technique. This benefits the date (Closed) Base URL: http://v8.googlecode.com/svn/branches/bleeding_edge/

Patch Set: Created 10 years, 6 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

Index: src/arm/codegen-arm.cc

===================================================================

--- src/arm/codegen-arm.cc (revision 4950)

+++ src/arm/codegen-arm.cc (working copy)

@@ -6258,6 +6258,86 @@

#define __ ACCESS_MASM(masm)

+// This uses versions of the sum-of-digits-to-see-if-a-number-is-divisible-by-3

+// trick. See http://en.wikipedia.org/wiki/Divisibility_rule

+// Takes the sum of the digits base (mask + 1) repeatedly until we have a

+// number from 0 to mask. On exit the 'eq' condition flags are set if the

+// answer is exactly the mask.

+void DigitSum(MacroAssembler* masm,

Søren Thygesen Gjesse 2010/06/28 07:19:36 static (times 5)? And why are these functions not

+ Register lhs,

+ int mask,

+ int shift) {

+ ASSERT(mask > 0);

+ ASSERT(mask <= 0xff); // This ensures the mask can be used without loading it into ip.

+ Label loop, entry;

+ __ jmp(&entry);

+ __ bind(&loop);

+ __ and_(ip, lhs, Operand(mask));

+ __ add(lhs, ip, Operand(lhs, LSR, shift));

+ __ bind(&entry);

+ __ cmp(lhs, Operand(mask));

+ __ b(gt, &loop);

+void DigitSum(MacroAssembler* masm,

+ Register lhs,

+ Register scratch,

+ int mask,

+ int shift1,

+ int shift2) {

+ ASSERT(mask > 0);

+ ASSERT(mask <= 0xff); // This ensures the mask can be used without loading it into ip.

+ Label loop, entry;

+ __ jmp(&entry);

+ __ bind(&loop);

+ __ bic(scratch, lhs, Operand(mask));

+ __ and_(ip, lhs, Operand(mask));

+ __ add(lhs, ip, Operand(lhs, LSR, shift1));

+ __ add(lhs, lhs, Operand(scratch, LSR, shift2));

+ __ bind(&entry);

+ __ cmp(lhs, Operand(mask));

+ __ b(gt, &loop);

+// Splits the number into two halves (bottom half has shift bits). The top

+// half is subtracted from the bottom half. If the result is negative then

+// rhs is added.

+void ModGetInRangeBySubtraction(MacroAssembler* masm,

+ Register lhs,

+ int shift,

+ int rhs) {

+ int mask = (1 << shift) - 1;

+ __ and_(ip, lhs, Operand(mask));

+ __ sub(lhs, ip, Operand(lhs, LSR, shift), SetCC);

+ __ add(lhs, lhs, Operand(rhs), LeaveCC, mi);

+void ModReduce(MacroAssembler* masm,

+ Register lhs,

+ int max,

+ int denominator) {

+ int limit = denominator;

+ while (limit * 2 <= max) limit *= 2;

+ while (limit >= denominator) {

+ __ cmp(lhs, Operand(limit));

+ __ sub(lhs, lhs, Operand(limit), LeaveCC, ge);

+ limit >>= 1;

+ }

+void ModAnswer(MacroAssembler* masm,

+ Register result,

+ Register shift_distance,

+ Register mask_bits,

+ Register sum_of_digits) {

+ __ add(result, mask_bits, Operand(sum_of_digits, LSL, shift_distance));

+ __ Ret();

Handle<String> Reference::GetName() {

ASSERT(type_ == NAMED);

Property* property = expression_->AsProperty();

@@ -6621,7 +6701,7 @@

__ bind(&not_special);

// Count leading zeros. Uses mantissa for a scratch register on pre-ARM5.

// Gets the wrong answer for 0, but we already checked for that case above.

- __ CountLeadingZeros(source_, mantissa, zeros_);

+ __ CountLeadingZeros(zeros_, source_, mantissa);

// Compute exponent and or it into the exponent register.

// We use mantissa as a scratch register here. Use a fudge factor to

// divide the constant 31 + HeapNumber::kExponentBias, 0x41d, into two parts

@@ -7350,7 +7430,7 @@

// If we have floating point hardware, inline ADD, SUB, MUL, and DIV,

// using registers d7 and d6 for the double values.

- if (use_fp_registers) {

+ if (CpuFeatures::IsSupported(VFP3)) {

CpuFeatures::Scope scope(VFP3);

__ mov(r7, Operand(rhs, ASR, kSmiTagSize));

__ vmov(s15, r7);

@@ -7358,8 +7438,12 @@

__ mov(r7, Operand(lhs, ASR, kSmiTagSize));

__ vmov(s13, r7);

__ vcvt_f64_s32(d6, s13);

+ if (!use_fp_registers) {

+ __ vmov(r2, r3, d7);

+ __ vmov(r0, r1, d6);

+ }

} else {

- // Write Smi from rhs to r3 and r2 in double format. r3 is scratch.

+ // Write Smi from rhs to r3 and r2 in double format. r9 is scratch.

__ mov(r7, Operand(rhs));

ConvertToDoubleStub stub1(r3, r2, r7, r9);

__ push(lr);

@@ -7434,12 +7518,15 @@

__ AllocateHeapNumber(r5, r4, r7, heap_number_map, &slow);

}

- if (use_fp_registers) {

+ if (CpuFeatures::IsSupported(VFP3)) {

CpuFeatures::Scope scope(VFP3);

// Convert smi in r0 to double in d7.

__ mov(r7, Operand(r0, ASR, kSmiTagSize));

__ vmov(s15, r7);

__ vcvt_f64_s32(d7, s15);

+ if (!use_fp_registers) {

+ __ vmov(r2, r3, d7);

+ }

} else {

// Write Smi from r0 to r3 and r2 in double format.

__ mov(r7, Operand(r0));

@@ -7490,12 +7577,15 @@

__ AllocateHeapNumber(r5, r4, r7, heap_number_map, &slow);

}

- if (use_fp_registers) {

+ if (CpuFeatures::IsSupported(VFP3)) {

CpuFeatures::Scope scope(VFP3);

// Convert smi in r1 to double in d6.

__ mov(r7, Operand(r1, ASR, kSmiTagSize));

__ vmov(s13, r7);

__ vcvt_f64_s32(d6, s13);

+ if (!use_fp_registers) {

+ __ vmov(r0, r1, d6);

+ }

} else {

// Write Smi from r1 to r1 and r0 in double format.

__ mov(r7, Operand(r1));

@@ -7942,6 +8032,98 @@

}

+// See comment for class.

+void IntegerModStub::Generate(MacroAssembler* masm) {

+ __ mov(lhs_, Operand(lhs_, LSR, shift_distance_));

+ __ bic(odd_number_, odd_number_, Operand(1));

+ __ mov(odd_number_, Operand(odd_number_, LSL, 1));

+ // We now have (odd_number_ - 1) * 2 in the register.

+ // Build a switch out of branches instead of data because it avoids

+ // having to teach the assembler about intra-code-object pointers

+ // that are not in relative branch instructions.

+ Label mod3, mod5, mod7, mod9, mod11, mod13, mod15, mod17, mod19;

+ Label mod21, mod23, mod25;

+ { Assembler::BlockConstPoolScope block_const_pool(masm);

+ __ add(pc, pc, Operand(odd_number_));

+ // When you read pc it is always 8 ahead, but when you write it you always

+ // write the actual value. So we put in two nops to take up the slack.

+ __ nop();

+ __ b(&mod3);

+ __ b(&mod5);

+ __ b(&mod7);

+ __ b(&mod9);

+ __ b(&mod11);

+ __ b(&mod13);

+ __ b(&mod15);

+ __ b(&mod17);

+ __ b(&mod19);

+ __ b(&mod21);

+ __ b(&mod23);

+ __ b(&mod25);

+ }

+ __ bind(&mod3);

+ DigitSum(masm, lhs_, 3, 2);

+ __ sub(lhs_, lhs_, Operand(3), LeaveCC, eq);