OLD | NEW |
1 //===- subzero/src/IceTargetLoweringX8632.cpp - x86-32 lowering -----------===// | 1 //===- subzero/src/IceTargetLoweringX8632.cpp - x86-32 lowering -----------===// |
2 // | 2 // |
3 // The Subzero Code Generator | 3 // The Subzero Code Generator |
4 // | 4 // |
5 // This file is distributed under the University of Illinois Open Source | 5 // This file is distributed under the University of Illinois Open Source |
6 // License. See LICENSE.TXT for details. | 6 // License. See LICENSE.TXT for details. |
7 // | 7 // |
8 //===----------------------------------------------------------------------===// | 8 //===----------------------------------------------------------------------===// |
9 // | 9 // |
10 // This file implements the TargetLoweringX8632 class, which | 10 // This file implements the TargetLoweringX8632 class, which |
(...skipping 67 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
78 #undef X | 78 #undef X |
79 }; | 79 }; |
80 const size_t TableIcmp64Size = llvm::array_lengthof(TableIcmp64); | 80 const size_t TableIcmp64Size = llvm::array_lengthof(TableIcmp64); |
81 | 81 |
82 InstX8632Br::BrCond getIcmp32Mapping(InstIcmp::ICond Cond) { | 82 InstX8632Br::BrCond getIcmp32Mapping(InstIcmp::ICond Cond) { |
83 size_t Index = static_cast<size_t>(Cond); | 83 size_t Index = static_cast<size_t>(Cond); |
84 assert(Index < TableIcmp32Size); | 84 assert(Index < TableIcmp32Size); |
85 return TableIcmp32[Index].Mapping; | 85 return TableIcmp32[Index].Mapping; |
86 } | 86 } |
87 | 87 |
| 88 // Output a valid assembly identifier for the specified type. This is |
| 89 // needed for representing vector types because the default Ostream |
| 90 // operator<< implementation does not output a valid assembly identifier |
| 91 // when the argument is a vector type. |
| 92 void emitAsmLabelForType(Ostream &OS, Type Ty) { |
| 93 if (isVectorType(Ty)) { |
| 94 OS << "v" << typeNumElements(Ty); |
| 95 } |
| 96 OS << typeElementType(Ty); |
| 97 } |
| 98 |
88 // In some cases, there are x-macros tables for both high-level and | 99 // In some cases, there are x-macros tables for both high-level and |
89 // low-level instructions/operands that use the same enum key value. | 100 // low-level instructions/operands that use the same enum key value. |
90 // The tables are kept separate to maintain a proper separation | 101 // The tables are kept separate to maintain a proper separation |
91 // between abstraction layers. There is a risk that the tables | 102 // between abstraction layers. There is a risk that the tables |
92 // could get out of sync if enum values are reordered or if entries | 103 // could get out of sync if enum values are reordered or if entries |
93 // are added or deleted. This dummy function uses static_assert to | 104 // are added or deleted. This dummy function uses static_assert to |
94 // ensure everything is kept in sync. | 105 // ensure everything is kept in sync. |
95 void xMacroIntegrityCheck() { | 106 void xMacroIntegrityCheck() { |
96 // Validate the enum values in FCMPX8632_TABLE. | 107 // Validate the enum values in FCMPX8632_TABLE. |
97 { | 108 { |
(...skipping 55 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
153 { | 164 { |
154 // Define a temporary set of enum values based on low-level | 165 // Define a temporary set of enum values based on low-level |
155 // table entries. | 166 // table entries. |
156 enum _tmp_enum { | 167 enum _tmp_enum { |
157 #define X(tag, cvt, sdss, width) _tmp_##tag, | 168 #define X(tag, cvt, sdss, width) _tmp_##tag, |
158 ICETYPEX8632_TABLE | 169 ICETYPEX8632_TABLE |
159 #undef X | 170 #undef X |
160 _num | 171 _num |
161 }; | 172 }; |
162 // Define a set of constants based on high-level table entries. | 173 // Define a set of constants based on high-level table entries. |
163 #define X(tag, size, align, str) static const int _table1_##tag = tag; | 174 #define X(tag, size, align, elts, elty, str) \ |
| 175 static const int _table1_##tag = tag; |
164 ICETYPE_TABLE; | 176 ICETYPE_TABLE; |
165 #undef X | 177 #undef X |
166 // Define a set of constants based on low-level table entries, | 178 // Define a set of constants based on low-level table entries, |
167 // and ensure the table entry keys are consistent. | 179 // and ensure the table entry keys are consistent. |
168 #define X(tag, cvt, sdss, width) \ | 180 #define X(tag, cvt, sdss, width) \ |
169 static const int _table2_##tag = _tmp_##tag; \ | 181 static const int _table2_##tag = _tmp_##tag; \ |
170 STATIC_ASSERT(_table1_##tag == _table2_##tag); | 182 STATIC_ASSERT(_table1_##tag == _table2_##tag); |
171 ICETYPEX8632_TABLE; | 183 ICETYPEX8632_TABLE; |
172 #undef X | 184 #undef X |
173 // Repeat the static asserts with respect to the high-level | 185 // Repeat the static asserts with respect to the high-level |
174 // table entries in case the high-level table has extra entries. | 186 // table entries in case the high-level table has extra entries. |
175 #define X(tag, size, align, str) STATIC_ASSERT(_table1_##tag == _table2_##tag); | 187 #define X(tag, size, align, elts, elty, str) \ |
| 188 STATIC_ASSERT(_table1_##tag == _table2_##tag); |
176 ICETYPE_TABLE; | 189 ICETYPE_TABLE; |
177 #undef X | 190 #undef X |
178 } | 191 } |
179 } | 192 } |
180 | 193 |
181 } // end of anonymous namespace | 194 } // end of anonymous namespace |
182 | 195 |
183 TargetX8632::TargetX8632(Cfg *Func) | 196 TargetX8632::TargetX8632(Cfg *Func) |
184 : TargetLowering(Func), IsEbpBasedFrame(false), FrameSizeLocals(0), | 197 : TargetLowering(Func), IsEbpBasedFrame(false), FrameSizeLocals(0), |
185 LocalsSizeBytes(0), NextLabelNumber(0), ComputedLiveRanges(false), | 198 LocalsSizeBytes(0), NextLabelNumber(0), ComputedLiveRanges(false), |
(...skipping 488 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
674 typedef ConstantDouble IceType; | 687 typedef ConstantDouble IceType; |
675 static const Type Ty = IceType_f64; | 688 static const Type Ty = IceType_f64; |
676 static const char *TypeName; | 689 static const char *TypeName; |
677 static const char *AsmTag; | 690 static const char *AsmTag; |
678 static const char *PrintfString; | 691 static const char *PrintfString; |
679 }; | 692 }; |
680 const char *PoolTypeConverter<double>::TypeName = "double"; | 693 const char *PoolTypeConverter<double>::TypeName = "double"; |
681 const char *PoolTypeConverter<double>::AsmTag = ".quad"; | 694 const char *PoolTypeConverter<double>::AsmTag = ".quad"; |
682 const char *PoolTypeConverter<double>::PrintfString = "0x%llx"; | 695 const char *PoolTypeConverter<double>::PrintfString = "0x%llx"; |
683 | 696 |
684 template <typename T> void TargetX8632::emitConstantPool() const { | 697 template <typename T> void TargetX8632::emitScalarConstantPool() const { |
685 Ostream &Str = Ctx->getStrEmit(); | 698 Ostream &Str = Ctx->getStrEmit(); |
686 Type Ty = T::Ty; | 699 Type Ty = T::Ty; |
687 SizeT Align = typeAlignInBytes(Ty); | 700 SizeT Align = typeAlignInBytes(Ty); |
688 ConstantList Pool = Ctx->getConstantPool(Ty); | 701 ConstantList Pool = Ctx->getConstantPool(Ty); |
689 | 702 |
690 Str << "\t.section\t.rodata.cst" << Align << ",\"aM\",@progbits," << Align | 703 Str << "\t.section\t.rodata.cst" << Align << ",\"aM\",@progbits," << Align |
691 << "\n"; | 704 << "\n"; |
692 Str << "\t.align\t" << Align << "\n"; | 705 Str << "\t.align\t" << Align << "\n"; |
693 for (ConstantList::const_iterator I = Pool.begin(), E = Pool.end(); I != E; | 706 for (ConstantList::const_iterator I = Pool.begin(), E = Pool.end(); I != E; |
694 ++I) { | 707 ++I) { |
695 typename T::IceType *Const = llvm::cast<typename T::IceType>(*I); | 708 typename T::IceType *Const = llvm::cast<typename T::IceType>(*I); |
696 typename T::PrimitiveFpType Value = Const->getValue(); | 709 typename T::PrimitiveFpType Value = Const->getValue(); |
697 // Use memcpy() to copy bits from Value into RawValue in a way | 710 // Use memcpy() to copy bits from Value into RawValue in a way |
698 // that avoids breaking strict-aliasing rules. | 711 // that avoids breaking strict-aliasing rules. |
699 typename T::PrimitiveIntType RawValue; | 712 typename T::PrimitiveIntType RawValue; |
700 memcpy(&RawValue, &Value, sizeof(Value)); | 713 memcpy(&RawValue, &Value, sizeof(Value)); |
701 char buf[30]; | 714 char buf[30]; |
702 int CharsPrinted = | 715 int CharsPrinted = |
703 snprintf(buf, llvm::array_lengthof(buf), T::PrintfString, RawValue); | 716 snprintf(buf, llvm::array_lengthof(buf), T::PrintfString, RawValue); |
704 assert(CharsPrinted >= 0 && | 717 assert(CharsPrinted >= 0 && |
705 (size_t)CharsPrinted < llvm::array_lengthof(buf)); | 718 (size_t)CharsPrinted < llvm::array_lengthof(buf)); |
706 (void)CharsPrinted; // avoid warnings if asserts are disabled | 719 (void)CharsPrinted; // avoid warnings if asserts are disabled |
707 Str << "L$" << Ty << "$" << Const->getPoolEntryID() << ":\n"; | 720 Str << "L$" << Ty << "$" << Const->getPoolEntryID() << ":\n"; |
708 Str << "\t" << T::AsmTag << "\t" << buf << "\t# " << T::TypeName << " " | 721 Str << "\t" << T::AsmTag << "\t" << buf << "\t# " << T::TypeName << " " |
709 << Value << "\n"; | 722 << Value << "\n"; |
710 } | 723 } |
711 } | 724 } |
712 | 725 |
| 726 void TargetX8632::emitVectorConstantPool() const { |
| 727 Ostream &Str = Ctx->getStrEmit(); |
| 728 |
| 729 // Although the PNaCl ABI doesn't require it, all vector constants are |
| 730 // aligned to 16 bytes to allow for aligned loads. |
| 731 const unsigned Align = VECT128_BYTES; |
| 732 |
| 733 Str << "\t.section\t.rodata.cst" << Align << ",\"aM\",@progbits," << Align |
| 734 << "\n"; |
| 735 Str << "\t.align\t" << Align << "\n"; |
| 736 |
| 737 // Emit each (128 bit) vector. |
| 738 // Non-I1 vectors are all in the same constant pool. |
| 739 ConstantList Vectors = Ctx->getConstantPool(IceType_v8i16); |
| 740 for (ConstantList::const_iterator I = Vectors.begin(), E = Vectors.end(); |
| 741 I != E; ++I) { |
| 742 ConstantVector *Vector = llvm::cast<ConstantVector>(*I); |
| 743 Vect128 Value = Vector->getValue(); |
| 744 assert(Value.size() == VECT128_BYTES); |
| 745 const char *Data = Value.data(); |
| 746 Str << "L$"; |
| 747 emitAsmLabelForType(Str, Vector->getType()); |
| 748 Str << "$" << Vector->getPoolEntryID() << ":\n"; |
| 749 for (unsigned Element = 0; Element < 4; ++Element) { |
| 750 uint32_t RawValue; |
| 751 memcpy(&RawValue, &Data[4 * Element], 4); |
| 752 char buf[30]; |
| 753 int CharsPrinted = |
| 754 snprintf(buf, llvm::array_lengthof(buf), "0x%x", RawValue); |
| 755 assert(CharsPrinted >= 0 && |
| 756 (size_t)CharsPrinted < llvm::array_lengthof(buf)); |
| 757 Str << "\t" |
| 758 << ".long" |
| 759 << "\t" << buf << "\t" |
| 760 << "\n"; |
| 761 } |
| 762 } |
| 763 |
| 764 // Emit each I1 vector expanded to a 128 bit constant. |
| 765 // All I1 vectors are in the same constant pool. |
| 766 ConstantList BitVectors = Ctx->getConstantPool(IceType_v4i1); |
| 767 for (ConstantList::const_iterator I = BitVectors.begin(), |
| 768 E = BitVectors.end(); |
| 769 I != E; ++I) { |
| 770 ConstantBitVector *BitVector = llvm::cast<ConstantBitVector>(*I); |
| 771 BitVect Value = BitVector->getValue(); |
| 772 Str << "L$"; |
| 773 emitAsmLabelForType(Str, BitVector->getType()); |
| 774 Str << "$" << BitVector->getPoolEntryID() << ":\n"; |
| 775 const char *AsmString = NULL; |
| 776 switch (BitVector->getType()) { |
| 777 default: |
| 778 llvm_unreachable("Unknown type"); |
| 779 case IceType_v4i1: |
| 780 AsmString = ".long"; |
| 781 break; |
| 782 case IceType_v8i1: |
| 783 AsmString = ".short"; |
| 784 break; |
| 785 case IceType_v16i1: |
| 786 AsmString = ".byte"; |
| 787 break; |
| 788 } |
| 789 unsigned NumElements = Value.size(); |
| 790 for (unsigned Element = 0; Element < NumElements; ++Element) { |
| 791 Str << "\t" << AsmString << "\t" |
| 792 << "0x"; |
| 793 Str << (Value[Element] ? "1" : "0"); |
| 794 Str << "\t" |
| 795 << "\n"; |
| 796 } |
| 797 } |
| 798 } |
| 799 |
713 void TargetX8632::emitConstants() const { | 800 void TargetX8632::emitConstants() const { |
714 emitConstantPool<PoolTypeConverter<float> >(); | 801 emitScalarConstantPool<PoolTypeConverter<float> >(); |
715 emitConstantPool<PoolTypeConverter<double> >(); | 802 emitScalarConstantPool<PoolTypeConverter<double> >(); |
| 803 emitVectorConstantPool(); |
716 | 804 |
717 // No need to emit constants from the int pool since (for x86) they | 805 // No need to emit constants from the int pool since (for x86) they |
718 // are embedded as immediates in the instructions. | 806 // are embedded as immediates in the instructions. |
719 } | 807 } |
720 | 808 |
721 void TargetX8632::split64(Variable *Var) { | 809 void TargetX8632::split64(Variable *Var) { |
722 switch (Var->getType()) { | 810 switch (Var->getType()) { |
723 default: | 811 default: |
724 return; | 812 return; |
725 case IceType_i64: | 813 case IceType_i64: |
(...skipping 564 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
1290 } | 1378 } |
1291 StackOffset += typeWidthInBytesOnStack(Arg->getType()); | 1379 StackOffset += typeWidthInBytesOnStack(Arg->getType()); |
1292 } | 1380 } |
1293 // Generate the call instruction. Assign its result to a temporary | 1381 // Generate the call instruction. Assign its result to a temporary |
1294 // with high register allocation weight. | 1382 // with high register allocation weight. |
1295 Variable *Dest = Instr->getDest(); | 1383 Variable *Dest = Instr->getDest(); |
1296 Variable *eax = NULL; // doubles as RegLo as necessary | 1384 Variable *eax = NULL; // doubles as RegLo as necessary |
1297 Variable *edx = NULL; | 1385 Variable *edx = NULL; |
1298 if (Dest) { | 1386 if (Dest) { |
1299 switch (Dest->getType()) { | 1387 switch (Dest->getType()) { |
| 1388 case IceType_v4i1: |
| 1389 case IceType_v8i1: |
| 1390 case IceType_v16i1: |
| 1391 case IceType_v16i8: |
| 1392 case IceType_v8i16: |
| 1393 case IceType_v4i32: |
| 1394 case IceType_v4f32: |
1300 case IceType_NUM: | 1395 case IceType_NUM: |
1301 llvm_unreachable("Invalid Call dest type"); | 1396 llvm_unreachable("Invalid Call dest type"); |
1302 break; | 1397 break; |
1303 case IceType_void: | 1398 case IceType_void: |
1304 break; | 1399 break; |
1305 case IceType_i1: | 1400 case IceType_i1: |
1306 case IceType_i8: | 1401 case IceType_i8: |
1307 case IceType_i16: | 1402 case IceType_i16: |
1308 case IceType_i32: | 1403 case IceType_i32: |
1309 eax = makeReg(Dest->getType(), Reg_eax); | 1404 eax = makeReg(Dest->getType(), Reg_eax); |
(...skipping 954 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
2264 if (Inst->hasRetValue()) { | 2359 if (Inst->hasRetValue()) { |
2265 Operand *Src0 = legalize(Inst->getRetValue()); | 2360 Operand *Src0 = legalize(Inst->getRetValue()); |
2266 if (Src0->getType() == IceType_i64) { | 2361 if (Src0->getType() == IceType_i64) { |
2267 Variable *eax = legalizeToVar(loOperand(Src0), false, Reg_eax); | 2362 Variable *eax = legalizeToVar(loOperand(Src0), false, Reg_eax); |
2268 Variable *edx = legalizeToVar(hiOperand(Src0), false, Reg_edx); | 2363 Variable *edx = legalizeToVar(hiOperand(Src0), false, Reg_edx); |
2269 Reg = eax; | 2364 Reg = eax; |
2270 Context.insert(InstFakeUse::create(Func, edx)); | 2365 Context.insert(InstFakeUse::create(Func, edx)); |
2271 } else if (Src0->getType() == IceType_f32 || | 2366 } else if (Src0->getType() == IceType_f32 || |
2272 Src0->getType() == IceType_f64) { | 2367 Src0->getType() == IceType_f64) { |
2273 _fld(Src0); | 2368 _fld(Src0); |
| 2369 } else if (isVectorType(Src0->getType())) { |
| 2370 Reg = legalizeToVar(Src0, false, Reg_xmm0); |
2274 } else { | 2371 } else { |
2275 _mov(Reg, Src0, Reg_eax); | 2372 _mov(Reg, Src0, Reg_eax); |
2276 } | 2373 } |
2277 } | 2374 } |
2278 _ret(Reg); | 2375 _ret(Reg); |
2279 // Add a fake use of esp to make sure esp stays alive for the entire | 2376 // Add a fake use of esp to make sure esp stays alive for the entire |
2280 // function. Otherwise post-call esp adjustments get dead-code | 2377 // function. Otherwise post-call esp adjustments get dead-code |
2281 // eliminated. TODO: Are there more places where the fake use | 2378 // eliminated. TODO: Are there more places where the fake use |
2282 // should be inserted? E.g. "void f(int n){while(1) g(n);}" may not | 2379 // should be inserted? E.g. "void f(int n){while(1) g(n);}" may not |
2283 // have a ret instruction. | 2380 // have a ret instruction. |
(...skipping 101 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
2385 _br(Inst->getLabelDefault()); | 2482 _br(Inst->getLabelDefault()); |
2386 } | 2483 } |
2387 | 2484 |
2388 void TargetX8632::lowerUnreachable(const InstUnreachable * /*Inst*/) { | 2485 void TargetX8632::lowerUnreachable(const InstUnreachable * /*Inst*/) { |
2389 const SizeT MaxSrcs = 0; | 2486 const SizeT MaxSrcs = 0; |
2390 Variable *Dest = NULL; | 2487 Variable *Dest = NULL; |
2391 InstCall *Call = makeHelperCall("ice_unreachable", Dest, MaxSrcs); | 2488 InstCall *Call = makeHelperCall("ice_unreachable", Dest, MaxSrcs); |
2392 lowerCall(Call); | 2489 lowerCall(Call); |
2393 } | 2490 } |
2394 | 2491 |
| 2492 // Helper for legalize() to emit the right code to lower an operand to a |
| 2493 // register of the appropriate type. |
| 2494 Variable *TargetX8632::copyToReg(Operand *Src, int32_t RegNum) { |
| 2495 Type Ty = Src->getType(); |
| 2496 Variable *Reg = makeReg(Ty, RegNum); |
| 2497 if (isVectorType(Src->getType())) { |
| 2498 _movp(Reg, Src); |
| 2499 } else { |
| 2500 _mov(Reg, Src); |
| 2501 } |
| 2502 return Reg; |
| 2503 } |
| 2504 |
2395 Operand *TargetX8632::legalize(Operand *From, LegalMask Allowed, | 2505 Operand *TargetX8632::legalize(Operand *From, LegalMask Allowed, |
2396 bool AllowOverlap, int32_t RegNum) { | 2506 bool AllowOverlap, int32_t RegNum) { |
2397 // Assert that a physical register is allowed. To date, all calls | 2507 // Assert that a physical register is allowed. To date, all calls |
2398 // to legalize() allow a physical register. If a physical register | 2508 // to legalize() allow a physical register. If a physical register |
2399 // needs to be explicitly disallowed, then new code will need to be | 2509 // needs to be explicitly disallowed, then new code will need to be |
2400 // written to force a spill. | 2510 // written to force a spill. |
2401 assert(Allowed & Legal_Reg); | 2511 assert(Allowed & Legal_Reg); |
2402 // If we're asking for a specific physical register, make sure we're | 2512 // If we're asking for a specific physical register, make sure we're |
2403 // not allowing any other operand kinds. (This could be future | 2513 // not allowing any other operand kinds. (This could be future |
2404 // work, e.g. allow the shl shift amount to be either an immediate | 2514 // work, e.g. allow the shl shift amount to be either an immediate |
(...skipping 12 matching lines...) Expand all Loading... |
2417 if (Index) { | 2527 if (Index) { |
2418 RegIndex = legalizeToVar(Index, true); | 2528 RegIndex = legalizeToVar(Index, true); |
2419 } | 2529 } |
2420 if (Base != RegBase || Index != RegIndex) { | 2530 if (Base != RegBase || Index != RegIndex) { |
2421 From = OperandX8632Mem::create( | 2531 From = OperandX8632Mem::create( |
2422 Func, Mem->getType(), RegBase, Mem->getOffset(), RegIndex, | 2532 Func, Mem->getType(), RegBase, Mem->getOffset(), RegIndex, |
2423 Mem->getShift(), Mem->getSegmentRegister()); | 2533 Mem->getShift(), Mem->getSegmentRegister()); |
2424 } | 2534 } |
2425 | 2535 |
2426 if (!(Allowed & Legal_Mem)) { | 2536 if (!(Allowed & Legal_Mem)) { |
2427 Variable *Reg = makeReg(From->getType(), RegNum); | 2537 From = copyToReg(From, RegNum); |
2428 _mov(Reg, From, RegNum); | |
2429 From = Reg; | |
2430 } | 2538 } |
2431 return From; | 2539 return From; |
2432 } | 2540 } |
2433 if (llvm::isa<Constant>(From)) { | 2541 if (llvm::isa<Constant>(From)) { |
2434 if (llvm::isa<ConstantUndef>(From)) { | 2542 if (llvm::isa<ConstantUndef>(From)) { |
2435 // Lower undefs to zero. Another option is to lower undefs to an | 2543 // Lower undefs to zero. Another option is to lower undefs to an |
2436 // uninitialized register; however, using an uninitialized register | 2544 // uninitialized register; however, using an uninitialized register |
2437 // results in less predictable code. | 2545 // results in less predictable code. |
2438 // | 2546 // |
2439 // If in the future the implementation is changed to lower undef | 2547 // If in the future the implementation is changed to lower undef |
2440 // values to uninitialized registers, a FakeDef will be needed: | 2548 // values to uninitialized registers, a FakeDef will be needed: |
2441 // Context.insert(InstFakeDef::create(Func, Reg)); | 2549 // Context.insert(InstFakeDef::create(Func, Reg)); |
2442 // This is in order to ensure that the live range of Reg is not | 2550 // This is in order to ensure that the live range of Reg is not |
2443 // overestimated. If the constant being lowered is a 64 bit value, | 2551 // overestimated. If the constant being lowered is a 64 bit value, |
2444 // then the result should be split and the lo and hi components will | 2552 // then the result should be split and the lo and hi components will |
2445 // need to go in uninitialized registers. | 2553 // need to go in uninitialized registers. |
2446 From = Ctx->getConstantZero(From->getType()); | 2554 From = Ctx->getConstantZero(From->getType()); |
2447 } | 2555 } |
2448 bool NeedsReg = | 2556 bool NeedsReg = |
2449 !(Allowed & Legal_Imm) || | 2557 !(Allowed & Legal_Imm) || |
2450 // ConstantFloat and ConstantDouble are actually memory operands. | 2558 // ConstantFloat, ConstantDouble, and vector constants are |
| 2559 // actually memory operands. |
2451 (!(Allowed & Legal_Mem) && | 2560 (!(Allowed & Legal_Mem) && |
2452 (From->getType() == IceType_f32 || From->getType() == IceType_f64)); | 2561 (From->getType() == IceType_f32 || From->getType() == IceType_f64 || |
| 2562 isVectorType(From->getType()))); |
2453 if (NeedsReg) { | 2563 if (NeedsReg) { |
2454 Variable *Reg = makeReg(From->getType(), RegNum); | 2564 From = copyToReg(From, RegNum); |
2455 _mov(Reg, From); | |
2456 From = Reg; | |
2457 } | 2565 } |
2458 return From; | 2566 return From; |
2459 } | 2567 } |
2460 if (Variable *Var = llvm::dyn_cast<Variable>(From)) { | 2568 if (Variable *Var = llvm::dyn_cast<Variable>(From)) { |
2461 // We need a new physical register for the operand if: | 2569 // We need a new physical register for the operand if: |
2462 // Mem is not allowed and Var->getRegNum() is unknown, or | 2570 // Mem is not allowed and Var->getRegNum() is unknown, or |
2463 // RegNum is required and Var->getRegNum() doesn't match. | 2571 // RegNum is required and Var->getRegNum() doesn't match. |
2464 if ((!(Allowed & Legal_Mem) && !Var->hasReg()) || | 2572 if ((!(Allowed & Legal_Mem) && !Var->hasReg()) || |
2465 (RegNum != Variable::NoRegister && RegNum != Var->getRegNum())) { | 2573 (RegNum != Variable::NoRegister && RegNum != Var->getRegNum())) { |
2466 Variable *Reg = makeReg(From->getType(), RegNum); | 2574 Variable *Reg = copyToReg(From, RegNum); |
2467 if (RegNum == Variable::NoRegister) { | 2575 if (RegNum == Variable::NoRegister) { |
2468 Reg->setPreferredRegister(Var, AllowOverlap); | 2576 Reg->setPreferredRegister(Var, AllowOverlap); |
2469 } | 2577 } |
2470 _mov(Reg, From); | |
2471 From = Reg; | 2578 From = Reg; |
2472 } | 2579 } |
2473 return From; | 2580 return From; |
2474 } | 2581 } |
2475 llvm_unreachable("Unhandled operand kind in legalize()"); | 2582 llvm_unreachable("Unhandled operand kind in legalize()"); |
2476 return From; | 2583 return From; |
2477 } | 2584 } |
2478 | 2585 |
2479 // Provide a trivial wrapper to legalize() for this common usage. | 2586 // Provide a trivial wrapper to legalize() for this common usage. |
2480 Variable *TargetX8632::legalizeToVar(Operand *From, bool AllowOverlap, | 2587 Variable *TargetX8632::legalizeToVar(Operand *From, bool AllowOverlap, |
(...skipping 81 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
2562 } | 2669 } |
2563 assert(AvailableTypedRegisters.any()); | 2670 assert(AvailableTypedRegisters.any()); |
2564 int32_t RegNum = AvailableTypedRegisters.find_first(); | 2671 int32_t RegNum = AvailableTypedRegisters.find_first(); |
2565 Var->setRegNum(RegNum); | 2672 Var->setRegNum(RegNum); |
2566 AvailableRegisters[RegNum] = false; | 2673 AvailableRegisters[RegNum] = false; |
2567 } | 2674 } |
2568 } | 2675 } |
2569 } | 2676 } |
2570 } | 2677 } |
2571 | 2678 |
| 2679 template <> void ConstantInteger::emit(GlobalContext *Ctx) const { |
| 2680 Ostream &Str = Ctx->getStrEmit(); |
| 2681 Str << getValue(); |
| 2682 } |
| 2683 |
2572 template <> void ConstantFloat::emit(GlobalContext *Ctx) const { | 2684 template <> void ConstantFloat::emit(GlobalContext *Ctx) const { |
2573 Ostream &Str = Ctx->getStrEmit(); | 2685 Ostream &Str = Ctx->getStrEmit(); |
2574 // It would be better to prefix with ".L$" instead of "L$", but | 2686 // It would be better to prefix with ".L$" instead of "L$", but |
2575 // llvm-mc doesn't parse "dword ptr [.L$foo]". | 2687 // llvm-mc doesn't parse "dword ptr [.L$foo]". |
2576 Str << "dword ptr [L$" << IceType_f32 << "$" << getPoolEntryID() << "]"; | 2688 Str << "dword ptr [L$" << IceType_f32 << "$" << getPoolEntryID() << "]"; |
2577 } | 2689 } |
2578 | 2690 |
2579 template <> void ConstantDouble::emit(GlobalContext *Ctx) const { | 2691 template <> void ConstantDouble::emit(GlobalContext *Ctx) const { |
2580 Ostream &Str = Ctx->getStrEmit(); | 2692 Ostream &Str = Ctx->getStrEmit(); |
2581 Str << "qword ptr [L$" << IceType_f64 << "$" << getPoolEntryID() << "]"; | 2693 Str << "qword ptr [L$" << IceType_f64 << "$" << getPoolEntryID() << "]"; |
2582 } | 2694 } |
2583 | 2695 |
| 2696 template <> void ConstantVector::emit(GlobalContext *Ctx) const { |
| 2697 Ostream &Str = Ctx->getStrEmit(); |
| 2698 Str << "xmmword ptr [L$"; |
| 2699 emitAsmLabelForType(Str, getType()); |
| 2700 Str << "$" << getPoolEntryID() << "]"; |
| 2701 } |
| 2702 |
| 2703 template <> void ConstantBitVector::emit(GlobalContext *Ctx) const { |
| 2704 Ostream &Str = Ctx->getStrEmit(); |
| 2705 Str << "xmmword ptr [L$"; |
| 2706 emitAsmLabelForType(Str, getType()); |
| 2707 Str << "$" << getPoolEntryID() << "]"; |
| 2708 } |
| 2709 |
2584 } // end of namespace Ice | 2710 } // end of namespace Ice |
OLD | NEW |