| OLD | NEW | 
|---|
| 1 //===- subzero/src/IceTargetLoweringX8632.cpp - x86-32 lowering -----------===// | 1 //===- subzero/src/IceTargetLoweringX8632.cpp - x86-32 lowering -----------===// | 
| 2 // | 2 // | 
| 3 //                        The Subzero Code Generator | 3 //                        The Subzero Code Generator | 
| 4 // | 4 // | 
| 5 // This file is distributed under the University of Illinois Open Source | 5 // This file is distributed under the University of Illinois Open Source | 
| 6 // License. See LICENSE.TXT for details. | 6 // License. See LICENSE.TXT for details. | 
| 7 // | 7 // | 
| 8 //===----------------------------------------------------------------------===// | 8 //===----------------------------------------------------------------------===// | 
| 9 // | 9 // | 
| 10 // This file implements the TargetLoweringX8632 class, which | 10 // This file implements the TargetLoweringX8632 class, which | 
| (...skipping 67 matching lines...) Expand 10 before | Expand all | Expand 10 after  Loading... | 
| 78 #undef X | 78 #undef X | 
| 79   }; | 79   }; | 
| 80 const size_t TableIcmp64Size = llvm::array_lengthof(TableIcmp64); | 80 const size_t TableIcmp64Size = llvm::array_lengthof(TableIcmp64); | 
| 81 | 81 | 
| 82 InstX8632Br::BrCond getIcmp32Mapping(InstIcmp::ICond Cond) { | 82 InstX8632Br::BrCond getIcmp32Mapping(InstIcmp::ICond Cond) { | 
| 83   size_t Index = static_cast<size_t>(Cond); | 83   size_t Index = static_cast<size_t>(Cond); | 
| 84   assert(Index < TableIcmp32Size); | 84   assert(Index < TableIcmp32Size); | 
| 85   return TableIcmp32[Index].Mapping; | 85   return TableIcmp32[Index].Mapping; | 
| 86 } | 86 } | 
| 87 | 87 | 
|  | 88 // Output a valid assembly identifier for the specified type. This is | 
|  | 89 // needed for representing vector types because the default Ostream | 
|  | 90 // operator<< implementation does not output a valid assembly identifier | 
|  | 91 // when the argument is a vector type. | 
|  | 92 void emitAsmLabelForType(Ostream &OS, Type Ty) { | 
|  | 93   if (isVectorType(Ty)) { | 
|  | 94     OS << "v" << typeNumElements(Ty); | 
|  | 95   } | 
|  | 96   OS << typeElementType(Ty); | 
|  | 97 } | 
|  | 98 | 
| 88 // In some cases, there are x-macros tables for both high-level and | 99 // In some cases, there are x-macros tables for both high-level and | 
| 89 // low-level instructions/operands that use the same enum key value. | 100 // low-level instructions/operands that use the same enum key value. | 
| 90 // The tables are kept separate to maintain a proper separation | 101 // The tables are kept separate to maintain a proper separation | 
| 91 // between abstraction layers.  There is a risk that the tables | 102 // between abstraction layers.  There is a risk that the tables | 
| 92 // could get out of sync if enum values are reordered or if entries | 103 // could get out of sync if enum values are reordered or if entries | 
| 93 // are added or deleted.  This dummy function uses static_assert to | 104 // are added or deleted.  This dummy function uses static_assert to | 
| 94 // ensure everything is kept in sync. | 105 // ensure everything is kept in sync. | 
| 95 void xMacroIntegrityCheck() { | 106 void xMacroIntegrityCheck() { | 
| 96   // Validate the enum values in FCMPX8632_TABLE. | 107   // Validate the enum values in FCMPX8632_TABLE. | 
| 97   { | 108   { | 
| (...skipping 55 matching lines...) Expand 10 before | Expand all | Expand 10 after  Loading... | 
| 153   { | 164   { | 
| 154     // Define a temporary set of enum values based on low-level | 165     // Define a temporary set of enum values based on low-level | 
| 155     // table entries. | 166     // table entries. | 
| 156     enum _tmp_enum { | 167     enum _tmp_enum { | 
| 157 #define X(tag, cvt, sdss, width) _tmp_##tag, | 168 #define X(tag, cvt, sdss, width) _tmp_##tag, | 
| 158       ICETYPEX8632_TABLE | 169       ICETYPEX8632_TABLE | 
| 159 #undef X | 170 #undef X | 
| 160           _num | 171           _num | 
| 161     }; | 172     }; | 
| 162 // Define a set of constants based on high-level table entries. | 173 // Define a set of constants based on high-level table entries. | 
| 163 #define X(tag, size, align, str) static const int _table1_##tag = tag; | 174 #define X(tag, size, align, elts, elty, str)                                   \ | 
|  | 175   static const int _table1_##tag = tag; | 
| 164     ICETYPE_TABLE; | 176     ICETYPE_TABLE; | 
| 165 #undef X | 177 #undef X | 
| 166 // Define a set of constants based on low-level table entries, | 178 // Define a set of constants based on low-level table entries, | 
| 167 // and ensure the table entry keys are consistent. | 179 // and ensure the table entry keys are consistent. | 
| 168 #define X(tag, cvt, sdss, width)                                               \ | 180 #define X(tag, cvt, sdss, width)                                               \ | 
| 169   static const int _table2_##tag = _tmp_##tag;                                 \ | 181   static const int _table2_##tag = _tmp_##tag;                                 \ | 
| 170   STATIC_ASSERT(_table1_##tag == _table2_##tag); | 182   STATIC_ASSERT(_table1_##tag == _table2_##tag); | 
| 171     ICETYPEX8632_TABLE; | 183     ICETYPEX8632_TABLE; | 
| 172 #undef X | 184 #undef X | 
| 173 // Repeat the static asserts with respect to the high-level | 185 // Repeat the static asserts with respect to the high-level | 
| 174 // table entries in case the high-level table has extra entries. | 186 // table entries in case the high-level table has extra entries. | 
| 175 #define X(tag, size, align, str) STATIC_ASSERT(_table1_##tag == _table2_##tag); | 187 #define X(tag, size, align, elts, elty, str)                                   \ | 
|  | 188   STATIC_ASSERT(_table1_##tag == _table2_##tag); | 
| 176     ICETYPE_TABLE; | 189     ICETYPE_TABLE; | 
| 177 #undef X | 190 #undef X | 
| 178   } | 191   } | 
| 179 } | 192 } | 
| 180 | 193 | 
| 181 } // end of anonymous namespace | 194 } // end of anonymous namespace | 
| 182 | 195 | 
| 183 TargetX8632::TargetX8632(Cfg *Func) | 196 TargetX8632::TargetX8632(Cfg *Func) | 
| 184     : TargetLowering(Func), IsEbpBasedFrame(false), FrameSizeLocals(0), | 197     : TargetLowering(Func), IsEbpBasedFrame(false), FrameSizeLocals(0), | 
| 185       LocalsSizeBytes(0), NextLabelNumber(0), ComputedLiveRanges(false), | 198       LocalsSizeBytes(0), NextLabelNumber(0), ComputedLiveRanges(false), | 
| (...skipping 488 matching lines...) Expand 10 before | Expand all | Expand 10 after  Loading... | 
| 674   typedef ConstantDouble IceType; | 687   typedef ConstantDouble IceType; | 
| 675   static const Type Ty = IceType_f64; | 688   static const Type Ty = IceType_f64; | 
| 676   static const char *TypeName; | 689   static const char *TypeName; | 
| 677   static const char *AsmTag; | 690   static const char *AsmTag; | 
| 678   static const char *PrintfString; | 691   static const char *PrintfString; | 
| 679 }; | 692 }; | 
| 680 const char *PoolTypeConverter<double>::TypeName = "double"; | 693 const char *PoolTypeConverter<double>::TypeName = "double"; | 
| 681 const char *PoolTypeConverter<double>::AsmTag = ".quad"; | 694 const char *PoolTypeConverter<double>::AsmTag = ".quad"; | 
| 682 const char *PoolTypeConverter<double>::PrintfString = "0x%llx"; | 695 const char *PoolTypeConverter<double>::PrintfString = "0x%llx"; | 
| 683 | 696 | 
| 684 template <typename T> void TargetX8632::emitConstantPool() const { | 697 template <typename T> void TargetX8632::emitScalarConstantPool() const { | 
| 685   Ostream &Str = Ctx->getStrEmit(); | 698   Ostream &Str = Ctx->getStrEmit(); | 
| 686   Type Ty = T::Ty; | 699   Type Ty = T::Ty; | 
| 687   SizeT Align = typeAlignInBytes(Ty); | 700   SizeT Align = typeAlignInBytes(Ty); | 
| 688   ConstantList Pool = Ctx->getConstantPool(Ty); | 701   ConstantList Pool = Ctx->getConstantPool(Ty); | 
| 689 | 702 | 
| 690   Str << "\t.section\t.rodata.cst" << Align << ",\"aM\",@progbits," << Align | 703   Str << "\t.section\t.rodata.cst" << Align << ",\"aM\",@progbits," << Align | 
| 691       << "\n"; | 704       << "\n"; | 
| 692   Str << "\t.align\t" << Align << "\n"; | 705   Str << "\t.align\t" << Align << "\n"; | 
| 693   for (ConstantList::const_iterator I = Pool.begin(), E = Pool.end(); I != E; | 706   for (ConstantList::const_iterator I = Pool.begin(), E = Pool.end(); I != E; | 
| 694        ++I) { | 707        ++I) { | 
| 695     typename T::IceType *Const = llvm::cast<typename T::IceType>(*I); | 708     typename T::IceType *Const = llvm::cast<typename T::IceType>(*I); | 
| 696     typename T::PrimitiveFpType Value = Const->getValue(); | 709     typename T::PrimitiveFpType Value = Const->getValue(); | 
| 697     // Use memcpy() to copy bits from Value into RawValue in a way | 710     // Use memcpy() to copy bits from Value into RawValue in a way | 
| 698     // that avoids breaking strict-aliasing rules. | 711     // that avoids breaking strict-aliasing rules. | 
| 699     typename T::PrimitiveIntType RawValue; | 712     typename T::PrimitiveIntType RawValue; | 
| 700     memcpy(&RawValue, &Value, sizeof(Value)); | 713     memcpy(&RawValue, &Value, sizeof(Value)); | 
| 701     char buf[30]; | 714     char buf[30]; | 
| 702     int CharsPrinted = | 715     int CharsPrinted = | 
| 703         snprintf(buf, llvm::array_lengthof(buf), T::PrintfString, RawValue); | 716         snprintf(buf, llvm::array_lengthof(buf), T::PrintfString, RawValue); | 
| 704     assert(CharsPrinted >= 0 && | 717     assert(CharsPrinted >= 0 && | 
| 705            (size_t)CharsPrinted < llvm::array_lengthof(buf)); | 718            (size_t)CharsPrinted < llvm::array_lengthof(buf)); | 
| 706     (void)CharsPrinted; // avoid warnings if asserts are disabled | 719     (void)CharsPrinted; // avoid warnings if asserts are disabled | 
| 707     Str << "L$" << Ty << "$" << Const->getPoolEntryID() << ":\n"; | 720     Str << "L$" << Ty << "$" << Const->getPoolEntryID() << ":\n"; | 
| 708     Str << "\t" << T::AsmTag << "\t" << buf << "\t# " << T::TypeName << " " | 721     Str << "\t" << T::AsmTag << "\t" << buf << "\t# " << T::TypeName << " " | 
| 709         << Value << "\n"; | 722         << Value << "\n"; | 
| 710   } | 723   } | 
| 711 } | 724 } | 
| 712 | 725 | 
|  | 726 void TargetX8632::emitVectorConstantPool() const { | 
|  | 727   Ostream &Str = Ctx->getStrEmit(); | 
|  | 728 | 
|  | 729   // Although the PNaCl ABI doesn't require it, all vector constants are | 
|  | 730   // aligned to 16 bytes to allow for aligned loads. | 
|  | 731   const unsigned Align = VECT128_BYTES; | 
|  | 732 | 
|  | 733   Str << "\t.section\t.rodata.cst" << Align << ",\"aM\",@progbits," << Align | 
|  | 734       << "\n"; | 
|  | 735   Str << "\t.align\t" << Align << "\n"; | 
|  | 736 | 
|  | 737   // Emit each (128 bit) vector. | 
|  | 738   // Non-I1 vectors are all in the same constant pool. | 
|  | 739   ConstantList Vectors = Ctx->getConstantPool(IceType_v8i16); | 
|  | 740   for (ConstantList::const_iterator I = Vectors.begin(), E = Vectors.end(); | 
|  | 741        I != E; ++I) { | 
|  | 742     ConstantVector *Vector = llvm::cast<ConstantVector>(*I); | 
|  | 743     Vect128 Value = Vector->getValue(); | 
|  | 744     assert(Value.size() == VECT128_BYTES); | 
|  | 745     const char *Data = Value.data(); | 
|  | 746     Str << "L$"; | 
|  | 747     emitAsmLabelForType(Str, Vector->getType()); | 
|  | 748     Str << "$" << Vector->getPoolEntryID() << ":\n"; | 
|  | 749     for (unsigned Element = 0; Element < 4; ++Element) { | 
|  | 750       uint32_t RawValue; | 
|  | 751       memcpy(&RawValue, &Data[4 * Element], 4); | 
|  | 752       char buf[30]; | 
|  | 753       int CharsPrinted = | 
|  | 754           snprintf(buf, llvm::array_lengthof(buf), "0x%x", RawValue); | 
|  | 755       assert(CharsPrinted >= 0 && | 
|  | 756              (size_t)CharsPrinted < llvm::array_lengthof(buf)); | 
|  | 757       Str << "\t" | 
|  | 758           << ".long" | 
|  | 759           << "\t" << buf << "\t" | 
|  | 760           << "\n"; | 
|  | 761     } | 
|  | 762   } | 
|  | 763 | 
|  | 764   // Emit each I1 vector expanded to a 128 bit constant. | 
|  | 765   // All I1 vectors are in the same constant pool. | 
|  | 766   ConstantList BitVectors = Ctx->getConstantPool(IceType_v4i1); | 
|  | 767   for (ConstantList::const_iterator I = BitVectors.begin(), | 
|  | 768                                     E = BitVectors.end(); | 
|  | 769        I != E; ++I) { | 
|  | 770     ConstantBitVector *BitVector = llvm::cast<ConstantBitVector>(*I); | 
|  | 771     BitVect Value = BitVector->getValue(); | 
|  | 772     Str << "L$"; | 
|  | 773     emitAsmLabelForType(Str, BitVector->getType()); | 
|  | 774     Str << "$" << BitVector->getPoolEntryID() << ":\n"; | 
|  | 775     const char *AsmString = NULL; | 
|  | 776     switch (BitVector->getType()) { | 
|  | 777     default: | 
|  | 778       llvm_unreachable("Unknown type"); | 
|  | 779     case IceType_v4i1: | 
|  | 780       AsmString = ".long"; | 
|  | 781       break; | 
|  | 782     case IceType_v8i1: | 
|  | 783       AsmString = ".short"; | 
|  | 784       break; | 
|  | 785     case IceType_v16i1: | 
|  | 786       AsmString = ".byte"; | 
|  | 787       break; | 
|  | 788     } | 
|  | 789     unsigned NumElements = Value.size(); | 
|  | 790     for (unsigned Element = 0; Element < NumElements; ++Element) { | 
|  | 791       Str << "\t" << AsmString << "\t" | 
|  | 792           << "0x"; | 
|  | 793       Str << (Value[Element] ? "1" : "0"); | 
|  | 794       Str << "\t" | 
|  | 795           << "\n"; | 
|  | 796     } | 
|  | 797   } | 
|  | 798 } | 
|  | 799 | 
| 713 void TargetX8632::emitConstants() const { | 800 void TargetX8632::emitConstants() const { | 
| 714   emitConstantPool<PoolTypeConverter<float> >(); | 801   emitScalarConstantPool<PoolTypeConverter<float> >(); | 
| 715   emitConstantPool<PoolTypeConverter<double> >(); | 802   emitScalarConstantPool<PoolTypeConverter<double> >(); | 
|  | 803   emitVectorConstantPool(); | 
| 716 | 804 | 
| 717   // No need to emit constants from the int pool since (for x86) they | 805   // No need to emit constants from the int pool since (for x86) they | 
| 718   // are embedded as immediates in the instructions. | 806   // are embedded as immediates in the instructions. | 
| 719 } | 807 } | 
| 720 | 808 | 
| 721 void TargetX8632::split64(Variable *Var) { | 809 void TargetX8632::split64(Variable *Var) { | 
| 722   switch (Var->getType()) { | 810   switch (Var->getType()) { | 
| 723   default: | 811   default: | 
| 724     return; | 812     return; | 
| 725   case IceType_i64: | 813   case IceType_i64: | 
| (...skipping 564 matching lines...) Expand 10 before | Expand all | Expand 10 after  Loading... | 
| 1290     } | 1378     } | 
| 1291     StackOffset += typeWidthInBytesOnStack(Arg->getType()); | 1379     StackOffset += typeWidthInBytesOnStack(Arg->getType()); | 
| 1292   } | 1380   } | 
| 1293   // Generate the call instruction.  Assign its result to a temporary | 1381   // Generate the call instruction.  Assign its result to a temporary | 
| 1294   // with high register allocation weight. | 1382   // with high register allocation weight. | 
| 1295   Variable *Dest = Instr->getDest(); | 1383   Variable *Dest = Instr->getDest(); | 
| 1296   Variable *eax = NULL; // doubles as RegLo as necessary | 1384   Variable *eax = NULL; // doubles as RegLo as necessary | 
| 1297   Variable *edx = NULL; | 1385   Variable *edx = NULL; | 
| 1298   if (Dest) { | 1386   if (Dest) { | 
| 1299     switch (Dest->getType()) { | 1387     switch (Dest->getType()) { | 
|  | 1388     case IceType_v4i1: | 
|  | 1389     case IceType_v8i1: | 
|  | 1390     case IceType_v16i1: | 
|  | 1391     case IceType_v16i8: | 
|  | 1392     case IceType_v8i16: | 
|  | 1393     case IceType_v4i32: | 
|  | 1394     case IceType_v4f32: | 
| 1300     case IceType_NUM: | 1395     case IceType_NUM: | 
| 1301       llvm_unreachable("Invalid Call dest type"); | 1396       llvm_unreachable("Invalid Call dest type"); | 
| 1302       break; | 1397       break; | 
| 1303     case IceType_void: | 1398     case IceType_void: | 
| 1304       break; | 1399       break; | 
| 1305     case IceType_i1: | 1400     case IceType_i1: | 
| 1306     case IceType_i8: | 1401     case IceType_i8: | 
| 1307     case IceType_i16: | 1402     case IceType_i16: | 
| 1308     case IceType_i32: | 1403     case IceType_i32: | 
| 1309       eax = makeReg(Dest->getType(), Reg_eax); | 1404       eax = makeReg(Dest->getType(), Reg_eax); | 
| (...skipping 954 matching lines...) Expand 10 before | Expand all | Expand 10 after  Loading... | 
| 2264   if (Inst->hasRetValue()) { | 2359   if (Inst->hasRetValue()) { | 
| 2265     Operand *Src0 = legalize(Inst->getRetValue()); | 2360     Operand *Src0 = legalize(Inst->getRetValue()); | 
| 2266     if (Src0->getType() == IceType_i64) { | 2361     if (Src0->getType() == IceType_i64) { | 
| 2267       Variable *eax = legalizeToVar(loOperand(Src0), false, Reg_eax); | 2362       Variable *eax = legalizeToVar(loOperand(Src0), false, Reg_eax); | 
| 2268       Variable *edx = legalizeToVar(hiOperand(Src0), false, Reg_edx); | 2363       Variable *edx = legalizeToVar(hiOperand(Src0), false, Reg_edx); | 
| 2269       Reg = eax; | 2364       Reg = eax; | 
| 2270       Context.insert(InstFakeUse::create(Func, edx)); | 2365       Context.insert(InstFakeUse::create(Func, edx)); | 
| 2271     } else if (Src0->getType() == IceType_f32 || | 2366     } else if (Src0->getType() == IceType_f32 || | 
| 2272                Src0->getType() == IceType_f64) { | 2367                Src0->getType() == IceType_f64) { | 
| 2273       _fld(Src0); | 2368       _fld(Src0); | 
|  | 2369     } else if (isVectorType(Src0->getType())) { | 
|  | 2370       Reg = legalizeToVar(Src0, false, Reg_xmm0); | 
| 2274     } else { | 2371     } else { | 
| 2275       _mov(Reg, Src0, Reg_eax); | 2372       _mov(Reg, Src0, Reg_eax); | 
| 2276     } | 2373     } | 
| 2277   } | 2374   } | 
| 2278   _ret(Reg); | 2375   _ret(Reg); | 
| 2279   // Add a fake use of esp to make sure esp stays alive for the entire | 2376   // Add a fake use of esp to make sure esp stays alive for the entire | 
| 2280   // function.  Otherwise post-call esp adjustments get dead-code | 2377   // function.  Otherwise post-call esp adjustments get dead-code | 
| 2281   // eliminated.  TODO: Are there more places where the fake use | 2378   // eliminated.  TODO: Are there more places where the fake use | 
| 2282   // should be inserted?  E.g. "void f(int n){while(1) g(n);}" may not | 2379   // should be inserted?  E.g. "void f(int n){while(1) g(n);}" may not | 
| 2283   // have a ret instruction. | 2380   // have a ret instruction. | 
| (...skipping 101 matching lines...) Expand 10 before | Expand all | Expand 10 after  Loading... | 
| 2385   _br(Inst->getLabelDefault()); | 2482   _br(Inst->getLabelDefault()); | 
| 2386 } | 2483 } | 
| 2387 | 2484 | 
| 2388 void TargetX8632::lowerUnreachable(const InstUnreachable * /*Inst*/) { | 2485 void TargetX8632::lowerUnreachable(const InstUnreachable * /*Inst*/) { | 
| 2389   const SizeT MaxSrcs = 0; | 2486   const SizeT MaxSrcs = 0; | 
| 2390   Variable *Dest = NULL; | 2487   Variable *Dest = NULL; | 
| 2391   InstCall *Call = makeHelperCall("ice_unreachable", Dest, MaxSrcs); | 2488   InstCall *Call = makeHelperCall("ice_unreachable", Dest, MaxSrcs); | 
| 2392   lowerCall(Call); | 2489   lowerCall(Call); | 
| 2393 } | 2490 } | 
| 2394 | 2491 | 
|  | 2492 // Helper for legalize() to emit the right code to lower an operand to a | 
|  | 2493 // register of the appropriate type. | 
|  | 2494 Variable *TargetX8632::copyToReg(Operand *Src, int32_t RegNum) { | 
|  | 2495   Type Ty = Src->getType(); | 
|  | 2496   Variable *Reg = makeReg(Ty, RegNum); | 
|  | 2497   if (isVectorType(Src->getType())) { | 
|  | 2498     _movp(Reg, Src); | 
|  | 2499   } else { | 
|  | 2500     _mov(Reg, Src); | 
|  | 2501   } | 
|  | 2502   return Reg; | 
|  | 2503 } | 
|  | 2504 | 
| 2395 Operand *TargetX8632::legalize(Operand *From, LegalMask Allowed, | 2505 Operand *TargetX8632::legalize(Operand *From, LegalMask Allowed, | 
| 2396                                bool AllowOverlap, int32_t RegNum) { | 2506                                bool AllowOverlap, int32_t RegNum) { | 
| 2397   // Assert that a physical register is allowed.  To date, all calls | 2507   // Assert that a physical register is allowed.  To date, all calls | 
| 2398   // to legalize() allow a physical register.  If a physical register | 2508   // to legalize() allow a physical register.  If a physical register | 
| 2399   // needs to be explicitly disallowed, then new code will need to be | 2509   // needs to be explicitly disallowed, then new code will need to be | 
| 2400   // written to force a spill. | 2510   // written to force a spill. | 
| 2401   assert(Allowed & Legal_Reg); | 2511   assert(Allowed & Legal_Reg); | 
| 2402   // If we're asking for a specific physical register, make sure we're | 2512   // If we're asking for a specific physical register, make sure we're | 
| 2403   // not allowing any other operand kinds.  (This could be future | 2513   // not allowing any other operand kinds.  (This could be future | 
| 2404   // work, e.g. allow the shl shift amount to be either an immediate | 2514   // work, e.g. allow the shl shift amount to be either an immediate | 
| (...skipping 12 matching lines...) Expand all  Loading... | 
| 2417     if (Index) { | 2527     if (Index) { | 
| 2418       RegIndex = legalizeToVar(Index, true); | 2528       RegIndex = legalizeToVar(Index, true); | 
| 2419     } | 2529     } | 
| 2420     if (Base != RegBase || Index != RegIndex) { | 2530     if (Base != RegBase || Index != RegIndex) { | 
| 2421       From = OperandX8632Mem::create( | 2531       From = OperandX8632Mem::create( | 
| 2422           Func, Mem->getType(), RegBase, Mem->getOffset(), RegIndex, | 2532           Func, Mem->getType(), RegBase, Mem->getOffset(), RegIndex, | 
| 2423           Mem->getShift(), Mem->getSegmentRegister()); | 2533           Mem->getShift(), Mem->getSegmentRegister()); | 
| 2424     } | 2534     } | 
| 2425 | 2535 | 
| 2426     if (!(Allowed & Legal_Mem)) { | 2536     if (!(Allowed & Legal_Mem)) { | 
| 2427       Variable *Reg = makeReg(From->getType(), RegNum); | 2537       From = copyToReg(From, RegNum); | 
| 2428       _mov(Reg, From, RegNum); |  | 
| 2429       From = Reg; |  | 
| 2430     } | 2538     } | 
| 2431     return From; | 2539     return From; | 
| 2432   } | 2540   } | 
| 2433   if (llvm::isa<Constant>(From)) { | 2541   if (llvm::isa<Constant>(From)) { | 
| 2434     if (llvm::isa<ConstantUndef>(From)) { | 2542     if (llvm::isa<ConstantUndef>(From)) { | 
| 2435       // Lower undefs to zero.  Another option is to lower undefs to an | 2543       // Lower undefs to zero.  Another option is to lower undefs to an | 
| 2436       // uninitialized register; however, using an uninitialized register | 2544       // uninitialized register; however, using an uninitialized register | 
| 2437       // results in less predictable code. | 2545       // results in less predictable code. | 
| 2438       // | 2546       // | 
| 2439       // If in the future the implementation is changed to lower undef | 2547       // If in the future the implementation is changed to lower undef | 
| 2440       // values to uninitialized registers, a FakeDef will be needed: | 2548       // values to uninitialized registers, a FakeDef will be needed: | 
| 2441       //     Context.insert(InstFakeDef::create(Func, Reg)); | 2549       //     Context.insert(InstFakeDef::create(Func, Reg)); | 
| 2442       // This is in order to ensure that the live range of Reg is not | 2550       // This is in order to ensure that the live range of Reg is not | 
| 2443       // overestimated.  If the constant being lowered is a 64 bit value, | 2551       // overestimated.  If the constant being lowered is a 64 bit value, | 
| 2444       // then the result should be split and the lo and hi components will | 2552       // then the result should be split and the lo and hi components will | 
| 2445       // need to go in uninitialized registers. | 2553       // need to go in uninitialized registers. | 
| 2446       From = Ctx->getConstantZero(From->getType()); | 2554       From = Ctx->getConstantZero(From->getType()); | 
| 2447     } | 2555     } | 
| 2448     bool NeedsReg = | 2556     bool NeedsReg = | 
| 2449         !(Allowed & Legal_Imm) || | 2557         !(Allowed & Legal_Imm) || | 
| 2450         // ConstantFloat and ConstantDouble are actually memory operands. | 2558         // ConstantFloat, ConstantDouble, and vector constants are | 
|  | 2559         // actually memory operands. | 
| 2451         (!(Allowed & Legal_Mem) && | 2560         (!(Allowed & Legal_Mem) && | 
| 2452          (From->getType() == IceType_f32 || From->getType() == IceType_f64)); | 2561          (From->getType() == IceType_f32 || From->getType() == IceType_f64 || | 
|  | 2562           isVectorType(From->getType()))); | 
| 2453     if (NeedsReg) { | 2563     if (NeedsReg) { | 
| 2454       Variable *Reg = makeReg(From->getType(), RegNum); | 2564       From = copyToReg(From, RegNum); | 
| 2455       _mov(Reg, From); |  | 
| 2456       From = Reg; |  | 
| 2457     } | 2565     } | 
| 2458     return From; | 2566     return From; | 
| 2459   } | 2567   } | 
| 2460   if (Variable *Var = llvm::dyn_cast<Variable>(From)) { | 2568   if (Variable *Var = llvm::dyn_cast<Variable>(From)) { | 
| 2461     // We need a new physical register for the operand if: | 2569     // We need a new physical register for the operand if: | 
| 2462     //   Mem is not allowed and Var->getRegNum() is unknown, or | 2570     //   Mem is not allowed and Var->getRegNum() is unknown, or | 
| 2463     //   RegNum is required and Var->getRegNum() doesn't match. | 2571     //   RegNum is required and Var->getRegNum() doesn't match. | 
| 2464     if ((!(Allowed & Legal_Mem) && !Var->hasReg()) || | 2572     if ((!(Allowed & Legal_Mem) && !Var->hasReg()) || | 
| 2465         (RegNum != Variable::NoRegister && RegNum != Var->getRegNum())) { | 2573         (RegNum != Variable::NoRegister && RegNum != Var->getRegNum())) { | 
| 2466       Variable *Reg = makeReg(From->getType(), RegNum); | 2574       Variable *Reg = copyToReg(From, RegNum); | 
| 2467       if (RegNum == Variable::NoRegister) { | 2575       if (RegNum == Variable::NoRegister) { | 
| 2468         Reg->setPreferredRegister(Var, AllowOverlap); | 2576         Reg->setPreferredRegister(Var, AllowOverlap); | 
| 2469       } | 2577       } | 
| 2470       _mov(Reg, From); |  | 
| 2471       From = Reg; | 2578       From = Reg; | 
| 2472     } | 2579     } | 
| 2473     return From; | 2580     return From; | 
| 2474   } | 2581   } | 
| 2475   llvm_unreachable("Unhandled operand kind in legalize()"); | 2582   llvm_unreachable("Unhandled operand kind in legalize()"); | 
| 2476   return From; | 2583   return From; | 
| 2477 } | 2584 } | 
| 2478 | 2585 | 
| 2479 // Provide a trivial wrapper to legalize() for this common usage. | 2586 // Provide a trivial wrapper to legalize() for this common usage. | 
| 2480 Variable *TargetX8632::legalizeToVar(Operand *From, bool AllowOverlap, | 2587 Variable *TargetX8632::legalizeToVar(Operand *From, bool AllowOverlap, | 
| (...skipping 81 matching lines...) Expand 10 before | Expand all | Expand 10 after  Loading... | 
| 2562         } | 2669         } | 
| 2563         assert(AvailableTypedRegisters.any()); | 2670         assert(AvailableTypedRegisters.any()); | 
| 2564         int32_t RegNum = AvailableTypedRegisters.find_first(); | 2671         int32_t RegNum = AvailableTypedRegisters.find_first(); | 
| 2565         Var->setRegNum(RegNum); | 2672         Var->setRegNum(RegNum); | 
| 2566         AvailableRegisters[RegNum] = false; | 2673         AvailableRegisters[RegNum] = false; | 
| 2567       } | 2674       } | 
| 2568     } | 2675     } | 
| 2569   } | 2676   } | 
| 2570 } | 2677 } | 
| 2571 | 2678 | 
|  | 2679 template <> void ConstantInteger::emit(GlobalContext *Ctx) const { | 
|  | 2680   Ostream &Str = Ctx->getStrEmit(); | 
|  | 2681   Str << getValue(); | 
|  | 2682 } | 
|  | 2683 | 
| 2572 template <> void ConstantFloat::emit(GlobalContext *Ctx) const { | 2684 template <> void ConstantFloat::emit(GlobalContext *Ctx) const { | 
| 2573   Ostream &Str = Ctx->getStrEmit(); | 2685   Ostream &Str = Ctx->getStrEmit(); | 
| 2574   // It would be better to prefix with ".L$" instead of "L$", but | 2686   // It would be better to prefix with ".L$" instead of "L$", but | 
| 2575   // llvm-mc doesn't parse "dword ptr [.L$foo]". | 2687   // llvm-mc doesn't parse "dword ptr [.L$foo]". | 
| 2576   Str << "dword ptr [L$" << IceType_f32 << "$" << getPoolEntryID() << "]"; | 2688   Str << "dword ptr [L$" << IceType_f32 << "$" << getPoolEntryID() << "]"; | 
| 2577 } | 2689 } | 
| 2578 | 2690 | 
| 2579 template <> void ConstantDouble::emit(GlobalContext *Ctx) const { | 2691 template <> void ConstantDouble::emit(GlobalContext *Ctx) const { | 
| 2580   Ostream &Str = Ctx->getStrEmit(); | 2692   Ostream &Str = Ctx->getStrEmit(); | 
| 2581   Str << "qword ptr [L$" << IceType_f64 << "$" << getPoolEntryID() << "]"; | 2693   Str << "qword ptr [L$" << IceType_f64 << "$" << getPoolEntryID() << "]"; | 
| 2582 } | 2694 } | 
| 2583 | 2695 | 
|  | 2696 template <> void ConstantVector::emit(GlobalContext *Ctx) const { | 
|  | 2697   Ostream &Str = Ctx->getStrEmit(); | 
|  | 2698   Str << "xmmword ptr [L$"; | 
|  | 2699   emitAsmLabelForType(Str, getType()); | 
|  | 2700   Str << "$" << getPoolEntryID() << "]"; | 
|  | 2701 } | 
|  | 2702 | 
|  | 2703 template <> void ConstantBitVector::emit(GlobalContext *Ctx) const { | 
|  | 2704   Ostream &Str = Ctx->getStrEmit(); | 
|  | 2705   Str << "xmmword ptr [L$"; | 
|  | 2706   emitAsmLabelForType(Str, getType()); | 
|  | 2707   Str << "$" << getPoolEntryID() << "]"; | 
|  | 2708 } | 
|  | 2709 | 
| 2584 } // end of namespace Ice | 2710 } // end of namespace Ice | 
| OLD | NEW | 
|---|