OLD | NEW |
---|---|
1 //===- subzero/src/IceTargetLoweringARM32.cpp - ARM32 lowering ------------===// | 1 //===- subzero/src/IceTargetLoweringARM32.cpp - ARM32 lowering ------------===// |
2 // | 2 // |
3 // The Subzero Code Generator | 3 // The Subzero Code Generator |
4 // | 4 // |
5 // This file is distributed under the University of Illinois Open Source | 5 // This file is distributed under the University of Illinois Open Source |
6 // License. See LICENSE.TXT for details. | 6 // License. See LICENSE.TXT for details. |
7 // | 7 // |
8 //===----------------------------------------------------------------------===// | 8 //===----------------------------------------------------------------------===// |
9 /// | 9 /// |
10 /// \file | 10 /// \file |
(...skipping 280 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... | |
291 | 291 |
292 void TargetARM32::staticInit(GlobalContext *Ctx) { | 292 void TargetARM32::staticInit(GlobalContext *Ctx) { |
293 | 293 |
294 // Limit this size (or do all bitsets need to be the same width)??? | 294 // Limit this size (or do all bitsets need to be the same width)??? |
295 llvm::SmallBitVector IntegerRegisters(RegARM32::Reg_NUM); | 295 llvm::SmallBitVector IntegerRegisters(RegARM32::Reg_NUM); |
296 llvm::SmallBitVector I64PairRegisters(RegARM32::Reg_NUM); | 296 llvm::SmallBitVector I64PairRegisters(RegARM32::Reg_NUM); |
297 llvm::SmallBitVector Float32Registers(RegARM32::Reg_NUM); | 297 llvm::SmallBitVector Float32Registers(RegARM32::Reg_NUM); |
298 llvm::SmallBitVector Float64Registers(RegARM32::Reg_NUM); | 298 llvm::SmallBitVector Float64Registers(RegARM32::Reg_NUM); |
299 llvm::SmallBitVector VectorRegisters(RegARM32::Reg_NUM); | 299 llvm::SmallBitVector VectorRegisters(RegARM32::Reg_NUM); |
300 llvm::SmallBitVector InvalidRegisters(RegARM32::Reg_NUM); | 300 llvm::SmallBitVector InvalidRegisters(RegARM32::Reg_NUM); |
301 llvm::SmallBitVector QtoSRegisters(RegARM32::Reg_NUM); | |
Jim Stichnoth
2016/02/03 15:28:37
I would list this before InvalidRegisters.
Eric Holk
2016/02/03 21:02:22
Done.
| |
301 for (int i = 0; i < RegARM32::Reg_NUM; ++i) { | 302 for (int i = 0; i < RegARM32::Reg_NUM; ++i) { |
302 const auto &Entry = RegARM32::RegTable[i]; | 303 const auto &Entry = RegARM32::RegTable[i]; |
303 IntegerRegisters[i] = Entry.IsInt; | 304 IntegerRegisters[i] = Entry.IsInt; |
304 I64PairRegisters[i] = Entry.IsI64Pair; | 305 I64PairRegisters[i] = Entry.IsI64Pair; |
305 Float32Registers[i] = Entry.IsFP32; | 306 Float32Registers[i] = Entry.IsFP32; |
306 Float64Registers[i] = Entry.IsFP64; | 307 Float64Registers[i] = Entry.IsFP64; |
307 VectorRegisters[i] = Entry.IsVec128; | 308 VectorRegisters[i] = Entry.IsVec128; |
308 RegisterAliases[i].resize(RegARM32::Reg_NUM); | 309 RegisterAliases[i].resize(RegARM32::Reg_NUM); |
310 QtoSRegisters[i] = Entry.IsVec128 && i < RegARM32::Reg_q8; | |
309 for (int j = 0; j < Entry.NumAliases; ++j) { | 311 for (int j = 0; j < Entry.NumAliases; ++j) { |
310 assert(i == j || !RegisterAliases[i][Entry.Aliases[j]]); | 312 assert(i == j || !RegisterAliases[i][Entry.Aliases[j]]); |
311 RegisterAliases[i].set(Entry.Aliases[j]); | 313 RegisterAliases[i].set(Entry.Aliases[j]); |
312 } | 314 } |
313 assert(RegisterAliases[i][i]); | 315 assert(RegisterAliases[i][i]); |
314 if (Entry.CCArg <= 0) { | 316 if (Entry.CCArg <= 0) { |
315 continue; | 317 continue; |
316 } | 318 } |
317 if (Entry.IsGPR) { | 319 if (Entry.IsGPR) { |
318 GPRArgInitializer[Entry.CCArg - 1] = i; | 320 GPRArgInitializer[Entry.CCArg - 1] = i; |
(...skipping 15 matching lines...) Expand all Loading... | |
334 TypeToRegisterSet[IceType_i64] = I64PairRegisters; | 336 TypeToRegisterSet[IceType_i64] = I64PairRegisters; |
335 TypeToRegisterSet[IceType_f32] = Float32Registers; | 337 TypeToRegisterSet[IceType_f32] = Float32Registers; |
336 TypeToRegisterSet[IceType_f64] = Float64Registers; | 338 TypeToRegisterSet[IceType_f64] = Float64Registers; |
337 TypeToRegisterSet[IceType_v4i1] = VectorRegisters; | 339 TypeToRegisterSet[IceType_v4i1] = VectorRegisters; |
338 TypeToRegisterSet[IceType_v8i1] = VectorRegisters; | 340 TypeToRegisterSet[IceType_v8i1] = VectorRegisters; |
339 TypeToRegisterSet[IceType_v16i1] = VectorRegisters; | 341 TypeToRegisterSet[IceType_v16i1] = VectorRegisters; |
340 TypeToRegisterSet[IceType_v16i8] = VectorRegisters; | 342 TypeToRegisterSet[IceType_v16i8] = VectorRegisters; |
341 TypeToRegisterSet[IceType_v8i16] = VectorRegisters; | 343 TypeToRegisterSet[IceType_v8i16] = VectorRegisters; |
342 TypeToRegisterSet[IceType_v4i32] = VectorRegisters; | 344 TypeToRegisterSet[IceType_v4i32] = VectorRegisters; |
343 TypeToRegisterSet[IceType_v4f32] = VectorRegisters; | 345 TypeToRegisterSet[IceType_v4f32] = VectorRegisters; |
346 TypeToRegisterSet[RegARM32::RCARM32_QtoS] = QtoSRegisters; | |
344 | 347 |
345 for (size_t i = 0; i < llvm::array_lengthof(TypeToRegisterSet); ++i) | 348 for (size_t i = 0; i < llvm::array_lengthof(TypeToRegisterSet); ++i) |
346 TypeToRegisterSetUnfiltered[i] = TypeToRegisterSet[i]; | 349 TypeToRegisterSetUnfiltered[i] = TypeToRegisterSet[i]; |
347 | 350 |
348 filterTypeToRegisterSet( | 351 filterTypeToRegisterSet( |
349 Ctx, RegARM32::Reg_NUM, TypeToRegisterSet, | 352 Ctx, RegARM32::Reg_NUM, TypeToRegisterSet, |
350 llvm::array_lengthof(TypeToRegisterSet), [](int32_t RegNum) -> IceString { | 353 llvm::array_lengthof(TypeToRegisterSet), [](int32_t RegNum) -> IceString { |
351 // This function simply removes ", " from the register name. | 354 // This function simply removes ", " from the register name. |
352 IceString Name = RegARM32::getRegName(RegNum); | 355 IceString Name = RegARM32::getRegName(RegNum); |
353 constexpr const char RegSeparator[] = ", "; | 356 constexpr const char RegSeparator[] = ", "; |
(...skipping 3469 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... | |
3823 case IceType_v4i32: { | 3826 case IceType_v4i32: { |
3824 UnimplementedLoweringError(this, Inst); | 3827 UnimplementedLoweringError(this, Inst); |
3825 break; | 3828 break; |
3826 } | 3829 } |
3827 } | 3830 } |
3828 break; | 3831 break; |
3829 } | 3832 } |
3830 } | 3833 } |
3831 } | 3834 } |
3832 | 3835 |
3833 void TargetARM32::lowerExtractElement(const InstExtractElement *Inst) { | 3836 void TargetARM32::lowerExtractElement(const InstExtractElement *Instr) { |
3834 UnimplementedLoweringError(this, Inst); | 3837 Variable *Dest = Instr->getDest(); |
3838 auto DestTy = Dest->getType(); | |
3839 | |
3840 if (Dest->isRematerializable()) { | |
3841 Context.insert<InstFakeDef>(Dest); | |
Jim Stichnoth
2016/02/03 15:28:37
Maybe I haven't thought this through well enough,
John
2016/02/03 16:06:51
Yup, this is wrong. You have to handle these (whic
| |
3842 return; | |
3843 } | |
3844 | |
3845 Variable *Src0 = legalizeToReg(Instr->getSrc(0)); | |
Jim Stichnoth
2016/02/03 15:28:38
Optional: It would be nice if InstExtractElement h
| |
3846 Operand *Src1 = Instr->getSrc(1); | |
3847 | |
3848 if (const auto *Imm = llvm::dyn_cast<ConstantInteger32>(Src1)) { | |
3849 auto Index = Imm->getValue(); | |
3850 Variable *T = makeReg(DestTy); | |
3851 | |
3852 if (isFloatingType(DestTy)) { | |
3853 // We need to make sure the source is in a suitable register. | |
3854 Src0->setRegClass(RegARM32::RCARM32_QtoS); | |
Jim Stichnoth
2016/02/03 15:28:38
It's possible (though unlikely) that legalizeToReg
Eric Holk
2016/02/03 21:02:22
Done.
| |
3855 } | |
3856 | |
3857 _extract(T, Src0, Index); | |
3858 _mov(Dest, T); | |
3859 return; | |
3860 } else { | |
3861 assert(false && "extract requires a constant index"); | |
Jim Stichnoth
2016/02/03 15:28:38
s/extract/extractelement
would make a more instant
Eric Holk
2016/02/03 21:02:21
Done.
| |
3862 } | |
3835 } | 3863 } |
3836 | 3864 |
3837 namespace { | 3865 namespace { |
3838 // Validates FCMPARM32_TABLE's declaration w.r.t. InstFcmp::FCondition ordering | 3866 // Validates FCMPARM32_TABLE's declaration w.r.t. InstFcmp::FCondition ordering |
3839 // (and naming). | 3867 // (and naming). |
3840 enum { | 3868 enum { |
3841 #define X(val, CC0, CC1) _fcmp_ll_##val, | 3869 #define X(val, CC0, CC1) _fcmp_ll_##val, |
3842 FCMPARM32_TABLE | 3870 FCMPARM32_TABLE |
3843 #undef X | 3871 #undef X |
3844 _fcmp_ll_NUM | 3872 _fcmp_ll_NUM |
(...skipping 373 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... | |
4218 _mov(T, _0); | 4246 _mov(T, _0); |
4219 CondWhenTrue Cond = lowerIcmpCond(Inst); | 4247 CondWhenTrue Cond = lowerIcmpCond(Inst); |
4220 _mov_redefined(T, _1, Cond.WhenTrue0); | 4248 _mov_redefined(T, _1, Cond.WhenTrue0); |
4221 _mov(Dest, T); | 4249 _mov(Dest, T); |
4222 | 4250 |
4223 assert(Cond.WhenTrue1 == CondARM32::kNone); | 4251 assert(Cond.WhenTrue1 == CondARM32::kNone); |
4224 | 4252 |
4225 return; | 4253 return; |
4226 } | 4254 } |
4227 | 4255 |
4228 void TargetARM32::lowerInsertElement(const InstInsertElement *Inst) { | 4256 void TargetARM32::lowerInsertElement(const InstInsertElement *Instr) { |
4229 UnimplementedLoweringError(this, Inst); | 4257 Variable *Dest = Instr->getDest(); |
4258 auto DestTy = Dest->getType(); | |
4259 | |
4260 if (Dest->isRematerializable()) { | |
4261 Context.insert<InstFakeDef>(Dest); | |
4262 return; | |
4263 } | |
4264 | |
4265 Variable *Src0 = legalizeToReg(Instr->getSrc(0)); | |
4266 Variable *Src1 = legalizeToReg(Instr->getSrc(1)); | |
4267 Operand *Src2 = Instr->getSrc(2); | |
4268 | |
4269 if (const auto *Imm = llvm::dyn_cast<ConstantInteger32>(Src2)) { | |
4270 auto Index = Imm->getValue(); | |
4271 Variable *T = makeReg(DestTy); | |
4272 | |
4273 if (isFloatingType(DestTy)) { | |
4274 T->setRegClass(RegARM32::RCARM32_QtoS); | |
4275 } | |
4276 | |
4277 _mov(T, Src0); | |
4278 _insert(T, Src1, Index); | |
4279 _set_dest_redefined(); | |
4280 _mov(Dest, T); | |
4281 return; | |
4282 } | |
4283 assert(false && "insert requires a constant index"); | |
4230 } | 4284 } |
4231 | 4285 |
4232 namespace { | 4286 namespace { |
4233 inline uint64_t getConstantMemoryOrder(Operand *Opnd) { | 4287 inline uint64_t getConstantMemoryOrder(Operand *Opnd) { |
4234 if (auto *Integer = llvm::dyn_cast<ConstantInteger32>(Opnd)) | 4288 if (auto *Integer = llvm::dyn_cast<ConstantInteger32>(Opnd)) |
4235 return Integer->getValue(); | 4289 return Integer->getValue(); |
4236 return Intrinsics::MemoryOrderInvalid; | 4290 return Intrinsics::MemoryOrderInvalid; |
4237 } | 4291 } |
4238 } // end of anonymous namespace | 4292 } // end of anonymous namespace |
4239 | 4293 |
(...skipping 2276 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... | |
6516 Str << ".eabi_attribute 14, 3 @ Tag_ABI_PCS_R9_use: Not used\n"; | 6570 Str << ".eabi_attribute 14, 3 @ Tag_ABI_PCS_R9_use: Not used\n"; |
6517 } | 6571 } |
6518 | 6572 |
6519 llvm::SmallBitVector TargetARM32::TypeToRegisterSet[RegARM32::RCARM32_NUM]; | 6573 llvm::SmallBitVector TargetARM32::TypeToRegisterSet[RegARM32::RCARM32_NUM]; |
6520 llvm::SmallBitVector | 6574 llvm::SmallBitVector |
6521 TargetARM32::TypeToRegisterSetUnfiltered[RegARM32::RCARM32_NUM]; | 6575 TargetARM32::TypeToRegisterSetUnfiltered[RegARM32::RCARM32_NUM]; |
6522 llvm::SmallBitVector TargetARM32::RegisterAliases[RegARM32::Reg_NUM]; | 6576 llvm::SmallBitVector TargetARM32::RegisterAliases[RegARM32::Reg_NUM]; |
6523 | 6577 |
6524 } // end of namespace ARM32 | 6578 } // end of namespace ARM32 |
6525 } // end of namespace Ice | 6579 } // end of namespace Ice |
OLD | NEW |