Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(9)

Side by Side Diff: src/IceTargetLoweringARM32.cpp

Issue 1655313002: Subzero: ARM32: lowering of vector insert and extract. (Closed) Base URL: https://chromium.googlesource.com/native_client/pnacl-subzero.git@master
Patch Set: Created 4 years, 10 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View unified diff | Download patch
OLDNEW
1 //===- subzero/src/IceTargetLoweringARM32.cpp - ARM32 lowering ------------===// 1 //===- subzero/src/IceTargetLoweringARM32.cpp - ARM32 lowering ------------===//
2 // 2 //
3 // The Subzero Code Generator 3 // The Subzero Code Generator
4 // 4 //
5 // This file is distributed under the University of Illinois Open Source 5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details. 6 // License. See LICENSE.TXT for details.
7 // 7 //
8 //===----------------------------------------------------------------------===// 8 //===----------------------------------------------------------------------===//
9 /// 9 ///
10 /// \file 10 /// \file
(...skipping 280 matching lines...) Expand 10 before | Expand all | Expand 10 after
291 291
292 void TargetARM32::staticInit(GlobalContext *Ctx) { 292 void TargetARM32::staticInit(GlobalContext *Ctx) {
293 293
294 // Limit this size (or do all bitsets need to be the same width)??? 294 // Limit this size (or do all bitsets need to be the same width)???
295 llvm::SmallBitVector IntegerRegisters(RegARM32::Reg_NUM); 295 llvm::SmallBitVector IntegerRegisters(RegARM32::Reg_NUM);
296 llvm::SmallBitVector I64PairRegisters(RegARM32::Reg_NUM); 296 llvm::SmallBitVector I64PairRegisters(RegARM32::Reg_NUM);
297 llvm::SmallBitVector Float32Registers(RegARM32::Reg_NUM); 297 llvm::SmallBitVector Float32Registers(RegARM32::Reg_NUM);
298 llvm::SmallBitVector Float64Registers(RegARM32::Reg_NUM); 298 llvm::SmallBitVector Float64Registers(RegARM32::Reg_NUM);
299 llvm::SmallBitVector VectorRegisters(RegARM32::Reg_NUM); 299 llvm::SmallBitVector VectorRegisters(RegARM32::Reg_NUM);
300 llvm::SmallBitVector InvalidRegisters(RegARM32::Reg_NUM); 300 llvm::SmallBitVector InvalidRegisters(RegARM32::Reg_NUM);
301 llvm::SmallBitVector QtoSRegisters(RegARM32::Reg_NUM);
Jim Stichnoth 2016/02/03 15:28:37 I would list this before InvalidRegisters.
Eric Holk 2016/02/03 21:02:22 Done.
301 for (int i = 0; i < RegARM32::Reg_NUM; ++i) { 302 for (int i = 0; i < RegARM32::Reg_NUM; ++i) {
302 const auto &Entry = RegARM32::RegTable[i]; 303 const auto &Entry = RegARM32::RegTable[i];
303 IntegerRegisters[i] = Entry.IsInt; 304 IntegerRegisters[i] = Entry.IsInt;
304 I64PairRegisters[i] = Entry.IsI64Pair; 305 I64PairRegisters[i] = Entry.IsI64Pair;
305 Float32Registers[i] = Entry.IsFP32; 306 Float32Registers[i] = Entry.IsFP32;
306 Float64Registers[i] = Entry.IsFP64; 307 Float64Registers[i] = Entry.IsFP64;
307 VectorRegisters[i] = Entry.IsVec128; 308 VectorRegisters[i] = Entry.IsVec128;
308 RegisterAliases[i].resize(RegARM32::Reg_NUM); 309 RegisterAliases[i].resize(RegARM32::Reg_NUM);
310 QtoSRegisters[i] = Entry.IsVec128 && i < RegARM32::Reg_q8;
309 for (int j = 0; j < Entry.NumAliases; ++j) { 311 for (int j = 0; j < Entry.NumAliases; ++j) {
310 assert(i == j || !RegisterAliases[i][Entry.Aliases[j]]); 312 assert(i == j || !RegisterAliases[i][Entry.Aliases[j]]);
311 RegisterAliases[i].set(Entry.Aliases[j]); 313 RegisterAliases[i].set(Entry.Aliases[j]);
312 } 314 }
313 assert(RegisterAliases[i][i]); 315 assert(RegisterAliases[i][i]);
314 if (Entry.CCArg <= 0) { 316 if (Entry.CCArg <= 0) {
315 continue; 317 continue;
316 } 318 }
317 if (Entry.IsGPR) { 319 if (Entry.IsGPR) {
318 GPRArgInitializer[Entry.CCArg - 1] = i; 320 GPRArgInitializer[Entry.CCArg - 1] = i;
(...skipping 15 matching lines...) Expand all
334 TypeToRegisterSet[IceType_i64] = I64PairRegisters; 336 TypeToRegisterSet[IceType_i64] = I64PairRegisters;
335 TypeToRegisterSet[IceType_f32] = Float32Registers; 337 TypeToRegisterSet[IceType_f32] = Float32Registers;
336 TypeToRegisterSet[IceType_f64] = Float64Registers; 338 TypeToRegisterSet[IceType_f64] = Float64Registers;
337 TypeToRegisterSet[IceType_v4i1] = VectorRegisters; 339 TypeToRegisterSet[IceType_v4i1] = VectorRegisters;
338 TypeToRegisterSet[IceType_v8i1] = VectorRegisters; 340 TypeToRegisterSet[IceType_v8i1] = VectorRegisters;
339 TypeToRegisterSet[IceType_v16i1] = VectorRegisters; 341 TypeToRegisterSet[IceType_v16i1] = VectorRegisters;
340 TypeToRegisterSet[IceType_v16i8] = VectorRegisters; 342 TypeToRegisterSet[IceType_v16i8] = VectorRegisters;
341 TypeToRegisterSet[IceType_v8i16] = VectorRegisters; 343 TypeToRegisterSet[IceType_v8i16] = VectorRegisters;
342 TypeToRegisterSet[IceType_v4i32] = VectorRegisters; 344 TypeToRegisterSet[IceType_v4i32] = VectorRegisters;
343 TypeToRegisterSet[IceType_v4f32] = VectorRegisters; 345 TypeToRegisterSet[IceType_v4f32] = VectorRegisters;
346 TypeToRegisterSet[RegARM32::RCARM32_QtoS] = QtoSRegisters;
344 347
345 for (size_t i = 0; i < llvm::array_lengthof(TypeToRegisterSet); ++i) 348 for (size_t i = 0; i < llvm::array_lengthof(TypeToRegisterSet); ++i)
346 TypeToRegisterSetUnfiltered[i] = TypeToRegisterSet[i]; 349 TypeToRegisterSetUnfiltered[i] = TypeToRegisterSet[i];
347 350
348 filterTypeToRegisterSet( 351 filterTypeToRegisterSet(
349 Ctx, RegARM32::Reg_NUM, TypeToRegisterSet, 352 Ctx, RegARM32::Reg_NUM, TypeToRegisterSet,
350 llvm::array_lengthof(TypeToRegisterSet), [](int32_t RegNum) -> IceString { 353 llvm::array_lengthof(TypeToRegisterSet), [](int32_t RegNum) -> IceString {
351 // This function simply removes ", " from the register name. 354 // This function simply removes ", " from the register name.
352 IceString Name = RegARM32::getRegName(RegNum); 355 IceString Name = RegARM32::getRegName(RegNum);
353 constexpr const char RegSeparator[] = ", "; 356 constexpr const char RegSeparator[] = ", ";
(...skipping 3469 matching lines...) Expand 10 before | Expand all | Expand 10 after
3823 case IceType_v4i32: { 3826 case IceType_v4i32: {
3824 UnimplementedLoweringError(this, Inst); 3827 UnimplementedLoweringError(this, Inst);
3825 break; 3828 break;
3826 } 3829 }
3827 } 3830 }
3828 break; 3831 break;
3829 } 3832 }
3830 } 3833 }
3831 } 3834 }
3832 3835
3833 void TargetARM32::lowerExtractElement(const InstExtractElement *Inst) { 3836 void TargetARM32::lowerExtractElement(const InstExtractElement *Instr) {
3834 UnimplementedLoweringError(this, Inst); 3837 Variable *Dest = Instr->getDest();
3838 auto DestTy = Dest->getType();
3839
3840 if (Dest->isRematerializable()) {
3841 Context.insert<InstFakeDef>(Dest);
Jim Stichnoth 2016/02/03 15:28:37 Maybe I haven't thought this through well enough, …
John 2016/02/03 16:06:51 Yup, this is wrong. You have to handle these (whic…
3842 return;
3843 }
3844
3845 Variable *Src0 = legalizeToReg(Instr->getSrc(0));
Jim Stichnoth 2016/02/03 15:28:38 Optional: It would be nice if InstExtractElement h…
3846 Operand *Src1 = Instr->getSrc(1);
3847
3848 if (const auto *Imm = llvm::dyn_cast<ConstantInteger32>(Src1)) {
3849 auto Index = Imm->getValue();
3850 Variable *T = makeReg(DestTy);
3851
3852 if (isFloatingType(DestTy)) {
3853 // We need to make sure the source is in a suitable register.
3854 Src0->setRegClass(RegARM32::RCARM32_QtoS);
Jim Stichnoth 2016/02/03 15:28:38 It's possible (though unlikely) that legalizeToReg…
Eric Holk 2016/02/03 21:02:22 Done.
3855 }
3856
3857 _extract(T, Src0, Index);
3858 _mov(Dest, T);
3859 return;
3860 } else {
3861 assert(false && "extract requires a constant index");
Jim Stichnoth 2016/02/03 15:28:38 s/extract/extractelement would make a more instant…
Eric Holk 2016/02/03 21:02:21 Done.
3862 }
3835 } 3863 }
3836 3864
3837 namespace { 3865 namespace {
3838 // Validates FCMPARM32_TABLE's declaration w.r.t. InstFcmp::FCondition ordering 3866 // Validates FCMPARM32_TABLE's declaration w.r.t. InstFcmp::FCondition ordering
3839 // (and naming). 3867 // (and naming).
3840 enum { 3868 enum {
3841 #define X(val, CC0, CC1) _fcmp_ll_##val, 3869 #define X(val, CC0, CC1) _fcmp_ll_##val,
3842 FCMPARM32_TABLE 3870 FCMPARM32_TABLE
3843 #undef X 3871 #undef X
3844 _fcmp_ll_NUM 3872 _fcmp_ll_NUM
(...skipping 373 matching lines...) Expand 10 before | Expand all | Expand 10 after
4218 _mov(T, _0); 4246 _mov(T, _0);
4219 CondWhenTrue Cond = lowerIcmpCond(Inst); 4247 CondWhenTrue Cond = lowerIcmpCond(Inst);
4220 _mov_redefined(T, _1, Cond.WhenTrue0); 4248 _mov_redefined(T, _1, Cond.WhenTrue0);
4221 _mov(Dest, T); 4249 _mov(Dest, T);
4222 4250
4223 assert(Cond.WhenTrue1 == CondARM32::kNone); 4251 assert(Cond.WhenTrue1 == CondARM32::kNone);
4224 4252
4225 return; 4253 return;
4226 } 4254 }
4227 4255
4228 void TargetARM32::lowerInsertElement(const InstInsertElement *Inst) { 4256 void TargetARM32::lowerInsertElement(const InstInsertElement *Instr) {
4229 UnimplementedLoweringError(this, Inst); 4257 Variable *Dest = Instr->getDest();
4258 auto DestTy = Dest->getType();
4259
4260 if (Dest->isRematerializable()) {
4261 Context.insert<InstFakeDef>(Dest);
4262 return;
4263 }
4264
4265 Variable *Src0 = legalizeToReg(Instr->getSrc(0));
4266 Variable *Src1 = legalizeToReg(Instr->getSrc(1));
4267 Operand *Src2 = Instr->getSrc(2);
4268
4269 if (const auto *Imm = llvm::dyn_cast<ConstantInteger32>(Src2)) {
4270 auto Index = Imm->getValue();
4271 Variable *T = makeReg(DestTy);
4272
4273 if (isFloatingType(DestTy)) {
4274 T->setRegClass(RegARM32::RCARM32_QtoS);
4275 }
4276
4277 _mov(T, Src0);
4278 _insert(T, Src1, Index);
4279 _set_dest_redefined();
4280 _mov(Dest, T);
4281 return;
4282 }
4283 assert(false && "insert requires a constant index");
4230 } 4284 }
4231 4285
4232 namespace { 4286 namespace {
4233 inline uint64_t getConstantMemoryOrder(Operand *Opnd) { 4287 inline uint64_t getConstantMemoryOrder(Operand *Opnd) {
4234 if (auto *Integer = llvm::dyn_cast<ConstantInteger32>(Opnd)) 4288 if (auto *Integer = llvm::dyn_cast<ConstantInteger32>(Opnd))
4235 return Integer->getValue(); 4289 return Integer->getValue();
4236 return Intrinsics::MemoryOrderInvalid; 4290 return Intrinsics::MemoryOrderInvalid;
4237 } 4291 }
4238 } // end of anonymous namespace 4292 } // end of anonymous namespace
4239 4293
(...skipping 2276 matching lines...) Expand 10 before | Expand all | Expand 10 after
6516 Str << ".eabi_attribute 14, 3 @ Tag_ABI_PCS_R9_use: Not used\n"; 6570 Str << ".eabi_attribute 14, 3 @ Tag_ABI_PCS_R9_use: Not used\n";
6517 } 6571 }
6518 6572
6519 llvm::SmallBitVector TargetARM32::TypeToRegisterSet[RegARM32::RCARM32_NUM]; 6573 llvm::SmallBitVector TargetARM32::TypeToRegisterSet[RegARM32::RCARM32_NUM];
6520 llvm::SmallBitVector 6574 llvm::SmallBitVector
6521 TargetARM32::TypeToRegisterSetUnfiltered[RegARM32::RCARM32_NUM]; 6575 TargetARM32::TypeToRegisterSetUnfiltered[RegARM32::RCARM32_NUM];
6522 llvm::SmallBitVector TargetARM32::RegisterAliases[RegARM32::Reg_NUM]; 6576 llvm::SmallBitVector TargetARM32::RegisterAliases[RegARM32::Reg_NUM];
6523 6577
6524 } // end of namespace ARM32 6578 } // end of namespace ARM32
6525 } // end of namespace Ice 6579 } // end of namespace Ice
OLDNEW

Powered by Google App Engine
This is Rietveld 408576698