Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(117)

Side by Side Diff: src/IceInstARM32.cpp

Issue 1679023008: Add insert/extract element to the integrated ARM assembler. (Closed) Base URL: https://chromium.googlesource.com/native_client/pnacl-subzero.git@master
Patch Set: Fix nits. Created 4 years, 10 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View unified diff | Download patch
« no previous file with comments | « src/IceInstARM32.h ('k') | tests_lit/assembler/arm32/insert-extract.ll » ('j') | no next file with comments »
Toggle Intra-line Diffs ('i') | Expand Comments ('e') | Collapse Comments ('c') | Show Comments Hide Comments ('s')
OLDNEW
1 //===- subzero/src/IceInstARM32.cpp - ARM32 instruction implementation ----===// 1 //===- subzero/src/IceInstARM32.cpp - ARM32 instruction implementation ----===//
2 // 2 //
3 // The Subzero Code Generator 3 // The Subzero Code Generator
4 // 4 //
5 // This file is distributed under the University of Illinois Open Source 5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details. 6 // License. See LICENSE.TXT for details.
7 // 7 //
8 //===----------------------------------------------------------------------===// 8 //===----------------------------------------------------------------------===//
9 /// 9 ///
10 /// \file 10 /// \file
(...skipping 1049 matching lines...) Expand 10 before | Expand all | Expand 10 after
1060 } 1060 }
1061 1061
1062 if (Src64 == nullptr) { 1062 if (Src64 == nullptr) {
1063 addSource(Src); 1063 addSource(Src);
1064 } else { 1064 } else {
1065 addSource(Src64->getLo()); 1065 addSource(Src64->getLo());
1066 addSource(Src64->getHi()); 1066 addSource(Src64->getHi());
1067 } 1067 }
1068 } 1068 }
1069 1069
1070 namespace {
1071
1070 // These next two functions find the D register that maps to the half of the Q 1072 // These next two functions find the D register that maps to the half of the Q
1071 // register that this instruction is accessing. 1073 // register that this instruction is accessing.
1072 Register getDRegister(const Variable *Src, uint32_t Index) { 1074 Register getDRegister(const Variable *Src, uint32_t Index) {
1073 assert(Src->hasReg()); 1075 assert(Src->hasReg());
1074 const auto SrcReg = Src->getRegNum(); 1076 const auto SrcReg = Src->getRegNum();
1075 1077
1076 const RegARM32::RegTableType &SrcEntry = RegARM32::RegTable[SrcReg]; 1078 const RegARM32::RegTableType &SrcEntry = RegARM32::RegTable[SrcReg];
1077 assert(SrcEntry.IsVec128); 1079 assert(SrcEntry.IsVec128);
1078 1080
1079 const uint32_t NumElements = typeNumElements(Src->getType()); 1081 const uint32_t NumElements = typeNumElements(Src->getType());
(...skipping 37 matching lines...) Expand 10 before | Expand all | Expand 10 after
1117 assert(SrcReg < RegARM32::Reg_q8); 1119 assert(SrcReg < RegARM32::Reg_q8);
1118 1120
1119 // This part assumes the register alias list goes q0, d0, d1, s0, s1, s2, s3. 1121 // This part assumes the register alias list goes q0, d0, d1, s0, s1, s2, s3.
1120 assert(Index < 4); 1122 assert(Index < 4);
1121 1123
1122 // TODO(jpp): find a way to do this that doesn't rely on ordering of the alias 1124 // TODO(jpp): find a way to do this that doesn't rely on ordering of the alias
1123 // list. 1125 // list.
1124 return static_cast<Register>(RegARM32::RegTable[SrcReg].Aliases[Index + 3]); 1126 return static_cast<Register>(RegARM32::RegTable[SrcReg].Aliases[Index + 3]);
1125 } 1127 }
1126 1128
1129 } // end of anonymous namespace
1130
1127 void InstARM32Extract::emit(const Cfg *Func) const { 1131 void InstARM32Extract::emit(const Cfg *Func) const {
1128 Ostream &Str = Func->getContext()->getStrEmit(); 1132 Ostream &Str = Func->getContext()->getStrEmit();
1129 const Type DestTy = getDest()->getType(); 1133 const Type DestTy = getDest()->getType();
1130 1134
1131 const auto *Src = llvm::cast<Variable>(getSrc(0)); 1135 const auto *Src = llvm::cast<Variable>(getSrc(0));
1132 1136
1133 if (isIntegerType(DestTy)) { 1137 if (isIntegerType(DestTy)) {
1134 Str << "\t" 1138 Str << "\t"
1135 << "vmov" << getPredicate(); 1139 << "vmov" << getPredicate();
1136 const uint32_t BitSize = typeWidthInBytes(DestTy) * CHAR_BIT; 1140 const uint32_t BitSize = typeWidthInBytes(DestTy) * CHAR_BIT;
(...skipping 18 matching lines...) Expand all
1155 Str << "\t" 1159 Str << "\t"
1156 << "vmov" << getPredicate() << ".f32" 1160 << "vmov" << getPredicate() << ".f32"
1157 << "\t"; 1161 << "\t";
1158 getDest()->emit(Func); 1162 getDest()->emit(Func);
1159 Str << ", " << RegARM32::RegTable[SrcReg].Name; 1163 Str << ", " << RegARM32::RegTable[SrcReg].Name;
1160 } else { 1164 } else {
1161 assert(false && "Invalid extract type"); 1165 assert(false && "Invalid extract type");
1162 } 1166 }
1163 } 1167 }
1164 1168
// Integrated-assembler emission path for the vector element extract
// instruction (the textual emit() for the same instruction prints a "vmov").
// Hands the scalar destination, the vector source getSrc(0), the Index member
// and the predicate to the ARM32 assembler obtained from Func, choosing the
// assembler routine by whether the destination type is integer or floating.
// NOTE(review): Index is presumably the lane being extracted -- it is a member
// declared outside this view; confirm against IceInstARM32.h.
1169 void InstARM32Extract::emitIAS(const Cfg *Func) const {
1170 const Operand *Dest = getDest();
1171 const Type DestTy = Dest->getType();
1172 const Operand *Src = getSrc(0);
1173 assert(isVectorType(Src->getType())); // source operand must be a vector
1174 assert(DestTy == typeElementType(Src->getType())); // dest type must equal the vector's element type
1175 auto *Asm = Func->getAssembler<ARM32::AssemblerARM32>();
1176 if (isIntegerType(DestTy)) { // integer element: use the vmovrqi assembler routine
1177 Asm->vmovrqi(Dest, Src, Index, getPredicate());
1178 assert(!Asm->needsTextFixup()); // no emitUsingTextFixup fallback here, so a fixup request is a bug
1179 return;
1180 }
1181 assert(isFloatingType(DestTy)); // only integer and floating element types are handled
1182 Asm->vmovsqi(Dest, Src, Index, getPredicate());
1183 assert(!Asm->needsTextFixup()); // as above: this path never falls back to text emission
1184 }
1185
1165 void InstARM32Insert::emit(const Cfg *Func) const { 1186 void InstARM32Insert::emit(const Cfg *Func) const {
1166 Ostream &Str = Func->getContext()->getStrEmit(); 1187 Ostream &Str = Func->getContext()->getStrEmit();
1167 const Variable *Dest = getDest(); 1188 const Variable *Dest = getDest();
1168 const Type DestTy = getDest()->getType(); 1189 const Type DestTy = getDest()->getType();
1169 1190
1170 const auto *Src = llvm::cast<Variable>(getSrc(0)); 1191 const auto *Src = llvm::cast<Variable>(getSrc(0));
1171 1192
1172 if (isIntegerType(DestTy)) { 1193 if (isIntegerType(DestTy)) {
1173 Str << "\t" 1194 Str << "\t"
1174 << "vmov" << getPredicate(); 1195 << "vmov" << getPredicate();
(...skipping 11 matching lines...) Expand all
1186 << "vmov" << getPredicate() << ".f32" 1207 << "vmov" << getPredicate() << ".f32"
1187 << "\t"; 1208 << "\t";
1188 const Register DestReg = getSRegister(Dest, Index); 1209 const Register DestReg = getSRegister(Dest, Index);
1189 Str << RegARM32::RegTable[DestReg].Name << ", "; 1210 Str << RegARM32::RegTable[DestReg].Name << ", ";
1190 Src->emit(Func); 1211 Src->emit(Func);
1191 } else { 1212 } else {
1192 assert(false && "Invalid insert type"); 1213 assert(false && "Invalid insert type");
1193 } 1214 }
1194 } 1215 }
1195 1216
// Integrated-assembler emission path for the vector element insert
// instruction (the textual emit() for the same instruction prints a "vmov").
// Hands the vector destination, the Index member, the scalar source getSrc(0)
// and the predicate to the ARM32 assembler obtained from Func, choosing the
// assembler routine by whether the source type is integer or floating.
// NOTE(review): Index is presumably the lane being written -- it is a member
// declared outside this view; confirm against IceInstARM32.h.
1217 void InstARM32Insert::emitIAS(const Cfg *Func) const {
1218 const Variable *Dest = getDest();
1219 const Operand *Src = getSrc(0);
1220 const Type SrcTy = Src->getType();
1221 assert(isVectorType(Dest->getType())); // destination must be a vector
1222 assert(typeElementType(Dest->getType()) == SrcTy); // source type must equal the vector's element type
1223 auto *Asm = Func->getAssembler<ARM32::AssemblerARM32>();
1224 if (isIntegerType(SrcTy)) { // integer element: use the vmovqir assembler routine
1225 const Operand *Src = getSrc(0); // NOTE(review): redundant -- shadows the identical Src declared at function scope; can be deleted
1226 Asm->vmovqir(Dest, Index, Src, getPredicate());
1227 assert(!Asm->needsTextFixup()); // no emitUsingTextFixup fallback here, so a fixup request is a bug
1228 return;
1229 }
1230 assert(isFloatingType(SrcTy)); // only integer and floating element types are handled
1231 Asm->vmovqis(Dest, Index, Src, getPredicate());
1232 assert(!Asm->needsTextFixup()); // as above: this path never falls back to text emission
1233 }
1234
1196 template <InstARM32::InstKindARM32 K> 1235 template <InstARM32::InstKindARM32 K>
1197 void InstARM32CmpLike<K>::emitIAS(const Cfg *Func) const { 1236 void InstARM32CmpLike<K>::emitIAS(const Cfg *Func) const {
1198 emitUsingTextFixup(Func); 1237 emitUsingTextFixup(Func);
1199 } 1238 }
1200 1239
1201 template <> void InstARM32Cmn::emitIAS(const Cfg *Func) const { 1240 template <> void InstARM32Cmn::emitIAS(const Cfg *Func) const {
1202 assert(getSrcSize() == 2); 1241 assert(getSrcSize() == 2);
1203 auto *Asm = Func->getAssembler<ARM32::AssemblerARM32>(); 1242 auto *Asm = Func->getAssembler<ARM32::AssemblerARM32>();
1204 Asm->cmn(getSrc(0), getSrc(1), getPredicate()); 1243 Asm->cmn(getSrc(0), getSrc(1), getPredicate());
1205 if (Asm->needsTextFixup()) 1244 if (Asm->needsTextFixup())
(...skipping 1514 matching lines...) Expand 10 before | Expand all | Expand 10 after
2720 2759
2721 template class InstARM32FourAddrGPR<InstARM32::Mla>; 2760 template class InstARM32FourAddrGPR<InstARM32::Mla>;
2722 template class InstARM32FourAddrGPR<InstARM32::Mls>; 2761 template class InstARM32FourAddrGPR<InstARM32::Mls>;
2723 2762
2724 template class InstARM32CmpLike<InstARM32::Cmn>; 2763 template class InstARM32CmpLike<InstARM32::Cmn>;
2725 template class InstARM32CmpLike<InstARM32::Cmp>; 2764 template class InstARM32CmpLike<InstARM32::Cmp>;
2726 template class InstARM32CmpLike<InstARM32::Tst>; 2765 template class InstARM32CmpLike<InstARM32::Tst>;
2727 2766
2728 } // end of namespace ARM32 2767 } // end of namespace ARM32
2729 } // end of namespace Ice 2768 } // end of namespace Ice
OLDNEW
« no previous file with comments | « src/IceInstARM32.h ('k') | tests_lit/assembler/arm32/insert-extract.ll » ('j') | no next file with comments »

Powered by Google App Engine
This is Rietveld 408576698