Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(463)

Side by Side Diff: src/arm64/simulator-arm64.h

Issue 2812573003: Reland "ARM64: Add NEON support" (Closed)
Patch Set: Add trace directory to gitignore Created 3 years, 8 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View unified diff | Download patch
« no previous file with comments | « src/arm64/macro-assembler-arm64-inl.h ('k') | src/arm64/simulator-arm64.cc » ('j') | no next file with comments »
Toggle Intra-line Diffs ('i') | Expand Comments ('e') | Collapse Comments ('c') | Show Comments Hide Comments ('s')
OLDNEW
1 // Copyright 2013 the V8 project authors. All rights reserved. 1 // Copyright 2013 the V8 project authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be 2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file. 3 // found in the LICENSE file.
4 4
5 #ifndef V8_ARM64_SIMULATOR_ARM64_H_ 5 #ifndef V8_ARM64_SIMULATOR_ARM64_H_
6 #define V8_ARM64_SIMULATOR_ARM64_H_ 6 #define V8_ARM64_SIMULATOR_ARM64_H_
7 7
8 #include <stdarg.h> 8 #include <stdarg.h>
9 #include <vector> 9 #include <vector>
10 10
(...skipping 52 matching lines...) Expand 10 before | Expand all | Expand 10 after
63 return try_catch_address; 63 return try_catch_address;
64 } 64 }
65 65
66 static void UnregisterCTryCatch(v8::internal::Isolate* isolate) { 66 static void UnregisterCTryCatch(v8::internal::Isolate* isolate) {
67 USE(isolate); 67 USE(isolate);
68 } 68 }
69 }; 69 };
70 70
71 #else // !defined(USE_SIMULATOR) 71 #else // !defined(USE_SIMULATOR)
72 72
73 // Assemble the specified IEEE-754 components into the target type and apply
74 // appropriate rounding.
75 // sign: 0 = positive, 1 = negative
76 // exponent: Unbiased IEEE-754 exponent.
77 // mantissa: The mantissa of the input. The top bit (which is not encoded for
78 // normal IEEE-754 values) must not be omitted. This bit has the
79 // value 'pow(2, exponent)'.
80 //
81 // The input value is assumed to be a normalized value. That is, the input may
82 // not be infinity or NaN. If the source value is subnormal, it must be
83 // normalized before calling this function such that the highest set bit in the
84 // mantissa has the value 'pow(2, exponent)'.
85 //
86 // Callers should use FPRoundToFloat or FPRoundToDouble directly, rather than
87 // calling a templated FPRound.
88 template <class T, int ebits, int mbits>
89 T FPRound(int64_t sign, int64_t exponent, uint64_t mantissa,
90 FPRounding round_mode) {
91 static_assert((sizeof(T) * 8) >= (1 + ebits + mbits),
92 "destination type T not large enough");
93 static_assert(sizeof(T) <= sizeof(uint64_t),
94 "maximum size of destination type T is 64 bits");
95 static_assert(std::is_unsigned<T>::value,
96 "destination type T must be unsigned");
97
98 DCHECK((sign == 0) || (sign == 1));
99
100 // Only FPTieEven and FPRoundOdd rounding modes are implemented.
101 DCHECK((round_mode == FPTieEven) || (round_mode == FPRoundOdd));
102
103 // Rounding can promote subnormals to normals, and normals to infinities. For
104 // example, a double with exponent 127 (FLT_MAX_EXP) would appear to be
105 // encodable as a float, but rounding based on the low-order mantissa bits
106 // could make it overflow. With ties-to-even rounding, this value would become
107 // an infinity.
108
109 // ---- Rounding Method ----
110 //
111 // The exponent is irrelevant in the rounding operation, so we treat the
112 // lowest-order bit that will fit into the result ('onebit') as having
113 // the value '1'. Similarly, the highest-order bit that won't fit into
114 // the result ('halfbit') has the value '0.5'. The 'point' sits between
115 // 'onebit' and 'halfbit':
116 //
117 // These bits fit into the result.
118 // |---------------------|
119 // mantissa = 0bxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxx
120 // ||
121 // / |
122 // / halfbit
123 // onebit
124 //
125 // For subnormal outputs, the range of representable bits is smaller and
126 // the position of onebit and halfbit depends on the exponent of the
127 // input, but the method is otherwise similar.
128 //
129 // onebit(frac)
130 // |
131 // | halfbit(frac) halfbit(adjusted)
132 // | / /
133 // | | |
134 // 0b00.0 (exact) -> 0b00.0 (exact) -> 0b00
135 // 0b00.0... -> 0b00.0... -> 0b00
136 // 0b00.1 (exact) -> 0b00.0111..111 -> 0b00
137 // 0b00.1... -> 0b00.1... -> 0b01
138 // 0b01.0 (exact) -> 0b01.0 (exact) -> 0b01
139 // 0b01.0... -> 0b01.0... -> 0b01
140 // 0b01.1 (exact) -> 0b01.1 (exact) -> 0b10
141 // 0b01.1... -> 0b01.1... -> 0b10
142 // 0b10.0 (exact) -> 0b10.0 (exact) -> 0b10
143 // 0b10.0... -> 0b10.0... -> 0b10
144 // 0b10.1 (exact) -> 0b10.0111..111 -> 0b10
145 // 0b10.1... -> 0b10.1... -> 0b11
146 // 0b11.0 (exact) -> 0b11.0 (exact) -> 0b11
147 // ... / | / |
148 // / | / |
149 // / |
150 // adjusted = frac - (halfbit(mantissa) & ~onebit(frac)); / |
151 //
152 // mantissa = (mantissa >> shift) + halfbit(adjusted);
153
154 const int mantissa_offset = 0;
155 const int exponent_offset = mantissa_offset + mbits;
156 const int sign_offset = exponent_offset + ebits;
157 DCHECK_EQ(sign_offset, static_cast<int>(sizeof(T) * 8 - 1));
158
159 // Bail out early for zero inputs.
160 if (mantissa == 0) {
161 return static_cast<T>(sign << sign_offset);
162 }
163
164 // If all bits in the exponent are set, the value is infinite or NaN.
165 // This is true for all binary IEEE-754 formats.
166 const int infinite_exponent = (1 << ebits) - 1;
167 const int max_normal_exponent = infinite_exponent - 1;
168
169 // Apply the exponent bias to encode it for the result. Doing this early makes
170 // it easy to detect values that will be infinite or subnormal.
171 exponent += max_normal_exponent >> 1;
172
173 if (exponent > max_normal_exponent) {
174 // Overflow: the input is too large for the result type to represent.
175 if (round_mode == FPTieEven) {
176 // FPTieEven rounding mode handles overflows using infinities.
177 exponent = infinite_exponent;
178 mantissa = 0;
179 } else {
180 DCHECK_EQ(round_mode, FPRoundOdd);
181 // FPRoundOdd rounding mode handles overflows using the largest magnitude
182 // normal number.
183 exponent = max_normal_exponent;
184 mantissa = (UINT64_C(1) << exponent_offset) - 1;
185 }
186 return static_cast<T>((sign << sign_offset) |
187 (exponent << exponent_offset) |
188 (mantissa << mantissa_offset));
189 }
190
191 // Calculate the shift required to move the top mantissa bit to the proper
192 // place in the destination type.
193 const int highest_significant_bit = 63 - CountLeadingZeros(mantissa, 64);
194 int shift = highest_significant_bit - mbits;
195
196 if (exponent <= 0) {
197 // The output will be subnormal (before rounding).
198 // For subnormal outputs, the shift must be adjusted by the exponent. The +1
199 // is necessary because the exponent of a subnormal value (encoded as 0) is
200 // the same as the exponent of the smallest normal value (encoded as 1).
201 shift += -exponent + 1;
202
203 // Handle inputs that would produce a zero output.
204 //
205 // Shifts higher than highest_significant_bit+1 will always produce a zero
206 // result. A shift of exactly highest_significant_bit+1 might produce a
207 // non-zero result after rounding.
208 if (shift > (highest_significant_bit + 1)) {
209 if (round_mode == FPTieEven) {
210 // The result will always be +/-0.0.
211 return static_cast<T>(sign << sign_offset);
212 } else {
213 DCHECK_EQ(round_mode, FPRoundOdd);
214 DCHECK_NE(mantissa, 0U);
215 // For FPRoundOdd, if the mantissa is too small to represent and
216 // non-zero return the next "odd" value.
217 return static_cast<T>((sign << sign_offset) | 1);
218 }
219 }
220
221 // Properly encode the exponent for a subnormal output.
222 exponent = 0;
223 } else {
224 // Clear the topmost mantissa bit, since this is not encoded in IEEE-754
225 // normal values.
226 mantissa &= ~(UINT64_C(1) << highest_significant_bit);
227 }
228
229 if (shift > 0) {
230 if (round_mode == FPTieEven) {
231 // We have to shift the mantissa to the right. Some precision is lost, so
232 // we need to apply rounding.
233 uint64_t onebit_mantissa = (mantissa >> (shift)) & 1;
234 uint64_t halfbit_mantissa = (mantissa >> (shift - 1)) & 1;
235 uint64_t adjustment = (halfbit_mantissa & ~onebit_mantissa);
236 uint64_t adjusted = mantissa - adjustment;
237 T halfbit_adjusted = (adjusted >> (shift - 1)) & 1;
238
239 T result =
240 static_cast<T>((sign << sign_offset) | (exponent << exponent_offset) |
241 ((mantissa >> shift) << mantissa_offset));
242
243 // A very large mantissa can overflow during rounding. If this happens,
244 // the exponent should be incremented and the mantissa set to 1.0
245 // (encoded as 0). Applying halfbit_adjusted after assembling the float
246 // has the nice side-effect that this case is handled for free.
247 //
248 // This also handles cases where a very large finite value overflows to
249 // infinity, or where a very large subnormal value overflows to become
250 // normal.
251 return result + halfbit_adjusted;
252 } else {
253 DCHECK_EQ(round_mode, FPRoundOdd);
254 // If any bits at position halfbit or below are set, onebit (ie. the
255 // bottom bit of the resulting mantissa) must be set.
256 uint64_t fractional_bits = mantissa & ((UINT64_C(1) << shift) - 1);
257 if (fractional_bits != 0) {
258 mantissa |= UINT64_C(1) << shift;
259 }
260
261 return static_cast<T>((sign << sign_offset) |
262 (exponent << exponent_offset) |
263 ((mantissa >> shift) << mantissa_offset));
264 }
265 } else {
266 // We have to shift the mantissa to the left (or not at all). The input
267 // mantissa is exactly representable in the output mantissa, so apply no
268 // rounding correction.
269 return static_cast<T>((sign << sign_offset) |
270 (exponent << exponent_offset) |
271 ((mantissa << -shift) << mantissa_offset));
272 }
273 }
274
275 // Representation of memory, with typed getters and setters for access.
276 class SimMemory {
277 public:
278 template <typename T>
279 static T AddressUntag(T address) {
280 // Cast the address using a C-style cast. A reinterpret_cast would be
281 // appropriate, but it can't cast one integral type to another.
282 uint64_t bits = (uint64_t)address;
283 return (T)(bits & ~kAddressTagMask);
284 }
285
286 template <typename T, typename A>
287 static T Read(A address) {
288 T value;
289 address = AddressUntag(address);
290 DCHECK((sizeof(value) == 1) || (sizeof(value) == 2) ||
291 (sizeof(value) == 4) || (sizeof(value) == 8) ||
292 (sizeof(value) == 16));
293 memcpy(&value, reinterpret_cast<const char*>(address), sizeof(value));
294 return value;
295 }
296
297 template <typename T, typename A>
298 static void Write(A address, T value) {
299 address = AddressUntag(address);
300 DCHECK((sizeof(value) == 1) || (sizeof(value) == 2) ||
301 (sizeof(value) == 4) || (sizeof(value) == 8) ||
302 (sizeof(value) == 16));
303 memcpy(reinterpret_cast<char*>(address), &value, sizeof(value));
304 }
305 };
73 306
74 // The proper way to initialize a simulated system register (such as NZCV) is as 307 // The proper way to initialize a simulated system register (such as NZCV) is as
75 // follows: 308 // follows:
76 // SimSystemRegister nzcv = SimSystemRegister::DefaultValueFor(NZCV); 309 // SimSystemRegister nzcv = SimSystemRegister::DefaultValueFor(NZCV);
77 class SimSystemRegister { 310 class SimSystemRegister {
78 public: 311 public:
79 // The default constructor represents a register which has no writable bits. 312 // The default constructor represents a register which has no writable bits.
80 // It is not possible to set its value to anything other than 0. 313 // It is not possible to set its value to anything other than 0.
81 SimSystemRegister() : value_(0), write_ignore_mask_(0xffffffff) { } 314 SimSystemRegister() : value_(0), write_ignore_mask_(0xffffffff) { }
82 315
(...skipping 35 matching lines...) Expand 10 before | Expand all | Expand 10 after
118 // describes the bits which are not modifiable. 351 // describes the bits which are not modifiable.
119 SimSystemRegister(uint32_t value, uint32_t write_ignore_mask) 352 SimSystemRegister(uint32_t value, uint32_t write_ignore_mask)
120 : value_(value), write_ignore_mask_(write_ignore_mask) { } 353 : value_(value), write_ignore_mask_(write_ignore_mask) { }
121 354
122 uint32_t value_; 355 uint32_t value_;
123 uint32_t write_ignore_mask_; 356 uint32_t write_ignore_mask_;
124 }; 357 };
125 358
126 359
127 // Represent a register (r0-r31, v0-v31). 360 // Represent a register (r0-r31, v0-v31).
361 template <int kSizeInBytes>
128 class SimRegisterBase { 362 class SimRegisterBase {
129 public: 363 public:
130 template<typename T> 364 template<typename T>
131 void Set(T new_value) { 365 void Set(T new_value) {
132 value_ = 0; 366 static_assert(sizeof(new_value) <= kSizeInBytes,
367 "Size of new_value must be <= size of template type.");
368 if (sizeof(new_value) < kSizeInBytes) {
369 // All AArch64 registers are zero-extending.
370 memset(value_ + sizeof(new_value), 0, kSizeInBytes - sizeof(new_value));
371 }
133 memcpy(&value_, &new_value, sizeof(T)); 372 memcpy(&value_, &new_value, sizeof(T));
134 } 373 NotifyRegisterWrite();
135 374 }
136 template<typename T> 375
137 T Get() const { 376 // Insert a typed value into a register, leaving the rest of the register
377 // unchanged. The lane parameter indicates where in the register the value
378 // should be inserted, in the range [ 0, sizeof(value_) / sizeof(T) ), where
379 // 0 represents the least significant bits.
380 template <typename T>
381 void Insert(int lane, T new_value) {
382 DCHECK_GE(lane, 0);
383 DCHECK_LE(sizeof(new_value) + (lane * sizeof(new_value)),
384 static_cast<unsigned>(kSizeInBytes));
385 memcpy(&value_[lane * sizeof(new_value)], &new_value, sizeof(new_value));
386 NotifyRegisterWrite();
387 }
388
389 template <typename T>
390 T Get(int lane = 0) const {
138 T result; 391 T result;
139 memcpy(&result, &value_, sizeof(T)); 392 DCHECK_GE(lane, 0);
393 DCHECK_LE(sizeof(result) + (lane * sizeof(result)),
394 static_cast<unsigned>(kSizeInBytes));
395 memcpy(&result, &value_[lane * sizeof(result)], sizeof(result));
140 return result; 396 return result;
141 } 397 }
142 398
399 // TODO(all): Make this return a map of updated bytes, so that we can
400 // highlight updated lanes for load-and-insert. (That never happens for scalar
401 // code, but NEON has some instructions that can update individual lanes.)
402 bool WrittenSinceLastLog() const { return written_since_last_log_; }
403
404 void NotifyRegisterLogged() { written_since_last_log_ = false; }
405
143 protected: 406 protected:
144 int64_t value_; 407 uint8_t value_[kSizeInBytes];
408
409 // Helpers to aid with register tracing.
410 bool written_since_last_log_;
411
412 void NotifyRegisterWrite() { written_since_last_log_ = true; }
145 }; 413 };
146 414
147 415 typedef SimRegisterBase<kXRegSize> SimRegister; // r0-r31
148 typedef SimRegisterBase SimRegister; // r0-r31 416 typedef SimRegisterBase<kQRegSize> SimVRegister; // v0-v31
149 typedef SimRegisterBase SimFPRegister; // v0-v31 417
150 418 // Representation of a vector register, with typed getters and setters for lanes
419 // and additional information to represent lane state.
420 class LogicVRegister {
421 public:
422 inline LogicVRegister(SimVRegister& other) // NOLINT
423 : register_(other) {
424 for (unsigned i = 0; i < arraysize(saturated_); i++) {
425 saturated_[i] = kNotSaturated;
426 }
427 for (unsigned i = 0; i < arraysize(round_); i++) {
428 round_[i] = false;
429 }
430 }
431
432 int64_t Int(VectorFormat vform, int index) const {
433 int64_t element;
434 switch (LaneSizeInBitsFromFormat(vform)) {
435 case 8:
436 element = register_.Get<int8_t>(index);
437 break;
438 case 16:
439 element = register_.Get<int16_t>(index);
440 break;
441 case 32:
442 element = register_.Get<int32_t>(index);
443 break;
444 case 64:
445 element = register_.Get<int64_t>(index);
446 break;
447 default:
448 UNREACHABLE();
449 return 0;
450 }
451 return element;
452 }
453
454 uint64_t Uint(VectorFormat vform, int index) const {
455 uint64_t element;
456 switch (LaneSizeInBitsFromFormat(vform)) {
457 case 8:
458 element = register_.Get<uint8_t>(index);
459 break;
460 case 16:
461 element = register_.Get<uint16_t>(index);
462 break;
463 case 32:
464 element = register_.Get<uint32_t>(index);
465 break;
466 case 64:
467 element = register_.Get<uint64_t>(index);
468 break;
469 default:
470 UNREACHABLE();
471 return 0;
472 }
473 return element;
474 }
475
476 uint64_t UintLeftJustified(VectorFormat vform, int index) const {
477 return Uint(vform, index) << (64 - LaneSizeInBitsFromFormat(vform));
478 }
479
480 int64_t IntLeftJustified(VectorFormat vform, int index) const {
481 uint64_t value = UintLeftJustified(vform, index);
482 int64_t result;
483 memcpy(&result, &value, sizeof(result));
484 return result;
485 }
486
487 void SetInt(VectorFormat vform, int index, int64_t value) const {
488 switch (LaneSizeInBitsFromFormat(vform)) {
489 case 8:
490 register_.Insert(index, static_cast<int8_t>(value));
491 break;
492 case 16:
493 register_.Insert(index, static_cast<int16_t>(value));
494 break;
495 case 32:
496 register_.Insert(index, static_cast<int32_t>(value));
497 break;
498 case 64:
499 register_.Insert(index, static_cast<int64_t>(value));
500 break;
501 default:
502 UNREACHABLE();
503 return;
504 }
505 }
506
507 void SetIntArray(VectorFormat vform, const int64_t* src) const {
508 ClearForWrite(vform);
509 for (int i = 0; i < LaneCountFromFormat(vform); i++) {
510 SetInt(vform, i, src[i]);
511 }
512 }
513
514 void SetUint(VectorFormat vform, int index, uint64_t value) const {
515 switch (LaneSizeInBitsFromFormat(vform)) {
516 case 8:
517 register_.Insert(index, static_cast<uint8_t>(value));
518 break;
519 case 16:
520 register_.Insert(index, static_cast<uint16_t>(value));
521 break;
522 case 32:
523 register_.Insert(index, static_cast<uint32_t>(value));
524 break;
525 case 64:
526 register_.Insert(index, static_cast<uint64_t>(value));
527 break;
528 default:
529 UNREACHABLE();
530 return;
531 }
532 }
533
534 void SetUintArray(VectorFormat vform, const uint64_t* src) const {
535 ClearForWrite(vform);
536 for (int i = 0; i < LaneCountFromFormat(vform); i++) {
537 SetUint(vform, i, src[i]);
538 }
539 }
540
541 void ReadUintFromMem(VectorFormat vform, int index, uint64_t addr) const;
542
543 void WriteUintToMem(VectorFormat vform, int index, uint64_t addr) const;
544
545 template <typename T>
546 T Float(int index) const {
547 return register_.Get<T>(index);
548 }
549
550 template <typename T>
551 void SetFloat(int index, T value) const {
552 register_.Insert(index, value);
553 }
554
555 // When setting a result in a register of size less than Q, the top bits of
556 // the Q register must be cleared.
557 void ClearForWrite(VectorFormat vform) const {
558 unsigned size = RegisterSizeInBytesFromFormat(vform);
559 for (unsigned i = size; i < kQRegSize; i++) {
560 SetUint(kFormat16B, i, 0);
561 }
562 }
563
564 // Saturation state for each lane of a vector.
565 enum Saturation {
566 kNotSaturated = 0,
567 kSignedSatPositive = 1 << 0,
568 kSignedSatNegative = 1 << 1,
569 kSignedSatMask = kSignedSatPositive | kSignedSatNegative,
570 kSignedSatUndefined = kSignedSatMask,
571 kUnsignedSatPositive = 1 << 2,
572 kUnsignedSatNegative = 1 << 3,
573 kUnsignedSatMask = kUnsignedSatPositive | kUnsignedSatNegative,
574 kUnsignedSatUndefined = kUnsignedSatMask
575 };
576
577 // Getters for saturation state.
578 Saturation GetSignedSaturation(int index) {
579 return static_cast<Saturation>(saturated_[index] & kSignedSatMask);
580 }
581
582 Saturation GetUnsignedSaturation(int index) {
583 return static_cast<Saturation>(saturated_[index] & kUnsignedSatMask);
584 }
585
586 // Setters for saturation state.
587 void ClearSat(int index) { saturated_[index] = kNotSaturated; }
588
589 void SetSignedSat(int index, bool positive) {
590 SetSatFlag(index, positive ? kSignedSatPositive : kSignedSatNegative);
591 }
592
593 void SetUnsignedSat(int index, bool positive) {
594 SetSatFlag(index, positive ? kUnsignedSatPositive : kUnsignedSatNegative);
595 }
596
597 void SetSatFlag(int index, Saturation sat) {
598 saturated_[index] = static_cast<Saturation>(saturated_[index] | sat);
599 DCHECK_NE(sat & kUnsignedSatMask, kUnsignedSatUndefined);
600 DCHECK_NE(sat & kSignedSatMask, kSignedSatUndefined);
601 }
602
603 // Saturate lanes of a vector based on saturation state.
604 LogicVRegister& SignedSaturate(VectorFormat vform) {
605 for (int i = 0; i < LaneCountFromFormat(vform); i++) {
606 Saturation sat = GetSignedSaturation(i);
607 if (sat == kSignedSatPositive) {
608 SetInt(vform, i, MaxIntFromFormat(vform));
609 } else if (sat == kSignedSatNegative) {
610 SetInt(vform, i, MinIntFromFormat(vform));
611 }
612 }
613 return *this;
614 }
615
616 LogicVRegister& UnsignedSaturate(VectorFormat vform) {
617 for (int i = 0; i < LaneCountFromFormat(vform); i++) {
618 Saturation sat = GetUnsignedSaturation(i);
619 if (sat == kUnsignedSatPositive) {
620 SetUint(vform, i, MaxUintFromFormat(vform));
621 } else if (sat == kUnsignedSatNegative) {
622 SetUint(vform, i, 0);
623 }
624 }
625 return *this;
626 }
627
628 // Getter for rounding state.
629 bool GetRounding(int index) { return round_[index]; }
630
631 // Setter for rounding state.
632 void SetRounding(int index, bool round) { round_[index] = round; }
633
634 // Round lanes of a vector based on rounding state.
635 LogicVRegister& Round(VectorFormat vform) {
636 for (int i = 0; i < LaneCountFromFormat(vform); i++) {
637 SetUint(vform, i, Uint(vform, i) + (GetRounding(i) ? 1 : 0));
638 }
639 return *this;
640 }
641
642 // Unsigned halve lanes of a vector, and use the saturation state to set the
643 // top bit.
644 LogicVRegister& Uhalve(VectorFormat vform) {
645 for (int i = 0; i < LaneCountFromFormat(vform); i++) {
646 uint64_t val = Uint(vform, i);
647 SetRounding(i, (val & 1) == 1);
648 val >>= 1;
649 if (GetUnsignedSaturation(i) != kNotSaturated) {
650 // If the operation causes unsigned saturation, the bit shifted into the
651 // most significant bit must be set.
652 val |= (MaxUintFromFormat(vform) >> 1) + 1;
653 }
654 SetInt(vform, i, val);
655 }
656 return *this;
657 }
658
659 // Signed halve lanes of a vector, and use the carry state to set the top bit.
660 LogicVRegister& Halve(VectorFormat vform) {
661 for (int i = 0; i < LaneCountFromFormat(vform); i++) {
662 int64_t val = Int(vform, i);
663 SetRounding(i, (val & 1) == 1);
664 val >>= 1;
665 if (GetSignedSaturation(i) != kNotSaturated) {
666 // If the operation causes signed saturation, the sign bit must be
667 // inverted.
668 val ^= (MaxUintFromFormat(vform) >> 1) + 1;
669 }
670 SetInt(vform, i, val);
671 }
672 return *this;
673 }
674
675 private:
676 SimVRegister& register_;
677
678 // Allocate one saturation state entry per lane; largest register is type Q,
679 // and lanes can be a minimum of one byte wide.
680 Saturation saturated_[kQRegSize];
681
682 // Allocate one rounding state entry per lane.
683 bool round_[kQRegSize];
684 };
151 685
152 class Simulator : public DecoderVisitor { 686 class Simulator : public DecoderVisitor {
153 public: 687 public:
154 static void FlushICache(base::CustomMatcherHashMap* i_cache, void* start, 688 static void FlushICache(base::CustomMatcherHashMap* i_cache, void* start,
155 size_t size) { 689 size_t size) {
156 USE(i_cache); 690 USE(i_cache);
157 USE(start); 691 USE(start);
158 USE(size); 692 USE(size);
159 } 693 }
160 694
(...skipping 147 matching lines...) Expand 10 before | Expand all | Expand 10 after
308 842
309 virtual void Decode(Instruction* instr) { 843 virtual void Decode(Instruction* instr) {
310 decoder_->Decode(instr); 844 decoder_->Decode(instr);
311 } 845 }
312 846
313 void ExecuteInstruction() { 847 void ExecuteInstruction() {
314 DCHECK(IsAligned(reinterpret_cast<uintptr_t>(pc_), kInstructionSize)); 848 DCHECK(IsAligned(reinterpret_cast<uintptr_t>(pc_), kInstructionSize));
315 CheckBreakNext(); 849 CheckBreakNext();
316 Decode(pc_); 850 Decode(pc_);
317 increment_pc(); 851 increment_pc();
852 LogAllWrittenRegisters();
318 CheckBreakpoints(); 853 CheckBreakpoints();
319 } 854 }
320 855
321 // Declare all Visitor functions. 856 // Declare all Visitor functions.
322 #define DECLARE(A) void Visit##A(Instruction* instr); 857 #define DECLARE(A) void Visit##A(Instruction* instr);
323 VISITOR_LIST(DECLARE) 858 VISITOR_LIST(DECLARE)
324 #undef DECLARE 859 #undef DECLARE
325 860
326 bool IsZeroRegister(unsigned code, Reg31Mode r31mode) const { 861 bool IsZeroRegister(unsigned code, Reg31Mode r31mode) const {
327 return ((code == 31) && (r31mode == Reg31IsZeroRegister)); 862 return ((code == 31) && (r31mode == Reg31IsZeroRegister));
328 } 863 }
329 864
330 // Register accessors. 865 // Register accessors.
331 // Return 'size' bits of the value of an integer register, as the specified 866 // Return 'size' bits of the value of an integer register, as the specified
332 // type. The value is zero-extended to fill the result. 867 // type. The value is zero-extended to fill the result.
333 // 868 //
334 template<typename T> 869 template<typename T>
335 T reg(unsigned code, Reg31Mode r31mode = Reg31IsZeroRegister) const { 870 T reg(unsigned code, Reg31Mode r31mode = Reg31IsZeroRegister) const {
336 DCHECK(code < kNumberOfRegisters); 871 DCHECK_LT(code, static_cast<unsigned>(kNumberOfRegisters));
337 if (IsZeroRegister(code, r31mode)) { 872 if (IsZeroRegister(code, r31mode)) {
338 return 0; 873 return 0;
339 } 874 }
340 return registers_[code].Get<T>(); 875 return registers_[code].Get<T>();
341 } 876 }
342 877
343 // Common specialized accessors for the reg() template. 878 // Common specialized accessors for the reg() template.
344 int32_t wreg(unsigned code, Reg31Mode r31mode = Reg31IsZeroRegister) const { 879 int32_t wreg(unsigned code, Reg31Mode r31mode = Reg31IsZeroRegister) const {
345 return reg<int32_t>(code, r31mode); 880 return reg<int32_t>(code, r31mode);
346 } 881 }
347 882
348 int64_t xreg(unsigned code, Reg31Mode r31mode = Reg31IsZeroRegister) const { 883 int64_t xreg(unsigned code, Reg31Mode r31mode = Reg31IsZeroRegister) const {
349 return reg<int64_t>(code, r31mode); 884 return reg<int64_t>(code, r31mode);
350 } 885 }
351 886
887 enum RegLogMode { LogRegWrites, NoRegLog };
888
352 // Write 'value' into an integer register. The value is zero-extended. This 889 // Write 'value' into an integer register. The value is zero-extended. This
353 // behaviour matches AArch64 register writes. 890 // behaviour matches AArch64 register writes.
354 template<typename T> 891 template<typename T>
355 void set_reg(unsigned code, T value, 892 void set_reg(unsigned code, T value,
356 Reg31Mode r31mode = Reg31IsZeroRegister) { 893 Reg31Mode r31mode = Reg31IsZeroRegister) {
357 set_reg_no_log(code, value, r31mode); 894 set_reg_no_log(code, value, r31mode);
358 LogRegister(code, r31mode); 895 LogRegister(code, r31mode);
359 } 896 }
360 897
361 // Common specialized accessors for the set_reg() template. 898 // Common specialized accessors for the set_reg() template.
362 void set_wreg(unsigned code, int32_t value, 899 void set_wreg(unsigned code, int32_t value,
363 Reg31Mode r31mode = Reg31IsZeroRegister) { 900 Reg31Mode r31mode = Reg31IsZeroRegister) {
364 set_reg(code, value, r31mode); 901 set_reg(code, value, r31mode);
365 } 902 }
366 903
367 void set_xreg(unsigned code, int64_t value, 904 void set_xreg(unsigned code, int64_t value,
368 Reg31Mode r31mode = Reg31IsZeroRegister) { 905 Reg31Mode r31mode = Reg31IsZeroRegister) {
369 set_reg(code, value, r31mode); 906 set_reg(code, value, r31mode);
370 } 907 }
371 908
372 // As above, but don't automatically log the register update. 909 // As above, but don't automatically log the register update.
373 template <typename T> 910 template <typename T>
374 void set_reg_no_log(unsigned code, T value, 911 void set_reg_no_log(unsigned code, T value,
375 Reg31Mode r31mode = Reg31IsZeroRegister) { 912 Reg31Mode r31mode = Reg31IsZeroRegister) {
376 DCHECK(code < kNumberOfRegisters); 913 DCHECK_LT(code, static_cast<unsigned>(kNumberOfRegisters));
377 if (!IsZeroRegister(code, r31mode)) { 914 if (!IsZeroRegister(code, r31mode)) {
378 registers_[code].Set(value); 915 registers_[code].Set(value);
379 } 916 }
380 } 917 }
381 918
382 void set_wreg_no_log(unsigned code, int32_t value, 919 void set_wreg_no_log(unsigned code, int32_t value,
383 Reg31Mode r31mode = Reg31IsZeroRegister) { 920 Reg31Mode r31mode = Reg31IsZeroRegister) {
384 set_reg_no_log(code, value, r31mode); 921 set_reg_no_log(code, value, r31mode);
385 } 922 }
386 923
387 void set_xreg_no_log(unsigned code, int64_t value, 924 void set_xreg_no_log(unsigned code, int64_t value,
388 Reg31Mode r31mode = Reg31IsZeroRegister) { 925 Reg31Mode r31mode = Reg31IsZeroRegister) {
389 set_reg_no_log(code, value, r31mode); 926 set_reg_no_log(code, value, r31mode);
390 } 927 }
391 928
392 // Commonly-used special cases. 929 // Commonly-used special cases.
393 template<typename T> 930 template<typename T>
394 void set_lr(T value) { 931 void set_lr(T value) {
395 DCHECK(sizeof(T) == kPointerSize); 932 DCHECK_EQ(sizeof(T), static_cast<unsigned>(kPointerSize));
396 set_reg(kLinkRegCode, value); 933 set_reg(kLinkRegCode, value);
397 } 934 }
398 935
399 template<typename T> 936 template<typename T>
400 void set_sp(T value) { 937 void set_sp(T value) {
401 DCHECK(sizeof(T) == kPointerSize); 938 DCHECK_EQ(sizeof(T), static_cast<unsigned>(kPointerSize));
402 set_reg(31, value, Reg31IsStackPointer); 939 set_reg(31, value, Reg31IsStackPointer);
403 } 940 }
404 941
942 // Vector register accessors.
943 // These are equivalent to the integer register accessors, but for vector
944 // registers.
945
946 // A structure for representing a 128-bit Q register.
947 struct qreg_t {
948 uint8_t val[kQRegSize];
949 };
950
951 // Basic accessor: read the register as the specified type.
952 template <typename T>
953 T vreg(unsigned code) const {
954 static_assert((sizeof(T) == kBRegSize) || (sizeof(T) == kHRegSize) ||
955 (sizeof(T) == kSRegSize) || (sizeof(T) == kDRegSize) ||
956 (sizeof(T) == kQRegSize),
957 "Template type must match size of register.");
958 DCHECK_LT(code, static_cast<unsigned>(kNumberOfVRegisters));
959
960 return vregisters_[code].Get<T>();
961 }
962
963 inline SimVRegister& vreg(unsigned code) { return vregisters_[code]; }
964
405 int64_t sp() { return xreg(31, Reg31IsStackPointer); } 965 int64_t sp() { return xreg(31, Reg31IsStackPointer); }
406 int64_t jssp() { return xreg(kJSSPCode, Reg31IsStackPointer); } 966 int64_t jssp() { return xreg(kJSSPCode, Reg31IsStackPointer); }
407 int64_t fp() { 967 int64_t fp() {
408 return xreg(kFramePointerRegCode, Reg31IsStackPointer); 968 return xreg(kFramePointerRegCode, Reg31IsStackPointer);
409 } 969 }
410 Instruction* lr() { return reg<Instruction*>(kLinkRegCode); } 970 Instruction* lr() { return reg<Instruction*>(kLinkRegCode); }
411 971
412 Address get_sp() const { return reg<Address>(31, Reg31IsStackPointer); } 972 Address get_sp() const { return reg<Address>(31, Reg31IsStackPointer); }
413 973
414 template<typename T> 974 // Common specialized accessors for the vreg() template.
415 T fpreg(unsigned code) const { 975 uint8_t breg(unsigned code) const { return vreg<uint8_t>(code); }
416 DCHECK(code < kNumberOfRegisters);
417 return fpregisters_[code].Get<T>();
418 }
419 976
420 // Common specialized accessors for the fpreg() template. 977 float hreg(unsigned code) const { return vreg<uint16_t>(code); }
421 float sreg(unsigned code) const {
422 return fpreg<float>(code);
423 }
424 978
425 uint32_t sreg_bits(unsigned code) const { 979 float sreg(unsigned code) const { return vreg<float>(code); }
426 return fpreg<uint32_t>(code);
427 }
428 980
429 double dreg(unsigned code) const { 981 uint32_t sreg_bits(unsigned code) const { return vreg<uint32_t>(code); }
430 return fpreg<double>(code);
431 }
432 982
433 uint64_t dreg_bits(unsigned code) const { 983 double dreg(unsigned code) const { return vreg<double>(code); }
434 return fpreg<uint64_t>(code);
435 }
436 984
437 double fpreg(unsigned size, unsigned code) const { 985 uint64_t dreg_bits(unsigned code) const { return vreg<uint64_t>(code); }
986
987 qreg_t qreg(unsigned code) const { return vreg<qreg_t>(code); }
988
989 // As above, with parameterized size and return type. The value is
990 // either zero-extended or truncated to fit, as required.
991 template <typename T>
992 T vreg(unsigned size, unsigned code) const {
993 uint64_t raw = 0;
994 T result;
995
438 switch (size) { 996 switch (size) {
439 case kSRegSizeInBits: return sreg(code); 997 case kSRegSize:
440 case kDRegSizeInBits: return dreg(code); 998 raw = vreg<uint32_t>(code);
999 break;
1000 case kDRegSize:
1001 raw = vreg<uint64_t>(code);
1002 break;
441 default: 1003 default:
442 UNREACHABLE(); 1004 UNREACHABLE();
443 return 0.0; 1005 break;
444 } 1006 }
1007
1008 static_assert(sizeof(result) <= sizeof(raw),
1009 "Template type must be <= 64 bits.");
1010 // Copy the result and truncate to fit. This assumes a little-endian host.
1011 memcpy(&result, &raw, sizeof(result));
1012 return result;
445 } 1013 }
446 1014
447 // Write 'value' into a floating-point register. The value is zero-extended. 1015 // Write 'value' into a floating-point register. The value is zero-extended.
448 // This behaviour matches AArch64 register writes. 1016 // This behaviour matches AArch64 register writes.
449 template<typename T> 1017 template <typename T>
450 void set_fpreg(unsigned code, T value) { 1018 void set_vreg(unsigned code, T value, RegLogMode log_mode = LogRegWrites) {
451 set_fpreg_no_log(code, value); 1019 static_assert(
1020 (sizeof(value) == kBRegSize) || (sizeof(value) == kHRegSize) ||
1021 (sizeof(value) == kSRegSize) || (sizeof(value) == kDRegSize) ||
1022 (sizeof(value) == kQRegSize),
1023 "Template type must match size of register.");
1024 DCHECK_LT(code, static_cast<unsigned>(kNumberOfVRegisters));
1025 vregisters_[code].Set(value);
452 1026
453 if (sizeof(value) <= kSRegSize) { 1027 if (log_mode == LogRegWrites) {
454 LogFPRegister(code, kPrintSRegValue); 1028 LogVRegister(code, GetPrintRegisterFormat(value));
455 } else {
456 LogFPRegister(code, kPrintDRegValue);
457 } 1029 }
458 } 1030 }
459 1031
460 // Common specialized accessors for the set_fpreg() template. 1032 // Common specialized accessors for the set_vreg() template.
461 void set_sreg(unsigned code, float value) { 1033 void set_breg(unsigned code, int8_t value,
462 set_fpreg(code, value); 1034 RegLogMode log_mode = LogRegWrites) {
1035 set_vreg(code, value, log_mode);
463 } 1036 }
464 1037
465 void set_sreg_bits(unsigned code, uint32_t value) { 1038 void set_hreg(unsigned code, int16_t value,
466 set_fpreg(code, value); 1039 RegLogMode log_mode = LogRegWrites) {
1040 set_vreg(code, value, log_mode);
467 } 1041 }
468 1042
469 void set_dreg(unsigned code, double value) { 1043 void set_sreg(unsigned code, float value,
470 set_fpreg(code, value); 1044 RegLogMode log_mode = LogRegWrites) {
1045 set_vreg(code, value, log_mode);
471 } 1046 }
472 1047
473 void set_dreg_bits(unsigned code, uint64_t value) { 1048 void set_sreg_bits(unsigned code, uint32_t value,
474 set_fpreg(code, value); 1049 RegLogMode log_mode = LogRegWrites) {
1050 set_vreg(code, value, log_mode);
1051 }
1052
1053 void set_dreg(unsigned code, double value,
1054 RegLogMode log_mode = LogRegWrites) {
1055 set_vreg(code, value, log_mode);
1056 }
1057
1058 void set_dreg_bits(unsigned code, uint64_t value,
1059 RegLogMode log_mode = LogRegWrites) {
1060 set_vreg(code, value, log_mode);
1061 }
1062
1063 void set_qreg(unsigned code, qreg_t value,
1064 RegLogMode log_mode = LogRegWrites) {
1065 set_vreg(code, value, log_mode);
475 } 1066 }
476 1067
477 // As above, but don't automatically log the register update. 1068 // As above, but don't automatically log the register update.
478 template <typename T> 1069 template <typename T>
479 void set_fpreg_no_log(unsigned code, T value) { 1070 void set_vreg_no_log(unsigned code, T value) {
480 DCHECK((sizeof(value) == kDRegSize) || (sizeof(value) == kSRegSize)); 1071 STATIC_ASSERT((sizeof(value) == kBRegSize) ||
481 DCHECK(code < kNumberOfFPRegisters); 1072 (sizeof(value) == kHRegSize) ||
482 fpregisters_[code].Set(value); 1073 (sizeof(value) == kSRegSize) ||
1074 (sizeof(value) == kDRegSize) || (sizeof(value) == kQRegSize));
1075 DCHECK_LT(code, static_cast<unsigned>(kNumberOfVRegisters));
1076 vregisters_[code].Set(value);
1077 }
1078
1079 void set_breg_no_log(unsigned code, uint8_t value) {
1080 set_vreg_no_log(code, value);
1081 }
1082
1083 void set_hreg_no_log(unsigned code, uint16_t value) {
1084 set_vreg_no_log(code, value);
483 } 1085 }
484 1086
485 void set_sreg_no_log(unsigned code, float value) { 1087 void set_sreg_no_log(unsigned code, float value) {
486 set_fpreg_no_log(code, value); 1088 set_vreg_no_log(code, value);
487 } 1089 }
488 1090
489 void set_dreg_no_log(unsigned code, double value) { 1091 void set_dreg_no_log(unsigned code, double value) {
490 set_fpreg_no_log(code, value); 1092 set_vreg_no_log(code, value);
1093 }
1094
1095 void set_qreg_no_log(unsigned code, qreg_t value) {
1096 set_vreg_no_log(code, value);
491 } 1097 }
492 1098
493 SimSystemRegister& nzcv() { return nzcv_; } 1099 SimSystemRegister& nzcv() { return nzcv_; }
494 SimSystemRegister& fpcr() { return fpcr_; } 1100 SimSystemRegister& fpcr() { return fpcr_; }
1101 FPRounding RMode() { return static_cast<FPRounding>(fpcr_.RMode()); }
1102 bool DN() { return fpcr_.DN() != 0; }
495 1103
496 // Debug helpers 1104 // Debug helpers
497 1105
498 // Simulator breakpoints. 1106 // Simulator breakpoints.
499 struct Breakpoint { 1107 struct Breakpoint {
500 Instruction* location; 1108 Instruction* location;
501 bool enabled; 1109 bool enabled;
502 }; 1110 };
503 std::vector<Breakpoint> breakpoints_; 1111 std::vector<Breakpoint> breakpoints_;
504 void SetBreakpoint(Instruction* breakpoint); 1112 void SetBreakpoint(Instruction* breakpoint);
505 void ListBreakpoints(); 1113 void ListBreakpoints();
506 void CheckBreakpoints(); 1114 void CheckBreakpoints();
507 1115
508 // Helpers for the 'next' command. 1116 // Helpers for the 'next' command.
509 // When this is set, the Simulator will insert a breakpoint after the next BL 1117 // When this is set, the Simulator will insert a breakpoint after the next BL
510 // instruction it meets. 1118 // instruction it meets.
511 bool break_on_next_; 1119 bool break_on_next_;
512 // Check if the Simulator should insert a break after the current instruction 1120 // Check if the Simulator should insert a break after the current instruction
513 // for the 'next' command. 1121 // for the 'next' command.
514 void CheckBreakNext(); 1122 void CheckBreakNext();
515 1123
516 // Disassemble instruction at the given address. 1124 // Disassemble instruction at the given address.
517 void PrintInstructionsAt(Instruction* pc, uint64_t count); 1125 void PrintInstructionsAt(Instruction* pc, uint64_t count);
518 1126
519 // Print all registers of the specified types. 1127 // Print all registers of the specified types.
520 void PrintRegisters(); 1128 void PrintRegisters();
521 void PrintFPRegisters(); 1129 void PrintVRegisters();
522 void PrintSystemRegisters(); 1130 void PrintSystemRegisters();
523 1131
524 // Like Print* (above), but respect log_parameters(). 1132 // As above, but only print the registers that have been updated.
525 void LogSystemRegisters() { 1133 void PrintWrittenRegisters();
526 if (log_parameters() & LOG_SYS_REGS) PrintSystemRegisters(); 1134 void PrintWrittenVRegisters();
1135
1136 // As above, but respect LOG_REG and LOG_VREG.
1137 void LogWrittenRegisters() {
1138 if (log_parameters() & LOG_REGS) PrintWrittenRegisters();
527 } 1139 }
528 void LogRegisters() { 1140 void LogWrittenVRegisters() {
529 if (log_parameters() & LOG_REGS) PrintRegisters(); 1141 if (log_parameters() & LOG_VREGS) PrintWrittenVRegisters();
530 } 1142 }
531 void LogFPRegisters() { 1143 void LogAllWrittenRegisters() {
532 if (log_parameters() & LOG_FP_REGS) PrintFPRegisters(); 1144 LogWrittenRegisters();
1145 LogWrittenVRegisters();
533 } 1146 }
534 1147
535 // Specify relevant register sizes, for PrintFPRegister. 1148 // Specify relevant register formats for Print(V)Register and related helpers.
536 // 1149 enum PrintRegisterFormat {
537 // These values are bit masks; they can be combined in case multiple views of 1150 // The lane size.
538 // a machine register are interesting. 1151 kPrintRegLaneSizeB = 0 << 0,
539 enum PrintFPRegisterSizes { 1152 kPrintRegLaneSizeH = 1 << 0,
540 kPrintDRegValue = 1 << kDRegSize, 1153 kPrintRegLaneSizeS = 2 << 0,
541 kPrintSRegValue = 1 << kSRegSize, 1154 kPrintRegLaneSizeW = kPrintRegLaneSizeS,
542 kPrintAllFPRegValues = kPrintDRegValue | kPrintSRegValue 1155 kPrintRegLaneSizeD = 3 << 0,
1156 kPrintRegLaneSizeX = kPrintRegLaneSizeD,
1157 kPrintRegLaneSizeQ = 4 << 0,
1158
1159 kPrintRegLaneSizeOffset = 0,
1160 kPrintRegLaneSizeMask = 7 << 0,
1161
1162 // The lane count.
1163 kPrintRegAsScalar = 0,
1164 kPrintRegAsDVector = 1 << 3,
1165 kPrintRegAsQVector = 2 << 3,
1166
1167 kPrintRegAsVectorMask = 3 << 3,
1168
1169 // Indicate floating-point format lanes. (This flag is only supported for S-
1170 // and D-sized lanes.)
1171 kPrintRegAsFP = 1 << 5,
1172
1173 // Supported combinations.
1174
1175 kPrintXReg = kPrintRegLaneSizeX | kPrintRegAsScalar,
1176 kPrintWReg = kPrintRegLaneSizeW | kPrintRegAsScalar,
1177 kPrintSReg = kPrintRegLaneSizeS | kPrintRegAsScalar | kPrintRegAsFP,
1178 kPrintDReg = kPrintRegLaneSizeD | kPrintRegAsScalar | kPrintRegAsFP,
1179
1180 kPrintReg1B = kPrintRegLaneSizeB | kPrintRegAsScalar,
1181 kPrintReg8B = kPrintRegLaneSizeB | kPrintRegAsDVector,
1182 kPrintReg16B = kPrintRegLaneSizeB | kPrintRegAsQVector,
1183 kPrintReg1H = kPrintRegLaneSizeH | kPrintRegAsScalar,
1184 kPrintReg4H = kPrintRegLaneSizeH | kPrintRegAsDVector,
1185 kPrintReg8H = kPrintRegLaneSizeH | kPrintRegAsQVector,
1186 kPrintReg1S = kPrintRegLaneSizeS | kPrintRegAsScalar,
1187 kPrintReg2S = kPrintRegLaneSizeS | kPrintRegAsDVector,
1188 kPrintReg4S = kPrintRegLaneSizeS | kPrintRegAsQVector,
1189 kPrintReg1SFP = kPrintRegLaneSizeS | kPrintRegAsScalar | kPrintRegAsFP,
1190 kPrintReg2SFP = kPrintRegLaneSizeS | kPrintRegAsDVector | kPrintRegAsFP,
1191 kPrintReg4SFP = kPrintRegLaneSizeS | kPrintRegAsQVector | kPrintRegAsFP,
1192 kPrintReg1D = kPrintRegLaneSizeD | kPrintRegAsScalar,
1193 kPrintReg2D = kPrintRegLaneSizeD | kPrintRegAsQVector,
1194 kPrintReg1DFP = kPrintRegLaneSizeD | kPrintRegAsScalar | kPrintRegAsFP,
1195 kPrintReg2DFP = kPrintRegLaneSizeD | kPrintRegAsQVector | kPrintRegAsFP,
1196 kPrintReg1Q = kPrintRegLaneSizeQ | kPrintRegAsScalar
543 }; 1197 };
544 1198
1199 unsigned GetPrintRegLaneSizeInBytesLog2(PrintRegisterFormat format) {
1200 return (format & kPrintRegLaneSizeMask) >> kPrintRegLaneSizeOffset;
1201 }
1202
1203 unsigned GetPrintRegLaneSizeInBytes(PrintRegisterFormat format) {
1204 return 1 << GetPrintRegLaneSizeInBytesLog2(format);
1205 }
1206
1207 unsigned GetPrintRegSizeInBytesLog2(PrintRegisterFormat format) {
1208 if (format & kPrintRegAsDVector) return kDRegSizeLog2;
1209 if (format & kPrintRegAsQVector) return kQRegSizeLog2;
1210
1211 // Scalar types.
1212 return GetPrintRegLaneSizeInBytesLog2(format);
1213 }
1214
1215 unsigned GetPrintRegSizeInBytes(PrintRegisterFormat format) {
1216 return 1 << GetPrintRegSizeInBytesLog2(format);
1217 }
1218
1219 unsigned GetPrintRegLaneCount(PrintRegisterFormat format) {
1220 unsigned reg_size_log2 = GetPrintRegSizeInBytesLog2(format);
1221 unsigned lane_size_log2 = GetPrintRegLaneSizeInBytesLog2(format);
1222 DCHECK_GE(reg_size_log2, lane_size_log2);
1223 return 1 << (reg_size_log2 - lane_size_log2);
1224 }
1225
1226 template <typename T>
1227 PrintRegisterFormat GetPrintRegisterFormat(T value) {
1228 return GetPrintRegisterFormatForSize(sizeof(value));
1229 }
1230
1231 PrintRegisterFormat GetPrintRegisterFormat(double value) {
1232 static_assert(sizeof(value) == kDRegSize,
1233 "D register must be size of double.");
1234 return GetPrintRegisterFormatForSizeFP(sizeof(value));
1235 }
1236
1237 PrintRegisterFormat GetPrintRegisterFormat(float value) {
1238 static_assert(sizeof(value) == kSRegSize,
1239 "S register must be size of float.");
1240 return GetPrintRegisterFormatForSizeFP(sizeof(value));
1241 }
1242
1243 PrintRegisterFormat GetPrintRegisterFormat(VectorFormat vform);
1244 PrintRegisterFormat GetPrintRegisterFormatFP(VectorFormat vform);
1245
1246 PrintRegisterFormat GetPrintRegisterFormatForSize(size_t reg_size,
1247 size_t lane_size);
1248
1249 PrintRegisterFormat GetPrintRegisterFormatForSize(size_t size) {
1250 return GetPrintRegisterFormatForSize(size, size);
1251 }
1252
1253 PrintRegisterFormat GetPrintRegisterFormatForSizeFP(size_t size) {
1254 switch (size) {
1255 default:
1256 UNREACHABLE();
1257 case kDRegSize:
1258 return kPrintDReg;
1259 case kSRegSize:
1260 return kPrintSReg;
1261 }
1262 }
1263
1264 PrintRegisterFormat GetPrintRegisterFormatTryFP(PrintRegisterFormat format) {
1265 if ((GetPrintRegLaneSizeInBytes(format) == kSRegSize) ||
1266 (GetPrintRegLaneSizeInBytes(format) == kDRegSize)) {
1267 return static_cast<PrintRegisterFormat>(format | kPrintRegAsFP);
1268 }
1269 return format;
1270 }
1271
545 // Print individual register values (after update). 1272 // Print individual register values (after update).
546 void PrintRegister(unsigned code, Reg31Mode r31mode = Reg31IsStackPointer); 1273 void PrintRegister(unsigned code, Reg31Mode r31mode = Reg31IsStackPointer);
547 void PrintFPRegister(unsigned code, 1274 void PrintVRegister(unsigned code, PrintRegisterFormat sizes);
548 PrintFPRegisterSizes sizes = kPrintAllFPRegValues);
549 void PrintSystemRegister(SystemRegister id); 1275 void PrintSystemRegister(SystemRegister id);
550 1276
551 // Like Print* (above), but respect log_parameters(). 1277 // Like Print* (above), but respect log_parameters().
552 void LogRegister(unsigned code, Reg31Mode r31mode = Reg31IsStackPointer) { 1278 void LogRegister(unsigned code, Reg31Mode r31mode = Reg31IsStackPointer) {
553 if (log_parameters() & LOG_REGS) PrintRegister(code, r31mode); 1279 if (log_parameters() & LOG_REGS) PrintRegister(code, r31mode);
554 } 1280 }
555 void LogFPRegister(unsigned code, 1281 void LogVRegister(unsigned code, PrintRegisterFormat format) {
556 PrintFPRegisterSizes sizes = kPrintAllFPRegValues) { 1282 if (log_parameters() & LOG_VREGS) PrintVRegister(code, format);
557 if (log_parameters() & LOG_FP_REGS) PrintFPRegister(code, sizes);
558 } 1283 }
559 void LogSystemRegister(SystemRegister id) { 1284 void LogSystemRegister(SystemRegister id) {
560 if (log_parameters() & LOG_SYS_REGS) PrintSystemRegister(id); 1285 if (log_parameters() & LOG_SYS_REGS) PrintSystemRegister(id);
561 } 1286 }
562 1287
563 // Print memory accesses. 1288 // Print memory accesses.
564 void PrintRead(uintptr_t address, size_t size, unsigned reg_code); 1289 void PrintRead(uintptr_t address, unsigned reg_code,
565 void PrintReadFP(uintptr_t address, size_t size, unsigned reg_code); 1290 PrintRegisterFormat format);
566 void PrintWrite(uintptr_t address, size_t size, unsigned reg_code); 1291 void PrintWrite(uintptr_t address, unsigned reg_code,
567 void PrintWriteFP(uintptr_t address, size_t size, unsigned reg_code); 1292 PrintRegisterFormat format);
1293 void PrintVRead(uintptr_t address, unsigned reg_code,
1294 PrintRegisterFormat format, unsigned lane);
1295 void PrintVWrite(uintptr_t address, unsigned reg_code,
1296 PrintRegisterFormat format, unsigned lane);
568 1297
569 // Like Print* (above), but respect log_parameters(). 1298 // Like Print* (above), but respect log_parameters().
570 void LogRead(uintptr_t address, size_t size, unsigned reg_code) { 1299 void LogRead(uintptr_t address, unsigned reg_code,
571 if (log_parameters() & LOG_REGS) PrintRead(address, size, reg_code); 1300 PrintRegisterFormat format) {
1301 if (log_parameters() & LOG_REGS) PrintRead(address, reg_code, format);
572 } 1302 }
573 void LogReadFP(uintptr_t address, size_t size, unsigned reg_code) { 1303 void LogWrite(uintptr_t address, unsigned reg_code,
574 if (log_parameters() & LOG_FP_REGS) PrintReadFP(address, size, reg_code); 1304 PrintRegisterFormat format) {
1305 if (log_parameters() & LOG_WRITE) PrintWrite(address, reg_code, format);
575 } 1306 }
576 void LogWrite(uintptr_t address, size_t size, unsigned reg_code) { 1307 void LogVRead(uintptr_t address, unsigned reg_code,
577 if (log_parameters() & LOG_WRITE) PrintWrite(address, size, reg_code); 1308 PrintRegisterFormat format, unsigned lane = 0) {
1309 if (log_parameters() & LOG_VREGS) {
1310 PrintVRead(address, reg_code, format, lane);
1311 }
578 } 1312 }
579 void LogWriteFP(uintptr_t address, size_t size, unsigned reg_code) { 1313 void LogVWrite(uintptr_t address, unsigned reg_code,
580 if (log_parameters() & LOG_WRITE) PrintWriteFP(address, size, reg_code); 1314 PrintRegisterFormat format, unsigned lane = 0) {
1315 if (log_parameters() & LOG_WRITE) {
1316 PrintVWrite(address, reg_code, format, lane);
1317 }
581 } 1318 }
582 1319
583 int log_parameters() { return log_parameters_; } 1320 int log_parameters() { return log_parameters_; }
584 void set_log_parameters(int new_parameters) { 1321 void set_log_parameters(int new_parameters) {
585 log_parameters_ = new_parameters; 1322 log_parameters_ = new_parameters;
586 if (!decoder_) { 1323 if (!decoder_) {
587 if (new_parameters & LOG_DISASM) { 1324 if (new_parameters & LOG_DISASM) {
588 PrintF("Run --debug-sim to dynamically turn on disassembler\n"); 1325 PrintF("Run --debug-sim to dynamically turn on disassembler\n");
589 } 1326 }
590 return; 1327 return;
591 } 1328 }
592 if (new_parameters & LOG_DISASM) { 1329 if (new_parameters & LOG_DISASM) {
593 decoder_->InsertVisitorBefore(print_disasm_, this); 1330 decoder_->InsertVisitorBefore(print_disasm_, this);
594 } else { 1331 } else {
595 decoder_->RemoveVisitor(print_disasm_); 1332 decoder_->RemoveVisitor(print_disasm_);
596 } 1333 }
597 } 1334 }
598 1335
1336 // Helper functions for register tracing.
1337 void PrintRegisterRawHelper(unsigned code, Reg31Mode r31mode,
1338 int size_in_bytes = kXRegSize);
1339 void PrintVRegisterRawHelper(unsigned code, int bytes = kQRegSize,
1340 int lsb = 0);
1341 void PrintVRegisterFPHelper(unsigned code, unsigned lane_size_in_bytes,
1342 int lane_count = 1, int rightmost_lane = 0);
1343
599 static inline const char* WRegNameForCode(unsigned code, 1344 static inline const char* WRegNameForCode(unsigned code,
600 Reg31Mode mode = Reg31IsZeroRegister); 1345 Reg31Mode mode = Reg31IsZeroRegister);
601 static inline const char* XRegNameForCode(unsigned code, 1346 static inline const char* XRegNameForCode(unsigned code,
602 Reg31Mode mode = Reg31IsZeroRegister); 1347 Reg31Mode mode = Reg31IsZeroRegister);
603 static inline const char* SRegNameForCode(unsigned code); 1348 static inline const char* SRegNameForCode(unsigned code);
604 static inline const char* DRegNameForCode(unsigned code); 1349 static inline const char* DRegNameForCode(unsigned code);
605 static inline const char* VRegNameForCode(unsigned code); 1350 static inline const char* VRegNameForCode(unsigned code);
606 static inline int CodeFromName(const char* name); 1351 static inline int CodeFromName(const char* name);
607 1352
608 protected: 1353 protected:
(...skipping 54 matching lines...) Expand 10 before | Expand all | Expand 10 after
663 void ConditionalCompareHelper(Instruction* instr, T op2); 1408 void ConditionalCompareHelper(Instruction* instr, T op2);
664 void LoadStoreHelper(Instruction* instr, 1409 void LoadStoreHelper(Instruction* instr,
665 int64_t offset, 1410 int64_t offset,
666 AddrMode addrmode); 1411 AddrMode addrmode);
667 void LoadStorePairHelper(Instruction* instr, AddrMode addrmode); 1412 void LoadStorePairHelper(Instruction* instr, AddrMode addrmode);
668 uintptr_t LoadStoreAddress(unsigned addr_reg, int64_t offset, 1413 uintptr_t LoadStoreAddress(unsigned addr_reg, int64_t offset,
669 AddrMode addrmode); 1414 AddrMode addrmode);
670 void LoadStoreWriteBack(unsigned addr_reg, 1415 void LoadStoreWriteBack(unsigned addr_reg,
671 int64_t offset, 1416 int64_t offset,
672 AddrMode addrmode); 1417 AddrMode addrmode);
1418 void NEONLoadStoreMultiStructHelper(const Instruction* instr,
1419 AddrMode addr_mode);
1420 void NEONLoadStoreSingleStructHelper(const Instruction* instr,
1421 AddrMode addr_mode);
673 void CheckMemoryAccess(uintptr_t address, uintptr_t stack); 1422 void CheckMemoryAccess(uintptr_t address, uintptr_t stack);
674 1423
675 // Memory read helpers. 1424 // Memory read helpers.
676 template <typename T, typename A> 1425 template <typename T, typename A>
677 T MemoryRead(A address) { 1426 T MemoryRead(A address) {
678 T value; 1427 T value;
679 STATIC_ASSERT((sizeof(value) == 1) || (sizeof(value) == 2) || 1428 STATIC_ASSERT((sizeof(value) == 1) || (sizeof(value) == 2) ||
680 (sizeof(value) == 4) || (sizeof(value) == 8)); 1429 (sizeof(value) == 4) || (sizeof(value) == 8) ||
1430 (sizeof(value) == 16));
681 memcpy(&value, reinterpret_cast<const void*>(address), sizeof(value)); 1431 memcpy(&value, reinterpret_cast<const void*>(address), sizeof(value));
682 return value; 1432 return value;
683 } 1433 }
684 1434
685 // Memory write helpers. 1435 // Memory write helpers.
686 template <typename T, typename A> 1436 template <typename T, typename A>
687 void MemoryWrite(A address, T value) { 1437 void MemoryWrite(A address, T value) {
688 STATIC_ASSERT((sizeof(value) == 1) || (sizeof(value) == 2) || 1438 STATIC_ASSERT((sizeof(value) == 1) || (sizeof(value) == 2) ||
689 (sizeof(value) == 4) || (sizeof(value) == 8)); 1439 (sizeof(value) == 4) || (sizeof(value) == 8) ||
1440 (sizeof(value) == 16));
690 memcpy(reinterpret_cast<void*>(address), &value, sizeof(value)); 1441 memcpy(reinterpret_cast<void*>(address), &value, sizeof(value));
691 } 1442 }
692 1443
693 template <typename T> 1444 template <typename T>
694 T ShiftOperand(T value, 1445 T ShiftOperand(T value,
695 Shift shift_type, 1446 Shift shift_type,
696 unsigned amount); 1447 unsigned amount);
697 template <typename T> 1448 template <typename T>
698 T ExtendValue(T value, 1449 T ExtendValue(T value,
699 Extend extend_type, 1450 Extend extend_type,
700 unsigned left_shift = 0); 1451 unsigned left_shift = 0);
701 template <typename T> 1452 template <typename T>
702 void Extract(Instruction* instr); 1453 void Extract(Instruction* instr);
703 template <typename T> 1454 template <typename T>
704 void DataProcessing2Source(Instruction* instr); 1455 void DataProcessing2Source(Instruction* instr);
705 template <typename T> 1456 template <typename T>
706 void BitfieldHelper(Instruction* instr); 1457 void BitfieldHelper(Instruction* instr);
707 1458 uint16_t PolynomialMult(uint8_t op1, uint8_t op2);
708 template <typename T> 1459
709 T FPDefaultNaN() const; 1460 void ld1(VectorFormat vform, LogicVRegister dst, uint64_t addr);
1461 void ld1(VectorFormat vform, LogicVRegister dst, int index, uint64_t addr);
1462 void ld1r(VectorFormat vform, LogicVRegister dst, uint64_t addr);
1463 void ld2(VectorFormat vform, LogicVRegister dst1, LogicVRegister dst2,
1464 uint64_t addr);
1465 void ld2(VectorFormat vform, LogicVRegister dst1, LogicVRegister dst2,
1466 int index, uint64_t addr);
1467 void ld2r(VectorFormat vform, LogicVRegister dst1, LogicVRegister dst2,
1468 uint64_t addr);
1469 void ld3(VectorFormat vform, LogicVRegister dst1, LogicVRegister dst2,
1470 LogicVRegister dst3, uint64_t addr);
1471 void ld3(VectorFormat vform, LogicVRegister dst1, LogicVRegister dst2,
1472 LogicVRegister dst3, int index, uint64_t addr);
1473 void ld3r(VectorFormat vform, LogicVRegister dst1, LogicVRegister dst2,
1474 LogicVRegister dst3, uint64_t addr);
1475 void ld4(VectorFormat vform, LogicVRegister dst1, LogicVRegister dst2,
1476 LogicVRegister dst3, LogicVRegister dst4, uint64_t addr);
1477 void ld4(VectorFormat vform, LogicVRegister dst1, LogicVRegister dst2,
1478 LogicVRegister dst3, LogicVRegister dst4, int index, uint64_t addr);
1479 void ld4r(VectorFormat vform, LogicVRegister dst1, LogicVRegister dst2,
1480 LogicVRegister dst3, LogicVRegister dst4, uint64_t addr);
1481 void st1(VectorFormat vform, LogicVRegister src, uint64_t addr);
1482 void st1(VectorFormat vform, LogicVRegister src, int index, uint64_t addr);
1483 void st2(VectorFormat vform, LogicVRegister src, LogicVRegister src2,
1484 uint64_t addr);
1485 void st2(VectorFormat vform, LogicVRegister src, LogicVRegister src2,
1486 int index, uint64_t addr);
1487 void st3(VectorFormat vform, LogicVRegister src, LogicVRegister src2,
1488 LogicVRegister src3, uint64_t addr);
1489 void st3(VectorFormat vform, LogicVRegister src, LogicVRegister src2,
1490 LogicVRegister src3, int index, uint64_t addr);
1491 void st4(VectorFormat vform, LogicVRegister src, LogicVRegister src2,
1492 LogicVRegister src3, LogicVRegister src4, uint64_t addr);
1493 void st4(VectorFormat vform, LogicVRegister src, LogicVRegister src2,
1494 LogicVRegister src3, LogicVRegister src4, int index, uint64_t addr);
1495 LogicVRegister cmp(VectorFormat vform, LogicVRegister dst,
1496 const LogicVRegister& src1, const LogicVRegister& src2,
1497 Condition cond);
1498 LogicVRegister cmp(VectorFormat vform, LogicVRegister dst,
1499 const LogicVRegister& src1, int imm, Condition cond);
1500 LogicVRegister cmptst(VectorFormat vform, LogicVRegister dst,
1501 const LogicVRegister& src1, const LogicVRegister& src2);
1502 LogicVRegister add(VectorFormat vform, LogicVRegister dst,
1503 const LogicVRegister& src1, const LogicVRegister& src2);
1504 LogicVRegister addp(VectorFormat vform, LogicVRegister dst,
1505 const LogicVRegister& src1, const LogicVRegister& src2);
1506 LogicVRegister mla(VectorFormat vform, LogicVRegister dst,
1507 const LogicVRegister& src1, const LogicVRegister& src2);
1508 LogicVRegister mls(VectorFormat vform, LogicVRegister dst,
1509 const LogicVRegister& src1, const LogicVRegister& src2);
1510 LogicVRegister mul(VectorFormat vform, LogicVRegister dst,
1511 const LogicVRegister& src1, const LogicVRegister& src2);
1512 LogicVRegister mul(VectorFormat vform, LogicVRegister dst,
1513 const LogicVRegister& src1, const LogicVRegister& src2,
1514 int index);
1515 LogicVRegister mla(VectorFormat vform, LogicVRegister dst,
1516 const LogicVRegister& src1, const LogicVRegister& src2,
1517 int index);
1518 LogicVRegister mls(VectorFormat vform, LogicVRegister dst,
1519 const LogicVRegister& src1, const LogicVRegister& src2,
1520 int index);
1521 LogicVRegister pmul(VectorFormat vform, LogicVRegister dst,
1522 const LogicVRegister& src1, const LogicVRegister& src2);
1523
1524 typedef LogicVRegister (Simulator::*ByElementOp)(VectorFormat vform,
1525 LogicVRegister dst,
1526 const LogicVRegister& src1,
1527 const LogicVRegister& src2,
1528 int index);
1529 LogicVRegister fmul(VectorFormat vform, LogicVRegister dst,
1530 const LogicVRegister& src1, const LogicVRegister& src2,
1531 int index);
1532 LogicVRegister fmla(VectorFormat vform, LogicVRegister dst,
1533 const LogicVRegister& src1, const LogicVRegister& src2,
1534 int index);
1535 LogicVRegister fmls(VectorFormat vform, LogicVRegister dst,
1536 const LogicVRegister& src1, const LogicVRegister& src2,
1537 int index);
1538 LogicVRegister fmulx(VectorFormat vform, LogicVRegister dst,
1539 const LogicVRegister& src1, const LogicVRegister& src2,
1540 int index);
1541 LogicVRegister smull(VectorFormat vform, LogicVRegister dst,
1542 const LogicVRegister& src1, const LogicVRegister& src2,
1543 int index);
1544 LogicVRegister smull2(VectorFormat vform, LogicVRegister dst,
1545 const LogicVRegister& src1, const LogicVRegister& src2,
1546 int index);
1547 LogicVRegister umull(VectorFormat vform, LogicVRegister dst,
1548 const LogicVRegister& src1, const LogicVRegister& src2,
1549 int index);
1550 LogicVRegister umull2(VectorFormat vform, LogicVRegister dst,
1551 const LogicVRegister& src1, const LogicVRegister& src2,
1552 int index);
1553 LogicVRegister smlal(VectorFormat vform, LogicVRegister dst,
1554 const LogicVRegister& src1, const LogicVRegister& src2,
1555 int index);
1556 LogicVRegister smlal2(VectorFormat vform, LogicVRegister dst,
1557 const LogicVRegister& src1, const LogicVRegister& src2,
1558 int index);
1559 LogicVRegister umlal(VectorFormat vform, LogicVRegister dst,
1560 const LogicVRegister& src1, const LogicVRegister& src2,
1561 int index);
1562 LogicVRegister umlal2(VectorFormat vform, LogicVRegister dst,
1563 const LogicVRegister& src1, const LogicVRegister& src2,
1564 int index);
1565 LogicVRegister smlsl(VectorFormat vform, LogicVRegister dst,
1566 const LogicVRegister& src1, const LogicVRegister& src2,
1567 int index);
1568 LogicVRegister smlsl2(VectorFormat vform, LogicVRegister dst,
1569 const LogicVRegister& src1, const LogicVRegister& src2,
1570 int index);
1571 LogicVRegister umlsl(VectorFormat vform, LogicVRegister dst,
1572 const LogicVRegister& src1, const LogicVRegister& src2,
1573 int index);
1574 LogicVRegister umlsl2(VectorFormat vform, LogicVRegister dst,
1575 const LogicVRegister& src1, const LogicVRegister& src2,
1576 int index);
1577 LogicVRegister sqdmull(VectorFormat vform, LogicVRegister dst,
1578 const LogicVRegister& src1, const LogicVRegister& src2,
1579 int index);
1580 LogicVRegister sqdmull2(VectorFormat vform, LogicVRegister dst,
1581 const LogicVRegister& src1,
1582 const LogicVRegister& src2, int index);
1583 LogicVRegister sqdmlal(VectorFormat vform, LogicVRegister dst,
1584 const LogicVRegister& src1, const LogicVRegister& src2,
1585 int index);
1586 LogicVRegister sqdmlal2(VectorFormat vform, LogicVRegister dst,
1587 const LogicVRegister& src1,
1588 const LogicVRegister& src2, int index);
1589 LogicVRegister sqdmlsl(VectorFormat vform, LogicVRegister dst,
1590 const LogicVRegister& src1, const LogicVRegister& src2,
1591 int index);
1592 LogicVRegister sqdmlsl2(VectorFormat vform, LogicVRegister dst,
1593 const LogicVRegister& src1,
1594 const LogicVRegister& src2, int index);
1595 LogicVRegister sqdmulh(VectorFormat vform, LogicVRegister dst,
1596 const LogicVRegister& src1, const LogicVRegister& src2,
1597 int index);
1598 LogicVRegister sqrdmulh(VectorFormat vform, LogicVRegister dst,
1599 const LogicVRegister& src1,
1600 const LogicVRegister& src2, int index);
1601 LogicVRegister sub(VectorFormat vform, LogicVRegister dst,
1602 const LogicVRegister& src1, const LogicVRegister& src2);
1603 LogicVRegister and_(VectorFormat vform, LogicVRegister dst,
1604 const LogicVRegister& src1, const LogicVRegister& src2);
1605 LogicVRegister orr(VectorFormat vform, LogicVRegister dst,
1606 const LogicVRegister& src1, const LogicVRegister& src2);
1607 LogicVRegister orn(VectorFormat vform, LogicVRegister dst,
1608 const LogicVRegister& src1, const LogicVRegister& src2);
1609 LogicVRegister eor(VectorFormat vform, LogicVRegister dst,
1610 const LogicVRegister& src1, const LogicVRegister& src2);
1611 LogicVRegister bic(VectorFormat vform, LogicVRegister dst,
1612 const LogicVRegister& src1, const LogicVRegister& src2);
1613 LogicVRegister bic(VectorFormat vform, LogicVRegister dst,
1614 const LogicVRegister& src, uint64_t imm);
1615 LogicVRegister bif(VectorFormat vform, LogicVRegister dst,
1616 const LogicVRegister& src1, const LogicVRegister& src2);
1617 LogicVRegister bit(VectorFormat vform, LogicVRegister dst,
1618 const LogicVRegister& src1, const LogicVRegister& src2);
1619 LogicVRegister bsl(VectorFormat vform, LogicVRegister dst,
1620 const LogicVRegister& src1, const LogicVRegister& src2);
1621 LogicVRegister cls(VectorFormat vform, LogicVRegister dst,
1622 const LogicVRegister& src);
1623 LogicVRegister clz(VectorFormat vform, LogicVRegister dst,
1624 const LogicVRegister& src);
1625 LogicVRegister cnt(VectorFormat vform, LogicVRegister dst,
1626 const LogicVRegister& src);
1627 LogicVRegister not_(VectorFormat vform, LogicVRegister dst,
1628 const LogicVRegister& src);
1629 LogicVRegister rbit(VectorFormat vform, LogicVRegister dst,
1630 const LogicVRegister& src);
1631 LogicVRegister rev(VectorFormat vform, LogicVRegister dst,
1632 const LogicVRegister& src, int revSize);
1633 LogicVRegister rev16(VectorFormat vform, LogicVRegister dst,
1634 const LogicVRegister& src);
1635 LogicVRegister rev32(VectorFormat vform, LogicVRegister dst,
1636 const LogicVRegister& src);
1637 LogicVRegister rev64(VectorFormat vform, LogicVRegister dst,
1638 const LogicVRegister& src);
1639 LogicVRegister addlp(VectorFormat vform, LogicVRegister dst,
1640 const LogicVRegister& src, bool is_signed,
1641 bool do_accumulate);
1642 LogicVRegister saddlp(VectorFormat vform, LogicVRegister dst,
1643 const LogicVRegister& src);
1644 LogicVRegister uaddlp(VectorFormat vform, LogicVRegister dst,
1645 const LogicVRegister& src);
1646 LogicVRegister sadalp(VectorFormat vform, LogicVRegister dst,
1647 const LogicVRegister& src);
1648 LogicVRegister uadalp(VectorFormat vform, LogicVRegister dst,
1649 const LogicVRegister& src);
1650 LogicVRegister ext(VectorFormat vform, LogicVRegister dst,
1651 const LogicVRegister& src1, const LogicVRegister& src2,
1652 int index);
1653 LogicVRegister ins_element(VectorFormat vform, LogicVRegister dst,
1654 int dst_index, const LogicVRegister& src,
1655 int src_index);
1656 LogicVRegister ins_immediate(VectorFormat vform, LogicVRegister dst,
1657 int dst_index, uint64_t imm);
1658 LogicVRegister dup_element(VectorFormat vform, LogicVRegister dst,
1659 const LogicVRegister& src, int src_index);
1660 LogicVRegister dup_immediate(VectorFormat vform, LogicVRegister dst,
1661 uint64_t imm);
1662 LogicVRegister movi(VectorFormat vform, LogicVRegister dst, uint64_t imm);
1663 LogicVRegister mvni(VectorFormat vform, LogicVRegister dst, uint64_t imm);
1664 LogicVRegister orr(VectorFormat vform, LogicVRegister dst,
1665 const LogicVRegister& src, uint64_t imm);
1666 LogicVRegister sshl(VectorFormat vform, LogicVRegister dst,
1667 const LogicVRegister& src1, const LogicVRegister& src2);
1668 LogicVRegister ushl(VectorFormat vform, LogicVRegister dst,
1669 const LogicVRegister& src1, const LogicVRegister& src2);
1670 LogicVRegister SMinMax(VectorFormat vform, LogicVRegister dst,
1671 const LogicVRegister& src1, const LogicVRegister& src2,
1672 bool max);
1673 LogicVRegister smax(VectorFormat vform, LogicVRegister dst,
1674 const LogicVRegister& src1, const LogicVRegister& src2);
1675 LogicVRegister smin(VectorFormat vform, LogicVRegister dst,
1676 const LogicVRegister& src1, const LogicVRegister& src2);
1677 LogicVRegister SMinMaxP(VectorFormat vform, LogicVRegister dst,
1678 const LogicVRegister& src1,
1679 const LogicVRegister& src2, bool max);
1680 LogicVRegister smaxp(VectorFormat vform, LogicVRegister dst,
1681 const LogicVRegister& src1, const LogicVRegister& src2);
1682 LogicVRegister sminp(VectorFormat vform, LogicVRegister dst,
1683 const LogicVRegister& src1, const LogicVRegister& src2);
1684 LogicVRegister addp(VectorFormat vform, LogicVRegister dst,
1685 const LogicVRegister& src);
1686 LogicVRegister addv(VectorFormat vform, LogicVRegister dst,
1687 const LogicVRegister& src);
1688 LogicVRegister uaddlv(VectorFormat vform, LogicVRegister dst,
1689 const LogicVRegister& src);
1690 LogicVRegister saddlv(VectorFormat vform, LogicVRegister dst,
1691 const LogicVRegister& src);
1692 LogicVRegister SMinMaxV(VectorFormat vform, LogicVRegister dst,
1693 const LogicVRegister& src, bool max);
1694 LogicVRegister smaxv(VectorFormat vform, LogicVRegister dst,
1695 const LogicVRegister& src);
1696 LogicVRegister sminv(VectorFormat vform, LogicVRegister dst,
1697 const LogicVRegister& src);
1698 LogicVRegister uxtl(VectorFormat vform, LogicVRegister dst,
1699 const LogicVRegister& src);
1700 LogicVRegister uxtl2(VectorFormat vform, LogicVRegister dst,
1701 const LogicVRegister& src);
1702 LogicVRegister sxtl(VectorFormat vform, LogicVRegister dst,
1703 const LogicVRegister& src);
1704 LogicVRegister sxtl2(VectorFormat vform, LogicVRegister dst,
1705 const LogicVRegister& src);
1706 LogicVRegister Table(VectorFormat vform, LogicVRegister dst,
1707 const LogicVRegister& ind, bool zero_out_of_bounds,
1708 const LogicVRegister* tab1,
1709 const LogicVRegister* tab2 = NULL,
1710 const LogicVRegister* tab3 = NULL,
1711 const LogicVRegister* tab4 = NULL);
1712 LogicVRegister tbl(VectorFormat vform, LogicVRegister dst,
1713 const LogicVRegister& tab, const LogicVRegister& ind);
1714 LogicVRegister tbl(VectorFormat vform, LogicVRegister dst,
1715 const LogicVRegister& tab, const LogicVRegister& tab2,
1716 const LogicVRegister& ind);
1717 LogicVRegister tbl(VectorFormat vform, LogicVRegister dst,
1718 const LogicVRegister& tab, const LogicVRegister& tab2,
1719 const LogicVRegister& tab3, const LogicVRegister& ind);
1720 LogicVRegister tbl(VectorFormat vform, LogicVRegister dst,
1721 const LogicVRegister& tab, const LogicVRegister& tab2,
1722 const LogicVRegister& tab3, const LogicVRegister& tab4,
1723 const LogicVRegister& ind);
1724 LogicVRegister tbx(VectorFormat vform, LogicVRegister dst,
1725 const LogicVRegister& tab, const LogicVRegister& ind);
1726 LogicVRegister tbx(VectorFormat vform, LogicVRegister dst,
1727 const LogicVRegister& tab, const LogicVRegister& tab2,
1728 const LogicVRegister& ind);
1729 LogicVRegister tbx(VectorFormat vform, LogicVRegister dst,
1730 const LogicVRegister& tab, const LogicVRegister& tab2,
1731 const LogicVRegister& tab3, const LogicVRegister& ind);
1732 LogicVRegister tbx(VectorFormat vform, LogicVRegister dst,
1733 const LogicVRegister& tab, const LogicVRegister& tab2,
1734 const LogicVRegister& tab3, const LogicVRegister& tab4,
1735 const LogicVRegister& ind);
1736 LogicVRegister uaddl(VectorFormat vform, LogicVRegister dst,
1737 const LogicVRegister& src1, const LogicVRegister& src2);
1738 LogicVRegister uaddl2(VectorFormat vform, LogicVRegister dst,
1739 const LogicVRegister& src1, const LogicVRegister& src2);
1740 LogicVRegister uaddw(VectorFormat vform, LogicVRegister dst,
1741 const LogicVRegister& src1, const LogicVRegister& src2);
1742 LogicVRegister uaddw2(VectorFormat vform, LogicVRegister dst,
1743 const LogicVRegister& src1, const LogicVRegister& src2);
1744 LogicVRegister saddl(VectorFormat vform, LogicVRegister dst,
1745 const LogicVRegister& src1, const LogicVRegister& src2);
1746 LogicVRegister saddl2(VectorFormat vform, LogicVRegister dst,
1747 const LogicVRegister& src1, const LogicVRegister& src2);
1748 LogicVRegister saddw(VectorFormat vform, LogicVRegister dst,
1749 const LogicVRegister& src1, const LogicVRegister& src2);
1750 LogicVRegister saddw2(VectorFormat vform, LogicVRegister dst,
1751 const LogicVRegister& src1, const LogicVRegister& src2);
1752 LogicVRegister usubl(VectorFormat vform, LogicVRegister dst,
1753 const LogicVRegister& src1, const LogicVRegister& src2);
1754 LogicVRegister usubl2(VectorFormat vform, LogicVRegister dst,
1755 const LogicVRegister& src1, const LogicVRegister& src2);
1756 LogicVRegister usubw(VectorFormat vform, LogicVRegister dst,
1757 const LogicVRegister& src1, const LogicVRegister& src2);
1758 LogicVRegister usubw2(VectorFormat vform, LogicVRegister dst,
1759 const LogicVRegister& src1, const LogicVRegister& src2);
1760 LogicVRegister ssubl(VectorFormat vform, LogicVRegister dst,
1761 const LogicVRegister& src1, const LogicVRegister& src2);
1762 LogicVRegister ssubl2(VectorFormat vform, LogicVRegister dst,
1763 const LogicVRegister& src1, const LogicVRegister& src2);
1764 LogicVRegister ssubw(VectorFormat vform, LogicVRegister dst,
1765 const LogicVRegister& src1, const LogicVRegister& src2);
1766 LogicVRegister ssubw2(VectorFormat vform, LogicVRegister dst,
1767 const LogicVRegister& src1, const LogicVRegister& src2);
1768 LogicVRegister UMinMax(VectorFormat vform, LogicVRegister dst,
1769 const LogicVRegister& src1, const LogicVRegister& src2,
1770 bool max);
1771 LogicVRegister umax(VectorFormat vform, LogicVRegister dst,
1772 const LogicVRegister& src1, const LogicVRegister& src2);
1773 LogicVRegister umin(VectorFormat vform, LogicVRegister dst,
1774 const LogicVRegister& src1, const LogicVRegister& src2);
1775 LogicVRegister UMinMaxP(VectorFormat vform, LogicVRegister dst,
1776 const LogicVRegister& src1,
1777 const LogicVRegister& src2, bool max);
1778 LogicVRegister umaxp(VectorFormat vform, LogicVRegister dst,
1779 const LogicVRegister& src1, const LogicVRegister& src2);
1780 LogicVRegister uminp(VectorFormat vform, LogicVRegister dst,
1781 const LogicVRegister& src1, const LogicVRegister& src2);
1782 LogicVRegister UMinMaxV(VectorFormat vform, LogicVRegister dst,
1783 const LogicVRegister& src, bool max);
1784 LogicVRegister umaxv(VectorFormat vform, LogicVRegister dst,
1785 const LogicVRegister& src);
1786 LogicVRegister uminv(VectorFormat vform, LogicVRegister dst,
1787 const LogicVRegister& src);
1788 LogicVRegister trn1(VectorFormat vform, LogicVRegister dst,
1789 const LogicVRegister& src1, const LogicVRegister& src2);
1790 LogicVRegister trn2(VectorFormat vform, LogicVRegister dst,
1791 const LogicVRegister& src1, const LogicVRegister& src2);
1792 LogicVRegister zip1(VectorFormat vform, LogicVRegister dst,
1793 const LogicVRegister& src1, const LogicVRegister& src2);
1794 LogicVRegister zip2(VectorFormat vform, LogicVRegister dst,
1795 const LogicVRegister& src1, const LogicVRegister& src2);
1796 LogicVRegister uzp1(VectorFormat vform, LogicVRegister dst,
1797 const LogicVRegister& src1, const LogicVRegister& src2);
1798 LogicVRegister uzp2(VectorFormat vform, LogicVRegister dst,
1799 const LogicVRegister& src1, const LogicVRegister& src2);
1800 LogicVRegister shl(VectorFormat vform, LogicVRegister dst,
1801 const LogicVRegister& src, int shift);
1802 LogicVRegister scvtf(VectorFormat vform, LogicVRegister dst,
1803 const LogicVRegister& src, int fbits,
1804 FPRounding rounding_mode);
1805 LogicVRegister ucvtf(VectorFormat vform, LogicVRegister dst,
1806 const LogicVRegister& src, int fbits,
1807 FPRounding rounding_mode);
1808 LogicVRegister sshll(VectorFormat vform, LogicVRegister dst,
1809 const LogicVRegister& src, int shift);
1810 LogicVRegister sshll2(VectorFormat vform, LogicVRegister dst,
1811 const LogicVRegister& src, int shift);
1812 LogicVRegister shll(VectorFormat vform, LogicVRegister dst,
1813 const LogicVRegister& src);
1814 LogicVRegister shll2(VectorFormat vform, LogicVRegister dst,
1815 const LogicVRegister& src);
1816 LogicVRegister ushll(VectorFormat vform, LogicVRegister dst,
1817 const LogicVRegister& src, int shift);
1818 LogicVRegister ushll2(VectorFormat vform, LogicVRegister dst,
1819 const LogicVRegister& src, int shift);
1820 LogicVRegister sli(VectorFormat vform, LogicVRegister dst,
1821 const LogicVRegister& src, int shift);
1822 LogicVRegister sri(VectorFormat vform, LogicVRegister dst,
1823 const LogicVRegister& src, int shift);
1824 LogicVRegister sshr(VectorFormat vform, LogicVRegister dst,
1825 const LogicVRegister& src, int shift);
1826 LogicVRegister ushr(VectorFormat vform, LogicVRegister dst,
1827 const LogicVRegister& src, int shift);
1828 LogicVRegister ssra(VectorFormat vform, LogicVRegister dst,
1829 const LogicVRegister& src, int shift);
1830 LogicVRegister usra(VectorFormat vform, LogicVRegister dst,
1831 const LogicVRegister& src, int shift);
1832 LogicVRegister srsra(VectorFormat vform, LogicVRegister dst,
1833 const LogicVRegister& src, int shift);
1834 LogicVRegister ursra(VectorFormat vform, LogicVRegister dst,
1835 const LogicVRegister& src, int shift);
1836 LogicVRegister suqadd(VectorFormat vform, LogicVRegister dst,
1837 const LogicVRegister& src);
1838 LogicVRegister usqadd(VectorFormat vform, LogicVRegister dst,
1839 const LogicVRegister& src);
1840 LogicVRegister sqshl(VectorFormat vform, LogicVRegister dst,
1841 const LogicVRegister& src, int shift);
1842 LogicVRegister uqshl(VectorFormat vform, LogicVRegister dst,
1843 const LogicVRegister& src, int shift);
1844 LogicVRegister sqshlu(VectorFormat vform, LogicVRegister dst,
1845 const LogicVRegister& src, int shift);
1846 LogicVRegister abs(VectorFormat vform, LogicVRegister dst,
1847 const LogicVRegister& src);
1848 LogicVRegister neg(VectorFormat vform, LogicVRegister dst,
1849 const LogicVRegister& src);
1850 LogicVRegister ExtractNarrow(VectorFormat vform, LogicVRegister dst,
1851 bool dstIsSigned, const LogicVRegister& src,
1852 bool srcIsSigned);
1853 LogicVRegister xtn(VectorFormat vform, LogicVRegister dst,
1854 const LogicVRegister& src);
1855 LogicVRegister sqxtn(VectorFormat vform, LogicVRegister dst,
1856 const LogicVRegister& src);
1857 LogicVRegister uqxtn(VectorFormat vform, LogicVRegister dst,
1858 const LogicVRegister& src);
1859 LogicVRegister sqxtun(VectorFormat vform, LogicVRegister dst,
1860 const LogicVRegister& src);
1861 LogicVRegister AbsDiff(VectorFormat vform, LogicVRegister dst,
1862 const LogicVRegister& src1, const LogicVRegister& src2,
1863 bool issigned);
1864 LogicVRegister saba(VectorFormat vform, LogicVRegister dst,
1865 const LogicVRegister& src1, const LogicVRegister& src2);
1866 LogicVRegister uaba(VectorFormat vform, LogicVRegister dst,
1867 const LogicVRegister& src1, const LogicVRegister& src2);
1868 LogicVRegister shrn(VectorFormat vform, LogicVRegister dst,
1869 const LogicVRegister& src, int shift);
1870 LogicVRegister shrn2(VectorFormat vform, LogicVRegister dst,
1871 const LogicVRegister& src, int shift);
1872 LogicVRegister rshrn(VectorFormat vform, LogicVRegister dst,
1873 const LogicVRegister& src, int shift);
1874 LogicVRegister rshrn2(VectorFormat vform, LogicVRegister dst,
1875 const LogicVRegister& src, int shift);
1876 LogicVRegister uqshrn(VectorFormat vform, LogicVRegister dst,
1877 const LogicVRegister& src, int shift);
1878 LogicVRegister uqshrn2(VectorFormat vform, LogicVRegister dst,
1879 const LogicVRegister& src, int shift);
1880 LogicVRegister uqrshrn(VectorFormat vform, LogicVRegister dst,
1881 const LogicVRegister& src, int shift);
1882 LogicVRegister uqrshrn2(VectorFormat vform, LogicVRegister dst,
1883 const LogicVRegister& src, int shift);
1884 LogicVRegister sqshrn(VectorFormat vform, LogicVRegister dst,
1885 const LogicVRegister& src, int shift);
1886 LogicVRegister sqshrn2(VectorFormat vform, LogicVRegister dst,
1887 const LogicVRegister& src, int shift);
1888 LogicVRegister sqrshrn(VectorFormat vform, LogicVRegister dst,
1889 const LogicVRegister& src, int shift);
1890 LogicVRegister sqrshrn2(VectorFormat vform, LogicVRegister dst,
1891 const LogicVRegister& src, int shift);
1892 LogicVRegister sqshrun(VectorFormat vform, LogicVRegister dst,
1893 const LogicVRegister& src, int shift);
1894 LogicVRegister sqshrun2(VectorFormat vform, LogicVRegister dst,
1895 const LogicVRegister& src, int shift);
1896 LogicVRegister sqrshrun(VectorFormat vform, LogicVRegister dst,
1897 const LogicVRegister& src, int shift);
1898 LogicVRegister sqrshrun2(VectorFormat vform, LogicVRegister dst,
1899 const LogicVRegister& src, int shift);
1900 LogicVRegister sqrdmulh(VectorFormat vform, LogicVRegister dst,
1901 const LogicVRegister& src1,
1902 const LogicVRegister& src2, bool round = true);
1903 LogicVRegister sqdmulh(VectorFormat vform, LogicVRegister dst,
1904 const LogicVRegister& src1,
1905 const LogicVRegister& src2);
1906 #define NEON_3VREG_LOGIC_LIST(V) \
1907 V(addhn) \
1908 V(addhn2) \
1909 V(raddhn) \
1910 V(raddhn2) \
1911 V(subhn) \
1912 V(subhn2) \
1913 V(rsubhn) \
1914 V(rsubhn2) \
1915 V(pmull) \
1916 V(pmull2) \
1917 V(sabal) \
1918 V(sabal2) \
1919 V(uabal) \
1920 V(uabal2) \
1921 V(sabdl) \
1922 V(sabdl2) \
1923 V(uabdl) \
1924 V(uabdl2) \
1925 V(smull) \
1926 V(smull2) \
1927 V(umull) \
1928 V(umull2) \
1929 V(smlal) \
1930 V(smlal2) \
1931 V(umlal) \
1932 V(umlal2) \
1933 V(smlsl) \
1934 V(smlsl2) \
1935 V(umlsl) \
1936 V(umlsl2) \
1937 V(sqdmlal) \
1938 V(sqdmlal2) \
1939 V(sqdmlsl) \
1940 V(sqdmlsl2) \
1941 V(sqdmull) \
1942 V(sqdmull2)
1943
1944 #define DEFINE_LOGIC_FUNC(FXN) \
1945 LogicVRegister FXN(VectorFormat vform, LogicVRegister dst, \
1946 const LogicVRegister& src1, const LogicVRegister& src2);
1947 NEON_3VREG_LOGIC_LIST(DEFINE_LOGIC_FUNC)
1948 #undef DEFINE_LOGIC_FUNC
1949
1950 #define NEON_FP3SAME_LIST(V) \
1951 V(fadd, FPAdd, false) \
1952 V(fsub, FPSub, true) \
1953 V(fmul, FPMul, true) \
1954 V(fmulx, FPMulx, true) \
1955 V(fdiv, FPDiv, true) \
1956 V(fmax, FPMax, false) \
1957 V(fmin, FPMin, false) \
1958 V(fmaxnm, FPMaxNM, false) \
1959 V(fminnm, FPMinNM, false)
1960
1961 #define DECLARE_NEON_FP_VECTOR_OP(FN, OP, PROCNAN) \
1962 template <typename T> \
1963 LogicVRegister FN(VectorFormat vform, LogicVRegister dst, \
1964 const LogicVRegister& src1, const LogicVRegister& src2); \
1965 LogicVRegister FN(VectorFormat vform, LogicVRegister dst, \
1966 const LogicVRegister& src1, const LogicVRegister& src2);
1967 NEON_FP3SAME_LIST(DECLARE_NEON_FP_VECTOR_OP)
1968 #undef DECLARE_NEON_FP_VECTOR_OP
1969
1970 #define NEON_FPPAIRWISE_LIST(V) \
1971 V(faddp, fadd, FPAdd) \
1972 V(fmaxp, fmax, FPMax) \
1973 V(fmaxnmp, fmaxnm, FPMaxNM) \
1974 V(fminp, fmin, FPMin) \
1975 V(fminnmp, fminnm, FPMinNM)
1976
1977 #define DECLARE_NEON_FP_PAIR_OP(FNP, FN, OP) \
1978 LogicVRegister FNP(VectorFormat vform, LogicVRegister dst, \
1979 const LogicVRegister& src1, const LogicVRegister& src2); \
1980 LogicVRegister FNP(VectorFormat vform, LogicVRegister dst, \
1981 const LogicVRegister& src);
1982 NEON_FPPAIRWISE_LIST(DECLARE_NEON_FP_PAIR_OP)
1983 #undef DECLARE_NEON_FP_PAIR_OP
1984
1985 template <typename T>
1986 LogicVRegister frecps(VectorFormat vform, LogicVRegister dst,
1987 const LogicVRegister& src1, const LogicVRegister& src2);
1988 LogicVRegister frecps(VectorFormat vform, LogicVRegister dst,
1989 const LogicVRegister& src1, const LogicVRegister& src2);
1990 template <typename T>
1991 LogicVRegister frsqrts(VectorFormat vform, LogicVRegister dst,
1992 const LogicVRegister& src1,
1993 const LogicVRegister& src2);
1994 LogicVRegister frsqrts(VectorFormat vform, LogicVRegister dst,
1995 const LogicVRegister& src1,
1996 const LogicVRegister& src2);
1997 template <typename T>
1998 LogicVRegister fmla(VectorFormat vform, LogicVRegister dst,
1999 const LogicVRegister& src1, const LogicVRegister& src2);
2000 LogicVRegister fmla(VectorFormat vform, LogicVRegister dst,
2001 const LogicVRegister& src1, const LogicVRegister& src2);
2002 template <typename T>
2003 LogicVRegister fmls(VectorFormat vform, LogicVRegister dst,
2004 const LogicVRegister& src1, const LogicVRegister& src2);
2005 LogicVRegister fmls(VectorFormat vform, LogicVRegister dst,
2006 const LogicVRegister& src1, const LogicVRegister& src2);
2007 LogicVRegister fnmul(VectorFormat vform, LogicVRegister dst,
2008 const LogicVRegister& src1, const LogicVRegister& src2);
2009
2010 template <typename T>
2011 LogicVRegister fcmp(VectorFormat vform, LogicVRegister dst,
2012 const LogicVRegister& src1, const LogicVRegister& src2,
2013 Condition cond);
2014 LogicVRegister fcmp(VectorFormat vform, LogicVRegister dst,
2015 const LogicVRegister& src1, const LogicVRegister& src2,
2016 Condition cond);
2017 LogicVRegister fabscmp(VectorFormat vform, LogicVRegister dst,
2018 const LogicVRegister& src1, const LogicVRegister& src2,
2019 Condition cond);
2020 LogicVRegister fcmp_zero(VectorFormat vform, LogicVRegister dst,
2021 const LogicVRegister& src, Condition cond);
2022
2023 template <typename T>
2024 LogicVRegister fneg(VectorFormat vform, LogicVRegister dst,
2025 const LogicVRegister& src);
2026 LogicVRegister fneg(VectorFormat vform, LogicVRegister dst,
2027 const LogicVRegister& src);
2028 template <typename T>
2029 LogicVRegister frecpx(VectorFormat vform, LogicVRegister dst,
2030 const LogicVRegister& src);
2031 LogicVRegister frecpx(VectorFormat vform, LogicVRegister dst,
2032 const LogicVRegister& src);
2033 template <typename T>
2034 LogicVRegister fabs_(VectorFormat vform, LogicVRegister dst,
2035 const LogicVRegister& src);
2036 LogicVRegister fabs_(VectorFormat vform, LogicVRegister dst,
2037 const LogicVRegister& src);
2038 LogicVRegister fabd(VectorFormat vform, LogicVRegister dst,
2039 const LogicVRegister& src1, const LogicVRegister& src2);
2040 LogicVRegister frint(VectorFormat vform, LogicVRegister dst,
2041 const LogicVRegister& src, FPRounding rounding_mode,
2042 bool inexact_exception = false);
2043 LogicVRegister fcvts(VectorFormat vform, LogicVRegister dst,
2044 const LogicVRegister& src, FPRounding rounding_mode,
2045 int fbits = 0);
2046 LogicVRegister fcvtu(VectorFormat vform, LogicVRegister dst,
2047 const LogicVRegister& src, FPRounding rounding_mode,
2048 int fbits = 0);
2049 LogicVRegister fcvtl(VectorFormat vform, LogicVRegister dst,
2050 const LogicVRegister& src);
2051 LogicVRegister fcvtl2(VectorFormat vform, LogicVRegister dst,
2052 const LogicVRegister& src);
2053 LogicVRegister fcvtn(VectorFormat vform, LogicVRegister dst,
2054 const LogicVRegister& src);
2055 LogicVRegister fcvtn2(VectorFormat vform, LogicVRegister dst,
2056 const LogicVRegister& src);
2057 LogicVRegister fcvtxn(VectorFormat vform, LogicVRegister dst,
2058 const LogicVRegister& src);
2059 LogicVRegister fcvtxn2(VectorFormat vform, LogicVRegister dst,
2060 const LogicVRegister& src);
2061 LogicVRegister fsqrt(VectorFormat vform, LogicVRegister dst,
2062 const LogicVRegister& src);
2063 LogicVRegister frsqrte(VectorFormat vform, LogicVRegister dst,
2064 const LogicVRegister& src);
2065 LogicVRegister frecpe(VectorFormat vform, LogicVRegister dst,
2066 const LogicVRegister& src, FPRounding rounding);
2067 LogicVRegister ursqrte(VectorFormat vform, LogicVRegister dst,
2068 const LogicVRegister& src);
2069 LogicVRegister urecpe(VectorFormat vform, LogicVRegister dst,
2070 const LogicVRegister& src);
2071
2072 typedef float (Simulator::*FPMinMaxOp)(float a, float b);
2073
2074 LogicVRegister FMinMaxV(VectorFormat vform, LogicVRegister dst,
2075 const LogicVRegister& src, FPMinMaxOp Op);
2076
2077 LogicVRegister fminv(VectorFormat vform, LogicVRegister dst,
2078 const LogicVRegister& src);
2079 LogicVRegister fmaxv(VectorFormat vform, LogicVRegister dst,
2080 const LogicVRegister& src);
2081 LogicVRegister fminnmv(VectorFormat vform, LogicVRegister dst,
2082 const LogicVRegister& src);
2083 LogicVRegister fmaxnmv(VectorFormat vform, LogicVRegister dst,
2084 const LogicVRegister& src);
2085
2086 template <typename T>
2087 T FPRecipSqrtEstimate(T op);
2088 template <typename T>
2089 T FPRecipEstimate(T op, FPRounding rounding);
2090 template <typename T, typename R>
2091 R FPToFixed(T op, int fbits, bool is_signed, FPRounding rounding);
710 2092
711 void FPCompare(double val0, double val1); 2093 void FPCompare(double val0, double val1);
712 double FPRoundInt(double value, FPRounding round_mode); 2094 double FPRoundInt(double value, FPRounding round_mode);
713 double FPToDouble(float value); 2095 double FPToDouble(float value);
714 float FPToFloat(double value, FPRounding round_mode); 2096 float FPToFloat(double value, FPRounding round_mode);
2097 float FPToFloat(float16 value);
2098 float16 FPToFloat16(float value, FPRounding round_mode);
2099 float16 FPToFloat16(double value, FPRounding round_mode);
2100 double recip_sqrt_estimate(double a);
2101 double recip_estimate(double a);
2102 double FPRecipSqrtEstimate(double a);
2103 double FPRecipEstimate(double a);
715 double FixedToDouble(int64_t src, int fbits, FPRounding round_mode); 2104 double FixedToDouble(int64_t src, int fbits, FPRounding round_mode);
716 double UFixedToDouble(uint64_t src, int fbits, FPRounding round_mode); 2105 double UFixedToDouble(uint64_t src, int fbits, FPRounding round_mode);
717 float FixedToFloat(int64_t src, int fbits, FPRounding round_mode); 2106 float FixedToFloat(int64_t src, int fbits, FPRounding round_mode);
718 float UFixedToFloat(uint64_t src, int fbits, FPRounding round_mode); 2107 float UFixedToFloat(uint64_t src, int fbits, FPRounding round_mode);
719 int32_t FPToInt32(double value, FPRounding rmode); 2108 int32_t FPToInt32(double value, FPRounding rmode);
720 int64_t FPToInt64(double value, FPRounding rmode); 2109 int64_t FPToInt64(double value, FPRounding rmode);
721 uint32_t FPToUInt32(double value, FPRounding rmode); 2110 uint32_t FPToUInt32(double value, FPRounding rmode);
722 uint64_t FPToUInt64(double value, FPRounding rmode); 2111 uint64_t FPToUInt64(double value, FPRounding rmode);
723 2112
724 template <typename T> 2113 template <typename T>
(...skipping 11 matching lines...) Expand all
736 template <typename T> 2125 template <typename T>
737 T FPMin(T a, T b); 2126 T FPMin(T a, T b);
738 2127
739 template <typename T> 2128 template <typename T>
740 T FPMinNM(T a, T b); 2129 T FPMinNM(T a, T b);
741 2130
742 template <typename T> 2131 template <typename T>
743 T FPMul(T op1, T op2); 2132 T FPMul(T op1, T op2);
744 2133
745 template <typename T> 2134 template <typename T>
2135 T FPMulx(T op1, T op2);
2136
2137 template <typename T>
746 T FPMulAdd(T a, T op1, T op2); 2138 T FPMulAdd(T a, T op1, T op2);
747 2139
748 template <typename T> 2140 template <typename T>
749 T FPSqrt(T op); 2141 T FPSqrt(T op);
750 2142
751 template <typename T> 2143 template <typename T>
752 T FPSub(T op1, T op2); 2144 T FPSub(T op1, T op2);
753 2145
754 // Standard NaN processing.
755 template <typename T> 2146 template <typename T>
756 T FPProcessNaN(T op); 2147 T FPRecipStepFused(T op1, T op2);
757
758 bool FPProcessNaNs(Instruction* instr);
759 2148
760 template <typename T> 2149 template <typename T>
761 T FPProcessNaNs(T op1, T op2); 2150 T FPRSqrtStepFused(T op1, T op2);
762 2151
763 template <typename T> 2152 // This doesn't do anything at the moment. We'll need it if we want support
764 T FPProcessNaNs3(T op1, T op2, T op3); 2153 // for cumulative exception bits or floating-point exceptions.
2154 void FPProcessException() {}
2155
2156 // Standard NaN processing.
2157 bool FPProcessNaNs(Instruction* instr);
765 2158
766 void CheckStackAlignment(); 2159 void CheckStackAlignment();
767 2160
768 inline void CheckPCSComplianceAndRun(); 2161 inline void CheckPCSComplianceAndRun();
769 2162
770 #ifdef DEBUG 2163 #ifdef DEBUG
771 // Corruption values should have their least significant byte cleared to 2164 // Corruption values should have their least significant byte cleared to
772 // allow the code of the register being corrupted to be inserted. 2165 // allow the code of the register being corrupted to be inserted.
773 static const uint64_t kCallerSavedRegisterCorruptionValue = 2166 static const uint64_t kCallerSavedRegisterCorruptionValue =
774 0xca11edc0de000000UL; 2167 0xca11edc0de000000UL;
775 // This value is a NaN in both 32-bit and 64-bit FP. 2168 // This value is a NaN in both 32-bit and 64-bit FP.
776 static const uint64_t kCallerSavedFPRegisterCorruptionValue = 2169 static const uint64_t kCallerSavedVRegisterCorruptionValue =
777 0x7ff000007f801000UL; 2170 0x7ff000007f801000UL;
778 // This value is a mix of 32/64-bits NaN and "verbose" immediate. 2171 // This value is a mix of 32/64-bits NaN and "verbose" immediate.
779 static const uint64_t kDefaultCPURegisterCorruptionValue = 2172 static const uint64_t kDefaultCPURegisterCorruptionValue =
780 0x7ffbad007f8bad00UL; 2173 0x7ffbad007f8bad00UL;
781 2174
782 void CorruptRegisters(CPURegList* list, 2175 void CorruptRegisters(CPURegList* list,
783 uint64_t value = kDefaultCPURegisterCorruptionValue); 2176 uint64_t value = kDefaultCPURegisterCorruptionValue);
784 void CorruptAllCallerSavedCPURegisters(); 2177 void CorruptAllCallerSavedCPURegisters();
785 #endif 2178 #endif
786 2179
787 // Pseudo Printf instruction 2180 // Pseudo Printf instruction
788 void DoPrintf(Instruction* instr); 2181 void DoPrintf(Instruction* instr);
789 2182
790 // Processor state --------------------------------------- 2183 // Processor state ---------------------------------------
791 2184
792 // Output stream. 2185 // Output stream.
793 FILE* stream_; 2186 FILE* stream_;
794 PrintDisassembler* print_disasm_; 2187 PrintDisassembler* print_disasm_;
795 void PRINTF_FORMAT(2, 3) TraceSim(const char* format, ...); 2188 void PRINTF_FORMAT(2, 3) TraceSim(const char* format, ...);
796 2189
797 // Instrumentation. 2190 // Instrumentation.
798 Instrument* instrument_; 2191 Instrument* instrument_;
799 2192
800 // General purpose registers. Register 31 is the stack pointer. 2193 // General purpose registers. Register 31 is the stack pointer.
801 SimRegister registers_[kNumberOfRegisters]; 2194 SimRegister registers_[kNumberOfRegisters];
802 2195
803 // Floating point registers 2196 // Floating point registers
804 SimFPRegister fpregisters_[kNumberOfFPRegisters]; 2197 SimVRegister vregisters_[kNumberOfVRegisters];
805 2198
806 // Processor state 2199 // Processor state
807 // bits[31, 27]: Condition flags N, Z, C, and V. 2200 // bits[31, 27]: Condition flags N, Z, C, and V.
808 // (Negative, Zero, Carry, Overflow) 2201 // (Negative, Zero, Carry, Overflow)
809 SimSystemRegister nzcv_; 2202 SimSystemRegister nzcv_;
810 2203
811 // Floating-Point Control Register 2204 // Floating-Point Control Register
812 SimSystemRegister fpcr_; 2205 SimSystemRegister fpcr_;
813 2206
814 // Only a subset of FPCR features are supported by the simulator. This helper 2207 // Only a subset of FPCR features are supported by the simulator. This helper
(...skipping 137 matching lines...) Expand 10 before | Expand all | Expand 10 after
952 Processor* head_; 2345 Processor* head_;
953 }; 2346 };
954 2347
955 LocalMonitor local_monitor_; 2348 LocalMonitor local_monitor_;
956 GlobalMonitor::Processor global_monitor_processor_; 2349 GlobalMonitor::Processor global_monitor_processor_;
957 static base::LazyInstance<GlobalMonitor>::type global_monitor_; 2350 static base::LazyInstance<GlobalMonitor>::type global_monitor_;
958 2351
959 private: 2352 private:
960 void Init(FILE* stream); 2353 void Init(FILE* stream);
961 2354
2355 template <typename T>
2356 static T FPDefaultNaN();
2357
2358 template <typename T>
2359 T FPProcessNaN(T op) {
2360 DCHECK(std::isnan(op));
2361 return fpcr().DN() ? FPDefaultNaN<T>() : ToQuietNaN(op);
2362 }
2363
2364 template <typename T>
2365 T FPProcessNaNs(T op1, T op2) {
2366 if (IsSignallingNaN(op1)) {
2367 return FPProcessNaN(op1);
2368 } else if (IsSignallingNaN(op2)) {
2369 return FPProcessNaN(op2);
2370 } else if (std::isnan(op1)) {
2371 DCHECK(IsQuietNaN(op1));
2372 return FPProcessNaN(op1);
2373 } else if (std::isnan(op2)) {
2374 DCHECK(IsQuietNaN(op2));
2375 return FPProcessNaN(op2);
2376 } else {
2377 return 0.0;
2378 }
2379 }
2380
2381 template <typename T>
2382 T FPProcessNaNs3(T op1, T op2, T op3) {
2383 if (IsSignallingNaN(op1)) {
2384 return FPProcessNaN(op1);
2385 } else if (IsSignallingNaN(op2)) {
2386 return FPProcessNaN(op2);
2387 } else if (IsSignallingNaN(op3)) {
2388 return FPProcessNaN(op3);
2389 } else if (std::isnan(op1)) {
2390 DCHECK(IsQuietNaN(op1));
2391 return FPProcessNaN(op1);
2392 } else if (std::isnan(op2)) {
2393 DCHECK(IsQuietNaN(op2));
2394 return FPProcessNaN(op2);
2395 } else if (std::isnan(op3)) {
2396 DCHECK(IsQuietNaN(op3));
2397 return FPProcessNaN(op3);
2398 } else {
2399 return 0.0;
2400 }
2401 }
2402
962 int log_parameters_; 2403 int log_parameters_;
963 Isolate* isolate_; 2404 Isolate* isolate_;
964 }; 2405 };
965 2406
2407 template <>
2408 inline double Simulator::FPDefaultNaN<double>() {
2409 return kFP64DefaultNaN;
2410 }
2411
2412 template <>
2413 inline float Simulator::FPDefaultNaN<float>() {
2414 return kFP32DefaultNaN;
2415 }
966 2416
967 // When running with the simulator transition into simulated execution at this 2417 // When running with the simulator transition into simulated execution at this
968 // point. 2418 // point.
969 #define CALL_GENERATED_CODE(isolate, entry, p0, p1, p2, p3, p4) \ 2419 #define CALL_GENERATED_CODE(isolate, entry, p0, p1, p2, p3, p4) \
970 reinterpret_cast<Object*>(Simulator::current(isolate)->CallJS( \ 2420 reinterpret_cast<Object*>(Simulator::current(isolate)->CallJS( \
971 FUNCTION_ADDR(entry), p0, p1, p2, p3, p4)) 2421 FUNCTION_ADDR(entry), p0, p1, p2, p3, p4))
972 2422
973 #define CALL_GENERATED_REGEXP_CODE(isolate, entry, p0, p1, p2, p3, p4, p5, p6, \ 2423 #define CALL_GENERATED_REGEXP_CODE(isolate, entry, p0, p1, p2, p3, p4, p5, p6, \
974 p7, p8) \ 2424 p7, p8) \
975 static_cast<int>(Simulator::current(isolate)->CallRegExp( \ 2425 static_cast<int>(Simulator::current(isolate)->CallRegExp( \
(...skipping 21 matching lines...) Expand all
997 Simulator::current(isolate)->PopAddress(); 2447 Simulator::current(isolate)->PopAddress();
998 } 2448 }
999 }; 2449 };
1000 2450
1001 #endif // !defined(USE_SIMULATOR) 2451 #endif // !defined(USE_SIMULATOR)
1002 2452
1003 } // namespace internal 2453 } // namespace internal
1004 } // namespace v8 2454 } // namespace v8
1005 2455
1006 #endif // V8_ARM64_SIMULATOR_ARM64_H_ 2456 #endif // V8_ARM64_SIMULATOR_ARM64_H_
OLDNEW
« no previous file with comments | « src/arm64/macro-assembler-arm64-inl.h ('k') | src/arm64/simulator-arm64.cc » ('j') | no next file with comments »

Powered by Google App Engine
This is Rietveld 408576698