src/arm/assembler-arm.cc - Issue 11428137: ARM: Make use of d16-d31 when available.

Side by Side Diff: src/arm/assembler-arm.cc

Issue 11428137: ARM: Make use of d16-d31 when available. (Closed) Base URL: https://v8.googlecode.com/svn/branches/bleeding_edge

Patch Set: Address Rodolph's comments Created 8 years ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View unified diff | Download patch | Annotate | Revision Log

OLD	NEW
1 // Copyright (c) 1994-2006 Sun Microsystems Inc.	1 // Copyright (c) 1994-2006 Sun Microsystems Inc.

2 // All Rights Reserved.	2 // All Rights Reserved.

3 //	3 //

4 // Redistribution and use in source and binary forms, with or without	4 // Redistribution and use in source and binary forms, with or without

5 // modification, are permitted provided that the following conditions	5 // modification, are permitted provided that the following conditions

6 // are met:	6 // are met:

7 //	7 //

8 // - Redistributions of source code must retain the above copyright notice,	8 // - Redistributions of source code must retain the above copyright notice,

9 // this list of conditions and the following disclaimer.	9 // this list of conditions and the following disclaimer.

10 //	10 //

(...skipping 1662 matching lines...) Expand 10 before \| Expand all \| Expand 10 after Loading...
1673 }	1673 }

1674	1674

1675	1675

1676 // Support for VFP.	1676 // Support for VFP.

1677	1677

1678 void Assembler::vldr(const DwVfpRegister dst,	1678 void Assembler::vldr(const DwVfpRegister dst,

1679 const Register base,	1679 const Register base,

1680 int offset,	1680 int offset,

1681 const Condition cond) {	1681 const Condition cond) {

1682 // Ddst = MEM(Rbase + offset).	1682 // Ddst = MEM(Rbase + offset).

1683 // Instruction details available in ARM DDI 0406A, A8-628.	1683 // Instruction details available in ARM DDI 0406C.b, A8-924.

1684 // cond(31-28) \| 1101(27-24)\| U001(23-20) \| Rbase(19-16) \|	1684 // cond(31-28) \| 1101(27-24)\| U(23) \| D(22) \| 01(21-20) \| Rbase(19-16) \|

1685 // Vdst(15-12) \| 1011(11-8) \| offset	1685 // Vd(15-12) \| 1011(11-8) \| offset

1686 ASSERT(CpuFeatures::IsEnabled(VFP2));	1686 ASSERT(CpuFeatures::IsEnabled(VFP2));

1687 int u = 1;	1687 int u = 1;

1688 if (offset < 0) {	1688 if (offset < 0) {

1689 offset = -offset;	1689 offset = -offset;

1690 u = 0;	1690 u = 0;

1691 }	1691 }

	1692 ASSERT(offset >= 0);

	1693 int vd, d;

	1694 dst.split_code(&vd, &d);

1692	1695

1693 ASSERT(offset >= 0);	1696 ASSERT(offset >= 0);

1694 if ((offset % 4) == 0 && (offset / 4) < 256) {	1697 if ((offset % 4) == 0 && (offset / 4) < 256) {

1695 emit(cond \| uB23 \| 0xD1B20 \| base.code()B16 \| dst.code()B12 \|	1698 emit(cond \| 0xDB24 \| uB23 \| dB22 \| B20 \| base.code()B16 \| vd*B12 \|

1696 0xB*B8 \| ((offset / 4) & 255));	1699 0xB*B8 \| ((offset / 4) & 255));

1697 } else {	1700 } else {

1698 // Larger offsets must be handled by computing the correct address	1701 // Larger offsets must be handled by computing the correct address

1699 // in the ip register.	1702 // in the ip register.

1700 ASSERT(!base.is(ip));	1703 ASSERT(!base.is(ip));

1701 if (u == 1) {	1704 if (u == 1) {

1702 add(ip, base, Operand(offset));	1705 add(ip, base, Operand(offset));

1703 } else {	1706 } else {

1704 sub(ip, base, Operand(offset));	1707 sub(ip, base, Operand(offset));

1705 }	1708 }

1706 emit(cond \| 0xD1B20 \| ip.code()B16 \| dst.code()B12 \| 0xBB8);	1709 emit(cond \| 0xDB24 \| dB22 \| B20 \| ip.code()B16 \| vdB12 \| 0xB*B8);

1707 }	1710 }

1708 }	1711 }

1709	1712

1710	1713

1711 void Assembler::vldr(const DwVfpRegister dst,	1714 void Assembler::vldr(const DwVfpRegister dst,

1712 const MemOperand& operand,	1715 const MemOperand& operand,

1713 const Condition cond) {	1716 const Condition cond) {

1714 ASSERT(!operand.rm().is_valid());	1717 ASSERT(!operand.rm().is_valid());

1715 ASSERT(operand.am_ == Offset);	1718 ASSERT(operand.am_ == Offset);

1716 vldr(dst, operand.rn(), operand.offset(), cond);	1719 vldr(dst, operand.rn(), operand.offset(), cond);

(...skipping 42 matching lines...) Expand 10 before \| Expand all \| Expand 10 after Loading...
1759 ASSERT(operand.am_ == Offset);	1762 ASSERT(operand.am_ == Offset);

1760 vldr(dst, operand.rn(), operand.offset(), cond);	1763 vldr(dst, operand.rn(), operand.offset(), cond);

1761 }	1764 }

1762	1765

1763	1766

1764 void Assembler::vstr(const DwVfpRegister src,	1767 void Assembler::vstr(const DwVfpRegister src,

1765 const Register base,	1768 const Register base,

1766 int offset,	1769 int offset,

1767 const Condition cond) {	1770 const Condition cond) {

1768 // MEM(Rbase + offset) = Dsrc.	1771 // MEM(Rbase + offset) = Dsrc.

1769 // Instruction details available in ARM DDI 0406A, A8-786.	1772 // Instruction details available in ARM DDI 0406C.b, A8-1082.

1770 // cond(31-28) \| 1101(27-24)\| U000(23-20) \| \| Rbase(19-16) \|	1773 // cond(31-28) \| 1101(27-24)\| U(23) \| D(22) \| 00(21-20) \| Rbase(19-16) \|

1771 // Vsrc(15-12) \| 1011(11-8) \| (offset/4)	1774 // Vd(15-12) \| 1011(11-8) \| (offset/4)

1772 ASSERT(CpuFeatures::IsEnabled(VFP2));	1775 ASSERT(CpuFeatures::IsEnabled(VFP2));

1773 int u = 1;	1776 int u = 1;

1774 if (offset < 0) {	1777 if (offset < 0) {

1775 offset = -offset;	1778 offset = -offset;

1776 u = 0;	1779 u = 0;

1777 }	1780 }

1778 ASSERT(offset >= 0);	1781 ASSERT(offset >= 0);

	1782 int vd, d;

	1783 src.split_code(&vd, &d);

	1784

1779 if ((offset % 4) == 0 && (offset / 4) < 256) {	1785 if ((offset % 4) == 0 && (offset / 4) < 256) {

1780 emit(cond \| uB23 \| 0xD0B20 \| base.code()B16 \| src.code()B12 \|	1786 emit(cond \| 0xDB24 \| uB23 \| dB22 \| base.code()B16 \| vdB12 \| 0xBB8 \|

1781 0xB*B8 \| ((offset / 4) & 255));	1787 ((offset / 4) & 255));

1782 } else {	1788 } else {

1783 // Larger offsets must be handled by computing the correct address	1789 // Larger offsets must be handled by computing the correct address

1784 // in the ip register.	1790 // in the ip register.

1785 ASSERT(!base.is(ip));	1791 ASSERT(!base.is(ip));

1786 if (u == 1) {	1792 if (u == 1) {

1787 add(ip, base, Operand(offset));	1793 add(ip, base, Operand(offset));

1788 } else {	1794 } else {

1789 sub(ip, base, Operand(offset));	1795 sub(ip, base, Operand(offset));

1790 }	1796 }

1791 emit(cond \| 0xD0B20 \| ip.code()B16 \| src.code()B12 \| 0xBB8);	1797 emit(cond \| 0xDB24 \| dB22 \| ip.code()B16 \| vdB12 \| 0xB*B8);

1792 }	1798 }

1793 }	1799 }

1794	1800

1795	1801

1796 void Assembler::vstr(const DwVfpRegister src,	1802 void Assembler::vstr(const DwVfpRegister src,

1797 const MemOperand& operand,	1803 const MemOperand& operand,

1798 const Condition cond) {	1804 const Condition cond) {

1799 ASSERT(!operand.rm().is_valid());	1805 ASSERT(!operand.rm().is_valid());

1800 ASSERT(operand.am_ == Offset);	1806 ASSERT(operand.am_ == Offset);

1801 vstr(src, operand.rn(), operand.offset(), cond);	1807 vstr(src, operand.rn(), operand.offset(), cond);

(...skipping 41 matching lines...) Expand 10 before \| Expand all \| Expand 10 after Loading...
1843 ASSERT(operand.am_ == Offset);	1849 ASSERT(operand.am_ == Offset);

1844 vstr(src, operand.rn(), operand.offset(), cond);	1850 vstr(src, operand.rn(), operand.offset(), cond);

1845 }	1851 }

1846	1852

1847	1853

1848 void Assembler::vldm(BlockAddrMode am,	1854 void Assembler::vldm(BlockAddrMode am,

1849 Register base,	1855 Register base,

1850 DwVfpRegister first,	1856 DwVfpRegister first,

1851 DwVfpRegister last,	1857 DwVfpRegister last,

1852 Condition cond) {	1858 Condition cond) {

1853 // Instruction details available in ARM DDI 0406A, A8-626.	1859 // Instruction details available in ARM DDI 0406C.b, A8-922.

1854 // cond(31-28) \| 110(27-25)\| PUDW1(24-20) \| Rbase(19-16) \|	1860 // cond(31-28) \| 110(27-25)\| PUDW1(24-20) \| Rbase(19-16) \|

1855 // first(15-12) \| 1010(11-8) \| (count * 2)	1861 // first(15-12) \| 1011(11-8) \| (count * 2)

1856 ASSERT(CpuFeatures::IsEnabled(VFP2));	1862 ASSERT(CpuFeatures::IsEnabled(VFP2));

1857 ASSERT_LE(first.code(), last.code());	1863 ASSERT_LE(first.code(), last.code());

1858 ASSERT(am == ia \|\| am == ia_w \|\| am == db_w);	1864 ASSERT(am == ia \|\| am == ia_w \|\| am == db_w);

1859 ASSERT(!base.is(pc));	1865 ASSERT(!base.is(pc));

1860	1866

1861 int sd, d;	1867 int sd, d;

1862 first.split_code(&sd, &d);	1868 first.split_code(&sd, &d);

1863 int count = last.code() - first.code() + 1;	1869 int count = last.code() - first.code() + 1;

1864 ASSERT(count <= 16);	1870 ASSERT(count <= 16);

1865 emit(cond \| B27 \| B26 \| am \| dB22 \| B20 \| base.code()B16 \| sd*B12 \|	1871 emit(cond \| B27 \| B26 \| am \| dB22 \| B20 \| base.code()B16 \| sd*B12 \|

1866 0xBB8 \| count2);	1872 0xBB8 \| count2);

1867 }	1873 }

1868	1874

1869	1875

1870 void Assembler::vstm(BlockAddrMode am,	1876 void Assembler::vstm(BlockAddrMode am,

1871 Register base,	1877 Register base,

1872 DwVfpRegister first,	1878 DwVfpRegister first,

1873 DwVfpRegister last,	1879 DwVfpRegister last,

1874 Condition cond) {	1880 Condition cond) {

1875 // Instruction details available in ARM DDI 0406A, A8-784.	1881 // Instruction details available in ARM DDI 0406C.b, A8-1080.

1876 // cond(31-28) \| 110(27-25)\| PUDW0(24-20) \| Rbase(19-16) \|	1882 // cond(31-28) \| 110(27-25)\| PUDW0(24-20) \| Rbase(19-16) \|

1877 // first(15-12) \| 1011(11-8) \| (count * 2)	1883 // first(15-12) \| 1011(11-8) \| (count * 2)

1878 ASSERT(CpuFeatures::IsEnabled(VFP2));	1884 ASSERT(CpuFeatures::IsEnabled(VFP2));

1879 ASSERT_LE(first.code(), last.code());	1885 ASSERT_LE(first.code(), last.code());

1880 ASSERT(am == ia \|\| am == ia_w \|\| am == db_w);	1886 ASSERT(am == ia \|\| am == ia_w \|\| am == db_w);

1881 ASSERT(!base.is(pc));	1887 ASSERT(!base.is(pc));

1882	1888

1883 int sd, d;	1889 int sd, d;

1884 first.split_code(&sd, &d);	1890 first.split_code(&sd, &d);

1885 int count = last.code() - first.code() + 1;	1891 int count = last.code() - first.code() + 1;

(...skipping 115 matching lines...) Expand 10 before \| Expand all \| Expand 10 after Loading...
2001 // The double can be encoded in the instruction.	2007 // The double can be encoded in the instruction.

2002 emit(cond \| 0xEB24 \| 0xBB20 \| dst.code()B12 \| 0xBB8 \| enc);	2008 emit(cond \| 0xEB24 \| 0xBB20 \| dst.code()B12 \| 0xBB8 \| enc);

2003 } else {	2009 } else {

2004 // Synthesise the double from ARM immediates. This could be implemented	2010 // Synthesise the double from ARM immediates. This could be implemented

2005 // using vldr from a constant pool.	2011 // using vldr from a constant pool.

2006 uint32_t lo, hi;	2012 uint32_t lo, hi;

2007 DoubleAsTwoUInt32(imm, &lo, &hi);	2013 DoubleAsTwoUInt32(imm, &lo, &hi);

2008 mov(ip, Operand(lo));	2014 mov(ip, Operand(lo));

2009	2015

2010 if (scratch.is(no_reg)) {	2016 if (scratch.is(no_reg)) {

2011 // Move the low part of the double into the lower of the corresponsing S	2017 if (dst.code() < 16) {

2012 // registers of D register dst.	2018 // Move the low part of the double into the lower of the corresponsing S

2013 vmov(dst.low(), ip, cond);	2019 // registers of D register dst.

	2020 vmov(dst.low(), ip, cond);

2014	2021

2015 // Move the high part of the double into the higher of the corresponsing S	2022 // Move the high part of the double into the higher of the corresponsing S

2016 // registers of D register dst.	2023 // registers of D register dst.

2017 mov(ip, Operand(hi));	2024 mov(ip, Operand(hi));

2018 vmov(dst.high(), ip, cond);	2025 vmov(dst.high(), ip, cond);

	2026 } else {

	2027 // There are no corresponding S registers for D register dst.

	2028

	2029 // FIXME: We need a way to do this! For now, let's use the stack.

	2030 // Push r4, r5 on the stack.
	Rodolph Perfetta 2012/12/05 00:42:10 There is an instruction which lets you move an ARM There is an instruction which lets you move an ARM register into the bottom or top word of any D register: vmov.32. For example vmov.32 d16[0], ip will move ip in the lower 32bits of d16. It can be found section A8.6.328 of the ARM ARM (move core reg to scalar) It is not implemented in V8 though and note that vmov.16 and vmov.8 are NEON only instructions. hans 2012/12/05 14:12:58 Awesome, I'll just use vmov.32 then. Thanks! Show quoted text On 2012/12/05 00:42:10, Rodolph Perfetta wrote: > There is an instruction which lets you move an ARM register into the bottom or > top word of any D register: vmov.32. For example vmov.32 d16[0], ip will move ip > in the lower 32bits of d16. It can be found section A8.6.328 of the ARM ARM > (move core reg to scalar) > > It is not implemented in V8 though and note that vmov.16 and vmov.8 are NEON > only instructions. Awesome, I'll just use vmov.32 then. Thanks!
	2031 push(r4);

	2032 push(r5);

	2033 mov(r4, Operand(lo));

	2034 mov(r5, Operand(hi));

	2035 vmov(dst, r4, r5, cond);

	2036 pop(r5);

	2037 pop(r4);

	2038 }

2019 } else {	2039 } else {

2020 // Move the low and high parts of the double to a D register in one	2040 // Move the low and high parts of the double to a D register in one

2021 // instruction.	2041 // instruction.

2022 mov(scratch, Operand(hi));	2042 mov(scratch, Operand(hi));

2023 vmov(dst, ip, scratch, cond);	2043 vmov(dst, ip, scratch, cond);

2024 }	2044 }

2025 }	2045 }

2026 }	2046 }

2027	2047

2028	2048

2029 void Assembler::vmov(const SwVfpRegister dst,	2049 void Assembler::vmov(const SwVfpRegister dst,

2030 const SwVfpRegister src,	2050 const SwVfpRegister src,

2031 const Condition cond) {	2051 const Condition cond) {

2032 // Sd = Sm	2052 // Sd = Sm

2033 // Instruction details available in ARM DDI 0406B, A8-642.	2053 // Instruction details available in ARM DDI 0406B, A8-642.

2034 ASSERT(CpuFeatures::IsEnabled(VFP2));	2054 ASSERT(CpuFeatures::IsEnabled(VFP2));

2035 int sd, d, sm, m;	2055 int sd, d, sm, m;

2036 dst.split_code(&sd, &d);	2056 dst.split_code(&sd, &d);

2037 src.split_code(&sm, &m);	2057 src.split_code(&sm, &m);

2038 emit(cond \| 0xEB24 \| dB22 \| 0xBB20 \| sdB12 \| 0xAB8 \| B6 \| mB5 \| sm);	2058 emit(cond \| 0xEB24 \| dB22 \| 0xBB20 \| sdB12 \| 0xAB8 \| B6 \| mB5 \| sm);

2039 }	2059 }

2040	2060

2041	2061

2042 void Assembler::vmov(const DwVfpRegister dst,	2062 void Assembler::vmov(const DwVfpRegister dst,

2043 const DwVfpRegister src,	2063 const DwVfpRegister src,

2044 const Condition cond) {	2064 const Condition cond) {

2045 // Dd = Dm	2065 // Dd = Dm

2046 // Instruction details available in ARM DDI 0406B, A8-642.	2066 // Instruction details available in ARM DDI 0406C.b, A8-938.

	2067 // cond(31-28) \| 11101(27-23) \| D(22) \| 11(21-20) \| 0000(19-16) \| Vd(15-12) \|

	2068 // 101(11-9) \| sz=1(8) \| 0(7) \| 1(6) \| M(5) \| 0(4) \| Vm(3-0)

2047 ASSERT(CpuFeatures::IsEnabled(VFP2));	2069 ASSERT(CpuFeatures::IsEnabled(VFP2));

2048 emit(cond \| 0xEB24 \| 0xBB20 \|	2070 int vd, d;

2049 dst.code()B12 \| 0x5B9 \| B8 \| B6 \| src.code());	2071 dst.split_code(&vd, &d);

	2072 int vm, m;

	2073 src.split_code(&vm, &m);

	2074 emit(cond \| 0x1DB23 \| dB22 \| 0x3B20 \| vdB12 \| 0x5B9 \| B8 \| B6 \| mB5 \|

	2075 vm);

2050 }	2076 }

2051	2077

2052	2078

2053 void Assembler::vmov(const DwVfpRegister dst,	2079 void Assembler::vmov(const DwVfpRegister dst,

2054 const Register src1,	2080 const Register src1,

2055 const Register src2,	2081 const Register src2,

2056 const Condition cond) {	2082 const Condition cond) {

2057 // Dm = <Rt,Rt2>.	2083 // Dm = <Rt,Rt2>.

2058 // Instruction details available in ARM DDI 0406A, A8-646.	2084 // Instruction details available in ARM DDI 0406C.b, A8-948.

2059 // cond(31-28) \| 1100(27-24)\| 010(23-21) \| op=0(20) \| Rt2(19-16) \|	2085 // cond(31-28) \| 1100(27-24)\| 010(23-21) \| op=0(20) \| Rt2(19-16) \|

2060 // Rt(15-12) \| 1011(11-8) \| 00(7-6) \| M(5) \| 1(4) \| Vm	2086 // Rt(15-12) \| 1011(11-8) \| 00(7-6) \| M(5) \| 1(4) \| Vm

2061 ASSERT(CpuFeatures::IsEnabled(VFP2));	2087 ASSERT(CpuFeatures::IsEnabled(VFP2));

2062 ASSERT(!src1.is(pc) && !src2.is(pc));	2088 ASSERT(!src1.is(pc) && !src2.is(pc));

	2089 int vm, m;

	2090 dst.split_code(&vm, &m);

2063 emit(cond \| 0xCB24 \| B22 \| src2.code()B16 \|	2091 emit(cond \| 0xCB24 \| B22 \| src2.code()B16 \|

2064 src1.code()B12 \| 0xBB8 \| B4 \| dst.code());	2092 src1.code()B12 \| 0xBB8 \| m*B5 \| B4 \| vm);

2065 }	2093 }

2066	2094

2067	2095

2068 void Assembler::vmov(const Register dst1,	2096 void Assembler::vmov(const Register dst1,

2069 const Register dst2,	2097 const Register dst2,

2070 const DwVfpRegister src,	2098 const DwVfpRegister src,

2071 const Condition cond) {	2099 const Condition cond) {

2072 // <Rt,Rt2> = Dm.	2100 // <Rt,Rt2> = Dm.

2073 // Instruction details available in ARM DDI 0406A, A8-646.	2101 // Instruction details available in ARM DDI 0406C.b, A8-948.

2074 // cond(31-28) \| 1100(27-24)\| 010(23-21) \| op=1(20) \| Rt2(19-16) \|	2102 // cond(31-28) \| 1100(27-24)\| 010(23-21) \| op=1(20) \| Rt2(19-16) \|

2075 // Rt(15-12) \| 1011(11-8) \| 00(7-6) \| M(5) \| 1(4) \| Vm	2103 // Rt(15-12) \| 1011(11-8) \| 00(7-6) \| M(5) \| 1(4) \| Vm

2076 ASSERT(CpuFeatures::IsEnabled(VFP2));	2104 ASSERT(CpuFeatures::IsEnabled(VFP2));

2077 ASSERT(!dst1.is(pc) && !dst2.is(pc));	2105 ASSERT(!dst1.is(pc) && !dst2.is(pc));

	2106 int vm, m;

	2107 src.split_code(&vm, &m);

2078 emit(cond \| 0xCB24 \| B22 \| B20 \| dst2.code()B16 \|	2108 emit(cond \| 0xCB24 \| B22 \| B20 \| dst2.code()B16 \|

2079 dst1.code()B12 \| 0xBB8 \| B4 \| src.code());	2109 dst1.code()B12 \| 0xBB8 \| m*B5 \| B4 \| vm);

2080 }	2110 }

2081	2111

2082	2112

2083 void Assembler::vmov(const SwVfpRegister dst,	2113 void Assembler::vmov(const SwVfpRegister dst,

2084 const Register src,	2114 const Register src,

2085 const Condition cond) {	2115 const Condition cond) {

2086 // Sn = Rt.	2116 // Sn = Rt.

2087 // Instruction details available in ARM DDI 0406A, A8-642.	2117 // Instruction details available in ARM DDI 0406A, A8-642.

2088 // cond(31-28) \| 1110(27-24)\| 000(23-21) \| op=0(20) \| Vn(19-16) \|	2118 // cond(31-28) \| 1110(27-24)\| 000(23-21) \| op=0(20) \| Vn(19-16) \|

2089 // Rt(15-12) \| 1010(11-8) \| N(7)=0 \| 00(6-5) \| 1(4) \| 0000(3-0)	2119 // Rt(15-12) \| 1010(11-8) \| N(7)=0 \| 00(6-5) \| 1(4) \| 0000(3-0)

(...skipping 192 matching lines...) Expand 10 before \| Expand all \| Expand 10 after Loading...
2282 VFPConversionMode mode,	2312 VFPConversionMode mode,

2283 const Condition cond) {	2313 const Condition cond) {

2284 ASSERT(CpuFeatures::IsEnabled(VFP2));	2314 ASSERT(CpuFeatures::IsEnabled(VFP2));

2285 emit(EncodeVCVT(F32, dst.code(), F64, src.code(), mode, cond));	2315 emit(EncodeVCVT(F32, dst.code(), F64, src.code(), mode, cond));

2286 }	2316 }

2287	2317

2288	2318

2289 void Assembler::vneg(const DwVfpRegister dst,	2319 void Assembler::vneg(const DwVfpRegister dst,

2290 const DwVfpRegister src,	2320 const DwVfpRegister src,

2291 const Condition cond) {	2321 const Condition cond) {

	2322 // Instruction details available in ARM DDI 0406C.b, A8-968.

	2323 // cond(31-28) \| 11101(27-23) \| D(22) \| 11(21-20) \| 0001(19-16) \| Vd(15-12) \|

	2324 // 101(11-9) \| sz=1(8) \| 0(7) \| 1(6) \| M(5) \| 0(4) \| Vm(3-0)

2292 ASSERT(CpuFeatures::IsEnabled(VFP2));	2325 ASSERT(CpuFeatures::IsEnabled(VFP2));

2293 emit(cond \| 0xEB24 \| 0xBB20 \| B16 \| dst.code()*B12 \|	2326 int vd, d;

2294 0x5*B9 \| B8 \| B6 \| src.code());	2327 dst.split_code(&vd, &d);

	2328 int vm, m;

	2329 src.split_code(&vm, &m);

	2330

	2331 emit(cond \| 0x1DB23 \| dB22 \| 0x3B20 \| B16 \| vdB12 \| 0x5*B9 \| B8 \| B6 \|

	2332 m*B5 \| vm);

2295 }	2333 }

2296	2334

2297	2335

2298 void Assembler::vabs(const DwVfpRegister dst,	2336 void Assembler::vabs(const DwVfpRegister dst,

2299 const DwVfpRegister src,	2337 const DwVfpRegister src,

2300 const Condition cond) {	2338 const Condition cond) {

	2339 // Instruction details available in ARM DDI 0406C.b, A8-524.

	2340 // cond(31-28) \| 11101(27-23) \| D(22) \| 11(21-20) \| 0000(19-16) \| Vd(15-12) \|

	2341 // 101(11-9) \| sz=1(8) \| 1(7) \| 1(6) \| M(5) \| 0(4) \| Vm(3-0).

2301 ASSERT(CpuFeatures::IsEnabled(VFP2));	2342 ASSERT(CpuFeatures::IsEnabled(VFP2));

2302 emit(cond \| 0xEB24 \| 0xBB20 \| dst.code()*B12 \|	2343 int vd, d;

2303 0x5B9 \| B8 \| 0x3B6 \| src.code());	2344 dst.split_code(&vd, &d);

	2345 int vm, m;

	2346 src.split_code(&vm, &m);

	2347 emit(cond \| 0x1DB23 \| dB22 \| 0x3B20 \| vdB12 \| 0x5*B9 \| B8 \| B7 \| B6 \|

	2348 m*B5 \| vm);

2304 }	2349 }

2305	2350

2306	2351

2307 void Assembler::vadd(const DwVfpRegister dst,	2352 void Assembler::vadd(const DwVfpRegister dst,

2308 const DwVfpRegister src1,	2353 const DwVfpRegister src1,

2309 const DwVfpRegister src2,	2354 const DwVfpRegister src2,

2310 const Condition cond) {	2355 const Condition cond) {

2311 // Dd = vadd(Dn, Dm) double precision floating point addition.	2356 // Dd = vadd(Dn, Dm) double precision floating point addition.

2312 // Dd = D:Vd; Dm=M:Vm; Dn=N:Vm.	2357 // Dd = D:Vd; Dm=M:Vm; Dn=N:Vm.

2313 // Instruction details available in ARM DDI 0406A, A8-536.	2358 // Instruction details available in ARM DDI 0406C.b, A8-830.

2314 // cond(31-28) \| 11100(27-23)\| D=?(22) \| 11(21-20) \| Vn(19-16) \|	2359 // cond(31-28) \| 11100(27-23)\| D(22) \| 11(21-20) \| Vn(19-16) \|

2315 // Vd(15-12) \| 101(11-9) \| sz(8)=1 \| N(7)=0 \| 0(6) \| M=?(5) \| 0(4) \| Vm(3-0)	2360 // Vd(15-12) \| 101(11-9) \| sz=1(8) \| N(7) \| 0(6) \| M(5) \| 0(4) \| Vm(3-0)

2316 ASSERT(CpuFeatures::IsEnabled(VFP2));	2361 ASSERT(CpuFeatures::IsEnabled(VFP2));

2317 emit(cond \| 0xEB24 \| 0x3B20 \| src1.code()*B16 \|	2362 int vd, d;

2318 dst.code()B12 \| 0x5B9 \| B8 \| src2.code());	2363 dst.split_code(&vd, &d);

	2364 int vn, n;

	2365 src1.split_code(&vn, &n);

	2366 int vm, m;

	2367 src2.split_code(&vm, &m);

	2368 emit(cond \| 0x1CB23 \| dB22 \| 0x3B20 \| vnB16 \| vdB12 \| 0x5B9 \| B8 \|

	2369 nB7 \| mB5 \| vm);

2319 }	2370 }

2320	2371

2321	2372

2322 void Assembler::vsub(const DwVfpRegister dst,	2373 void Assembler::vsub(const DwVfpRegister dst,

2323 const DwVfpRegister src1,	2374 const DwVfpRegister src1,

2324 const DwVfpRegister src2,	2375 const DwVfpRegister src2,

2325 const Condition cond) {	2376 const Condition cond) {

2326 // Dd = vsub(Dn, Dm) double precision floating point subtraction.	2377 // Dd = vsub(Dn, Dm) double precision floating point subtraction.

2327 // Dd = D:Vd; Dm=M:Vm; Dn=N:Vm.	2378 // Dd = D:Vd; Dm=M:Vm; Dn=N:Vm.

2328 // Instruction details available in ARM DDI 0406A, A8-784.	2379 // Instruction details available in ARM DDI 0406C.b, A8-1086.

2329 // cond(31-28) \| 11100(27-23)\| D=?(22) \| 11(21-20) \| Vn(19-16) \|	2380 // cond(31-28) \| 11100(27-23)\| D(22) \| 11(21-20) \| Vn(19-16) \|

2330 // Vd(15-12) \| 101(11-9) \| sz(8)=1 \| N(7)=0 \| 1(6) \| M=?(5) \| 0(4) \| Vm(3-0)	2381 // Vd(15-12) \| 101(11-9) \| sz=1(8) \| N(7) \| 1(6) \| M(5) \| 0(4) \| Vm(3-0)

2331 ASSERT(CpuFeatures::IsEnabled(VFP2));	2382 ASSERT(CpuFeatures::IsEnabled(VFP2));

2332 emit(cond \| 0xEB24 \| 0x3B20 \| src1.code()*B16 \|	2383 int vd, d;

2333 dst.code()B12 \| 0x5B9 \| B8 \| B6 \| src2.code());	2384 dst.split_code(&vd, &d);

	2385 int vn, n;

	2386 src1.split_code(&vn, &n);

	2387 int vm, m;

	2388 src2.split_code(&vm, &m);

	2389 emit(cond \| 0x1CB23 \| dB22 \| 0x3B20 \| vnB16 \| vdB12 \| 0x5B9 \| B8 \|

	2390 nB7 \| B6 \| mB5 \| vm);

2334 }	2391 }

2335	2392

2336	2393

2337 void Assembler::vmul(const DwVfpRegister dst,	2394 void Assembler::vmul(const DwVfpRegister dst,

2338 const DwVfpRegister src1,	2395 const DwVfpRegister src1,

2339 const DwVfpRegister src2,	2396 const DwVfpRegister src2,

2340 const Condition cond) {	2397 const Condition cond) {

2341 // Dd = vmul(Dn, Dm) double precision floating point multiplication.	2398 // Dd = vmul(Dn, Dm) double precision floating point multiplication.

2342 // Dd = D:Vd; Dm=M:Vm; Dn=N:Vm.	2399 // Dd = D:Vd; Dm=M:Vm; Dn=N:Vm.

2343 // Instruction details available in ARM DDI 0406A, A8-784.	2400 // Instruction details available in ARM DDI 0406C.b, A8-960.

2344 // cond(31-28) \| 11100(27-23)\| D=?(22) \| 10(21-20) \| Vn(19-16) \|	2401 // cond(31-28) \| 11100(27-23)\| D(22) \| 10(21-20) \| Vn(19-16) \|

2345 // Vd(15-12) \| 101(11-9) \| sz(8)=1 \| N(7)=0 \| 0(6) \| M=?(5) \| 0(4) \| Vm(3-0)	2402 // Vd(15-12) \| 101(11-9) \| sz=1(8) \| N(7) \| 0(6) \| M(5) \| 0(4) \| Vm(3-0)

2346 ASSERT(CpuFeatures::IsEnabled(VFP2));	2403 ASSERT(CpuFeatures::IsEnabled(VFP2));

2347 emit(cond \| 0xEB24 \| 0x2B20 \| src1.code()*B16 \|	2404 int vd, d;

2348 dst.code()B12 \| 0x5B9 \| B8 \| src2.code());	2405 dst.split_code(&vd, &d);

	2406 int vn, n;

	2407 src1.split_code(&vn, &n);

	2408 int vm, m;

	2409 src2.split_code(&vm, &m);

	2410 emit(cond \| 0x1CB23 \| dB22 \| 0x2B20 \| vnB16 \| vdB12 \| 0x5B9 \| B8 \|

	2411 nB7 \| mB5 \| vm);

2349 }	2412 }

2350	2413

2351	2414

2352 void Assembler::vmla(const DwVfpRegister dst,	2415 void Assembler::vmla(const DwVfpRegister dst,

2353 const DwVfpRegister src1,	2416 const DwVfpRegister src1,

2354 const DwVfpRegister src2,	2417 const DwVfpRegister src2,

2355 const Condition cond) {	2418 const Condition cond) {

2356 // Instruction details available in ARM DDI 0406C.b, A8-892.	2419 // Instruction details available in ARM DDI 0406C.b, A8-932.

2357 // cond(31-28) \| 11100(27-23) \| D=?(22) \| 00(21-20) \| Vn(19-16) \|	2420 // cond(31-28) \| 11100(27-23) \| D(22) \| 00(21-20) \| Vn(19-16) \|

2358 // Vd(15-12) \| 101(11-9) \| sz(8)=1 \| N=?(7) \| op(6)=0 \| M=?(5) \| 0(4) \|	2421 // Vd(15-12) \| 101(11-9) \| sz=1(8) \| N(7) \| op=0(6) \| M(5) \| 0(4) \| Vm(3-0)

2359 // Vm(3-0)	2422 int vd, d;

2360 unsigned x = (cond \| 0x1CB23 \| src1.code()B16 \|	2423 dst.split_code(&vd, &d);

2361 dst.code()B12 \| 0x5B9 \| B8 \| src2.code());	2424 int vn, n;

2362 emit(x);	2425 src1.split_code(&vn, &n);

	2426 int vm, m;

	2427 src2.split_code(&vm, &m);

	2428 emit(cond \| 0x1CB23 \| dB22 \| vnB16 \| vdB12 \| 0x5B9 \| B8 \| nB7 \| m*B5 \|

	2429 vm);

2363 }	2430 }

2364	2431

2365	2432

2366 void Assembler::vdiv(const DwVfpRegister dst,	2433 void Assembler::vdiv(const DwVfpRegister dst,

2367 const DwVfpRegister src1,	2434 const DwVfpRegister src1,

2368 const DwVfpRegister src2,	2435 const DwVfpRegister src2,

2369 const Condition cond) {	2436 const Condition cond) {

2370 // Dd = vdiv(Dn, Dm) double precision floating point division.	2437 // Dd = vdiv(Dn, Dm) double precision floating point division.

2371 // Dd = D:Vd; Dm=M:Vm; Dn=N:Vm.	2438 // Dd = D:Vd; Dm=M:Vm; Dn=N:Vm.

2372 // Instruction details available in ARM DDI 0406A, A8-584.	2439 // Instruction details available in ARM DDI 0406C.b, A8-882.

2373 // cond(31-28) \| 11101(27-23)\| D=?(22) \| 00(21-20) \| Vn(19-16) \|	2440 // cond(31-28) \| 11101(27-23)\| D(22) \| 00(21-20) \| Vn(19-16) \|

2374 // Vd(15-12) \| 101(11-9) \| sz(8)=1 \| N(7)=? \| 0(6) \| M=?(5) \| 0(4) \| Vm(3-0)	2441 // Vd(15-12) \| 101(11-9) \| sz=1(8) \| N(7) \| 0(6) \| M(5) \| 0(4) \| Vm(3-0)

2375 ASSERT(CpuFeatures::IsEnabled(VFP2));	2442 ASSERT(CpuFeatures::IsEnabled(VFP2));

2376 emit(cond \| 0xEB24 \| B23 \| src1.code()B16 \|	2443 int vd, d;

2377 dst.code()B12 \| 0x5B9 \| B8 \| src2.code());	2444 dst.split_code(&vd, &d);

	2445 int vn, n;

	2446 src1.split_code(&vn, &n);

	2447 int vm, m;

	2448 src2.split_code(&vm, &m);

	2449 emit(cond \| 0x1DB23 \| dB22 \| vnB16 \| vdB12 \| 0x5B9 \| B8 \| nB7 \| m*B5 \|

	2450 vm);

2378 }	2451 }

2379	2452

2380	2453

2381 void Assembler::vcmp(const DwVfpRegister src1,	2454 void Assembler::vcmp(const DwVfpRegister src1,

2382 const DwVfpRegister src2,	2455 const DwVfpRegister src2,

2383 const Condition cond) {	2456 const Condition cond) {

2384 // vcmp(Dd, Dm) double precision floating point comparison.	2457 // vcmp(Dd, Dm) double precision floating point comparison.

2385 // Instruction details available in ARM DDI 0406A, A8-570.	2458 // Instruction details available in ARM DDI 0406C.b, A8-864.

2386 // cond(31-28) \| 11101 (27-23)\| D=?(22) \| 11 (21-20) \| 0100 (19-16) \|	2459 // cond(31-28) \| 11101(27-23)\| D(22) \| 11(21-20) \| 0100(19-16) \|

2387 // Vd(15-12) \| 101(11-9) \| sz(8)=1 \| E(7)=0 \| 1(6) \| M(5)=? \| 0(4) \| Vm(3-0)	2460 // Vd(15-12) \| 101(11-9) \| sz=1(8) \| E=0(7) \| 1(6) \| M(5) \| 0(4) \| Vm(3-0)

2388 ASSERT(CpuFeatures::IsEnabled(VFP2));	2461 ASSERT(CpuFeatures::IsEnabled(VFP2));

2389 emit(cond \| 0xEB24 \|B23 \| 0x3B20 \| B18 \|	2462 int vd, d;

2390 src1.code()B12 \| 0x5B9 \| B8 \| B6 \| src2.code());	2463 src1.split_code(&vd, &d);

	2464 int vm, m;

	2465 src2.split_code(&vm, &m);

	2466 emit(cond \| 0x1DB23 \| dB22 \| 0x3B20 \| 0x4B16 \| vdB12 \| 0x5B9 \| B8 \| B6 \|

	2467 m*B5 \| vm);

2391 }	2468 }

2392	2469

2393	2470

2394 void Assembler::vcmp(const DwVfpRegister src1,	2471 void Assembler::vcmp(const DwVfpRegister src1,

2395 const double src2,	2472 const double src2,

2396 const Condition cond) {	2473 const Condition cond) {

2397 // vcmp(Dd, Dm) double precision floating point comparison.	2474 // vcmp(Dd, #0.0) double precision floating point comparison.

2398 // Instruction details available in ARM DDI 0406A, A8-570.	2475 // Instruction details available in ARM DDI 0406C.b, A8-864.

2399 // cond(31-28) \| 11101 (27-23)\| D=?(22) \| 11 (21-20) \| 0101 (19-16) \|	2476 // cond(31-28) \| 11101(27-23)\| D(22) \| 11(21-20) \| 0101(19-16) \|

2400 // Vd(15-12) \| 101(11-9) \| sz(8)=1 \| E(7)=0 \| 1(6) \| M(5)=? \| 0(4) \| 0000(3-0)	2477 // Vd(15-12) \| 101(11-9) \| sz=1(8) \| E=0(7) \| 1(6) \| 0(5) \| 0(4) \| 0000(3-0)

2401 ASSERT(CpuFeatures::IsEnabled(VFP2));	2478 ASSERT(CpuFeatures::IsEnabled(VFP2));

2402 ASSERT(src2 == 0.0);	2479 ASSERT(src2 == 0.0);

2403 emit(cond \| 0xEB24 \|B23 \| 0x3B20 \| B18 \| B16 \|	2480 int vd, d;

2404 src1.code()B12 \| 0x5B9 \| B8 \| B6);	2481 src1.split_code(&vd, &d);

	2482 emit(cond \| 0x1DB23 \| dB22 \| 0x3B20 \| 0x5B16 \| vdB12 \| 0x5B9 \| B8 \| B6);

2405 }	2483 }

2406	2484

2407	2485

2408 void Assembler::vmsr(Register dst, Condition cond) {	2486 void Assembler::vmsr(Register dst, Condition cond) {

2409 // Instruction details available in ARM DDI 0406A, A8-652.	2487 // Instruction details available in ARM DDI 0406A, A8-652.

2410 // cond(31-28) \| 1110 (27-24) \| 1110(23-20)\| 0001 (19-16) \|	2488 // cond(31-28) \| 1110 (27-24) \| 1110(23-20)\| 0001 (19-16) \|

2411 // Rt(15-12) \| 1010 (11-8) \| 0(7) \| 00 (6-5) \| 1(4) \| 0000(3-0)	2489 // Rt(15-12) \| 1010 (11-8) \| 0(7) \| 00 (6-5) \| 1(4) \| 0000(3-0)

2412 ASSERT(CpuFeatures::IsEnabled(VFP2));	2490 ASSERT(CpuFeatures::IsEnabled(VFP2));

2413 emit(cond \| 0xEB24 \| 0xEB20 \| B16 \|	2491 emit(cond \| 0xEB24 \| 0xEB20 \| B16 \|

2414 dst.code()B12 \| 0xAB8 \| B4);	2492 dst.code()B12 \| 0xAB8 \| B4);

2415 }	2493 }

2416	2494

2417	2495

2418 void Assembler::vmrs(Register dst, Condition cond) {	2496 void Assembler::vmrs(Register dst, Condition cond) {

2419 // Instruction details available in ARM DDI 0406A, A8-652.	2497 // Instruction details available in ARM DDI 0406A, A8-652.

2420 // cond(31-28) \| 1110 (27-24) \| 1111(23-20)\| 0001 (19-16) \|	2498 // cond(31-28) \| 1110 (27-24) \| 1111(23-20)\| 0001 (19-16) \|

2421 // Rt(15-12) \| 1010 (11-8) \| 0(7) \| 00 (6-5) \| 1(4) \| 0000(3-0)	2499 // Rt(15-12) \| 1010 (11-8) \| 0(7) \| 00 (6-5) \| 1(4) \| 0000(3-0)

2422 ASSERT(CpuFeatures::IsEnabled(VFP2));	2500 ASSERT(CpuFeatures::IsEnabled(VFP2));

2423 emit(cond \| 0xEB24 \| 0xFB20 \| B16 \|	2501 emit(cond \| 0xEB24 \| 0xFB20 \| B16 \|

2424 dst.code()B12 \| 0xAB8 \| B4);	2502 dst.code()B12 \| 0xAB8 \| B4);

2425 }	2503 }

2426	2504

2427	2505

2428 void Assembler::vsqrt(const DwVfpRegister dst,	2506 void Assembler::vsqrt(const DwVfpRegister dst,

2429 const DwVfpRegister src,	2507 const DwVfpRegister src,

2430 const Condition cond) {	2508 const Condition cond) {

2431 // cond(31-28) \| 11101 (27-23)\| D=?(22) \| 11 (21-20) \| 0001 (19-16) \|	2509 // Instruction details available in ARM DDI 0406C.b, A8-1058.

2432 // Vd(15-12) \| 101(11-9) \| sz(8)=1 \| 11 (7-6) \| M(5)=? \| 0(4) \| Vm(3-0)	2510 // cond(31-28) \| 11101(27-23)\| D(22) \| 11(21-20) \| 0001(19-16) \|

	2511 // Vd(15-12) \| 101(11-9) \| sz=1(8) \| 11(7-6) \| M(5) \| 0(4) \| Vm(3-0)

2433 ASSERT(CpuFeatures::IsEnabled(VFP2));	2512 ASSERT(CpuFeatures::IsEnabled(VFP2));

2434 emit(cond \| 0xEB24 \| B23 \| 0x3B20 \| B16 \|	2513 int vd, d;

2435 dst.code()B12 \| 0x5B9 \| B8 \| 3*B6 \| src.code());	2514 dst.split_code(&vd, &d);

	2515 int vm, m;

	2516 src.split_code(&vm, &m);

	2517 emit(cond \| 0x1DB23 \| dB22 \| 0x3B20 \| B16 \| vdB12 \| 0x5B9 \| B8 \| 0x3B6 \|

	2518 m*B5 \| vm);

2436 }	2519 }

2437	2520

2438	2521

2439 // Pseudo instructions.	2522 // Pseudo instructions.

2440 void Assembler::nop(int type) {	2523 void Assembler::nop(int type) {

2441 // ARMv6{K/T2} and v7 have an actual NOP instruction but it serializes	2524 // ARMv6{K/T2} and v7 have an actual NOP instruction but it serializes

2442 // some of the CPU's pipeline and has to issue. Older ARM chips simply used	2525 // some of the CPU's pipeline and has to issue. Older ARM chips simply used

2443 // MOV Rx, Rx as NOP and it performs better even in newer CPUs.	2526 // MOV Rx, Rx as NOP and it performs better even in newer CPUs.

2444 // We therefore use MOV Rx, Rx, even on newer CPUs, and use Rx to encode	2527 // We therefore use MOV Rx, Rx, even on newer CPUs, and use Rx to encode

2445 // a type.	2528 // a type.

(...skipping 297 matching lines...) Expand 10 before \| Expand all \| Expand 10 after Loading...
2743	2826

2744 // Since a constant pool was just emitted, move the check offset forward by	2827 // Since a constant pool was just emitted, move the check offset forward by

2745 // the standard interval.	2828 // the standard interval.

2746 next_buffer_check_ = pc_offset() + kCheckPoolInterval;	2829 next_buffer_check_ = pc_offset() + kCheckPoolInterval;

2747 }	2830 }

2748	2831

2749	2832

2750 } } // namespace v8::internal	2833 } } // namespace v8::internal

2751	2834

2752 #endif // V8_TARGET_ARCH_ARM	2835 #endif // V8_TARGET_ARCH_ARM

OLD	NEW

« no previous file with comments | « src/arm/assembler-arm.h ('k') | src/arm/assembler-arm-inl.h » ('j') | src/arm/code-stubs-arm.h » ('J')