Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(947)

Side by Side Diff: courgette/disassembler_elf_32_arm.cc

Issue 1792603006: Revert of [Courgette] Clean up Disassembler; fix ELF Memory leaks. (Closed) Base URL: https://chromium.googlesource.com/chromium/src.git@master
Patch Set: Created 4 years, 9 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View unified diff | Download patch
« no previous file with comments | « courgette/disassembler_elf_32_arm.h ('k') | courgette/disassembler_elf_32_x86.h » ('j') | no next file with comments »
Toggle Intra-line Diffs ('i') | Expand Comments ('e') | Collapse Comments ('c') | Show Comments Hide Comments ('s')
OLDNEW
1 // Copyright 2013 The Chromium Authors. All rights reserved. 1 // Copyright 2013 The Chromium Authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be 2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file. 3 // found in the LICENSE file.
4 4
5 #include "courgette/disassembler_elf_32_arm.h" 5 #include "courgette/disassembler_elf_32_arm.h"
6 6
7 #include <stddef.h>
8 #include <stdint.h>
9
10 #include <algorithm>
11 #include <string>
7 #include <vector> 12 #include <vector>
8 13
9 #include "base/logging.h" 14 #include "base/logging.h"
10 #include "base/memory/scoped_ptr.h" 15
11 #include "courgette/assembly_program.h" 16 #include "courgette/assembly_program.h"
12 #include "courgette/courgette.h" 17 #include "courgette/courgette.h"
18 #include "courgette/encoded_program.h"
13 19
14 namespace courgette { 20 namespace courgette {
15 21
16 CheckBool DisassemblerElf32ARM::Compress(ARM_RVA type, 22 CheckBool DisassemblerElf32ARM::Compress(ARM_RVA type,
17 uint32_t arm_op, 23 uint32_t arm_op,
18 RVA rva, 24 RVA rva,
19 uint16_t* c_op, 25 uint16_t* c_op,
20 uint32_t* addr) { 26 uint32_t* addr) {
21 // Notation for bit ranges in comments: 27 // This method takes an ARM or thumb opcode, extracts the relative
22 // - Listing bits from highest to lowest. 28 // target address from it (addr), and creates a corresponding
23 // - A-Z or (j1), (j2), etc.: single bit in source. 29 // Courgette opcode (c_op).
24 // - a-z: multiple, consecutive bits in source. 30 //
31 // Details on ARM the opcodes, and how the relative targets are
32 // computed were taken from the "ARM Architecture Reference Manual",
33 // section A4.1.5 and the "Thumb-2 supplement", section 4.6.12.
34 // ARM_OFF24 is for the ARM opcode. The rest are for thumb opcodes.
25 switch (type) { 35 switch (type) {
26 case ARM_OFF8: { 36 case ARM_OFF8: {
27 // Encoding T1. 37 // The offset is given by lower 8 bits of the op. It is a 9-bit
28 // The offset is given by lower 8 bits of the op. It is a 9-bit offset, 38 // offset, shifted right one bit and signed extended.
29 // shifted right 1 bit, and signed extended.
30 // arm_op = aaaaaaaa Snnnnnnn
31 // *addr := SSSSSSSS SSSSSSSS SSSSSSSS nnnnnnn0 + 100
32 // *c_op := 00010000 aaaaaaaa
33 uint32_t temp = (arm_op & 0x00FF) << 1; 39 uint32_t temp = (arm_op & 0x00FF) << 1;
34 if (temp & 0x0100) 40 if (temp & 0x0100)
35 temp |= 0xFFFFFE00; 41 temp |= 0xFFFFFE00;
36 temp += 4; // Offset from _next_ PC. 42 temp += 4; // Offset from _next_ PC.
43 fflush(stdout);
37 44
38 (*addr) = temp; 45 (*addr) = temp;
39 (*c_op) = static_cast<uint16_t>(arm_op >> 8) | 0x1000; 46 (*c_op) = static_cast<uint16_t>(arm_op >> 8) | 0x1000;
40 break; 47 break;
41 } 48 }
42 case ARM_OFF11: { 49 case ARM_OFF11: {
43 // Encoding T2. 50 // The offset is given by lower 11 bits of the op, and is a
44 // The offset is given by lower 11 bits of the op, and is a 12-bit offset, 51 // 12-bit offset, shifted right one bit and sign extended.
45 // shifted right 1 bit, and sign extended.
46 // arm_op = aaaaaSnn nnnnnnnn
47 // *addr := SSSSSSSS SSSSSSSS SSSSSnnn nnnnnnn0 + 100
48 // *c_op := 00100000 000aaaaa
49 uint32_t temp = (arm_op & 0x07FF) << 1; 52 uint32_t temp = (arm_op & 0x07FF) << 1;
50 if (temp & 0x00000800) 53 if (temp & 0x00000800)
51 temp |= 0xFFFFF000; 54 temp |= 0xFFFFF000;
52 temp += 4; // Offset from _next_ PC. 55 temp += 4; // Offset from _next_ PC.
53 56
54 (*addr) = temp; 57 (*addr) = temp;
55 (*c_op) = static_cast<uint16_t>(arm_op >> 11) | 0x2000; 58 (*c_op) = static_cast<uint16_t>(arm_op >> 11) | 0x2000;
56 break; 59 break;
57 } 60 }
58 case ARM_OFF24: { 61 case ARM_OFF24: {
59 // The offset is given by the lower 24-bits of the op, shifted 62 // The offset is given by the lower 24-bits of the op, shifted
60 // left 2 bits, and sign extended. 63 // left 2 bits, and sign extended.
61 // arm_op = aaaaaaaa Snnnnnnn nnnnnnnn nnnnnnnn
62 // *addr := SSSSSSSn nnnnnnnn nnnnnnnn nnnnnn00 + 1000
63 // *c_op := 00110000 aaaaaaaa
64 uint32_t temp = (arm_op & 0x00FFFFFF) << 2; 64 uint32_t temp = (arm_op & 0x00FFFFFF) << 2;
65 if (temp & 0x02000000) 65 if (temp & 0x02000000)
66 temp |= 0xFC000000; 66 temp |= 0xFC000000;
67 temp += 8; 67 temp += 8;
68 68
69 (*addr) = temp; 69 (*addr) = temp;
70 (*c_op) = (arm_op >> 24) | 0x3000; 70 (*c_op) = (arm_op >> 24) | 0x3000;
71 break; 71 break;
72 } 72 }
73 case ARM_OFF25: { 73 case ARM_OFF25: {
74 // Encoding T4.
75 // arm_op = aaaaaSmm mmmmmmmm BC(j1)D(j2)nnn nnnnnnnn
76 // where CD is in {01, 10, 11}
77 // i1 := ~(j1 ^ S)
78 // i2 := ~(j2 ^ S)
79 // If CD == 10:
80 // pppp := (rva % 4 == 0) ? 0100 : 0010
81 // Else:
82 // pppp := 0100
83 // *addr := SSSSSSSS (i1)(i2)mmmmmm mmmmnnnn nnnnnnn0 + pppp
84 // *c_op := 0100pppp aaaaaBCD
85 // TODO(huangs): aaaaa = 11110 and B = 1 always? Investigate and fix.
86 uint32_t temp = 0; 74 uint32_t temp = 0;
87 temp |= (arm_op & 0x000007FF) << 1; // imm11 75 temp |= (arm_op & 0x000007FF) << 1; // imm11
88 temp |= (arm_op & 0x03FF0000) >> 4; // imm10 76 temp |= (arm_op & 0x03FF0000) >> 4; // imm10
89 77
90 uint32_t S = (arm_op & (1 << 26)) >> 26; 78 uint32_t S = (arm_op & (1 << 26)) >> 26;
91 uint32_t j2 = (arm_op & (1 << 11)) >> 11; 79 uint32_t j2 = (arm_op & (1 << 11)) >> 11;
92 uint32_t j1 = (arm_op & (1 << 13)) >> 13; 80 uint32_t j1 = (arm_op & (1 << 13)) >> 13;
93 bool bit12 = ((arm_op & (1 << 12)) >> 12) != 0; // D 81 bool bit12 = ((arm_op & (1 << 12)) >> 12) != 0;
94 bool bit14 = ((arm_op & (1 << 14)) >> 14) != 0; // C 82 bool bit14 = ((arm_op & (1 << 14)) >> 14) != 0;
95 83
96 uint32_t i2 = ~(j2 ^ S) & 1; 84 uint32_t i2 = ~(j2 ^ S) & 1;
97 uint32_t i1 = ~(j1 ^ S) & 1; 85 uint32_t i1 = ~(j1 ^ S) & 1;
98 bool toARM = bit14 && !bit12; 86 bool toARM = bit14 && !bit12;
99 87
100 temp |= (S << 24) | (i1 << 23) | (i2 << 22); 88 temp |= (S << 24) | (i1 << 23) | (i2 << 22);
101 89
102 if (temp & 0x01000000) // sign extension 90 if (temp & 0x01000000) // sign extension
103 temp |= 0xFE000000; 91 temp |= 0xFE000000;
104 uint32_t prefetch; 92 uint32_t prefetch;
105 if (toARM) { 93 if (toARM) {
106 // Align PC on 4-byte boundary. 94 // Align PC on 4-byte boundary
107 uint32_t align4byte = (rva % 4) ? 2 : 4; 95 uint32_t align4byte = (rva % 4) ? 2 : 4;
108 prefetch = align4byte; 96 prefetch = align4byte;
109 } else { 97 } else {
110 prefetch = 4; 98 prefetch = 4;
111 } 99 }
112 temp += prefetch; 100 temp += prefetch;
113 (*addr) = temp; 101 (*addr) = temp;
114 102
115 uint32_t temp2 = 0x4000; 103 uint32_t temp2 = 0x4000;
116 temp2 |= (arm_op & (1 << 12)) >> 12; // .......D 104 temp2 |= (arm_op & (1 << 12)) >> 12;
117 temp2 |= (arm_op & (1 << 14)) >> 13; // ......C. 105 temp2 |= (arm_op & (1 << 14)) >> 13;
118 temp2 |= (arm_op & (1 << 15)) >> 13; // .....B.. 106 temp2 |= (arm_op & (1 << 15)) >> 13;
119 temp2 |= (arm_op & 0xF8000000) >> 24; // aaaaa... 107 temp2 |= (arm_op & 0xF8000000) >> 24;
120 temp2 |= (prefetch & 0x0000000F) << 8; 108 temp2 |= (prefetch & 0x0000000F) << 8;
121 (*c_op) = static_cast<uint16_t>(temp2); 109 (*c_op) = static_cast<uint16_t>(temp2);
122 break; 110 break;
123 } 111 }
124 case ARM_OFF21: { 112 case ARM_OFF21: {
125 // Encoding T3.
126 // arm_op = 11110Scc ccmmmmmm 10(j1)0(j2)nnn nnnnnnnn
127 // *addr := SSSSSSSS SSSS(j1)(j2)mm mmmmnnnn nnnnnnn0 + 100
128 // *c_op := 01010000 0000cccc
129 uint32_t temp = 0; 113 uint32_t temp = 0;
130 temp |= (arm_op & 0x000007FF) << 1; // imm11 114 temp |= (arm_op & 0x000007FF) << 1; // imm11
131 temp |= (arm_op & 0x003F0000) >> 4; // imm6 115 temp |= (arm_op & 0x003F0000) >> 4; // imm6
132 116
133 uint32_t S = (arm_op & (1 << 26)) >> 26; 117 uint32_t S = (arm_op & (1 << 26)) >> 26;
134 // TODO(huangs): Check with docs: Perhaps j1, j2 should swap?
135 uint32_t j2 = (arm_op & (1 << 11)) >> 11; 118 uint32_t j2 = (arm_op & (1 << 11)) >> 11;
136 uint32_t j1 = (arm_op & (1 << 13)) >> 13; 119 uint32_t j1 = (arm_op & (1 << 13)) >> 13;
137 120
138 temp |= (S << 20) | (j1 << 19) | (j2 << 18); 121 temp |= (S << 20) | (j1 << 19) | (j2 << 18);
139 122
140 if (temp & 0x00100000) // sign extension 123 if (temp & 0x00100000) // sign extension
141 temp |= 0xFFE00000; 124 temp |= 0xFFE00000;
142 temp += 4; 125 temp += 4;
143 (*addr) = temp; 126 (*addr) = temp;
144 127
145 uint32_t temp2 = 0x5000; 128 uint32_t temp2 = 0x5000;
146 temp2 |= (arm_op & 0x03C00000) >> 22; // just save the cond 129 temp2 |= (arm_op & 0x03C00000) >> 22; // just save the cond
147 (*c_op) = static_cast<uint16_t>(temp2); 130 (*c_op) = static_cast<uint16_t>(temp2);
148 break; 131 break;
149 } 132 }
150 default: 133 default:
151 return false; 134 return false;
152 } 135 }
153 return true; 136 return true;
154 } 137 }
155 138
156 CheckBool DisassemblerElf32ARM::Decompress(ARM_RVA type, 139 CheckBool DisassemblerElf32ARM::Decompress(ARM_RVA type,
157 uint16_t c_op, 140 uint16_t c_op,
158 uint32_t addr, 141 uint32_t addr,
159 uint32_t* arm_op) { 142 uint32_t* arm_op) {
143 // Reverses the process in the compress() method. Takes the
144 // Courgette op and relative address and reconstructs the original
145 // ARM or thumb op.
160 switch (type) { 146 switch (type) {
161 case ARM_OFF8: 147 case ARM_OFF8:
162 // addr = SSSSSSSS SSSSSSSS SSSSSSSS nnnnnnn0 + 100
163 // c_op = 00010000 aaaaaaaa
164 // *arm_op := aaaaaaaa Snnnnnnn
165 (*arm_op) = ((c_op & 0x0FFF) << 8) | (((addr - 4) >> 1) & 0x000000FF); 148 (*arm_op) = ((c_op & 0x0FFF) << 8) | (((addr - 4) >> 1) & 0x000000FF);
166 break; 149 break;
167 case ARM_OFF11: 150 case ARM_OFF11:
168 // addr = SSSSSSSS SSSSSSSS SSSSSnnn nnnnnnn0 + 100
169 // c_op = 00100000 000aaaaa
170 // *arm_op := aaaaaSnn nnnnnnnn
171 (*arm_op) = ((c_op & 0x0FFF) << 11) | (((addr - 4) >> 1) & 0x000007FF); 151 (*arm_op) = ((c_op & 0x0FFF) << 11) | (((addr - 4) >> 1) & 0x000007FF);
172 break; 152 break;
173 case ARM_OFF24: 153 case ARM_OFF24:
174 // addr = SSSSSSSn nnnnnnnn nnnnnnnn nnnnnn00 + 1000
175 // c_op = 00110000 aaaaaaaa
176 // *arm_op := aaaaaaaa Snnnnnnn nnnnnnnn nnnnnnnn
177 (*arm_op) = ((c_op & 0x0FFF) << 24) | (((addr - 8) >> 2) & 0x00FFFFFF); 154 (*arm_op) = ((c_op & 0x0FFF) << 24) | (((addr - 8) >> 2) & 0x00FFFFFF);
178 break; 155 break;
179 case ARM_OFF25: { 156 case ARM_OFF25: {
180 // addr = SSSSSSSS (i1)(i2)mmmmmm mmmmnnnn nnnnnnn0 + pppp
181 // c_op = 0100pppp aaaaaBCD
182 // j1 := ~i1 ^ S
183 // j2 := ~i2 ^ S
184 // *arm_op := aaaaaSmm mmmmmmmm BC(j1)D(j2)nnn nnnnnnnn
185 uint32_t temp = 0; 157 uint32_t temp = 0;
186 temp |= (c_op & (1 << 0)) << 12; 158 temp |= (c_op & (1 << 0)) << 12;
187 temp |= (c_op & (1 << 1)) << 13; 159 temp |= (c_op & (1 << 1)) << 13;
188 temp |= (c_op & (1 << 2)) << 13; 160 temp |= (c_op & (1 << 2)) << 13;
189 temp |= (c_op & (0xF8000000 >> 24)) << 24; 161 temp |= (c_op & (0xF8000000 >> 24)) << 24;
190 162
191 uint32_t prefetch = (c_op & 0x0F00) >> 8; 163 uint32_t prefetch = (c_op & 0x0F00) >> 8;
192 addr -= prefetch; 164 addr -= prefetch;
193 165
194 addr &= 0x01FFFFFF; 166 addr &= 0x01FFFFFF;
195 167
196 uint32_t S = (addr & (1 << 24)) >> 24; 168 uint32_t S = (addr & (1 << 24)) >> 24;
197 uint32_t i1 = (addr & (1 << 23)) >> 23; 169 uint32_t i1 = (addr & (1 << 23)) >> 23;
198 uint32_t i2 = (addr & (1 << 22)) >> 22; 170 uint32_t i2 = (addr & (1 << 22)) >> 22;
199 171
200 uint32_t j1 = ((~i1) ^ S) & 1; 172 uint32_t j1 = ((~i1) ^ S) & 1;
201 uint32_t j2 = ((~i2) ^ S) & 1; 173 uint32_t j2 = ((~i2) ^ S) & 1;
202 174
203 temp |= S << 26; 175 temp |= S << 26;
204 temp |= j2 << 11; 176 temp |= j2 << 11;
205 temp |= j1 << 13; 177 temp |= j1 << 13;
206 178
207 temp |= (addr & (0x000007FF << 1)) >> 1; 179 temp |= (addr & (0x000007FF << 1)) >> 1;
208 temp |= (addr & (0x03FF0000 >> 4)) << 4; 180 temp |= (addr & (0x03FF0000 >> 4)) << 4;
209 181
210 (*arm_op) = temp; 182 (*arm_op) = temp;
211 break; 183 break;
212 } 184 }
213 case ARM_OFF21: { 185 case ARM_OFF21: {
214 // addr = SSSSSSSS SSSS(j1)(j2)mm mmmmnnnn nnnnnnn0 + 100
215 // c_op = 01010000 0000cccc
216 // *arm_op := 11110Scc ccmmmmmm 10(j1)0(j2)nnn nnnnnnnn
217 uint32_t temp = 0xF0008000; 186 uint32_t temp = 0xF0008000;
218 temp |= (c_op & (0x03C00000 >> 22)) << 22; 187 temp |= (c_op & (0x03C00000 >> 22)) << 22;
219 188
220 addr -= 4; 189 addr -= 4;
221 addr &= 0x001FFFFF; 190 addr &= 0x001FFFFF;
222 191
223 uint32_t S = (addr & (1 << 20)) >> 20; 192 uint32_t S = (addr & (1 << 20)) >> 20;
224 uint32_t j1 = (addr & (1 << 19)) >> 19; 193 uint32_t j1 = (addr & (1 << 19)) >> 19;
225 uint32_t j2 = (addr & (1 << 18)) >> 18; 194 uint32_t j2 = (addr & (1 << 18)) >> 18;
226 195
(...skipping 27 matching lines...) Expand all
254 return 4; 223 return 4;
255 default: 224 default:
256 return 0xFFFF; 225 return 0xFFFF;
257 } 226 }
258 } 227 }
259 228
260 CheckBool DisassemblerElf32ARM::TypedRVAARM::ComputeRelativeTarget( 229 CheckBool DisassemblerElf32ARM::TypedRVAARM::ComputeRelativeTarget(
261 const uint8_t* op_pointer) { 230 const uint8_t* op_pointer) {
262 arm_op_ = op_pointer; 231 arm_op_ = op_pointer;
263 switch (type_) { 232 switch (type_) {
264 case ARM_OFF8: // Falls through. 233 case ARM_OFF8:
234 // Fall through
265 case ARM_OFF11: { 235 case ARM_OFF11: {
266 RVA relative_target; 236 RVA relative_target;
267 CheckBool ret = Compress(type_, 237 CheckBool ret = Compress(type_, Read16LittleEndian(op_pointer), rva(),
268 Read16LittleEndian(op_pointer), 238 &c_op_, &relative_target);
269 rva(),
270 &c_op_,
271 &relative_target);
272 set_relative_target(relative_target); 239 set_relative_target(relative_target);
273 return ret; 240 return ret;
274 } 241 }
275 case ARM_OFF24: { 242 case ARM_OFF24: {
276 RVA relative_target; 243 RVA relative_target;
277 CheckBool ret = Compress(type_, 244 CheckBool ret = Compress(type_, Read32LittleEndian(op_pointer), rva(),
278 Read32LittleEndian(op_pointer), 245 &c_op_, &relative_target);
279 rva(),
280 &c_op_,
281 &relative_target);
282 set_relative_target(relative_target); 246 set_relative_target(relative_target);
283 return ret; 247 return ret;
284 } 248 }
285 case ARM_OFF25: // Falls through. 249 case ARM_OFF25:
250 // Fall through
286 case ARM_OFF21: { 251 case ARM_OFF21: {
287 // A thumb-2 op is 32 bits stored as two 16-bit words 252 // A thumb-2 op is 32 bits stored as two 16-bit words
288 uint32_t pval = (Read16LittleEndian(op_pointer) << 16) | 253 uint32_t pval = (Read16LittleEndian(op_pointer) << 16) |
289 Read16LittleEndian(op_pointer + 2); 254 Read16LittleEndian(op_pointer + 2);
290 RVA relative_target; 255 RVA relative_target;
291 CheckBool ret = Compress(type_, pval, rva(), &c_op_, &relative_target); 256 CheckBool ret = Compress(type_, pval, rva(), &c_op_, &relative_target);
292 set_relative_target(relative_target); 257 set_relative_target(relative_target);
293 return ret; 258 return ret;
294 } 259 }
295 default: 260 default:
296 return false; 261 return false;
297 } 262 }
298 } 263 }
299 264
300 CheckBool DisassemblerElf32ARM::TypedRVAARM::EmitInstruction( 265 CheckBool DisassemblerElf32ARM::TypedRVAARM::EmitInstruction(
301 AssemblyProgram* program, 266 AssemblyProgram* program,
302 RVA target_rva) { 267 RVA target_rva) {
303 return program->EmitRel32ARM(c_op(), 268 return program->EmitRel32ARM(c_op(),
304 program->FindOrMakeRel32Label(target_rva), 269 program->FindOrMakeRel32Label(target_rva),
305 arm_op_, 270 arm_op_,
306 op_size()); 271 op_size());
307 } 272 }
308 273
309 DisassemblerElf32ARM::DisassemblerElf32ARM(const void* start, size_t length) 274 DisassemblerElf32ARM::DisassemblerElf32ARM(const void* start, size_t length)
310 : DisassemblerElf32(start, length) { 275 : DisassemblerElf32(start, length) {
311 } 276 }
312 277
313 // Convert an ELF relocation struction into an RVA. 278 // Convert an ELF relocation struction into an RVA
314 CheckBool DisassemblerElf32ARM::RelToRVA(Elf32_Rel rel, RVA* result) const { 279 CheckBool DisassemblerElf32ARM::RelToRVA(Elf32_Rel rel, RVA* result) const {
315 // The rightmost byte of r_info is the type. 280
281 // The rightmost byte of r_info is the type...
316 elf32_rel_arm_type_values type = 282 elf32_rel_arm_type_values type =
317 static_cast<elf32_rel_arm_type_values>(rel.r_info & 0xFF); 283 (elf32_rel_arm_type_values)(unsigned char)rel.r_info;
318 284
319 // The other 3 bytes of r_info are the symbol. 285 // The other 3 bytes of r_info are the symbol
320 uint32_t symbol = rel.r_info >> 8; 286 uint32_t symbol = rel.r_info >> 8;
321 287
322 switch (type) { 288 switch(type)
289 {
323 case R_ARM_RELATIVE: 290 case R_ARM_RELATIVE:
324 if (symbol != 0) 291 if (symbol != 0)
325 return false; 292 return false;
326 293
327 // This is a basic ABS32 relocation address. 294 // This is a basic ABS32 relocation address
328 *result = rel.r_offset; 295 *result = rel.r_offset;
329 return true; 296 return true;
330 297
331 default: 298 default:
332 return false; 299 return false;
333 } 300 }
334 } 301 }
335 302
336 CheckBool DisassemblerElf32ARM::ParseRelocationSection( 303 CheckBool DisassemblerElf32ARM::ParseRelocationSection(
337 const Elf32_Shdr* section_header, 304 const Elf32_Shdr *section_header,
338 AssemblyProgram* program) { 305 AssemblyProgram* program) {
339 // This method compresses a contiguous stretch of R_ARM_RELATIVE entries in 306 // This method compresses a contiguous stretch of R_ARM_RELATIVE
340 // the relocation table with a Courgette relocation table instruction. 307 // entries in the relocation table with a Courgette relocation table
341 // It skips any entries at the beginning that appear in a section that 308 // instruction. It skips any entries at the beginning that appear
342 // Courgette doesn't support, e.g. INIT. 309 // in a section that Courgette doesn't support, e.g. INIT.
343 //
344 // Specifically, the entries should be 310 // Specifically, the entries should be
345 // (1) In the same relocation table 311 // (1) In the same relocation table
346 // (2) Are consecutive 312 // (2) Are consecutive
347 // (3) Are sorted in memory address order 313 // (3) Are sorted in memory address order
348 // 314 //
349 // Happily, this is normally the case, but it's not required by spec so we 315 // Happily, this is normally the case, but it's not required by spec
350 // check, and just don't do it if we don't match up. 316 // so we check, and just don't do it if we don't match up.
351 // 317 //
352 // The expectation is that one relocation section will contain all of our 318 // The expectation is that one relocation section will contain
353 // R_ARM_RELATIVE entries in the expected order followed by assorted other 319 // all of our R_ARM_RELATIVE entries in the expected order followed
354 // entries we can't use special handling for. 320 // by assorted other entries we can't use special handling for.
355 321
356 bool match = true; 322 bool match = true;
357 323
358 // Walk all the bytes in the section, matching relocation table or not. 324 // Walk all the bytes in the section, matching relocation table or not
359 FileOffset file_offset = section_header->sh_offset; 325 size_t file_offset = section_header->sh_offset;
360 FileOffset section_end = section_header->sh_offset + section_header->sh_size; 326 size_t section_end = section_header->sh_offset + section_header->sh_size;
361 327
362 const Elf32_Rel* section_relocs_iter = reinterpret_cast<const Elf32_Rel*>( 328 Elf32_Rel *section_relocs_iter =
363 FileOffsetToPointer(section_header->sh_offset)); 329 (Elf32_Rel *)OffsetToPointer(section_header->sh_offset);
364 330
365 uint32_t section_relocs_count = 331 uint32_t section_relocs_count =
366 section_header->sh_size / section_header->sh_entsize; 332 section_header->sh_size / section_header->sh_entsize;
367 333
368 if (abs32_locations_.size() > section_relocs_count) 334 if (abs32_locations_.size() > section_relocs_count)
369 match = false; 335 match = false;
370 336
371 if (!abs32_locations_.empty()) { 337 if (!abs32_locations_.empty()) {
372 std::vector<RVA>::iterator reloc_iter = abs32_locations_.begin(); 338 std::vector<RVA>::iterator reloc_iter = abs32_locations_.begin();
373 339
374 for (uint32_t i = 0; i < section_relocs_count; ++i) { 340 for (uint32_t i = 0; i < section_relocs_count; i++) {
375 if (section_relocs_iter->r_offset == *reloc_iter) 341 if (section_relocs_iter->r_offset == *reloc_iter)
376 break; 342 break;
377 343
378 if (!ParseSimpleRegion(file_offset, 344 if (!ParseSimpleRegion(file_offset, file_offset + sizeof(Elf32_Rel),
379 file_offset + sizeof(Elf32_Rel), 345 program))
380 program)) {
381 return false; 346 return false;
382 }
383 347
384 file_offset += sizeof(Elf32_Rel); 348 file_offset += sizeof(Elf32_Rel);
385 ++section_relocs_iter; 349 ++section_relocs_iter;
386 } 350 }
387 351
388 while (match && (reloc_iter != abs32_locations_.end())) { 352 while (match && (reloc_iter != abs32_locations_.end())) {
389 if (section_relocs_iter->r_info != R_ARM_RELATIVE || 353 if (section_relocs_iter->r_info != R_ARM_RELATIVE ||
390 section_relocs_iter->r_offset != *reloc_iter) { 354 section_relocs_iter->r_offset != *reloc_iter)
391 match = false; 355 match = false;
392 }
393 356
394 ++section_relocs_iter; 357 section_relocs_iter++;
395 ++reloc_iter; 358 reloc_iter++;
396 file_offset += sizeof(Elf32_Rel); 359 file_offset += sizeof(Elf32_Rel);
397 } 360 }
398 361
399 if (match) { 362 if (match) {
400 // Skip over relocation tables 363 // Skip over relocation tables
401 if (!program->EmitElfARMRelocationInstruction()) 364 if (!program->EmitElfARMRelocationInstruction())
402 return false; 365 return false;
403 } 366 }
404 } 367 }
405 368
406 return ParseSimpleRegion(file_offset, section_end, program); 369 return ParseSimpleRegion(file_offset, section_end, program);
407 } 370 }
408 371
409 // TODO(huangs): Detect and avoid overlap with abs32 addresses.
410 CheckBool DisassemblerElf32ARM::ParseRel32RelocsFromSection( 372 CheckBool DisassemblerElf32ARM::ParseRel32RelocsFromSection(
411 const Elf32_Shdr* section_header) { 373 const Elf32_Shdr* section_header) {
412 FileOffset start_file_offset = section_header->sh_offset; 374 uint32_t start_file_offset = section_header->sh_offset;
413 FileOffset end_file_offset = start_file_offset + section_header->sh_size; 375 uint32_t end_file_offset = start_file_offset + section_header->sh_size;
414 376
415 const uint8_t* start_pointer = FileOffsetToPointer(start_file_offset); 377 const uint8_t* start_pointer = OffsetToPointer(start_file_offset);
416 const uint8_t* end_pointer = FileOffsetToPointer(end_file_offset); 378 const uint8_t* end_pointer = OffsetToPointer(end_file_offset);
417 379
418 // Quick way to convert from Pointer to RVA within a single Section is to 380 // Quick way to convert from Pointer to RVA within a single Section is to
419 // subtract |pointer_to_rva|. 381 // subtract 'pointer_to_rva'.
420 const uint8_t* const adjust_pointer_to_rva = 382 const uint8_t* const adjust_pointer_to_rva =
421 start_pointer - section_header->sh_addr; 383 start_pointer - section_header->sh_addr;
422 384
423 // Find the rel32 relocations. 385 // Find the rel32 relocations.
424 const uint8_t* p = start_pointer; 386 const uint8_t* p = start_pointer;
425 bool on_32bit = 1; // 32-bit ARM ops appear on 32-bit boundaries, so track it 387 bool on_32bit = 1; // 32-bit ARM ops appear on 32-bit boundaries, so track it
426 while (p < end_pointer) { 388 while (p < end_pointer) {
427 // Heuristic discovery of rel32 locations in instruction stream: are the 389 // Heuristic discovery of rel32 locations in instruction stream: are the
428 // next few bytes the start of an instruction containing a rel32 390 // next few bytes the start of an instruction containing a rel32
429 // addressing mode? 391 // addressing mode?
430 scoped_ptr<TypedRVAARM> rel32_rva; 392
393 TypedRVAARM* rel32_rva = NULL;
431 RVA target_rva = 0; 394 RVA target_rva = 0;
432 bool found = false; 395 bool found = false;
433 396
434 // 16-bit thumb ops 397 // 16-bit thumb ops
435 if (!found && p + 3 <= end_pointer) { 398 if (!found && (p + 3) <= end_pointer) {
436 uint16_t pval = Read16LittleEndian(p); 399 uint16_t pval = Read16LittleEndian(p);
437 if ((pval & 0xF000) == 0xD000) { 400 if ((pval & 0xF000) == 0xD000) {
438 RVA rva = static_cast<RVA>(p - adjust_pointer_to_rva); 401 RVA rva = static_cast<RVA>(p - adjust_pointer_to_rva);
439 402
440 rel32_rva.reset(new TypedRVAARM(ARM_OFF8, rva)); 403 rel32_rva = new TypedRVAARM(ARM_OFF8, rva);
441 if (!rel32_rva->ComputeRelativeTarget(p)) 404 if (!rel32_rva->ComputeRelativeTarget((uint8_t*)p)) {
442 return false; 405 return false;
443 406 }
444 target_rva = rel32_rva->rva() + rel32_rva->relative_target(); 407 target_rva = rel32_rva->rva() + rel32_rva->relative_target();
445 found = true; 408 found = true;
446 } else if ((pval & 0xF800) == 0xE000) { 409 } else if ((pval & 0xF800) == 0xE000) {
447 RVA rva = static_cast<RVA>(p - adjust_pointer_to_rva); 410 RVA rva = static_cast<RVA>(p - adjust_pointer_to_rva);
448 411
449 rel32_rva.reset(new TypedRVAARM(ARM_OFF11, rva)); 412 rel32_rva = new TypedRVAARM(ARM_OFF11, rva);
450 if (!rel32_rva->ComputeRelativeTarget(p)) 413 if (!rel32_rva->ComputeRelativeTarget((uint8_t*)p)) {
451 return false; 414 return false;
452 415 }
453 target_rva = rel32_rva->rva() + rel32_rva->relative_target(); 416 target_rva = rel32_rva->rva() + rel32_rva->relative_target();
454 found = true; 417 found = true;
455 } 418 }
456 } 419 }
457 420
458 // thumb-2 ops comprised of two 16-bit words. 421 // thumb-2 ops comprised of two 16-bit words
459 if (!found && p + 5 <= end_pointer) { 422 if (!found && (p + 5) <= end_pointer) {
460 // This is really two 16-bit words, not one 32-bit word. 423 // This is really two 16-bit words, not one 32-bit word.
461 uint32_t pval = (Read16LittleEndian(p) << 16) | Read16LittleEndian(p + 2); 424 uint32_t pval = (Read16LittleEndian(p) << 16) | Read16LittleEndian(p + 2);
462 if ((pval & 0xF8008000) == 0xF0008000) { 425 if ((pval & 0xF8008000) == 0xF0008000) {
463 // Covers thumb-2's 32-bit conditional/unconditional branches 426 // Covers thumb-2's 32-bit conditional/unconditional branches
464 if ((pval & (1 << 14)) || (pval & (1 << 12))) { 427
428 if ( (pval & (1 << 14)) || (pval & (1 << 12)) ) {
465 // A branch, with link, or with link and exchange. 429 // A branch, with link, or with link and exchange.
466 RVA rva = static_cast<RVA>(p - adjust_pointer_to_rva); 430 RVA rva = static_cast<RVA>(p - adjust_pointer_to_rva);
467 431
468 rel32_rva.reset(new TypedRVAARM(ARM_OFF25, rva)); 432 rel32_rva = new TypedRVAARM(ARM_OFF25, rva);
469 if (!rel32_rva->ComputeRelativeTarget(p)) 433 if (!rel32_rva->ComputeRelativeTarget((uint8_t*)p)) {
470 return false; 434 return false;
471 435 }
472 target_rva = rel32_rva->rva() + rel32_rva->relative_target(); 436 target_rva = rel32_rva->rva() + rel32_rva->relative_target();
473 found = true; 437 found = true;
474
475 } else { 438 } else {
476 // TODO(paulgazz) make sure cond is not 111 439 // TODO(paulgazz) make sure cond is not 111
477 // A conditional branch instruction 440 // A conditional branch instruction
478 RVA rva = static_cast<RVA>(p - adjust_pointer_to_rva); 441 RVA rva = static_cast<RVA>(p - adjust_pointer_to_rva);
479 442
480 rel32_rva.reset(new TypedRVAARM(ARM_OFF21, rva)); 443 rel32_rva = new TypedRVAARM(ARM_OFF21, rva);
481 if (!rel32_rva->ComputeRelativeTarget(p)) 444 if (!rel32_rva->ComputeRelativeTarget((uint8_t*)p)) {
482 return false; 445 return false;
483 446 }
484 target_rva = rel32_rva->rva() + rel32_rva->relative_target(); 447 target_rva = rel32_rva->rva() + rel32_rva->relative_target();
485 found = true; 448 found = true;
486 } 449 }
487 } 450 }
488 } 451 }
489 452
490 // 32-bit ARM ops. 453 // 32-bit ARM ops
491 if (!found && on_32bit && (p + 5) <= end_pointer) { 454 if (!found && on_32bit && (p + 5) <= end_pointer) {
492 uint32_t pval = Read32LittleEndian(p); 455 uint32_t pval = Read32LittleEndian(p);
493 if ((pval & 0x0E000000) == 0x0A000000) { 456 if ((pval & 0x0E000000) == 0x0A000000) {
494 // Covers both 0x0A 0x0B ARM relative branches 457 // Covers both 0x0A 0x0B ARM relative branches
495 RVA rva = static_cast<RVA>(p - adjust_pointer_to_rva); 458 RVA rva = static_cast<RVA>(p - adjust_pointer_to_rva);
496 459
497 rel32_rva.reset(new TypedRVAARM(ARM_OFF24, rva)); 460 rel32_rva = new TypedRVAARM(ARM_OFF24, rva);
498 if (!rel32_rva->ComputeRelativeTarget(p)) 461 if (!rel32_rva->ComputeRelativeTarget((uint8_t*)p)) {
499 return false; 462 return false;
500 463 }
501 target_rva = rel32_rva->rva() + rel32_rva->relative_target(); 464 target_rva = rel32_rva->rva() + rel32_rva->relative_target();
502 found = true; 465 found = true;
503 } 466 }
504 } 467 }
505 468
506 if (found && IsValidTargetRVA(target_rva)) { 469 if (found && IsValidRVA(target_rva)) {
507 uint16_t op_size = rel32_rva->op_size(); 470 rel32_locations_.push_back(rel32_rva);
508 rel32_locations_.push_back(rel32_rva.release());
509 #if COURGETTE_HISTOGRAM_TARGETS 471 #if COURGETTE_HISTOGRAM_TARGETS
510 ++rel32_target_rvas_[target_rva]; 472 ++rel32_target_rvas_[target_rva];
511 #endif 473 #endif
512 p += op_size; 474 p += rel32_rva->op_size();
513 475
514 // A tricky way to update the on_32bit flag. Here is the truth table: 476 // A tricky way to update the on_32bit flag. Here is the truth table:
515 // on_32bit | on_32bit size is 4 477 // on_32bit | on_32bit size is 4
516 // ---------+--------------------- 478 // ---------+---------------------
517 // 1 | 0 0 479 // 1 | 0 0
518 // 0 | 0 1 480 // 0 | 0 1
519 // 0 | 1 0 481 // 0 | 1 0
520 // 1 | 1 1 482 // 1 | 1 1
521 on_32bit = (~(on_32bit ^ (op_size == 4))) != 0; 483 on_32bit = (~(on_32bit ^ (rel32_rva->op_size() == 4))) != 0;
522 } else { 484 } else {
523 // Move 2 bytes at a time, but track 32-bit boundaries 485 // Move 2 bytes at a time, but track 32-bit boundaries
524 p += 2; 486 p += 2;
525 on_32bit = ((on_32bit + 1) % 2) != 0; 487 on_32bit = ((on_32bit + 1) % 2) != 0;
526 } 488 }
527 } 489 }
528 490
529 return true; 491 return true;
530 } 492 }
531 493
532 } // namespace courgette 494 } // namespace courgette
OLDNEW
« no previous file with comments | « courgette/disassembler_elf_32_arm.h ('k') | courgette/disassembler_elf_32_x86.h » ('j') | no next file with comments »

Powered by Google App Engine
This is Rietveld 408576698