1 /*
2  * Copyright (C) 2017 The Android Open Source Project
3  *
4  * Licensed under the Apache License, Version 2.0 (the "License");
5  * you may not use this file except in compliance with the License.
6  * You may obtain a copy of the License at
7  *
8  *      http://www.apache.org/licenses/LICENSE-2.0
9  *
10  * Unless required by applicable law or agreed to in writing, software
11  * distributed under the License is distributed on an "AS IS" BASIS,
12  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13  * See the License for the specific language governing permissions and
14  * limitations under the License.
15  */
16 
17 #include "slicer/bytecode_encoder.h"
18 #include "slicer/common.h"
19 #include "slicer/chronometer.h"
20 
21 #include <assert.h>
22 
23 namespace lir {
24 
25 // Pack a 16bit word: 00AA
Pack_Z_8(dex::u4 a)26 static dex::u2 Pack_Z_8(dex::u4 a) {
27   dex::u2 fa = (a & 0xff);
28   SLICER_CHECK(fa == a);
29   return fa;
30 }
31 
32 // Pack a 16bit word: AABB
Pack_8_8(dex::u4 a,dex::u4 b)33 static dex::u2 Pack_8_8(dex::u4 a, dex::u4 b) {
34   dex::u2 fa = (a & 0xff);
35   SLICER_CHECK(fa == a);
36   dex::u2 fb = (b & 0xff);
37   SLICER_CHECK(fb == b);
38   return (fa << 8) | fb;
39 }
40 
41 // Pack a 16bit word: ABCC
Pack_4_4_8(dex::u4 a,dex::u4 b,dex::u4 c)42 static dex::u2 Pack_4_4_8(dex::u4 a, dex::u4 b, dex::u4 c) {
43   dex::u2 fa = (a & 0xf);
44   SLICER_CHECK(fa == a);
45   dex::u2 fb = (b & 0xf);
46   SLICER_CHECK(fb == b);
47   dex::u2 fc = (c & 0xff);
48   SLICER_CHECK(fc == c);
49   return (fa << 12) | (fb << 8) | fc;
50 }
51 
52 // Pack a 16bit word: ABCD
Pack_4_4_4_4(dex::u4 a,dex::u4 b,dex::u4 c,dex::u4 d)53 static dex::u2 Pack_4_4_4_4(dex::u4 a, dex::u4 b, dex::u4 c, dex::u4 d) {
54   dex::u2 fa = (a & 0xf);
55   SLICER_CHECK(fa == a);
56   dex::u2 fb = (b & 0xf);
57   SLICER_CHECK(fb == b);
58   dex::u2 fc = (c & 0xf);
59   SLICER_CHECK(fc == c);
60   dex::u2 fd = (d & 0xf);
61   SLICER_CHECK(fd == d);
62   return (fa << 12) | (fb << 8) | (fc << 4) | fd;
63 }
64 
65 // Pack a 16bit word: AAAA
Pack_16(dex::u4 a)66 static dex::u2 Pack_16(dex::u4 a) {
67   dex::u2 fa = (a & 0xffff);
68   SLICER_CHECK(fa == a);
69   return fa;
70 }
71 
72 // Trim a 4bit signed integer, making sure we're not discarding significant bits
Trim_S0(dex::u4 value)73 static dex::u4 Trim_S0(dex::u4 value) {
74   dex::u4 trim = value & 0xf;
75   SLICER_CHECK(dex::u4(dex::s4(trim << 28) >> 28) == value);
76   return trim;
77 }
78 
79 // Trim a 8bit signed integer, making sure we're not discarding significant bits
Trim_S1(dex::u4 value)80 static dex::u4 Trim_S1(dex::u4 value) {
81   dex::u4 trim = value & 0xff;
82   SLICER_CHECK(dex::u4(dex::s4(trim << 24) >> 24) == value);
83   return trim;
84 }
85 
86 // Trim a 16bit signed integer, making sure we're not discarding significant bits
Trim_S2(dex::u4 value)87 static dex::u4 Trim_S2(dex::u4 value) {
88   dex::u4 trim = value & 0xffff;
89   SLICER_CHECK(dex::u4(dex::s4(trim << 16) >> 16) == value);
90   return trim;
91 }
92 
93 // Returns a register operand, checking the match between format and type
94 // (register fields can encode either a single 32bit vreg or a wide 64bit vreg pair)
GetRegA(const Bytecode * bytecode,int index)95 static dex::u4 GetRegA(const Bytecode* bytecode, int index) {
96   auto flags = dex::GetFlagsFromOpcode(bytecode->opcode);
97   return (flags & dex::kInstrWideRegA) != 0
98              ? bytecode->CastOperand<VRegPair>(index)->base_reg
99              : bytecode->CastOperand<VReg>(index)->reg;
100 }
101 
102 // Returns a register operand, checking the match between format and type
103 // (register fields can encode either a single 32bit vreg or a wide 64bit vreg pair)
GetRegB(const Bytecode * bytecode,int index)104 static dex::u4 GetRegB(const Bytecode* bytecode, int index) {
105   auto flags = dex::GetFlagsFromOpcode(bytecode->opcode);
106   return (flags & dex::kInstrWideRegB) != 0
107              ? bytecode->CastOperand<VRegPair>(index)->base_reg
108              : bytecode->CastOperand<VReg>(index)->reg;
109 }
110 
111 // Returns a register operand, checking the match between format and type
112 // (register fields can encode either a single 32bit vreg or a wide 64bit vreg pair)
GetRegC(const Bytecode * bytecode,int index)113 static dex::u4 GetRegC(const Bytecode* bytecode, int index) {
114   auto flags = dex::GetFlagsFromOpcode(bytecode->opcode);
115   return (flags & dex::kInstrWideRegC) != 0
116              ? bytecode->CastOperand<VRegPair>(index)->base_reg
117              : bytecode->CastOperand<VReg>(index)->reg;
118 }
119 
120 // Encode one instruction into a .dex bytecode
121 //
122 // NOTE: the formats and the operand notation is documented here:
123 //   https://source.android.com/devices/tech/dalvik/instruction-formats.html
124 //
Visit(Bytecode * bytecode)125 bool BytecodeEncoder::Visit(Bytecode* bytecode) {
126   bytecode->offset = offset_;
127   dex::Opcode opcode = bytecode->opcode;
128 
129   // Unconditionally replace short (8bit) branches with
130   // medium-range (16bit) branches. This should cover 99.999% of
131   // the cases and it avoids a more complex branch length handling.
132   if (opcode == dex::OP_GOTO) {
133     opcode = dex::OP_GOTO_16;
134   }
135 
136   auto buff_offset = bytecode_.size();
137   auto format = dex::GetFormatFromOpcode(opcode);
138 
139   switch (format) {
140     case dex::kFmt10x:  // op
141     {
142       SLICER_CHECK(bytecode->operands.size() == 0);
143       bytecode_.Push<dex::u2>(Pack_Z_8(opcode));
144     } break;
145 
146     case dex::kFmt12x:  // op vA, vB
147     {
148       SLICER_CHECK(bytecode->operands.size() == 2);
149       dex::u4 vA = GetRegA(bytecode, 0);
150       dex::u4 vB = GetRegB(bytecode, 1);
151       bytecode_.Push<dex::u2>(Pack_4_4_8(vB, vA, opcode));
152     } break;
153 
154     case dex::kFmt22x:  // op vAA, vBBBB
155     {
156       SLICER_CHECK(bytecode->operands.size() == 2);
157       dex::u4 vA = GetRegA(bytecode, 0);
158       dex::u4 vB = GetRegB(bytecode, 1);
159       bytecode_.Push<dex::u2>(Pack_8_8(vA, opcode));
160       bytecode_.Push<dex::u2>(Pack_16(vB));
161     } break;
162 
163     case dex::kFmt32x:  // op vAAAA, vBBBB
164     {
165       SLICER_CHECK(bytecode->operands.size() == 2);
166       dex::u4 vA = GetRegA(bytecode, 0);
167       dex::u4 vB = GetRegB(bytecode, 1);
168       bytecode_.Push<dex::u2>(Pack_Z_8(opcode));
169       bytecode_.Push<dex::u2>(Pack_16(vA));
170       bytecode_.Push<dex::u2>(Pack_16(vB));
171     } break;
172 
173     case dex::kFmt11n:  // op vA, #+B
174     {
175       SLICER_CHECK(bytecode->operands.size() == 2);
176       dex::u4 vA = GetRegA(bytecode, 0);
177       dex::u4 B = Trim_S0(bytecode->CastOperand<Const32>(1)->u.u4_value);
178       bytecode_.Push<dex::u2>(Pack_4_4_8(B, vA, opcode));
179     } break;
180 
181     case dex::kFmt21s:  // op vAA, #+BBBB
182     {
183       SLICER_CHECK(bytecode->operands.size() == 2);
184       dex::u4 vA = GetRegA(bytecode, 0);
185       dex::u4 B = Trim_S2(bytecode->CastOperand<Const32>(1)->u.u4_value);
186       bytecode_.Push<dex::u2>(Pack_8_8(vA, opcode));
187       bytecode_.Push<dex::u2>(Pack_16(B));
188     } break;
189 
190     case dex::kFmt11x:  // op vAA
191     {
192       SLICER_CHECK(bytecode->operands.size() == 1);
193       dex::u4 vA = GetRegA(bytecode, 0);
194       bytecode_.Push<dex::u2>(Pack_8_8(vA, opcode));
195     } break;
196 
197     case dex::kFmt31i:  // op vAA, #+BBBBBBBB
198     {
199       SLICER_CHECK(bytecode->operands.size() == 2);
200       dex::u4 vA = GetRegA(bytecode, 0);
201       dex::u4 B = bytecode->CastOperand<Const32>(1)->u.u4_value;
202       bytecode_.Push<dex::u2>(Pack_8_8(vA, opcode));
203       bytecode_.Push<dex::u2>(Pack_16(B & 0xffff));
204       bytecode_.Push<dex::u2>(Pack_16(B >> 16));
205     } break;
206 
207     case dex::kFmt20t:  // op +AAAA
208     {
209       SLICER_CHECK(bytecode->operands.size() == 1);
210       auto label = bytecode->CastOperand<CodeLocation>(0)->label;
211       dex::u4 A = 0;
212       if (label->offset != kInvalidOffset) {
213         assert(label->offset <= offset_);
214         A = label->offset - offset_;
215         SLICER_CHECK(A != 0);
216         SLICER_CHECK((A >> 16) == 0xffff);  // TODO: out of range!
217       } else {
218         fixups_.push_back(LabelFixup(offset_, label, true));
219       }
220       bytecode_.Push<dex::u2>(Pack_Z_8(opcode));
221       bytecode_.Push<dex::u2>(Pack_16(A & 0xffff));
222     } break;
223 
224     case dex::kFmt30t:  // op +AAAAAAAA
225     {
226       SLICER_CHECK(bytecode->operands.size() == 1);
227       auto label = bytecode->CastOperand<CodeLocation>(0)->label;
228       dex::u4 A = 0;
229       if (label->offset != kInvalidOffset) {
230         // NOTE: goto/32 can branch to itself
231         assert(label->offset <= offset_);
232         A = label->offset - offset_;
233       } else {
234         fixups_.push_back(LabelFixup(offset_, label, false));
235       }
236       bytecode_.Push<dex::u2>(Pack_Z_8(opcode));
237       bytecode_.Push<dex::u2>(Pack_16(A & 0xffff));
238       bytecode_.Push<dex::u2>(Pack_16(A >> 16));
239     } break;
240 
241     case dex::kFmt21t:  // op vAA, +BBBB
242     {
243       SLICER_CHECK(bytecode->operands.size() == 2);
244       dex::u4 vA = GetRegA(bytecode, 0);
245       auto label = bytecode->CastOperand<CodeLocation>(1)->label;
246       dex::u4 B = 0;
247       if (label->offset != kInvalidOffset) {
248         assert(label->offset <= offset_);
249         B = label->offset - offset_;
250         SLICER_CHECK(B != 0);
251         SLICER_CHECK((B >> 16) == 0xffff);  // TODO: out of range!
252       } else {
253         fixups_.push_back(LabelFixup(offset_, label, true));
254       }
255       bytecode_.Push<dex::u2>(Pack_8_8(vA, opcode));
256       bytecode_.Push<dex::u2>(Pack_16(B & 0xffff));
257     } break;
258 
259     case dex::kFmt22t:  // op vA, vB, +CCCC
260     {
261       SLICER_CHECK(bytecode->operands.size() == 3);
262       dex::u4 vA = GetRegA(bytecode, 0);
263       dex::u4 vB = GetRegB(bytecode, 1);
264       auto label = bytecode->CastOperand<CodeLocation>(2)->label;
265       dex::u4 C = 0;
266       if (label->offset != kInvalidOffset) {
267         assert(label->offset <= offset_);
268         C = label->offset - offset_;
269         SLICER_CHECK(C != 0);
270         SLICER_CHECK((C >> 16) == 0xffff);  // TODO: out of range!
271       } else {
272         fixups_.push_back(LabelFixup(offset_, label, true));
273       }
274       bytecode_.Push<dex::u2>(Pack_4_4_8(vB, vA, opcode));
275       bytecode_.Push<dex::u2>(Pack_16(C & 0xffff));
276     } break;
277 
278     case dex::kFmt31t:  // op vAA, +BBBBBBBB
279     {
280       SLICER_CHECK(bytecode->operands.size() == 2);
281       dex::u4 vA = GetRegA(bytecode, 0);
282       auto label = bytecode->CastOperand<CodeLocation>(1)->label;
283       dex::u4 B = 0;
284       if (label->offset != kInvalidOffset) {
285         assert(label->offset <= offset_);
286         B = label->offset - offset_;
287         SLICER_CHECK(B != 0);
288       } else {
289         fixups_.push_back(LabelFixup(offset_, label, false));
290       }
291       bytecode_.Push<dex::u2>(Pack_8_8(vA, opcode));
292       bytecode_.Push<dex::u2>(Pack_16(B & 0xffff));
293       bytecode_.Push<dex::u2>(Pack_16(B >> 16));
294     } break;
295 
296     case dex::kFmt23x:  // op vAA, vBB, vCC
297     {
298       SLICER_CHECK(bytecode->operands.size() == 3);
299       dex::u4 vA = GetRegA(bytecode, 0);
300       dex::u4 vB = GetRegB(bytecode, 1);
301       dex::u4 vC = GetRegC(bytecode, 2);
302       bytecode_.Push<dex::u2>(Pack_8_8(vA, opcode));
303       bytecode_.Push<dex::u2>(Pack_8_8(vC, vB));
304     } break;
305 
306     case dex::kFmt22b:  // op vAA, vBB, #+CC
307     {
308       SLICER_CHECK(bytecode->operands.size() == 3);
309       dex::u4 vA = GetRegA(bytecode, 0);
310       dex::u4 vB = GetRegB(bytecode, 1);
311       dex::u4 C = Trim_S1(bytecode->CastOperand<Const32>(2)->u.u4_value);
312       bytecode_.Push<dex::u2>(Pack_8_8(vA, opcode));
313       bytecode_.Push<dex::u2>(Pack_8_8(C, vB));
314     } break;
315 
316     case dex::kFmt22s:  // op vA, vB, #+CCCC
317     {
318       SLICER_CHECK(bytecode->operands.size() == 3);
319       dex::u4 vA = GetRegA(bytecode, 0);
320       dex::u4 vB = GetRegB(bytecode, 1);
321       dex::u4 C = Trim_S2(bytecode->CastOperand<Const32>(2)->u.u4_value);
322       bytecode_.Push<dex::u2>(Pack_4_4_8(vB, vA, opcode));
323       bytecode_.Push<dex::u2>(Pack_16(C));
324     } break;
325 
326     case dex::kFmt22c:  // op vA, vB, thing@CCCC
327     {
328       SLICER_CHECK(bytecode->operands.size() == 3);
329       dex::u4 vA = GetRegA(bytecode, 0);
330       dex::u4 vB = GetRegB(bytecode, 1);
331       dex::u4 C = bytecode->CastOperand<IndexedOperand>(2)->index;
332       bytecode_.Push<dex::u2>(Pack_4_4_8(vB, vA, opcode));
333       bytecode_.Push<dex::u2>(Pack_16(C));
334     } break;
335 
336     case dex::kFmt21c:  // op vAA, thing@BBBB
337     {
338       SLICER_CHECK(bytecode->operands.size() == 2);
339       dex::u4 vA = GetRegA(bytecode, 0);
340       dex::u4 B = bytecode->CastOperand<IndexedOperand>(1)->index;
341       bytecode_.Push<dex::u2>(Pack_8_8(vA, opcode));
342       bytecode_.Push<dex::u2>(Pack_16(B));
343     } break;
344 
345     case dex::kFmt31c:  // op vAA, string@BBBBBBBB
346     {
347       SLICER_CHECK(bytecode->operands.size() == 2);
348       dex::u4 vA = GetRegA(bytecode, 0);
349       dex::u4 B = bytecode->CastOperand<IndexedOperand>(1)->index;
350       bytecode_.Push<dex::u2>(Pack_8_8(vA, opcode));
351       bytecode_.Push<dex::u2>(Pack_16(B & 0xffff));
352       bytecode_.Push<dex::u2>(Pack_16(B >> 16));
353     } break;
354 
355     case dex::kFmt35c:  // op {vC,vD,vE,vF,vG}, thing@BBBB
356     {
357       SLICER_CHECK(bytecode->operands.size() == 2);
358       const auto& regs = bytecode->CastOperand<VRegList>(0)->registers;
359       dex::u4 B = bytecode->CastOperand<IndexedOperand>(1)->index;
360       dex::u4 A = regs.size();
361       dex::u4 C = (A > 0) ? regs[0] : 0;
362       dex::u4 D = (A > 1) ? regs[1] : 0;
363       dex::u4 E = (A > 2) ? regs[2] : 0;
364       dex::u4 F = (A > 3) ? regs[3] : 0;
365       dex::u4 G = (A > 4) ? regs[4] : 0;
366       bytecode_.Push<dex::u2>(Pack_4_4_8(A, G, opcode));
367       bytecode_.Push<dex::u2>(Pack_16(B));
368       bytecode_.Push<dex::u2>(Pack_4_4_4_4(F, E, D, C));
369 
370       // keep track of the outs_count
371       if ((dex::GetFlagsFromOpcode(opcode) & dex::kInstrInvoke) != 0) {
372         outs_count_ = std::max(outs_count_, A);
373       }
374     } break;
375 
376     case dex::kFmt3rc:  // op {vCCCC .. v(CCCC+AA-1)}, thing@BBBB
377     {
378       SLICER_CHECK(bytecode->operands.size() == 2);
379       auto vreg_range = bytecode->CastOperand<VRegRange>(0);
380       dex::u4 A = vreg_range->count;
381       dex::u4 B = bytecode->CastOperand<IndexedOperand>(1)->index;
382       dex::u4 C = vreg_range->base_reg;
383       bytecode_.Push<dex::u2>(Pack_8_8(A, opcode));
384       bytecode_.Push<dex::u2>(Pack_16(B));
385       bytecode_.Push<dex::u2>(Pack_16(C));
386 
387       // keep track of the outs_count
388       if ((dex::GetFlagsFromOpcode(opcode) & dex::kInstrInvoke) != 0) {
389         outs_count_ = std::max(outs_count_, A);
390       }
391     } break;
392 
393     case dex::kFmt51l:  // op vAA, #+BBBBBBBBBBBBBBBB
394     {
395       SLICER_CHECK(bytecode->operands.size() == 2);
396       dex::u4 vA = GetRegA(bytecode, 0);
397       dex::u8 B = bytecode->CastOperand<Const64>(1)->u.u8_value;
398       bytecode_.Push<dex::u2>(Pack_8_8(vA, opcode));
399       bytecode_.Push<dex::u2>(Pack_16((B >> 0) & 0xffff));
400       bytecode_.Push<dex::u2>(Pack_16((B >> 16) & 0xffff));
401       bytecode_.Push<dex::u2>(Pack_16((B >> 32) & 0xffff));
402       bytecode_.Push<dex::u2>(Pack_16((B >> 48) & 0xffff));
403     } break;
404 
405     case dex::kFmt21h:  // op vAA, #+BBBB0000[00000000]
406       SLICER_CHECK(bytecode->operands.size() == 2);
407       switch (opcode) {
408         case dex::OP_CONST_HIGH16: {
409           dex::u4 vA = GetRegA(bytecode, 0);
410           dex::u4 B = bytecode->CastOperand<Const32>(1)->u.u4_value >> 16;
411           bytecode_.Push<dex::u2>(Pack_8_8(vA, opcode));
412           bytecode_.Push<dex::u2>(Pack_16(B));
413         } break;
414 
415         case dex::OP_CONST_WIDE_HIGH16: {
416           dex::u4 vA = GetRegA(bytecode, 0);
417           dex::u4 B = bytecode->CastOperand<Const64>(1)->u.u8_value >> 48;
418           bytecode_.Push<dex::u2>(Pack_8_8(vA, opcode));
419           bytecode_.Push<dex::u2>(Pack_16(B));
420         } break;
421 
422         default:
423           SLICER_FATAL("Unexpected fmt21h opcode: 0x%02x", opcode);
424       }
425       break;
426 
427     default:
428       SLICER_FATAL("Unexpected format: 0x%02x", format);
429   }
430 
431   SLICER_CHECK(bytecode_.size() - buff_offset == 2 * GetWidthFromOpcode(opcode));
432   offset_ += GetWidthFromOpcode(opcode);
433   return true;
434 }
435 
Visit(PackedSwitchPayload * packed_switch)436 bool BytecodeEncoder::Visit(PackedSwitchPayload* packed_switch) {
437   SLICER_CHECK(offset_ % 2 == 0);
438 
439   // keep track of the switches
440   packed_switch->offset = offset_;
441   auto& instr = packed_switches_[offset_];
442   SLICER_CHECK(instr == nullptr);
443   instr = packed_switch;
444 
445   // we're going to fix up the offsets in a later pass
446   auto orig_size = bytecode_.size();
447   bytecode_.Push<dex::u2>(dex::kPackedSwitchSignature);
448   bytecode_.Push<dex::u2>(Pack_16(packed_switch->targets.size()));
449   bytecode_.Push<dex::s4>(packed_switch->first_key);
450   for (size_t i = 0; i < packed_switch->targets.size(); ++i) {
451     bytecode_.Push<dex::u4>(0);
452   }
453 
454   // offset is in 16bit units, not bytes
455   offset_ += (bytecode_.size() - orig_size) / 2;
456 
457   return true;
458 }
459 
Visit(SparseSwitchPayload * sparse_switch)460 bool BytecodeEncoder::Visit(SparseSwitchPayload* sparse_switch) {
461   SLICER_CHECK(offset_ % 2 == 0);
462 
463   // keep track of the switches
464   sparse_switch->offset = offset_;
465   auto& instr = sparse_switches_[offset_];
466   SLICER_CHECK(instr == nullptr);
467   instr = sparse_switch;
468 
469   // we're going to fix up the offsets in a later pass
470   auto orig_size = bytecode_.size();
471   bytecode_.Push<dex::u2>(dex::kSparseSwitchSignature);
472   bytecode_.Push<dex::u2>(Pack_16(sparse_switch->switch_cases.size()));
473   for (const auto& switch_case : sparse_switch->switch_cases) {
474     bytecode_.Push<dex::s4>(switch_case.key);
475   }
476   for (size_t i = 0; i < sparse_switch->switch_cases.size(); ++i) {
477     bytecode_.Push<dex::u4>(0);
478   }
479   offset_ += (bytecode_.size() - orig_size) / 2;
480 
481   return true;
482 }
483 
Visit(ArrayData * array_data)484 bool BytecodeEncoder::Visit(ArrayData* array_data) {
485   SLICER_CHECK(offset_ % 2 == 0);
486 
487   array_data->offset = offset_;
488   auto orig_size = bytecode_.size();
489   // kArrayDataSignature is already included by array_data->data
490   // (no need to emit here)
491   bytecode_.Push(array_data->data);
492   offset_ += (bytecode_.size() - orig_size) / 2;
493   return true;
494 }
495 
Visit(Label * label)496 bool BytecodeEncoder::Visit(Label* label) {
497   // aligned label?
498   if (label->aligned && offset_ % 2 == 1) {
499     bytecode_.Push<dex::u2>(dex::OP_NOP);
500     ++offset_;
501   }
502 
503   label->offset = offset_;
504   return true;
505 }
506 
Visit(DbgInfoHeader * dbg_header)507 bool BytecodeEncoder::Visit(DbgInfoHeader* dbg_header) {
508   dbg_header->offset = offset_;
509   return true;
510 }
511 
Visit(DbgInfoAnnotation * dbg_annotation)512 bool BytecodeEncoder::Visit(DbgInfoAnnotation* dbg_annotation) {
513   dbg_annotation->offset = offset_;
514   return true;
515 }
516 
Visit(TryBlockBegin * try_begin)517 bool BytecodeEncoder::Visit(TryBlockBegin* try_begin) {
518   try_begin->offset = offset_;
519   return true;
520 }
521 
Visit(TryBlockEnd * try_end)522 bool BytecodeEncoder::Visit(TryBlockEnd* try_end) {
523   try_end->offset = offset_;
524   return true;
525 }
526 
FixupSwitchOffsets()527 void BytecodeEncoder::FixupSwitchOffsets() {
528   dex::u2* const begin = bytecode_.ptr<dex::u2>(0);
529   dex::u2* const end = begin + bytecode_.size() / 2;
530   dex::u2* ptr = begin;
531   while (ptr < end) {
532     const auto opcode = dex::OpcodeFromBytecode(*ptr);
533     const auto offset = ptr - begin;
534     if (opcode == dex::OP_PACKED_SWITCH) {
535       auto dex_instr = dex::DecodeInstruction(ptr);
536       FixupPackedSwitch(offset, offset + dex::s4(dex_instr.vB));
537     } else if (opcode == dex::OP_SPARSE_SWITCH) {
538       auto dex_instr = dex::DecodeInstruction(ptr);
539       FixupSparseSwitch(offset, offset + dex::s4(dex_instr.vB));
540     }
541     auto isize = dex::GetWidthFromBytecode(ptr);
542     SLICER_CHECK(isize > 0);
543     ptr += isize;
544   }
545   SLICER_CHECK(ptr == end);
546 }
547 
FixupPackedSwitch(dex::u4 base_offset,dex::u4 payload_offset)548 void BytecodeEncoder::FixupPackedSwitch(dex::u4 base_offset,
549                                         dex::u4 payload_offset) {
550   auto instr = packed_switches_[payload_offset];
551   SLICER_CHECK(instr != nullptr);
552 
553   auto payload = bytecode_.ptr<dex::PackedSwitchPayload>(payload_offset * 2);
554   SLICER_CHECK(payload->ident == dex::kPackedSwitchSignature);
555   SLICER_CHECK(reinterpret_cast<dex::u1*>(payload->targets + payload->size) <=
556         bytecode_.data() + bytecode_.size());
557 
558   for (int i = 0; i < payload->size; ++i) {
559     auto label = instr->targets[i];
560     assert(label->offset != kInvalidOffset);
561     payload->targets[i] = label->offset - base_offset;
562   }
563 }
564 
FixupSparseSwitch(dex::u4 base_offset,dex::u4 payload_offset)565 void BytecodeEncoder::FixupSparseSwitch(dex::u4 base_offset,
566                                         dex::u4 payload_offset) {
567   auto instr = sparse_switches_[payload_offset];
568   SLICER_CHECK(instr != nullptr);
569 
570   auto payload = bytecode_.ptr<dex::SparseSwitchPayload>(payload_offset * 2);
571   SLICER_CHECK(payload->ident == dex::kSparseSwitchSignature);
572 
573   dex::s4* const targets = payload->data + payload->size;
574   SLICER_CHECK(reinterpret_cast<dex::u1*>(targets + payload->size) <=
575         bytecode_.data() + bytecode_.size());
576 
577   for (int i = 0; i < payload->size; ++i) {
578     auto label = instr->switch_cases[i].target;
579     assert(label->offset != kInvalidOffset);
580     targets[i] = label->offset - base_offset;
581   }
582 }
583 
FixupLabels()584 void BytecodeEncoder::FixupLabels() {
585   for (const LabelFixup& fixup : fixups_) {
586     dex::u4 label_offset = fixup.label->offset;
587     assert(label_offset != kInvalidOffset);
588     assert(label_offset > fixup.offset);
589     dex::u4 rel_offset = label_offset - fixup.offset;
590     SLICER_CHECK(rel_offset != 0);
591     dex::u2* instr = bytecode_.ptr<dex::u2>(fixup.offset * 2);
592     if (fixup.short_fixup) {
593       // TODO: explicit out-of-range check
594       assert(instr[1] == 0);
595       instr[1] = Pack_16(rel_offset);
596     } else {
597       assert(instr[1] == 0);
598       assert(instr[2] == 0);
599       instr[1] = Pack_16(rel_offset & 0xffff);
600       instr[2] = Pack_16(rel_offset >> 16);
601     }
602   }
603 }
604 
Encode(ir::Code * ir_code,std::shared_ptr<ir::DexFile> dex_ir)605 void BytecodeEncoder::Encode(ir::Code* ir_code, std::shared_ptr<ir::DexFile> dex_ir) {
606   SLICER_CHECK(bytecode_.empty());
607   SLICER_CHECK(offset_ == 0);
608   SLICER_CHECK(outs_count_ == 0);
609 
610   packed_switches_.clear();
611   sparse_switches_.clear();
612 
613   // reset all instruction offsets
614   for (auto instr : instructions_) {
615     instr->offset = kInvalidOffset;
616   }
617 
618   // generate the .dex bytecodes
619   for (auto instr : instructions_) {
620     instr->Accept(this);
621   }
622 
623   // no more appending (read & write is ok)
624   bytecode_.Seal(2);
625 
626   FixupLabels();
627   FixupSwitchOffsets();
628 
629   // update ir::Code
630   ir_code->instructions = slicer::ArrayView<const dex::u2>(
631       bytecode_.ptr<dex::u2>(0), bytecode_.size() / 2);
632   ir_code->outs_count = outs_count_;
633 
634   // attach the new bytecode
635   dex_ir->AttachBuffer(std::move(bytecode_));
636 }
637 
638 }  // namespace lir
639