1 // Copyright 2014 the V8 project authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file.
4 
5 #include "src/compiler/move-optimizer.h"
6 
7 namespace v8 {
8 namespace internal {
9 namespace compiler {
10 
11 namespace {
12 
13 struct MoveKey {
14   InstructionOperand source;
15   InstructionOperand destination;
16 };
17 
18 struct MoveKeyCompare {
operator ()v8::internal::compiler::__anon6498dd0a0111::MoveKeyCompare19   bool operator()(const MoveKey& a, const MoveKey& b) const {
20     if (a.source.EqualsCanonicalized(b.source)) {
21       return a.destination.CompareCanonicalized(b.destination);
22     }
23     return a.source.CompareCanonicalized(b.source);
24   }
25 };
26 
27 typedef ZoneMap<MoveKey, unsigned, MoveKeyCompare> MoveMap;
28 
29 class OperandSet {
30  public:
OperandSet(ZoneVector<InstructionOperand> * buffer)31   explicit OperandSet(ZoneVector<InstructionOperand>* buffer)
32       : set_(buffer), fp_reps_(0) {
33     buffer->clear();
34   }
35 
InsertOp(const InstructionOperand & op)36   void InsertOp(const InstructionOperand& op) {
37     set_->push_back(op);
38 
39     if (!kSimpleFPAliasing && op.IsFPRegister())
40       fp_reps_ |= RepBit(LocationOperand::cast(op).representation());
41   }
42 
Contains(const InstructionOperand & op) const43   bool Contains(const InstructionOperand& op) const {
44     for (const InstructionOperand& elem : *set_) {
45       if (elem.EqualsCanonicalized(op)) return true;
46     }
47     return false;
48   }
49 
ContainsOpOrAlias(const InstructionOperand & op) const50   bool ContainsOpOrAlias(const InstructionOperand& op) const {
51     if (Contains(op)) return true;
52 
53     if (!kSimpleFPAliasing && op.IsFPRegister()) {
54       // Platforms where FP registers have complex aliasing need extra checks.
55       const LocationOperand& loc = LocationOperand::cast(op);
56       MachineRepresentation rep = loc.representation();
57       // If haven't encountered mixed rep FP registers, skip the extra checks.
58       if (!HasMixedFPReps(fp_reps_ | RepBit(rep))) return false;
59 
60       // Check register against aliasing registers of other FP representations.
61       MachineRepresentation other_rep1, other_rep2;
62       switch (rep) {
63         case MachineRepresentation::kFloat32:
64           other_rep1 = MachineRepresentation::kFloat64;
65           other_rep2 = MachineRepresentation::kSimd128;
66           break;
67         case MachineRepresentation::kFloat64:
68           other_rep1 = MachineRepresentation::kFloat32;
69           other_rep2 = MachineRepresentation::kSimd128;
70           break;
71         case MachineRepresentation::kSimd128:
72           other_rep1 = MachineRepresentation::kFloat32;
73           other_rep2 = MachineRepresentation::kFloat64;
74           break;
75         default:
76           UNREACHABLE();
77           break;
78       }
79       const RegisterConfiguration* config = RegisterConfiguration::Turbofan();
80       int base = -1;
81       int aliases =
82           config->GetAliases(rep, loc.register_code(), other_rep1, &base);
83       DCHECK(aliases > 0 || (aliases == 0 && base == -1));
84       while (aliases--) {
85         if (Contains(AllocatedOperand(LocationOperand::REGISTER, other_rep1,
86                                       base + aliases))) {
87           return true;
88         }
89       }
90       aliases = config->GetAliases(rep, loc.register_code(), other_rep2, &base);
91       DCHECK(aliases > 0 || (aliases == 0 && base == -1));
92       while (aliases--) {
93         if (Contains(AllocatedOperand(LocationOperand::REGISTER, other_rep2,
94                                       base + aliases))) {
95           return true;
96         }
97       }
98     }
99     return false;
100   }
101 
102  private:
RepBit(MachineRepresentation rep)103   static int RepBit(MachineRepresentation rep) {
104     return 1 << static_cast<int>(rep);
105   }
106 
HasMixedFPReps(int reps)107   static bool HasMixedFPReps(int reps) {
108     return reps && !base::bits::IsPowerOfTwo32(reps);
109   }
110 
111   ZoneVector<InstructionOperand>* set_;
112   int fp_reps_;
113 };
114 
FindFirstNonEmptySlot(const Instruction * instr)115 int FindFirstNonEmptySlot(const Instruction* instr) {
116   int i = Instruction::FIRST_GAP_POSITION;
117   for (; i <= Instruction::LAST_GAP_POSITION; i++) {
118     ParallelMove* moves = instr->parallel_moves()[i];
119     if (moves == nullptr) continue;
120     for (MoveOperands* move : *moves) {
121       if (!move->IsRedundant()) return i;
122       move->Eliminate();
123     }
124     moves->clear();  // Clear this redundant move.
125   }
126   return i;
127 }
128 
129 }  // namespace
130 
MoveOptimizer(Zone * local_zone,InstructionSequence * code)131 MoveOptimizer::MoveOptimizer(Zone* local_zone, InstructionSequence* code)
132     : local_zone_(local_zone),
133       code_(code),
134       local_vector_(local_zone),
135       operand_buffer1(local_zone),
136       operand_buffer2(local_zone) {}
137 
Run()138 void MoveOptimizer::Run() {
139   for (Instruction* instruction : code()->instructions()) {
140     CompressGaps(instruction);
141   }
142   for (InstructionBlock* block : code()->instruction_blocks()) {
143     CompressBlock(block);
144   }
145   for (InstructionBlock* block : code()->instruction_blocks()) {
146     if (block->PredecessorCount() <= 1) continue;
147     if (!block->IsDeferred()) {
148       bool has_only_deferred = true;
149       for (RpoNumber& pred_id : block->predecessors()) {
150         if (!code()->InstructionBlockAt(pred_id)->IsDeferred()) {
151           has_only_deferred = false;
152           break;
153         }
154       }
155       // This would pull down common moves. If the moves occur in deferred
156       // blocks, and the closest common successor is not deferred, we lose the
157       // optimization of just spilling/filling in deferred blocks, when the
158       // current block is not deferred.
159       if (has_only_deferred) continue;
160     }
161     OptimizeMerge(block);
162   }
163   for (Instruction* gap : code()->instructions()) {
164     FinalizeMoves(gap);
165   }
166 }
167 
RemoveClobberedDestinations(Instruction * instruction)168 void MoveOptimizer::RemoveClobberedDestinations(Instruction* instruction) {
169   if (instruction->IsCall()) return;
170   ParallelMove* moves = instruction->parallel_moves()[0];
171   if (moves == nullptr) return;
172 
173   DCHECK(instruction->parallel_moves()[1] == nullptr ||
174          instruction->parallel_moves()[1]->empty());
175 
176   OperandSet outputs(&operand_buffer1);
177   OperandSet inputs(&operand_buffer2);
178 
179   // Outputs and temps are treated together as potentially clobbering a
180   // destination operand.
181   for (size_t i = 0; i < instruction->OutputCount(); ++i) {
182     outputs.InsertOp(*instruction->OutputAt(i));
183   }
184   for (size_t i = 0; i < instruction->TempCount(); ++i) {
185     outputs.InsertOp(*instruction->TempAt(i));
186   }
187 
188   // Input operands block elisions.
189   for (size_t i = 0; i < instruction->InputCount(); ++i) {
190     inputs.InsertOp(*instruction->InputAt(i));
191   }
192 
193   // Elide moves made redundant by the instruction.
194   for (MoveOperands* move : *moves) {
195     if (outputs.ContainsOpOrAlias(move->destination()) &&
196         !inputs.ContainsOpOrAlias(move->destination())) {
197       move->Eliminate();
198     }
199   }
200 
201   // The ret instruction makes any assignment before it unnecessary, except for
202   // the one for its input.
203   if (instruction->IsRet() || instruction->IsTailCall()) {
204     for (MoveOperands* move : *moves) {
205       if (!inputs.ContainsOpOrAlias(move->destination())) {
206         move->Eliminate();
207       }
208     }
209   }
210 }
211 
MigrateMoves(Instruction * to,Instruction * from)212 void MoveOptimizer::MigrateMoves(Instruction* to, Instruction* from) {
213   if (from->IsCall()) return;
214 
215   ParallelMove* from_moves = from->parallel_moves()[0];
216   if (from_moves == nullptr || from_moves->empty()) return;
217 
218   OperandSet dst_cant_be(&operand_buffer1);
219   OperandSet src_cant_be(&operand_buffer2);
220 
221   // If an operand is an input to the instruction, we cannot move assignments
222   // where it appears on the LHS.
223   for (size_t i = 0; i < from->InputCount(); ++i) {
224     dst_cant_be.InsertOp(*from->InputAt(i));
225   }
226   // If an operand is output to the instruction, we cannot move assignments
227   // where it appears on the RHS, because we would lose its value before the
228   // instruction.
229   // Same for temp operands.
230   // The output can't appear on the LHS because we performed
231   // RemoveClobberedDestinations for the "from" instruction.
232   for (size_t i = 0; i < from->OutputCount(); ++i) {
233     src_cant_be.InsertOp(*from->OutputAt(i));
234   }
235   for (size_t i = 0; i < from->TempCount(); ++i) {
236     src_cant_be.InsertOp(*from->TempAt(i));
237   }
238   for (MoveOperands* move : *from_moves) {
239     if (move->IsRedundant()) continue;
240     // Assume dest has a value "V". If we have a "dest = y" move, then we can't
241     // move "z = dest", because z would become y rather than "V".
242     // We assume CompressMoves has happened before this, which means we don't
243     // have more than one assignment to dest.
244     src_cant_be.InsertOp(move->destination());
245   }
246 
247   ZoneSet<MoveKey, MoveKeyCompare> move_candidates(local_zone());
248   // We start with all the moves that don't have conflicting source or
249   // destination operands are eligible for being moved down.
250   for (MoveOperands* move : *from_moves) {
251     if (move->IsRedundant()) continue;
252     if (!dst_cant_be.ContainsOpOrAlias(move->destination())) {
253       MoveKey key = {move->source(), move->destination()};
254       move_candidates.insert(key);
255     }
256   }
257   if (move_candidates.empty()) return;
258 
259   // Stabilize the candidate set.
260   bool changed = false;
261   do {
262     changed = false;
263     for (auto iter = move_candidates.begin(); iter != move_candidates.end();) {
264       auto current = iter;
265       ++iter;
266       InstructionOperand src = current->source;
267       if (src_cant_be.ContainsOpOrAlias(src)) {
268         src_cant_be.InsertOp(current->destination);
269         move_candidates.erase(current);
270         changed = true;
271       }
272     }
273   } while (changed);
274 
275   ParallelMove to_move(local_zone());
276   for (MoveOperands* move : *from_moves) {
277     if (move->IsRedundant()) continue;
278     MoveKey key = {move->source(), move->destination()};
279     if (move_candidates.find(key) != move_candidates.end()) {
280       to_move.AddMove(move->source(), move->destination(), code_zone());
281       move->Eliminate();
282     }
283   }
284   if (to_move.empty()) return;
285 
286   ParallelMove* dest =
287       to->GetOrCreateParallelMove(Instruction::GapPosition::START, code_zone());
288 
289   CompressMoves(&to_move, dest);
290   DCHECK(dest->empty());
291   for (MoveOperands* m : to_move) {
292     dest->push_back(m);
293   }
294 }
295 
CompressMoves(ParallelMove * left,MoveOpVector * right)296 void MoveOptimizer::CompressMoves(ParallelMove* left, MoveOpVector* right) {
297   if (right == nullptr) return;
298 
299   MoveOpVector& eliminated = local_vector();
300   DCHECK(eliminated.empty());
301 
302   if (!left->empty()) {
303     // Modify the right moves in place and collect moves that will be killed by
304     // merging the two gaps.
305     for (MoveOperands* move : *right) {
306       if (move->IsRedundant()) continue;
307       left->PrepareInsertAfter(move, &eliminated);
308     }
309     // Eliminate dead moves.
310     for (MoveOperands* to_eliminate : eliminated) {
311       to_eliminate->Eliminate();
312     }
313     eliminated.clear();
314   }
315   // Add all possibly modified moves from right side.
316   for (MoveOperands* move : *right) {
317     if (move->IsRedundant()) continue;
318     left->push_back(move);
319   }
320   // Nuke right.
321   right->clear();
322   DCHECK(eliminated.empty());
323 }
324 
CompressGaps(Instruction * instruction)325 void MoveOptimizer::CompressGaps(Instruction* instruction) {
326   int i = FindFirstNonEmptySlot(instruction);
327   bool has_moves = i <= Instruction::LAST_GAP_POSITION;
328   USE(has_moves);
329 
330   if (i == Instruction::LAST_GAP_POSITION) {
331     std::swap(instruction->parallel_moves()[Instruction::FIRST_GAP_POSITION],
332               instruction->parallel_moves()[Instruction::LAST_GAP_POSITION]);
333   } else if (i == Instruction::FIRST_GAP_POSITION) {
334     CompressMoves(
335         instruction->parallel_moves()[Instruction::FIRST_GAP_POSITION],
336         instruction->parallel_moves()[Instruction::LAST_GAP_POSITION]);
337   }
338   // We either have no moves, or, after swapping or compressing, we have
339   // all the moves in the first gap position, and none in the second/end gap
340   // position.
341   ParallelMove* first =
342       instruction->parallel_moves()[Instruction::FIRST_GAP_POSITION];
343   ParallelMove* last =
344       instruction->parallel_moves()[Instruction::LAST_GAP_POSITION];
345   USE(first);
346   USE(last);
347 
348   DCHECK(!has_moves ||
349          (first != nullptr && (last == nullptr || last->empty())));
350 }
351 
CompressBlock(InstructionBlock * block)352 void MoveOptimizer::CompressBlock(InstructionBlock* block) {
353   int first_instr_index = block->first_instruction_index();
354   int last_instr_index = block->last_instruction_index();
355 
356   // Start by removing gap assignments where the output of the subsequent
357   // instruction appears on LHS, as long as they are not needed by its input.
358   Instruction* prev_instr = code()->instructions()[first_instr_index];
359   RemoveClobberedDestinations(prev_instr);
360 
361   for (int index = first_instr_index + 1; index <= last_instr_index; ++index) {
362     Instruction* instr = code()->instructions()[index];
363     // Migrate to the gap of prev_instr eligible moves from instr.
364     MigrateMoves(instr, prev_instr);
365     // Remove gap assignments clobbered by instr's output.
366     RemoveClobberedDestinations(instr);
367     prev_instr = instr;
368   }
369 }
370 
371 
LastInstruction(const InstructionBlock * block) const372 const Instruction* MoveOptimizer::LastInstruction(
373     const InstructionBlock* block) const {
374   return code()->instructions()[block->last_instruction_index()];
375 }
376 
377 
OptimizeMerge(InstructionBlock * block)378 void MoveOptimizer::OptimizeMerge(InstructionBlock* block) {
379   DCHECK(block->PredecessorCount() > 1);
380   // Ensure that the last instruction in all incoming blocks don't contain
381   // things that would prevent moving gap moves across them.
382   for (RpoNumber& pred_index : block->predecessors()) {
383     const InstructionBlock* pred = code()->InstructionBlockAt(pred_index);
384 
385     // If the predecessor has more than one successor, we shouldn't attempt to
386     // move down to this block (one of the successors) any of the gap moves,
387     // because their effect may be necessary to the other successors.
388     if (pred->SuccessorCount() > 1) return;
389 
390     const Instruction* last_instr =
391         code()->instructions()[pred->last_instruction_index()];
392     if (last_instr->IsCall()) return;
393     if (last_instr->TempCount() != 0) return;
394     if (last_instr->OutputCount() != 0) return;
395     for (size_t i = 0; i < last_instr->InputCount(); ++i) {
396       const InstructionOperand* op = last_instr->InputAt(i);
397       if (!op->IsConstant() && !op->IsImmediate()) return;
398     }
399   }
400   // TODO(dcarney): pass a ZoneStats down for this?
401   MoveMap move_map(local_zone());
402   size_t correct_counts = 0;
403   // Accumulate set of shared moves.
404   for (RpoNumber& pred_index : block->predecessors()) {
405     const InstructionBlock* pred = code()->InstructionBlockAt(pred_index);
406     const Instruction* instr = LastInstruction(pred);
407     if (instr->parallel_moves()[0] == nullptr ||
408         instr->parallel_moves()[0]->empty()) {
409       return;
410     }
411     for (const MoveOperands* move : *instr->parallel_moves()[0]) {
412       if (move->IsRedundant()) continue;
413       InstructionOperand src = move->source();
414       InstructionOperand dst = move->destination();
415       MoveKey key = {src, dst};
416       auto res = move_map.insert(std::make_pair(key, 1));
417       if (!res.second) {
418         res.first->second++;
419         if (res.first->second == block->PredecessorCount()) {
420           correct_counts++;
421         }
422       }
423     }
424   }
425   if (move_map.empty() || correct_counts == 0) return;
426 
427   // Find insertion point.
428   Instruction* instr = code()->instructions()[block->first_instruction_index()];
429 
430   if (correct_counts != move_map.size()) {
431     // Moves that are unique to each predecessor won't be pushed to the common
432     // successor.
433     OperandSet conflicting_srcs(&operand_buffer1);
434     for (auto iter = move_map.begin(), end = move_map.end(); iter != end;) {
435       auto current = iter;
436       ++iter;
437       if (current->second != block->PredecessorCount()) {
438         InstructionOperand dest = current->first.destination;
439         // Not all the moves in all the gaps are the same. Maybe some are. If
440         // there are such moves, we could move them, but the destination of the
441         // moves staying behind can't appear as a source of a common move,
442         // because the move staying behind will clobber this destination.
443         conflicting_srcs.InsertOp(dest);
444         move_map.erase(current);
445       }
446     }
447 
448     bool changed = false;
449     do {
450       // If a common move can't be pushed to the common successor, then its
451       // destination also can't appear as source to any move being pushed.
452       changed = false;
453       for (auto iter = move_map.begin(), end = move_map.end(); iter != end;) {
454         auto current = iter;
455         ++iter;
456         DCHECK_EQ(block->PredecessorCount(), current->second);
457         if (conflicting_srcs.ContainsOpOrAlias(current->first.source)) {
458           conflicting_srcs.InsertOp(current->first.destination);
459           move_map.erase(current);
460           changed = true;
461         }
462       }
463     } while (changed);
464   }
465 
466   if (move_map.empty()) return;
467 
468   DCHECK_NOT_NULL(instr);
469   bool gap_initialized = true;
470   if (instr->parallel_moves()[0] != nullptr &&
471       !instr->parallel_moves()[0]->empty()) {
472     // Will compress after insertion.
473     gap_initialized = false;
474     std::swap(instr->parallel_moves()[0], instr->parallel_moves()[1]);
475   }
476   ParallelMove* moves = instr->GetOrCreateParallelMove(
477       static_cast<Instruction::GapPosition>(0), code_zone());
478   // Delete relevant entries in predecessors and move everything to block.
479   bool first_iteration = true;
480   for (RpoNumber& pred_index : block->predecessors()) {
481     const InstructionBlock* pred = code()->InstructionBlockAt(pred_index);
482     for (MoveOperands* move : *LastInstruction(pred)->parallel_moves()[0]) {
483       if (move->IsRedundant()) continue;
484       MoveKey key = {move->source(), move->destination()};
485       auto it = move_map.find(key);
486       if (it != move_map.end()) {
487         if (first_iteration) {
488           moves->AddMove(move->source(), move->destination());
489         }
490         move->Eliminate();
491       }
492     }
493     first_iteration = false;
494   }
495   // Compress.
496   if (!gap_initialized) {
497     CompressMoves(instr->parallel_moves()[0], instr->parallel_moves()[1]);
498   }
499   CompressBlock(block);
500 }
501 
502 
503 namespace {
504 
IsSlot(const InstructionOperand & op)505 bool IsSlot(const InstructionOperand& op) {
506   return op.IsStackSlot() || op.IsFPStackSlot();
507 }
508 
509 
LoadCompare(const MoveOperands * a,const MoveOperands * b)510 bool LoadCompare(const MoveOperands* a, const MoveOperands* b) {
511   if (!a->source().EqualsCanonicalized(b->source())) {
512     return a->source().CompareCanonicalized(b->source());
513   }
514   if (IsSlot(a->destination()) && !IsSlot(b->destination())) return false;
515   if (!IsSlot(a->destination()) && IsSlot(b->destination())) return true;
516   return a->destination().CompareCanonicalized(b->destination());
517 }
518 
519 }  // namespace
520 
521 
522 // Split multiple loads of the same constant or stack slot off into the second
523 // slot and keep remaining moves in the first slot.
FinalizeMoves(Instruction * instr)524 void MoveOptimizer::FinalizeMoves(Instruction* instr) {
525   MoveOpVector& loads = local_vector();
526   DCHECK(loads.empty());
527 
528   ParallelMove* parallel_moves = instr->parallel_moves()[0];
529   if (parallel_moves == nullptr) return;
530   // Find all the loads.
531   for (MoveOperands* move : *parallel_moves) {
532     if (move->IsRedundant()) continue;
533     if (move->source().IsConstant() || IsSlot(move->source())) {
534       loads.push_back(move);
535     }
536   }
537   if (loads.empty()) return;
538   // Group the loads by source, moving the preferred destination to the
539   // beginning of the group.
540   std::sort(loads.begin(), loads.end(), LoadCompare);
541   MoveOperands* group_begin = nullptr;
542   for (MoveOperands* load : loads) {
543     // New group.
544     if (group_begin == nullptr ||
545         !load->source().EqualsCanonicalized(group_begin->source())) {
546       group_begin = load;
547       continue;
548     }
549     // Nothing to be gained from splitting here.
550     if (IsSlot(group_begin->destination())) continue;
551     // Insert new move into slot 1.
552     ParallelMove* slot_1 = instr->GetOrCreateParallelMove(
553         static_cast<Instruction::GapPosition>(1), code_zone());
554     slot_1->AddMove(group_begin->destination(), load->destination());
555     load->Eliminate();
556   }
557   loads.clear();
558 }
559 
560 }  // namespace compiler
561 }  // namespace internal
562 }  // namespace v8
563