1 /*
2  * Copyright © 2010 Intel Corporation
3  *
4  * Permission is hereby granted, free of charge, to any person obtaining a
5  * copy of this software and associated documentation files (the "Software"),
6  * to deal in the Software without restriction, including without limitation
7  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8  * and/or sell copies of the Software, and to permit persons to whom the
9  * Software is furnished to do so, subject to the following conditions:
10  *
11  * The above copyright notice and this permission notice (including the next
12  * paragraph) shall be included in all copies or substantial portions of the
13  * Software.
14  *
15  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
18  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
21  * DEALINGS IN THE SOFTWARE.
22  */
23 
24 #include "glsl_types.h"
25 #include "loop_analysis.h"
26 #include "ir_hierarchical_visitor.h"
27 
28 class loop_unroll_visitor : public ir_hierarchical_visitor {
29 public:
loop_unroll_visitor(loop_state * state,unsigned max_iterations)30    loop_unroll_visitor(loop_state *state, unsigned max_iterations)
31    {
32       this->state = state;
33       this->progress = false;
34       this->max_iterations = max_iterations;
35    }
36 
37    virtual ir_visitor_status visit_leave(ir_loop *ir);
38 
39    loop_state *state;
40 
41    bool progress;
42    unsigned max_iterations;
43 };
44 
45 
46 static bool
is_break(ir_instruction * ir)47 is_break(ir_instruction *ir)
48 {
49    return ir != NULL && ir->ir_type == ir_type_loop_jump
50 		     && ((ir_loop_jump *) ir)->is_break();
51 }
52 
53 class loop_unroll_count : public ir_hierarchical_visitor {
54 public:
55    int nodes;
56    bool fail;
57 
loop_unroll_count(exec_list * list)58    loop_unroll_count(exec_list *list)
59    {
60       nodes = 0;
61       fail = false;
62 
63       run(list);
64    }
65 
visit_enter(ir_assignment * ir)66    virtual ir_visitor_status visit_enter(ir_assignment *ir)
67    {
68       nodes++;
69       return visit_continue;
70    }
71 
visit_enter(ir_expression * ir)72    virtual ir_visitor_status visit_enter(ir_expression *ir)
73    {
74       nodes++;
75       return visit_continue;
76    }
77 
visit_enter(ir_loop * ir)78    virtual ir_visitor_status visit_enter(ir_loop *ir)
79    {
80       fail = true;
81       return visit_continue;
82    }
83 };
84 
85 
86 ir_visitor_status
visit_leave(ir_loop * ir)87 loop_unroll_visitor::visit_leave(ir_loop *ir)
88 {
89    loop_variable_state *const ls = this->state->get(ir);
90    int iterations;
91 
92    /* If we've entered a loop that hasn't been analyzed, something really,
93     * really bad has happened.
94     */
95    if (ls == NULL) {
96       assert(ls != NULL);
97       return visit_continue;
98    }
99 
100    iterations = ls->max_iterations;
101 
102    /* Don't try to unroll loops where the number of iterations is not known
103     * at compile-time.
104     */
105    if (iterations < 0)
106       return visit_continue;
107 
108    /* Don't try to unroll loops that have zillions of iterations either.
109     */
110    if (iterations > (int) max_iterations)
111       return visit_continue;
112 
113    /* Don't try to unroll nested loops and loops with a huge body.
114     */
115    loop_unroll_count count(&ir->body_instructions);
116 
117    if (count.fail || count.nodes * iterations > (int)max_iterations * 5)
118       return visit_continue;
119 
120    if (ls->num_loop_jumps > 1)
121       return visit_continue;
122    else if (ls->num_loop_jumps) {
123       ir_instruction *last_ir = (ir_instruction *) ir->body_instructions.get_tail();
124       assert(last_ir != NULL);
125 
126       if (is_break(last_ir)) {
127          /* If the only loop-jump is a break at the end of the loop, the loop
128           * will execute exactly once.  Remove the break, set the iteration
129           * count, and fall through to the normal unroller.
130           */
131          last_ir->remove();
132          iterations = 1;
133 
134          this->progress = true;
135       } else {
136          ir_if *ir_if = NULL;
137          ir_instruction *break_ir = NULL;
138          bool continue_from_then_branch = false;
139 
140          foreach_list(node, &ir->body_instructions) {
141             /* recognize loops in the form produced by ir_lower_jumps */
142             ir_instruction *cur_ir = (ir_instruction *) node;
143 
144             ir_if = cur_ir->as_if();
145             if (ir_if != NULL) {
146 	       /* Determine which if-statement branch, if any, ends with a
147 		* break.  The branch that did *not* have the break will get a
148 		* temporary continue inserted in each iteration of the loop
149 		* unroll.
150 		*
151 		* Note that since ls->num_loop_jumps is <= 1, it is impossible
152 		* for both branches to end with a break.
153 		*/
154                ir_instruction *ir_if_last =
155                   (ir_instruction *) ir_if->then_instructions.get_tail();
156 
157                if (is_break(ir_if_last)) {
158                   continue_from_then_branch = false;
159                   break_ir = ir_if_last;
160                   break;
161                } else {
162                   ir_if_last =
163 		     (ir_instruction *) ir_if->else_instructions.get_tail();
164 
165                   if (is_break(ir_if_last)) {
166                      break_ir = ir_if_last;
167                      continue_from_then_branch = true;
168                      break;
169                   }
170                }
171             }
172          }
173 
174          if (break_ir == NULL)
175             return visit_continue;
176 
177          /* move instructions after then if in the continue branch */
178          while (!ir_if->get_next()->is_tail_sentinel()) {
179             ir_instruction *move_ir = (ir_instruction *) ir_if->get_next();
180 
181             move_ir->remove();
182             if (continue_from_then_branch)
183                ir_if->then_instructions.push_tail(move_ir);
184             else
185                ir_if->else_instructions.push_tail(move_ir);
186          }
187 
188          /* Remove the break from the if-statement.
189           */
190          break_ir->remove();
191 
192          void *const mem_ctx = ralloc_parent(ir);
193          ir_instruction *ir_to_replace = ir;
194 
195          for (int i = 0; i < iterations; i++) {
196             exec_list copy_list;
197 
198             copy_list.make_empty();
199             clone_ir_list(mem_ctx, &copy_list, &ir->body_instructions);
200 
201             ir_if = ((ir_instruction *) copy_list.get_tail())->as_if();
202             assert(ir_if != NULL);
203 
204             ir_to_replace->insert_before(&copy_list);
205             ir_to_replace->remove();
206 
207             /* placeholder that will be removed in the next iteration */
208             ir_to_replace =
209 	       new(mem_ctx) ir_loop_jump(ir_loop_jump::jump_continue);
210 
211             exec_list *const list = (continue_from_then_branch)
212                ? &ir_if->then_instructions : &ir_if->else_instructions;
213 
214             list->push_tail(ir_to_replace);
215          }
216 
217          ir_to_replace->remove();
218 
219          this->progress = true;
220          return visit_continue;
221       }
222    }
223 
224    void *const mem_ctx = ralloc_parent(ir);
225 
226    for (int i = 0; i < iterations; i++) {
227       exec_list copy_list;
228 
229       copy_list.make_empty();
230       clone_ir_list(mem_ctx, &copy_list, &ir->body_instructions);
231 
232       ir->insert_before(&copy_list);
233    }
234 
235    /* The loop has been replaced by the unrolled copies.  Remove the original
236     * loop from the IR sequence.
237     */
238    ir->remove();
239 
240    this->progress = true;
241    return visit_continue;
242 }
243 
244 
245 bool
unroll_loops(exec_list * instructions,loop_state * ls,unsigned max_iterations)246 unroll_loops(exec_list *instructions, loop_state *ls, unsigned max_iterations)
247 {
248    loop_unroll_visitor v(ls, max_iterations);
249 
250    v.run(instructions);
251 
252    return v.progress;
253 }
254