Subversion Repositories Kolibri OS

Rev

Go to most recent revision | Details | Last modification | View Log | RSS feed

Rev Author Line No. Line
4358 Serge 1
/*
2
 * Copyright © 2010 Intel Corporation
3
 *
4
 * Permission is hereby granted, free of charge, to any person obtaining a
5
 * copy of this software and associated documentation files (the "Software"),
6
 * to deal in the Software without restriction, including without limitation
7
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8
 * and/or sell copies of the Software, and to permit persons to whom the
9
 * Software is furnished to do so, subject to the following conditions:
10
 *
11
 * The above copyright notice and this permission notice (including the next
12
 * paragraph) shall be included in all copies or substantial portions of the
13
 * Software.
14
 *
15
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
18
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
21
 * DEALINGS IN THE SOFTWARE.
22
 */
23
 
24
/**
25
 * \file opt_dead_code_local.cpp
26
 *
27
 * Eliminates local dead assignments from the code.
28
 *
29
 * This operates on basic blocks, tracking assignments and finding if
30
 * they're used before the variable is completely reassigned.
31
 *
32
 * Compare this to ir_dead_code.cpp, which operates globally looking
33
 * for assignments to variables that are never read.
34
 */
35
 
36
#include "ir.h"
37
#include "ir_basic_block.h"
38
#include "ir_optimization.h"
39
#include "glsl_types.h"
40
 
41
/* When set to true, the pass traces its decisions to stdout via printf(). */
static bool debug = false;
42
 
43
namespace {
44
 
45
class assignment_entry : public exec_node
46
{
47
public:
48
   assignment_entry(ir_variable *lhs, ir_assignment *ir)
49
   {
50
      assert(lhs);
51
      assert(ir);
52
      this->lhs = lhs;
53
      this->ir = ir;
54
      this->available = ir->write_mask;
55
   }
56
 
57
   ir_variable *lhs;
58
   ir_assignment *ir;
59
 
60
   /* bitmask of xyzw channels written that haven't been used so far. */
61
   int available;
62
};
63
 
64
class kill_for_derefs_visitor : public ir_hierarchical_visitor {
65
public:
66
   kill_for_derefs_visitor(exec_list *assignments)
67
   {
68
      this->assignments = assignments;
69
   }
70
 
71
   void kill_channels(ir_variable *const var, int used)
72
   {
73
      foreach_iter(exec_list_iterator, iter, *this->assignments) {
74
	 assignment_entry *entry = (assignment_entry *)iter.get();
75
 
76
	 if (entry->lhs == var) {
77
	    if (var->type->is_scalar() || var->type->is_vector()) {
78
	       if (debug)
79
		  printf("kill %s (0x%01x - 0x%01x)\n", entry->lhs->name,
80
			 entry->available, used);
81
	       entry->available &= ~used;
82
	       if (!entry->available)
83
		  entry->remove();
84
	    } else {
85
	       if (debug)
86
		  printf("kill %s\n", entry->lhs->name);
87
	       entry->remove();
88
	    }
89
	 }
90
      }
91
   }
92
 
93
   virtual ir_visitor_status visit(ir_dereference_variable *ir)
94
   {
95
      kill_channels(ir->var, ~0);
96
 
97
      return visit_continue;
98
   }
99
 
100
   virtual ir_visitor_status visit(ir_swizzle *ir)
101
   {
102
      ir_dereference_variable *deref = ir->val->as_dereference_variable();
103
      if (!deref)
104
	 return visit_continue;
105
 
106
      int used = 0;
107
      used |= 1 << ir->mask.x;
108
      used |= 1 << ir->mask.y;
109
      used |= 1 << ir->mask.z;
110
      used |= 1 << ir->mask.w;
111
 
112
      kill_channels(deref->var, used);
113
 
114
      return visit_continue_with_parent;
115
   }
116
 
117
private:
118
   exec_list *assignments;
119
};
120
 
121
class array_index_visit : public ir_hierarchical_visitor {
122
public:
123
   array_index_visit(ir_hierarchical_visitor *v)
124
   {
125
      this->visitor = v;
126
   }
127
 
128
   virtual ir_visitor_status visit_enter(class ir_dereference_array *ir)
129
   {
130
      ir->array_index->accept(visitor);
131
      return visit_continue;
132
   }
133
 
134
   static void run(ir_instruction *ir, ir_hierarchical_visitor *v)
135
   {
136
      array_index_visit top_visit(v);
137
      ir->accept(& top_visit);
138
   }
139
 
140
   ir_hierarchical_visitor *visitor;
141
};
142
 
143
} /* unnamed namespace */
144
 
145
/**
146
 * Adds an entry to the available copy list if it's a plain assignment
147
 * of a variable to a variable.
148
 */
149
static bool
150
process_assignment(void *ctx, ir_assignment *ir, exec_list *assignments)
151
{
152
   ir_variable *var = NULL;
153
   bool progress = false;
154
   kill_for_derefs_visitor v(assignments);
155
 
156
   /* Kill assignment entries for things used to produce this assignment. */
157
   ir->rhs->accept(&v);
158
   if (ir->condition) {
159
      ir->condition->accept(&v);
160
   }
161
 
162
   /* Kill assignment enties used as array indices.
163
    */
164
   array_index_visit::run(ir->lhs, &v);
165
   var = ir->lhs->variable_referenced();
166
   assert(var);
167
 
168
   /* Now, check if we did a whole-variable assignment. */
169
   if (!ir->condition) {
170
      ir_dereference_variable *deref_var = ir->lhs->as_dereference_variable();
171
 
172
      /* If it's a vector type, we can do per-channel elimination of
173
       * use of the RHS.
174
       */
175
      if (deref_var && (deref_var->var->type->is_scalar() ||
176
			deref_var->var->type->is_vector())) {
177
 
178
	 if (debug)
179
	    printf("looking for %s.0x%01x to remove\n", var->name,
180
		   ir->write_mask);
181
 
182
	 foreach_iter(exec_list_iterator, iter, *assignments) {
183
	    assignment_entry *entry = (assignment_entry *)iter.get();
184
 
185
	    if (entry->lhs != var)
186
	       continue;
187
 
188
	    int remove = entry->available & ir->write_mask;
189
	    if (debug) {
190
	       printf("%s 0x%01x - 0x%01x = 0x%01x\n",
191
		      var->name,
192
		      entry->ir->write_mask,
193
		      remove, entry->ir->write_mask & ~remove);
194
	    }
195
	    if (remove) {
196
	       progress = true;
197
 
198
	       if (debug) {
199
		  printf("rewriting:\n  ");
200
		  entry->ir->print();
201
		  printf("\n");
202
	       }
203
 
204
	       entry->ir->write_mask &= ~remove;
205
	       entry->available &= ~remove;
206
	       if (entry->ir->write_mask == 0) {
207
		  /* Delete the dead assignment. */
208
		  entry->ir->remove();
209
		  entry->remove();
210
	       } else {
211
		  void *mem_ctx = ralloc_parent(entry->ir);
212
		  /* Reswizzle the RHS arguments according to the new
213
		   * write_mask.
214
		   */
215
		  unsigned components[4];
216
		  unsigned channels = 0;
217
		  unsigned next = 0;
218
 
219
		  for (int i = 0; i < 4; i++) {
220
		     if ((entry->ir->write_mask | remove) & (1 << i)) {
221
			if (!(remove & (1 << i)))
222
			   components[channels++] = next;
223
			next++;
224
		     }
225
		  }
226
 
227
		  entry->ir->rhs = new(mem_ctx) ir_swizzle(entry->ir->rhs,
228
							   components,
229
							   channels);
230
		  if (debug) {
231
		     printf("to:\n  ");
232
		     entry->ir->print();
233
		     printf("\n");
234
		  }
235
	       }
236
	    }
237
	 }
238
      } else if (ir->whole_variable_written() != NULL) {
239
	 /* We did a whole-variable assignment.  So, any instruction in
240
	  * the assignment list with the same LHS is dead.
241
	  */
242
	 if (debug)
243
	    printf("looking for %s to remove\n", var->name);
244
	 foreach_iter(exec_list_iterator, iter, *assignments) {
245
	    assignment_entry *entry = (assignment_entry *)iter.get();
246
 
247
	    if (entry->lhs == var) {
248
	       if (debug)
249
		  printf("removing %s\n", var->name);
250
	       entry->ir->remove();
251
	       entry->remove();
252
	       progress = true;
253
	    }
254
	 }
255
      }
256
   }
257
 
258
   /* Add this instruction to the assignment list available to be removed. */
259
   assignment_entry *entry = new(ctx) assignment_entry(var, ir);
260
   assignments->push_tail(entry);
261
 
262
   if (debug) {
263
      printf("add %s\n", var->name);
264
 
265
      printf("current entries\n");
266
      foreach_iter(exec_list_iterator, iter, *assignments) {
267
	 assignment_entry *entry = (assignment_entry *)iter.get();
268
 
269
	 printf("    %s (0x%01x)\n", entry->lhs->name, entry->available);
270
      }
271
   }
272
 
273
   return progress;
274
}
275
 
276
static void
277
dead_code_local_basic_block(ir_instruction *first,
278
			     ir_instruction *last,
279
			     void *data)
280
{
281
   ir_instruction *ir, *ir_next;
282
   /* List of avaialble_copy */
283
   exec_list assignments;
284
   bool *out_progress = (bool *)data;
285
   bool progress = false;
286
 
287
   void *ctx = ralloc_context(NULL);
288
   /* Safe looping, since process_assignment */
289
   for (ir = first, ir_next = (ir_instruction *)first->next;;
290
	ir = ir_next, ir_next = (ir_instruction *)ir->next) {
291
      ir_assignment *ir_assign = ir->as_assignment();
292
 
293
      if (debug) {
294
	 ir->print();
295
	 printf("\n");
296
      }
297
 
298
      if (ir_assign) {
299
	 progress = process_assignment(ctx, ir_assign, &assignments) || progress;
300
      } else {
301
	 kill_for_derefs_visitor kill(&assignments);
302
	 ir->accept(&kill);
303
      }
304
 
305
      if (ir == last)
306
	 break;
307
   }
308
   *out_progress = progress;
309
   ralloc_free(ctx);
310
}
311
 
312
/**
313
 * Does a copy propagation pass on the code present in the instruction stream.
314
 */
315
bool
316
do_dead_code_local(exec_list *instructions)
317
{
318
   bool progress = false;
319
 
320
   call_for_basic_blocks(instructions, dead_code_local_basic_block, &progress);
321
 
322
   return progress;
323
}