1bc1dc812c6fe9ba7fd25607e7fd016e8e9b4a40
[mesa.git] / src / gallium / drivers / lima / ir / pp / liveness.c
1 /*
2 * Copyright (c) 2019 Lima Project
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sub license,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the
12 * next paragraph) shall be included in all copies or substantial portions
13 * of the Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
21 * DEALINGS IN THE SOFTWARE.
22 *
23 */
24
25 #include "ppir.h"
26
27 /* Propagates liveness from a liveness set to another by performing the
28 * union between sets. */
29 static void
30 ppir_liveness_propagate(ppir_compiler *comp,
31 struct ppir_liveness *dest, struct ppir_liveness *src,
32 struct set *dest_set, struct set *src_set)
33 {
34 set_foreach(src_set, entry_src) {
35 const struct ppir_liveness *s = entry_src->key;
36 assert(s);
37
38 unsigned int regalloc_index = s->reg->regalloc_index;
39
40 dest[regalloc_index].reg = src[regalloc_index].reg;
41 dest[regalloc_index].mask |= src[regalloc_index].mask;
42 _mesa_set_add(dest_set, &dest[regalloc_index]);
43 }
44 }
45
46 /* Clone a liveness set (without propagation) */
47 static void
48 ppir_liveness_set_clone(ppir_compiler *comp,
49 struct ppir_liveness *dest, struct ppir_liveness *src,
50 struct set *dest_set, struct set *src_set)
51 {
52 _mesa_set_clear(dest_set, NULL);
53 memset(dest, 0, list_length(&comp->reg_list) * sizeof(struct ppir_liveness));
54 memcpy(dest, src,
55 list_length(&comp->reg_list) * sizeof(struct ppir_liveness));
56
57 set_foreach(src_set, entry_src) {
58 const struct ppir_liveness *s = entry_src->key;
59 assert(s);
60
61 unsigned int regalloc_index = s->reg->regalloc_index;
62 dest[regalloc_index].reg = src[regalloc_index].reg;
63 dest[regalloc_index].mask = src[regalloc_index].mask;
64 _mesa_set_add(dest_set, &dest[regalloc_index]);
65 }
66 }
67
68 /* Check whether two liveness sets are equal. */
69 static bool
70 ppir_liveness_set_equal(ppir_compiler *comp,
71 struct ppir_liveness *l1, struct ppir_liveness *l2,
72 struct set *set1, struct set *set2)
73 {
74 set_foreach(set1, entry1) {
75 const struct ppir_liveness *k1 = entry1->key;
76 unsigned int regalloc_index = k1->reg->regalloc_index;
77
78 struct set_entry *entry2 = _mesa_set_search(set2, &l2[regalloc_index]);
79 if (!entry2)
80 return false;
81
82 const struct ppir_liveness *k2 = entry2->key;
83
84 if (k1->mask != k2->mask)
85 return false;
86 }
87 set_foreach(set2, entry2) {
88 const struct ppir_liveness *k2 = entry2->key;
89 unsigned int regalloc_index = k2->reg->regalloc_index;
90
91 struct set_entry *entry1 = _mesa_set_search(set1, &l1[regalloc_index]);
92 if (!entry1)
93 return false;
94
95 const struct ppir_liveness *k1 = entry1->key;
96
97 if (k2->mask != k1->mask)
98 return false;
99 }
100 return true;
101 }
102
103 /* Update the liveness information of the instruction by adding its srcs
104 * as live registers to the live_in set. */
105 static void
106 ppir_liveness_instr_srcs(ppir_compiler *comp, ppir_instr *instr)
107 {
108 for (int i = PPIR_INSTR_SLOT_NUM-1; i >= 0; i--) {
109 ppir_node *node = instr->slots[i];
110 if (!node)
111 continue;
112
113 switch(node->op) {
114 case ppir_op_const:
115 case ppir_op_undef:
116 continue;
117 default:
118 break;
119 }
120
121 for (int i = 0; i < ppir_node_get_src_num(node); i++) {
122 ppir_src *src = ppir_node_get_src(node, i);
123 if (!src || src->type == ppir_target_pipeline)
124 continue;
125
126 ppir_reg *reg = ppir_src_get_reg(src);
127 if (!reg || reg->undef)
128 continue;
129
130 /* if some other op on this same instruction is writing,
131 * we just need to reserve a register for this particular
132 * instruction. Add the register to live_out to make that
133 * interference happen without propagating its liveness. */
134 if (src->node && src->node->instr == instr) {
135 instr->live_out[reg->regalloc_index].reg = reg;
136 _mesa_set_add(instr->live_out_set, &instr->live_out[reg->regalloc_index]);
137 continue;
138 }
139
140 struct set_entry *live = _mesa_set_search(instr->live_in_set,
141 &instr->live_in[reg->regalloc_index]);
142 if (src->type == ppir_target_ssa) {
143 /* reg is read, needs to be live before instr */
144 if (live)
145 continue;
146
147 instr->live_in[reg->regalloc_index].reg = reg;
148 _mesa_set_add(instr->live_in_set, &instr->live_in[reg->regalloc_index]);
149 }
150 else {
151 unsigned int mask = ppir_src_get_mask(node);
152
153 /* read reg is type register, need to check if this sets
154 * any additional bits in the current mask */
155 if (live && (instr->live_in[reg->regalloc_index].mask ==
156 (instr->live_in[reg->regalloc_index].mask | mask)))
157 continue;
158
159 /* some new components */
160 instr->live_in[reg->regalloc_index].reg = reg;
161 instr->live_in[reg->regalloc_index].mask |= mask;
162 _mesa_set_add(instr->live_in_set, &instr->live_in[reg->regalloc_index]);
163 }
164 }
165 }
166 }
167
168
169 /* Update the liveness information of the instruction by removing its
170 * dests from the live_in set. */
171 static void
172 ppir_liveness_instr_dest(ppir_compiler *comp, ppir_instr *instr)
173 {
174 for (int i = PPIR_INSTR_SLOT_NUM-1; i >= 0; i--) {
175 ppir_node *node = instr->slots[i];
176 if (!node)
177 continue;
178
179 switch(node->op) {
180 case ppir_op_const:
181 case ppir_op_undef:
182 case ppir_op_store_color: /* never clear dest if its store output */
183 continue;
184 default:
185 break;
186 }
187
188 ppir_dest *dest = ppir_node_get_dest(node);
189 if (!dest || dest->type == ppir_target_pipeline)
190 continue;
191 ppir_reg *reg = ppir_dest_get_reg(dest);
192 if (!reg || reg->undef)
193 continue;
194
195 struct set_entry *live = _mesa_set_search(instr->live_in_set,
196 &instr->live_in[reg->regalloc_index]);
197
198 /* If a register is written but wasn't read in a later instruction, it is
199 * either dead code or a bug. For now, assign an interference to it to
200 * ensure it doesn't get assigned a live register and overwrites it. */
201 if (!live) {
202 instr->live_out[reg->regalloc_index].reg = reg;
203 _mesa_set_add(instr->live_out_set, &instr->live_out[reg->regalloc_index]);
204 continue;
205 }
206
207 if (dest->type == ppir_target_ssa) {
208 /* reg is written and ssa, is not live before instr */
209 _mesa_set_remove_key(instr->live_in_set, &instr->live_in[reg->regalloc_index]);
210 }
211 else {
212 unsigned int mask = ppir_src_get_mask(node);
213 /* written reg is type register, need to check if this clears
214 * the remaining mask to remove it from the live set */
215 if (instr->live_in[reg->regalloc_index].mask ==
216 (instr->live_in[reg->regalloc_index].mask & ~mask))
217 continue;
218
219 instr->live_in[reg->regalloc_index].mask &= ~mask;
220 /* unset reg if all remaining bits were cleared */
221 if (!instr->live_in[reg->regalloc_index].mask) {
222 _mesa_set_remove_key(instr->live_in_set, &instr->live_in[reg->regalloc_index]);
223 }
224 }
225 }
226 }
227
228 /* Main loop, iterate blocks/instructions/ops backwards, propagate
229 * livenss and update liveness of each instruction. */
230 static bool
231 ppir_liveness_compute_live_sets(ppir_compiler *comp)
232 {
233 bool cont = false;
234 list_for_each_entry_rev(ppir_block, block, &comp->block_list, list) {
235 ppir_instr *first = list_first_entry(&block->instr_list, ppir_instr, list);
236 ppir_instr *last = list_last_entry(&block->instr_list, ppir_instr, list);
237
238 /* inherit live_out from the other blocks live_in */
239 for (int i = 0; i < 2; i++) {
240 ppir_block *succ = block->successors[i];
241 if (!succ)
242 continue;
243
244 ppir_liveness_propagate(comp, block->live_out, succ->live_in,
245 block->live_out_set, succ->live_in_set);
246 }
247
248 list_for_each_entry_rev(ppir_instr, instr, &block->instr_list, list) {
249 /* inherit (or-) live variables from next instr or block */
250 if (instr == last) {
251 ppir_liveness_set_clone(comp,
252 instr->live_out, block->live_out,
253 instr->live_out_set, block->live_out_set);
254 }
255 else {
256 ppir_instr *next_instr = LIST_ENTRY(ppir_instr, instr->list.next, list);
257 ppir_liveness_set_clone(comp,
258 instr->live_out, next_instr->live_in,
259 instr->live_out_set, next_instr->live_in_set);
260 }
261 /* initial copy to check for changes */
262 struct set *temp_live_in_set = _mesa_set_create(comp,
263 _mesa_hash_pointer,
264 _mesa_key_pointer_equal);
265 struct ppir_liveness temp_live_in[list_length(&comp->reg_list)];
266 ppir_liveness_set_clone(comp,
267 temp_live_in, instr->live_in,
268 temp_live_in_set, instr->live_in_set);
269
270 /* initialize live_in for potential changes */
271 ppir_liveness_propagate(comp, instr->live_in, instr->live_out,
272 instr->live_in_set, instr->live_out_set);
273
274 ppir_liveness_instr_dest(comp, instr);
275 ppir_liveness_instr_srcs(comp, instr);
276
277 cont |= !ppir_liveness_set_equal(comp, temp_live_in, instr->live_in,
278 temp_live_in_set, instr->live_in_set);
279 }
280
281 /* inherit live_in from the first instruction in the block,
282 * or live_out if it is empty */
283 if (!list_is_empty(&block->instr_list) && first && first->scheduled)
284 ppir_liveness_set_clone(comp, block->live_in, first->live_in,
285 block->live_in_set, first->live_in_set);
286 else
287 ppir_liveness_set_clone(comp, block->live_in, block->live_out,
288 block->live_in_set, block->live_out_set);
289 }
290
291 return cont;
292 }
293
294 /*
295 * Liveness analysis is based on https://en.wikipedia.org/wiki/Live_variable_analysis
296 * This implementation calculates liveness before/after each
297 * instruction. Aggregated block liveness information is stored
298 * before/after blocks for conveniency (handle e.g. empty blocks).
299 * Blocks/instructions/ops are iterated backwards so register reads are
300 * propagated up to the instruction that writes it.
301 *
302 * 1) Before computing liveness for each instruction, propagate live_out
303 * from the next instruction. If it is the last instruction in a
304 * block, propagate liveness from all possible next instructions
305 * (in this case, this information comes from the live_out of the
306 * block itself).
307 * 2) Calculate live_in for the each instruction. The initial live_in is
308 * a copy of its live_out so registers who aren't touched by this
309 * instruction are kept intact.
310 * - If a register is written by this instruction, it no longer needs
311 * to be live before the instruction, so it is removed from live_in.
312 * - If a register is read by this instruction, it needs to be live
313 * before its execution, so add it to live_in.
314 * - Non-ssa registers are a special case. For this, the algorithm
315 * keeps and updates the mask of live components following the same
316 * logic as above. The register is only removed from the live set
317 * when no live components are left.
318 * - If a non-ssa register is written and read in the same
319 * instruction, it stays in live_in.
320 * - Another special case is a ssa register that is written by an
321 * early op in the instruction, and read by a later op. In this case,
322 * the algorithm adds it to the live_out set so that the register
323 * allocator properly assigns an interference for it.
324 * 3) The algorithm must run over the entire program until it converges,
325 * i.e. a full run happens without changes. This is because blocks
326 * are updated sequentially and updates in a block may need to be
327 * propagated to parent blocks that were already calculated in the
328 * current run.
329 */
330 void
331 ppir_liveness_analysis(ppir_compiler *comp)
332 {
333 while (ppir_liveness_compute_live_sets(comp))
334 ;
335 }