/*
 * Copyright (C) 2014 Rob Clark <robclark@freedesktop.org>
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 *
 * Authors:
 *    Rob Clark <robclark@freedesktop.org>
 */
/*
 * Find/group instruction neighbors:
 */
34 insert_mov(struct ir3_instruction
*collect
, int idx
)
36 struct ir3_instruction
*src
= ssa(collect
->regs
[idx
+1]);
37 struct ir3_instruction
*mov
= ir3_MOV(src
->block
, src
,
38 (collect
->regs
[idx
+1]->flags
& IR3_REG_HALF
) ? TYPE_U16
: TYPE_U32
);
40 collect
->regs
[idx
+1]->instr
= mov
;
42 /* if collect and src are in the same block, move the inserted mov
43 * to just before the collect to avoid a use-before-def. Otherwise
44 * it should be safe to leave at the end of the block it is in:
46 if (src
->block
== collect
->block
) {
47 ir3_instr_move_before(mov
, collect
);
51 /* verify that cur != instr, but cur is also not in instr's neighbor-list: */
53 in_neighbor_list(struct ir3_instruction
*instr
, struct ir3_instruction
*cur
, int pos
)
63 for (instr
= ir3_neighbor_first(instr
); instr
; instr
= instr
->cp
.right
)
64 if ((idx
++ != pos
) && (instr
== cur
))
71 group_collect(struct ir3_instruction
*collect
)
73 struct ir3_register
**regs
= &collect
->regs
[1];
74 unsigned n
= collect
->regs_count
- 1;
76 /* first pass, figure out what has conflicts and needs a mov
77 * inserted. Do this up front, before starting to setup
78 * left/right neighbor pointers. Trying to do it in a single
79 * pass could result in a situation where we can't even setup
80 * the mov's right neighbor ptr if the next instr also needs
84 for (unsigned i
= 0; i
< n
; i
++) {
85 struct ir3_instruction
*instr
= ssa(regs
[i
]);
87 struct ir3_instruction
*left
= (i
> 0) ? ssa(regs
[i
- 1]) : NULL
;
88 struct ir3_instruction
*right
= (i
< (n
-1)) ? ssa(regs
[i
+ 1]) : NULL
;
91 /* check for left/right neighbor conflicts: */
92 conflict
= conflicts(instr
->cp
.left
, left
) ||
93 conflicts(instr
->cp
.right
, right
);
95 /* Mixing array elements and higher register classes
96 * (ie. groups) doesn't really work out in RA. See:
98 * https://trello.com/c/DqeDkeVf/156-bug-with-stk-70frag
100 if (instr
->regs
[0]->flags
& IR3_REG_ARRAY
)
103 /* we also can't have an instr twice in the group: */
104 for (unsigned j
= i
+ 1; (j
< n
) && !conflict
; j
++)
105 if (in_neighbor_list(ssa(regs
[j
]), instr
, i
))
109 insert_mov(collect
, i
);
110 /* inserting the mov may have caused a conflict
111 * against the previous:
118 /* second pass, now that we've inserted mov's, fixup left/right
119 * neighbors. This is guaranteed to succeed, since by definition
120 * the newly inserted mov's cannot conflict with anything.
122 for (unsigned i
= 0; i
< n
; i
++) {
123 struct ir3_instruction
*instr
= ssa(regs
[i
]);
125 struct ir3_instruction
*left
= (i
> 0) ? ssa(regs
[i
- 1]) : NULL
;
126 struct ir3_instruction
*right
= (i
< (n
-1)) ? ssa(regs
[i
+ 1]) : NULL
;
128 debug_assert(!conflicts(instr
->cp
.left
, left
));
130 instr
->cp
.left_cnt
++;
131 instr
->cp
.left
= left
;
134 debug_assert(!conflicts(instr
->cp
.right
, right
));
136 instr
->cp
.right_cnt
++;
137 instr
->cp
.right
= right
;
144 instr_find_neighbors(struct ir3_instruction
*instr
)
146 bool progress
= false;
148 if (ir3_instr_check_mark(instr
))
151 if (instr
->opc
== OPC_META_COLLECT
) {
152 group_collect(instr
);
156 foreach_ssa_src (src
, instr
)
157 progress
|= instr_find_neighbors(src
);
163 find_neighbors(struct ir3
*ir
)
165 bool progress
= false;
168 foreach_output (out
, ir
)
169 progress
|= instr_find_neighbors(out
);
171 foreach_block (block
, &ir
->block_list
) {
172 for (i
= 0; i
< block
->keeps_count
; i
++) {
173 struct ir3_instruction
*instr
= block
->keeps
[i
];
174 progress
|= instr_find_neighbors(instr
);
177 /* We also need to account for if-condition: */
178 if (block
->condition
)
179 progress
|= instr_find_neighbors(block
->condition
);
/**
 * Entry point of the grouping pass: find and link instruction neighbors
 * for the whole shader.
 *
 * @ir: shader IR to process
 *
 * Returns the progress flag reported by find_neighbors().
 *
 * NOTE(review): the return type and the ir3_clear_mark() call are not
 * visible in the listing this block was restored from (one statement is
 * missing ahead of the return; clearing the marks that
 * instr_find_neighbors() tests is the presumed content) -- confirm
 * against upstream.
 */
bool
ir3_group(struct ir3 *ir)
{
	ir3_clear_mark(ir);
	return find_neighbors(ir);
}