2 * Copyright (c) 2017 Lima Project
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sub license,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the
12 * next paragraph) shall be included in all copies or substantial portions
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
21 * DEALINGS IN THE SOFTWARE.
25 #include "util/u_math.h"
26 #include "util/ralloc.h"
27 #include "util/bitscan.h"
/* Per-opcode description table, keyed by ppir_op through designated
 * initializers (e.g. [ppir_op_sel_cond], [ppir_op_load_varying]).
 *
 * The entries visible in this excerpt set a .name string, a .type node type
 * and a list of PPIR_INSTR_SLOT_* values; the single-slot lists end with
 * PPIR_INSTR_SLOT_END.  Within this file, ppir_node_create() reads .type
 * and ppir_node_print_node() reads .name from this table.
 *
 * NOTE(review): most entry designators and field names are missing from this
 * excerpt; the slot lists are presumably the instruction slots an op may be
 * scheduled into -- confirm against the ppir_op_info declaration.
 */
31 const ppir_op_info ppir_op_infos
[] = {
35 PPIR_INSTR_SLOT_ALU_SCL_ADD
, PPIR_INSTR_SLOT_ALU_SCL_MUL
,
36 PPIR_INSTR_SLOT_ALU_VEC_ADD
, PPIR_INSTR_SLOT_ALU_VEC_MUL
,
52 PPIR_INSTR_SLOT_ALU_SCL_MUL
, PPIR_INSTR_SLOT_ALU_VEC_MUL
,
59 PPIR_INSTR_SLOT_ALU_SCL_ADD
, PPIR_INSTR_SLOT_ALU_VEC_ADD
,
66 PPIR_INSTR_SLOT_ALU_VEC_ADD
, PPIR_INSTR_SLOT_END
72 PPIR_INSTR_SLOT_ALU_VEC_ADD
, PPIR_INSTR_SLOT_END
78 PPIR_INSTR_SLOT_ALU_COMBINE
, PPIR_INSTR_SLOT_END
84 PPIR_INSTR_SLOT_ALU_COMBINE
, PPIR_INSTR_SLOT_END
90 PPIR_INSTR_SLOT_ALU_COMBINE
, PPIR_INSTR_SLOT_END
96 PPIR_INSTR_SLOT_ALU_COMBINE
, PPIR_INSTR_SLOT_END
102 PPIR_INSTR_SLOT_ALU_COMBINE
, PPIR_INSTR_SLOT_END
108 PPIR_INSTR_SLOT_ALU_COMBINE
, PPIR_INSTR_SLOT_END
114 PPIR_INSTR_SLOT_ALU_SCL_ADD
, PPIR_INSTR_SLOT_ALU_SCL_MUL
,
115 PPIR_INSTR_SLOT_ALU_VEC_ADD
, PPIR_INSTR_SLOT_ALU_VEC_MUL
,
122 PPIR_INSTR_SLOT_ALU_SCL_ADD
, PPIR_INSTR_SLOT_ALU_SCL_MUL
,
123 PPIR_INSTR_SLOT_ALU_VEC_ADD
, PPIR_INSTR_SLOT_ALU_VEC_MUL
,
130 PPIR_INSTR_SLOT_ALU_SCL_ADD
, PPIR_INSTR_SLOT_ALU_VEC_ADD
,
137 PPIR_INSTR_SLOT_ALU_SCL_ADD
, PPIR_INSTR_SLOT_ALU_VEC_ADD
,
144 PPIR_INSTR_SLOT_ALU_SCL_ADD
, PPIR_INSTR_SLOT_ALU_VEC_ADD
,
151 PPIR_INSTR_SLOT_ALU_SCL_ADD
, PPIR_INSTR_SLOT_ALU_VEC_ADD
,
158 PPIR_INSTR_SLOT_ALU_SCL_ADD
, PPIR_INSTR_SLOT_ALU_VEC_ADD
,
165 PPIR_INSTR_SLOT_ALU_SCL_MUL
, PPIR_INSTR_SLOT_ALU_VEC_MUL
,
172 PPIR_INSTR_SLOT_ALU_SCL_MUL
, PPIR_INSTR_SLOT_ALU_VEC_MUL
,
179 PPIR_INSTR_SLOT_ALU_SCL_MUL
, PPIR_INSTR_SLOT_ALU_VEC_MUL
,
186 PPIR_INSTR_SLOT_ALU_SCL_MUL
, PPIR_INSTR_SLOT_ALU_VEC_MUL
,
199 PPIR_INSTR_SLOT_ALU_SCL_MUL
, PPIR_INSTR_SLOT_ALU_SCL_ADD
,
200 PPIR_INSTR_SLOT_ALU_VEC_MUL
, PPIR_INSTR_SLOT_ALU_VEC_ADD
,
207 PPIR_INSTR_SLOT_ALU_SCL_MUL
, PPIR_INSTR_SLOT_ALU_SCL_ADD
,
208 PPIR_INSTR_SLOT_ALU_VEC_MUL
, PPIR_INSTR_SLOT_ALU_VEC_ADD
,
215 PPIR_INSTR_SLOT_ALU_SCL_MUL
, PPIR_INSTR_SLOT_ALU_SCL_ADD
,
216 PPIR_INSTR_SLOT_ALU_VEC_MUL
, PPIR_INSTR_SLOT_ALU_VEC_ADD
,
223 PPIR_INSTR_SLOT_ALU_SCL_MUL
, PPIR_INSTR_SLOT_ALU_SCL_ADD
,
224 PPIR_INSTR_SLOT_ALU_VEC_MUL
, PPIR_INSTR_SLOT_ALU_VEC_ADD
,
228 [ppir_op_sel_cond
] = {
229 /* effectively mov, but must be scheduled only to
230 * PPIR_INSTR_SLOT_ALU_SCL_MUL */
233 PPIR_INSTR_SLOT_ALU_SCL_MUL
, PPIR_INSTR_SLOT_END
239 PPIR_INSTR_SLOT_ALU_SCL_ADD
, PPIR_INSTR_SLOT_ALU_VEC_ADD
,
246 PPIR_INSTR_SLOT_ALU_COMBINE
, PPIR_INSTR_SLOT_END
249 [ppir_op_load_varying
] = {
251 .type
= ppir_node_type_load
,
253 PPIR_INSTR_SLOT_VARYING
, PPIR_INSTR_SLOT_END
256 [ppir_op_load_coords
] = {
258 .type
= ppir_node_type_load
,
260 PPIR_INSTR_SLOT_VARYING
, PPIR_INSTR_SLOT_END
263 [ppir_op_load_coords_reg
] = {
264 .name
= "ld_coords_reg",
265 .type
= ppir_node_type_load
,
267 PPIR_INSTR_SLOT_VARYING
, PPIR_INSTR_SLOT_END
270 [ppir_op_load_fragcoord
] = {
271 .name
= "ld_fragcoord",
272 .type
= ppir_node_type_load
,
274 PPIR_INSTR_SLOT_VARYING
, PPIR_INSTR_SLOT_END
277 [ppir_op_load_pointcoord
] = {
278 .name
= "ld_pointcoord",
279 .type
= ppir_node_type_load
,
281 PPIR_INSTR_SLOT_VARYING
, PPIR_INSTR_SLOT_END
284 [ppir_op_load_frontface
] = {
285 .name
= "ld_frontface",
286 .type
= ppir_node_type_load
,
288 PPIR_INSTR_SLOT_VARYING
, PPIR_INSTR_SLOT_END
291 [ppir_op_load_uniform
] = {
293 .type
= ppir_node_type_load
,
295 PPIR_INSTR_SLOT_UNIFORM
, PPIR_INSTR_SLOT_END
298 [ppir_op_load_texture
] = {
300 .type
= ppir_node_type_load_texture
,
302 PPIR_INSTR_SLOT_TEXLD
, PPIR_INSTR_SLOT_END
305 [ppir_op_load_temp
] = {
307 .type
= ppir_node_type_load
,
309 PPIR_INSTR_SLOT_UNIFORM
, PPIR_INSTR_SLOT_END
314 .type
= ppir_node_type_const
,
316 [ppir_op_store_color
] = {
318 .type
= ppir_node_type_alu
,
320 PPIR_INSTR_SLOT_ALU_VEC_ADD
, PPIR_INSTR_SLOT_ALU_VEC_MUL
,
324 [ppir_op_store_temp
] = {
326 .type
= ppir_node_type_store
,
328 PPIR_INSTR_SLOT_STORE_TEMP
, PPIR_INSTR_SLOT_END
331 [ppir_op_discard
] = {
333 .type
= ppir_node_type_discard
,
335 PPIR_INSTR_SLOT_BRANCH
, PPIR_INSTR_SLOT_END
340 .type
= ppir_node_type_branch
,
342 PPIR_INSTR_SLOT_BRANCH
, PPIR_INSTR_SLOT_END
347 .type
= ppir_node_type_alu
,
353 .type
= ppir_node_type_alu
,
/* Allocate and initialise a node for opcode `op` in `block`.
 *
 * The allocation size is looked up in node_size[] using the node type that
 * ppir_op_infos[op].type gives for the opcode, and the memory comes from
 * rzalloc_size() with `block` as the ralloc parent.  The node's succ/pred
 * dependency lists start out empty.  The node is then registered in
 * comp->var_nodes and named "reg%d" (one var_nodes slot per bit taken from
 * `mask` with u_bit_scan, at (index << 2) + comp->reg_base + bit),
 * or "ssa%d" (slot var_nodes[index]), or simply named "new".  Finally it
 * receives the next value of comp->cur_index as its index.
 *
 * NOTE(review): the conditions choosing between the three naming paths, the
 * allocation-failure check and the return statement are not visible in this
 * excerpt -- presumably index >= 0 / mask != 0 select the path; confirm
 * against the full file.
 */
359 void *ppir_node_create(ppir_block
*block
, ppir_op op
, int index
, unsigned mask
)
361 ppir_compiler
*comp
= block
->comp
;
362 static const int node_size
[] = {
363 [ppir_node_type_alu
] = sizeof(ppir_alu_node
),
364 [ppir_node_type_const
] = sizeof(ppir_const_node
),
365 [ppir_node_type_load
] = sizeof(ppir_load_node
),
366 [ppir_node_type_store
] = sizeof(ppir_store_node
),
367 [ppir_node_type_load_texture
] = sizeof(ppir_load_texture_node
),
368 [ppir_node_type_discard
] = sizeof(ppir_discard_node
),
369 [ppir_node_type_branch
] = sizeof(ppir_branch_node
),
372 ppir_node_type type
= ppir_op_infos
[op
].type
;
373 int size
= node_size
[type
];
374 ppir_node
*node
= rzalloc_size(block
, size
);
378 list_inithead(&node
->succ_list
);
379 list_inithead(&node
->pred_list
);
383 /* reg has 4 slots for each component write node */
385 comp
->var_nodes
[(index
<< 2) + comp
->reg_base
+ u_bit_scan(&mask
)] = node
;
386 snprintf(node
->name
, sizeof(node
->name
), "reg%d", index
);
388 comp
->var_nodes
[index
] = node
;
389 snprintf(node
->name
, sizeof(node
->name
), "ssa%d", index
);
393 snprintf(node
->name
, sizeof(node
->name
), "new");
397 node
->index
= comp
->cur_index
++;
/* Record a dependency edge: `succ` depends on `pred`.
 *
 * A ppir_dep is allocated with `succ` as its ralloc parent and appended to
 * both succ->pred_list (via pred_link) and pred->succ_list (via succ_link).
 * Per the inline comments, no edge is added when the two nodes live in
 * different blocks or when succ already has a dep whose pred is `pred`.
 *
 * NOTE(review): the third parameter of the signature and the statements that
 * fill in the new dep's fields are not visible in this excerpt.
 */
403 void ppir_node_add_dep(ppir_node
*succ
, ppir_node
*pred
,
406 /* don't add dep for two nodes from different block */
407 if (succ
->block
!= pred
->block
)
410 /* don't add duplicated dep */
411 ppir_node_foreach_pred(succ
, dep
) {
412 if (dep
->pred
== pred
)
416 ppir_dep
*dep
= ralloc(succ
, ppir_dep
);
420 list_addtail(&dep
->pred_link
, &succ
->pred_list
);
421 list_addtail(&dep
->succ_link
, &pred
->succ_list
);
/* Unlink `dep` from both lists it sits on: its predecessor's successor list
 * (succ_link) and its successor's predecessor list (pred_link).
 *
 * NOTE(review): whether the dep's memory is released afterwards is not
 * visible in this excerpt.
 */
424 void ppir_node_remove_dep(ppir_dep
*dep
)
426 list_del(&dep
->succ_link
);
427 list_del(&dep
->pred_link
);
/* Helper for ppir_node_replace_child(): if `src` currently targets the
 * destination of `old_child` (as decided by ppir_node_target_equal), point
 * it at `new_child` with ppir_node_target_assign.  Sources that target
 * something else are left alone.
 */
431 static void _ppir_node_replace_child(ppir_src
*src
, ppir_node
*old_child
, ppir_node
*new_child
)
433 ppir_dest
*od
= ppir_node_get_dest(old_child
);
434 if (ppir_node_target_equal(src
, od
)) {
435 ppir_node_target_assign(src
, new_child
);
/* Rewrite every source of `parent` that reads `old_child` so that it reads
 * `new_child` instead.
 *
 * The set of sources depends on parent->type:
 *   - alu:          alu->src[0 .. num_src-1]
 *   - branch:       branch->src[0] and branch->src[1]
 *   - load:         the single load->src
 *   - load_texture: load_texture->num_src sources, fetched with
 *                   ppir_node_get_src()
 *   - store:        the single store->src
 * Only the source operands are rewritten here; dependency edges are not
 * touched by the visible code.
 *
 * NOTE(review): the ppir_debug("unknown node type ...") call is presumably
 * the default case of the switch; the case terminators are not visible in
 * this excerpt.
 */
439 void ppir_node_replace_child(ppir_node
*parent
, ppir_node
*old_child
, ppir_node
*new_child
)
441 switch (parent
->type
) {
442 case ppir_node_type_alu
:
444 ppir_alu_node
*alu
= ppir_node_to_alu(parent
);
445 for (int i
= 0; i
< alu
->num_src
; i
++)
446 _ppir_node_replace_child(alu
->src
+ i
, old_child
, new_child
);
449 case ppir_node_type_branch
:
451 ppir_branch_node
*branch
= ppir_node_to_branch(parent
);
452 for (int i
= 0; i
< 2; i
++)
453 _ppir_node_replace_child(branch
->src
+ i
, old_child
, new_child
);
456 case ppir_node_type_load
:
458 ppir_load_node
*load
= ppir_node_to_load(parent
);
459 _ppir_node_replace_child(&load
->src
, old_child
, new_child
);
462 case ppir_node_type_load_texture
:
464 ppir_load_texture_node
*load_texture
= ppir_node_to_load_texture(parent
);
465 for (int i
= 0; i
< load_texture
->num_src
; i
++)
466 _ppir_node_replace_child(ppir_node_get_src(parent
, i
), old_child
, new_child
);
469 case ppir_node_type_store
:
471 ppir_store_node
*store
= ppir_node_to_store(parent
);
472 _ppir_node_replace_child(&store
->src
, old_child
, new_child
);
476 ppir_debug("unknown node type in %s\n", __func__
);
/* Re-home an existing dependency edge onto a new predecessor.
 *
 * `dep` is unlinked from the successor list it is currently on, its pred
 * pointer is set to `new_pred`, and it is appended to new_pred->succ_list.
 * The edge's pred_link (its place in the successor's predecessor list) is
 * left as is, so the successor side of the edge does not change.
 */
481 void ppir_node_replace_pred(ppir_dep
*dep
, ppir_node
*new_pred
)
483 list_del(&dep
->succ_link
);
484 dep
->pred
= new_pred
;
485 list_addtail(&dep
->succ_link
, &new_pred
->succ_list
);
/* Search node's predecessor list for the dependency edge whose pred is
 * `pred`.  The two nodes' blocks are compared before the search.
 *
 * NOTE(review): the return statements are not visible in this excerpt;
 * presumably the matching dep is returned, and NULL when the blocks differ
 * or no edge matches -- confirm against the full file.
 */
488 ppir_dep
*ppir_dep_for_pred(ppir_node
*node
, ppir_node
*pred
)
493 if (node
->block
!= pred
->block
)
496 ppir_node_foreach_pred(node
, dep
) {
497 if (dep
->pred
== pred
)
/* Make every successor of `src` depend on, and read from, `dst` instead.
 *
 * For each dependency edge on src's successor list the edge is moved to
 * `dst` (ppir_node_replace_pred) and the successor's source operands that
 * referenced `src` are rewritten to reference `dst`
 * (ppir_node_replace_child).  The _safe iterator is needed because
 * ppir_node_replace_pred() unlinks the current edge from src's successor
 * list while the list is being walked.
 */
503 void ppir_node_replace_all_succ(ppir_node
*dst
, ppir_node
*src
)
505 ppir_node_foreach_succ_safe(src
, dep
) {
506 ppir_node_replace_pred(dep
, dst
);
507 ppir_node_replace_child(dep
->succ
, src
, dst
);
/* Detach `node` from the dependency graph and from its node list.
 *
 * All edges on both the successor and the predecessor side are removed with
 * ppir_node_remove_dep() (using the _safe iterators, since each removal
 * unlinks the edge being visited), then the node itself is unlinked through
 * node->list.
 *
 * NOTE(review): whether the node's memory is released afterwards is not
 * visible in this excerpt.
 */
511 void ppir_node_delete(ppir_node
*node
)
513 ppir_node_foreach_succ_safe(node
, dep
)
514 ppir_node_remove_dep(dep
);
516 ppir_node_foreach_pred_safe(node
, dep
)
517 ppir_node_remove_dep(dep
);
519 list_del(&node
->list
);
/* Debug helper: print a destination to stdout according to dest->type --
 * "ssa<N>" for an SSA value, "pipeline <N>" for a pipeline register, or
 * "reg <N>" for a register (using dest->reg->index).
 */
523 static void ppir_node_print_dest(ppir_dest
*dest
)
525 switch (dest
->type
) {
526 case ppir_target_ssa
:
527 printf("ssa%d", dest
->ssa
.index
);
529 case ppir_target_pipeline
:
530 printf("pipeline %d", dest
->pipeline
);
532 case ppir_target_register
:
533 printf("reg %d", dest
->reg
->index
);
/* Debug helper: print a source operand to stdout.
 *
 * SSA sources are printed either as "ssa node <index of src->node>" or as
 * "ssa idx <src->ssa->index>" (-1 when src->ssa is NULL); pipeline sources
 * are printed with or without the producing node's index; register sources
 * print src->reg->index.
 *
 * NOTE(review): the switch header and the conditions selecting between the
 * "with node" and "without node" variants are not visible in this excerpt;
 * presumably they test whether src->node is set -- confirm.
 */
538 static void ppir_node_print_src(ppir_src
*src
)
541 case ppir_target_ssa
: {
543 printf("ssa node %d", src
->node
->index
);
545 printf("ssa idx %d", src
->ssa
? src
->ssa
->index
: -1);
548 case ppir_target_pipeline
:
550 printf("pipeline %d node %d", src
->pipeline
, src
->node
->index
);
552 printf("pipeline %d", src
->pipeline
);
554 case ppir_target_register
:
555 printf("reg %d", src
->reg
->index
);
/* Debug helper: print `node` and, recursively, the nodes it depends on.
 *
 * The line for a node shows its index, the opcode name from ppir_op_infos
 * and the node's own name, followed by its destination and its sources.
 * A leading "+" marks a non-leaf node that has already been printed once.
 * The first time a node is visited its predecessors are printed with
 * `space + 2`, and the node is then flagged as printed so that its
 * predecessors are not expanded again.
 *
 * NOTE(review): the body of the initial `space` loop and the separators
 * printed between fields are not visible in this excerpt; `space` is
 * presumably the indentation width.
 */
560 static void ppir_node_print_node(ppir_node
*node
, int space
)
562 for (int i
= 0; i
< space
; i
++)
565 printf("%s%d: %s %s: ", node
->printed
&& !ppir_node_is_leaf(node
) ? "+" : "",
566 node
->index
, ppir_op_infos
[node
->op
].name
, node
->name
);
568 ppir_dest
*dest
= ppir_node_get_dest(node
);
571 ppir_node_print_dest(dest
);
574 if (ppir_node_get_src_num(node
) > 0) {
577 for (int i
= 0; i
< ppir_node_get_src_num(node
); i
++) {
578 ppir_node_print_src(ppir_node_get_src(node
, i
));
579 if (i
!= (ppir_node_get_src_num(node
) - 1))
584 if (!node
->printed
) {
585 ppir_node_foreach_pred(node
, dep
) {
586 ppir_node
*pred
= dep
->pred
;
587 ppir_node_print_node(pred
, space
+ 2);
590 node
->printed
= true;
/* Debug dump of the whole program as dependency trees, on stdout.
 *
 * The function first tests the LIMA_DEBUG_PP bit of lima_debug.  It then
 * clears the `printed` flag on every node of every block, and for each block
 * prints a block banner followed by the tree of every root node
 * (ppir_node_is_root), starting at indentation 0.  The dump is framed by the
 * "========prog========" and "====================" lines.
 *
 * NOTE(review): the statement guarded by the LIMA_DEBUG_PP test is not
 * visible in this excerpt; presumably an early return when the flag is off.
 */
594 void ppir_node_print_prog(ppir_compiler
*comp
)
596 if (!(lima_debug
& LIMA_DEBUG_PP
))
599 list_for_each_entry(ppir_block
, block
, &comp
->block_list
, list
) {
600 list_for_each_entry(ppir_node
, node
, &block
->node_list
, list
) {
601 node
->printed
= false;
605 printf("========prog========\n");
606 list_for_each_entry(ppir_block
, block
, &comp
->block_list
, list
) {
607 printf("-------block %3d-------\n", block
->index
);
608 list_for_each_entry(ppir_node
, node
, &block
->node_list
, list
) {
609 if (ppir_node_is_root(node
))
610 ppir_node_print_node(node
, 0);
613 printf("====================\n");
/* Create a copy of the constant node `node` inside `block`.
 *
 * A fresh ppir_op_const node is created (index -1, mask 0), appended to
 * block->node_list, and given the same constant count and values as the
 * original.  Its destination is set up as an SSA target with the original's
 * num_components and write_mask.  Returns the new node as a ppir_node
 * pointer.
 *
 * NOTE(review): any handling of a failed ppir_node_create() is not visible
 * in this excerpt.
 */
616 static ppir_node
*ppir_node_clone_const(ppir_block
*block
, ppir_node
*node
)
618 ppir_const_node
*cnode
= ppir_node_to_const(node
);
619 ppir_const_node
*new_cnode
= ppir_node_create(block
, ppir_op_const
, -1, 0);
624 list_addtail(&new_cnode
->node
.list
, &block
->node_list
);
626 new_cnode
->constant
.num
= cnode
->constant
.num
;
627 for (int i
= 0; i
< cnode
->constant
.num
; i
++) {
628 new_cnode
->constant
.value
[i
] = cnode
->constant
.value
[i
];
630 new_cnode
->dest
.type
= ppir_target_ssa
;
631 new_cnode
->dest
.ssa
.num_components
= cnode
->dest
.ssa
.num_components
;
632 new_cnode
->dest
.write_mask
= cnode
->dest
.write_mask
;
634 return &new_cnode
->node
;
/* Create a copy of the load node `node` inside `block`.
 *
 * A new node with the same opcode is created (index -1, mask 0) and appended
 * to block->node_list; num_components, index and the whole destination are
 * copied from the original.  The original's source 0 is then mirrored onto
 * the copy with num_src set to 1: an SSA source is re-assigned to the same
 * producer node and a ppir_dep_src dependency on it is added; a register
 * source copies the type and register and leaves src.node NULL.  Per the
 * inline comment, load nodes cannot consume pipeline registers.  Returns
 * the new node as a ppir_node pointer.
 *
 * NOTE(review): the return type line, the guard around the source handling
 * and the switch header are not visible in this excerpt.
 */
638 ppir_node_clone_load(ppir_block
*block
, ppir_node
*node
)
640 ppir_load_node
*load_node
= ppir_node_to_load(node
);
641 ppir_load_node
*new_lnode
= ppir_node_create(block
, node
->op
, -1, 0);
646 list_addtail(&new_lnode
->node
.list
, &block
->node_list
);
648 new_lnode
->num_components
= load_node
->num_components
;
649 new_lnode
->index
= load_node
->index
;
651 ppir_dest
*dest
= ppir_node_get_dest(node
);
652 new_lnode
->dest
= *dest
;
654 ppir_src
*src
= ppir_node_get_src(node
, 0);
656 new_lnode
->num_src
= 1;
658 case ppir_target_ssa
:
659 ppir_node_target_assign(&new_lnode
->src
, src
->node
);
660 ppir_node_add_dep(&new_lnode
->node
, src
->node
, ppir_dep_src
);
662 case ppir_target_register
:
663 new_lnode
->src
.type
= src
->type
;
664 new_lnode
->src
.reg
= src
->reg
;
665 new_lnode
->src
.node
= NULL
;
668 /* Load nodes can't consume pipeline registers */
673 return &new_lnode
->node
;
/* Delete `node` when none of its successors reads its destination any more.
 *
 * Every source of every successor is compared against node's destination
 * with ppir_node_target_equal(); ppir_node_delete(node) is the last visible
 * statement.
 *
 * NOTE(review): the return type, the action taken when a matching source is
 * found and any check on `dest` are not visible in this excerpt; presumably
 * the function returns early, keeping the node, as soon as one use is found
 * -- confirm.  `block` is not referenced by the visible lines.
 */
677 ppir_delete_if_orphan(ppir_block
*block
, ppir_node
*node
)
679 ppir_dest
*dest
= ppir_node_get_dest(node
);
683 ppir_node_foreach_succ_safe(node
, dep
) {
684 ppir_node
*succ
= dep
->succ
;
685 for (int i
= 0; i
< ppir_node_get_src_num(succ
); i
++) {
686 ppir_src
*src
= ppir_node_get_src(succ
, i
);
689 if (ppir_node_target_equal(src
, dest
))
694 ppir_node_delete(node
);
/* Clone `node` into `block`, dispatching on the kind of node.
 *
 * Constants go through ppir_node_clone_const(); the load opcodes
 * load_uniform, load_varying, load_temp, load_coords and load_coords_reg go
 * through ppir_node_clone_load().
 *
 * NOTE(review): the switch header, the case label in front of the
 * clone_const call and the handling of all other opcodes are not visible in
 * this excerpt.
 */
697 ppir_node
*ppir_node_clone(ppir_block
*block
, ppir_node
*node
)
701 return ppir_node_clone_const(block
, node
);
702 case ppir_op_load_uniform
:
703 case ppir_op_load_varying
:
704 case ppir_op_load_temp
:
705 case ppir_op_load_coords
:
706 case ppir_op_load_coords_reg
:
707 return ppir_node_clone_load(block
, node
);
/* Insert a mov between `node` and all of its current successors.
 *
 * A ppir_op_mov node is created in node's block with `node` as its first
 * source and an identity swizzle (component s reads component s).  All of
 * node's successors are redirected to the mov with
 * ppir_node_replace_all_succ(), a ppir_dep_src dependency mov -> node is
 * added afterwards, and the mov is linked into the node list relative to
 * node->list with list_addtail().
 *
 * NOTE(review): the set-up of the mov's destination (the `dest` local is
 * fetched but its use is not shown), the num_src assignment and the return
 * statement are not visible in this excerpt.
 */
713 ppir_node
*ppir_node_insert_mov(ppir_node
*node
)
715 ppir_node
*move
= ppir_node_create(node
->block
, ppir_op_mov
, -1, 0);
719 ppir_dest
*dest
= ppir_node_get_dest(node
);
720 ppir_alu_node
*alu
= ppir_node_to_alu(move
);
723 ppir_node_target_assign(alu
->src
, node
);
725 for (int s
= 0; s
< 4; s
++)
726 alu
->src
->swizzle
[s
] = s
;
728 ppir_node_replace_all_succ(move
, node
);
729 ppir_node_add_dep(move
, node
, ppir_dep_src
);
730 list_addtail(&move
->list
, &node
->list
);
/* Like ppir_node_insert_mov(), but also fixes up users in other blocks.
 *
 * The mov is first inserted after `old` within its own block.  Then every
 * block of the compiler is walked and any source operand whose producing
 * node is `old` is re-assigned to the mov.
 *
 * NOTE(review): the statement guarded by `old->block == block` and the
 * return statement are not visible in this excerpt; presumably old's own
 * block is skipped because ppir_node_insert_mov() already handled it --
 * confirm.
 */
735 ppir_node
*ppir_node_insert_mov_all_blocks(ppir_node
*old
)
737 ppir_node
*move
= ppir_node_insert_mov(old
);
738 ppir_compiler
*comp
= old
->block
->comp
;
740 list_for_each_entry(ppir_block
, block
, &comp
->block_list
, list
) {
741 if (old
->block
== block
)
743 list_for_each_entry_safe(ppir_node
, node
, &block
->node_list
, list
) {
744 for (int i
= 0; i
< ppir_node_get_src_num(node
); i
++){
745 ppir_src
*src
= ppir_node_get_src(node
, i
);
748 if (src
->node
== old
)
749 ppir_node_target_assign(src
, move
);
756 bool ppir_node_has_single_src_succ(ppir_node
*node
)
758 if (list_is_singular(&node
->succ_list
) &&
759 list_first_entry(&node
->succ_list
,
760 ppir_dep
, succ_link
)->type
== ppir_dep_src
)
764 ppir_node_foreach_succ(node
, dep
) {
765 if (dep
->type
!= ppir_dep_src
)