4 #include "llvm-c/Disassembler.h"
5 #include "ac_llvm_util.h"
7 #include <llvm/ADT/StringRef.h>
11 void print_asm(Program
*program
, std::vector
<uint32_t>& binary
,
12 unsigned exec_size
, enum radeon_family family
, std::ostream
& out
)
14 std::vector
<bool> referenced_blocks(program
->blocks
.size());
15 referenced_blocks
[0] = true;
16 for (Block
& block
: program
->blocks
) {
17 for (unsigned succ
: block
.linear_succs
)
18 referenced_blocks
[succ
] = true;
21 std::vector
<std::tuple
<uint64_t, llvm::StringRef
, uint8_t>> symbols
;
22 std::vector
<std::array
<char,16>> block_names
;
23 block_names
.reserve(program
->blocks
.size());
24 for (Block
& block
: program
->blocks
) {
25 if (!referenced_blocks
[block
.index
])
27 std::array
<char, 16> name
;
28 sprintf(name
.data(), "BB%u", block
.index
);
29 block_names
.push_back(name
);
30 symbols
.emplace_back(block
.offset
* 4, llvm::StringRef(block_names
[block_names
.size() - 1].data()), 0);
33 LLVMDisasmContextRef disasm
= LLVMCreateDisasmCPU("amdgcn-mesa-mesa3d",
34 ac_get_llvm_processor_name(family
),
35 &symbols
, 0, NULL
, NULL
);
40 unsigned next_block
= 0;
41 while (pos
< exec_size
) {
42 while (next_block
< program
->blocks
.size() && pos
== program
->blocks
[next_block
].offset
) {
43 if (referenced_blocks
[next_block
])
44 out
<< "BB" << std::dec
<< next_block
<< ":" << std::endl
;
48 size_t l
= LLVMDisasmInstruction(disasm
, (uint8_t *) &binary
[pos
],
49 (exec_size
- pos
) * sizeof(uint32_t), pos
* 4,
50 outline
, sizeof(outline
));
53 const int align_width
= 60;
54 if (program
->chip_class
== GFX9
&& !l
&& ((binary
[pos
] & 0xffff8000) == 0xd1348000)) { /* not actually an invalid instruction */
55 out
<< std::left
<< std::setw(align_width
) << std::setfill(' ') << "\tv_add_u32_e64 + clamp";
58 out
<< std::left
<< std::setw(align_width
) << std::setfill(' ') << "(invalid instruction)";
62 out
<< std::left
<< std::setw(align_width
) << std::setfill(' ') << outline
;
64 new_pos
= pos
+ l
/ 4;
69 for (; pos
< new_pos
; pos
++)
70 out
<< " " << std::setfill('0') << std::setw(8) << std::hex
<< binary
[pos
];
73 out
<< std::setfill(' ') << std::setw(0) << std::dec
;
74 assert(next_block
== program
->blocks
.size());
76 LLVMDisasmDispose(disasm
);
78 if (program
->constant_data
.size()) {
79 out
<< std::endl
<< "/* constant data */" << std::endl
;
80 for (unsigned i
= 0; i
< program
->constant_data
.size(); i
+= 32) {
81 out
<< '[' << std::setw(6) << std::setfill('0') << std::dec
<< i
<< ']';
82 unsigned line_size
= std::min
<size_t>(program
->constant_data
.size() - i
, 32);
83 for (unsigned j
= 0; j
< line_size
; j
+= 4) {
84 unsigned size
= std::min
<size_t>(program
->constant_data
.size() - (i
+ j
), 4);
86 memcpy(&v
, &program
->constant_data
[i
+ j
], size
);
87 out
<< " " << std::setw(8) << std::setfill('0') << std::hex
<< v
;
93 out
<< std::setfill(' ') << std::setw(0) << std::dec
;
96 /* Invalid instructions usually lead to GPU hangs, which can make
97 * getting the actual invalid instruction hard. Abort here so that we
98 * can find the problem.