v3d: Use ldunif instructions for uniforms.
[mesa.git] / src / broadcom / compiler / vir_dump.c
1 /*
2 * Copyright © 2016-2017 Broadcom
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21 * IN THE SOFTWARE.
22 */
23
24 #include "broadcom/common/v3d_device_info.h"
25 #include "v3d_compiler.h"
26
27 /* Prints a human-readable description of the uniform reference. */
28 void
29 vir_dump_uniform(enum quniform_contents contents,
30 uint32_t data)
31 {
32 static const char *quniform_names[] = {
33 [QUNIFORM_ALPHA_REF] = "alpha_ref",
34 [QUNIFORM_VIEWPORT_X_SCALE] = "vp_x_scale",
35 [QUNIFORM_VIEWPORT_Y_SCALE] = "vp_y_scale",
36 [QUNIFORM_VIEWPORT_Z_OFFSET] = "vp_z_offset",
37 [QUNIFORM_VIEWPORT_Z_SCALE] = "vp_z_scale",
38 [QUNIFORM_SHARED_OFFSET] = "shared_offset",
39 };
40
41 switch (contents) {
42 case QUNIFORM_CONSTANT:
43 fprintf(stderr, "0x%08x / %f", data, uif(data));
44 break;
45
46 case QUNIFORM_UNIFORM:
47 fprintf(stderr, "push[%d]", data);
48 break;
49
50 case QUNIFORM_TEXTURE_CONFIG_P1:
51 fprintf(stderr, "tex[%d].p1", data);
52 break;
53
54 case QUNIFORM_TMU_CONFIG_P0:
55 fprintf(stderr, "tex[%d].p0 | 0x%x",
56 v3d_tmu_config_data_get_unit(data),
57 v3d_tmu_config_data_get_value(data));
58 break;
59
60 case QUNIFORM_TMU_CONFIG_P1:
61 fprintf(stderr, "tex[%d].p1 | 0x%x",
62 v3d_tmu_config_data_get_unit(data),
63 v3d_tmu_config_data_get_value(data));
64 break;
65
66 case QUNIFORM_IMAGE_TMU_CONFIG_P0:
67 fprintf(stderr, "img[%d].p0 | 0x%x",
68 v3d_tmu_config_data_get_unit(data),
69 v3d_tmu_config_data_get_value(data));
70 break;
71
72 case QUNIFORM_TEXTURE_WIDTH:
73 fprintf(stderr, "tex[%d].width", data);
74 break;
75 case QUNIFORM_TEXTURE_HEIGHT:
76 fprintf(stderr, "tex[%d].height", data);
77 break;
78 case QUNIFORM_TEXTURE_DEPTH:
79 fprintf(stderr, "tex[%d].depth", data);
80 break;
81 case QUNIFORM_TEXTURE_ARRAY_SIZE:
82 fprintf(stderr, "tex[%d].array_size", data);
83 break;
84 case QUNIFORM_TEXTURE_LEVELS:
85 fprintf(stderr, "tex[%d].levels", data);
86 break;
87
88 case QUNIFORM_IMAGE_WIDTH:
89 fprintf(stderr, "img[%d].width", data);
90 break;
91 case QUNIFORM_IMAGE_HEIGHT:
92 fprintf(stderr, "img[%d].height", data);
93 break;
94 case QUNIFORM_IMAGE_DEPTH:
95 fprintf(stderr, "img[%d].depth", data);
96 break;
97 case QUNIFORM_IMAGE_ARRAY_SIZE:
98 fprintf(stderr, "img[%d].array_size", data);
99 break;
100
101 case QUNIFORM_UBO_ADDR:
102 fprintf(stderr, "ubo[%d]", data);
103 break;
104
105 case QUNIFORM_SSBO_OFFSET:
106 fprintf(stderr, "ssbo[%d]", data);
107 break;
108
109 case QUNIFORM_GET_BUFFER_SIZE:
110 fprintf(stderr, "ssbo_size[%d]", data);
111 break;
112
113 case QUNIFORM_NUM_WORK_GROUPS:
114 fprintf(stderr, "num_wg.%c", data < 3 ? "xyz"[data] : '?');
115 break;
116
117 default:
118 if (quniform_contents_is_texture_p0(contents)) {
119 fprintf(stderr, "tex[%d].p0: 0x%08x",
120 contents - QUNIFORM_TEXTURE_CONFIG_P0_0,
121 data);
122 } else if (contents < ARRAY_SIZE(quniform_names) &&
123 quniform_names[contents]) {
124 fprintf(stderr, "%s",
125 quniform_names[contents]);
126 } else {
127 fprintf(stderr, "%d / 0x%08x", contents, data);
128 }
129 }
130 }
131
132 static void
133 vir_print_reg(struct v3d_compile *c, const struct qinst *inst,
134 struct qreg reg)
135 {
136 static const char *files[] = {
137 [QFILE_TEMP] = "t",
138 [QFILE_TLB] = "tlb",
139 [QFILE_TLBU] = "tlbu",
140 };
141
142 switch (reg.file) {
143
144 case QFILE_NULL:
145 fprintf(stderr, "null");
146 break;
147
148 case QFILE_LOAD_IMM:
149 fprintf(stderr, "0x%08x (%f)", reg.index, uif(reg.index));
150 break;
151
152 case QFILE_REG:
153 fprintf(stderr, "rf%d", reg.index);
154 break;
155
156 case QFILE_MAGIC:
157 fprintf(stderr, "%s", v3d_qpu_magic_waddr_name(reg.index));
158 break;
159
160 case QFILE_SMALL_IMM: {
161 uint32_t unpacked;
162 bool ok = v3d_qpu_small_imm_unpack(c->devinfo,
163 inst->qpu.raddr_b,
164 &unpacked);
165 assert(ok); (void) ok;
166
167 if ((int)inst->qpu.raddr_b >= -16 &&
168 (int)inst->qpu.raddr_b <= 15)
169 fprintf(stderr, "%d", unpacked);
170 else
171 fprintf(stderr, "%f", uif(unpacked));
172 break;
173 }
174
175 case QFILE_VPM:
176 fprintf(stderr, "vpm%d.%d",
177 reg.index / 4, reg.index % 4);
178 break;
179
180 case QFILE_TLB:
181 case QFILE_TLBU:
182 fprintf(stderr, "%s", files[reg.file]);
183 break;
184
185 default:
186 fprintf(stderr, "%s%d", files[reg.file], reg.index);
187 break;
188 }
189 }
190
191 static void
192 vir_dump_sig_addr(const struct v3d_device_info *devinfo,
193 const struct v3d_qpu_instr *instr)
194 {
195 if (devinfo->ver < 41)
196 return;
197
198 if (!instr->sig_magic)
199 fprintf(stderr, ".rf%d", instr->sig_addr);
200 else {
201 const char *name = v3d_qpu_magic_waddr_name(instr->sig_addr);
202 if (name)
203 fprintf(stderr, ".%s", name);
204 else
205 fprintf(stderr, ".UNKNOWN%d", instr->sig_addr);
206 }
207 }
208
209 static void
210 vir_dump_sig(struct v3d_compile *c, struct qinst *inst)
211 {
212 struct v3d_qpu_sig *sig = &inst->qpu.sig;
213
214 if (sig->thrsw)
215 fprintf(stderr, "; thrsw");
216 if (sig->ldvary) {
217 fprintf(stderr, "; ldvary");
218 vir_dump_sig_addr(c->devinfo, &inst->qpu);
219 }
220 if (sig->ldvpm)
221 fprintf(stderr, "; ldvpm");
222 if (sig->ldtmu) {
223 fprintf(stderr, "; ldtmu");
224 vir_dump_sig_addr(c->devinfo, &inst->qpu);
225 }
226 if (sig->ldtlb) {
227 fprintf(stderr, "; ldtlb");
228 vir_dump_sig_addr(c->devinfo, &inst->qpu);
229 }
230 if (sig->ldtlbu) {
231 fprintf(stderr, "; ldtlbu");
232 vir_dump_sig_addr(c->devinfo, &inst->qpu);
233 }
234 if (sig->ldunif)
235 fprintf(stderr, "; ldunif");
236 if (sig->ldunifrf) {
237 fprintf(stderr, "; ldunifrf");
238 vir_dump_sig_addr(c->devinfo, &inst->qpu);
239 }
240 if (sig->ldunifa)
241 fprintf(stderr, "; ldunifa");
242 if (sig->ldunifarf) {
243 fprintf(stderr, "; ldunifarf");
244 vir_dump_sig_addr(c->devinfo, &inst->qpu);
245 }
246 if (sig->wrtmuc)
247 fprintf(stderr, "; wrtmuc");
248 }
249
250 static void
251 vir_dump_alu(struct v3d_compile *c, struct qinst *inst)
252 {
253 struct v3d_qpu_instr *instr = &inst->qpu;
254 int nsrc = vir_get_nsrc(inst);
255 enum v3d_qpu_input_unpack unpack[2];
256
257 if (inst->qpu.alu.add.op != V3D_QPU_A_NOP) {
258 fprintf(stderr, "%s", v3d_qpu_add_op_name(instr->alu.add.op));
259 fprintf(stderr, "%s", v3d_qpu_cond_name(instr->flags.ac));
260 fprintf(stderr, "%s", v3d_qpu_pf_name(instr->flags.apf));
261 fprintf(stderr, "%s", v3d_qpu_uf_name(instr->flags.auf));
262 fprintf(stderr, " ");
263
264 vir_print_reg(c, inst, inst->dst);
265 fprintf(stderr, "%s", v3d_qpu_pack_name(instr->alu.add.output_pack));
266
267 unpack[0] = instr->alu.add.a_unpack;
268 unpack[1] = instr->alu.add.b_unpack;
269 } else {
270 fprintf(stderr, "%s", v3d_qpu_mul_op_name(instr->alu.mul.op));
271 fprintf(stderr, "%s", v3d_qpu_cond_name(instr->flags.mc));
272 fprintf(stderr, "%s", v3d_qpu_pf_name(instr->flags.mpf));
273 fprintf(stderr, "%s", v3d_qpu_uf_name(instr->flags.muf));
274 fprintf(stderr, " ");
275
276 vir_print_reg(c, inst, inst->dst);
277 fprintf(stderr, "%s", v3d_qpu_pack_name(instr->alu.mul.output_pack));
278
279 unpack[0] = instr->alu.mul.a_unpack;
280 unpack[1] = instr->alu.mul.b_unpack;
281 }
282
283 for (int i = 0; i < nsrc; i++) {
284 fprintf(stderr, ", ");
285 vir_print_reg(c, inst, inst->src[i]);
286 fprintf(stderr, "%s", v3d_qpu_unpack_name(unpack[i]));
287 }
288
289 vir_dump_sig(c, inst);
290 }
291
292 void
293 vir_dump_inst(struct v3d_compile *c, struct qinst *inst)
294 {
295 struct v3d_qpu_instr *instr = &inst->qpu;
296
297 switch (inst->qpu.type) {
298 case V3D_QPU_INSTR_TYPE_ALU:
299 vir_dump_alu(c, inst);
300 break;
301 case V3D_QPU_INSTR_TYPE_BRANCH:
302 fprintf(stderr, "b");
303 if (instr->branch.ub)
304 fprintf(stderr, "u");
305
306 fprintf(stderr, "%s",
307 v3d_qpu_branch_cond_name(instr->branch.cond));
308 fprintf(stderr, "%s", v3d_qpu_msfign_name(instr->branch.msfign));
309
310 switch (instr->branch.bdi) {
311 case V3D_QPU_BRANCH_DEST_ABS:
312 fprintf(stderr, " zero_addr+0x%08x", instr->branch.offset);
313 break;
314
315 case V3D_QPU_BRANCH_DEST_REL:
316 fprintf(stderr, " %d", instr->branch.offset);
317 break;
318
319 case V3D_QPU_BRANCH_DEST_LINK_REG:
320 fprintf(stderr, " lri");
321 break;
322
323 case V3D_QPU_BRANCH_DEST_REGFILE:
324 fprintf(stderr, " rf%d", instr->branch.raddr_a);
325 break;
326 }
327
328 if (instr->branch.ub) {
329 switch (instr->branch.bdu) {
330 case V3D_QPU_BRANCH_DEST_ABS:
331 fprintf(stderr, ", a:unif");
332 break;
333
334 case V3D_QPU_BRANCH_DEST_REL:
335 fprintf(stderr, ", r:unif");
336 break;
337
338 case V3D_QPU_BRANCH_DEST_LINK_REG:
339 fprintf(stderr, ", lri");
340 break;
341
342 case V3D_QPU_BRANCH_DEST_REGFILE:
343 fprintf(stderr, ", rf%d", instr->branch.raddr_a);
344 break;
345 }
346 }
347 break;
348 }
349
350 if (vir_has_uniform(inst)) {
351 fprintf(stderr, " (");
352 vir_dump_uniform(c->uniform_contents[inst->uniform],
353 c->uniform_data[inst->uniform]);
354 fprintf(stderr, ")");
355 }
356 }
357
358 void
359 vir_dump(struct v3d_compile *c)
360 {
361 int ip = 0;
362
363 vir_for_each_block(block, c) {
364 fprintf(stderr, "BLOCK %d:\n", block->index);
365 vir_for_each_inst(inst, block) {
366 if (c->live_intervals_valid) {
367 bool first = true;
368
369 for (int i = 0; i < c->num_temps; i++) {
370 if (c->temp_start[i] != ip)
371 continue;
372
373 if (first) {
374 first = false;
375 } else {
376 fprintf(stderr, ", ");
377 }
378 fprintf(stderr, "S%4d", i);
379 }
380
381 if (first)
382 fprintf(stderr, " ");
383 else
384 fprintf(stderr, " ");
385 }
386
387 if (c->live_intervals_valid) {
388 bool first = true;
389
390 for (int i = 0; i < c->num_temps; i++) {
391 if (c->temp_end[i] != ip)
392 continue;
393
394 if (first) {
395 first = false;
396 } else {
397 fprintf(stderr, ", ");
398 }
399 fprintf(stderr, "E%4d", i);
400 }
401
402 if (first)
403 fprintf(stderr, " ");
404 else
405 fprintf(stderr, " ");
406 }
407
408 vir_dump_inst(c, inst);
409 fprintf(stderr, "\n");
410 ip++;
411 }
412 if (block->successors[1]) {
413 fprintf(stderr, "-> BLOCK %d, %d\n",
414 block->successors[0]->index,
415 block->successors[1]->index);
416 } else if (block->successors[0]) {
417 fprintf(stderr, "-> BLOCK %d\n",
418 block->successors[0]->index);
419 }
420 }
421 }