2 * Copyright © 2008 Keith Packard
4 * Permission to use, copy, modify, distribute, and sell this software and its
5 * documentation for any purpose is hereby granted without fee, provided that
6 * the above copyright notice appear in all copies and that both that copyright
7 * notice and this permission notice appear in supporting documentation, and
8 * that the name of the copyright holders not be used in advertising or
9 * publicity pertaining to distribution of the software without specific,
10 * written prior permission. The copyright holders make no representations
11 * about the suitability of this software for any purpose. It is provided "as
12 * is" without express or implied warranty.
14 * THE COPYRIGHT HOLDERS DISCLAIM ALL WARRANTIES WITH REGARD TO THIS SOFTWARE,
15 * INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS, IN NO
16 * EVENT SHALL THE COPYRIGHT HOLDERS BE LIABLE FOR ANY SPECIAL, INDIRECT OR
17 * CONSEQUENTIAL DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE,
18 * DATA OR PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER
19 * TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE
30 #include "main/mtypes.h"
32 #include "brw_context.h"
33 #include "brw_defines.h"
35 const struct opcode_desc opcode_descs
[128] = {
36 [BRW_OPCODE_MOV
] = { .name
= "mov", .nsrc
= 1, .ndst
= 1 },
37 [BRW_OPCODE_FRC
] = { .name
= "frc", .nsrc
= 1, .ndst
= 1 },
38 [BRW_OPCODE_RNDU
] = { .name
= "rndu", .nsrc
= 1, .ndst
= 1 },
39 [BRW_OPCODE_RNDD
] = { .name
= "rndd", .nsrc
= 1, .ndst
= 1 },
40 [BRW_OPCODE_RNDE
] = { .name
= "rnde", .nsrc
= 1, .ndst
= 1 },
41 [BRW_OPCODE_RNDZ
] = { .name
= "rndz", .nsrc
= 1, .ndst
= 1 },
42 [BRW_OPCODE_NOT
] = { .name
= "not", .nsrc
= 1, .ndst
= 1 },
43 [BRW_OPCODE_LZD
] = { .name
= "lzd", .nsrc
= 1, .ndst
= 1 },
45 [BRW_OPCODE_MUL
] = { .name
= "mul", .nsrc
= 2, .ndst
= 1 },
46 [BRW_OPCODE_MAC
] = { .name
= "mac", .nsrc
= 2, .ndst
= 1 },
47 [BRW_OPCODE_MACH
] = { .name
= "mach", .nsrc
= 2, .ndst
= 1 },
48 [BRW_OPCODE_LINE
] = { .name
= "line", .nsrc
= 2, .ndst
= 1 },
49 [BRW_OPCODE_PLN
] = { .name
= "pln", .nsrc
= 2, .ndst
= 1 },
50 [BRW_OPCODE_MAD
] = { .name
= "mad", .nsrc
= 3, .ndst
= 1 },
51 [BRW_OPCODE_SAD2
] = { .name
= "sad2", .nsrc
= 2, .ndst
= 1 },
52 [BRW_OPCODE_SADA2
] = { .name
= "sada2", .nsrc
= 2, .ndst
= 1 },
53 [BRW_OPCODE_DP4
] = { .name
= "dp4", .nsrc
= 2, .ndst
= 1 },
54 [BRW_OPCODE_DPH
] = { .name
= "dph", .nsrc
= 2, .ndst
= 1 },
55 [BRW_OPCODE_DP3
] = { .name
= "dp3", .nsrc
= 2, .ndst
= 1 },
56 [BRW_OPCODE_DP2
] = { .name
= "dp2", .nsrc
= 2, .ndst
= 1 },
57 [BRW_OPCODE_MATH
] = { .name
= "math", .nsrc
= 2, .ndst
= 1 },
59 [BRW_OPCODE_AVG
] = { .name
= "avg", .nsrc
= 2, .ndst
= 1 },
60 [BRW_OPCODE_ADD
] = { .name
= "add", .nsrc
= 2, .ndst
= 1 },
61 [BRW_OPCODE_SEL
] = { .name
= "sel", .nsrc
= 2, .ndst
= 1 },
62 [BRW_OPCODE_AND
] = { .name
= "and", .nsrc
= 2, .ndst
= 1 },
63 [BRW_OPCODE_OR
] = { .name
= "or", .nsrc
= 2, .ndst
= 1 },
64 [BRW_OPCODE_XOR
] = { .name
= "xor", .nsrc
= 2, .ndst
= 1 },
65 [BRW_OPCODE_SHR
] = { .name
= "shr", .nsrc
= 2, .ndst
= 1 },
66 [BRW_OPCODE_SHL
] = { .name
= "shl", .nsrc
= 2, .ndst
= 1 },
67 [BRW_OPCODE_ASR
] = { .name
= "asr", .nsrc
= 2, .ndst
= 1 },
68 [BRW_OPCODE_CMP
] = { .name
= "cmp", .nsrc
= 2, .ndst
= 1 },
69 [BRW_OPCODE_CMPN
] = { .name
= "cmpn", .nsrc
= 2, .ndst
= 1 },
71 [BRW_OPCODE_SEND
] = { .name
= "send", .nsrc
= 1, .ndst
= 1 },
72 [BRW_OPCODE_SENDC
] = { .name
= "sendc", .nsrc
= 1, .ndst
= 1 },
73 [BRW_OPCODE_NOP
] = { .name
= "nop", .nsrc
= 0, .ndst
= 0 },
74 [BRW_OPCODE_JMPI
] = { .name
= "jmpi", .nsrc
= 0, .ndst
= 0 },
75 [BRW_OPCODE_IF
] = { .name
= "if", .nsrc
= 2, .ndst
= 0 },
76 [BRW_OPCODE_IFF
] = { .name
= "iff", .nsrc
= 2, .ndst
= 1 },
77 [BRW_OPCODE_WHILE
] = { .name
= "while", .nsrc
= 2, .ndst
= 0 },
78 [BRW_OPCODE_ELSE
] = { .name
= "else", .nsrc
= 2, .ndst
= 0 },
79 [BRW_OPCODE_BREAK
] = { .name
= "break", .nsrc
= 2, .ndst
= 0 },
80 [BRW_OPCODE_CONTINUE
] = { .name
= "cont", .nsrc
= 1, .ndst
= 0 },
81 [BRW_OPCODE_HALT
] = { .name
= "halt", .nsrc
= 1, .ndst
= 0 },
82 [BRW_OPCODE_MSAVE
] = { .name
= "msave", .nsrc
= 1, .ndst
= 1 },
83 [BRW_OPCODE_PUSH
] = { .name
= "push", .nsrc
= 1, .ndst
= 1 },
84 [BRW_OPCODE_MRESTORE
] = { .name
= "mrest", .nsrc
= 1, .ndst
= 1 },
85 [BRW_OPCODE_POP
] = { .name
= "pop", .nsrc
= 2, .ndst
= 0 },
86 [BRW_OPCODE_WAIT
] = { .name
= "wait", .nsrc
= 1, .ndst
= 0 },
87 [BRW_OPCODE_DO
] = { .name
= "do", .nsrc
= 0, .ndst
= 0 },
88 [BRW_OPCODE_ENDIF
] = { .name
= "endif", .nsrc
= 2, .ndst
= 0 },
90 static const struct opcode_desc
*opcode
= opcode_descs
;
92 static const char * const conditional_modifier
[16] = {
93 [BRW_CONDITIONAL_NONE
] = "",
94 [BRW_CONDITIONAL_Z
] = ".e",
95 [BRW_CONDITIONAL_NZ
] = ".ne",
96 [BRW_CONDITIONAL_G
] = ".g",
97 [BRW_CONDITIONAL_GE
] = ".ge",
98 [BRW_CONDITIONAL_L
] = ".l",
99 [BRW_CONDITIONAL_LE
] = ".le",
100 [BRW_CONDITIONAL_R
] = ".r",
101 [BRW_CONDITIONAL_O
] = ".o",
102 [BRW_CONDITIONAL_U
] = ".u",
105 static const char * const negate
[2] = {
110 static const char * const _abs
[2] = {
115 static const char * const vert_stride
[16] = {
126 static const char * const width
[8] = {
134 static const char * const horiz_stride
[4] = {
141 static const char * const chan_sel
[4] = {
148 static const char * const debug_ctrl
[2] = {
153 static const char * const saturate
[2] = {
158 static const char * const accwr
[2] = {
163 static const char * const wectrl
[2] = {
168 static const char * const exec_size
[8] = {
177 static const char * const pred_inv
[2] = {
182 static const char * const pred_ctrl_align16
[16] = {
192 static const char * const pred_ctrl_align1
[16] = {
206 static const char * const thread_ctrl
[4] = {
211 static const char * const compr_ctrl
[4] = {
218 static const char * const dep_ctrl
[4] = {
222 [3] = "NoDDClr,NoDDChk",
225 static const char * const mask_ctrl
[4] = {
230 static const char * const access_mode
[2] = {
235 static const char * const reg_encoding
[8] = {
245 const int reg_type_size
[8] = {
255 static const char * const reg_file
[4] = {
262 static const char * const writemask
[16] = {
281 static const char * const end_of_thread
[2] = {
286 static const char * const target_function
[16] = {
287 [BRW_SFID_NULL
] = "null",
288 [BRW_SFID_MATH
] = "math",
289 [BRW_SFID_SAMPLER
] = "sampler",
290 [BRW_SFID_MESSAGE_GATEWAY
] = "gateway",
291 [BRW_SFID_DATAPORT_READ
] = "read",
292 [BRW_SFID_DATAPORT_WRITE
] = "write",
293 [BRW_SFID_URB
] = "urb",
294 [BRW_SFID_THREAD_SPAWNER
] = "thread_spawner"
297 static const char * const target_function_gen6
[16] = {
298 [BRW_SFID_NULL
] = "null",
299 [BRW_SFID_MATH
] = "math",
300 [BRW_SFID_SAMPLER
] = "sampler",
301 [BRW_SFID_MESSAGE_GATEWAY
] = "gateway",
302 [BRW_SFID_URB
] = "urb",
303 [BRW_SFID_THREAD_SPAWNER
] = "thread_spawner",
304 [GEN6_SFID_DATAPORT_SAMPLER_CACHE
] = "sampler",
305 [GEN6_SFID_DATAPORT_RENDER_CACHE
] = "render",
306 [GEN6_SFID_DATAPORT_CONSTANT_CACHE
] = "const",
307 [GEN7_SFID_DATAPORT_DATA_CACHE
] = "data"
310 static const char * const dp_rc_msg_type_gen6
[16] = {
311 [BRW_DATAPORT_READ_MESSAGE_OWORD_BLOCK_READ
] = "OWORD block read",
312 [GEN6_DATAPORT_READ_MESSAGE_RENDER_UNORM_READ
] = "RT UNORM read",
313 [GEN6_DATAPORT_READ_MESSAGE_OWORD_DUAL_BLOCK_READ
] = "OWORD dual block read",
314 [GEN6_DATAPORT_READ_MESSAGE_MEDIA_BLOCK_READ
] = "media block read",
315 [GEN6_DATAPORT_READ_MESSAGE_OWORD_UNALIGN_BLOCK_READ
] = "OWORD unaligned block read",
316 [GEN6_DATAPORT_READ_MESSAGE_DWORD_SCATTERED_READ
] = "DWORD scattered read",
317 [GEN6_DATAPORT_WRITE_MESSAGE_DWORD_ATOMIC_WRITE
] = "DWORD atomic write",
318 [GEN6_DATAPORT_WRITE_MESSAGE_OWORD_BLOCK_WRITE
] = "OWORD block write",
319 [GEN6_DATAPORT_WRITE_MESSAGE_OWORD_DUAL_BLOCK_WRITE
] = "OWORD dual block write",
320 [GEN6_DATAPORT_WRITE_MESSAGE_MEDIA_BLOCK_WRITE
] = "media block write",
321 [GEN6_DATAPORT_WRITE_MESSAGE_DWORD_SCATTERED_WRITE
] = "DWORD scattered write",
322 [GEN6_DATAPORT_WRITE_MESSAGE_RENDER_TARGET_WRITE
] = "RT write",
323 [GEN6_DATAPORT_WRITE_MESSAGE_STREAMED_VB_WRITE
] = "streamed VB write",
324 [GEN6_DATAPORT_WRITE_MESSAGE_RENDER_TARGET_UNORM_WRITE
] = "RT UNORMc write",
327 static const char * const math_function
[16] = {
328 [BRW_MATH_FUNCTION_INV
] = "inv",
329 [BRW_MATH_FUNCTION_LOG
] = "log",
330 [BRW_MATH_FUNCTION_EXP
] = "exp",
331 [BRW_MATH_FUNCTION_SQRT
] = "sqrt",
332 [BRW_MATH_FUNCTION_RSQ
] = "rsq",
333 [BRW_MATH_FUNCTION_SIN
] = "sin",
334 [BRW_MATH_FUNCTION_COS
] = "cos",
335 [BRW_MATH_FUNCTION_SINCOS
] = "sincos",
336 [BRW_MATH_FUNCTION_TAN
] = "tan",
337 [BRW_MATH_FUNCTION_POW
] = "pow",
338 [BRW_MATH_FUNCTION_INT_DIV_QUOTIENT_AND_REMAINDER
] = "intdivmod",
339 [BRW_MATH_FUNCTION_INT_DIV_QUOTIENT
] = "intdiv",
340 [BRW_MATH_FUNCTION_INT_DIV_REMAINDER
] = "intmod",
343 static const char * const math_saturate
[2] = {
348 static const char * const math_signed
[2] = {
353 static const char * const math_scalar
[2] = {
358 static const char * const math_precision
[2] = {
360 [1] = "partial_precision"
363 static const char * const urb_opcode
[2] = {
368 static const char * const urb_swizzle
[4] = {
369 [BRW_URB_SWIZZLE_NONE
] = "",
370 [BRW_URB_SWIZZLE_INTERLEAVE
] = "interleave",
371 [BRW_URB_SWIZZLE_TRANSPOSE
] = "transpose",
374 static const char * const urb_allocate
[2] = {
379 static const char * const urb_used
[2] = {
384 static const char * const urb_complete
[2] = {
389 static const char * const sampler_target_format
[4] = {
398 static int string (FILE *file
, const char *string
)
400 fputs (string
, file
);
401 column
+= strlen (string
);
405 static int format (FILE *f
, const char *format
, ...)
409 va_start (args
, format
);
411 vsnprintf (buf
, sizeof (buf
) - 1, format
, args
);
417 static int newline (FILE *f
)
424 static int pad (FILE *f
, int c
)
432 static int control (FILE *file
, const char *name
, const char * const ctrl
[],
433 GLuint id
, int *space
)
436 fprintf (file
, "*** invalid %s value %d ",
444 string (file
, ctrl
[id
]);
451 static int print_opcode (FILE *file
, int id
)
453 if (!opcode
[id
].name
) {
454 format (file
, "*** invalid opcode value %d ", id
);
457 string (file
, opcode
[id
].name
);
461 static int reg (FILE *file
, GLuint _reg_file
, GLuint _reg_nr
)
465 /* Clear the Compr4 instruction compression bit. */
466 if (_reg_file
== BRW_MESSAGE_REGISTER_FILE
)
467 _reg_nr
&= ~(1 << 7);
469 if (_reg_file
== BRW_ARCHITECTURE_REGISTER_FILE
) {
470 switch (_reg_nr
& 0xf0) {
472 string (file
, "null");
474 case BRW_ARF_ADDRESS
:
475 format (file
, "a%d", _reg_nr
& 0x0f);
477 case BRW_ARF_ACCUMULATOR
:
478 format (file
, "acc%d", _reg_nr
& 0x0f);
481 format (file
, "f%d", _reg_nr
& 0x0f);
484 format (file
, "mask%d", _reg_nr
& 0x0f);
486 case BRW_ARF_MASK_STACK
:
487 format (file
, "msd%d", _reg_nr
& 0x0f);
490 format (file
, "sr%d", _reg_nr
& 0x0f);
492 case BRW_ARF_CONTROL
:
493 format (file
, "cr%d", _reg_nr
& 0x0f);
495 case BRW_ARF_NOTIFICATION_COUNT
:
496 format (file
, "n%d", _reg_nr
& 0x0f);
503 format (file
, "ARF%d", _reg_nr
);
507 err
|= control (file
, "src reg file", reg_file
, _reg_file
, NULL
);
508 format (file
, "%d", _reg_nr
);
513 static int dest (FILE *file
, struct brw_instruction
*inst
)
517 if (inst
->header
.access_mode
== BRW_ALIGN_1
)
519 if (inst
->bits1
.da1
.dest_address_mode
== BRW_ADDRESS_DIRECT
)
521 err
|= reg (file
, inst
->bits1
.da1
.dest_reg_file
, inst
->bits1
.da1
.dest_reg_nr
);
524 if (inst
->bits1
.da1
.dest_subreg_nr
)
525 format (file
, ".%d", inst
->bits1
.da1
.dest_subreg_nr
/
526 reg_type_size
[inst
->bits1
.da1
.dest_reg_type
]);
528 err
|= control (file
, "horiz stride", horiz_stride
, inst
->bits1
.da1
.dest_horiz_stride
, NULL
);
530 err
|= control (file
, "dest reg encoding", reg_encoding
, inst
->bits1
.da1
.dest_reg_type
, NULL
);
534 string (file
, "g[a0");
535 if (inst
->bits1
.ia1
.dest_subreg_nr
)
536 format (file
, ".%d", inst
->bits1
.ia1
.dest_subreg_nr
/
537 reg_type_size
[inst
->bits1
.ia1
.dest_reg_type
]);
538 if (inst
->bits1
.ia1
.dest_indirect_offset
)
539 format (file
, " %d", inst
->bits1
.ia1
.dest_indirect_offset
);
541 err
|= control (file
, "horiz stride", horiz_stride
, inst
->bits1
.ia1
.dest_horiz_stride
, NULL
);
543 err
|= control (file
, "dest reg encoding", reg_encoding
, inst
->bits1
.ia1
.dest_reg_type
, NULL
);
548 if (inst
->bits1
.da16
.dest_address_mode
== BRW_ADDRESS_DIRECT
)
550 err
|= reg (file
, inst
->bits1
.da16
.dest_reg_file
, inst
->bits1
.da16
.dest_reg_nr
);
553 if (inst
->bits1
.da16
.dest_subreg_nr
)
554 format (file
, ".%d", inst
->bits1
.da16
.dest_subreg_nr
/
555 reg_type_size
[inst
->bits1
.da16
.dest_reg_type
]);
556 string (file
, "<1>");
557 err
|= control (file
, "writemask", writemask
, inst
->bits1
.da16
.dest_writemask
, NULL
);
558 err
|= control (file
, "dest reg encoding", reg_encoding
, inst
->bits1
.da16
.dest_reg_type
, NULL
);
563 string (file
, "Indirect align16 address mode not supported");
570 static int dest_3src (FILE *file
, struct brw_instruction
*inst
)
575 if (inst
->bits1
.da3src
.dest_reg_file
)
576 reg_file
= BRW_MESSAGE_REGISTER_FILE
;
578 reg_file
= BRW_GENERAL_REGISTER_FILE
;
580 err
|= reg (file
, reg_file
, inst
->bits1
.da3src
.dest_reg_nr
);
583 if (inst
->bits1
.da3src
.dest_subreg_nr
)
584 format (file
, ".%d", inst
->bits1
.da3src
.dest_subreg_nr
);
585 string (file
, "<1>");
586 err
|= control (file
, "writemask", writemask
, inst
->bits1
.da3src
.dest_writemask
, NULL
);
587 err
|= control (file
, "dest reg encoding", reg_encoding
, BRW_REGISTER_TYPE_F
, NULL
);
592 static int src_align1_region (FILE *file
,
593 GLuint _vert_stride
, GLuint _width
, GLuint _horiz_stride
)
597 err
|= control (file
, "vert stride", vert_stride
, _vert_stride
, NULL
);
599 err
|= control (file
, "width", width
, _width
, NULL
);
601 err
|= control (file
, "horiz_stride", horiz_stride
, _horiz_stride
, NULL
);
606 static int src_da1 (FILE *file
, GLuint type
, GLuint _reg_file
,
607 GLuint _vert_stride
, GLuint _width
, GLuint _horiz_stride
,
608 GLuint reg_num
, GLuint sub_reg_num
, GLuint __abs
, GLuint _negate
)
611 err
|= control (file
, "negate", negate
, _negate
, NULL
);
612 err
|= control (file
, "abs", _abs
, __abs
, NULL
);
614 err
|= reg (file
, _reg_file
, reg_num
);
618 format (file
, ".%d", sub_reg_num
/ reg_type_size
[type
]); /* use formal style like spec */
619 src_align1_region (file
, _vert_stride
, _width
, _horiz_stride
);
620 err
|= control (file
, "src reg encoding", reg_encoding
, type
, NULL
);
624 static int src_ia1 (FILE *file
,
628 GLuint _addr_subreg_nr
,
632 GLuint _horiz_stride
,
637 err
|= control (file
, "negate", negate
, _negate
, NULL
);
638 err
|= control (file
, "abs", _abs
, __abs
, NULL
);
640 string (file
, "g[a0");
642 format (file
, ".%d", _addr_subreg_nr
);
644 format (file
, " %d", _addr_imm
);
646 src_align1_region (file
, _vert_stride
, _width
, _horiz_stride
);
647 err
|= control (file
, "src reg encoding", reg_encoding
, type
, NULL
);
651 static int src_da16 (FILE *file
,
665 err
|= control (file
, "negate", negate
, _negate
, NULL
);
666 err
|= control (file
, "abs", _abs
, __abs
, NULL
);
668 err
|= reg (file
, _reg_file
, _reg_nr
);
672 /* bit4 for subreg number byte addressing. Make this same meaning as
673 in da1 case, so output looks consistent. */
674 format (file
, ".%d", 16 / reg_type_size
[_reg_type
]);
676 err
|= control (file
, "vert stride", vert_stride
, _vert_stride
, NULL
);
677 string (file
, ",4,1>");
679 * Three kinds of swizzle display:
680 * identity - nothing printed
681 * 1->all - print the single channel
682 * 1->1 - print the mapping
684 if (swz_x
== BRW_CHANNEL_X
&&
685 swz_y
== BRW_CHANNEL_Y
&&
686 swz_z
== BRW_CHANNEL_Z
&&
687 swz_w
== BRW_CHANNEL_W
)
691 else if (swz_x
== swz_y
&& swz_x
== swz_z
&& swz_x
== swz_w
)
694 err
|= control (file
, "channel select", chan_sel
, swz_x
, NULL
);
699 err
|= control (file
, "channel select", chan_sel
, swz_x
, NULL
);
700 err
|= control (file
, "channel select", chan_sel
, swz_y
, NULL
);
701 err
|= control (file
, "channel select", chan_sel
, swz_z
, NULL
);
702 err
|= control (file
, "channel select", chan_sel
, swz_w
, NULL
);
704 err
|= control (file
, "src da16 reg type", reg_encoding
, _reg_type
, NULL
);
708 static int src0_3src (FILE *file
, struct brw_instruction
*inst
)
711 GLuint swz_x
= (inst
->bits2
.da3src
.src0_swizzle
>> 0) & 0x3;
712 GLuint swz_y
= (inst
->bits2
.da3src
.src0_swizzle
>> 2) & 0x3;
713 GLuint swz_z
= (inst
->bits2
.da3src
.src0_swizzle
>> 4) & 0x3;
714 GLuint swz_w
= (inst
->bits2
.da3src
.src0_swizzle
>> 6) & 0x3;
716 err
|= control (file
, "negate", negate
, inst
->bits1
.da3src
.src0_negate
, NULL
);
717 err
|= control (file
, "abs", _abs
, inst
->bits1
.da3src
.src0_abs
, NULL
);
719 err
|= reg (file
, BRW_GENERAL_REGISTER_FILE
, inst
->bits2
.da3src
.src0_reg_nr
);
722 if (inst
->bits2
.da3src
.src0_subreg_nr
)
723 format (file
, ".%d", inst
->bits2
.da3src
.src0_subreg_nr
);
724 string (file
, "<4,1,1>");
725 err
|= control (file
, "src da16 reg type", reg_encoding
,
726 BRW_REGISTER_TYPE_F
, NULL
);
728 * Three kinds of swizzle display:
729 * identity - nothing printed
730 * 1->all - print the single channel
731 * 1->1 - print the mapping
733 if (swz_x
== BRW_CHANNEL_X
&&
734 swz_y
== BRW_CHANNEL_Y
&&
735 swz_z
== BRW_CHANNEL_Z
&&
736 swz_w
== BRW_CHANNEL_W
)
740 else if (swz_x
== swz_y
&& swz_x
== swz_z
&& swz_x
== swz_w
)
743 err
|= control (file
, "channel select", chan_sel
, swz_x
, NULL
);
748 err
|= control (file
, "channel select", chan_sel
, swz_x
, NULL
);
749 err
|= control (file
, "channel select", chan_sel
, swz_y
, NULL
);
750 err
|= control (file
, "channel select", chan_sel
, swz_z
, NULL
);
751 err
|= control (file
, "channel select", chan_sel
, swz_w
, NULL
);
756 static int src1_3src (FILE *file
, struct brw_instruction
*inst
)
759 GLuint swz_x
= (inst
->bits2
.da3src
.src1_swizzle
>> 0) & 0x3;
760 GLuint swz_y
= (inst
->bits2
.da3src
.src1_swizzle
>> 2) & 0x3;
761 GLuint swz_z
= (inst
->bits2
.da3src
.src1_swizzle
>> 4) & 0x3;
762 GLuint swz_w
= (inst
->bits2
.da3src
.src1_swizzle
>> 6) & 0x3;
763 GLuint src1_subreg_nr
= (inst
->bits2
.da3src
.src1_subreg_nr_low
|
764 (inst
->bits3
.da3src
.src1_subreg_nr_high
<< 2));
766 err
|= control (file
, "negate", negate
, inst
->bits1
.da3src
.src1_negate
,
768 err
|= control (file
, "abs", _abs
, inst
->bits1
.da3src
.src1_abs
, NULL
);
770 err
|= reg (file
, BRW_GENERAL_REGISTER_FILE
,
771 inst
->bits3
.da3src
.src1_reg_nr
);
775 format (file
, ".%d", src1_subreg_nr
);
776 string (file
, "<4,1,1>");
777 err
|= control (file
, "src da16 reg type", reg_encoding
,
778 BRW_REGISTER_TYPE_F
, NULL
);
780 * Three kinds of swizzle display:
781 * identity - nothing printed
782 * 1->all - print the single channel
783 * 1->1 - print the mapping
785 if (swz_x
== BRW_CHANNEL_X
&&
786 swz_y
== BRW_CHANNEL_Y
&&
787 swz_z
== BRW_CHANNEL_Z
&&
788 swz_w
== BRW_CHANNEL_W
)
792 else if (swz_x
== swz_y
&& swz_x
== swz_z
&& swz_x
== swz_w
)
795 err
|= control (file
, "channel select", chan_sel
, swz_x
, NULL
);
800 err
|= control (file
, "channel select", chan_sel
, swz_x
, NULL
);
801 err
|= control (file
, "channel select", chan_sel
, swz_y
, NULL
);
802 err
|= control (file
, "channel select", chan_sel
, swz_z
, NULL
);
803 err
|= control (file
, "channel select", chan_sel
, swz_w
, NULL
);
809 static int src2_3src (FILE *file
, struct brw_instruction
*inst
)
812 GLuint swz_x
= (inst
->bits3
.da3src
.src2_swizzle
>> 0) & 0x3;
813 GLuint swz_y
= (inst
->bits3
.da3src
.src2_swizzle
>> 2) & 0x3;
814 GLuint swz_z
= (inst
->bits3
.da3src
.src2_swizzle
>> 4) & 0x3;
815 GLuint swz_w
= (inst
->bits3
.da3src
.src2_swizzle
>> 6) & 0x3;
817 err
|= control (file
, "negate", negate
, inst
->bits1
.da3src
.src2_negate
,
819 err
|= control (file
, "abs", _abs
, inst
->bits1
.da3src
.src2_abs
, NULL
);
821 err
|= reg (file
, BRW_GENERAL_REGISTER_FILE
,
822 inst
->bits3
.da3src
.src2_reg_nr
);
825 if (inst
->bits3
.da3src
.src2_subreg_nr
)
826 format (file
, ".%d", inst
->bits3
.da3src
.src2_subreg_nr
);
827 string (file
, "<4,1,1>");
828 err
|= control (file
, "src da16 reg type", reg_encoding
,
829 BRW_REGISTER_TYPE_F
, NULL
);
831 * Three kinds of swizzle display:
832 * identity - nothing printed
833 * 1->all - print the single channel
834 * 1->1 - print the mapping
836 if (swz_x
== BRW_CHANNEL_X
&&
837 swz_y
== BRW_CHANNEL_Y
&&
838 swz_z
== BRW_CHANNEL_Z
&&
839 swz_w
== BRW_CHANNEL_W
)
843 else if (swz_x
== swz_y
&& swz_x
== swz_z
&& swz_x
== swz_w
)
846 err
|= control (file
, "channel select", chan_sel
, swz_x
, NULL
);
851 err
|= control (file
, "channel select", chan_sel
, swz_x
, NULL
);
852 err
|= control (file
, "channel select", chan_sel
, swz_y
, NULL
);
853 err
|= control (file
, "channel select", chan_sel
, swz_z
, NULL
);
854 err
|= control (file
, "channel select", chan_sel
, swz_w
, NULL
);
859 static int imm (FILE *file
, GLuint type
, struct brw_instruction
*inst
) {
861 case BRW_REGISTER_TYPE_UD
:
862 format (file
, "0x%08xUD", inst
->bits3
.ud
);
864 case BRW_REGISTER_TYPE_D
:
865 format (file
, "%dD", inst
->bits3
.d
);
867 case BRW_REGISTER_TYPE_UW
:
868 format (file
, "0x%04xUW", (uint16_t) inst
->bits3
.ud
);
870 case BRW_REGISTER_TYPE_W
:
871 format (file
, "%dW", (int16_t) inst
->bits3
.d
);
873 case BRW_REGISTER_TYPE_UB
:
874 format (file
, "0x%02xUB", (int8_t) inst
->bits3
.ud
);
876 case BRW_REGISTER_TYPE_VF
:
877 format (file
, "Vector Float");
879 case BRW_REGISTER_TYPE_V
:
880 format (file
, "0x%08xV", inst
->bits3
.ud
);
882 case BRW_REGISTER_TYPE_F
:
883 format (file
, "%-gF", inst
->bits3
.f
);
888 static int src0 (FILE *file
, struct brw_instruction
*inst
)
890 if (inst
->bits1
.da1
.src0_reg_file
== BRW_IMMEDIATE_VALUE
)
891 return imm (file
, inst
->bits1
.da1
.src0_reg_type
,
893 else if (inst
->header
.access_mode
== BRW_ALIGN_1
)
895 if (inst
->bits2
.da1
.src0_address_mode
== BRW_ADDRESS_DIRECT
)
897 return src_da1 (file
,
898 inst
->bits1
.da1
.src0_reg_type
,
899 inst
->bits1
.da1
.src0_reg_file
,
900 inst
->bits2
.da1
.src0_vert_stride
,
901 inst
->bits2
.da1
.src0_width
,
902 inst
->bits2
.da1
.src0_horiz_stride
,
903 inst
->bits2
.da1
.src0_reg_nr
,
904 inst
->bits2
.da1
.src0_subreg_nr
,
905 inst
->bits2
.da1
.src0_abs
,
906 inst
->bits2
.da1
.src0_negate
);
910 return src_ia1 (file
,
911 inst
->bits1
.ia1
.src0_reg_type
,
912 inst
->bits1
.ia1
.src0_reg_file
,
913 inst
->bits2
.ia1
.src0_indirect_offset
,
914 inst
->bits2
.ia1
.src0_subreg_nr
,
915 inst
->bits2
.ia1
.src0_negate
,
916 inst
->bits2
.ia1
.src0_abs
,
917 inst
->bits2
.ia1
.src0_address_mode
,
918 inst
->bits2
.ia1
.src0_horiz_stride
,
919 inst
->bits2
.ia1
.src0_width
,
920 inst
->bits2
.ia1
.src0_vert_stride
);
925 if (inst
->bits2
.da16
.src0_address_mode
== BRW_ADDRESS_DIRECT
)
927 return src_da16 (file
,
928 inst
->bits1
.da16
.src0_reg_type
,
929 inst
->bits1
.da16
.src0_reg_file
,
930 inst
->bits2
.da16
.src0_vert_stride
,
931 inst
->bits2
.da16
.src0_reg_nr
,
932 inst
->bits2
.da16
.src0_subreg_nr
,
933 inst
->bits2
.da16
.src0_abs
,
934 inst
->bits2
.da16
.src0_negate
,
935 inst
->bits2
.da16
.src0_swz_x
,
936 inst
->bits2
.da16
.src0_swz_y
,
937 inst
->bits2
.da16
.src0_swz_z
,
938 inst
->bits2
.da16
.src0_swz_w
);
942 string (file
, "Indirect align16 address mode not supported");
948 static int src1 (FILE *file
, struct brw_instruction
*inst
)
950 if (inst
->bits1
.da1
.src1_reg_file
== BRW_IMMEDIATE_VALUE
)
951 return imm (file
, inst
->bits1
.da1
.src1_reg_type
,
953 else if (inst
->header
.access_mode
== BRW_ALIGN_1
)
955 if (inst
->bits3
.da1
.src1_address_mode
== BRW_ADDRESS_DIRECT
)
957 return src_da1 (file
,
958 inst
->bits1
.da1
.src1_reg_type
,
959 inst
->bits1
.da1
.src1_reg_file
,
960 inst
->bits3
.da1
.src1_vert_stride
,
961 inst
->bits3
.da1
.src1_width
,
962 inst
->bits3
.da1
.src1_horiz_stride
,
963 inst
->bits3
.da1
.src1_reg_nr
,
964 inst
->bits3
.da1
.src1_subreg_nr
,
965 inst
->bits3
.da1
.src1_abs
,
966 inst
->bits3
.da1
.src1_negate
);
970 return src_ia1 (file
,
971 inst
->bits1
.ia1
.src1_reg_type
,
972 inst
->bits1
.ia1
.src1_reg_file
,
973 inst
->bits3
.ia1
.src1_indirect_offset
,
974 inst
->bits3
.ia1
.src1_subreg_nr
,
975 inst
->bits3
.ia1
.src1_negate
,
976 inst
->bits3
.ia1
.src1_abs
,
977 inst
->bits3
.ia1
.src1_address_mode
,
978 inst
->bits3
.ia1
.src1_horiz_stride
,
979 inst
->bits3
.ia1
.src1_width
,
980 inst
->bits3
.ia1
.src1_vert_stride
);
985 if (inst
->bits3
.da16
.src1_address_mode
== BRW_ADDRESS_DIRECT
)
987 return src_da16 (file
,
988 inst
->bits1
.da16
.src1_reg_type
,
989 inst
->bits1
.da16
.src1_reg_file
,
990 inst
->bits3
.da16
.src1_vert_stride
,
991 inst
->bits3
.da16
.src1_reg_nr
,
992 inst
->bits3
.da16
.src1_subreg_nr
,
993 inst
->bits3
.da16
.src1_abs
,
994 inst
->bits3
.da16
.src1_negate
,
995 inst
->bits3
.da16
.src1_swz_x
,
996 inst
->bits3
.da16
.src1_swz_y
,
997 inst
->bits3
.da16
.src1_swz_z
,
998 inst
->bits3
.da16
.src1_swz_w
);
1002 string (file
, "Indirect align16 address mode not supported");
1017 static int qtr_ctrl(FILE *file
, struct brw_instruction
*inst
)
1019 int qtr_ctl
= inst
->header
.compression_control
;
1020 int exec_size
= esize
[inst
->header
.execution_size
];
1022 if (exec_size
== 8) {
1025 string (file
, " 1Q");
1028 string (file
, " 2Q");
1031 string (file
, " 3Q");
1034 string (file
, " 4Q");
1037 } else if (exec_size
== 16){
1039 string (file
, " 1H");
1041 string (file
, " 2H");
1046 int brw_disasm (FILE *file
, struct brw_instruction
*inst
, int gen
)
1051 if (inst
->header
.predicate_control
) {
1053 err
|= control (file
, "predicate inverse", pred_inv
, inst
->header
.predicate_inverse
, NULL
);
1054 format (file
, "f%d", gen
>= 7 ? inst
->bits2
.da1
.flag_reg_nr
: 0);
1055 if (inst
->bits2
.da1
.flag_subreg_nr
)
1056 format (file
, ".%d", inst
->bits2
.da1
.flag_subreg_nr
);
1057 if (inst
->header
.access_mode
== BRW_ALIGN_1
)
1058 err
|= control (file
, "predicate control align1", pred_ctrl_align1
,
1059 inst
->header
.predicate_control
, NULL
);
1061 err
|= control (file
, "predicate control align16", pred_ctrl_align16
,
1062 inst
->header
.predicate_control
, NULL
);
1063 string (file
, ") ");
1066 err
|= print_opcode (file
, inst
->header
.opcode
);
1067 err
|= control (file
, "saturate", saturate
, inst
->header
.saturate
, NULL
);
1068 err
|= control (file
, "debug control", debug_ctrl
, inst
->header
.debug_control
, NULL
);
1070 if (inst
->header
.opcode
== BRW_OPCODE_MATH
) {
1072 err
|= control (file
, "function", math_function
,
1073 inst
->header
.destreg__conditionalmod
, NULL
);
1074 } else if (inst
->header
.opcode
!= BRW_OPCODE_SEND
&&
1075 inst
->header
.opcode
!= BRW_OPCODE_SENDC
) {
1076 err
|= control (file
, "conditional modifier", conditional_modifier
,
1077 inst
->header
.destreg__conditionalmod
, NULL
);
1079 /* If we're using the conditional modifier, print which flags reg is
1080 * used for it. Note that on gen6+, the embedded-condition SEL and
1081 * control flow doesn't update flags.
1083 if (inst
->header
.destreg__conditionalmod
&&
1084 (gen
< 6 || (inst
->header
.opcode
!= BRW_OPCODE_SEL
&&
1085 inst
->header
.opcode
!= BRW_OPCODE_IF
&&
1086 inst
->header
.opcode
!= BRW_OPCODE_WHILE
))) {
1087 format (file
, ".f%d", gen
>= 7 ? inst
->bits2
.da1
.flag_reg_nr
: 0);
1088 if (inst
->bits2
.da1
.flag_subreg_nr
)
1089 format (file
, ".%d", inst
->bits2
.da1
.flag_subreg_nr
);
1093 if (inst
->header
.opcode
!= BRW_OPCODE_NOP
) {
1095 err
|= control (file
, "execution size", exec_size
, inst
->header
.execution_size
, NULL
);
1099 if (inst
->header
.opcode
== BRW_OPCODE_SEND
&& gen
< 6)
1100 format (file
, " %d", inst
->header
.destreg__conditionalmod
);
1102 if (opcode
[inst
->header
.opcode
].nsrc
== 3) {
1104 err
|= dest_3src (file
, inst
);
1107 err
|= src0_3src (file
, inst
);
1110 err
|= src1_3src (file
, inst
);
1113 err
|= src2_3src (file
, inst
);
1115 if (opcode
[inst
->header
.opcode
].ndst
> 0) {
1117 err
|= dest (file
, inst
);
1118 } else if (gen
== 7 && (inst
->header
.opcode
== BRW_OPCODE_ELSE
||
1119 inst
->header
.opcode
== BRW_OPCODE_ENDIF
||
1120 inst
->header
.opcode
== BRW_OPCODE_WHILE
)) {
1121 format (file
, " %d", inst
->bits3
.break_cont
.jip
);
1122 } else if (gen
== 6 && (inst
->header
.opcode
== BRW_OPCODE_IF
||
1123 inst
->header
.opcode
== BRW_OPCODE_ELSE
||
1124 inst
->header
.opcode
== BRW_OPCODE_ENDIF
||
1125 inst
->header
.opcode
== BRW_OPCODE_WHILE
)) {
1126 format (file
, " %d", inst
->bits1
.branch_gen6
.jump_count
);
1127 } else if ((gen
>= 6 && (inst
->header
.opcode
== BRW_OPCODE_BREAK
||
1128 inst
->header
.opcode
== BRW_OPCODE_CONTINUE
||
1129 inst
->header
.opcode
== BRW_OPCODE_HALT
)) ||
1130 (gen
== 7 && inst
->header
.opcode
== BRW_OPCODE_IF
)) {
1131 format (file
, " %d %d", inst
->bits3
.break_cont
.uip
, inst
->bits3
.break_cont
.jip
);
1132 } else if (inst
->header
.opcode
== BRW_OPCODE_JMPI
) {
1133 format (file
, " %d", inst
->bits3
.d
);
1136 if (opcode
[inst
->header
.opcode
].nsrc
> 0) {
1138 err
|= src0 (file
, inst
);
1140 if (opcode
[inst
->header
.opcode
].nsrc
> 1) {
1142 err
|= src1 (file
, inst
);
1146 if (inst
->header
.opcode
== BRW_OPCODE_SEND
||
1147 inst
->header
.opcode
== BRW_OPCODE_SENDC
) {
1148 enum brw_message_target target
;
1151 target
= inst
->header
.destreg__conditionalmod
;
1153 target
= inst
->bits2
.send_gen5
.sfid
;
1155 target
= inst
->bits3
.generic
.msg_target
;
1162 err
|= control (file
, "target function", target_function_gen6
,
1165 err
|= control (file
, "target function", target_function
,
1171 err
|= control (file
, "math function", math_function
,
1172 inst
->bits3
.math
.function
, &space
);
1173 err
|= control (file
, "math saturate", math_saturate
,
1174 inst
->bits3
.math
.saturate
, &space
);
1175 err
|= control (file
, "math signed", math_signed
,
1176 inst
->bits3
.math
.int_type
, &space
);
1177 err
|= control (file
, "math scalar", math_scalar
,
1178 inst
->bits3
.math
.data_type
, &space
);
1179 err
|= control (file
, "math precision", math_precision
,
1180 inst
->bits3
.math
.precision
, &space
);
1182 case BRW_SFID_SAMPLER
:
1184 format (file
, " (%d, %d, %d, %d)",
1185 inst
->bits3
.sampler_gen7
.binding_table_index
,
1186 inst
->bits3
.sampler_gen7
.sampler
,
1187 inst
->bits3
.sampler_gen7
.msg_type
,
1188 inst
->bits3
.sampler_gen7
.simd_mode
);
1189 } else if (gen
>= 5) {
1190 format (file
, " (%d, %d, %d, %d)",
1191 inst
->bits3
.sampler_gen5
.binding_table_index
,
1192 inst
->bits3
.sampler_gen5
.sampler
,
1193 inst
->bits3
.sampler_gen5
.msg_type
,
1194 inst
->bits3
.sampler_gen5
.simd_mode
);
1195 } else if (0 /* FINISHME: is_g4x */) {
1196 format (file
, " (%d, %d)",
1197 inst
->bits3
.sampler_g4x
.binding_table_index
,
1198 inst
->bits3
.sampler_g4x
.sampler
);
1200 format (file
, " (%d, %d, ",
1201 inst
->bits3
.sampler
.binding_table_index
,
1202 inst
->bits3
.sampler
.sampler
);
1203 err
|= control (file
, "sampler target format",
1204 sampler_target_format
,
1205 inst
->bits3
.sampler
.return_format
, NULL
);
1209 case BRW_SFID_DATAPORT_READ
:
1211 format (file
, " (%d, %d, %d, %d)",
1212 inst
->bits3
.gen6_dp
.binding_table_index
,
1213 inst
->bits3
.gen6_dp
.msg_control
,
1214 inst
->bits3
.gen6_dp
.msg_type
,
1215 inst
->bits3
.gen6_dp
.send_commit_msg
);
1216 } else if (gen
>= 5 /* FINISHME: || is_g4x */) {
1217 format (file
, " (%d, %d, %d)",
1218 inst
->bits3
.dp_read_gen5
.binding_table_index
,
1219 inst
->bits3
.dp_read_gen5
.msg_control
,
1220 inst
->bits3
.dp_read_gen5
.msg_type
);
1222 format (file
, " (%d, %d, %d)",
1223 inst
->bits3
.dp_read
.binding_table_index
,
1224 inst
->bits3
.dp_read
.msg_control
,
1225 inst
->bits3
.dp_read
.msg_type
);
1229 case BRW_SFID_DATAPORT_WRITE
:
1231 format (file
, " (");
1233 err
|= control (file
, "DP rc message type",
1234 dp_rc_msg_type_gen6
,
1235 inst
->bits3
.gen7_dp
.msg_type
, &space
);
1237 format (file
, ", %d, %d, %d)",
1238 inst
->bits3
.gen7_dp
.binding_table_index
,
1239 inst
->bits3
.gen7_dp
.msg_control
,
1240 inst
->bits3
.gen7_dp
.msg_type
);
1241 } else if (gen
== 6) {
1242 format (file
, " (");
1244 err
|= control (file
, "DP rc message type",
1245 dp_rc_msg_type_gen6
,
1246 inst
->bits3
.gen6_dp
.msg_type
, &space
);
1248 format (file
, ", %d, %d, %d, %d)",
1249 inst
->bits3
.gen6_dp
.binding_table_index
,
1250 inst
->bits3
.gen6_dp
.msg_control
,
1251 inst
->bits3
.gen6_dp
.msg_type
,
1252 inst
->bits3
.gen6_dp
.send_commit_msg
);
1254 format (file
, " (%d, %d, %d, %d)",
1255 inst
->bits3
.dp_write
.binding_table_index
,
1256 (inst
->bits3
.dp_write
.last_render_target
<< 3) |
1257 inst
->bits3
.dp_write
.msg_control
,
1258 inst
->bits3
.dp_write
.msg_type
,
1259 inst
->bits3
.dp_write
.send_commit_msg
);
1265 format (file
, " %d", inst
->bits3
.urb_gen5
.offset
);
1267 format (file
, " %d", inst
->bits3
.urb
.offset
);
1272 err
|= control (file
, "urb opcode", urb_opcode
,
1273 inst
->bits3
.urb_gen5
.opcode
, &space
);
1275 err
|= control (file
, "urb swizzle", urb_swizzle
,
1276 inst
->bits3
.urb
.swizzle_control
, &space
);
1277 err
|= control (file
, "urb allocate", urb_allocate
,
1278 inst
->bits3
.urb
.allocate
, &space
);
1279 err
|= control (file
, "urb used", urb_used
,
1280 inst
->bits3
.urb
.used
, &space
);
1281 err
|= control (file
, "urb complete", urb_complete
,
1282 inst
->bits3
.urb
.complete
, &space
);
1284 case BRW_SFID_THREAD_SPAWNER
:
1286 case GEN7_SFID_DATAPORT_DATA_CACHE
:
1287 format (file
, " (%d, %d, %d)",
1288 inst
->bits3
.gen7_dp
.binding_table_index
,
1289 inst
->bits3
.gen7_dp
.msg_control
,
1290 inst
->bits3
.gen7_dp
.msg_type
);
1295 format (file
, "unsupported target %d", target
);
1301 format (file
, "mlen %d",
1302 inst
->bits3
.generic_gen5
.msg_length
);
1303 format (file
, " rlen %d",
1304 inst
->bits3
.generic_gen5
.response_length
);
1306 format (file
, "mlen %d",
1307 inst
->bits3
.generic
.msg_length
);
1308 format (file
, " rlen %d",
1309 inst
->bits3
.generic
.response_length
);
1313 if (inst
->header
.opcode
!= BRW_OPCODE_NOP
) {
1316 err
|= control(file
, "access mode", access_mode
, inst
->header
.access_mode
, &space
);
1318 err
|= control (file
, "write enable control", wectrl
, inst
->header
.mask_control
, &space
);
1320 err
|= control (file
, "mask control", mask_ctrl
, inst
->header
.mask_control
, &space
);
1321 err
|= control (file
, "dependency control", dep_ctrl
, inst
->header
.dependency_control
, &space
);
1324 err
|= qtr_ctrl (file
, inst
);
1326 if (inst
->header
.compression_control
== BRW_COMPRESSION_COMPRESSED
&&
1327 opcode
[inst
->header
.opcode
].ndst
> 0 &&
1328 inst
->bits1
.da1
.dest_reg_file
== BRW_MESSAGE_REGISTER_FILE
&&
1329 inst
->bits1
.da1
.dest_reg_nr
& (1 << 7)) {
1330 format (file
, " compr4");
1332 err
|= control (file
, "compression control", compr_ctrl
,
1333 inst
->header
.compression_control
, &space
);
1337 err
|= control (file
, "thread control", thread_ctrl
, inst
->header
.thread_control
, &space
);
1339 err
|= control (file
, "acc write control", accwr
, inst
->header
.acc_wr_control
, &space
);
1340 if (inst
->header
.opcode
== BRW_OPCODE_SEND
||
1341 inst
->header
.opcode
== BRW_OPCODE_SENDC
)
1342 err
|= control (file
, "end of thread", end_of_thread
,
1343 inst
->bits3
.generic
.end_of_thread
, &space
);