2 * Copyright © 2016 Broadcom
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
26 #include "util/macros.h"
27 #include "broadcom/common/v3d_device_info.h"
28 #include "broadcom/qpu/qpu_disasm.h"
29 #include "broadcom/qpu/qpu_instr.h"
36 { 33, 0x3d003186bb800000ull
, "nop ; nop ; ldvary" },
37 { 33, 0x3c20318105829000ull
, "fadd r1, r1, r5 ; nop ; thrsw" },
38 { 33, 0x3c403186bb81d000ull
, "vpmsetup -, r5 ; nop ; ldunif" },
39 { 33, 0x3f003186bb800000ull
, "nop ; nop ; ldvpm" },
40 { 33, 0x3c002380b6edb000ull
, "or rf0, r3, r3 ; mov vpm, r3" },
41 { 33, 0x57403006bbb80000ull
, "nop ; fmul r0, rf0, r5 ; ldvpm; ldunif" },
43 /* vfmul input packing */
44 { 33, 0x101e8b6e8aad4000ull
, "fmax.nornn rf46, r4.l, r2.l; vfmul.ifnb rf45, r3, r5" },
45 { 33, 0x1857d3c219825000ull
, "faddnf.norc r2.l, r5.l, r4; vfmul.ifb rf15, r0.ll, r4; ldunif" },
46 { 33, 0x1c0a0dfde2294000ull
, "fcmp.ifna rf61.h, r4.abs, r2.l; vfmul rf55, r2.hh, r1" },
47 { 33, 0x2011c89b402cc000ull
, "fsub.norz rf27, r4.abs, r1.abs; vfmul.ifa rf34, r3.swp, r1" },
49 /* small immediates */
50 { 33, 0x5de24398bbdc6218ull
, "vflb.andnn rf24 ; fmul rf14, -8, rf8.h" },
51 { 33, 0x25ef83d8b166f00full
, "vfmin.pushn rf24, 15.ff, r5; smul24.ifnb rf15, r1, r3" },
52 { 33, 0xadedcdf70839f990ull
, "faddnf.pushc rf55, -16.l, r3.abs; fmul.ifb rf55.l, rf38.l, r1.h" },
53 { 33, 0x7dff89fa6a01f020ull
, "fsub.nornc rf58.h, 0x3b800000.l, r3.l; fmul.ifnb rf39, r0.h, r0.h" },
55 /* branch conditions */
56 { 33, 0x02000006002034c0ull
, "b.anyap rf19" },
57 { 33, 0x02679356b4201000ull
, "b.anyap -1268280496" },
58 { 33, 0x02b76a2dd0400000ull
, "b.anynaq zero_addr+0xd0b76a28" },
59 { 33, 0x0200000500402000ull
, "b.anynaq lri" },
60 { 33, 0x0216fe167301c8c0ull
, "bu.anya zero_addr+0x7316fe10, rf35" },
61 { 33, 0x020000050040e000ull
, "bu.anynaq lri, r:unif" },
62 { 33, 0x0200000300006000ull
, "bu.na0 lri, a:unif" },
64 /* Special waddr names */
65 { 33, 0x3c00318735808000ull
, "vfpack tlb, r0, r1 ; nop" },
66 { 33, 0xe0571c938e8d5000ull
, "fmax.andc recip, r5.h, r2.l; fmul.ifb rf50.h, r3.l, r4.abs; ldunif" },
67 { 33, 0xc04098d4382c9000ull
, "add.pushn rsqrt, r1, r1; fmul rf35.h, r3.abs, r1.abs; ldunif" },
68 { 33, 0x481edcd6b3184500ull
, "vfmin.norn log, r4.hh, r0; fmul.ifnb rf51, rf20.abs, r0.l" },
69 { 33, 0x041618d57c453000ull
, "shl.andn exp, r3, r2; add.ifb rf35, r1, r2" },
70 { 33, 0x7048e5da49272800ull
, "fsub.ifa rf26, r2.l, rf32; fmul.pushc sin, r1.h, r1.abs; ldunif" },
73 { 41, 0x1f010520cf60a000ull
, "fcmp.andz rf32, r2.h, r1.h; vfmul rf20, r0.hh, r3; ldunifa" },
74 { 41, 0x932045e6c16ea000ull
, "fcmp rf38, r2.abs, r5; fmul rf23.l, r3, r3.abs; ldunifarf.rf1" },
75 { 41, 0xd72f0434e43ae5c0ull
, "fcmp rf52.h, rf23, r5.abs; fmul rf16.h, rf23, r1; ldunifarf.rf60" },
76 { 41, 0xdb3048eb9d533780ull
, "fmax rf43.l, r3.h, rf30; fmul rf35.h, r4, r2.l; ldunifarf.r1" },
77 { 41, 0x733620471e6ce700ull
, "faddnf rf7.l, rf28.h, r1.l; fmul r1, r3.h, r3.abs; ldunifarf.rsqrt2" },
78 { 41, 0x9c094adef634b000ull
, "ffloor.ifb rf30.l, r3; fmul.pushz rf43.l, r5, r1.h" },
81 { 41, 0x3de020c7bdfd200dull
, "ldvpmg_in rf7, r2, r2; mov r3, 13" },
82 { 41, 0x3de02040f8ff7201ull
, "stvpmv 1, rf8 ; mov r1, 1" },
83 { 41, 0xd8000e50bb2d3000ull
, "sampid rf16 ; fmul rf57.h, r3, r1.l" },
87 swap_mux(enum v3d_qpu_mux
*a
, enum v3d_qpu_mux
*b
)
89 enum v3d_qpu_mux t
= *a
;
95 swap_pack(enum v3d_qpu_input_unpack
*a
, enum v3d_qpu_input_unpack
*b
)
97 enum v3d_qpu_input_unpack t
= *a
;
103 main(int argc
, char **argv
)
105 struct v3d_device_info devinfo
= { };
108 for (int i
= 0; i
< ARRAY_SIZE(tests
); i
++) {
109 devinfo
.ver
= tests
[i
].ver
;
111 printf("Testing v%d.%d 0x%016llx... ",
112 devinfo
.ver
/ 10, devinfo
.ver
% 10,
113 (long long)tests
[i
].inst
);
115 const char *disasm_output
= v3d_qpu_disasm(&devinfo
,
118 if (strcmp(disasm_output
, tests
[i
].expected
) != 0) {
120 printf(" Expected: \"%s\"\n", tests
[i
].expected
);
121 printf(" Got: \"%s\"\n", disasm_output
);
126 struct v3d_qpu_instr instr
;
127 if (!v3d_qpu_instr_unpack(&devinfo
, tests
[i
].inst
, &instr
)) {
128 printf("FAIL (unpack) %s\n", tests
[i
].expected
);
133 if (instr
.type
== V3D_QPU_INSTR_TYPE_ALU
) {
134 switch (instr
.alu
.add
.op
) {
136 case V3D_QPU_A_FADDNF
:
139 /* Swap the operands to be sure that we test
140 * how the QPUs distinguish between these ops.
142 swap_mux(&instr
.alu
.add
.a
,
144 swap_pack(&instr
.alu
.add
.a_unpack
,
145 &instr
.alu
.add
.b_unpack
);
152 if (!v3d_qpu_instr_pack(&devinfo
, &instr
, &repack
)) {
153 printf("FAIL (pack) %s\n", tests
[i
].expected
);
158 if (repack
!= tests
[i
].inst
) {
159 printf("FAIL (repack) 0x%016llx\n", (long long)repack
);
160 printf(" Expected: \"%s\"\n", tests
[i
].expected
);
161 const char *redisasm
= v3d_qpu_disasm(&devinfo
, repack
);
162 printf(" Got: \"%s\"\n", redisasm
);