panfrost/midgard: Add fround(_even), ftrunc, ffma
[mesa.git] / src / gallium / drivers / panfrost / midgard / midgard.h
1 /* Author(s):
2 * Connor Abbott
3 * Alyssa Rosenzweig
4 *
5 * Copyright (c) 2013 Connor Abbott (connor@abbott.cx)
6 * Copyright (c) 2018 Alyssa Rosenzweig (alyssa@rosenzweig.io)
7 *
8 * Permission is hereby granted, free of charge, to any person obtaining a copy
9 * of this software and associated documentation files (the "Software"), to deal
10 * in the Software without restriction, including without limitation the rights
11 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
12 * copies of the Software, and to permit persons to whom the Software is
13 * furnished to do so, subject to the following conditions:
14 *
15 * The above copyright notice and this permission notice shall be included in
16 * all copies or substantial portions of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
19 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
20 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
21 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
22 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
23 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
24 * THE SOFTWARE.
25 */
26
27 #ifndef __midgard_h__
28 #define __midgard_h__
29
30 #include <stdint.h>
31 #include <stdbool.h>
32
/* Category of an instruction word. Values are assigned sequentially from
 * zero. */
typedef enum {
        midgard_word_type_alu        = 0,
        midgard_word_type_load_store = 1,
        midgard_word_type_texture    = 2,
        midgard_word_type_unknown    = 3
} midgard_word_type;
39
/* Identifiers for the ALU units named vmul, sadd, smul, vadd and lut.
 * Values are assigned sequentially from zero. */
typedef enum {
        midgard_alu_vmul = 0,
        midgard_alu_sadd = 1,
        midgard_alu_smul = 2,
        midgard_alu_vadd = 3,
        midgard_alu_lut  = 4
} midgard_alu;
47
48 /*
49 * ALU words
50 */
51
/* Opcode values for the 8-bit `op` field of ALU instructions. Enumerators
 * appear in ascending numeric order, grouped by encoding range; values that
 * are skipped simply have no name assigned in this header. */
typedef enum {
        /* 0x10 - 0x3F */
        midgard_alu_op_fadd       = 0x10,
        midgard_alu_op_fmul       = 0x14,
        midgard_alu_op_fmin       = 0x28,
        midgard_alu_op_fmax       = 0x2c,
        midgard_alu_op_fmov       = 0x30,
        midgard_alu_op_froundeven = 0x34,
        midgard_alu_op_ftrunc     = 0x35,
        midgard_alu_op_ffloor     = 0x36,
        midgard_alu_op_fceil      = 0x37,
        midgard_alu_op_ffma       = 0x38,
        midgard_alu_op_fdot3      = 0x3c,
        midgard_alu_op_fdot3r     = 0x3d,
        midgard_alu_op_fdot4      = 0x3e,
        midgard_alu_op_freduce    = 0x3f,

        /* 0x40 - 0x7F */
        midgard_alu_op_iadd       = 0x40,
        midgard_alu_op_ishladd    = 0x41,
        midgard_alu_op_isub       = 0x46,
        midgard_alu_op_imul       = 0x58,
        midgard_alu_op_imin       = 0x60,
        midgard_alu_op_imax       = 0x62,
        midgard_alu_op_iasr       = 0x68,
        midgard_alu_op_ilsr       = 0x69,
        midgard_alu_op_ishl       = 0x6e,
        midgard_alu_op_iand       = 0x70,
        midgard_alu_op_ior        = 0x71,
        midgard_alu_op_inot       = 0x72,
        /* (a, b) -> a & ~b, used for not/b2f */
        midgard_alu_op_iandnot    = 0x74,
        midgard_alu_op_ixor       = 0x76,
        midgard_alu_op_imov       = 0x7b,

        /* 0x80 - 0x9F */
        midgard_alu_op_feq        = 0x80,
        midgard_alu_op_fne        = 0x81,
        midgard_alu_op_flt        = 0x82,
        midgard_alu_op_fle        = 0x83,
        midgard_alu_op_fball_eq   = 0x88,
        midgard_alu_op_bball_eq   = 0x89,
        /* used for bvec4(1) */
        midgard_alu_op_bbany_neq  = 0x90,
        /* bvec4(0) also */
        midgard_alu_op_fbany_neq  = 0x91,
        midgard_alu_op_f2i        = 0x99,
        midgard_alu_op_f2u8       = 0x9c,
        midgard_alu_op_f2u        = 0x9d,

        /* 0xA0 - 0xBF */
        midgard_alu_op_ieq        = 0xa0,
        midgard_alu_op_ine        = 0xa1,
        midgard_alu_op_ilt        = 0xa4,
        midgard_alu_op_ile        = 0xa5,
        midgard_alu_op_iball_eq   = 0xa8,
        midgard_alu_op_ball       = 0xa9,
        midgard_alu_op_ibany_neq  = 0xb1,
        midgard_alu_op_i2f        = 0xb8,
        midgard_alu_op_u2f        = 0xbc,

        /* 0xC0 - 0xFF */
        midgard_alu_op_icsel      = 0xc1,
        midgard_alu_op_fcsel      = 0xc5,
        midgard_alu_op_fround     = 0xc6,
        midgard_alu_op_fatan_pt2  = 0xe8,
        midgard_alu_op_frcp       = 0xf0,
        midgard_alu_op_frsqrt     = 0xf2,
        midgard_alu_op_fsqrt      = 0xf3,
        midgard_alu_op_fexp2      = 0xf4,
        midgard_alu_op_flog2      = 0xf5,
        midgard_alu_op_fsin       = 0xf6,
        midgard_alu_op_fcos       = 0xf7,
        midgard_alu_op_fatan2_pt1 = 0xf9,
} midgard_alu_op;
115
/* Output modifier selector; fits the 2-bit `outmod` fields of the ALU
 * instruction structs. */
typedef enum {
        midgard_outmod_none = 0,
        midgard_outmod_pos  = 1,
        midgard_outmod_int  = 2,
        midgard_outmod_sat  = 3
} midgard_outmod;
122
/* Register mode selector for the 2-bit `reg_mode` field of vector ALU
 * instructions. */
typedef enum {
        midgard_reg_mode_quarter = 0,
        midgard_reg_mode_half    = 1,
        midgard_reg_mode_full    = 2,
        /* TODO: verify */
        midgard_reg_mode_double  = 3
} midgard_reg_mode;
129
/* Destination override selector for the 2-bit `dest_override` field of
 * vector ALU instructions. */
typedef enum {
        midgard_dest_override_lower = 0,
        midgard_dest_override_upper = 1,
        midgard_dest_override_none  = 2
} midgard_dest_override;
135
/* Vector ALU source operand descriptor. The bit-fields add up to 13 bits,
 * the same width as the src1/src2 fields of midgard_vector_alu. */
typedef struct __attribute__((__packed__)) {
        bool abs    : 1;
        bool negate : 1;

        /* When dest = half, rep_low replicates the lower half; when
         * dest = full, it selects between the low and high half. */
        bool rep_low  : 1;

        /* Unused if dest = full */
        bool rep_high : 1;

        /* Only matters if dest = full */
        bool half     : 1;

        unsigned int swizzle : 8;
} midgard_vector_alu_src;
151
152 typedef struct
153 __attribute__((__packed__))
154 {
155 midgard_alu_op op : 8;
156 midgard_reg_mode reg_mode : 2;
157 unsigned src1 : 13;
158 unsigned src2 : 13;
159 midgard_dest_override dest_override : 2;
160 midgard_outmod outmod : 2;
161 unsigned mask : 8;
162 }
163 midgard_vector_alu;
164
/* Scalar ALU source operand descriptor. The bit-fields add up to 6 bits,
 * the same width as the src1 field of midgard_scalar_alu. */
typedef struct __attribute__((__packed__)) {
        bool abs    : 1;
        bool negate : 1;

        /* 0 = half, 1 = full */
        bool full   : 1;

        unsigned int component : 3;
} midgard_scalar_alu_src;
174
175 typedef struct
176 __attribute__((__packed__))
177 {
178 midgard_alu_op op : 8;
179 unsigned src1 : 6;
180 unsigned src2 : 11;
181 unsigned unknown : 1;
182 midgard_outmod outmod : 2;
183 bool output_full : 1;
184 unsigned output_component : 3;
185 }
186 midgard_scalar_alu;
187
/* Register selection word: three 5-bit register fields followed by the
 * one-bit src2_imm flag, 16 bits in total. */
typedef struct __attribute__((__packed__)) {
        unsigned int src1_reg : 5;
        unsigned int src2_reg : 5;
        unsigned int out_reg  : 5;
        bool         src2_imm : 1;
} midgard_reg_info;
197
/* Opcode stored in the 3-bit `op` field that begins every branch and
 * writeout word declared below. */
typedef enum {
        midgard_jmp_writeout_op_branch_uncond = 1,
        midgard_jmp_writeout_op_branch_cond = 2,
        midgard_jmp_writeout_op_discard = 4,
        midgard_jmp_writeout_op_writeout = 7,
} midgard_jmp_writeout_op;

/* Condition selector for the 2-bit `cond` field of midgard_branch_cond. */
typedef enum {
        midgard_condition_write0 = 0,
        midgard_condition_false = 1,
        midgard_condition_true = 2,
        midgard_condition_always = 3, /* Special for writeout/uncond discard */
} midgard_condition;

/* Unconditional branch word, 16 bits. */
typedef struct
__attribute__((__packed__))
{
        midgard_jmp_writeout_op op : 3; /* == branch_uncond */
        unsigned dest_tag : 4; /* tag of branch destination */
        unsigned unknown : 2;

        /* Declared explicitly signed: whether a plain `int` bit-field is
         * signed is implementation-defined, and this offset must be able to
         * hold negative values on every compiler. */
        signed offset : 7;
}
midgard_branch_uncond;

/* Conditional branch word, 16 bits. */
typedef struct
__attribute__((__packed__))
{
        midgard_jmp_writeout_op op : 3; /* == branch_cond */
        unsigned dest_tag : 4; /* tag of branch destination */

        /* Explicitly signed for the same reason as in
         * midgard_branch_uncond. */
        signed offset : 7;
        midgard_condition cond : 2;
}
midgard_branch_cond;

/* Extended branch word, 48 bits, with a 23-bit signed offset and a 16-bit
 * condition field. */
typedef struct
__attribute__((__packed__))
{
        /* == branch_cond according to the original annotation.
         * NOTE(review): confirm which opcode the extended form uses. */
        midgard_jmp_writeout_op op : 3;
        unsigned dest_tag : 4; /* tag of branch destination */
        unsigned unknown : 2;
        signed offset : 23;
        unsigned cond : 16;
}
midgard_branch_extended;

/* Writeout word, 16 bits; everything after the opcode is undeciphered. */
typedef struct
__attribute__((__packed__))
{
        midgard_jmp_writeout_op op : 3; /* == writeout */
        unsigned unknown : 13;
}
midgard_writeout;
250
251 /*
252 * Load/store words
253 */
254
/* Opcode values for the 8-bit `op` field of midgard_load_store_word,
 * listed in ascending numeric order. */
typedef enum {
        midgard_op_ld_st_noop           = 0x03,

        midgard_op_load_attr_32         = 0x94,
        midgard_op_load_attr_16         = 0x95,
        midgard_op_load_vary_32         = 0x98,
        midgard_op_load_vary_16         = 0x99,
        midgard_op_load_color_buffer_16 = 0x9d,
        midgard_op_load_uniform_16      = 0xac,
        midgard_op_load_uniform_32      = 0xb0,
        midgard_op_load_color_buffer_8  = 0xba,

        midgard_op_store_vary_32        = 0xd4,
        midgard_op_store_vary_16        = 0xd5
} midgard_load_store_op;
268
/* Interpolation selector for the 2-bit `interpolation` field of
 * midgard_varying_parameter. */
typedef enum {
        midgard_interp_centroid = 1,
        midgard_interp_default  = 2
} midgard_interpolation;
273
274 typedef struct
275 __attribute__((__packed__))
276 {
277 unsigned zero1 : 4; /* Always zero */
278
279 /* Varying qualifiers, zero if not a varying */
280 unsigned flat : 1;
281 unsigned is_varying : 1; /* Always one for varying, but maybe something else? */
282 midgard_interpolation interpolation : 2;
283
284 unsigned zero2 : 2; /* Always zero */
285 }
286 midgard_varying_parameter;
287
288 typedef struct
289 __attribute__((__packed__))
290 {
291 midgard_load_store_op op : 8;
292 unsigned reg : 5;
293 unsigned mask : 4;
294 unsigned swizzle : 8;
295 unsigned unknown : 16;
296
297 unsigned varying_parameters : 10;
298
299 unsigned address : 9;
300 }
301 midgard_load_store_word;
302
/* Load/store bundle, 128 bits: two 4-bit type tags followed by two 60-bit
 * payload fields (each as wide as one midgard_load_store_word). */
typedef struct __attribute__((__packed__)) {
        unsigned int type      : 4;
        unsigned int next_type : 4;
        uint64_t     word1     : 60;
        uint64_t     word2     : 60;
} midgard_load_store;
312
/* First register holding texture pipeline results (r28-r29) */
#define REG_TEX_BASE            28

/* Values for the texture `op` field -- tentative ("maybe?") */
#define TEXTURE_OP_NORMAL       0x11
#define TEXTURE_OP_TEXEL_FETCH  0x14

/* Texture format types, stored in the `format` field */
#define TEXTURE_CUBE            0x00
#define TEXTURE_2D              0x02
#define TEXTURE_3D              0x03
324
/* Texture instruction word. The bit-fields add up to 128 bits. Fields named
 * unknown* have not been deciphered. */
typedef struct __attribute__((__packed__)) {
        unsigned int type      : 4;
        unsigned int next_type : 4;

        unsigned int op       : 6;
        unsigned int shadow   : 1;
        unsigned int unknown3 : 1;

        /* `last` is set on the final texture operation of a shader, and
         * `cont` appears to simply be its opposite (?). Somewhat obscure;
         * BiOpen suspects a connection to memory hinting or tile
         * locking. */
        unsigned int cont : 1;
        unsigned int last : 1;

        unsigned int format     : 5;
        unsigned int has_offset : 1;

        /* Like in Bifrost */
        unsigned int filter : 1;

        unsigned int in_reg_select : 1;
        unsigned int in_reg_upper  : 1;

        unsigned int in_reg_swizzle_left  : 2;
        unsigned int in_reg_swizzle_right : 2;

        unsigned int unknown1 : 2;
        unsigned int unknown8 : 4;

        unsigned int out_full : 1;

        /* Appears to always be 1 */
        unsigned int unknown7 : 2;

        unsigned int out_reg_select : 1;
        unsigned int out_upper      : 1;

        unsigned int mask : 4;

        unsigned int unknown2 : 2;

        unsigned int swizzle  : 8;
        unsigned int unknown4 : 8;

        unsigned int unknownA : 4;

        unsigned int offset_unknown1   : 1;
        unsigned int offset_reg_select : 1;
        unsigned int offset_reg_upper  : 1;
        unsigned int offset_unknown4   : 1;
        unsigned int offset_unknown5   : 1;
        unsigned int offset_unknown6   : 1;
        unsigned int offset_unknown7   : 1;
        unsigned int offset_unknown8   : 1;
        unsigned int offset_unknown9   : 1;

        unsigned int unknownB : 3;

        /* Texture bias in a fragment shader, LOD in a vertex shader.
         * Computed as int(2^8 * biasf).
         *
         * For texel fetch, this holds the LOD as is. */
        unsigned int bias : 8;

        unsigned int unknown9 : 8;

        unsigned int texture_handle : 16;
        unsigned int sampler_handle : 16;
} midgard_texture_word;
400
401 /* Opcode name table */
402
403 static char *alu_opcode_names[256] = {
404 [midgard_alu_op_fadd] = "fadd",
405 [midgard_alu_op_fmul] = "fmul",
406 [midgard_alu_op_fmin] = "fmin",
407 [midgard_alu_op_fmax] = "fmax",
408 [midgard_alu_op_fmov] = "fmov",
409 [midgard_alu_op_froundeven] = "froundeven",
410 [midgard_alu_op_ftrunc] = "ftrunc",
411 [midgard_alu_op_ffloor] = "ffloor",
412 [midgard_alu_op_fceil] = "fceil",
413 [midgard_alu_op_ffma] = "ffma",
414 [midgard_alu_op_fdot3] = "fdot3",
415 [midgard_alu_op_fdot3r] = "fdot3r",
416 [midgard_alu_op_fdot4] = "fdot4",
417 [midgard_alu_op_freduce] = "freduce",
418 [midgard_alu_op_imin] = "imin",
419 [midgard_alu_op_imax] = "imax",
420 [midgard_alu_op_ishl] = "ishl",
421 [midgard_alu_op_iasr] = "iasr",
422 [midgard_alu_op_ilsr] = "ilsr",
423 [midgard_alu_op_iadd] = "iadd",
424 [midgard_alu_op_ishladd] = "ishladd",
425 [midgard_alu_op_isub] = "isub",
426 [midgard_alu_op_imul] = "imul",
427 [midgard_alu_op_imov] = "imov",
428 [midgard_alu_op_iand] = "iand",
429 [midgard_alu_op_ior] = "ior",
430 [midgard_alu_op_inot] = "inot",
431 [midgard_alu_op_iandnot] = "iandnot",
432 [midgard_alu_op_ixor] = "ixor",
433 [midgard_alu_op_feq] = "feq",
434 [midgard_alu_op_fne] = "fne",
435 [midgard_alu_op_flt] = "flt",
436 [midgard_alu_op_fle] = "fle",
437 [midgard_alu_op_fball_eq] = "fball_eq",
438 [midgard_alu_op_fbany_neq] = "fbany_neq",
439 [midgard_alu_op_bball_eq] = "bball_eq",
440 [midgard_alu_op_bbany_neq] = "bbany_neq",
441 [midgard_alu_op_f2i] = "f2i",
442 [midgard_alu_op_f2u] = "f2u",
443 [midgard_alu_op_f2u8] = "f2u8",
444 [midgard_alu_op_ieq] = "ieq",
445 [midgard_alu_op_ine] = "ine",
446 [midgard_alu_op_ilt] = "ilt",
447 [midgard_alu_op_ile] = "ile",
448 [midgard_alu_op_iball_eq] = "iball_eq",
449 [midgard_alu_op_ball] = "ball",
450 [midgard_alu_op_ibany_neq] = "ibany_neq",
451 [midgard_alu_op_i2f] = "i2f",
452 [midgard_alu_op_u2f] = "u2f",
453 [midgard_alu_op_icsel] = "icsel",
454 [midgard_alu_op_fcsel] = "fcsel",
455 [midgard_alu_op_fround] = "fround",
456 [midgard_alu_op_fatan_pt2] = "fatan_pt2",
457 [midgard_alu_op_frcp] = "frcp",
458 [midgard_alu_op_frsqrt] = "frsqrt",
459 [midgard_alu_op_fsqrt] = "fsqrt",
460 [midgard_alu_op_fexp2] = "fexp2",
461 [midgard_alu_op_flog2] = "flog2",
462 [midgard_alu_op_fsin] = "fsin",
463 [midgard_alu_op_fcos] = "fcos",
464 [midgard_alu_op_fatan2_pt1] = "fatan2_pt1"
465 };
466
467 static char *load_store_opcode_names[256] = {
468 [midgard_op_load_attr_16] = "ld_attr_16",
469 [midgard_op_load_attr_32] = "ld_attr_32",
470 [midgard_op_load_vary_16] = "ld_vary_16",
471 [midgard_op_load_vary_32] = "ld_vary_32",
472 [midgard_op_load_uniform_16] = "ld_uniform_16",
473 [midgard_op_load_uniform_32] = "ld_uniform_32",
474 [midgard_op_load_color_buffer_8] = "ld_color_buffer_8",
475 [midgard_op_load_color_buffer_16] = "ld_color_buffer_16",
476 [midgard_op_store_vary_16] = "st_vary_16",
477 [midgard_op_store_vary_32] = "st_vary_32"
478 };
479
480 #endif