freedreno/ir3: Simpify the immediates from an array of vec4 to array of dwords.
[mesa.git] / src / freedreno / ir3 / ir3_parser.y
1 /*
2 * Copyright (c) 2013 Rob Clark <robclark@freedesktop.org>
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21 * SOFTWARE.
22 */
23
24 %code requires {
25 #include "ir3/ir3_assembler.h"
26
27 struct ir3 * ir3_parse(struct ir3_shader_variant *v,
28 struct ir3_kernel_info *k, FILE *f);
29 }
30
31 %{
32 #define YYDEBUG 0
33
34 #include <stdlib.h>
35 #include <stdio.h>
36 #include <string.h>
37 #include <math.h>
38
39 #include "util/u_math.h"
40
41 #include "ir3/ir3.h"
42 #include "ir3/ir3_shader.h"
43 #include "ir3/instr-a3xx.h"
44
45 #include "ir3_parser.h"
46
47 /* ir3 treats the abs/neg flags as separate flags for float vs integer,
48 * but in the instruction encoding they are the same thing. Tracking
49 * them separately is only for the benefit of ir3 opt passes, and not
50 * required here, so just use the float versions:
51 */
52 #define IR3_REG_ABS IR3_REG_FABS
53 #define IR3_REG_NEGATE IR3_REG_FNEG
54
55 static struct ir3_kernel_info *info;
56 static struct ir3_shader_variant *variant;
57 /* NOTE the assembler doesn't really use the ir3_block construction
58 * like the compiler does. Everything is treated as one large block.
59 * Which might happen to contain flow control. But since we don't
60 * use any of the ir3 backend passes (sched, RA, etc) this doesn't
61 * really matter.
62 */
63 static struct ir3_block *block; /* current shader block */
64 static struct ir3_instruction *instr; /* current instruction */
65
66 static struct {
67 unsigned flags;
68 unsigned repeat;
69 unsigned nop;
70 } iflags;
71
72 static struct {
73 unsigned flags;
74 unsigned wrmask;
75 } rflags;
76
77 int ir3_yyget_lineno(void);
78
79 static struct ir3_instruction * new_instr(opc_t opc)
80 {
81 instr = ir3_instr_create(block, opc);
82 instr->flags = iflags.flags;
83 instr->repeat = iflags.repeat;
84 instr->nop = iflags.nop;
85 instr->line = ir3_yyget_lineno();
86 iflags.flags = iflags.repeat = iflags.nop = 0;
87 return instr;
88 }
89
90 static void new_shader(void)
91 {
92 variant->ir = ir3_create(variant->shader->compiler, variant);
93 block = ir3_block_create(variant->ir);
94 list_addtail(&block->node, &variant->ir->block_list);
95 }
96
97 static type_t parse_type(const char **type)
98 {
99 if (!strncmp("f16", *type, 3)) {
100 *type += 3;
101 return TYPE_F16;
102 } else if (!strncmp("f32", *type, 3)) {
103 *type += 3;
104 return TYPE_F32;
105 } else if (!strncmp("u16", *type, 3)) {
106 *type += 3;
107 return TYPE_U16;
108 } else if (!strncmp("u32", *type, 3)) {
109 *type += 3;
110 return TYPE_U32;
111 } else if (!strncmp("s16", *type, 3)) {
112 *type += 3;
113 return TYPE_S16;
114 } else if (!strncmp("s32", *type, 3)) {
115 *type += 3;
116 return TYPE_S32;
117 } else if (!strncmp("u8", *type, 2)) {
118 *type += 2;
119 return TYPE_U8;
120 } else if (!strncmp("s8", *type, 2)) {
121 *type += 2;
122 return TYPE_S8;
123 } else {
124 assert(0); /* shouldn't get here */
125 return ~0;
126 }
127 }
128
129 static struct ir3_instruction * parse_type_type(struct ir3_instruction *instr,
130 const char *type_type)
131 {
132 instr->cat1.src_type = parse_type(&type_type);
133 instr->cat1.dst_type = parse_type(&type_type);
134 return instr;
135 }
136
137 static struct ir3_register * new_reg(int num, unsigned flags)
138 {
139 struct ir3_register *reg;
140 flags |= rflags.flags;
141 if (num & 0x1)
142 flags |= IR3_REG_HALF;
143 reg = ir3_reg_create(instr, num>>1, flags);
144 reg->wrmask = MAX2(1, rflags.wrmask);
145 rflags.flags = rflags.wrmask = 0;
146 return reg;
147 }
148
149 static struct ir3_register * dummy_dst(void)
150 {
151 return new_reg(0, 0);
152 }
153
154 static void add_const(unsigned reg, unsigned c0, unsigned c1, unsigned c2, unsigned c3)
155 {
156 struct ir3_const_state *const_state = ir3_const_state(variant);
157 assert((reg & 0x7) == 0);
158 int idx = reg >> (1 + 2); /* low bit is half vs full, next two bits are swiz */
159 if (const_state->immediates_count == const_state->immediates_size) {
160 const_state->immediates = rerzalloc(const_state,
161 const_state->immediates,
162 __typeof__(const_state->immediates[0]),
163 const_state->immediates_size,
164 const_state->immediates_size + 4);
165 const_state->immediates_size += 4;
166 }
167 const_state->immediates[idx * 4 + 0] = c0;
168 const_state->immediates[idx * 4 + 1] = c1;
169 const_state->immediates[idx * 4 + 2] = c2;
170 const_state->immediates[idx * 4 + 3] = c3;
171 const_state->immediates_count++;
172 }
173
174 static void add_sysval(unsigned reg, unsigned compmask, gl_system_value sysval)
175 {
176 unsigned n = variant->inputs_count++;
177 variant->inputs[n].regid = reg;
178 variant->inputs[n].sysval = true;
179 variant->inputs[n].slot = sysval;
180 variant->inputs[n].compmask = compmask;
181 variant->inputs[n].interpolate = INTERP_MODE_FLAT;
182 variant->total_in++;
183 }
184
185 #ifdef YYDEBUG
186 int yydebug;
187 #endif
188
189 extern int yylex(void);
190 extern FILE *ir3_yyin;
191 void ir3_yyset_lineno(int _line_number);
192
193 int yyparse(void);
194
195 static void yyerror(const char *error)
196 {
197 fprintf(stderr, "error at line %d: %s\n", ir3_yyget_lineno(), error);
198 }
199
200 struct ir3 * ir3_parse(struct ir3_shader_variant *v,
201 struct ir3_kernel_info *k, FILE *f)
202 {
203 ir3_yyset_lineno(1);
204 ir3_yyin = f;
205 #ifdef YYDEBUG
206 yydebug = 1;
207 #endif
208 info = k;
209 variant = v;
210 if (yyparse()) {
211 ir3_destroy(variant->ir);
212 variant->ir = NULL;
213 }
214 return variant->ir;
215 }
216 %}
217
218 %union {
219 int tok;
220 int num;
221 uint32_t unum;
222 double flt;
223 const char *str;
224 struct ir3_register *reg;
225 struct {
226 int start;
227 int num;
228 } range;
229 type_t type;
230 }
231
232 %{
233 #if YYDEBUG
234 static void print_token(FILE *file, int type, YYSTYPE value)
235 {
236 fprintf(file, "\ntype: %d\n", type);
237 }
238
239 #define YYPRINT(file, type, value) print_token(file, type, value)
240 #endif
241 %}
242
243 %token <num> T_INT
244 %token <unum> T_HEX
245 %token <flt> T_FLOAT
246 %token <str> T_IDENTIFIER
247 %token <num> T_REGISTER
248 %token <num> T_CONSTANT
249
250 /* @ headers (@const/@sampler/@uniform/@varying) */
251 %token <tok> T_A_LOCALSIZE
252 %token <tok> T_A_CONST
253 %token <tok> T_A_BUF
254 %token <tok> T_A_INVOCATIONID
255 %token <tok> T_A_WGID
256 %token <tok> T_A_NUMWG
257 %token <tok> T_A_IN
258 %token <tok> T_A_OUT
259 %token <tok> T_A_TEX
260 /* todo, re-add @sampler/@uniform/@varying if needed someday */
261
262 /* src register flags */
263 %token <tok> T_ABSNEG
264 %token <tok> T_NEG
265 %token <tok> T_ABS
266 %token <tok> T_R
267
268 %token <tok> T_HR
269 %token <tok> T_HC
270
271 /* dst register flags */
272 %token <tok> T_EVEN
273 %token <tok> T_POS_INFINITY
274 %token <tok> T_EI
275 %token <num> T_WRMASK
276
277 /* instruction flags */
278 %token <tok> T_SY
279 %token <tok> T_SS
280 %token <tok> T_JP
281 %token <num> T_RPT
282 %token <tok> T_UL
283 %token <tok> T_NOP
284
285 /* category 0: */
286 %token <tok> T_OP_NOP
287 %token <tok> T_OP_BR
288 %token <tok> T_OP_JUMP
289 %token <tok> T_OP_CALL
290 %token <tok> T_OP_RET
291 %token <tok> T_OP_KILL
292 %token <tok> T_OP_END
293 %token <tok> T_OP_EMIT
294 %token <tok> T_OP_CUT
295 %token <tok> T_OP_CHMASK
296 %token <tok> T_OP_CHSH
297 %token <tok> T_OP_FLOW_REV
298
299 /* category 1: */
300 %token <tok> T_OP_MOVA
301 %token <tok> T_OP_MOV
302 %token <tok> T_OP_COV
303
304 /* category 2: */
305 %token <tok> T_OP_ADD_F
306 %token <tok> T_OP_MIN_F
307 %token <tok> T_OP_MAX_F
308 %token <tok> T_OP_MUL_F
309 %token <tok> T_OP_SIGN_F
310 %token <tok> T_OP_CMPS_F
311 %token <tok> T_OP_ABSNEG_F
312 %token <tok> T_OP_CMPV_F
313 %token <tok> T_OP_FLOOR_F
314 %token <tok> T_OP_CEIL_F
315 %token <tok> T_OP_RNDNE_F
316 %token <tok> T_OP_RNDAZ_F
317 %token <tok> T_OP_TRUNC_F
318 %token <tok> T_OP_ADD_U
319 %token <tok> T_OP_ADD_S
320 %token <tok> T_OP_SUB_U
321 %token <tok> T_OP_SUB_S
322 %token <tok> T_OP_CMPS_U
323 %token <tok> T_OP_CMPS_S
324 %token <tok> T_OP_MIN_U
325 %token <tok> T_OP_MIN_S
326 %token <tok> T_OP_MAX_U
327 %token <tok> T_OP_MAX_S
328 %token <tok> T_OP_ABSNEG_S
329 %token <tok> T_OP_AND_B
330 %token <tok> T_OP_OR_B
331 %token <tok> T_OP_NOT_B
332 %token <tok> T_OP_XOR_B
333 %token <tok> T_OP_CMPV_U
334 %token <tok> T_OP_CMPV_S
335 %token <tok> T_OP_MUL_U24
336 %token <tok> T_OP_MUL_S24
337 %token <tok> T_OP_MULL_U
338 %token <tok> T_OP_BFREV_B
339 %token <tok> T_OP_CLZ_S
340 %token <tok> T_OP_CLZ_B
341 %token <tok> T_OP_SHL_B
342 %token <tok> T_OP_SHR_B
343 %token <tok> T_OP_ASHR_B
344 %token <tok> T_OP_BARY_F
345 %token <tok> T_OP_MGEN_B
346 %token <tok> T_OP_GETBIT_B
347 %token <tok> T_OP_SETRM
348 %token <tok> T_OP_CBITS_B
349 %token <tok> T_OP_SHB
350 %token <tok> T_OP_MSAD
351
352 /* category 3: */
353 %token <tok> T_OP_MAD_U16
354 %token <tok> T_OP_MADSH_U16
355 %token <tok> T_OP_MAD_S16
356 %token <tok> T_OP_MADSH_M16
357 %token <tok> T_OP_MAD_U24
358 %token <tok> T_OP_MAD_S24
359 %token <tok> T_OP_MAD_F16
360 %token <tok> T_OP_MAD_F32
361 %token <tok> T_OP_SEL_B16
362 %token <tok> T_OP_SEL_B32
363 %token <tok> T_OP_SEL_S16
364 %token <tok> T_OP_SEL_S32
365 %token <tok> T_OP_SEL_F16
366 %token <tok> T_OP_SEL_F32
367 %token <tok> T_OP_SAD_S16
368 %token <tok> T_OP_SAD_S32
369
370 /* category 4: */
371 %token <tok> T_OP_RCP
372 %token <tok> T_OP_RSQ
373 %token <tok> T_OP_LOG2
374 %token <tok> T_OP_EXP2
375 %token <tok> T_OP_SIN
376 %token <tok> T_OP_COS
377 %token <tok> T_OP_SQRT
378 %token <tok> T_OP_HRSQ
379 %token <tok> T_OP_HLOG2
380 %token <tok> T_OP_HEXP2
381
382 /* category 5: */
383 %token <tok> T_OP_ISAM
384 %token <tok> T_OP_ISAML
385 %token <tok> T_OP_ISAMM
386 %token <tok> T_OP_SAM
387 %token <tok> T_OP_SAMB
388 %token <tok> T_OP_SAML
389 %token <tok> T_OP_SAMGQ
390 %token <tok> T_OP_GETLOD
391 %token <tok> T_OP_CONV
392 %token <tok> T_OP_CONVM
393 %token <tok> T_OP_GETSIZE
394 %token <tok> T_OP_GETBUF
395 %token <tok> T_OP_GETPOS
396 %token <tok> T_OP_GETINFO
397 %token <tok> T_OP_DSX
398 %token <tok> T_OP_DSY
399 %token <tok> T_OP_GATHER4R
400 %token <tok> T_OP_GATHER4G
401 %token <tok> T_OP_GATHER4B
402 %token <tok> T_OP_GATHER4A
403 %token <tok> T_OP_SAMGP0
404 %token <tok> T_OP_SAMGP1
405 %token <tok> T_OP_SAMGP2
406 %token <tok> T_OP_SAMGP3
407 %token <tok> T_OP_DSXPP_1
408 %token <tok> T_OP_DSYPP_1
409 %token <tok> T_OP_RGETPOS
410 %token <tok> T_OP_RGETINFO
411
412 /* category 6: */
413 %token <tok> T_OP_LDG
414 %token <tok> T_OP_LDL
415 %token <tok> T_OP_LDP
416 %token <tok> T_OP_STG
417 %token <tok> T_OP_STL
418 %token <tok> T_OP_STP
419 %token <tok> T_OP_LDIB
420 %token <tok> T_OP_G2L
421 %token <tok> T_OP_L2G
422 %token <tok> T_OP_PREFETCH
423 %token <tok> T_OP_LDLW
424 %token <tok> T_OP_STLW
425 %token <tok> T_OP_RESFMT
426 %token <tok> T_OP_RESINF
427 %token <tok> T_OP_ATOMIC_ADD
428 %token <tok> T_OP_ATOMIC_SUB
429 %token <tok> T_OP_ATOMIC_XCHG
430 %token <tok> T_OP_ATOMIC_INC
431 %token <tok> T_OP_ATOMIC_DEC
432 %token <tok> T_OP_ATOMIC_CMPXCHG
433 %token <tok> T_OP_ATOMIC_MIN
434 %token <tok> T_OP_ATOMIC_MAX
435 %token <tok> T_OP_ATOMIC_AND
436 %token <tok> T_OP_ATOMIC_OR
437 %token <tok> T_OP_ATOMIC_XOR
438 %token <tok> T_OP_LDGB
439 %token <tok> T_OP_STGB
440 %token <tok> T_OP_STIB
441 %token <tok> T_OP_LDC
442 %token <tok> T_OP_LDLV
443
444 /* type qualifiers: */
445 %token <tok> T_TYPE_F16
446 %token <tok> T_TYPE_F32
447 %token <tok> T_TYPE_U16
448 %token <tok> T_TYPE_U32
449 %token <tok> T_TYPE_S16
450 %token <tok> T_TYPE_S32
451 %token <tok> T_TYPE_U8
452 %token <tok> T_TYPE_S8
453
454 %token <tok> T_UNTYPED
455 %token <tok> T_TYPED
456
457 %token <tok> T_1D
458 %token <tok> T_2D
459 %token <tok> T_3D
460 %token <tok> T_4D
461
462 /* condition qualifiers: */
463 %token <tok> T_LT
464 %token <tok> T_LE
465 %token <tok> T_GT
466 %token <tok> T_GE
467 %token <tok> T_EQ
468 %token <tok> T_NE
469
470 %token <tok> T_S2EN
471 %token <tok> T_SAMP
472 %token <tok> T_TEX
473 %token <tok> T_BASE
474
475 %token <tok> T_NAN
476 %token <tok> T_INF
477 %token <num> T_A0
478 %token <num> T_P0
479 %token <str> T_CAT1_TYPE_TYPE
480
481 %type <num> integer offset
482 %type <flt> float
483 %type <reg> reg const
484 %type <tok> cat1_opc
485 %type <tok> cat2_opc_1src cat2_opc_2src_cnd cat2_opc_2src
486 %type <tok> cat3_opc
487 %type <tok> cat4_opc
488 %type <tok> cat5_opc cat5_samp cat5_tex cat5_type
489 %type <type> type
490 %type <unum> const_val
491
492 %error-verbose
493
494 %start shader
495
496 %%
497
498 shader: { new_shader(); } headers instrs
499
500 headers:
501 | header headers
502
503 header: localsize_header
504 | const_header
505 | buf_header
506 | invocationid_header
507 | wgid_header
508 | numwg_header
509 | in_header
510 | out_header
511 | tex_header
512
513 const_val: T_FLOAT { $$ = fui($1); }
514 | T_INT { $$ = $1; }
515 | '-' T_INT { $$ = -$2; }
516 | T_HEX { $$ = $1; }
517
518 localsize_header: T_A_LOCALSIZE const_val ',' const_val ',' const_val {
519 info->local_size[0] = $2;
520 info->local_size[1] = $4;
521 info->local_size[2] = $6;
522 }
523
524 const_header: T_A_CONST '(' T_CONSTANT ')' const_val ',' const_val ',' const_val ',' const_val {
525 add_const($3, $5, $7, $9, $11);
526 }
527
528 buf_header: T_A_BUF const_val {
529 int idx = info->num_bufs++;
530 assert(idx < MAX_BUFS);
531 info->buf_sizes[idx] = $2;
532 }
533
534 invocationid_header: T_A_INVOCATIONID '(' T_REGISTER ')' {
535 assert(($3 & 0x1) == 0); /* half-reg not allowed */
536 unsigned reg = $3 >> 1;
537 add_sysval(reg, 0x7, SYSTEM_VALUE_LOCAL_INVOCATION_ID);
538 }
539
540 wgid_header: T_A_WGID '(' T_REGISTER ')' {
541 assert(($3 & 0x1) == 0); /* half-reg not allowed */
542 unsigned reg = $3 >> 1;
543 assert(reg >= regid(48, 0)); /* must be a high reg */
544 add_sysval(reg, 0x7, SYSTEM_VALUE_WORK_GROUP_ID);
545 }
546
547 numwg_header: T_A_NUMWG '(' T_CONSTANT ')' {
548 assert(($3 & 0x1) == 0); /* half-reg not allowed */
549 unsigned reg = $3 >> 1;
550 info->numwg = reg;
551 /* reserve space in immediates for the actual value to be plugged in later: */
552 add_const($3, 0, 0, 0, 0);
553 }
554
555 /* Stubs for now */
556 in_header: T_A_IN '(' T_REGISTER ')' T_IDENTIFIER '(' T_IDENTIFIER '=' integer ')' { }
557
558 out_header: T_A_OUT '(' T_REGISTER ')' T_IDENTIFIER '(' T_IDENTIFIER '=' integer ')' { }
559
560 tex_header: T_A_TEX '(' T_REGISTER ')'
561 T_IDENTIFIER '=' integer ',' /* src */
562 T_IDENTIFIER '=' integer ',' /* samp */
563 T_IDENTIFIER '=' integer ',' /* tex */
564 T_IDENTIFIER '=' integer ',' /* wrmask */
565 T_IDENTIFIER '=' integer /* cmd */ { }
566
567 iflag: T_SY { iflags.flags |= IR3_INSTR_SY; }
568 | T_SS { iflags.flags |= IR3_INSTR_SS; }
569 | T_JP { iflags.flags |= IR3_INSTR_JP; }
570 | T_RPT { iflags.repeat = $1; }
571 | T_UL { iflags.flags |= IR3_INSTR_UL; }
572 | T_NOP { iflags.nop = $1; }
573
574 iflags:
575 | iflag iflags
576
577 instrs: instr instrs
578 | instr
579
580 instr: iflags cat0_instr
581 | iflags cat1_instr
582 | iflags cat2_instr
583 | iflags cat3_instr
584 | iflags cat4_instr
585 | iflags cat5_instr
586 | iflags cat6_instr
587
588 cat0_src: '!' T_P0 { instr->cat0.inv = true; instr->cat0.comp = $2 >> 1; }
589 | T_P0 { instr->cat0.comp = $1 >> 1; }
590
591 cat0_immed: '#' integer { instr->cat0.immed = $2; }
592
593 cat0_instr: T_OP_NOP { new_instr(OPC_NOP); }
594 | T_OP_BR { new_instr(OPC_B); } cat0_src ',' cat0_immed
595 | T_OP_JUMP { new_instr(OPC_JUMP); } cat0_immed
596 | T_OP_CALL { new_instr(OPC_CALL); } cat0_immed
597 | T_OP_RET { new_instr(OPC_RET); }
598 | T_OP_KILL { new_instr(OPC_KILL); } cat0_src
599 | T_OP_END { new_instr(OPC_END); }
600 | T_OP_EMIT { new_instr(OPC_EMIT); }
601 | T_OP_CUT { new_instr(OPC_CUT); }
602 | T_OP_CHMASK { new_instr(OPC_CHMASK); }
603 | T_OP_CHSH { new_instr(OPC_CHSH); }
604 | T_OP_FLOW_REV { new_instr(OPC_FLOW_REV); }
605
606 cat1_opc: T_OP_MOVA {
607 new_instr(OPC_MOV);
608 instr->cat1.src_type = TYPE_S16;
609 instr->cat1.dst_type = TYPE_S16;
610 }
611 | T_OP_MOV '.' T_CAT1_TYPE_TYPE {
612 parse_type_type(new_instr(OPC_MOV), $3);
613 }
614 | T_OP_COV '.' T_CAT1_TYPE_TYPE {
615 parse_type_type(new_instr(OPC_MOV), $3);
616 }
617
618 cat1_instr: cat1_opc dst_reg ',' src_reg_or_const_or_rel_or_imm
619
620 cat2_opc_1src: T_OP_ABSNEG_F { new_instr(OPC_ABSNEG_F); }
621 | T_OP_ABSNEG_S { new_instr(OPC_ABSNEG_S); }
622 | T_OP_CLZ_B { new_instr(OPC_CLZ_B); }
623 | T_OP_CLZ_S { new_instr(OPC_CLZ_S); }
624 | T_OP_SIGN_F { new_instr(OPC_SIGN_F); }
625 | T_OP_FLOOR_F { new_instr(OPC_FLOOR_F); }
626 | T_OP_CEIL_F { new_instr(OPC_CEIL_F); }
627 | T_OP_RNDNE_F { new_instr(OPC_RNDNE_F); }
628 | T_OP_RNDAZ_F { new_instr(OPC_RNDAZ_F); }
629 | T_OP_TRUNC_F { new_instr(OPC_TRUNC_F); }
630 | T_OP_NOT_B { new_instr(OPC_NOT_B); }
631 | T_OP_BFREV_B { new_instr(OPC_BFREV_B); }
632 | T_OP_SETRM { new_instr(OPC_SETRM); }
633 | T_OP_CBITS_B { new_instr(OPC_CBITS_B); }
634
635 cat2_opc_2src_cnd: T_OP_CMPS_F { new_instr(OPC_CMPS_F); }
636 | T_OP_CMPS_U { new_instr(OPC_CMPS_U); }
637 | T_OP_CMPS_S { new_instr(OPC_CMPS_S); }
638 | T_OP_CMPV_F { new_instr(OPC_CMPV_F); }
639 | T_OP_CMPV_U { new_instr(OPC_CMPV_U); }
640 | T_OP_CMPV_S { new_instr(OPC_CMPV_S); }
641
642 cat2_opc_2src: T_OP_ADD_F { new_instr(OPC_ADD_F); }
643 | T_OP_MIN_F { new_instr(OPC_MIN_F); }
644 | T_OP_MAX_F { new_instr(OPC_MAX_F); }
645 | T_OP_MUL_F { new_instr(OPC_MUL_F); }
646 | T_OP_ADD_U { new_instr(OPC_ADD_U); }
647 | T_OP_ADD_S { new_instr(OPC_ADD_S); }
648 | T_OP_SUB_U { new_instr(OPC_SUB_U); }
649 | T_OP_SUB_S { new_instr(OPC_SUB_S); }
650 | T_OP_MIN_U { new_instr(OPC_MIN_U); }
651 | T_OP_MIN_S { new_instr(OPC_MIN_S); }
652 | T_OP_MAX_U { new_instr(OPC_MAX_U); }
653 | T_OP_MAX_S { new_instr(OPC_MAX_S); }
654 | T_OP_AND_B { new_instr(OPC_AND_B); }
655 | T_OP_OR_B { new_instr(OPC_OR_B); }
656 | T_OP_XOR_B { new_instr(OPC_XOR_B); }
657 | T_OP_MUL_U24 { new_instr(OPC_MUL_U24); }
658 | T_OP_MUL_S24 { new_instr(OPC_MUL_S24); }
659 | T_OP_MULL_U { new_instr(OPC_MULL_U); }
660 | T_OP_SHL_B { new_instr(OPC_SHL_B); }
661 | T_OP_SHR_B { new_instr(OPC_SHR_B); }
662 | T_OP_ASHR_B { new_instr(OPC_ASHR_B); }
663 | T_OP_BARY_F { new_instr(OPC_BARY_F); }
664 | T_OP_MGEN_B { new_instr(OPC_MGEN_B); }
665 | T_OP_GETBIT_B { new_instr(OPC_GETBIT_B); }
666 | T_OP_SHB { new_instr(OPC_SHB); }
667 | T_OP_MSAD { new_instr(OPC_MSAD); }
668
669 cond: T_LT { instr->cat2.condition = IR3_COND_LT; }
670 | T_LE { instr->cat2.condition = IR3_COND_LE; }
671 | T_GT { instr->cat2.condition = IR3_COND_GT; }
672 | T_GE { instr->cat2.condition = IR3_COND_GE; }
673 | T_EQ { instr->cat2.condition = IR3_COND_EQ; }
674 | T_NE { instr->cat2.condition = IR3_COND_NE; }
675
676 cat2_instr: cat2_opc_1src dst_reg ',' src_reg_or_const_or_rel_or_imm
677 | cat2_opc_2src_cnd '.' cond dst_reg ',' src_reg_or_const_or_rel_or_imm ',' src_reg_or_const_or_rel_or_imm
678 | cat2_opc_2src dst_reg ',' src_reg_or_const_or_rel_or_imm ',' src_reg_or_const_or_rel_or_imm
679
680 cat3_opc: T_OP_MAD_U16 { new_instr(OPC_MAD_U16); }
681 | T_OP_MADSH_U16 { new_instr(OPC_MADSH_U16); }
682 | T_OP_MAD_S16 { new_instr(OPC_MAD_S16); }
683 | T_OP_MADSH_M16 { new_instr(OPC_MADSH_M16); }
684 | T_OP_MAD_U24 { new_instr(OPC_MAD_U24); }
685 | T_OP_MAD_S24 { new_instr(OPC_MAD_S24); }
686 | T_OP_MAD_F16 { new_instr(OPC_MAD_F16); }
687 | T_OP_MAD_F32 { new_instr(OPC_MAD_F32); }
688 | T_OP_SEL_B16 { new_instr(OPC_SEL_B16); }
689 | T_OP_SEL_B32 { new_instr(OPC_SEL_B32); }
690 | T_OP_SEL_S16 { new_instr(OPC_SEL_S16); }
691 | T_OP_SEL_S32 { new_instr(OPC_SEL_S32); }
692 | T_OP_SEL_F16 { new_instr(OPC_SEL_F16); }
693 | T_OP_SEL_F32 { new_instr(OPC_SEL_F32); }
694 | T_OP_SAD_S16 { new_instr(OPC_SAD_S16); }
695 | T_OP_SAD_S32 { new_instr(OPC_SAD_S32); }
696
697 cat3_instr: cat3_opc dst_reg ',' src_reg_or_const_or_rel ',' src_reg_or_const ',' src_reg_or_const_or_rel
698
699 cat4_opc: T_OP_RCP { new_instr(OPC_RCP); }
700 | T_OP_RSQ { new_instr(OPC_RSQ); }
701 | T_OP_LOG2 { new_instr(OPC_LOG2); }
702 | T_OP_EXP2 { new_instr(OPC_EXP2); }
703 | T_OP_SIN { new_instr(OPC_SIN); }
704 | T_OP_COS { new_instr(OPC_COS); }
705 | T_OP_SQRT { new_instr(OPC_SQRT); }
706 | T_OP_HRSQ { new_instr(OPC_HRSQ); }
707 | T_OP_HLOG2 { new_instr(OPC_HLOG2); }
708 | T_OP_HEXP2 { new_instr(OPC_HEXP2); }
709
710 cat4_instr: cat4_opc dst_reg ',' src_reg_or_const_or_rel_or_imm
711
712 cat5_opc_dsxypp: T_OP_DSXPP_1 { new_instr(OPC_DSXPP_1); }
713 | T_OP_DSYPP_1 { new_instr(OPC_DSYPP_1); }
714
715 cat5_opc: T_OP_ISAM { new_instr(OPC_ISAM); }
716 | T_OP_ISAML { new_instr(OPC_ISAML); }
717 | T_OP_ISAMM { new_instr(OPC_ISAMM); }
718 | T_OP_SAM { new_instr(OPC_SAM); }
719 | T_OP_SAMB { new_instr(OPC_SAMB); }
720 | T_OP_SAML { new_instr(OPC_SAML); }
721 | T_OP_SAMGQ { new_instr(OPC_SAMGQ); }
722 | T_OP_GETLOD { new_instr(OPC_GETLOD); }
723 | T_OP_CONV { new_instr(OPC_CONV); }
724 | T_OP_CONVM { new_instr(OPC_CONVM); }
725 | T_OP_GETSIZE { new_instr(OPC_GETSIZE); }
726 | T_OP_GETBUF { new_instr(OPC_GETBUF); }
727 | T_OP_GETPOS { new_instr(OPC_GETPOS); }
728 | T_OP_GETINFO { new_instr(OPC_GETINFO); }
729 | T_OP_DSX { new_instr(OPC_DSX); }
730 | T_OP_DSY { new_instr(OPC_DSY); }
731 | T_OP_GATHER4R { new_instr(OPC_GATHER4R); }
732 | T_OP_GATHER4G { new_instr(OPC_GATHER4G); }
733 | T_OP_GATHER4B { new_instr(OPC_GATHER4B); }
734 | T_OP_GATHER4A { new_instr(OPC_GATHER4A); }
735 | T_OP_SAMGP0 { new_instr(OPC_SAMGP0); }
736 | T_OP_SAMGP1 { new_instr(OPC_SAMGP1); }
737 | T_OP_SAMGP2 { new_instr(OPC_SAMGP2); }
738 | T_OP_SAMGP3 { new_instr(OPC_SAMGP3); }
739 | T_OP_RGETPOS { new_instr(OPC_RGETPOS); }
740 | T_OP_RGETINFO { new_instr(OPC_RGETINFO); }
741
742 cat5_flag: '.' T_3D { instr->flags |= IR3_INSTR_3D; }
743 | '.' 'a' { instr->flags |= IR3_INSTR_A; }
744 | '.' 'o' { instr->flags |= IR3_INSTR_O; }
745 | '.' 'p' { instr->flags |= IR3_INSTR_P; }
746 | '.' 's' { instr->flags |= IR3_INSTR_S; }
747 | '.' T_S2EN { instr->flags |= IR3_INSTR_S2EN; }
748 | '.' T_BASE { instr->flags |= IR3_INSTR_B; instr->cat5.tex_base = $2; }
749 cat5_flags:
750 | cat5_flag cat5_flags
751
752 cat5_samp: T_SAMP { instr->cat5.samp = $1; }
753 cat5_tex: T_TEX { if (instr->flags & IR3_INSTR_B) instr->cat5.samp |= ($1 << 4); else instr->cat5.tex = $1; }
754 cat5_type: '(' type ')' { instr->cat5.type = $2; }
755
756 cat5_instr: cat5_opc_dsxypp cat5_flags dst_reg ',' src_reg
757 | cat5_opc cat5_flags cat5_type dst_reg ',' src_reg ',' src_reg ',' cat5_samp ',' cat5_tex
758 | cat5_opc cat5_flags cat5_type dst_reg ',' src_reg ',' src_reg ',' cat5_samp
759 | cat5_opc cat5_flags cat5_type dst_reg ',' src_reg ',' src_reg ',' cat5_tex
760 | cat5_opc cat5_flags cat5_type dst_reg ',' src_reg ',' src_reg
761 | cat5_opc cat5_flags cat5_type dst_reg ',' src_reg ',' cat5_samp ',' cat5_tex
762 | cat5_opc cat5_flags cat5_type dst_reg ',' src_reg ',' cat5_samp
763 | cat5_opc cat5_flags cat5_type dst_reg ',' src_reg ',' cat5_tex
764 | cat5_opc cat5_flags cat5_type dst_reg ',' src_reg
765 | cat5_opc cat5_flags cat5_type dst_reg ',' cat5_samp ',' cat5_tex
766 | cat5_opc cat5_flags cat5_type dst_reg ',' cat5_samp
767 | cat5_opc cat5_flags cat5_type dst_reg ',' cat5_tex
768 | cat5_opc cat5_flags cat5_type dst_reg
769
770 cat6_typed: '.' T_UNTYPED { instr->cat6.typed = 0; }
771 | '.' T_TYPED { instr->cat6.typed = 1; }
772
773 cat6_dim: '.' T_1D { instr->cat6.d = 1; }
774 | '.' T_2D { instr->cat6.d = 2; }
775 | '.' T_3D { instr->cat6.d = 3; }
776 | '.' T_4D { instr->cat6.d = 4; }
777
778 cat6_type: '.' type { instr->cat6.type = $2; }
779 cat6_offset: offset { instr->cat6.src_offset = $1; }
780 cat6_immed: integer { instr->cat6.iim_val = $1; }
781
782 cat6_load: T_OP_LDG { new_instr(OPC_LDG); } cat6_type dst_reg ',' 'g' '[' reg cat6_offset ']' ',' cat6_immed
783 | T_OP_LDP { new_instr(OPC_LDP); } cat6_type dst_reg ',' 'p' '[' reg cat6_offset ']' ',' cat6_immed
784 | T_OP_LDL { new_instr(OPC_LDL); } cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
785 | T_OP_LDLW { new_instr(OPC_LDLW); } cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
786 | T_OP_LDLV { new_instr(OPC_LDLV); } cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
787
788 // TODO some of the cat6 instructions have different syntax for a6xx..
789 //| T_OP_LDIB { new_instr(OPC_LDIB); } cat6_type dst_reg cat6_offset ',' reg ',' cat6_immed
790
791 cat6_store: T_OP_STG { new_instr(OPC_STG); } cat6_type 'g' '[' dst_reg cat6_offset ']' ',' reg ',' cat6_immed
792 | T_OP_STP { new_instr(OPC_STP); } cat6_type 'p' '[' dst_reg cat6_offset ']' ',' reg ',' cat6_immed
793 | T_OP_STL { new_instr(OPC_STL); } cat6_type 'l' '[' dst_reg cat6_offset ']' ',' reg ',' cat6_immed
794 | T_OP_STLW { new_instr(OPC_STLW); } cat6_type 'l' '[' dst_reg cat6_offset ']' ',' reg ',' cat6_immed
795
796 cat6_storeib: T_OP_STIB { new_instr(OPC_STIB); dummy_dst(); } cat6_typed cat6_dim cat6_type '.' cat6_immed'g' '[' immediate ']' '+' reg ',' reg
797
798 cat6_prefetch: T_OP_PREFETCH { new_instr(OPC_PREFETCH); new_reg(0,0); /* dummy dst */ } 'g' '[' reg cat6_offset ']' ',' cat6_immed
799
800 cat6_atomic_l_g: '.' 'g' { instr->flags |= IR3_INSTR_G; }
801 | '.' 'l' { }
802
803 cat6_atomic: T_OP_ATOMIC_ADD { new_instr(OPC_ATOMIC_ADD); } cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
804 | T_OP_ATOMIC_SUB { new_instr(OPC_ATOMIC_SUB); } cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
805 | T_OP_ATOMIC_XCHG { new_instr(OPC_ATOMIC_XCHG); } cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
806 | T_OP_ATOMIC_INC { new_instr(OPC_ATOMIC_INC); } cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
807 | T_OP_ATOMIC_DEC { new_instr(OPC_ATOMIC_DEC); } cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
808 | T_OP_ATOMIC_CMPXCHG { new_instr(OPC_ATOMIC_CMPXCHG); }cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
809 | T_OP_ATOMIC_MIN { new_instr(OPC_ATOMIC_MIN); } cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
810 | T_OP_ATOMIC_MAX { new_instr(OPC_ATOMIC_MAX); } cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
811 | T_OP_ATOMIC_AND { new_instr(OPC_ATOMIC_AND); } cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
812 | T_OP_ATOMIC_OR { new_instr(OPC_ATOMIC_OR); } cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
813 | T_OP_ATOMIC_XOR { new_instr(OPC_ATOMIC_XOR); } cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
814
815 cat6_todo: T_OP_G2L { new_instr(OPC_G2L); }
816 | T_OP_L2G { new_instr(OPC_L2G); }
817 | T_OP_RESFMT { new_instr(OPC_RESFMT); }
818 | T_OP_RESINF { new_instr(OPC_RESINFO); }
819 | T_OP_LDGB { new_instr(OPC_LDGB); }
820 | T_OP_STGB { new_instr(OPC_STGB); }
821 | T_OP_LDC { new_instr(OPC_LDC); }
822
823 cat6_instr: cat6_load
824 | cat6_store
825 | cat6_storeib
826 | cat6_prefetch
827 | cat6_atomic
828 | cat6_todo
829
830 reg: T_REGISTER { $$ = new_reg($1, 0); }
831 | T_A0 { $$ = new_reg((61 << 3) + $1, IR3_REG_HALF); }
832 | T_P0 { $$ = new_reg((62 << 3) + $1, 0); }
833
834 const: T_CONSTANT { $$ = new_reg($1, IR3_REG_CONST); }
835
836 dst_reg_flag: T_EVEN { rflags.flags |= IR3_REG_EVEN; }
837 | T_POS_INFINITY { rflags.flags |= IR3_REG_POS_INF; }
838 | T_EI { rflags.flags |= IR3_REG_EI; }
839 | T_WRMASK { rflags.wrmask = $1; }
840
841 dst_reg_flags: dst_reg_flag
842 | dst_reg_flag dst_reg_flags
843
844 /* note: destination registers are always incremented in repeat */
845 dst_reg: reg { $1->flags |= IR3_REG_R; }
846 | dst_reg_flags reg { $2->flags |= IR3_REG_R; }
847
848 src_reg_flag: T_ABSNEG { rflags.flags |= IR3_REG_ABS|IR3_REG_NEGATE; }
849 | T_NEG { rflags.flags |= IR3_REG_NEGATE; }
850 | T_ABS { rflags.flags |= IR3_REG_ABS; }
851 | T_R { rflags.flags |= IR3_REG_R; }
852
853 src_reg_flags: src_reg_flag
854 | src_reg_flag src_reg_flags
855
856 src_reg: reg
857 | src_reg_flags reg
858
859 src_const: const
860 | src_reg_flags const
861
862 src_reg_or_const: src_reg
863 | src_const
864
865 src_reg_or_const_or_rel: src_reg_or_const
866 | relative
867
868 src_reg_or_const_or_rel_or_imm: src_reg_or_const_or_rel
869 | src_reg_flags immediate
870 | immediate
871
872 offset: { $$ = 0; }
873 | '+' integer { $$ = $2; }
874 | '-' integer { $$ = -$2; }
875
876 relative: 'r' '<' T_A0 offset '>' { new_reg(0, IR3_REG_RELATIV)->array.offset = $4; }
877 | 'c' '<' T_A0 offset '>' { new_reg(0, IR3_REG_RELATIV | IR3_REG_CONST)->array.offset = $4; }
878 | T_HR '<' T_A0 offset '>' { new_reg(0, IR3_REG_RELATIV | IR3_REG_HALF)->array.offset = $4; }
879 | T_HC '<' T_A0 offset '>' { new_reg(0, IR3_REG_RELATIV | IR3_REG_CONST | IR3_REG_HALF)->array.offset = $4; }
880
881 immediate: integer { new_reg(0, IR3_REG_IMMED)->iim_val = $1; }
882 | '(' integer ')' { new_reg(0, IR3_REG_IMMED)->fim_val = $2; }
883 | '(' float ')' { new_reg(0, IR3_REG_IMMED)->fim_val = $2; }
884 | '(' T_NAN ')' { new_reg(0, IR3_REG_IMMED)->fim_val = NAN; }
885 | '(' T_INF ')' { new_reg(0, IR3_REG_IMMED)->fim_val = INFINITY; }
886
887 integer: T_INT { $$ = $1; }
888 | '-' T_INT { $$ = -$2; }
889 | T_HEX { $$ = $1; }
890 | '-' T_HEX { $$ = -$2; }
891
892 float: T_FLOAT { $$ = $1; }
893 | '-' T_FLOAT { $$ = -$2; }
894
895 type: T_TYPE_F16 { $$ = TYPE_F16; }
896 | T_TYPE_F32 { $$ = TYPE_F32; }
897 | T_TYPE_U16 { $$ = TYPE_U16; }
898 | T_TYPE_U32 { $$ = TYPE_U32; }
899 | T_TYPE_S16 { $$ = TYPE_S16; }
900 | T_TYPE_S32 { $$ = TYPE_S32; }
901 | T_TYPE_U8 { $$ = TYPE_U8; }
902 | T_TYPE_S8 { $$ = TYPE_S8; }