For easier reuse.
Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/4741>
*/
#include "ir3/ir3_compiler.h"
+#include "ir3/ir3_parser.h"
#include "ir3_asm.h"
-#include "ir3_parser.h"
struct ir3_kernel *
ir3_asm_assemble(struct ir3_compiler *c, FILE *in)
#include "main.h"
#include "ir3/ir3_shader.h"
-#include "ir3_parser.h"
+#include "ir3/ir3_parser.h"
struct ir3_kernel {
struct kernel base;
+++ /dev/null
-/*
- * Copyright (c) 2013 Rob Clark <robclark@freedesktop.org>
- *
- * Permission is hereby granted, free of charge, to any person obtaining a
- * copy of this software and associated documentation files (the "Software"),
- * to deal in the Software without restriction, including without limitation
- * the rights to use, copy, modify, merge, publish, distribute, sublicense,
- * and/or sell copies of the Software, and to permit persons to whom the
- * Software is furnished to do so, subject to the following conditions:
- *
- * The above copyright notice and this permission notice (including the next
- * paragraph) shall be included in all copies or substantial portions of the
- * Software.
- *
- * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
- * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
- * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
- * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
- * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
- * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
- * SOFTWARE.
- */
-
-%{
-#include <stdlib.h>
-#include "ir3/ir3.h"
-#include "ir3_parser.h"
-
-#define YY_NO_INPUT
-#define YY_NO_UNPUT
-#define TOKEN(t) (ir3_yylval.tok = t)
-extern YYSTYPE ir3_yylval;
-
-static int parse_wrmask(const char *src)
-{
- int i, num = 0;
- for (i = 0; i < 4; i++) {
- if ("xyzw"[i] == src[1]) {
- num |= (1 << i);
- src++;
- }
- }
- return num;
-}
-
-static int parse_reg(const char *str)
-{
- int num = 0;
- if (str[0] == 'h') {
- str++;
- num++;
- }
- str++;
- num += strtol(str, (char **)&str, 10) << 3;
- switch (str[1]) {
- case 'x': num += 0; break;
- case 'y': num += 2; break;
- case 'z': num += 4; break;
- case 'w': num += 6; break;
- default: assert(0); break;
- }
- return num;
-}
-%}
-
-%option noyywrap
-%option prefix="ir3_yy"
-
-%%
-"\n" yylineno++;
-[ \t] ; /* ignore whitespace */
-";"[^\n]*"\n" yylineno++; /* ignore comments */
-[0-9]+"."[0-9]+ ir3_yylval.flt = strtod(yytext, NULL); return T_FLOAT;
-[0-9]* ir3_yylval.num = strtoul(yytext, NULL, 0); return T_INT;
-"0x"[0-9a-fA-F]* ir3_yylval.num = strtoul(yytext, NULL, 0); return T_HEX;
-"@localsize" return TOKEN(T_A_LOCALSIZE);
-"@const" return TOKEN(T_A_CONST);
-"@buf" return TOKEN(T_A_BUF);
-"@invocationid" return TOKEN(T_A_INVOCATIONID);
-"@wgid" return TOKEN(T_A_WGID);
-"@numwg" return TOKEN(T_A_NUMWG);
-"(sy)" return TOKEN(T_SY);
-"(ss)" return TOKEN(T_SS);
-"(absneg)" return TOKEN(T_ABSNEG);
-"(neg)" return TOKEN(T_NEG);
-"(abs)" return TOKEN(T_ABS);
-"(r)" return TOKEN(T_R);
-"(ul)" return TOKEN(T_UL);
-"(even)" return TOKEN(T_EVEN);
-"(pos_infinity)" return TOKEN(T_POS_INFINITY);
-"(ei)" return TOKEN(T_EI);
-"(jp)" return TOKEN(T_JP);
-"(rpt"[0-7]")" ir3_yylval.num = strtol(yytext+4, NULL, 10); return T_RPT;
-"(nop"[0-7]")" ir3_yylval.num = strtol(yytext+4, NULL, 10); return T_NOP;
-"("[x]?[y]?[z]?[w]?")" ir3_yylval.num = parse_wrmask(yytext); return T_WRMASK;
-
-[h]?"r"[0-9]+"."[xyzw] ir3_yylval.num = parse_reg(yytext); return T_REGISTER;
-[h]?"c"[0-9]+"."[xyzw] ir3_yylval.num = parse_reg(yytext); return T_CONSTANT;
-"a0."[xyzw] ir3_yylval.num = parse_reg(yytext); return T_A0;
-"p0."[xyzw] ir3_yylval.num = parse_reg(yytext); return T_P0;
-"s#"[0-9]+ ir3_yylval.num = strtol(yytext+2, NULL, 10); return T_SAMP;
-"t#"[0-9]+ ir3_yylval.num = strtol(yytext+2, NULL, 10); return T_TEX;
-
- /* category 0: */
-"nop" return TOKEN(T_OP_NOP);
-"br" return TOKEN(T_OP_BR);
-"jump" return TOKEN(T_OP_JUMP);
-"call" return TOKEN(T_OP_CALL);
-"ret" return TOKEN(T_OP_RET);
-"kill" return TOKEN(T_OP_KILL);
-"end" return TOKEN(T_OP_END);
-"emit" return TOKEN(T_OP_EMIT);
-"cut" return TOKEN(T_OP_CUT);
-"chmask" return TOKEN(T_OP_CHMASK);
-"chsh" return TOKEN(T_OP_CHSH);
-"flow_rev" return TOKEN(T_OP_FLOW_REV);
-
- /* category 1: */
-"mova" return TOKEN(T_OP_MOVA);
-"mov" return TOKEN(T_OP_MOV);
-"cov" return TOKEN(T_OP_COV);
-
-("f16"|"f32"|"u16"|"u32"|"s16"|"s32"|"u8"|"s8"){2} ir3_yylval.str = yytext; return T_CAT1_TYPE_TYPE;
-
- /* category 2: */
-"add.f" return TOKEN(T_OP_ADD_F);
-"min.f" return TOKEN(T_OP_MIN_F);
-"max.f" return TOKEN(T_OP_MAX_F);
-"mul.f" return TOKEN(T_OP_MUL_F);
-"sign.f" return TOKEN(T_OP_SIGN_F);
-"cmps.f" return TOKEN(T_OP_CMPS_F);
-"absneg.f" return TOKEN(T_OP_ABSNEG_F);
-"cmpv.f" return TOKEN(T_OP_CMPV_F);
-"floor.f" return TOKEN(T_OP_FLOOR_F);
-"ceil.f" return TOKEN(T_OP_CEIL_F);
-"rndne.f" return TOKEN(T_OP_RNDNE_F);
-"rndaz.f" return TOKEN(T_OP_RNDAZ_F);
-"trunc.f" return TOKEN(T_OP_TRUNC_F);
-"add.u" return TOKEN(T_OP_ADD_U);
-"add.s" return TOKEN(T_OP_ADD_S);
-"sub.u" return TOKEN(T_OP_SUB_U);
-"sub.s" return TOKEN(T_OP_SUB_S);
-"cmps.u" return TOKEN(T_OP_CMPS_U);
-"cmps.s" return TOKEN(T_OP_CMPS_S);
-"min.u" return TOKEN(T_OP_MIN_U);
-"min.s" return TOKEN(T_OP_MIN_S);
-"max.u" return TOKEN(T_OP_MAX_U);
-"max.s" return TOKEN(T_OP_MAX_S);
-"absneg.s" return TOKEN(T_OP_ABSNEG_S);
-"and.b" return TOKEN(T_OP_AND_B);
-"or.b" return TOKEN(T_OP_OR_B);
-"not.b" return TOKEN(T_OP_NOT_B);
-"xor.b" return TOKEN(T_OP_XOR_B);
-"cmpv.u" return TOKEN(T_OP_CMPV_U);
-"cmpv.s" return TOKEN(T_OP_CMPV_S);
-"mul.u24" return TOKEN(T_OP_MUL_U24);
-"mul.s24" return TOKEN(T_OP_MUL_S24);
-"mull.u" return TOKEN(T_OP_MULL_U);
-"bfrev.b" return TOKEN(T_OP_BFREV_B);
-"clz.s" return TOKEN(T_OP_CLZ_S);
-"clz.b" return TOKEN(T_OP_CLZ_B);
-"shl.b" return TOKEN(T_OP_SHL_B);
-"shr.b" return TOKEN(T_OP_SHR_B);
-"ashr.b" return TOKEN(T_OP_ASHR_B);
-"bary.f" return TOKEN(T_OP_BARY_F);
-"mgen.b" return TOKEN(T_OP_MGEN_B);
-"getbit.b" return TOKEN(T_OP_GETBIT_B);
-"setrm" return TOKEN(T_OP_SETRM);
-"cbits.b" return TOKEN(T_OP_CBITS_B);
-"shb" return TOKEN(T_OP_SHB);
-"msad" return TOKEN(T_OP_MSAD);
-
- /* category 3: */
-"mad.u16" return TOKEN(T_OP_MAD_U16);
-"madsh.u16" return TOKEN(T_OP_MADSH_U16);
-"mad.s16" return TOKEN(T_OP_MAD_S16);
-"madsh.m16" return TOKEN(T_OP_MADSH_M16);
-"mad.u24" return TOKEN(T_OP_MAD_U24);
-"mad.s24" return TOKEN(T_OP_MAD_S24);
-"mad.f16" return TOKEN(T_OP_MAD_F16);
-"mad.f32" return TOKEN(T_OP_MAD_F32);
-"sel.b16" return TOKEN(T_OP_SEL_B16);
-"sel.b32" return TOKEN(T_OP_SEL_B32);
-"sel.s16" return TOKEN(T_OP_SEL_S16);
-"sel.s32" return TOKEN(T_OP_SEL_S32);
-"sel.f16" return TOKEN(T_OP_SEL_F16);
-"sel.f32" return TOKEN(T_OP_SEL_F32);
-"sad.s16" return TOKEN(T_OP_SAD_S16);
-"sad.s32" return TOKEN(T_OP_SAD_S32);
-
- /* category 4: */
-"rcp" return TOKEN(T_OP_RCP);
-"rsq" return TOKEN(T_OP_RSQ);
-"log2" return TOKEN(T_OP_LOG2);
-"exp2" return TOKEN(T_OP_EXP2);
-"sin" return TOKEN(T_OP_SIN);
-"cos" return TOKEN(T_OP_COS);
-"sqrt" return TOKEN(T_OP_SQRT);
-"hrsq" return TOKEN(T_OP_HRSQ);
-"hlog2" return TOKEN(T_OP_HLOG2);
-"hexp2" return TOKEN(T_OP_HEXP2);
-
- /* category 5: */
-"isam" return TOKEN(T_OP_ISAM);
-"isaml" return TOKEN(T_OP_ISAML);
-"isamm" return TOKEN(T_OP_ISAMM);
-"sam" return TOKEN(T_OP_SAM);
-"samb" return TOKEN(T_OP_SAMB);
-"saml" return TOKEN(T_OP_SAML);
-"samgq" return TOKEN(T_OP_SAMGQ);
-"getlod" return TOKEN(T_OP_GETLOD);
-"conv" return TOKEN(T_OP_CONV);
-"convm" return TOKEN(T_OP_CONVM);
-"getsize" return TOKEN(T_OP_GETSIZE);
-"getbuf" return TOKEN(T_OP_GETBUF);
-"getpos" return TOKEN(T_OP_GETPOS);
-"getinfo" return TOKEN(T_OP_GETINFO);
-"dsx" return TOKEN(T_OP_DSX);
-"dsy" return TOKEN(T_OP_DSY);
-"gather4r" return TOKEN(T_OP_GATHER4R);
-"gather4g" return TOKEN(T_OP_GATHER4G);
-"gather4b" return TOKEN(T_OP_GATHER4B);
-"gather4a" return TOKEN(T_OP_GATHER4A);
-"samgp0" return TOKEN(T_OP_SAMGP0);
-"samgp1" return TOKEN(T_OP_SAMGP1);
-"samgp2" return TOKEN(T_OP_SAMGP2);
-"samgp3" return TOKEN(T_OP_SAMGP3);
-"dsxpp.1" return TOKEN(T_OP_DSXPP_1);
-"dsypp.1" return TOKEN(T_OP_DSYPP_1);
-"rgetpos" return TOKEN(T_OP_RGETPOS);
-"rgetinfo" return TOKEN(T_OP_RGETINFO);
-
- /* category 6: */
-"ldg" return TOKEN(T_OP_LDG);
-"ldl" return TOKEN(T_OP_LDL);
-"ldp" return TOKEN(T_OP_LDP);
-"stg" return TOKEN(T_OP_STG);
-"stl" return TOKEN(T_OP_STL);
-"stp" return TOKEN(T_OP_STP);
-"ldib" return TOKEN(T_OP_LDIB);
-"g2l" return TOKEN(T_OP_G2L);
-"l2g" return TOKEN(T_OP_L2G);
-"prefetch" return TOKEN(T_OP_PREFETCH);
-"ldlw" return TOKEN(T_OP_LDLW);
-"stlw" return TOKEN(T_OP_STLW);
-"resfmt" return TOKEN(T_OP_RESFMT);
-"resinf" return TOKEN(T_OP_RESINF);
-"atomic.add" return TOKEN(T_OP_ATOMIC_ADD);
-"atomic.sub" return TOKEN(T_OP_ATOMIC_SUB);
-"atomic.xchg" return TOKEN(T_OP_ATOMIC_XCHG);
-"atomic.inc" return TOKEN(T_OP_ATOMIC_INC);
-"atomic.dec" return TOKEN(T_OP_ATOMIC_DEC);
-"atomic.cmpxchg" return TOKEN(T_OP_ATOMIC_CMPXCHG);
-"atomic.min" return TOKEN(T_OP_ATOMIC_MIN);
-"atomic.max" return TOKEN(T_OP_ATOMIC_MAX);
-"atomic.and" return TOKEN(T_OP_ATOMIC_AND);
-"atomic.or" return TOKEN(T_OP_ATOMIC_OR);
-"atomic.xor" return TOKEN(T_OP_ATOMIC_XOR);
-"ldgb" return TOKEN(T_OP_LDGB);
-"stgb" return TOKEN(T_OP_STGB);
-"stib" return TOKEN(T_OP_STIB);
-"ldc" return TOKEN(T_OP_LDC);
-"ldlv" return TOKEN(T_OP_LDLV);
-
-"f16" return TOKEN(T_TYPE_F16);
-"f32" return TOKEN(T_TYPE_F32);
-"u16" return TOKEN(T_TYPE_U16);
-"u32" return TOKEN(T_TYPE_U32);
-"s16" return TOKEN(T_TYPE_S16);
-"s32" return TOKEN(T_TYPE_S32);
-"u8" return TOKEN(T_TYPE_U8);
-"s8" return TOKEN(T_TYPE_S8);
-
-"untyped" return TOKEN(T_UNTYPED);
-"typed" return TOKEN(T_TYPED);
-
-"1d" return TOKEN(T_1D);
-"2d" return TOKEN(T_2D);
-"3d" return TOKEN(T_3D);
-"4d" return TOKEN(T_4D);
-
-"lt" return TOKEN(T_LT);
-"le" return TOKEN(T_LE);
-"gt" return TOKEN(T_GT);
-"ge" return TOKEN(T_GE);
-"eq" return TOKEN(T_EQ);
-"ne" return TOKEN(T_NE);
-
-"a" return 'a';
-"o" return 'o';
-"p" return 'p';
-"s2en" return TOKEN(T_S2EN);
-"s" return 's';
-"base"[0-9]+ ir3_yylval.num = strtol(yytext+4, NULL, 10); return T_BASE;
-
-"=" return '=';
-"(" return '(';
-")" return ')';
-"[" return '[';
-"]" return ']';
-"," return ',';
-"." return '.';
-"-" return '-';
-"+" return '+';
-"|" return '|';
-"c" return 'c';
-"r" return 'r';
-"g" return 'g';
-"l" return 'l';
-"<" return '<';
-">" return '>';
-"!" return '!';
-"#" return '#';
-
-"nan" return TOKEN(T_NAN);
-"inf" return TOKEN(T_INF);
-
-[a-zA-Z_][a-zA-Z_0-9]* ir3_yylval.str = yytext; return T_IDENTIFIER;
-. fprintf(stderr, "error at line %d: Unknown token: %s\n", ir3_yyget_lineno(), yytext); yyterminate();
-%%
+++ /dev/null
-/*
- * Copyright (c) 2013 Rob Clark <robclark@freedesktop.org>
- *
- * Permission is hereby granted, free of charge, to any person obtaining a
- * copy of this software and associated documentation files (the "Software"),
- * to deal in the Software without restriction, including without limitation
- * the rights to use, copy, modify, merge, publish, distribute, sublicense,
- * and/or sell copies of the Software, and to permit persons to whom the
- * Software is furnished to do so, subject to the following conditions:
- *
- * The above copyright notice and this permission notice (including the next
- * paragraph) shall be included in all copies or substantial portions of the
- * Software.
- *
- * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
- * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
- * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
- * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
- * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
- * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
- * SOFTWARE.
- */
-
-%code requires {
-
-#define MAX_BUFS 4
-
-struct ir3_kernel_info {
- uint32_t local_size[3];
- uint32_t num_bufs;
- uint32_t buf_sizes[MAX_BUFS]; /* size in dwords */
-
- /* driver-param uniforms: */
- unsigned numwg;
-};
-
-struct ir3 * ir3_parse(struct ir3_shader_variant *v,
- struct ir3_kernel_info *k, FILE *f);
-}
-
-%{
-#define YYDEBUG 0
-
-#include <stdlib.h>
-#include <stdio.h>
-#include <string.h>
-#include <math.h>
-
-#include "util/u_math.h"
-
-#include "ir3/ir3.h"
-#include "ir3/ir3_shader.h"
-#include "ir3/instr-a3xx.h"
-
-#include "ir3_parser.h"
-
-/* ir3 treats the abs/neg flags as separate flags for float vs integer,
- * but in the instruction encoding they are the same thing. Tracking
- * them separately is only for the benefit of ir3 opt passes, and not
- * required here, so just use the float versions:
- */
-#define IR3_REG_ABS IR3_REG_FABS
-#define IR3_REG_NEGATE IR3_REG_FNEG
-
-static struct ir3_kernel_info *info;
-static struct ir3_shader_variant *variant;
-/* NOTE the assembler doesn't really use the ir3_block construction
- * like the compiler does. Everything is treated as one large block.
- * Which might happen to contain flow control. But since we don't
- * use any of the ir3 backend passes (sched, RA, etc) this doesn't
- * really matter.
- */
-static struct ir3_block *block; /* current shader block */
-static struct ir3_instruction *instr; /* current instruction */
-
-static struct {
- unsigned flags;
- unsigned repeat;
- unsigned nop;
-} iflags;
-
-static struct {
- unsigned flags;
- unsigned wrmask;
-} rflags;
-
-int ir3_yyget_lineno(void);
-
-static struct ir3_instruction * new_instr(opc_t opc)
-{
- instr = ir3_instr_create(block, opc);
- instr->flags = iflags.flags;
- instr->repeat = iflags.repeat;
- instr->nop = iflags.nop;
- instr->line = ir3_yyget_lineno();
- iflags.flags = iflags.repeat = iflags.nop = 0;
- return instr;
-}
-
-static void new_shader(void)
-{
- variant->ir = ir3_create(variant->shader->compiler, variant->shader->type);
- block = ir3_block_create(variant->ir);
- list_addtail(&block->node, &variant->ir->block_list);
-}
-
-static type_t parse_type(const char **type)
-{
- if (!strncmp("f16", *type, 3)) {
- *type += 3;
- return TYPE_F16;
- } else if (!strncmp("f32", *type, 3)) {
- *type += 3;
- return TYPE_F32;
- } else if (!strncmp("u16", *type, 3)) {
- *type += 3;
- return TYPE_U16;
- } else if (!strncmp("u32", *type, 3)) {
- *type += 3;
- return TYPE_U32;
- } else if (!strncmp("s16", *type, 3)) {
- *type += 3;
- return TYPE_S16;
- } else if (!strncmp("s32", *type, 3)) {
- *type += 3;
- return TYPE_S32;
- } else if (!strncmp("u8", *type, 2)) {
- *type += 2;
- return TYPE_U8;
- } else if (!strncmp("s8", *type, 2)) {
- *type += 2;
- return TYPE_S8;
- } else {
- assert(0); /* shouldn't get here */
- return ~0;
- }
-}
-
-static struct ir3_instruction * parse_type_type(struct ir3_instruction *instr,
- const char *type_type)
-{
- instr->cat1.src_type = parse_type(&type_type);
- instr->cat1.dst_type = parse_type(&type_type);
- return instr;
-}
-
-static struct ir3_register * new_reg(int num, unsigned flags)
-{
- struct ir3_register *reg;
- flags |= rflags.flags;
- if (num & 0x1)
- flags |= IR3_REG_HALF;
- reg = ir3_reg_create(instr, num>>1, flags);
- reg->wrmask = MAX2(1, rflags.wrmask);
- rflags.flags = rflags.wrmask = 0;
- return reg;
-}
-
-static struct ir3_register * dummy_dst(void)
-{
- return new_reg(0, 0);
-}
-
-static void add_const(unsigned reg, unsigned c0, unsigned c1, unsigned c2, unsigned c3)
-{
- struct ir3_const_state *const_state = &variant->shader->const_state;
- assert((reg & 0x7) == 0);
- int idx = reg >> (1 + 2); /* low bit is half vs full, next two bits are swiz */
- if (const_state->immediate_idx == const_state->immediates_size * 4) {
- const_state->immediates_size += 4;
- const_state->immediates = realloc (const_state->immediates,
- const_state->immediates_size * sizeof(const_state->immediates[0]));
- }
- const_state->immediates[idx].val[0] = c0;
- const_state->immediates[idx].val[1] = c1;
- const_state->immediates[idx].val[2] = c2;
- const_state->immediates[idx].val[3] = c3;
- const_state->immediates_count = idx + 1;
- const_state->immediate_idx++;
-}
-
-static void add_sysval(unsigned reg, unsigned compmask, gl_system_value sysval)
-{
- unsigned n = variant->inputs_count++;
- variant->inputs[n].regid = reg;
- variant->inputs[n].sysval = true;
- variant->inputs[n].slot = sysval;
- variant->inputs[n].compmask = compmask;
- variant->inputs[n].interpolate = INTERP_MODE_FLAT;
- variant->total_in++;
-}
-
-#ifdef YYDEBUG
-int yydebug;
-#endif
-
-extern int yylex(void);
-extern FILE *ir3_yyin;
-
-int yyparse(void);
-
-static void yyerror(const char *error)
-{
- fprintf(stderr, "error at line %d: %s\n", ir3_yyget_lineno(), error);
-}
-
-struct ir3 * ir3_parse(struct ir3_shader_variant *v,
- struct ir3_kernel_info *k, FILE *f)
-{
- ir3_yyin = f;
-#ifdef YYDEBUG
- yydebug = 1;
-#endif
- info = k;
- variant = v;
- if (yyparse()) {
- ir3_destroy(variant->ir);
- variant->ir = NULL;
- }
- return variant->ir;
-}
-%}
-
-%union {
- int tok;
- int num;
- uint32_t unum;
- double flt;
- const char *str;
- struct ir3_register *reg;
- struct {
- int start;
- int num;
- } range;
- type_t type;
-}
-
-%{
-#if YYDEBUG
-static void print_token(FILE *file, int type, YYSTYPE value)
-{
- fprintf(file, "\ntype: %d\n", type);
-}
-
-#define YYPRINT(file, type, value) print_token(file, type, value)
-#endif
-%}
-
-%token <num> T_INT
-%token <unum> T_HEX
-%token <flt> T_FLOAT
-%token <str> T_IDENTIFIER
-%token <num> T_REGISTER
-%token <num> T_CONSTANT
-
-/* @ headers (@const/@sampler/@uniform/@varying) */
-%token <tok> T_A_LOCALSIZE
-%token <tok> T_A_CONST
-%token <tok> T_A_BUF
-%token <tok> T_A_INVOCATIONID
-%token <tok> T_A_WGID
-%token <tok> T_A_NUMWG
-/* todo, re-add @sampler/@uniform/@varying if needed someday */
-
-/* src register flags */
-%token <tok> T_ABSNEG
-%token <tok> T_NEG
-%token <tok> T_ABS
-%token <tok> T_R
-
-/* dst register flags */
-%token <tok> T_EVEN
-%token <tok> T_POS_INFINITY
-%token <tok> T_EI
-%token <num> T_WRMASK
-
-/* instruction flags */
-%token <tok> T_SY
-%token <tok> T_SS
-%token <tok> T_JP
-%token <num> T_RPT
-%token <tok> T_UL
-%token <tok> T_NOP
-
-/* category 0: */
-%token <tok> T_OP_NOP
-%token <tok> T_OP_BR
-%token <tok> T_OP_JUMP
-%token <tok> T_OP_CALL
-%token <tok> T_OP_RET
-%token <tok> T_OP_KILL
-%token <tok> T_OP_END
-%token <tok> T_OP_EMIT
-%token <tok> T_OP_CUT
-%token <tok> T_OP_CHMASK
-%token <tok> T_OP_CHSH
-%token <tok> T_OP_FLOW_REV
-
-/* category 1: */
-%token <tok> T_OP_MOVA
-%token <tok> T_OP_MOV
-%token <tok> T_OP_COV
-
-/* category 2: */
-%token <tok> T_OP_ADD_F
-%token <tok> T_OP_MIN_F
-%token <tok> T_OP_MAX_F
-%token <tok> T_OP_MUL_F
-%token <tok> T_OP_SIGN_F
-%token <tok> T_OP_CMPS_F
-%token <tok> T_OP_ABSNEG_F
-%token <tok> T_OP_CMPV_F
-%token <tok> T_OP_FLOOR_F
-%token <tok> T_OP_CEIL_F
-%token <tok> T_OP_RNDNE_F
-%token <tok> T_OP_RNDAZ_F
-%token <tok> T_OP_TRUNC_F
-%token <tok> T_OP_ADD_U
-%token <tok> T_OP_ADD_S
-%token <tok> T_OP_SUB_U
-%token <tok> T_OP_SUB_S
-%token <tok> T_OP_CMPS_U
-%token <tok> T_OP_CMPS_S
-%token <tok> T_OP_MIN_U
-%token <tok> T_OP_MIN_S
-%token <tok> T_OP_MAX_U
-%token <tok> T_OP_MAX_S
-%token <tok> T_OP_ABSNEG_S
-%token <tok> T_OP_AND_B
-%token <tok> T_OP_OR_B
-%token <tok> T_OP_NOT_B
-%token <tok> T_OP_XOR_B
-%token <tok> T_OP_CMPV_U
-%token <tok> T_OP_CMPV_S
-%token <tok> T_OP_MUL_U24
-%token <tok> T_OP_MUL_S24
-%token <tok> T_OP_MULL_U
-%token <tok> T_OP_BFREV_B
-%token <tok> T_OP_CLZ_S
-%token <tok> T_OP_CLZ_B
-%token <tok> T_OP_SHL_B
-%token <tok> T_OP_SHR_B
-%token <tok> T_OP_ASHR_B
-%token <tok> T_OP_BARY_F
-%token <tok> T_OP_MGEN_B
-%token <tok> T_OP_GETBIT_B
-%token <tok> T_OP_SETRM
-%token <tok> T_OP_CBITS_B
-%token <tok> T_OP_SHB
-%token <tok> T_OP_MSAD
-
-/* category 3: */
-%token <tok> T_OP_MAD_U16
-%token <tok> T_OP_MADSH_U16
-%token <tok> T_OP_MAD_S16
-%token <tok> T_OP_MADSH_M16
-%token <tok> T_OP_MAD_U24
-%token <tok> T_OP_MAD_S24
-%token <tok> T_OP_MAD_F16
-%token <tok> T_OP_MAD_F32
-%token <tok> T_OP_SEL_B16
-%token <tok> T_OP_SEL_B32
-%token <tok> T_OP_SEL_S16
-%token <tok> T_OP_SEL_S32
-%token <tok> T_OP_SEL_F16
-%token <tok> T_OP_SEL_F32
-%token <tok> T_OP_SAD_S16
-%token <tok> T_OP_SAD_S32
-
-/* category 4: */
-%token <tok> T_OP_RCP
-%token <tok> T_OP_RSQ
-%token <tok> T_OP_LOG2
-%token <tok> T_OP_EXP2
-%token <tok> T_OP_SIN
-%token <tok> T_OP_COS
-%token <tok> T_OP_SQRT
-%token <tok> T_OP_HRSQ
-%token <tok> T_OP_HLOG2
-%token <tok> T_OP_HEXP2
-
-/* category 5: */
-%token <tok> T_OP_ISAM
-%token <tok> T_OP_ISAML
-%token <tok> T_OP_ISAMM
-%token <tok> T_OP_SAM
-%token <tok> T_OP_SAMB
-%token <tok> T_OP_SAML
-%token <tok> T_OP_SAMGQ
-%token <tok> T_OP_GETLOD
-%token <tok> T_OP_CONV
-%token <tok> T_OP_CONVM
-%token <tok> T_OP_GETSIZE
-%token <tok> T_OP_GETBUF
-%token <tok> T_OP_GETPOS
-%token <tok> T_OP_GETINFO
-%token <tok> T_OP_DSX
-%token <tok> T_OP_DSY
-%token <tok> T_OP_GATHER4R
-%token <tok> T_OP_GATHER4G
-%token <tok> T_OP_GATHER4B
-%token <tok> T_OP_GATHER4A
-%token <tok> T_OP_SAMGP0
-%token <tok> T_OP_SAMGP1
-%token <tok> T_OP_SAMGP2
-%token <tok> T_OP_SAMGP3
-%token <tok> T_OP_DSXPP_1
-%token <tok> T_OP_DSYPP_1
-%token <tok> T_OP_RGETPOS
-%token <tok> T_OP_RGETINFO
-
-/* category 6: */
-%token <tok> T_OP_LDG
-%token <tok> T_OP_LDL
-%token <tok> T_OP_LDP
-%token <tok> T_OP_STG
-%token <tok> T_OP_STL
-%token <tok> T_OP_STP
-%token <tok> T_OP_LDIB
-%token <tok> T_OP_G2L
-%token <tok> T_OP_L2G
-%token <tok> T_OP_PREFETCH
-%token <tok> T_OP_LDLW
-%token <tok> T_OP_STLW
-%token <tok> T_OP_RESFMT
-%token <tok> T_OP_RESINF
-%token <tok> T_OP_ATOMIC_ADD
-%token <tok> T_OP_ATOMIC_SUB
-%token <tok> T_OP_ATOMIC_XCHG
-%token <tok> T_OP_ATOMIC_INC
-%token <tok> T_OP_ATOMIC_DEC
-%token <tok> T_OP_ATOMIC_CMPXCHG
-%token <tok> T_OP_ATOMIC_MIN
-%token <tok> T_OP_ATOMIC_MAX
-%token <tok> T_OP_ATOMIC_AND
-%token <tok> T_OP_ATOMIC_OR
-%token <tok> T_OP_ATOMIC_XOR
-%token <tok> T_OP_LDGB
-%token <tok> T_OP_STGB
-%token <tok> T_OP_STIB
-%token <tok> T_OP_LDC
-%token <tok> T_OP_LDLV
-
-/* type qualifiers: */
-%token <tok> T_TYPE_F16
-%token <tok> T_TYPE_F32
-%token <tok> T_TYPE_U16
-%token <tok> T_TYPE_U32
-%token <tok> T_TYPE_S16
-%token <tok> T_TYPE_S32
-%token <tok> T_TYPE_U8
-%token <tok> T_TYPE_S8
-
-%token <tok> T_UNTYPED
-%token <tok> T_TYPED
-
-%token <tok> T_1D
-%token <tok> T_2D
-%token <tok> T_3D
-%token <tok> T_4D
-
-/* condition qualifiers: */
-%token <tok> T_LT
-%token <tok> T_LE
-%token <tok> T_GT
-%token <tok> T_GE
-%token <tok> T_EQ
-%token <tok> T_NE
-
-%token <tok> T_S2EN
-%token <tok> T_SAMP
-%token <tok> T_TEX
-%token <tok> T_BASE
-
-%token <tok> T_NAN
-%token <tok> T_INF
-%token <num> T_A0
-%token <num> T_P0
-%token <str> T_CAT1_TYPE_TYPE
-
-%type <num> integer offset
-%type <flt> float
-%type <reg> reg const
-%type <tok> cat1_opc
-%type <tok> cat2_opc_1src cat2_opc_2src_cnd cat2_opc_2src
-%type <tok> cat3_opc
-%type <tok> cat4_opc
-%type <tok> cat5_opc cat5_samp cat5_tex cat5_type
-%type <type> type
-%type <unum> const_val
-
-%error-verbose
-
-%start shader
-
-%%
-
-shader: { new_shader(); } headers instrs
-
-headers:
-| header headers
-
-header: localsize_header
-| const_header
-| buf_header
-| invocationid_header
-| wgid_header
-| numwg_header
-
-const_val: T_FLOAT { $$ = fui($1); }
-| T_INT { $$ = $1; }
-| '-' T_INT { $$ = -$2; }
-| T_HEX { $$ = $1; }
-
-localsize_header: T_A_LOCALSIZE const_val ',' const_val ',' const_val {
- info->local_size[0] = $2;
- info->local_size[1] = $4;
- info->local_size[2] = $6;
-}
-
-const_header: T_A_CONST '(' T_CONSTANT ')' const_val ',' const_val ',' const_val ',' const_val {
- add_const($3, $5, $7, $9, $11);
-}
-
-buf_header: T_A_BUF const_val {
- int idx = info->num_bufs++;
- assert(idx < MAX_BUFS);
- info->buf_sizes[idx] = $2;
-}
-
-invocationid_header: T_A_INVOCATIONID '(' T_REGISTER ')' {
- assert(($3 & 0x1) == 0); /* half-reg not allowed */
- unsigned reg = $3 >> 1;
- add_sysval(reg, 0x7, SYSTEM_VALUE_LOCAL_INVOCATION_ID);
-}
-
-wgid_header: T_A_WGID '(' T_REGISTER ')' {
- assert(($3 & 0x1) == 0); /* half-reg not allowed */
- unsigned reg = $3 >> 1;
- assert(reg >= regid(48, 0)); /* must be a high reg */
- add_sysval(reg, 0x7, SYSTEM_VALUE_WORK_GROUP_ID);
-}
-
-numwg_header: T_A_NUMWG '(' T_CONSTANT ')' {
- assert(($3 & 0x1) == 0); /* half-reg not allowed */
- unsigned reg = $3 >> 1;
- info->numwg = reg;
- /* reserve space in immediates for the actual value to be plugged in later: */
- add_const($3, 0, 0, 0, 0);
-}
-
-iflag: T_SY { iflags.flags |= IR3_INSTR_SY; }
-| T_SS { iflags.flags |= IR3_INSTR_SS; }
-| T_JP { iflags.flags |= IR3_INSTR_JP; }
-| T_RPT { iflags.repeat = $1; }
-| T_UL { iflags.flags |= IR3_INSTR_UL; }
-| T_NOP { iflags.nop = $1; }
-
-iflags:
-| iflag iflags
-
-instrs: instr instrs
-| instr
-
-instr: iflags cat0_instr
-| iflags cat1_instr
-| iflags cat2_instr
-| iflags cat3_instr
-| iflags cat4_instr
-| iflags cat5_instr
-| iflags cat6_instr
-
-cat0_src: '!' T_P0 { instr->cat0.inv = true; instr->cat0.comp = $2 >> 1; }
-| T_P0 { instr->cat0.comp = $1 >> 1; }
-
-cat0_immed: '#' integer { instr->cat0.immed = $2; }
-
-cat0_instr: T_OP_NOP { new_instr(OPC_NOP); }
-| T_OP_BR { new_instr(OPC_BR); } cat0_src ',' cat0_immed
-| T_OP_JUMP { new_instr(OPC_JUMP); } cat0_immed
-| T_OP_CALL { new_instr(OPC_CALL); } cat0_immed
-| T_OP_RET { new_instr(OPC_RET); }
-| T_OP_KILL { new_instr(OPC_KILL); } cat0_src
-| T_OP_END { new_instr(OPC_END); }
-| T_OP_EMIT { new_instr(OPC_EMIT); }
-| T_OP_CUT { new_instr(OPC_CUT); }
-| T_OP_CHMASK { new_instr(OPC_CHMASK); }
-| T_OP_CHSH { new_instr(OPC_CHSH); }
-| T_OP_FLOW_REV { new_instr(OPC_FLOW_REV); }
-
-cat1_opc: T_OP_MOVA {
- new_instr(OPC_MOV);
- instr->cat1.src_type = TYPE_S16;
- instr->cat1.dst_type = TYPE_S16;
-}
-| T_OP_MOV '.' T_CAT1_TYPE_TYPE {
- parse_type_type(new_instr(OPC_MOV), $3);
-}
-| T_OP_COV '.' T_CAT1_TYPE_TYPE {
- parse_type_type(new_instr(OPC_MOV), $3);
-}
-
-cat1_instr: cat1_opc dst_reg ',' src_reg_or_const_or_rel_or_imm
-
-cat2_opc_1src: T_OP_ABSNEG_F { new_instr(OPC_ABSNEG_F); }
-| T_OP_ABSNEG_S { new_instr(OPC_ABSNEG_S); }
-| T_OP_CLZ_B { new_instr(OPC_CLZ_B); }
-| T_OP_CLZ_S { new_instr(OPC_CLZ_S); }
-| T_OP_SIGN_F { new_instr(OPC_SIGN_F); }
-| T_OP_FLOOR_F { new_instr(OPC_FLOOR_F); }
-| T_OP_CEIL_F { new_instr(OPC_CEIL_F); }
-| T_OP_RNDNE_F { new_instr(OPC_RNDNE_F); }
-| T_OP_RNDAZ_F { new_instr(OPC_RNDAZ_F); }
-| T_OP_TRUNC_F { new_instr(OPC_TRUNC_F); }
-| T_OP_NOT_B { new_instr(OPC_NOT_B); }
-| T_OP_BFREV_B { new_instr(OPC_BFREV_B); }
-| T_OP_SETRM { new_instr(OPC_SETRM); }
-| T_OP_CBITS_B { new_instr(OPC_CBITS_B); }
-
-cat2_opc_2src_cnd: T_OP_CMPS_F { new_instr(OPC_CMPS_F); }
-| T_OP_CMPS_U { new_instr(OPC_CMPS_U); }
-| T_OP_CMPS_S { new_instr(OPC_CMPS_S); }
-| T_OP_CMPV_F { new_instr(OPC_CMPV_F); }
-| T_OP_CMPV_U { new_instr(OPC_CMPV_U); }
-| T_OP_CMPV_S { new_instr(OPC_CMPV_S); }
-
-cat2_opc_2src: T_OP_ADD_F { new_instr(OPC_ADD_F); }
-| T_OP_MIN_F { new_instr(OPC_MIN_F); }
-| T_OP_MAX_F { new_instr(OPC_MAX_F); }
-| T_OP_MUL_F { new_instr(OPC_MUL_F); }
-| T_OP_ADD_U { new_instr(OPC_ADD_U); }
-| T_OP_ADD_S { new_instr(OPC_ADD_S); }
-| T_OP_SUB_U { new_instr(OPC_SUB_U); }
-| T_OP_SUB_S { new_instr(OPC_SUB_S); }
-| T_OP_MIN_U { new_instr(OPC_MIN_U); }
-| T_OP_MIN_S { new_instr(OPC_MIN_S); }
-| T_OP_MAX_U { new_instr(OPC_MAX_U); }
-| T_OP_MAX_S { new_instr(OPC_MAX_S); }
-| T_OP_AND_B { new_instr(OPC_AND_B); }
-| T_OP_OR_B { new_instr(OPC_OR_B); }
-| T_OP_XOR_B { new_instr(OPC_XOR_B); }
-| T_OP_MUL_U24 { new_instr(OPC_MUL_U24); }
-| T_OP_MUL_S24 { new_instr(OPC_MUL_S24); }
-| T_OP_MULL_U { new_instr(OPC_MULL_U); }
-| T_OP_SHL_B { new_instr(OPC_SHL_B); }
-| T_OP_SHR_B { new_instr(OPC_SHR_B); }
-| T_OP_ASHR_B { new_instr(OPC_ASHR_B); }
-| T_OP_BARY_F { new_instr(OPC_BARY_F); }
-| T_OP_MGEN_B { new_instr(OPC_MGEN_B); }
-| T_OP_GETBIT_B { new_instr(OPC_GETBIT_B); }
-| T_OP_SHB { new_instr(OPC_SHB); }
-| T_OP_MSAD { new_instr(OPC_MSAD); }
-
-cond: T_LT { instr->cat2.condition = IR3_COND_LT; }
-| T_LE { instr->cat2.condition = IR3_COND_LE; }
-| T_GT { instr->cat2.condition = IR3_COND_GT; }
-| T_GE { instr->cat2.condition = IR3_COND_GE; }
-| T_EQ { instr->cat2.condition = IR3_COND_EQ; }
-| T_NE { instr->cat2.condition = IR3_COND_NE; }
-
-cat2_instr: cat2_opc_1src dst_reg ',' src_reg_or_const_or_rel_or_imm
-| cat2_opc_2src_cnd '.' cond dst_reg ',' src_reg_or_const_or_rel_or_imm ',' src_reg_or_const_or_rel_or_imm
-| cat2_opc_2src dst_reg ',' src_reg_or_const_or_rel_or_imm ',' src_reg_or_const_or_rel_or_imm
-
-cat3_opc: T_OP_MAD_U16 { new_instr(OPC_MAD_U16); }
-| T_OP_MADSH_U16 { new_instr(OPC_MADSH_U16); }
-| T_OP_MAD_S16 { new_instr(OPC_MAD_S16); }
-| T_OP_MADSH_M16 { new_instr(OPC_MADSH_M16); }
-| T_OP_MAD_U24 { new_instr(OPC_MAD_U24); }
-| T_OP_MAD_S24 { new_instr(OPC_MAD_S24); }
-| T_OP_MAD_F16 { new_instr(OPC_MAD_F16); }
-| T_OP_MAD_F32 { new_instr(OPC_MAD_F32); }
-| T_OP_SEL_B16 { new_instr(OPC_SEL_B16); }
-| T_OP_SEL_B32 { new_instr(OPC_SEL_B32); }
-| T_OP_SEL_S16 { new_instr(OPC_SEL_S16); }
-| T_OP_SEL_S32 { new_instr(OPC_SEL_S32); }
-| T_OP_SEL_F16 { new_instr(OPC_SEL_F16); }
-| T_OP_SEL_F32 { new_instr(OPC_SEL_F32); }
-| T_OP_SAD_S16 { new_instr(OPC_SAD_S16); }
-| T_OP_SAD_S32 { new_instr(OPC_SAD_S32); }
-
-cat3_instr: cat3_opc dst_reg ',' src_reg_or_const_or_rel ',' src_reg_or_const ',' src_reg_or_const_or_rel
-
-cat4_opc: T_OP_RCP { new_instr(OPC_RCP); }
-| T_OP_RSQ { new_instr(OPC_RSQ); }
-| T_OP_LOG2 { new_instr(OPC_LOG2); }
-| T_OP_EXP2 { new_instr(OPC_EXP2); }
-| T_OP_SIN { new_instr(OPC_SIN); }
-| T_OP_COS { new_instr(OPC_COS); }
-| T_OP_SQRT { new_instr(OPC_SQRT); }
-| T_OP_HRSQ { new_instr(OPC_HRSQ); }
-| T_OP_HLOG2 { new_instr(OPC_HLOG2); }
-| T_OP_HEXP2 { new_instr(OPC_HEXP2); }
-
-cat4_instr: cat4_opc dst_reg ',' src_reg_or_const_or_rel_or_imm
-
-cat5_opc_dsxypp: T_OP_DSXPP_1 { new_instr(OPC_DSXPP_1); }
-| T_OP_DSYPP_1 { new_instr(OPC_DSYPP_1); }
-
-cat5_opc: T_OP_ISAM { new_instr(OPC_ISAM); }
-| T_OP_ISAML { new_instr(OPC_ISAML); }
-| T_OP_ISAMM { new_instr(OPC_ISAMM); }
-| T_OP_SAM { new_instr(OPC_SAM); }
-| T_OP_SAMB { new_instr(OPC_SAMB); }
-| T_OP_SAML { new_instr(OPC_SAML); }
-| T_OP_SAMGQ { new_instr(OPC_SAMGQ); }
-| T_OP_GETLOD { new_instr(OPC_GETLOD); }
-| T_OP_CONV { new_instr(OPC_CONV); }
-| T_OP_CONVM { new_instr(OPC_CONVM); }
-| T_OP_GETSIZE { new_instr(OPC_GETSIZE); }
-| T_OP_GETBUF { new_instr(OPC_GETBUF); }
-| T_OP_GETPOS { new_instr(OPC_GETPOS); }
-| T_OP_GETINFO { new_instr(OPC_GETINFO); }
-| T_OP_DSX { new_instr(OPC_DSX); }
-| T_OP_DSY { new_instr(OPC_DSY); }
-| T_OP_GATHER4R { new_instr(OPC_GATHER4R); }
-| T_OP_GATHER4G { new_instr(OPC_GATHER4G); }
-| T_OP_GATHER4B { new_instr(OPC_GATHER4B); }
-| T_OP_GATHER4A { new_instr(OPC_GATHER4A); }
-| T_OP_SAMGP0 { new_instr(OPC_SAMGP0); }
-| T_OP_SAMGP1 { new_instr(OPC_SAMGP1); }
-| T_OP_SAMGP2 { new_instr(OPC_SAMGP2); }
-| T_OP_SAMGP3 { new_instr(OPC_SAMGP3); }
-| T_OP_RGETPOS { new_instr(OPC_RGETPOS); }
-| T_OP_RGETINFO { new_instr(OPC_RGETINFO); }
-
-cat5_flag: '.' T_3D { instr->flags |= IR3_INSTR_3D; }
-| '.' 'a' { instr->flags |= IR3_INSTR_A; }
-| '.' 'o' { instr->flags |= IR3_INSTR_O; }
-| '.' 'p' { instr->flags |= IR3_INSTR_P; }
-| '.' 's' { instr->flags |= IR3_INSTR_S; }
-| '.' T_S2EN { instr->flags |= IR3_INSTR_S2EN; }
-| '.' T_BASE { instr->flags |= IR3_INSTR_B; instr->cat5.tex_base = $2; }
-cat5_flags:
-| cat5_flag cat5_flags
-
-cat5_samp: T_SAMP { instr->cat5.samp = $1; }
-cat5_tex: T_TEX { if (instr->flags & IR3_INSTR_B) instr->cat5.samp |= ($1 << 4); else instr->cat5.tex = $1; }
-cat5_type: '(' type ')' { instr->cat5.type = $2; }
-
-cat5_instr: cat5_opc_dsxypp cat5_flags dst_reg ',' src_reg
-| cat5_opc cat5_flags cat5_type dst_reg ',' src_reg ',' src_reg ',' cat5_samp ',' cat5_tex
-| cat5_opc cat5_flags cat5_type dst_reg ',' src_reg ',' src_reg ',' cat5_samp
-| cat5_opc cat5_flags cat5_type dst_reg ',' src_reg ',' src_reg ',' cat5_tex
-| cat5_opc cat5_flags cat5_type dst_reg ',' src_reg ',' src_reg
-| cat5_opc cat5_flags cat5_type dst_reg ',' src_reg ',' cat5_samp ',' cat5_tex
-| cat5_opc cat5_flags cat5_type dst_reg ',' src_reg ',' cat5_samp
-| cat5_opc cat5_flags cat5_type dst_reg ',' src_reg ',' cat5_tex
-| cat5_opc cat5_flags cat5_type dst_reg ',' src_reg
-| cat5_opc cat5_flags cat5_type dst_reg ',' cat5_samp ',' cat5_tex
-| cat5_opc cat5_flags cat5_type dst_reg ',' cat5_samp
-| cat5_opc cat5_flags cat5_type dst_reg ',' cat5_tex
-| cat5_opc cat5_flags cat5_type dst_reg
-
-cat6_typed: '.' T_UNTYPED { instr->cat6.typed = 0; }
-| '.' T_TYPED { instr->cat6.typed = 1; }
-
-cat6_dim: '.' T_1D { instr->cat6.d = 1; }
-| '.' T_2D { instr->cat6.d = 2; }
-| '.' T_3D { instr->cat6.d = 3; }
-| '.' T_4D { instr->cat6.d = 4; }
-
-cat6_type: '.' type { instr->cat6.type = $2; }
-cat6_offset: offset { instr->cat6.src_offset = $1; }
-cat6_immed: integer { instr->cat6.iim_val = $1; }
-
-cat6_load: T_OP_LDG { new_instr(OPC_LDG); } cat6_type dst_reg ',' 'g' '[' reg cat6_offset ']' ',' cat6_immed
-| T_OP_LDP { new_instr(OPC_LDP); } cat6_type dst_reg ',' 'p' '[' reg cat6_offset ']' ',' cat6_immed
-| T_OP_LDL { new_instr(OPC_LDL); } cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
-| T_OP_LDLW { new_instr(OPC_LDLW); } cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
-| T_OP_LDLV { new_instr(OPC_LDLV); } cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
-
-// TODO some of the cat6 instructions have different syntax for a6xx..
-//| T_OP_LDIB { new_instr(OPC_LDIB); } cat6_type dst_reg cat6_offset ',' reg ',' cat6_immed
-
-cat6_store: T_OP_STG { new_instr(OPC_STG); } cat6_type 'g' '[' dst_reg cat6_offset ']' ',' reg ',' cat6_immed
-| T_OP_STP { new_instr(OPC_STP); } cat6_type 'p' '[' dst_reg cat6_offset ']' ',' reg ',' cat6_immed
-| T_OP_STL { new_instr(OPC_STL); } cat6_type 'l' '[' dst_reg cat6_offset ']' ',' reg ',' cat6_immed
-| T_OP_STLW { new_instr(OPC_STLW); } cat6_type 'l' '[' dst_reg cat6_offset ']' ',' reg ',' cat6_immed
-
-cat6_storeib: T_OP_STIB { new_instr(OPC_STIB); dummy_dst(); } cat6_typed cat6_dim cat6_type '.' cat6_immed'g' '[' immediate ']' '+' reg ',' reg
-
-cat6_prefetch: T_OP_PREFETCH { new_instr(OPC_PREFETCH); new_reg(0,0); /* dummy dst */ } 'g' '[' reg cat6_offset ']' ',' cat6_immed
-
-cat6_atomic_l_g: '.' 'g' { instr->flags |= IR3_INSTR_G; }
-| '.' 'l' { }
-
-cat6_atomic: T_OP_ATOMIC_ADD { new_instr(OPC_ATOMIC_ADD); } cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
-| T_OP_ATOMIC_SUB { new_instr(OPC_ATOMIC_SUB); } cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
-| T_OP_ATOMIC_XCHG { new_instr(OPC_ATOMIC_XCHG); } cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
-| T_OP_ATOMIC_INC { new_instr(OPC_ATOMIC_INC); } cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
-| T_OP_ATOMIC_DEC { new_instr(OPC_ATOMIC_DEC); } cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
-| T_OP_ATOMIC_CMPXCHG { new_instr(OPC_ATOMIC_CMPXCHG); }cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
-| T_OP_ATOMIC_MIN { new_instr(OPC_ATOMIC_MIN); } cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
-| T_OP_ATOMIC_MAX { new_instr(OPC_ATOMIC_MAX); } cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
-| T_OP_ATOMIC_AND { new_instr(OPC_ATOMIC_AND); } cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
-| T_OP_ATOMIC_OR { new_instr(OPC_ATOMIC_OR); } cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
-| T_OP_ATOMIC_XOR { new_instr(OPC_ATOMIC_XOR); } cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
-
-cat6_todo: T_OP_G2L { new_instr(OPC_G2L); }
-| T_OP_L2G { new_instr(OPC_L2G); }
-| T_OP_RESFMT { new_instr(OPC_RESFMT); }
-| T_OP_RESINF { new_instr(OPC_RESINFO); }
-| T_OP_LDGB { new_instr(OPC_LDGB); }
-| T_OP_STGB { new_instr(OPC_STGB); }
-| T_OP_LDC { new_instr(OPC_LDC); }
-
-cat6_instr: cat6_load
-| cat6_store
-| cat6_storeib
-| cat6_prefetch
-| cat6_atomic
-| cat6_todo
-
-reg: T_REGISTER { $$ = new_reg($1, 0); }
-| T_A0 { $$ = new_reg((61 << 3) + $1, IR3_REG_HALF); }
-| T_P0 { $$ = new_reg((62 << 3) + $1, 0); }
-
-const: T_CONSTANT { $$ = new_reg($1, IR3_REG_CONST); }
-
-dst_reg_flag: T_EVEN { rflags.flags |= IR3_REG_EVEN; }
-| T_POS_INFINITY { rflags.flags |= IR3_REG_POS_INF; }
-| T_EI { rflags.flags |= IR3_REG_EI; }
-| T_WRMASK { rflags.wrmask = $1; }
-
-dst_reg_flags: dst_reg_flag
-| dst_reg_flag dst_reg_flags
-
- /* note: destination registers are always incremented in repeat */
-dst_reg: reg { $1->flags |= IR3_REG_R; }
-| dst_reg_flags reg { $2->flags |= IR3_REG_R; }
-
-src_reg_flag: T_ABSNEG { rflags.flags |= IR3_REG_ABS|IR3_REG_NEGATE; }
-| T_NEG { rflags.flags |= IR3_REG_NEGATE; }
-| T_ABS { rflags.flags |= IR3_REG_ABS; }
-| T_R { rflags.flags |= IR3_REG_R; }
-
-src_reg_flags: src_reg_flag
-| src_reg_flag src_reg_flags
-
-src_reg: reg
-| src_reg_flags reg
-
-src_const: const
-| src_reg_flags const
-
-src_reg_or_const: src_reg
-| src_const
-
-src_reg_or_const_or_rel: src_reg_or_const
-| relative
-
-src_reg_or_const_or_rel_or_imm: src_reg_or_const_or_rel
-| src_reg_flags immediate
-| immediate
-
-offset: { $$ = 0; }
-| '+' integer { $$ = $2; }
-| '-' integer { $$ = -$2; }
-
-relative: 'r' '<' T_A0 offset '>' { new_reg(0, IR3_REG_RELATIV)->array.offset = $4; }
-| 'c' '<' T_A0 offset '>' { new_reg(0, IR3_REG_RELATIV | IR3_REG_CONST)->array.offset = $4; }
-
-immediate: integer { new_reg(0, IR3_REG_IMMED)->iim_val = $1; }
-| '(' integer ')' { new_reg(0, IR3_REG_IMMED)->fim_val = $2; }
-| '(' float ')' { new_reg(0, IR3_REG_IMMED)->fim_val = $2; }
-| '(' T_NAN ')' { new_reg(0, IR3_REG_IMMED)->fim_val = NAN; }
-| '(' T_INF ')' { new_reg(0, IR3_REG_IMMED)->fim_val = INFINITY; }
-
-integer: T_INT { $$ = $1; }
-| '-' T_INT { $$ = -$2; }
-| T_HEX { $$ = $1; }
-| '-' T_HEX { $$ = -$2; }
-
-float: T_FLOAT { $$ = $1; }
-| '-' T_FLOAT { $$ = -$2; }
-
-type: T_TYPE_F16 { $$ = TYPE_F16; }
-| T_TYPE_F32 { $$ = TYPE_F32; }
-| T_TYPE_U16 { $$ = TYPE_U16; }
-| T_TYPE_U32 { $$ = TYPE_U32; }
-| T_TYPE_S16 { $$ = TYPE_S16; }
-| T_TYPE_S32 { $$ = TYPE_S32; }
-| T_TYPE_U8 { $$ = TYPE_U8; }
-| T_TYPE_S8 { $$ = TYPE_S8; }
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
# SOFTWARE.
-ir3_parser = custom_target(
- 'ir3_parser.[ch]',
- input: 'ir3_parser.y',
- output: ['ir3_parser.c', 'ir3_parser.h'],
- command: [
- prog_bison, '@INPUT@', '--name-prefix=ir3_yy', '--defines=@OUTPUT1@', '--output=@OUTPUT0@'
- ]
-)
-
-ir3_lexer = custom_target(
- 'ir3_lexer.c',
- input: 'ir3_lexer.l',
- output: 'ir3_lexer.c',
- command: [
- prog_flex, '-o', '@OUTPUT@', '@INPUT@'
- ]
-)
-
computerator_files = [
'a6xx.c',
'ir3_asm.c',
'main.c',
freedreno_xml_header_files,
- ir3_parser[0],
- ir3_parser[1],
- ir3_lexer
]
computerator = executable(
--- /dev/null
+/*
+ * Copyright (c) 2013 Rob Clark <robclark@freedesktop.org>
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice (including the next
+ * paragraph) shall be included in all copies or substantial portions of the
+ * Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+ * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+ * SOFTWARE.
+ */
+
+%{
+#include <stdlib.h>
+#include "ir3/ir3.h"
+#include "ir3_parser.h"
+
+#define YY_NO_INPUT
+#define YY_NO_UNPUT
+#define TOKEN(t) (ir3_yylval.tok = t)
+extern YYSTYPE ir3_yylval;
+
+static int parse_wrmask(const char *src)
+{
+ int i, num = 0;
+ for (i = 0; i < 4; i++) {
+ if ("xyzw"[i] == src[1]) {
+ num |= (1 << i);
+ src++;
+ }
+ }
+ return num;
+}
+
+static int parse_reg(const char *str)
+{
+ int num = 0;
+ if (str[0] == 'h') {
+ str++;
+ num++;
+ }
+ str++;
+ num += strtol(str, (char **)&str, 10) << 3;
+ switch (str[1]) {
+ case 'x': num += 0; break;
+ case 'y': num += 2; break;
+ case 'z': num += 4; break;
+ case 'w': num += 6; break;
+ default: assert(0); break;
+ }
+ return num;
+}
+%}
+
+%option noyywrap
+%option prefix="ir3_yy"
+
+%%
+"\n" yylineno++;
+[ \t] ; /* ignore whitespace */
+";"[^\n]*"\n" yylineno++; /* ignore comments */
+[0-9]+"."[0-9]+ ir3_yylval.flt = strtod(yytext, NULL); return T_FLOAT;
+[0-9]* ir3_yylval.num = strtoul(yytext, NULL, 0); return T_INT;
+"0x"[0-9a-fA-F]* ir3_yylval.num = strtoul(yytext, NULL, 0); return T_HEX;
+"@localsize" return TOKEN(T_A_LOCALSIZE);
+"@const" return TOKEN(T_A_CONST);
+"@buf" return TOKEN(T_A_BUF);
+"@invocationid" return TOKEN(T_A_INVOCATIONID);
+"@wgid" return TOKEN(T_A_WGID);
+"@numwg" return TOKEN(T_A_NUMWG);
+"(sy)" return TOKEN(T_SY);
+"(ss)" return TOKEN(T_SS);
+"(absneg)" return TOKEN(T_ABSNEG);
+"(neg)" return TOKEN(T_NEG);
+"(abs)" return TOKEN(T_ABS);
+"(r)" return TOKEN(T_R);
+"(ul)" return TOKEN(T_UL);
+"(even)" return TOKEN(T_EVEN);
+"(pos_infinity)" return TOKEN(T_POS_INFINITY);
+"(ei)" return TOKEN(T_EI);
+"(jp)" return TOKEN(T_JP);
+"(rpt"[0-7]")" ir3_yylval.num = strtol(yytext+4, NULL, 10); return T_RPT;
+"(nop"[0-7]")" ir3_yylval.num = strtol(yytext+4, NULL, 10); return T_NOP;
+"("[x]?[y]?[z]?[w]?")" ir3_yylval.num = parse_wrmask(yytext); return T_WRMASK;
+
+[h]?"r"[0-9]+"."[xyzw] ir3_yylval.num = parse_reg(yytext); return T_REGISTER;
+[h]?"c"[0-9]+"."[xyzw] ir3_yylval.num = parse_reg(yytext); return T_CONSTANT;
+"a0."[xyzw] ir3_yylval.num = parse_reg(yytext); return T_A0;
+"p0."[xyzw] ir3_yylval.num = parse_reg(yytext); return T_P0;
+"s#"[0-9]+ ir3_yylval.num = strtol(yytext+2, NULL, 10); return T_SAMP;
+"t#"[0-9]+ ir3_yylval.num = strtol(yytext+2, NULL, 10); return T_TEX;
+
+ /* category 0: */
+"nop" return TOKEN(T_OP_NOP);
+"br" return TOKEN(T_OP_BR);
+"jump" return TOKEN(T_OP_JUMP);
+"call" return TOKEN(T_OP_CALL);
+"ret" return TOKEN(T_OP_RET);
+"kill" return TOKEN(T_OP_KILL);
+"end" return TOKEN(T_OP_END);
+"emit" return TOKEN(T_OP_EMIT);
+"cut" return TOKEN(T_OP_CUT);
+"chmask" return TOKEN(T_OP_CHMASK);
+"chsh" return TOKEN(T_OP_CHSH);
+"flow_rev" return TOKEN(T_OP_FLOW_REV);
+
+ /* category 1: */
+"mova" return TOKEN(T_OP_MOVA);
+"mov" return TOKEN(T_OP_MOV);
+"cov" return TOKEN(T_OP_COV);
+
+("f16"|"f32"|"u16"|"u32"|"s16"|"s32"|"u8"|"s8"){2} ir3_yylval.str = yytext; return T_CAT1_TYPE_TYPE;
+
+ /* category 2: */
+"add.f" return TOKEN(T_OP_ADD_F);
+"min.f" return TOKEN(T_OP_MIN_F);
+"max.f" return TOKEN(T_OP_MAX_F);
+"mul.f" return TOKEN(T_OP_MUL_F);
+"sign.f" return TOKEN(T_OP_SIGN_F);
+"cmps.f" return TOKEN(T_OP_CMPS_F);
+"absneg.f" return TOKEN(T_OP_ABSNEG_F);
+"cmpv.f" return TOKEN(T_OP_CMPV_F);
+"floor.f" return TOKEN(T_OP_FLOOR_F);
+"ceil.f" return TOKEN(T_OP_CEIL_F);
+"rndne.f" return TOKEN(T_OP_RNDNE_F);
+"rndaz.f" return TOKEN(T_OP_RNDAZ_F);
+"trunc.f" return TOKEN(T_OP_TRUNC_F);
+"add.u" return TOKEN(T_OP_ADD_U);
+"add.s" return TOKEN(T_OP_ADD_S);
+"sub.u" return TOKEN(T_OP_SUB_U);
+"sub.s" return TOKEN(T_OP_SUB_S);
+"cmps.u" return TOKEN(T_OP_CMPS_U);
+"cmps.s" return TOKEN(T_OP_CMPS_S);
+"min.u" return TOKEN(T_OP_MIN_U);
+"min.s" return TOKEN(T_OP_MIN_S);
+"max.u" return TOKEN(T_OP_MAX_U);
+"max.s" return TOKEN(T_OP_MAX_S);
+"absneg.s" return TOKEN(T_OP_ABSNEG_S);
+"and.b" return TOKEN(T_OP_AND_B);
+"or.b" return TOKEN(T_OP_OR_B);
+"not.b" return TOKEN(T_OP_NOT_B);
+"xor.b" return TOKEN(T_OP_XOR_B);
+"cmpv.u" return TOKEN(T_OP_CMPV_U);
+"cmpv.s" return TOKEN(T_OP_CMPV_S);
+"mul.u24" return TOKEN(T_OP_MUL_U24);
+"mul.s24" return TOKEN(T_OP_MUL_S24);
+"mull.u" return TOKEN(T_OP_MULL_U);
+"bfrev.b" return TOKEN(T_OP_BFREV_B);
+"clz.s" return TOKEN(T_OP_CLZ_S);
+"clz.b" return TOKEN(T_OP_CLZ_B);
+"shl.b" return TOKEN(T_OP_SHL_B);
+"shr.b" return TOKEN(T_OP_SHR_B);
+"ashr.b" return TOKEN(T_OP_ASHR_B);
+"bary.f" return TOKEN(T_OP_BARY_F);
+"mgen.b" return TOKEN(T_OP_MGEN_B);
+"getbit.b" return TOKEN(T_OP_GETBIT_B);
+"setrm" return TOKEN(T_OP_SETRM);
+"cbits.b" return TOKEN(T_OP_CBITS_B);
+"shb" return TOKEN(T_OP_SHB);
+"msad" return TOKEN(T_OP_MSAD);
+
+ /* category 3: */
+"mad.u16" return TOKEN(T_OP_MAD_U16);
+"madsh.u16" return TOKEN(T_OP_MADSH_U16);
+"mad.s16" return TOKEN(T_OP_MAD_S16);
+"madsh.m16" return TOKEN(T_OP_MADSH_M16);
+"mad.u24" return TOKEN(T_OP_MAD_U24);
+"mad.s24" return TOKEN(T_OP_MAD_S24);
+"mad.f16" return TOKEN(T_OP_MAD_F16);
+"mad.f32" return TOKEN(T_OP_MAD_F32);
+"sel.b16" return TOKEN(T_OP_SEL_B16);
+"sel.b32" return TOKEN(T_OP_SEL_B32);
+"sel.s16" return TOKEN(T_OP_SEL_S16);
+"sel.s32" return TOKEN(T_OP_SEL_S32);
+"sel.f16" return TOKEN(T_OP_SEL_F16);
+"sel.f32" return TOKEN(T_OP_SEL_F32);
+"sad.s16" return TOKEN(T_OP_SAD_S16);
+"sad.s32" return TOKEN(T_OP_SAD_S32);
+
+ /* category 4: */
+"rcp" return TOKEN(T_OP_RCP);
+"rsq" return TOKEN(T_OP_RSQ);
+"log2" return TOKEN(T_OP_LOG2);
+"exp2" return TOKEN(T_OP_EXP2);
+"sin" return TOKEN(T_OP_SIN);
+"cos" return TOKEN(T_OP_COS);
+"sqrt" return TOKEN(T_OP_SQRT);
+"hrsq" return TOKEN(T_OP_HRSQ);
+"hlog2" return TOKEN(T_OP_HLOG2);
+"hexp2" return TOKEN(T_OP_HEXP2);
+
+ /* category 5: */
+"isam" return TOKEN(T_OP_ISAM);
+"isaml" return TOKEN(T_OP_ISAML);
+"isamm" return TOKEN(T_OP_ISAMM);
+"sam" return TOKEN(T_OP_SAM);
+"samb" return TOKEN(T_OP_SAMB);
+"saml" return TOKEN(T_OP_SAML);
+"samgq" return TOKEN(T_OP_SAMGQ);
+"getlod" return TOKEN(T_OP_GETLOD);
+"conv" return TOKEN(T_OP_CONV);
+"convm" return TOKEN(T_OP_CONVM);
+"getsize" return TOKEN(T_OP_GETSIZE);
+"getbuf" return TOKEN(T_OP_GETBUF);
+"getpos" return TOKEN(T_OP_GETPOS);
+"getinfo" return TOKEN(T_OP_GETINFO);
+"dsx" return TOKEN(T_OP_DSX);
+"dsy" return TOKEN(T_OP_DSY);
+"gather4r" return TOKEN(T_OP_GATHER4R);
+"gather4g" return TOKEN(T_OP_GATHER4G);
+"gather4b" return TOKEN(T_OP_GATHER4B);
+"gather4a" return TOKEN(T_OP_GATHER4A);
+"samgp0" return TOKEN(T_OP_SAMGP0);
+"samgp1" return TOKEN(T_OP_SAMGP1);
+"samgp2" return TOKEN(T_OP_SAMGP2);
+"samgp3" return TOKEN(T_OP_SAMGP3);
+"dsxpp.1" return TOKEN(T_OP_DSXPP_1);
+"dsypp.1" return TOKEN(T_OP_DSYPP_1);
+"rgetpos" return TOKEN(T_OP_RGETPOS);
+"rgetinfo" return TOKEN(T_OP_RGETINFO);
+
+ /* category 6: */
+"ldg" return TOKEN(T_OP_LDG);
+"ldl" return TOKEN(T_OP_LDL);
+"ldp" return TOKEN(T_OP_LDP);
+"stg" return TOKEN(T_OP_STG);
+"stl" return TOKEN(T_OP_STL);
+"stp" return TOKEN(T_OP_STP);
+"ldib" return TOKEN(T_OP_LDIB);
+"g2l" return TOKEN(T_OP_G2L);
+"l2g" return TOKEN(T_OP_L2G);
+"prefetch" return TOKEN(T_OP_PREFETCH);
+"ldlw" return TOKEN(T_OP_LDLW);
+"stlw" return TOKEN(T_OP_STLW);
+"resfmt" return TOKEN(T_OP_RESFMT);
+"resinf" return TOKEN(T_OP_RESINF);
+"atomic.add" return TOKEN(T_OP_ATOMIC_ADD);
+"atomic.sub" return TOKEN(T_OP_ATOMIC_SUB);
+"atomic.xchg" return TOKEN(T_OP_ATOMIC_XCHG);
+"atomic.inc" return TOKEN(T_OP_ATOMIC_INC);
+"atomic.dec" return TOKEN(T_OP_ATOMIC_DEC);
+"atomic.cmpxchg" return TOKEN(T_OP_ATOMIC_CMPXCHG);
+"atomic.min" return TOKEN(T_OP_ATOMIC_MIN);
+"atomic.max" return TOKEN(T_OP_ATOMIC_MAX);
+"atomic.and" return TOKEN(T_OP_ATOMIC_AND);
+"atomic.or" return TOKEN(T_OP_ATOMIC_OR);
+"atomic.xor" return TOKEN(T_OP_ATOMIC_XOR);
+"ldgb" return TOKEN(T_OP_LDGB);
+"stgb" return TOKEN(T_OP_STGB);
+"stib" return TOKEN(T_OP_STIB);
+"ldc" return TOKEN(T_OP_LDC);
+"ldlv" return TOKEN(T_OP_LDLV);
+
+"f16" return TOKEN(T_TYPE_F16);
+"f32" return TOKEN(T_TYPE_F32);
+"u16" return TOKEN(T_TYPE_U16);
+"u32" return TOKEN(T_TYPE_U32);
+"s16" return TOKEN(T_TYPE_S16);
+"s32" return TOKEN(T_TYPE_S32);
+"u8" return TOKEN(T_TYPE_U8);
+"s8" return TOKEN(T_TYPE_S8);
+
+"untyped" return TOKEN(T_UNTYPED);
+"typed" return TOKEN(T_TYPED);
+
+"1d" return TOKEN(T_1D);
+"2d" return TOKEN(T_2D);
+"3d" return TOKEN(T_3D);
+"4d" return TOKEN(T_4D);
+
+"lt" return TOKEN(T_LT);
+"le" return TOKEN(T_LE);
+"gt" return TOKEN(T_GT);
+"ge" return TOKEN(T_GE);
+"eq" return TOKEN(T_EQ);
+"ne" return TOKEN(T_NE);
+
+"a" return 'a';
+"o" return 'o';
+"p" return 'p';
+"s2en" return TOKEN(T_S2EN);
+"s" return 's';
+"base"[0-9]+ ir3_yylval.num = strtol(yytext+4, NULL, 10); return T_BASE;
+
+"=" return '=';
+"(" return '(';
+")" return ')';
+"[" return '[';
+"]" return ']';
+"," return ',';
+"." return '.';
+"-" return '-';
+"+" return '+';
+"|" return '|';
+"c" return 'c';
+"r" return 'r';
+"g" return 'g';
+"l" return 'l';
+"<" return '<';
+">" return '>';
+"!" return '!';
+"#" return '#';
+
+"nan" return TOKEN(T_NAN);
+"inf" return TOKEN(T_INF);
+
+[a-zA-Z_][a-zA-Z_0-9]* ir3_yylval.str = yytext; return T_IDENTIFIER;
+. fprintf(stderr, "error at line %d: Unknown token: %s\n", ir3_yyget_lineno(), yytext); yyterminate();
+%%
--- /dev/null
+/*
+ * Copyright (c) 2013 Rob Clark <robclark@freedesktop.org>
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice (including the next
+ * paragraph) shall be included in all copies or substantial portions of the
+ * Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+ * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+ * SOFTWARE.
+ */
+
+%code requires {
+
+#define MAX_BUFS 4
+
+struct ir3_kernel_info {
+ uint32_t local_size[3];
+ uint32_t num_bufs;
+ uint32_t buf_sizes[MAX_BUFS]; /* size in dwords */
+
+ /* driver-param uniforms: */
+ unsigned numwg;
+};
+
+struct ir3 * ir3_parse(struct ir3_shader_variant *v,
+ struct ir3_kernel_info *k, FILE *f);
+}
+
+%{
+#define YYDEBUG 0
+
+#include <stdlib.h>
+#include <stdio.h>
+#include <string.h>
+#include <math.h>
+
+#include "util/u_math.h"
+
+#include "ir3/ir3.h"
+#include "ir3/ir3_shader.h"
+#include "ir3/instr-a3xx.h"
+
+#include "ir3_parser.h"
+
+/* ir3 treats the abs/neg flags as separate flags for float vs integer,
+ * but in the instruction encoding they are the same thing. Tracking
+ * them separately is only for the benefit of ir3 opt passes, and not
+ * required here, so just use the float versions:
+ */
+#define IR3_REG_ABS IR3_REG_FABS
+#define IR3_REG_NEGATE IR3_REG_FNEG
+
+static struct ir3_kernel_info *info;
+static struct ir3_shader_variant *variant;
+/* NOTE the assembler doesn't really use the ir3_block construction
+ * like the compiler does. Everything is treated as one large block.
+ * Which might happen to contain flow control. But since we don't
+ * use any of the ir3 backend passes (sched, RA, etc) this doesn't
+ * really matter.
+ */
+static struct ir3_block *block; /* current shader block */
+static struct ir3_instruction *instr; /* current instruction */
+
+static struct {
+ unsigned flags;
+ unsigned repeat;
+ unsigned nop;
+} iflags;
+
+static struct {
+ unsigned flags;
+ unsigned wrmask;
+} rflags;
+
+int ir3_yyget_lineno(void);
+
+static struct ir3_instruction * new_instr(opc_t opc)
+{
+ instr = ir3_instr_create(block, opc);
+ instr->flags = iflags.flags;
+ instr->repeat = iflags.repeat;
+ instr->nop = iflags.nop;
+ instr->line = ir3_yyget_lineno();
+ iflags.flags = iflags.repeat = iflags.nop = 0;
+ return instr;
+}
+
+static void new_shader(void)
+{
+ variant->ir = ir3_create(variant->shader->compiler, variant->shader->type);
+ block = ir3_block_create(variant->ir);
+ list_addtail(&block->node, &variant->ir->block_list);
+}
+
+static type_t parse_type(const char **type)
+{
+ if (!strncmp("f16", *type, 3)) {
+ *type += 3;
+ return TYPE_F16;
+ } else if (!strncmp("f32", *type, 3)) {
+ *type += 3;
+ return TYPE_F32;
+ } else if (!strncmp("u16", *type, 3)) {
+ *type += 3;
+ return TYPE_U16;
+ } else if (!strncmp("u32", *type, 3)) {
+ *type += 3;
+ return TYPE_U32;
+ } else if (!strncmp("s16", *type, 3)) {
+ *type += 3;
+ return TYPE_S16;
+ } else if (!strncmp("s32", *type, 3)) {
+ *type += 3;
+ return TYPE_S32;
+ } else if (!strncmp("u8", *type, 2)) {
+ *type += 2;
+ return TYPE_U8;
+ } else if (!strncmp("s8", *type, 2)) {
+ *type += 2;
+ return TYPE_S8;
+ } else {
+ assert(0); /* shouldn't get here */
+ return ~0;
+ }
+}
+
+static struct ir3_instruction * parse_type_type(struct ir3_instruction *instr,
+ const char *type_type)
+{
+ instr->cat1.src_type = parse_type(&type_type);
+ instr->cat1.dst_type = parse_type(&type_type);
+ return instr;
+}
+
+static struct ir3_register * new_reg(int num, unsigned flags)
+{
+ struct ir3_register *reg;
+ flags |= rflags.flags;
+ if (num & 0x1)
+ flags |= IR3_REG_HALF;
+ reg = ir3_reg_create(instr, num>>1, flags);
+ reg->wrmask = MAX2(1, rflags.wrmask);
+ rflags.flags = rflags.wrmask = 0;
+ return reg;
+}
+
+static struct ir3_register * dummy_dst(void)
+{
+ return new_reg(0, 0);
+}
+
+static void add_const(unsigned reg, unsigned c0, unsigned c1, unsigned c2, unsigned c3)
+{
+ struct ir3_const_state *const_state = &variant->shader->const_state;
+ assert((reg & 0x7) == 0);
+ int idx = reg >> (1 + 2); /* low bit is half vs full, next two bits are swiz */
+ if (const_state->immediate_idx == const_state->immediates_size * 4) {
+ const_state->immediates_size += 4;
+ const_state->immediates = realloc (const_state->immediates,
+ const_state->immediates_size * sizeof(const_state->immediates[0]));
+ }
+ const_state->immediates[idx].val[0] = c0;
+ const_state->immediates[idx].val[1] = c1;
+ const_state->immediates[idx].val[2] = c2;
+ const_state->immediates[idx].val[3] = c3;
+ const_state->immediates_count = idx + 1;
+ const_state->immediate_idx++;
+}
+
+static void add_sysval(unsigned reg, unsigned compmask, gl_system_value sysval)
+{
+ unsigned n = variant->inputs_count++;
+ variant->inputs[n].regid = reg;
+ variant->inputs[n].sysval = true;
+ variant->inputs[n].slot = sysval;
+ variant->inputs[n].compmask = compmask;
+ variant->inputs[n].interpolate = INTERP_MODE_FLAT;
+ variant->total_in++;
+}
+
+#ifdef YYDEBUG
+int yydebug;
+#endif
+
+extern int yylex(void);
+extern FILE *ir3_yyin;
+
+int yyparse(void);
+
+static void yyerror(const char *error)
+{
+ fprintf(stderr, "error at line %d: %s\n", ir3_yyget_lineno(), error);
+}
+
+struct ir3 * ir3_parse(struct ir3_shader_variant *v,
+ struct ir3_kernel_info *k, FILE *f)
+{
+ ir3_yyin = f;
+#ifdef YYDEBUG
+ yydebug = 1;
+#endif
+ info = k;
+ variant = v;
+ if (yyparse()) {
+ ir3_destroy(variant->ir);
+ variant->ir = NULL;
+ }
+ return variant->ir;
+}
+%}
+
+%union {
+ int tok;
+ int num;
+ uint32_t unum;
+ double flt;
+ const char *str;
+ struct ir3_register *reg;
+ struct {
+ int start;
+ int num;
+ } range;
+ type_t type;
+}
+
+%{
+#if YYDEBUG
+static void print_token(FILE *file, int type, YYSTYPE value)
+{
+ fprintf(file, "\ntype: %d\n", type);
+}
+
+#define YYPRINT(file, type, value) print_token(file, type, value)
+#endif
+%}
+
+%token <num> T_INT
+%token <unum> T_HEX
+%token <flt> T_FLOAT
+%token <str> T_IDENTIFIER
+%token <num> T_REGISTER
+%token <num> T_CONSTANT
+
+/* @ headers (@const/@sampler/@uniform/@varying) */
+%token <tok> T_A_LOCALSIZE
+%token <tok> T_A_CONST
+%token <tok> T_A_BUF
+%token <tok> T_A_INVOCATIONID
+%token <tok> T_A_WGID
+%token <tok> T_A_NUMWG
+/* todo, re-add @sampler/@uniform/@varying if needed someday */
+
+/* src register flags */
+%token <tok> T_ABSNEG
+%token <tok> T_NEG
+%token <tok> T_ABS
+%token <tok> T_R
+
+/* dst register flags */
+%token <tok> T_EVEN
+%token <tok> T_POS_INFINITY
+%token <tok> T_EI
+%token <num> T_WRMASK
+
+/* instruction flags */
+%token <tok> T_SY
+%token <tok> T_SS
+%token <tok> T_JP
+%token <num> T_RPT
+%token <tok> T_UL
+%token <tok> T_NOP
+
+/* category 0: */
+%token <tok> T_OP_NOP
+%token <tok> T_OP_BR
+%token <tok> T_OP_JUMP
+%token <tok> T_OP_CALL
+%token <tok> T_OP_RET
+%token <tok> T_OP_KILL
+%token <tok> T_OP_END
+%token <tok> T_OP_EMIT
+%token <tok> T_OP_CUT
+%token <tok> T_OP_CHMASK
+%token <tok> T_OP_CHSH
+%token <tok> T_OP_FLOW_REV
+
+/* category 1: */
+%token <tok> T_OP_MOVA
+%token <tok> T_OP_MOV
+%token <tok> T_OP_COV
+
+/* category 2: */
+%token <tok> T_OP_ADD_F
+%token <tok> T_OP_MIN_F
+%token <tok> T_OP_MAX_F
+%token <tok> T_OP_MUL_F
+%token <tok> T_OP_SIGN_F
+%token <tok> T_OP_CMPS_F
+%token <tok> T_OP_ABSNEG_F
+%token <tok> T_OP_CMPV_F
+%token <tok> T_OP_FLOOR_F
+%token <tok> T_OP_CEIL_F
+%token <tok> T_OP_RNDNE_F
+%token <tok> T_OP_RNDAZ_F
+%token <tok> T_OP_TRUNC_F
+%token <tok> T_OP_ADD_U
+%token <tok> T_OP_ADD_S
+%token <tok> T_OP_SUB_U
+%token <tok> T_OP_SUB_S
+%token <tok> T_OP_CMPS_U
+%token <tok> T_OP_CMPS_S
+%token <tok> T_OP_MIN_U
+%token <tok> T_OP_MIN_S
+%token <tok> T_OP_MAX_U
+%token <tok> T_OP_MAX_S
+%token <tok> T_OP_ABSNEG_S
+%token <tok> T_OP_AND_B
+%token <tok> T_OP_OR_B
+%token <tok> T_OP_NOT_B
+%token <tok> T_OP_XOR_B
+%token <tok> T_OP_CMPV_U
+%token <tok> T_OP_CMPV_S
+%token <tok> T_OP_MUL_U24
+%token <tok> T_OP_MUL_S24
+%token <tok> T_OP_MULL_U
+%token <tok> T_OP_BFREV_B
+%token <tok> T_OP_CLZ_S
+%token <tok> T_OP_CLZ_B
+%token <tok> T_OP_SHL_B
+%token <tok> T_OP_SHR_B
+%token <tok> T_OP_ASHR_B
+%token <tok> T_OP_BARY_F
+%token <tok> T_OP_MGEN_B
+%token <tok> T_OP_GETBIT_B
+%token <tok> T_OP_SETRM
+%token <tok> T_OP_CBITS_B
+%token <tok> T_OP_SHB
+%token <tok> T_OP_MSAD
+
+/* category 3: */
+%token <tok> T_OP_MAD_U16
+%token <tok> T_OP_MADSH_U16
+%token <tok> T_OP_MAD_S16
+%token <tok> T_OP_MADSH_M16
+%token <tok> T_OP_MAD_U24
+%token <tok> T_OP_MAD_S24
+%token <tok> T_OP_MAD_F16
+%token <tok> T_OP_MAD_F32
+%token <tok> T_OP_SEL_B16
+%token <tok> T_OP_SEL_B32
+%token <tok> T_OP_SEL_S16
+%token <tok> T_OP_SEL_S32
+%token <tok> T_OP_SEL_F16
+%token <tok> T_OP_SEL_F32
+%token <tok> T_OP_SAD_S16
+%token <tok> T_OP_SAD_S32
+
+/* category 4: */
+%token <tok> T_OP_RCP
+%token <tok> T_OP_RSQ
+%token <tok> T_OP_LOG2
+%token <tok> T_OP_EXP2
+%token <tok> T_OP_SIN
+%token <tok> T_OP_COS
+%token <tok> T_OP_SQRT
+%token <tok> T_OP_HRSQ
+%token <tok> T_OP_HLOG2
+%token <tok> T_OP_HEXP2
+
+/* category 5: */
+%token <tok> T_OP_ISAM
+%token <tok> T_OP_ISAML
+%token <tok> T_OP_ISAMM
+%token <tok> T_OP_SAM
+%token <tok> T_OP_SAMB
+%token <tok> T_OP_SAML
+%token <tok> T_OP_SAMGQ
+%token <tok> T_OP_GETLOD
+%token <tok> T_OP_CONV
+%token <tok> T_OP_CONVM
+%token <tok> T_OP_GETSIZE
+%token <tok> T_OP_GETBUF
+%token <tok> T_OP_GETPOS
+%token <tok> T_OP_GETINFO
+%token <tok> T_OP_DSX
+%token <tok> T_OP_DSY
+%token <tok> T_OP_GATHER4R
+%token <tok> T_OP_GATHER4G
+%token <tok> T_OP_GATHER4B
+%token <tok> T_OP_GATHER4A
+%token <tok> T_OP_SAMGP0
+%token <tok> T_OP_SAMGP1
+%token <tok> T_OP_SAMGP2
+%token <tok> T_OP_SAMGP3
+%token <tok> T_OP_DSXPP_1
+%token <tok> T_OP_DSYPP_1
+%token <tok> T_OP_RGETPOS
+%token <tok> T_OP_RGETINFO
+
+/* category 6: */
+%token <tok> T_OP_LDG
+%token <tok> T_OP_LDL
+%token <tok> T_OP_LDP
+%token <tok> T_OP_STG
+%token <tok> T_OP_STL
+%token <tok> T_OP_STP
+%token <tok> T_OP_LDIB
+%token <tok> T_OP_G2L
+%token <tok> T_OP_L2G
+%token <tok> T_OP_PREFETCH
+%token <tok> T_OP_LDLW
+%token <tok> T_OP_STLW
+%token <tok> T_OP_RESFMT
+%token <tok> T_OP_RESINF
+%token <tok> T_OP_ATOMIC_ADD
+%token <tok> T_OP_ATOMIC_SUB
+%token <tok> T_OP_ATOMIC_XCHG
+%token <tok> T_OP_ATOMIC_INC
+%token <tok> T_OP_ATOMIC_DEC
+%token <tok> T_OP_ATOMIC_CMPXCHG
+%token <tok> T_OP_ATOMIC_MIN
+%token <tok> T_OP_ATOMIC_MAX
+%token <tok> T_OP_ATOMIC_AND
+%token <tok> T_OP_ATOMIC_OR
+%token <tok> T_OP_ATOMIC_XOR
+%token <tok> T_OP_LDGB
+%token <tok> T_OP_STGB
+%token <tok> T_OP_STIB
+%token <tok> T_OP_LDC
+%token <tok> T_OP_LDLV
+
+/* type qualifiers: */
+%token <tok> T_TYPE_F16
+%token <tok> T_TYPE_F32
+%token <tok> T_TYPE_U16
+%token <tok> T_TYPE_U32
+%token <tok> T_TYPE_S16
+%token <tok> T_TYPE_S32
+%token <tok> T_TYPE_U8
+%token <tok> T_TYPE_S8
+
+%token <tok> T_UNTYPED
+%token <tok> T_TYPED
+
+%token <tok> T_1D
+%token <tok> T_2D
+%token <tok> T_3D
+%token <tok> T_4D
+
+/* condition qualifiers: */
+%token <tok> T_LT
+%token <tok> T_LE
+%token <tok> T_GT
+%token <tok> T_GE
+%token <tok> T_EQ
+%token <tok> T_NE
+
+%token <tok> T_S2EN
+%token <tok> T_SAMP
+%token <tok> T_TEX
+%token <tok> T_BASE
+
+%token <tok> T_NAN
+%token <tok> T_INF
+%token <num> T_A0
+%token <num> T_P0
+%token <str> T_CAT1_TYPE_TYPE
+
+%type <num> integer offset
+%type <flt> float
+%type <reg> reg const
+%type <tok> cat1_opc
+%type <tok> cat2_opc_1src cat2_opc_2src_cnd cat2_opc_2src
+%type <tok> cat3_opc
+%type <tok> cat4_opc
+%type <tok> cat5_opc cat5_samp cat5_tex cat5_type
+%type <type> type
+%type <unum> const_val
+
+%error-verbose
+
+%start shader
+
+%%
+
+shader: { new_shader(); } headers instrs
+
+headers:
+| header headers
+
+header: localsize_header
+| const_header
+| buf_header
+| invocationid_header
+| wgid_header
+| numwg_header
+
+const_val: T_FLOAT { $$ = fui($1); }
+| T_INT { $$ = $1; }
+| '-' T_INT { $$ = -$2; }
+| T_HEX { $$ = $1; }
+
+localsize_header: T_A_LOCALSIZE const_val ',' const_val ',' const_val {
+ info->local_size[0] = $2;
+ info->local_size[1] = $4;
+ info->local_size[2] = $6;
+}
+
+const_header: T_A_CONST '(' T_CONSTANT ')' const_val ',' const_val ',' const_val ',' const_val {
+ add_const($3, $5, $7, $9, $11);
+}
+
+buf_header: T_A_BUF const_val {
+ int idx = info->num_bufs++;
+ assert(idx < MAX_BUFS);
+ info->buf_sizes[idx] = $2;
+}
+
+invocationid_header: T_A_INVOCATIONID '(' T_REGISTER ')' {
+ assert(($3 & 0x1) == 0); /* half-reg not allowed */
+ unsigned reg = $3 >> 1;
+ add_sysval(reg, 0x7, SYSTEM_VALUE_LOCAL_INVOCATION_ID);
+}
+
+wgid_header: T_A_WGID '(' T_REGISTER ')' {
+ assert(($3 & 0x1) == 0); /* half-reg not allowed */
+ unsigned reg = $3 >> 1;
+ assert(reg >= regid(48, 0)); /* must be a high reg */
+ add_sysval(reg, 0x7, SYSTEM_VALUE_WORK_GROUP_ID);
+}
+
+numwg_header: T_A_NUMWG '(' T_CONSTANT ')' {
+ assert(($3 & 0x1) == 0); /* half-reg not allowed */
+ unsigned reg = $3 >> 1;
+ info->numwg = reg;
+ /* reserve space in immediates for the actual value to be plugged in later: */
+ add_const($3, 0, 0, 0, 0);
+}
+
+iflag: T_SY { iflags.flags |= IR3_INSTR_SY; }
+| T_SS { iflags.flags |= IR3_INSTR_SS; }
+| T_JP { iflags.flags |= IR3_INSTR_JP; }
+| T_RPT { iflags.repeat = $1; }
+| T_UL { iflags.flags |= IR3_INSTR_UL; }
+| T_NOP { iflags.nop = $1; }
+
+iflags:
+| iflag iflags
+
+instrs: instr instrs
+| instr
+
+instr: iflags cat0_instr
+| iflags cat1_instr
+| iflags cat2_instr
+| iflags cat3_instr
+| iflags cat4_instr
+| iflags cat5_instr
+| iflags cat6_instr
+
+cat0_src: '!' T_P0 { instr->cat0.inv = true; instr->cat0.comp = $2 >> 1; }
+| T_P0 { instr->cat0.comp = $1 >> 1; }
+
+cat0_immed: '#' integer { instr->cat0.immed = $2; }
+
+cat0_instr: T_OP_NOP { new_instr(OPC_NOP); }
+| T_OP_BR { new_instr(OPC_BR); } cat0_src ',' cat0_immed
+| T_OP_JUMP { new_instr(OPC_JUMP); } cat0_immed
+| T_OP_CALL { new_instr(OPC_CALL); } cat0_immed
+| T_OP_RET { new_instr(OPC_RET); }
+| T_OP_KILL { new_instr(OPC_KILL); } cat0_src
+| T_OP_END { new_instr(OPC_END); }
+| T_OP_EMIT { new_instr(OPC_EMIT); }
+| T_OP_CUT { new_instr(OPC_CUT); }
+| T_OP_CHMASK { new_instr(OPC_CHMASK); }
+| T_OP_CHSH { new_instr(OPC_CHSH); }
+| T_OP_FLOW_REV { new_instr(OPC_FLOW_REV); }
+
+cat1_opc: T_OP_MOVA {
+ new_instr(OPC_MOV);
+ instr->cat1.src_type = TYPE_S16;
+ instr->cat1.dst_type = TYPE_S16;
+}
+| T_OP_MOV '.' T_CAT1_TYPE_TYPE {
+ parse_type_type(new_instr(OPC_MOV), $3);
+}
+| T_OP_COV '.' T_CAT1_TYPE_TYPE {
+ parse_type_type(new_instr(OPC_MOV), $3);
+}
+
+cat1_instr: cat1_opc dst_reg ',' src_reg_or_const_or_rel_or_imm
+
+cat2_opc_1src: T_OP_ABSNEG_F { new_instr(OPC_ABSNEG_F); }
+| T_OP_ABSNEG_S { new_instr(OPC_ABSNEG_S); }
+| T_OP_CLZ_B { new_instr(OPC_CLZ_B); }
+| T_OP_CLZ_S { new_instr(OPC_CLZ_S); }
+| T_OP_SIGN_F { new_instr(OPC_SIGN_F); }
+| T_OP_FLOOR_F { new_instr(OPC_FLOOR_F); }
+| T_OP_CEIL_F { new_instr(OPC_CEIL_F); }
+| T_OP_RNDNE_F { new_instr(OPC_RNDNE_F); }
+| T_OP_RNDAZ_F { new_instr(OPC_RNDAZ_F); }
+| T_OP_TRUNC_F { new_instr(OPC_TRUNC_F); }
+| T_OP_NOT_B { new_instr(OPC_NOT_B); }
+| T_OP_BFREV_B { new_instr(OPC_BFREV_B); }
+| T_OP_SETRM { new_instr(OPC_SETRM); }
+| T_OP_CBITS_B { new_instr(OPC_CBITS_B); }
+
+cat2_opc_2src_cnd: T_OP_CMPS_F { new_instr(OPC_CMPS_F); }
+| T_OP_CMPS_U { new_instr(OPC_CMPS_U); }
+| T_OP_CMPS_S { new_instr(OPC_CMPS_S); }
+| T_OP_CMPV_F { new_instr(OPC_CMPV_F); }
+| T_OP_CMPV_U { new_instr(OPC_CMPV_U); }
+| T_OP_CMPV_S { new_instr(OPC_CMPV_S); }
+
+cat2_opc_2src: T_OP_ADD_F { new_instr(OPC_ADD_F); }
+| T_OP_MIN_F { new_instr(OPC_MIN_F); }
+| T_OP_MAX_F { new_instr(OPC_MAX_F); }
+| T_OP_MUL_F { new_instr(OPC_MUL_F); }
+| T_OP_ADD_U { new_instr(OPC_ADD_U); }
+| T_OP_ADD_S { new_instr(OPC_ADD_S); }
+| T_OP_SUB_U { new_instr(OPC_SUB_U); }
+| T_OP_SUB_S { new_instr(OPC_SUB_S); }
+| T_OP_MIN_U { new_instr(OPC_MIN_U); }
+| T_OP_MIN_S { new_instr(OPC_MIN_S); }
+| T_OP_MAX_U { new_instr(OPC_MAX_U); }
+| T_OP_MAX_S { new_instr(OPC_MAX_S); }
+| T_OP_AND_B { new_instr(OPC_AND_B); }
+| T_OP_OR_B { new_instr(OPC_OR_B); }
+| T_OP_XOR_B { new_instr(OPC_XOR_B); }
+| T_OP_MUL_U24 { new_instr(OPC_MUL_U24); }
+| T_OP_MUL_S24 { new_instr(OPC_MUL_S24); }
+| T_OP_MULL_U { new_instr(OPC_MULL_U); }
+| T_OP_SHL_B { new_instr(OPC_SHL_B); }
+| T_OP_SHR_B { new_instr(OPC_SHR_B); }
+| T_OP_ASHR_B { new_instr(OPC_ASHR_B); }
+| T_OP_BARY_F { new_instr(OPC_BARY_F); }
+| T_OP_MGEN_B { new_instr(OPC_MGEN_B); }
+| T_OP_GETBIT_B { new_instr(OPC_GETBIT_B); }
+| T_OP_SHB { new_instr(OPC_SHB); }
+| T_OP_MSAD { new_instr(OPC_MSAD); }
+
+cond: T_LT { instr->cat2.condition = IR3_COND_LT; }
+| T_LE { instr->cat2.condition = IR3_COND_LE; }
+| T_GT { instr->cat2.condition = IR3_COND_GT; }
+| T_GE { instr->cat2.condition = IR3_COND_GE; }
+| T_EQ { instr->cat2.condition = IR3_COND_EQ; }
+| T_NE { instr->cat2.condition = IR3_COND_NE; }
+
+cat2_instr: cat2_opc_1src dst_reg ',' src_reg_or_const_or_rel_or_imm
+| cat2_opc_2src_cnd '.' cond dst_reg ',' src_reg_or_const_or_rel_or_imm ',' src_reg_or_const_or_rel_or_imm
+| cat2_opc_2src dst_reg ',' src_reg_or_const_or_rel_or_imm ',' src_reg_or_const_or_rel_or_imm
+
+cat3_opc: T_OP_MAD_U16 { new_instr(OPC_MAD_U16); }
+| T_OP_MADSH_U16 { new_instr(OPC_MADSH_U16); }
+| T_OP_MAD_S16 { new_instr(OPC_MAD_S16); }
+| T_OP_MADSH_M16 { new_instr(OPC_MADSH_M16); }
+| T_OP_MAD_U24 { new_instr(OPC_MAD_U24); }
+| T_OP_MAD_S24 { new_instr(OPC_MAD_S24); }
+| T_OP_MAD_F16 { new_instr(OPC_MAD_F16); }
+| T_OP_MAD_F32 { new_instr(OPC_MAD_F32); }
+| T_OP_SEL_B16 { new_instr(OPC_SEL_B16); }
+| T_OP_SEL_B32 { new_instr(OPC_SEL_B32); }
+| T_OP_SEL_S16 { new_instr(OPC_SEL_S16); }
+| T_OP_SEL_S32 { new_instr(OPC_SEL_S32); }
+| T_OP_SEL_F16 { new_instr(OPC_SEL_F16); }
+| T_OP_SEL_F32 { new_instr(OPC_SEL_F32); }
+| T_OP_SAD_S16 { new_instr(OPC_SAD_S16); }
+| T_OP_SAD_S32 { new_instr(OPC_SAD_S32); }
+
+cat3_instr: cat3_opc dst_reg ',' src_reg_or_const_or_rel ',' src_reg_or_const ',' src_reg_or_const_or_rel
+
+cat4_opc: T_OP_RCP { new_instr(OPC_RCP); }
+| T_OP_RSQ { new_instr(OPC_RSQ); }
+| T_OP_LOG2 { new_instr(OPC_LOG2); }
+| T_OP_EXP2 { new_instr(OPC_EXP2); }
+| T_OP_SIN { new_instr(OPC_SIN); }
+| T_OP_COS { new_instr(OPC_COS); }
+| T_OP_SQRT { new_instr(OPC_SQRT); }
+| T_OP_HRSQ { new_instr(OPC_HRSQ); }
+| T_OP_HLOG2 { new_instr(OPC_HLOG2); }
+| T_OP_HEXP2 { new_instr(OPC_HEXP2); }
+
+cat4_instr: cat4_opc dst_reg ',' src_reg_or_const_or_rel_or_imm
+
+cat5_opc_dsxypp: T_OP_DSXPP_1 { new_instr(OPC_DSXPP_1); }
+| T_OP_DSYPP_1 { new_instr(OPC_DSYPP_1); }
+
+cat5_opc: T_OP_ISAM { new_instr(OPC_ISAM); }
+| T_OP_ISAML { new_instr(OPC_ISAML); }
+| T_OP_ISAMM { new_instr(OPC_ISAMM); }
+| T_OP_SAM { new_instr(OPC_SAM); }
+| T_OP_SAMB { new_instr(OPC_SAMB); }
+| T_OP_SAML { new_instr(OPC_SAML); }
+| T_OP_SAMGQ { new_instr(OPC_SAMGQ); }
+| T_OP_GETLOD { new_instr(OPC_GETLOD); }
+| T_OP_CONV { new_instr(OPC_CONV); }
+| T_OP_CONVM { new_instr(OPC_CONVM); }
+| T_OP_GETSIZE { new_instr(OPC_GETSIZE); }
+| T_OP_GETBUF { new_instr(OPC_GETBUF); }
+| T_OP_GETPOS { new_instr(OPC_GETPOS); }
+| T_OP_GETINFO { new_instr(OPC_GETINFO); }
+| T_OP_DSX { new_instr(OPC_DSX); }
+| T_OP_DSY { new_instr(OPC_DSY); }
+| T_OP_GATHER4R { new_instr(OPC_GATHER4R); }
+| T_OP_GATHER4G { new_instr(OPC_GATHER4G); }
+| T_OP_GATHER4B { new_instr(OPC_GATHER4B); }
+| T_OP_GATHER4A { new_instr(OPC_GATHER4A); }
+| T_OP_SAMGP0 { new_instr(OPC_SAMGP0); }
+| T_OP_SAMGP1 { new_instr(OPC_SAMGP1); }
+| T_OP_SAMGP2 { new_instr(OPC_SAMGP2); }
+| T_OP_SAMGP3 { new_instr(OPC_SAMGP3); }
+| T_OP_RGETPOS { new_instr(OPC_RGETPOS); }
+| T_OP_RGETINFO { new_instr(OPC_RGETINFO); }
+
+cat5_flag: '.' T_3D { instr->flags |= IR3_INSTR_3D; }
+| '.' 'a' { instr->flags |= IR3_INSTR_A; }
+| '.' 'o' { instr->flags |= IR3_INSTR_O; }
+| '.' 'p' { instr->flags |= IR3_INSTR_P; }
+| '.' 's' { instr->flags |= IR3_INSTR_S; }
+| '.' T_S2EN { instr->flags |= IR3_INSTR_S2EN; }
+| '.' T_BASE { instr->flags |= IR3_INSTR_B; instr->cat5.tex_base = $2; }
+cat5_flags:
+| cat5_flag cat5_flags
+
+cat5_samp: T_SAMP { instr->cat5.samp = $1; }
+cat5_tex: T_TEX { if (instr->flags & IR3_INSTR_B) instr->cat5.samp |= ($1 << 4); else instr->cat5.tex = $1; }
+cat5_type: '(' type ')' { instr->cat5.type = $2; }
+
+cat5_instr: cat5_opc_dsxypp cat5_flags dst_reg ',' src_reg
+| cat5_opc cat5_flags cat5_type dst_reg ',' src_reg ',' src_reg ',' cat5_samp ',' cat5_tex
+| cat5_opc cat5_flags cat5_type dst_reg ',' src_reg ',' src_reg ',' cat5_samp
+| cat5_opc cat5_flags cat5_type dst_reg ',' src_reg ',' src_reg ',' cat5_tex
+| cat5_opc cat5_flags cat5_type dst_reg ',' src_reg ',' src_reg
+| cat5_opc cat5_flags cat5_type dst_reg ',' src_reg ',' cat5_samp ',' cat5_tex
+| cat5_opc cat5_flags cat5_type dst_reg ',' src_reg ',' cat5_samp
+| cat5_opc cat5_flags cat5_type dst_reg ',' src_reg ',' cat5_tex
+| cat5_opc cat5_flags cat5_type dst_reg ',' src_reg
+| cat5_opc cat5_flags cat5_type dst_reg ',' cat5_samp ',' cat5_tex
+| cat5_opc cat5_flags cat5_type dst_reg ',' cat5_samp
+| cat5_opc cat5_flags cat5_type dst_reg ',' cat5_tex
+| cat5_opc cat5_flags cat5_type dst_reg
+
+cat6_typed: '.' T_UNTYPED { instr->cat6.typed = 0; }
+| '.' T_TYPED { instr->cat6.typed = 1; }
+
+cat6_dim: '.' T_1D { instr->cat6.d = 1; }
+| '.' T_2D { instr->cat6.d = 2; }
+| '.' T_3D { instr->cat6.d = 3; }
+| '.' T_4D { instr->cat6.d = 4; }
+
+cat6_type: '.' type { instr->cat6.type = $2; }
+cat6_offset: offset { instr->cat6.src_offset = $1; }
+cat6_immed: integer { instr->cat6.iim_val = $1; }
+
+cat6_load: T_OP_LDG { new_instr(OPC_LDG); } cat6_type dst_reg ',' 'g' '[' reg cat6_offset ']' ',' cat6_immed
+| T_OP_LDP { new_instr(OPC_LDP); } cat6_type dst_reg ',' 'p' '[' reg cat6_offset ']' ',' cat6_immed
+| T_OP_LDL { new_instr(OPC_LDL); } cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
+| T_OP_LDLW { new_instr(OPC_LDLW); } cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
+| T_OP_LDLV { new_instr(OPC_LDLV); } cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
+
+// TODO some of the cat6 instructions have different syntax for a6xx..
+//| T_OP_LDIB { new_instr(OPC_LDIB); } cat6_type dst_reg cat6_offset ',' reg ',' cat6_immed
+
+cat6_store: T_OP_STG { new_instr(OPC_STG); } cat6_type 'g' '[' dst_reg cat6_offset ']' ',' reg ',' cat6_immed
+| T_OP_STP { new_instr(OPC_STP); } cat6_type 'p' '[' dst_reg cat6_offset ']' ',' reg ',' cat6_immed
+| T_OP_STL { new_instr(OPC_STL); } cat6_type 'l' '[' dst_reg cat6_offset ']' ',' reg ',' cat6_immed
+| T_OP_STLW { new_instr(OPC_STLW); } cat6_type 'l' '[' dst_reg cat6_offset ']' ',' reg ',' cat6_immed
+
+cat6_storeib: T_OP_STIB { new_instr(OPC_STIB); dummy_dst(); } cat6_typed cat6_dim cat6_type '.' cat6_immed'g' '[' immediate ']' '+' reg ',' reg
+
+cat6_prefetch: T_OP_PREFETCH { new_instr(OPC_PREFETCH); new_reg(0,0); /* dummy dst */ } 'g' '[' reg cat6_offset ']' ',' cat6_immed
+
+cat6_atomic_l_g: '.' 'g' { instr->flags |= IR3_INSTR_G; }
+| '.' 'l' { }
+
+cat6_atomic: T_OP_ATOMIC_ADD { new_instr(OPC_ATOMIC_ADD); } cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
+| T_OP_ATOMIC_SUB { new_instr(OPC_ATOMIC_SUB); } cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
+| T_OP_ATOMIC_XCHG { new_instr(OPC_ATOMIC_XCHG); } cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
+| T_OP_ATOMIC_INC { new_instr(OPC_ATOMIC_INC); } cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
+| T_OP_ATOMIC_DEC { new_instr(OPC_ATOMIC_DEC); } cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
+| T_OP_ATOMIC_CMPXCHG { new_instr(OPC_ATOMIC_CMPXCHG); }cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
+| T_OP_ATOMIC_MIN { new_instr(OPC_ATOMIC_MIN); } cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
+| T_OP_ATOMIC_MAX { new_instr(OPC_ATOMIC_MAX); } cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
+| T_OP_ATOMIC_AND { new_instr(OPC_ATOMIC_AND); } cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
+| T_OP_ATOMIC_OR { new_instr(OPC_ATOMIC_OR); } cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
+| T_OP_ATOMIC_XOR { new_instr(OPC_ATOMIC_XOR); } cat6_atomic_l_g cat6_type dst_reg ',' 'l' '[' reg cat6_offset ']' ',' cat6_immed
+
+cat6_todo: T_OP_G2L { new_instr(OPC_G2L); }
+| T_OP_L2G { new_instr(OPC_L2G); }
+| T_OP_RESFMT { new_instr(OPC_RESFMT); }
+| T_OP_RESINF { new_instr(OPC_RESINFO); }
+| T_OP_LDGB { new_instr(OPC_LDGB); }
+| T_OP_STGB { new_instr(OPC_STGB); }
+| T_OP_LDC { new_instr(OPC_LDC); }
+
+cat6_instr: cat6_load
+| cat6_store
+| cat6_storeib
+| cat6_prefetch
+| cat6_atomic
+| cat6_todo
+
+reg: T_REGISTER { $$ = new_reg($1, 0); }
+| T_A0 { $$ = new_reg((61 << 3) + $1, IR3_REG_HALF); }
+| T_P0 { $$ = new_reg((62 << 3) + $1, 0); }
+
+const: T_CONSTANT { $$ = new_reg($1, IR3_REG_CONST); }
+
+dst_reg_flag: T_EVEN { rflags.flags |= IR3_REG_EVEN; }
+| T_POS_INFINITY { rflags.flags |= IR3_REG_POS_INF; }
+| T_EI { rflags.flags |= IR3_REG_EI; }
+| T_WRMASK { rflags.wrmask = $1; }
+
+dst_reg_flags: dst_reg_flag
+| dst_reg_flag dst_reg_flags
+
+ /* note: destination registers are always incremented in repeat */
+dst_reg: reg { $1->flags |= IR3_REG_R; }
+| dst_reg_flags reg { $2->flags |= IR3_REG_R; }
+
+src_reg_flag: T_ABSNEG { rflags.flags |= IR3_REG_ABS|IR3_REG_NEGATE; }
+| T_NEG { rflags.flags |= IR3_REG_NEGATE; }
+| T_ABS { rflags.flags |= IR3_REG_ABS; }
+| T_R { rflags.flags |= IR3_REG_R; }
+
+src_reg_flags: src_reg_flag
+| src_reg_flag src_reg_flags
+
+src_reg: reg
+| src_reg_flags reg
+
+src_const: const
+| src_reg_flags const
+
+src_reg_or_const: src_reg
+| src_const
+
+src_reg_or_const_or_rel: src_reg_or_const
+| relative
+
+src_reg_or_const_or_rel_or_imm: src_reg_or_const_or_rel
+| src_reg_flags immediate
+| immediate
+
+offset: { $$ = 0; }
+| '+' integer { $$ = $2; }
+| '-' integer { $$ = -$2; }
+
+relative: 'r' '<' T_A0 offset '>' { new_reg(0, IR3_REG_RELATIV)->array.offset = $4; }
+| 'c' '<' T_A0 offset '>' { new_reg(0, IR3_REG_RELATIV | IR3_REG_CONST)->array.offset = $4; }
+
+immediate: integer { new_reg(0, IR3_REG_IMMED)->iim_val = $1; }
+| '(' integer ')' { new_reg(0, IR3_REG_IMMED)->fim_val = $2; }
+| '(' float ')' { new_reg(0, IR3_REG_IMMED)->fim_val = $2; }
+| '(' T_NAN ')' { new_reg(0, IR3_REG_IMMED)->fim_val = NAN; }
+| '(' T_INF ')' { new_reg(0, IR3_REG_IMMED)->fim_val = INFINITY; }
+
+integer: T_INT { $$ = $1; }
+| '-' T_INT { $$ = -$2; }
+| T_HEX { $$ = $1; }
+| '-' T_HEX { $$ = -$2; }
+
+float: T_FLOAT { $$ = $1; }
+| '-' T_FLOAT { $$ = -$2; }
+
+type: T_TYPE_F16 { $$ = TYPE_F16; }
+| T_TYPE_F32 { $$ = TYPE_F32; }
+| T_TYPE_U16 { $$ = TYPE_U16; }
+| T_TYPE_U32 { $$ = TYPE_U32; }
+| T_TYPE_S16 { $$ = TYPE_S16; }
+| T_TYPE_S32 { $$ = TYPE_S32; }
+| T_TYPE_U8 { $$ = TYPE_U8; }
+| T_TYPE_S8 { $$ = TYPE_S8; }
depend_files : nir_algebraic_py,
)
+ir3_parser = custom_target(
+ 'ir3_parser.[ch]',
+ input: 'ir3_parser.y',
+ output: ['ir3_parser.c', 'ir3_parser.h'],
+ command: [
+ prog_bison, '@INPUT@', '--name-prefix=ir3_yy', '--defines=@OUTPUT1@', '--output=@OUTPUT0@'
+ ]
+)
+
+ir3_lexer = custom_target(
+ 'ir3_lexer.c',
+ input: 'ir3_lexer.l',
+ output: 'ir3_lexer.c',
+ command: [
+ prog_flex, '-o', '@OUTPUT@', '@INPUT@'
+ ]
+)
+
libfreedreno_ir3_files = files(
'disasm-a3xx.c',
'instr-a3xx.h',
libfreedreno_ir3 = static_library(
'freedreno_ir3',
- [libfreedreno_ir3_files, ir3_nir_trig_c, ir3_nir_imul_c],
+ [libfreedreno_ir3_files, ir3_nir_trig_c, ir3_nir_imul_c, ir3_parser[0], ir3_parser[1], ir3_lexer],
include_directories : [inc_freedreno, inc_include, inc_src, inc_mapi, inc_mesa, inc_gallium, inc_gallium_aux],
c_args : [c_vis_args, no_override_init_args],
cpp_args : [cpp_vis_args],