r600g: various fixes
[mesa.git] / src / gallium / drivers / r600 / r600_shader.h
1 /*
2 * Copyright 2010 Jerome Glisse <glisse@freedesktop.org>
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * on the rights to use, copy, modify, merge, publish, distribute, sub
8 * license, and/or sell copies of the Software, and to permit persons to whom
9 * the Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
19 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
20 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
21 * USE OR OTHER DEALINGS IN THE SOFTWARE.
22 */
23 #ifndef R600_SHADER_H
24 #define R600_SHADER_H
25
26 #include "r600_compiler.h"
27 #include "radeon.h"
28
29 struct r600_state;
30
31 struct r600_shader_operand {
32 struct c_vector *vector;
33 unsigned sel;
34 unsigned chan;
35 unsigned neg;
36 unsigned abs;
37 };
38
39 struct r600_shader_vfetch {
40 struct r600_shader_vfetch *next;
41 struct r600_shader_vfetch *prev;
42 unsigned cf_addr;
43 struct r600_shader_operand src[2];
44 struct r600_shader_operand dst[4];
45 };
46
47 struct r600_shader_inst {
48 unsigned is_op3;
49 unsigned opcode;
50 unsigned inst;
51 struct r600_shader_operand src[3];
52 struct r600_shader_operand dst;
53 unsigned last;
54 };
55
56 struct r600_shader_alu {
57 struct r600_shader_alu *next;
58 struct r600_shader_alu *prev;
59 unsigned nalu;
60 unsigned nliteral;
61 unsigned nconstant;
62 struct r600_shader_inst alu[5];
63 u32 literal[4];
64 };
65
66 struct r600_shader_node {
67 struct r600_shader_node *next;
68 struct r600_shader_node *prev;
69 unsigned cf_id; /**< cf index (in dw) in byte code */
70 unsigned cf_addr; /**< instructions index (in dw) in byte code */
71 unsigned nslot; /**< number of slot (2 dw) needed by this node */
72 unsigned nfetch;
73 struct c_node *node; /**< compiler node from which this node originate */
74 struct r600_shader_vfetch vfetch; /**< list of vfetch instructions */
75 struct r600_shader_alu alu; /**< list of alu instructions */
76 };
77
78 struct r600_shader_io {
79 unsigned name;
80 unsigned gpr;
81 int sid;
82 };
83
84 struct r600_shader {
85 unsigned stack_size; /**< stack size needed by this shader */
86 unsigned ngpr; /**< number of GPR needed by this shader */
87 unsigned nconstant; /**< number of constants used by this shader */
88 unsigned nresource; /**< number of resources used by this shader */
89 unsigned noutput;
90 unsigned ninput;
91 unsigned nvector;
92 unsigned ncf; /**< total number of cf clauses */
93 unsigned nslot; /**< total number of slots (2 dw) */
94 unsigned flat_shade; /**< are we flat shading */
95 struct r600_shader_node nodes; /**< list of node */
96 struct r600_shader_io input[32];
97 struct r600_shader_io output[32];
98 /* TODO replace GPR by some better register allocator */
99 struct c_vector **gpr;
100 unsigned ndw; /**< bytes code size in dw */
101 u32 *bcode; /**< bytes code */
102 enum pipe_format resource_format[160]; /**< format of resource */
103 struct c_shader cshader;
104 };
105
106 void r600_shader_cleanup(struct r600_shader *rshader);
107 int r600_shader_register(struct r600_shader *rshader);
108 int r600_shader_node(struct r600_shader *shader);
109 void r600_shader_node_place(struct r600_shader *rshader);
110 int r600_shader_find_gpr(struct r600_shader *rshader, struct c_vector *v, unsigned swizzle,
111 struct r600_shader_operand *operand);
112 int r600_shader_vfetch_bytecode(struct r600_shader *rshader,
113 struct r600_shader_node *rnode,
114 struct r600_shader_vfetch *vfetch,
115 unsigned *cid);
116 int r600_shader_update(struct r600_shader *rshader,
117 enum pipe_format *resource_format);
118 int r600_shader_legalize(struct r600_shader *rshader);
119
120 int r700_shader_translate(struct r600_shader *rshader);
121
122 int c_shader_from_tgsi(struct c_shader *shader, unsigned type,
123 const struct tgsi_token *tokens);
124 int r600_shader_register(struct r600_shader *rshader);
125 int r600_shader_translate_rec(struct r600_shader *rshader, struct c_node *node);
126 int r700_shader_translate(struct r600_shader *rshader);
127 int r600_shader_insert_fetch(struct c_shader *shader);
128
129 enum r600_instruction {
130 INST_ADD = 0,
131 INST_MUL = 1,
132 INST_MUL_IEEE = 2,
133 INST_MAX = 3,
134 INST_MIN = 4,
135 INST_MAX_DX10 = 5,
136 INST_MIN_DX10 = 6,
137 INST_SETE = 7,
138 INST_SETGT = 8,
139 INST_SETGE = 9,
140 INST_SETNE = 10,
141 INST_SETE_DX10 = 11,
142 INST_SETGT_DX10 = 12,
143 INST_SETGE_DX10 = 13,
144 INST_SETNE_DX10 = 14,
145 INST_FRACT = 15,
146 INST_TRUNC = 16,
147 INST_CEIL = 17,
148 INST_RNDNE = 18,
149 INST_FLOOR = 19,
150 INST_MOVA = 20,
151 INST_MOVA_FLOOR = 21,
152 INST_MOVA_INT = 22,
153 INST_MOV = 23,
154 INST_NOP = 24,
155 INST_PRED_SETGT_UINT = 25,
156 INST_PRED_SETGE_UINT = 26,
157 INST_PRED_SETE = 27,
158 INST_PRED_SETGT = 28,
159 INST_PRED_SETGE = 29,
160 INST_PRED_SETNE = 30,
161 INST_PRED_SET_INV = 31,
162 INST_PRED_SET_POP = 32,
163 INST_PRED_SET_CLR = 33,
164 INST_PRED_SET_RESTORE = 34,
165 INST_PRED_SETE_PUSH = 35,
166 INST_PRED_SETGT_PUSH = 36,
167 INST_PRED_SETGE_PUSH = 37,
168 INST_PRED_SETNE_PUSH = 38,
169 INST_KILLE = 39,
170 INST_KILLGT = 40,
171 INST_KILLGE = 41,
172 INST_KILLNE = 42,
173 INST_AND_INT = 43,
174 INST_OR_INT = 44,
175 INST_XOR_INT = 45,
176 INST_NOT_INT = 46,
177 INST_ADD_INT = 47,
178 INST_SUB_INT = 48,
179 INST_MAX_INT = 49,
180 INST_MIN_INT = 50,
181 INST_MAX_UINT = 51,
182 INST_MIN_UINT = 52,
183 INST_SETE_INT = 53,
184 INST_SETGT_INT = 54,
185 INST_SETGE_INT = 55,
186 INST_SETNE_INT = 56,
187 INST_SETGT_UINT = 57,
188 INST_SETGE_UINT = 58,
189 INST_KILLGT_UINT = 59,
190 INST_KILLGE_UINT = 60,
191 INST_PRED_SETE_INT = 61,
192 INST_PRED_SETGT_INT = 62,
193 INST_PRED_SETGE_INT = 63,
194 INST_PRED_SETNE_INT = 64,
195 INST_KILLE_INT = 65,
196 INST_KILLGT_INT = 66,
197 INST_KILLGE_INT = 67,
198 INST_KILLNE_INT = 68,
199 INST_PRED_SETE_PUSH_INT = 69,
200 INST_PRED_SETGT_PUSH_INT = 70,
201 INST_PRED_SETGE_PUSH_INT = 71,
202 INST_PRED_SETNE_PUSH_INT = 72,
203 INST_PRED_SETLT_PUSH_INT = 73,
204 INST_PRED_SETLE_PUSH_INT = 74,
205 INST_DOT4 = 75,
206 INST_DOT4_IEEE = 76,
207 INST_CUBE = 77,
208 INST_MAX4 = 78,
209 INST_MOVA_GPR_INT = 79,
210 INST_EXP_IEEE = 80,
211 INST_LOG_CLAMPED = 81,
212 INST_LOG_IEEE = 82,
213 INST_RECIP_CLAMPED = 83,
214 INST_RECIP_FF = 84,
215 INST_RECIP_IEEE = 85,
216 INST_RECIPSQRT_CLAMPED = 86,
217 INST_RECIPSQRT_FF = 87,
218 INST_RECIPSQRT_IEEE = 88,
219 INST_SQRT_IEEE = 89,
220 INST_FLT_TO_INT = 90,
221 INST_INT_TO_FLT = 91,
222 INST_UINT_TO_FLT = 92,
223 INST_SIN = 93,
224 INST_COS = 94,
225 INST_ASHR_INT = 95,
226 INST_LSHR_INT = 96,
227 INST_LSHL_INT = 97,
228 INST_MULLO_INT = 98,
229 INST_MULHI_INT = 99,
230 INST_MULLO_UINT = 100,
231 INST_MULHI_UINT = 101,
232 INST_RECIP_INT = 102,
233 INST_RECIP_UINT = 103,
234 INST_FLT_TO_UINT = 104,
235 INST_MUL_LIT = 105,
236 INST_MUL_LIT_M2 = 106,
237 INST_MUL_LIT_M4 = 107,
238 INST_MUL_LIT_D2 = 108,
239 INST_MULADD = 109,
240 INST_MULADD_M2 = 110,
241 INST_MULADD_M4 = 111,
242 INST_MULADD_D2 = 112,
243 INST_MULADD_IEEE = 113,
244 INST_MULADD_IEEE_M2 = 114,
245 INST_MULADD_IEEE_M4 = 115,
246 INST_MULADD_IEEE_D2 = 116,
247 INST_CNDE = 117,
248 INST_CNDGT = 118,
249 INST_CNDGE = 119,
250 INST_CNDE_INT = 120,
251 INST_CNDGT_INT = 121,
252 INST_CNDGE_INT = 122,
253 INST_COUNT
254 };
255
256 struct r600_instruction_info {
257 enum r600_instruction instruction;
258 unsigned opcode;
259 unsigned is_trans;
260 unsigned is_op3;
261 };
262
263
264 #endif