2 * Mesa 3-D graphics library
5 * Copyright (C) 1999-2008 Brian Paul All Rights Reserved.
7 * Permission is hereby granted, free of charge, to any person obtaining a
8 * copy of this software and associated documentation files (the "Software"),
9 * to deal in the Software without restriction, including without limitation
10 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
11 * and/or sell copies of the Software, and to permit persons to whom the
12 * Software is furnished to do so, subject to the following conditions:
14 * The above copyright notice and this permission notice shall be included
15 * in all copies or substantial portions of the Software.
17 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
18 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
19 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
20 * BRIAN PAUL BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN
21 * AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
22 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
27 * \file prog_instruction.h
29 * Vertex/fragment program instruction datatypes and constants.
32 * \author Keith Whitwell
33 * \author Ian Romanick <idr@us.ibm.com>
37 #ifndef PROG_INSTRUCTION_H
38 #define PROG_INSTRUCTION_H
41 #include "main/mfeatures.h"
/*
 * Swizzle selectors and packing helpers.
 *
 * A packed swizzle is four 3-bit selector fields stored at bit offsets
 * 0, 3, 6 and 9 (12 bits in total).  Selector values 4, 5 and 7 are the
 * special ZERO / ONE / NIL selectors defined here.
 * NOTE(review): SWIZZLE_X .. SWIZZLE_W are defined outside this excerpt;
 * presumably they are 0..3 (which would make SWIZZLE_XYZW identical to
 * SWIZZLE_NOOP) -- confirm against their definitions.
 */
53 #define SWIZZLE_ZERO 4 /**< For SWZ instruction only */
54 #define SWIZZLE_ONE 5 /**< For SWZ instruction only */
55 #define SWIZZLE_NIL 7 /**< used during shader code gen (undefined value) */
/* Pack four selectors into one value.  The arguments are shifted but not
 * masked, so each one must already fit in 3 bits. */
58 #define MAKE_SWIZZLE4(a,b,c,d) (((a)<<0) | ((b)<<3) | ((c)<<6) | ((d)<<9))
/* Packed swizzle built from the literal selectors 0,1,2,3. */
59 #define SWIZZLE_NOOP MAKE_SWIZZLE4(0,1,2,3)
/* Extract the 3-bit selector in field idx of a packed swizzle
 * (field 0 is the least significant). */
60 #define GET_SWZ(swz, idx) (((swz) >> ((idx)*3)) & 0x7)
/* Extract bit idx of msk as 0 or 1. */
61 #define GET_BIT(msk, idx) (((msk) >> (idx)) & 0x1)
/* Pre-packed swizzles: the in-order swizzle and the four "replicate one
 * component" swizzles. */
63 #define SWIZZLE_XYZW MAKE_SWIZZLE4(SWIZZLE_X, SWIZZLE_Y, SWIZZLE_Z, SWIZZLE_W)
64 #define SWIZZLE_XXXX MAKE_SWIZZLE4(SWIZZLE_X, SWIZZLE_X, SWIZZLE_X, SWIZZLE_X)
65 #define SWIZZLE_YYYY MAKE_SWIZZLE4(SWIZZLE_Y, SWIZZLE_Y, SWIZZLE_Y, SWIZZLE_Y)
66 #define SWIZZLE_ZZZZ MAKE_SWIZZLE4(SWIZZLE_Z, SWIZZLE_Z, SWIZZLE_Z, SWIZZLE_Z)
67 #define SWIZZLE_WWWW MAKE_SWIZZLE4(SWIZZLE_W, SWIZZLE_W, SWIZZLE_W, SWIZZLE_W)
71 * Writemask values, 1 bit per component.
/*
 * 4-bit component masks: X = 0x1, Y = 0x2, Z = 0x4, W = 0x8.
 * Each multi-letter name is the bitwise OR of the single-component masks
 * it spells out, so all 15 non-empty combinations are listed (0x1..0xf).
 */
74 #define WRITEMASK_X 0x1
75 #define WRITEMASK_Y 0x2
76 #define WRITEMASK_XY 0x3
77 #define WRITEMASK_Z 0x4
78 #define WRITEMASK_XZ 0x5
79 #define WRITEMASK_YZ 0x6
80 #define WRITEMASK_XYZ 0x7
81 #define WRITEMASK_W 0x8
82 #define WRITEMASK_XW 0x9
83 #define WRITEMASK_YW 0xa
84 #define WRITEMASK_XYW 0xb
85 #define WRITEMASK_ZW 0xc
86 #define WRITEMASK_XZW 0xd
87 #define WRITEMASK_YZW 0xe
88 #define WRITEMASK_XYZW 0xf
/*
 * Condition code tests, numbered 1..9 in this excerpt.  Seven compare
 * against zero or test for NaN; COND_TR and COND_FL are the constant
 * always-true / always-false tests.
 */
96 #define COND_GT 1 /**< greater than zero */
97 #define COND_EQ 2 /**< equal to zero */
98 #define COND_LT 3 /**< less than zero */
99 #define COND_UN 4 /**< unordered (NaN) */
100 #define COND_GE 5 /**< greater than or equal to zero */
101 #define COND_LE 6 /**< less than or equal to zero */
102 #define COND_NE 7 /**< not equal to zero */
103 #define COND_TR 8 /**< always true */
104 #define COND_FL 9 /**< always false */
109 * Instruction precision for GL_NV_fragment_program
119 * Saturation modes when storing values.
/*
 * Values for the 2-bit prog_instruction::SaturateMode field.
 * NOTE(review): going by its name, SATURATE_ZERO_ONE selects clamping to
 * [0,1]; no token for the [-1,1] mode is visible in this excerpt -- confirm
 * whether one exists elsewhere.
 */
122 #define SATURATE_OFF 0
123 #define SATURATE_ZERO_ONE 1
128 * Per-component negation masks
/*
 * Combined negation masks: 0x7 sets the low three bits, 0xf sets all four
 * bits, and 0x0 sets none.
 * NOTE(review): the single-component masks are not visible in this excerpt;
 * presumably they use the same X=0x1 .. W=0x8 layout as WRITEMASK_* -- confirm.
 */
135 #define NEGATE_XYZ 0x7
136 #define NEGATE_XYZW 0xf
137 #define NEGATE_NONE 0x0
142 * Program instruction opcodes, for both vertex and fragment programs.
143 * \note changes to this opcode list must be reflected in t_vb_arbprogram.c
145 typedef enum prog_opcode
{
146 /* ARB_vp ARB_fp NV_vp NV_fp GLSL */
147 /*------------------------------------------*/
148 OPCODE_NOP
= 0, /* X */
149 OPCODE_ABS
, /* X X 1.1 X */
150 OPCODE_ADD
, /* X X X X X */
153 OPCODE_ARL
, /* X X */
154 OPCODE_ARL_NV
, /* 2 */
156 OPCODE_BGNLOOP
, /* opt */
157 OPCODE_BGNSUB
, /* opt */
158 OPCODE_BRA
, /* 2 X */
159 OPCODE_BRK
, /* 2 opt */
160 OPCODE_CAL
, /* 2 2 */
162 OPCODE_CONT
, /* opt */
163 OPCODE_COS
, /* X 2 X X */
164 OPCODE_DDX
, /* X X */
165 OPCODE_DDY
, /* X X */
168 OPCODE_DP3
, /* X X X X X */
169 OPCODE_DP4
, /* X X X X X */
170 OPCODE_DPH
, /* X X 1.1 */
171 OPCODE_DST
, /* X X X X */
173 OPCODE_END
, /* X X X X opt */
174 OPCODE_ENDIF
, /* opt */
175 OPCODE_ENDLOOP
, /* opt */
176 OPCODE_ENDSUB
, /* opt */
177 OPCODE_EX2
, /* X X 2 X X */
178 OPCODE_EXP
, /* X X X */
179 OPCODE_FLR
, /* X X 2 X X */
180 OPCODE_FRC
, /* X X 2 X X */
183 OPCODE_KIL_NV
, /* X X */
184 OPCODE_LG2
, /* X X 2 X X */
185 OPCODE_LIT
, /* X X X X */
186 OPCODE_LOG
, /* X X X */
187 OPCODE_LRP
, /* X X */
188 OPCODE_MAD
, /* X X X X X */
189 OPCODE_MAX
, /* X X X X X */
190 OPCODE_MIN
, /* X X X X X */
191 OPCODE_MOV
, /* X X X X X */
192 OPCODE_MUL
, /* X X X X X */
193 OPCODE_NOISE1
, /* X */
194 OPCODE_NOISE2
, /* X */
195 OPCODE_NOISE3
, /* X */
196 OPCODE_NOISE4
, /* X */
202 OPCODE_PK2US
, /* X */
204 OPCODE_PK4UB
, /* X */
205 OPCODE_POW
, /* X X X X */
207 OPCODE_PRINT
, /* X X */
208 OPCODE_PUSHA
, /* 3 */
209 OPCODE_RCC
, /* 1.1 */
210 OPCODE_RCP
, /* X X X X X */
211 OPCODE_RET
, /* 2 2 */
212 OPCODE_RFL
, /* X X */
213 OPCODE_RSQ
, /* X X X X X */
215 OPCODE_SEQ
, /* 2 X X */
216 OPCODE_SFL
, /* 2 X */
217 OPCODE_SGE
, /* X X X X X */
218 OPCODE_SGT
, /* 2 X X */
219 OPCODE_SIN
, /* X 2 X X */
220 OPCODE_SLE
, /* 2 X X */
221 OPCODE_SLT
, /* X X X X X */
222 OPCODE_SNE
, /* 2 X X */
224 OPCODE_STR
, /* 2 X */
225 OPCODE_SUB
, /* X X 1.1 X X */
226 OPCODE_SWZ
, /* X X */
227 OPCODE_TEX
, /* X 3 X X */
228 OPCODE_TXB
, /* X 3 X */
229 OPCODE_TXD
, /* X X */
230 OPCODE_TXL
, /* 3 2 X */
231 OPCODE_TXP
, /* X X */
232 OPCODE_TXP_NV
, /* 3 X */
233 OPCODE_TRUNC
, /* X */
235 OPCODE_UP2US
, /* X */
237 OPCODE_UP4UB
, /* X */
240 OPCODE_XPD
, /* X X X */
246 * Number of bits for the src/dst register Index field.
247 * This limits the size of temp/uniform register files.
/*
 * Width of the register Index bit-fields.  prog_dst_register::Index is an
 * unsigned field of exactly this many bits (0..1023 at the current value),
 * while prog_src_register::Index is a signed field one bit wider so that it
 * can also hold negative values.
 */
249 #define INST_INDEX_BITS 10
253 * Instruction source register.
255 struct prog_src_register
257 GLuint File
:4; /**< One of the PROGRAM_* register file values. */
258 GLint Index
:(INST_INDEX_BITS
+1); /**< Extra bit here for sign bit.
259 * May be negative for relative addressing.
264 /** Take the component-wise absolute value */
269 * This will either be NEGATE_NONE or NEGATE_XYZW, except for the SWZ
270 * instruction which allows per-component negation.
277 * Instruction destination register.
279 struct prog_dst_register
281 GLuint File
:4; /**< One of the PROGRAM_* register file values */
282 GLuint Index
:INST_INDEX_BITS
; /**< Unsigned, never negative */
287 * \name Conditional destination update control.
290 * NV_fragment_program, NV_fragment_program_option, NV_vertex_program2,
291 * NV_vertex_program2_option.
295 * Takes one of the 9 possible condition values (EQ, FL, GT, GE, LE, LT,
296 * NE, TR, or UN). Dest reg is only written to if the matching
297 * (swizzled) condition code value passes. When a conditional update mask
298 * is not specified, this will be \c COND_TR.
303 * Condition code swizzle value.
305 GLuint CondSwizzle
:12;
308 * Selects the condition code register to use for conditional destination
309 * update masking. In NV_fragment_program or NV_vertex_program2 mode, only
310 * condition code register 0 is available. In NV_vertex_program3 mode,
311 * condition code registers 0 and 1 are available.
320 * Vertex/fragment program instruction.
322 struct prog_instruction
324 gl_inst_opcode Opcode
;
325 struct prog_src_register SrcReg
[3];
326 struct prog_dst_register DstReg
;
329 * Indicates that the instruction should update the condition code
333 * NV_fragment_program, NV_fragment_program_option, NV_vertex_program2,
334 * NV_vertex_program2_option.
339 * If prog_instruction::CondUpdate is \c GL_TRUE, this value selects the
340 * condition code register that is to be updated.
342 * In GL_NV_fragment_program or GL_NV_vertex_program2 mode, only condition
343 * code register 0 is available. In GL_NV_vertex_program3 mode, condition
344 * code registers 0 and 1 are available.
347 * NV_fragment_program, NV_fragment_program_option, NV_vertex_program2,
348 * NV_vertex_program2_option.
353 * Saturate each value of the vectored result to the range [0,1] or the
354 * range [-1,1]. \c SSAT mode (i.e., saturation to the range [-1,1]) is
355 * only available in NV_fragment_program2 mode.
356 * Value is one of the SATURATE_* tokens.
359 * NV_fragment_program, NV_fragment_program_option, NV_vertex_program3.
361 GLuint SaturateMode
:2;
364 * Per-instruction selectable precision: FLOAT32, FLOAT16, FIXED12.
367 * NV_fragment_program, NV_fragment_program_option.
372 * \name Extra fields for TEX, TXB, TXD, TXL, TXP instructions.
375 /** Source texture unit. */
378 /** Source texture target, one of TEXTURE_{1D,2D,3D,CUBE,RECT}_INDEX */
379 GLuint TexSrcTarget
:3;
381 /** True if tex instruction should do shadow comparison */
386 * For BRA and CAL instructions, the location to jump to.
387 * For BGNLOOP, points to ENDLOOP (and vice-versa).
388 * For BRK, points to BGNLOOP (which points to ENDLOOP).
389 * For IF, points to ELSE or ENDIF.
390 * For ELSE, points to ENDIF.
394 /** for debugging purposes */
397 /** Arbitrary data. Used for OPCODE_PRINT and some drivers */
400 /** for driver use (try to remove someday) */
406 _mesa_init_instructions(struct prog_instruction
*inst
, GLuint count
);
408 extern struct prog_instruction
*
409 _mesa_alloc_instructions(GLuint numInst
);
411 extern struct prog_instruction
*
412 _mesa_realloc_instructions(struct prog_instruction
*oldInst
,
413 GLuint numOldInst
, GLuint numNewInst
);
415 extern struct prog_instruction
*
416 _mesa_copy_instructions(struct prog_instruction
*dest
,
417 const struct prog_instruction
*src
, GLuint n
);
420 _mesa_free_instructions(struct prog_instruction
*inst
, GLuint count
);
423 _mesa_num_inst_src_regs(gl_inst_opcode opcode
);
426 _mesa_num_inst_dst_regs(gl_inst_opcode opcode
);
429 _mesa_is_tex_instruction(gl_inst_opcode opcode
);
432 _mesa_check_soa_dependencies(const struct prog_instruction
*inst
);
435 _mesa_opcode_string(gl_inst_opcode opcode
);
438 #endif /* PROG_INSTRUCTION_H */