2 * Mesa 3-D graphics library
5 * Copyright (C) 1999-2007 Brian Paul All Rights Reserved.
7 * Permission is hereby granted, free of charge, to any person obtaining a
8 * copy of this software and associated documentation files (the "Software"),
9 * to deal in the Software without restriction, including without limitation
10 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
11 * and/or sell copies of the Software, and to permit persons to whom the
12 * Software is furnished to do so, subject to the following conditions:
14 * The above copyright notice and this permission notice shall be included
15 * in all copies or substantial portions of the Software.
17 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
18 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
19 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
20 * BRIAN PAUL BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN
21 * AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
22 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
27 * Vertex/Fragment program optimizations and transformations for program
36 #include "prog_parameter.h"
37 #include "prog_statevars.h"
38 #include "programopt.h"
39 #include "prog_instruction.h"
43 * This function inserts instructions for coordinate modelview * projection
44 * into a vertex program.
45 * May be used to implement the position_invariant option.
48 _mesa_insert_mvp_code(GLcontext
*ctx
, struct gl_vertex_program
*vprog
)
50 struct prog_instruction
*newInst
;
51 const GLuint origLen
= vprog
->Base
.NumInstructions
;
52 const GLuint newLen
= origLen
+ 4;
56 * Setup state references for the modelview/projection matrix.
57 * XXX we should check if these state vars are already declared.
59 static const gl_state_index mvpState
[4][STATE_LENGTH
] = {
60 { STATE_MVP_MATRIX
, 0, 0, 0, 0 }, /* state.matrix.mvp.row[0] */
61 { STATE_MVP_MATRIX
, 0, 1, 1, 0 }, /* state.matrix.mvp.row[1] */
62 { STATE_MVP_MATRIX
, 0, 2, 2, 0 }, /* state.matrix.mvp.row[2] */
63 { STATE_MVP_MATRIX
, 0, 3, 3, 0 }, /* state.matrix.mvp.row[3] */
67 for (i
= 0; i
< 4; i
++) {
68 mvpRef
[i
] = _mesa_add_state_reference(vprog
->Base
.Parameters
,
72 /* Alloc storage for new instructions */
73 newInst
= _mesa_alloc_instructions(newLen
);
75 _mesa_error(ctx
, GL_OUT_OF_MEMORY
,
76 "glProgramString(inserting position_invariant code)");
81 * Generated instructions:
82 * newInst[0] = DP4 result.position.x, mvp.row[0], vertex.position;
83 * newInst[1] = DP4 result.position.y, mvp.row[1], vertex.position;
84 * newInst[2] = DP4 result.position.z, mvp.row[2], vertex.position;
85 * newInst[3] = DP4 result.position.w, mvp.row[3], vertex.position;
87 _mesa_init_instructions(newInst
, 4);
88 for (i
= 0; i
< 4; i
++) {
89 newInst
[i
].Opcode
= OPCODE_DP4
;
90 newInst
[i
].DstReg
.File
= PROGRAM_OUTPUT
;
91 newInst
[i
].DstReg
.Index
= VERT_RESULT_HPOS
;
92 newInst
[i
].DstReg
.WriteMask
= (WRITEMASK_X
<< i
);
93 newInst
[i
].SrcReg
[0].File
= PROGRAM_STATE_VAR
;
94 newInst
[i
].SrcReg
[0].Index
= mvpRef
[i
];
95 newInst
[i
].SrcReg
[0].Swizzle
= SWIZZLE_NOOP
;
96 newInst
[i
].SrcReg
[1].File
= PROGRAM_INPUT
;
97 newInst
[i
].SrcReg
[1].Index
= VERT_ATTRIB_POS
;
98 newInst
[i
].SrcReg
[1].Swizzle
= SWIZZLE_NOOP
;
101 /* Append original instructions after new instructions */
102 _mesa_copy_instructions (newInst
+ 4, vprog
->Base
.Instructions
, origLen
);
104 /* free old instructions */
105 _mesa_free(vprog
->Base
.Instructions
);
107 /* install new instructions */
108 vprog
->Base
.Instructions
= newInst
;
109 vprog
->Base
.NumInstructions
= newLen
;
110 vprog
->Base
.InputsRead
|= VERT_BIT_POS
;
111 vprog
->Base
.OutputsWritten
|= (1 << VERT_RESULT_HPOS
);
117 * Append extra instructions onto the given fragment program to implement
118 * the fog mode specified by fprog->FogOption.
119 * The fragment.fogcoord input is used to compute the fog blend factor.
121 * XXX with a little work, this function could be adapted to add fog code
122 * to vertex programs too.
125 _mesa_append_fog_code(GLcontext
*ctx
, struct gl_fragment_program
*fprog
)
127 static const gl_state_index fogPStateOpt
[STATE_LENGTH
]
128 = { STATE_INTERNAL
, STATE_FOG_PARAMS_OPTIMIZED
, 0, 0, 0 };
129 static const gl_state_index fogColorState
[STATE_LENGTH
]
130 = { STATE_FOG_COLOR
, 0, 0, 0, 0};
131 struct prog_instruction
*newInst
, *inst
;
132 const GLuint origLen
= fprog
->Base
.NumInstructions
;
133 const GLuint newLen
= origLen
+ 5;
135 GLint fogPRefOpt
, fogColorRef
; /* state references */
136 GLuint colorTemp
, fogFactorTemp
; /* temporary registerss */
138 if (fprog
->FogOption
== GL_NONE
) {
139 _mesa_problem(ctx
, "_mesa_append_fog_code() called for fragment program"
140 " with FogOption == GL_NONE");
144 /* Alloc storage for new instructions */
145 newInst
= _mesa_alloc_instructions(newLen
);
147 _mesa_error(ctx
, GL_OUT_OF_MEMORY
,
148 "glProgramString(inserting fog_option code)");
152 /* Copy orig instructions into new instruction buffer */
153 _mesa_copy_instructions(newInst
, fprog
->Base
.Instructions
, origLen
);
155 /* PARAM fogParamsRefOpt = internal optimized fog params; */
157 = _mesa_add_state_reference(fprog
->Base
.Parameters
, fogPStateOpt
);
158 /* PARAM fogColorRef = state.fog.color; */
160 = _mesa_add_state_reference(fprog
->Base
.Parameters
, fogColorState
);
162 /* TEMP colorTemp; */
163 colorTemp
= fprog
->Base
.NumTemporaries
++;
164 /* TEMP fogFactorTemp; */
165 fogFactorTemp
= fprog
->Base
.NumTemporaries
++;
167 /* Scan program to find where result.color is written */
169 for (i
= 0; i
< fprog
->Base
.NumInstructions
; i
++) {
170 if (inst
->Opcode
== OPCODE_END
)
172 if (inst
->DstReg
.File
== PROGRAM_OUTPUT
&&
173 inst
->DstReg
.Index
== FRAG_RESULT_COLR
) {
174 /* change the instruction to write to colorTemp w/ clamping */
175 inst
->DstReg
.File
= PROGRAM_TEMPORARY
;
176 inst
->DstReg
.Index
= colorTemp
;
177 inst
->SaturateMode
= SATURATE_ZERO_ONE
;
178 /* don't break (may be several writes to result.color) */
182 assert(inst
->Opcode
== OPCODE_END
); /* we'll overwrite this inst */
184 _mesa_init_instructions(inst
, 5);
186 /* emit instructions to compute fog blending factor */
187 if (fprog
->FogOption
== GL_LINEAR
) {
188 /* MAD fogFactorTemp.x, fragment.fogcoord.x, fogPRefOpt.x, fogPRefOpt.y; */
189 inst
->Opcode
= OPCODE_MAD
;
190 inst
->DstReg
.File
= PROGRAM_TEMPORARY
;
191 inst
->DstReg
.Index
= fogFactorTemp
;
192 inst
->DstReg
.WriteMask
= WRITEMASK_X
;
193 inst
->SrcReg
[0].File
= PROGRAM_INPUT
;
194 inst
->SrcReg
[0].Index
= FRAG_ATTRIB_FOGC
;
195 inst
->SrcReg
[0].Swizzle
= SWIZZLE_X
;
196 inst
->SrcReg
[1].File
= PROGRAM_STATE_VAR
;
197 inst
->SrcReg
[1].Index
= fogPRefOpt
;
198 inst
->SrcReg
[1].Swizzle
= SWIZZLE_X
;
199 inst
->SrcReg
[2].File
= PROGRAM_STATE_VAR
;
200 inst
->SrcReg
[2].Index
= fogPRefOpt
;
201 inst
->SrcReg
[2].Swizzle
= SWIZZLE_Y
;
202 inst
->SaturateMode
= SATURATE_ZERO_ONE
;
206 ASSERT(fprog
->FogOption
== GL_EXP
|| fprog
->FogOption
== GL_EXP2
);
207 /* fogPRefOpt.z = d/ln(2), fogPRefOpt.w = d/sqrt(ln(2) */
208 /* EXP: MUL fogFactorTemp.x, fogPRefOpt.z, fragment.fogcoord.x; */
209 /* EXP2: MUL fogFactorTemp.x, fogPRefOpt.w, fragment.fogcoord.x; */
210 inst
->Opcode
= OPCODE_MUL
;
211 inst
->DstReg
.File
= PROGRAM_TEMPORARY
;
212 inst
->DstReg
.Index
= fogFactorTemp
;
213 inst
->DstReg
.WriteMask
= WRITEMASK_X
;
214 inst
->SrcReg
[0].File
= PROGRAM_STATE_VAR
;
215 inst
->SrcReg
[0].Index
= fogPRefOpt
;
216 inst
->SrcReg
[0].Swizzle
217 = (fprog
->FogOption
== GL_EXP
) ? SWIZZLE_Z
: SWIZZLE_W
;
218 inst
->SrcReg
[1].File
= PROGRAM_INPUT
;
219 inst
->SrcReg
[1].Index
= FRAG_ATTRIB_FOGC
;
220 inst
->SrcReg
[1].Swizzle
= SWIZZLE_X
;
222 if (fprog
->FogOption
== GL_EXP2
) {
223 /* MUL fogFactorTemp.x, fogFactorTemp.x, fogFactorTemp.x; */
224 inst
->Opcode
= OPCODE_MUL
;
225 inst
->DstReg
.File
= PROGRAM_TEMPORARY
;
226 inst
->DstReg
.Index
= fogFactorTemp
;
227 inst
->DstReg
.WriteMask
= WRITEMASK_X
;
228 inst
->SrcReg
[0].File
= PROGRAM_TEMPORARY
;
229 inst
->SrcReg
[0].Index
= fogFactorTemp
;
230 inst
->SrcReg
[0].Swizzle
= SWIZZLE_X
;
231 inst
->SrcReg
[1].File
= PROGRAM_TEMPORARY
;
232 inst
->SrcReg
[1].Index
= fogFactorTemp
;
233 inst
->SrcReg
[1].Swizzle
= SWIZZLE_X
;
236 /* EX2_SAT fogFactorTemp.x, -fogFactorTemp.x; */
237 inst
->Opcode
= OPCODE_EX2
;
238 inst
->DstReg
.File
= PROGRAM_TEMPORARY
;
239 inst
->DstReg
.Index
= fogFactorTemp
;
240 inst
->DstReg
.WriteMask
= WRITEMASK_X
;
241 inst
->SrcReg
[0].File
= PROGRAM_TEMPORARY
;
242 inst
->SrcReg
[0].Index
= fogFactorTemp
;
243 inst
->SrcReg
[0].NegateBase
= GL_TRUE
;
244 inst
->SrcReg
[0].Swizzle
= SWIZZLE_X
;
245 inst
->SaturateMode
= SATURATE_ZERO_ONE
;
248 /* LRP result.color.xyz, fogFactorTemp.xxxx, colorTemp, fogColorRef; */
249 inst
->Opcode
= OPCODE_LRP
;
250 inst
->DstReg
.File
= PROGRAM_OUTPUT
;
251 inst
->DstReg
.Index
= FRAG_RESULT_COLR
;
252 inst
->DstReg
.WriteMask
= WRITEMASK_XYZ
;
253 inst
->SrcReg
[0].File
= PROGRAM_TEMPORARY
;
254 inst
->SrcReg
[0].Index
= fogFactorTemp
;
255 inst
->SrcReg
[0].Swizzle
256 = MAKE_SWIZZLE4(SWIZZLE_X
, SWIZZLE_X
, SWIZZLE_X
, SWIZZLE_X
);
257 inst
->SrcReg
[1].File
= PROGRAM_TEMPORARY
;
258 inst
->SrcReg
[1].Index
= colorTemp
;
259 inst
->SrcReg
[1].Swizzle
= SWIZZLE_NOOP
;
260 inst
->SrcReg
[2].File
= PROGRAM_STATE_VAR
;
261 inst
->SrcReg
[2].Index
= fogColorRef
;
262 inst
->SrcReg
[2].Swizzle
= SWIZZLE_NOOP
;
264 /* MOV result.color.w, colorTemp.x; # copy alpha */
265 inst
->Opcode
= OPCODE_MOV
;
266 inst
->DstReg
.File
= PROGRAM_OUTPUT
;
267 inst
->DstReg
.Index
= FRAG_RESULT_COLR
;
268 inst
->DstReg
.WriteMask
= WRITEMASK_W
;
269 inst
->SrcReg
[0].File
= PROGRAM_TEMPORARY
;
270 inst
->SrcReg
[0].Index
= colorTemp
;
271 inst
->SrcReg
[0].Swizzle
= SWIZZLE_NOOP
;
274 inst
->Opcode
= OPCODE_END
;
277 /* free old instructions */
278 _mesa_free(fprog
->Base
.Instructions
);
280 /* install new instructions */
281 fprog
->Base
.Instructions
= newInst
;
282 fprog
->Base
.NumInstructions
= inst
- newInst
;
283 fprog
->Base
.InputsRead
|= FRAG_BIT_FOGC
;
284 /* XXX do this? fprog->FogOption = GL_NONE; */
290 is_texture_instruction(const struct prog_instruction
*inst
)
292 switch (inst
->Opcode
) {
307 * Count the number of texure indirections in the given program.
308 * The program's NumTexIndirections field will be updated.
309 * See the GL_ARB_fragment_program spec (issue 24) for details.
310 * XXX we count texture indirections in texenvprogram.c (maybe use this code
311 * instead and elsewhere).
314 _mesa_count_texture_indirections(struct gl_program
*prog
)
316 GLuint indirections
= 1;
317 GLbitfield tempsOutput
= 0x0;
318 GLbitfield aluTemps
= 0x0;
321 for (i
= 0; i
< prog
->NumInstructions
; i
++) {
322 const struct prog_instruction
*inst
= prog
->Instructions
+ i
;
324 if (is_texture_instruction(inst
)) {
325 if (((inst
->SrcReg
[0].File
== PROGRAM_TEMPORARY
) &&
326 (tempsOutput
& (1 << inst
->SrcReg
[0].Index
))) ||
327 ((inst
->Opcode
!= OPCODE_KIL
) &&
328 (inst
->DstReg
.File
== PROGRAM_TEMPORARY
) &&
329 (aluTemps
& (1 << inst
->DstReg
.Index
))))
338 for (j
= 0; j
< 3; j
++) {
339 if (inst
->SrcReg
[j
].File
== PROGRAM_TEMPORARY
)
340 aluTemps
|= (1 << inst
->SrcReg
[j
].Index
);
342 if (inst
->DstReg
.File
== PROGRAM_TEMPORARY
)
343 aluTemps
|= (1 << inst
->DstReg
.Index
);
346 if ((inst
->Opcode
!= OPCODE_KIL
) && (inst
->DstReg
.File
== PROGRAM_TEMPORARY
))
347 tempsOutput
|= (1 << inst
->DstReg
.Index
);
350 prog
->NumTexIndirections
= indirections
;
355 * Count number of texture instructions in given program and update the
356 * program's NumTexInstructions field.
359 _mesa_count_texture_instructions(struct gl_program
*prog
)
362 prog
->NumTexInstructions
= 0;
363 for (i
= 0; i
< prog
->NumInstructions
; i
++) {
364 prog
->NumTexInstructions
+= is_texture_instruction(prog
->Instructions
+ i
);