Merge branch 'xa_branch'
[mesa.git] / src / gallium / drivers / i915 / i915_fpc.h
/**************************************************************************
 *
 * Copyright 2003 Tungsten Graphics, Inc., Cedar Park, Texas.
 * All Rights Reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the
 * "Software"), to deal in the Software without restriction, including
 * without limitation the rights to use, copy, modify, merge, publish,
 * distribute, sub license, and/or sell copies of the Software, and to
 * permit persons to whom the Software is furnished to do so, subject to
 * the following conditions:
 *
 * The above copyright notice and this permission notice (including the
 * next paragraph) shall be included in all copies or substantial portions
 * of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
 * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
 *
 **************************************************************************/
27
28
29 #ifndef I915_FPC_H
30 #define I915_FPC_H
31
32
33 #include "i915_context.h"
34 #include "i915_reg.h"
35
36
37
/**
 * Number of uint elements in each of the declarations[] and program[]
 * buffers of struct i915_fp_compile.
 */
#define I915_PROGRAM_SIZE 192

/* Use these indices for pos/face routing; they must be >= I915_TEX_UNITS
 * (I915_TEX_UNITS is not defined in this header).
 */
#define I915_SEMANTIC_POS  10
#define I915_SEMANTIC_FACE 11
43
44
45 /**
46 * Program translation state
47 */
48 struct i915_fp_compile {
49 struct i915_fragment_shader *shader; /* the shader we're compiling */
50
51 boolean used_constants[I915_MAX_CONSTANT];
52
53 /** maps TGSI immediate index to constant slot */
54 uint num_immediates;
55 uint immediates_map[I915_MAX_CONSTANT];
56 float immediates[I915_MAX_CONSTANT][4];
57
58 boolean first_instruction;
59
60 uint declarations[I915_PROGRAM_SIZE];
61 uint program[I915_PROGRAM_SIZE];
62
63 uint *csr; /**< Cursor, points into program. */
64
65 uint *decl; /**< Cursor, points into declarations. */
66
67 uint decl_s; /**< flags for which s regs need to be decl'd */
68 uint decl_t; /**< flags for which t regs need to be decl'd */
69
70 uint temp_flag; /**< Tracks temporary regs which are in use */
71 uint utemp_flag; /**< Tracks TYPE_U temporary regs which are in use */
72
73 uint register_phases[16];
74 uint nr_tex_indirect;
75 uint nr_tex_insn;
76 uint nr_alu_insn;
77 uint nr_decl_insn;
78
79 boolean error; /**< Set if i915_program_error() is called */
80 uint NumNativeInstructions;
81 uint NumNativeAluInstructions;
82 uint NumNativeTexInstructions;
83 uint NumNativeTexIndirections;
84 };
85
86
/* Bit layout of a "ureg" (a register reference packed into 32 bits).
 *
 * Having zero and one in here makes the definition of swizzle a lot
 * easier.
 *
 *   bit  29..     register type
 *   bit  24..     register number
 *   bits 20..23   X channel selector, negate flag in bit 23
 *   bits 16..19   Y channel selector, negate flag in bit 19
 *   bits 12..15   Z channel selector, negate flag in bit 15
 *   bits  8..11   W channel selector, negate flag in bit 11
 *   bits  4..7    constant ZERO selector, bit 5 must be zero
 *   bits  0..3    constant ONE selector, bit 1 must be zero
 *
 * The six selector fields sit 4 bits apart, which is what lets a channel
 * be picked by shifting the whole word by a multiple of 4.
 */
#define UREG_TYPE_SHIFT               29
#define UREG_NR_SHIFT                 24
#define UREG_CHANNEL_X_NEGATE_SHIFT   23
#define UREG_CHANNEL_X_SHIFT          20
#define UREG_CHANNEL_Y_NEGATE_SHIFT   19
#define UREG_CHANNEL_Y_SHIFT          16
#define UREG_CHANNEL_Z_NEGATE_SHIFT   15
#define UREG_CHANNEL_Z_SHIFT          12
#define UREG_CHANNEL_W_NEGATE_SHIFT   11
#define UREG_CHANNEL_W_SHIFT          8
#define UREG_CHANNEL_ZERO_NEGATE_MBZ  5
#define UREG_CHANNEL_ZERO_SHIFT       4
#define UREG_CHANNEL_ONE_NEGATE_MBZ   1
#define UREG_CHANNEL_ONE_SHIFT        0
104
#define UREG_BAD          0xffffffff    /* not a valid ureg */

/* Short aliases for the channel selectors.  The SRC_* names are not defined
 * in this header (presumably they come from i915_reg.h -- confirm).
 *
 * NOTE(review): these one-letter macros are visible to every file that
 * includes this header and will rewrite any identifier called X, Y, Z, W,
 * ZERO or ONE; they are kept because existing users rely on them.
 */
#define X    SRC_X
#define Y    SRC_Y
#define Z    SRC_Z
#define W    SRC_W
#define ZERO SRC_ZERO
#define ONE  SRC_ONE
113
/* Construct a ureg:
 *
 * Packs a register type and number together with the identity swizzle
 * (X, Y, Z, W) and the ZERO/ONE selectors in their fixed slots.
 *
 * The type and number are shifted as unsigned values: the type field starts
 * at bit 29, so a type of 4 or more reaches bit 31, and shifting a signed
 * int into its sign bit is undefined behaviour.  The resulting bit pattern
 * is unchanged.
 */
#define UREG( type, nr ) (((unsigned)(type) << UREG_TYPE_SHIFT) |      \
                          ((unsigned)(nr)   << UREG_NR_SHIFT) |        \
                          (X    << UREG_CHANNEL_X_SHIFT) |             \
                          (Y    << UREG_CHANNEL_Y_SHIFT) |             \
                          (Z    << UREG_CHANNEL_Z_SHIFT) |             \
                          (W    << UREG_CHANNEL_W_SHIFT) |             \
                          (ZERO << UREG_CHANNEL_ZERO_SHIFT) |          \
                          (ONE  << UREG_CHANNEL_ONE_SHIFT))
124
/* GET_CHANNEL_SRC: shift the selector field number `channel` (0 = X ...
 * 5 = ONE) of `reg` up into the X slot (bits 20..23) and mask off the rest.
 *
 * CHANNEL_SRC: move a field sitting in the X slot down to destination slot
 * `channel` (0 = X, 1 = Y, 2 = Z, 3 = W).
 *
 * Every argument is parenthesized so that expression arguments such as
 * `a | b` or `i + 1` are shifted and multiplied as a whole.
 */
#define GET_CHANNEL_SRC( reg, channel ) (((reg) << ((channel) * 4)) & (0xf << 20))
#define CHANNEL_SRC( src, channel )     ((src) >> ((channel) * 4))
127
/* Extract the register type / register number fields from a ureg.
 * REG_TYPE_MASK and REG_NR_MASK are not defined in this header (presumably
 * they come from i915_reg.h -- confirm).
 */
#define GET_UREG_TYPE(reg) (((reg) >> UREG_TYPE_SHIFT) & REG_TYPE_MASK)
#define GET_UREG_NR(reg)   (((reg) >> UREG_NR_SHIFT) & REG_NR_MASK)
130
131
132
133 #define UREG_XYZW_CHANNEL_MASK 0x00ffff00
134
135 /* One neat thing about the UREG representation:
136 */
137 static INLINE int
138 swizzle(int reg, uint x, uint y, uint z, uint w)
139 {
140 assert(x <= SRC_ONE);
141 assert(y <= SRC_ONE);
142 assert(z <= SRC_ONE);
143 assert(w <= SRC_ONE);
144 return ((reg & ~UREG_XYZW_CHANNEL_MASK) |
145 CHANNEL_SRC(GET_CHANNEL_SRC(reg, x), 0) |
146 CHANNEL_SRC(GET_CHANNEL_SRC(reg, y), 1) |
147 CHANNEL_SRC(GET_CHANNEL_SRC(reg, z), 2) |
148 CHANNEL_SRC(GET_CHANNEL_SRC(reg, w), 3));
149 }
150
151
152
/***********************************************************************
 * Public interface for the compiler
 */

/**
 * Compiler entry point.
 *
 * NOTE(review): the implementation is not part of this header; judging by
 * the name it translates `fs` for the given context -- confirm in
 * i915_fpc_translate.c.
 */
extern void
i915_translate_fragment_program(struct i915_context *i915,
                                struct i915_fragment_shader *fs);
159
160
161
162 extern uint i915_get_temp(struct i915_fp_compile *p);
163 extern uint i915_get_utemp(struct i915_fp_compile *p);
164 extern void i915_release_utemps(struct i915_fp_compile *p);
165
166
167 extern uint i915_emit_texld(struct i915_fp_compile *p,
168 uint dest,
169 uint destmask,
170 uint sampler, uint coord, uint op);
171
172 extern uint i915_emit_arith(struct i915_fp_compile *p,
173 uint op,
174 uint dest,
175 uint mask,
176 uint saturate,
177 uint src0, uint src1, uint src2);
178
179 extern uint i915_emit_decl(struct i915_fp_compile *p,
180 uint type, uint nr, uint d0_flags);
181
182
183 extern uint i915_emit_const1f(struct i915_fp_compile *p, float c0);
184
185 extern uint i915_emit_const2f(struct i915_fp_compile *p,
186 float c0, float c1);
187
188 extern uint i915_emit_const4fv(struct i915_fp_compile *p,
189 const float * c);
190
191 extern uint i915_emit_const4f(struct i915_fp_compile *p,
192 float c0, float c1,
193 float c2, float c3);
194
195
196 /*======================================================================
197 * i915_fpc_debug.c
198 */
199 extern void i915_disassemble_program(const uint * program, uint sz);
200
201
/*======================================================================
 * i915_fpc_translate.c
 */

/**
 * Report a compile error.  Per the `error` field comment in
 * struct i915_fp_compile, calling this sets p->error.
 *
 * NOTE(review): `msg` followed by `...` looks like a printf-style format
 * string with arguments -- confirm before passing untrusted text as msg.
 */
extern void
i915_program_error(struct i915_fp_compile *p, const char *msg, ...);
208
209
210 #endif