0a4710151a038d82dc8e8b386bf06d5970b8947d
[mesa.git] / src / gallium / drivers / r300 / r300_surface.c
1 /*
2 * Copyright 2008 Corbin Simpson <MostAwesomeDude@gmail.com>
3 * Joakim Sindholt <opensource@zhasha.com>
4 *
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the "Software"),
7 * to deal in the Software without restriction, including without limitation
8 * on the rights to use, copy, modify, merge, publish, distribute, sub
9 * license, and/or sell copies of the Software, and to permit persons to whom
10 * the Software is furnished to do so, subject to the following conditions:
11 *
12 * The above copyright notice and this permission notice (including the next
13 * paragraph) shall be included in all copies or substantial portions of the
14 * Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
20 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
21 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
22 * USE OR OTHER DEALINGS IN THE SOFTWARE. */
23
24 #include "r300_surface.h"
25
26 /* Provides pipe_context's "surface_fill". Commonly used for clearing
27 * buffers. */
28 static void r300_surface_fill(struct pipe_context* pipe,
29 struct pipe_surface* dest,
30 unsigned x, unsigned y,
31 unsigned w, unsigned h,
32 unsigned color)
33 {
34 struct r300_context* r300 = r300_context(pipe);
35 CS_LOCALS(r300);
36 struct r300_capabilities* caps = ((struct r300_screen*)pipe->screen)->caps;
37 struct r300_texture* tex = (struct r300_texture*)dest->texture;
38 int i;
39 float r, g, b, a;
40 r = (float)((color >> 16) & 0xff) / 255.0f;
41 g = (float)((color >> 8) & 0xff) / 255.0f;
42 b = (float)((color >> 0) & 0xff) / 255.0f;
43 debug_printf("r300: Filling surface %p at (%d,%d),"
44 " dimensions %dx%d (stride %d), color 0x%x\n",
45 dest, x, y, w, h, dest->stride, color);
46
47 /* Fallback? */
48 if (0) {
49 debug_printf("r300: Falling back on surface clear...");
50 void* map = pipe->screen->surface_map(pipe->screen, dest,
51 PIPE_BUFFER_USAGE_CPU_WRITE);
52 pipe_fill_rect(map, &dest->block, &dest->stride, x, y, w, h, color);
53 pipe->screen->surface_unmap(pipe->screen, dest);
54 return;
55 }
56
57 BEGIN_CS(161 + (caps->is_r500 ? 22 : 14) + (caps->has_tcl ? 4 : 2));
58 /* Flush PVS. */
59 OUT_CS_REG(R300_VAP_PVS_STATE_FLUSH_REG, 0x0);
60
61 OUT_CS_REG(R300_SE_VTE_CNTL, R300_VPORT_X_SCALE_ENA |
62 R300_VPORT_X_OFFSET_ENA | R300_VPORT_Y_SCALE_ENA |
63 R300_VPORT_Y_OFFSET_ENA | R300_VPORT_Z_SCALE_ENA |
64 R300_VPORT_Z_OFFSET_ENA | R300_VTX_W0_FMT);
65 /* Vertex size. */
66 OUT_CS_REG(R300_VAP_VTX_SIZE, 0x8);
67 /* Max and min vertex index clamp. */
68 OUT_CS_REG(R300_VAP_VF_MAX_VTX_INDX, 0xFFFFFF);
69 OUT_CS_REG(R300_VAP_VF_MIN_VTX_INDX, 0x0);
70 /* XXX endian */
71 OUT_CS_REG(R300_VAP_CNTL_STATUS, R300_VC_NO_SWAP);
72 OUT_CS_REG(R300_VAP_PROG_STREAM_CNTL_0, 0x0);
73 /* XXX magic number not in r300_reg */
74 OUT_CS_REG(R300_VAP_PSC_SGN_NORM_CNTL, 0xAAAAAAAA);
75 OUT_CS_REG(R300_VAP_CLIP_CNTL, 0x0);
76 OUT_CS_REG_SEQ(R300_VAP_GB_VERT_CLIP_ADJ, 4);
77 OUT_CS_32F(1.0);
78 OUT_CS_32F(1.0);
79 OUT_CS_32F(1.0);
80 OUT_CS_32F(1.0);
81 /* XXX is this too long? */
82 OUT_CS_REG(VAP_PVS_VTX_TIMEOUT_REG, 0xFFFF);
83 OUT_CS_REG(R300_GB_ENABLE, R300_GB_POINT_STUFF_ENABLE |
84 R300_GB_LINE_STUFF_ENABLE | R300_GB_TRIANGLE_STUFF_ENABLE);
85 /* XXX more magic numbers */
86 OUT_CS_REG(R300_GB_MSPOS0, 0x66666666);
87 OUT_CS_REG(R300_GB_MSPOS1, 0x66666666);
88 /* XXX why doesn't classic Mesa write the number of pipes, too? */
89 OUT_CS_REG(R300_GB_TILE_CONFIG, R300_GB_TILE_ENABLE |
90 R300_GB_TILE_SIZE_16);
91 OUT_CS_REG(R300_GB_SELECT, R300_GB_FOG_SELECT_1_1_W);
92 OUT_CS_REG(R300_GB_AA_CONFIG, 0x0);
93 /* XXX point tex stuffing */
94 OUT_CS_REG_SEQ(R300_GA_POINT_S0, 1);
95 OUT_CS_32F(0.0);
96 OUT_CS_REG_SEQ(R300_GA_POINT_S1, 1);
97 OUT_CS_32F(1.0);
98 OUT_CS_REG(R300_GA_TRIANGLE_STIPPLE, 0x5 |
99 (0x5 << R300_GA_TRIANGLE_STIPPLE_Y_SHIFT_SHIFT));
100 /* XXX should this be related to the actual point size? */
101 OUT_CS_REG(R300_GA_POINT_MINMAX, 0x6 |
102 (0x1800 << R300_GA_POINT_MINMAX_MAX_SHIFT));
103 /* XXX this big chunk should be refactored into rs_state */
104 OUT_CS_REG(R300_GA_LINE_CNTL, 0x00030006);
105 OUT_CS_REG(R300_GA_LINE_STIPPLE_CONFIG, 0x3BAAAAAB);
106 OUT_CS_REG(R300_GA_LINE_STIPPLE_VALUE, 0x00000000);
107 OUT_CS_REG(R300_GA_LINE_S0, 0x00000000);
108 OUT_CS_REG(R300_GA_LINE_S1, 0x3F800000);
109 OUT_CS_REG(R300_GA_ENHANCE, 0x00000002);
110 OUT_CS_REG(R300_GA_COLOR_CONTROL, 0x0003AAAA);
111 OUT_CS_REG(R300_GA_SOLID_RG, 0x00000000);
112 OUT_CS_REG(R300_GA_SOLID_BA, 0x00000000);
113 OUT_CS_REG(R300_GA_POLY_MODE, 0x00000000);
114 OUT_CS_REG(R300_GA_ROUND_MODE, 0x00000001);
115 OUT_CS_REG(R300_GA_OFFSET, 0x00000000);
116 OUT_CS_REG(R300_GA_FOG_SCALE, 0x3DBF1412);
117 OUT_CS_REG(R300_GA_FOG_OFFSET, 0x00000000);
118 OUT_CS_REG(R300_SU_TEX_WRAP, 0x00000000);
119 OUT_CS_REG(R300_SU_POLY_OFFSET_FRONT_SCALE, 0x00000000);
120 OUT_CS_REG(R300_SU_POLY_OFFSET_FRONT_OFFSET, 0x00000000);
121 OUT_CS_REG(R300_SU_POLY_OFFSET_BACK_SCALE, 0x00000000);
122 OUT_CS_REG(R300_SU_POLY_OFFSET_BACK_OFFSET, 0x00000000);
123 OUT_CS_REG(R300_SU_POLY_OFFSET_ENABLE, 0x00000000);
124 OUT_CS_REG(R300_SU_CULL_MODE, 0x00000000);
125 OUT_CS_REG(R300_SU_DEPTH_SCALE, 0x4B7FFFFF);
126 OUT_CS_REG(R300_SU_DEPTH_OFFSET, 0x00000000);
127 OUT_CS_REG(R300_SC_HYPERZ, 0x0000001C);
128 OUT_CS_REG(R300_SC_EDGERULE, 0x2DA49525);
129 OUT_CS_REG(R300_FG_FOG_BLEND, 0x00000002);
130 OUT_CS_REG(R300_FG_FOG_COLOR_R, 0x00000000);
131 OUT_CS_REG(R300_FG_FOG_COLOR_G, 0x00000000);
132 OUT_CS_REG(R300_FG_FOG_COLOR_B, 0x00000000);
133 OUT_CS_REG(R300_FG_DEPTH_SRC, 0x00000000);
134 OUT_CS_REG(R300_FG_DEPTH_SRC, 0x00000000);
135 OUT_CS_REG(R300_RB3D_CCTL, 0x00000000);
136 OUT_CS_REG(RB3D_COLOR_CHANNEL_MASK, 0x0000000F);
137
138 /* XXX: Oh the wonderful unknown.
139 * Not writing these 8 regs seems to make no difference at all and seeing
140 * as how they're not documented, we should leave them out for now.
141 OUT_CS_REG_SEQ(0x4E54, 8);
142 for (i = 0; i < 8; i++) {
143 OUT_CS(0x00000000);
144 } */
145 OUT_CS_REG(R300_RB3D_AARESOLVE_CTL, 0x00000000);
146 OUT_CS_REG(R500_RB3D_DISCARD_SRC_PIXEL_LTE_THRESHOLD, 0x00000000);
147 OUT_CS_REG(R500_RB3D_DISCARD_SRC_PIXEL_GTE_THRESHOLD, 0xFFFFFFFF);
148 OUT_CS_REG(R300_ZB_FORMAT, 0x00000002);
149 OUT_CS_REG(R300_ZB_ZCACHE_CTLSTAT, 0x00000003);
150 OUT_CS_REG(R300_ZB_BW_CNTL, 0x00000000);
151 OUT_CS_REG(R300_ZB_DEPTHCLEARVALUE, 0x00000000);
152 /* XXX Moar unknown that should probably be left out.
153 OUT_CS_REG(0x4F30, 0x00000000);
154 OUT_CS_REG(0x4F34, 0x00000000); */
155 OUT_CS_REG(R300_ZB_HIZ_OFFSET, 0x00000000);
156 OUT_CS_REG(R300_ZB_HIZ_PITCH, 0x00000000);
157 if (caps->has_tcl) {
158 OUT_CS_REG(R300_VAP_PROG_STREAM_CNTL_0,
159 (R300_DATA_TYPE_FLOAT_4 << R300_DATA_TYPE_0_SHIFT) |
160 ((R300_LAST_VEC | (1 << R300_DST_VEC_LOC_SHIFT) |
161 R300_DATA_TYPE_FLOAT_4) << R300_DATA_TYPE_1_SHIFT));
162 } else {
163 OUT_CS_REG(R300_VAP_PROG_STREAM_CNTL_0,
164 (R300_DATA_TYPE_FLOAT_4 << R300_DATA_TYPE_0_SHIFT) |
165 ((R300_LAST_VEC | (2 << R300_DST_VEC_LOC_SHIFT) |
166 R300_DATA_TYPE_FLOAT_4) << R300_DATA_TYPE_1_SHIFT));
167 }
168 OUT_CS_REG(R300_FG_FOG_BLEND, 0x00000000);
169 OUT_CS_REG(R300_VAP_PROG_STREAM_CNTL_EXT_0, 0xF688F688);
170 OUT_CS_REG(R300_VAP_VTX_STATE_CNTL, 0x1);
171 OUT_CS_REG(R300_VAP_VSM_VTX_ASSM, 0x405);
172 OUT_CS_REG(R300_SE_VTE_CNTL, 0x0000043F);
173 OUT_CS_REG(R300_VAP_VTX_SIZE, 0x00000008);
174 OUT_CS_REG(R300_VAP_PSC_SGN_NORM_CNTL, 0xAAAAAAAA);
175 OUT_CS_REG(R300_VAP_OUTPUT_VTX_FMT_0, 0x00000003);
176 OUT_CS_REG(R300_VAP_OUTPUT_VTX_FMT_1, 0x00000000);
177 OUT_CS_REG(R300_TX_ENABLE, 0x0);
178 /* XXX viewport setup */
179 OUT_CS_REG_SEQ(R300_SE_VPORT_XSCALE, 6);
180 OUT_CS_32F(1.0);
181 OUT_CS_32F((float)x);
182 OUT_CS_32F(1.0);
183 OUT_CS_32F((float)y);
184 OUT_CS_32F(1.0);
185 OUT_CS_32F(0.0);
186
187 if (caps->has_tcl) {
188 OUT_CS_REG(R300_VAP_CLIP_CNTL, R300_CLIP_DISABLE |
189 R300_PS_UCP_MODE_CLIP_AS_TRIFAN);
190 }
191
192 /* The size of the point we're about to draw, in sixths of pixels */
193 OUT_CS_REG(R300_GA_POINT_SIZE,
194 ((h * 6) & R300_POINTSIZE_Y_MASK) |
195 ((w * 6) << R300_POINTSIZE_X_SHIFT));
196
197 /* XXX */
198 OUT_CS_REG(R300_SC_CLIP_RULE, 0xaaaa);
199
200 /* Pixel scissors */
201 OUT_CS_REG_SEQ(R300_SC_SCISSORS_TL, 2);
202 OUT_CS((x << R300_SCISSORS_X_SHIFT) | (y << R300_SCISSORS_Y_SHIFT));
203 OUT_CS((w << R300_SCISSORS_X_SHIFT) | (h << R300_SCISSORS_Y_SHIFT));
204
205 /* RS block setup */
206 if (caps->is_r500) {
207 /* XXX We seem to be in disagreement about how many of these we have
208 * RS:RS_IP_[0-15] [R/W] 32 bits Access: 8/16/32 MMReg:0x4074-0x40b0
209 * Now that's from the docs. I don't care what the mesa driver says */
210 OUT_CS_REG_SEQ(R500_RS_IP_0, 16);
211 for (i = 0; i < 16; i++) {
212 OUT_CS((R500_RS_IP_PTR_K0 << R500_RS_IP_TEX_PTR_S_SHIFT) |
213 (R500_RS_IP_PTR_K0 << R500_RS_IP_TEX_PTR_T_SHIFT) |
214 (R500_RS_IP_PTR_K0 << R500_RS_IP_TEX_PTR_R_SHIFT) |
215 (R500_RS_IP_PTR_K1 << R500_RS_IP_TEX_PTR_Q_SHIFT));
216 }
217 OUT_CS_REG_SEQ(R300_RS_COUNT, 2);
218 OUT_CS((1 << R300_IC_COUNT_SHIFT) | R300_HIRES_EN);
219 OUT_CS(0x00000000);
220 OUT_CS_REG(R500_RS_INST_0, R500_RS_INST_COL_CN_WRITE);
221 } else {
222 OUT_CS_REG_SEQ(R300_RS_IP_0, 8);
223 for (i = 0; i < 8; i++) {
224 OUT_CS(R300_RS_SEL_T(R300_RS_SEL_K0) |
225 R300_RS_SEL_R(R300_RS_SEL_K0) | R300_RS_SEL_Q(R300_RS_SEL_K1));
226 }
227 OUT_CS_REG_SEQ(R300_RS_COUNT, 2);
228 OUT_CS((1 << R300_IC_COUNT_SHIFT) | R300_HIRES_EN);
229 /* XXX Shouldn't this be 0? */
230 OUT_CS(1);
231 OUT_CS_REG(R300_RS_INST_0, R300_RS_INST_COL_CN_WRITE);
232 }
233 END_CS;
234
235 /* Fragment shader setup */
236 if (caps->is_r500) {
237 r500_emit_fragment_shader(r300, &r500_passthrough_fragment_shader);
238 } else {
239 r300_emit_fragment_shader(r300, &r300_passthrough_fragment_shader);
240 }
241
242 BEGIN_CS(8 + (caps->has_tcl ? 20 : 2));
243 OUT_CS_REG_SEQ(R300_US_OUT_FMT_0, 4);
244 OUT_CS(R300_C0_SEL_B | R300_C1_SEL_G | R300_C2_SEL_R | R300_C3_SEL_A);
245 OUT_CS(R300_US_OUT_FMT_UNUSED);
246 OUT_CS(R300_US_OUT_FMT_UNUSED);
247 OUT_CS(R300_US_OUT_FMT_UNUSED);
248 OUT_CS_REG(R300_US_W_FMT, R300_W_FMT_W0);
249 /* XXX these magic numbers should be explained when
250 * this becomes a cached state object */
251 if (caps->has_tcl) {
252 OUT_CS_REG(R300_VAP_CNTL, 0xA |
253 (0x5 << R300_PVS_NUM_CNTLRS_SHIFT) |
254 (0xB << R300_VF_MAX_VTX_NUM_SHIFT) |
255 (caps->num_vert_fpus << R300_PVS_NUM_FPUS_SHIFT));
256 OUT_CS_REG(R300_VAP_PVS_CODE_CNTL_0, 0x00100000);
257 OUT_CS_REG(R300_VAP_PVS_CONST_CNTL, 0x00000000);
258 OUT_CS_REG(R300_VAP_PVS_CODE_CNTL_1, 0x00000001);
259 /* XXX translate these back into normal instructions */
260 OUT_CS_REG(R300_VAP_PVS_STATE_FLUSH_REG, 0x1);
261 OUT_CS_REG(R300_VAP_PVS_VECTOR_INDX_REG, 0x0);
262 OUT_CS_ONE_REG(R300_VAP_PVS_UPLOAD_DATA, 8);
263 OUT_CS(0x00F00203);
264 OUT_CS(0x00D10001);
265 OUT_CS(0x01248001);
266 OUT_CS(0x00000000);
267 OUT_CS(0x00F02203);
268 OUT_CS(0x00D10021);
269 OUT_CS(0x01248021);
270 OUT_CS(0x00000000);
271 } else {
272 OUT_CS_REG(R300_VAP_CNTL, 0xA |
273 (0x5 << R300_PVS_NUM_CNTLRS_SHIFT) |
274 (0x5 << R300_VF_MAX_VTX_NUM_SHIFT) |
275 (caps->num_vert_fpus << R300_PVS_NUM_FPUS_SHIFT));
276 }
277 END_CS;
278
279 r300_emit_blend_state(r300, &blend_clear_state);
280 r300_emit_blend_color_state(r300, &blend_color_clear_state);
281 r300_emit_dsa_state(r300, &dsa_clear_state);
282
283 BEGIN_CS(24);
284 /* Flush colorbuffer and blend caches. */
285 OUT_CS_REG(R300_RB3D_DSTCACHE_CTLSTAT,
286 R300_RB3D_DSTCACHE_CTLSTAT_DC_FLUSH_FLUSH_DIRTY_3D |
287 R300_RB3D_DSTCACHE_CTLSTAT_DC_FINISH_SIGNAL);
288 OUT_CS_REG(R300_ZB_ZCACHE_CTLSTAT,
289 R300_ZB_ZCACHE_CTLSTAT_ZC_FLUSH_FLUSH_AND_FREE |
290 R300_ZB_ZCACHE_CTLSTAT_ZC_FREE_FREE);
291
292 OUT_CS_REG_SEQ(R300_RB3D_COLOROFFSET0, 1);
293 OUT_CS_RELOC(tex->buffer, 0, 0, RADEON_GEM_DOMAIN_VRAM, 0);
294 /* XXX (dest->stride >> 2) should be the buffer width in pixels however,
295 * this little calculation is only good as long as the buffer is 32bpp */
296 OUT_CS_REG(R300_RB3D_COLORPITCH0, (dest->stride >> 2) |
297 R300_COLOR_FORMAT_ARGB8888);
298 OUT_CS_REG(RB3D_COLOR_CHANNEL_MASK, 0x0000000F);
299 /* XXX Packet3 */
300 OUT_CS(CP_PACKET3(R200_3D_DRAW_IMMD_2, 8));
301 OUT_CS(R300_PRIM_TYPE_POINT | R300_PRIM_WALK_RING |
302 (1 << R300_PRIM_NUM_VERTICES_SHIFT));
303 OUT_CS_32F(w / 2.0);
304 OUT_CS_32F(h / 2.0);
305 /* XXX this should be the depth value to clear to */
306 OUT_CS_32F(1.0);
307 OUT_CS_32F(1.0);
308 OUT_CS_32F(r);
309 OUT_CS_32F(g);
310 OUT_CS_32F(b);
311 OUT_CS_32F(1.0);
312
313 /* XXX figure out why this is 0xA and not 0x2 */
314 OUT_CS_REG(R300_RB3D_DSTCACHE_CTLSTAT, 0xA);
315 /* XXX OUT_CS_REG(R300_ZB_ZCACHE_CTLSTAT,
316 R300_ZB_ZCACHE_CTLSTAT_ZC_FLUSH_FLUSH_AND_FREE |
317 R300_ZB_ZCACHE_CTLSTAT_ZC_FREE_FREE); */
318
319 END_CS;
320
321 r300->dirty_hw++;
322 }
323
324 void r300_init_surface_functions(struct r300_context* r300)
325 {
326 r300->context.surface_fill = r300_surface_fill;
327 }