1 /**************************************************************************
3 * Copyright 2003 Tungsten Graphics, Inc., Cedar Park, Texas.
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
26 **************************************************************************/
30 #include "main/glheader.h"
31 #include "main/mtypes.h"
32 #include "main/imports.h"
33 #include "main/macros.h"
34 #include "main/colormac.h"
36 #include "tnl/t_context.h"
37 #include "tnl/t_vertex.h"
39 #include "intel_batchbuffer.h"
40 #include "intel_tex.h"
41 #include "intel_regions.h"
42 #include "intel_tris.h"
45 #include "i915_context.h"
47 #include "glapi/glapi.h"
50 i915_render_prevalidate(struct intel_context
*intel
)
52 struct i915_context
*i915
= i915_context(&intel
->ctx
);
55 i915ValidateFragmentProgram(i915
);
59 i915_render_start(struct intel_context
*intel
)
65 i915_reduced_primitive_state(struct intel_context
*intel
, GLenum rprim
)
67 struct i915_context
*i915
= i915_context(&intel
->ctx
);
68 GLuint st1
= i915
->state
.Stipple
[I915_STPREG_ST1
];
73 case GL_QUADS
: /* from RASTERIZE(GL_QUADS) in t_dd_tritemp.h */
75 if (intel
->ctx
.Polygon
.StippleFlag
&& intel
->hw_stipple
)
84 i915
->intel
.reduced_primitive
= rprim
;
86 if (st1
!= i915
->state
.Stipple
[I915_STPREG_ST1
]) {
87 INTEL_FIREVERTICES(intel
);
89 I915_STATECHANGE(i915
, I915_UPLOAD_STIPPLE
);
90 i915
->state
.Stipple
[I915_STPREG_ST1
] = st1
;
95 /* Pull apart the vertex format registers and figure out how large a
96 * vertex is supposed to be.
99 i915_check_vertex_size(struct intel_context
*intel
, GLuint expected
)
101 struct i915_context
*i915
= i915_context(&intel
->ctx
);
102 int lis2
= i915
->current
->Ctx
[I915_CTXREG_LIS2
];
103 int lis4
= i915
->current
->Ctx
[I915_CTXREG_LIS4
];
106 switch (lis4
& S4_VFMT_XYZW_MASK
) {
120 fprintf(stderr
, "no xyzw specified\n");
124 if (lis4
& S4_VFMT_SPEC_FOG
)
126 if (lis4
& S4_VFMT_COLOR
)
128 if (lis4
& S4_VFMT_DEPTH_OFFSET
)
130 if (lis4
& S4_VFMT_POINT_WIDTH
)
132 if (lis4
& S4_VFMT_FOG_PARAM
)
135 for (i
= 0; i
< 8; i
++) {
136 switch (lis2
& S2_TEXCOORD_FMT0_MASK
) {
149 case TEXCOORDFMT_2D_16
:
152 case TEXCOORDFMT_4D_16
:
155 case TEXCOORDFMT_NOT_PRESENT
:
158 fprintf(stderr
, "bad texcoord fmt %d\n", i
);
161 lis2
>>= S2_TEXCOORD_FMT1_SHIFT
;
165 fprintf(stderr
, "vertex size mismatch %d/%d\n", sz
, expected
);
167 return sz
== expected
;
172 i915_emit_invarient_state(struct intel_context
*intel
)
176 BEGIN_BATCH(20, IGNORE_CLIPRECTS
);
178 OUT_BATCH(_3DSTATE_AA_CMD
|
179 AA_LINE_ECAAR_WIDTH_ENABLE
|
180 AA_LINE_ECAAR_WIDTH_1_0
|
181 AA_LINE_REGION_WIDTH_ENABLE
| AA_LINE_REGION_WIDTH_1_0
);
183 OUT_BATCH(_3DSTATE_DFLT_DIFFUSE_CMD
);
186 OUT_BATCH(_3DSTATE_DFLT_SPEC_CMD
);
189 OUT_BATCH(_3DSTATE_DFLT_Z_CMD
);
192 /* Don't support texture crossbar yet */
193 OUT_BATCH(_3DSTATE_COORD_SET_BINDINGS
|
198 CSB_TCB(4, 4) | CSB_TCB(5, 5) | CSB_TCB(6, 6) | CSB_TCB(7, 7));
200 OUT_BATCH(_3DSTATE_RASTER_RULES_CMD
|
201 ENABLE_POINT_RASTER_RULE
|
202 OGL_POINT_RASTER_RULE
|
203 ENABLE_LINE_STRIP_PROVOKE_VRTX
|
204 ENABLE_TRI_FAN_PROVOKE_VRTX
|
205 LINE_STRIP_PROVOKE_VRTX(1) |
206 TRI_FAN_PROVOKE_VRTX(2) | ENABLE_TEXKILL_3D_4D
| TEXKILL_4D
);
208 /* Need to initialize this to zero.
210 OUT_BATCH(_3DSTATE_LOAD_STATE_IMMEDIATE_1
| I1_LOAD_S(3) | (0));
214 OUT_BATCH(_3DSTATE_SCISSOR_ENABLE_CMD
| DISABLE_SCISSOR_RECT
);
216 OUT_BATCH(_3DSTATE_SCISSOR_RECT_0_CMD
);
220 OUT_BATCH(_3DSTATE_DEPTH_SUBRECT_DISABLE
);
222 OUT_BATCH(_3DSTATE_LOAD_INDIRECT
| 0); /* disable indirect state */
226 /* Don't support twosided stencil yet */
227 OUT_BATCH(_3DSTATE_BACKFACE_STENCIL_OPS
| BFO_ENABLE_STENCIL_TWO_SIDE
| 0);
234 #define emit(intel, state, size ) \
235 intel_batchbuffer_data(intel->batch, state, size, IGNORE_CLIPRECTS )
238 get_dirty(struct i915_hw_state
*state
)
242 /* Workaround the multitex hang - if one texture unit state is
243 * modified, emit all texture units.
245 dirty
= state
->active
& ~state
->emitted
;
246 if (dirty
& I915_UPLOAD_TEX_ALL
)
247 state
->emitted
&= ~I915_UPLOAD_TEX_ALL
;
248 dirty
= state
->active
& ~state
->emitted
;
254 get_state_size(struct i915_hw_state
*state
)
256 GLuint dirty
= get_dirty(state
);
260 if (dirty
& I915_UPLOAD_INVARIENT
)
263 if (dirty
& I915_UPLOAD_CTX
)
264 sz
+= sizeof(state
->Ctx
);
266 if (dirty
& I915_UPLOAD_BUFFERS
)
267 sz
+= sizeof(state
->Buffer
);
269 if (dirty
& I915_UPLOAD_STIPPLE
)
270 sz
+= sizeof(state
->Stipple
);
272 if (dirty
& I915_UPLOAD_FOG
)
273 sz
+= sizeof(state
->Fog
);
275 if (dirty
& I915_UPLOAD_TEX_ALL
) {
277 for (i
= 0; i
< I915_TEX_UNITS
; i
++)
278 if (dirty
& I915_UPLOAD_TEX(i
))
281 sz
+= (2 + nr
* 3) * sizeof(GLuint
) * 2;
284 if (dirty
& I915_UPLOAD_CONSTANTS
)
285 sz
+= state
->ConstantSize
* sizeof(GLuint
);
287 if (dirty
& I915_UPLOAD_PROGRAM
)
288 sz
+= state
->ProgramSize
* sizeof(GLuint
);
293 /* Push the state into the sarea and/or texture memory.
296 i915_emit_state(struct intel_context
*intel
)
298 struct i915_context
*i915
= i915_context(&intel
->ctx
);
299 struct i915_hw_state
*state
= i915
->current
;
300 int i
, count
, aper_count
;
302 dri_bo
*aper_array
[3 + I915_TEX_UNITS
];
303 GET_CURRENT_CONTEXT(ctx
);
306 /* We don't hold the lock at this point, so want to make sure that
307 * there won't be a buffer wrap between the state emits and the primitive
310 * It might be better to talk about explicit places where
311 * scheduling is allowed, rather than assume that it is whenever a
312 * batchbuffer fills up.
314 * Set the space as LOOP_CLIPRECTS now, since that's what our primitives
315 * will be emitted under.
317 intel_batchbuffer_require_space(intel
->batch
,
318 get_state_size(state
) + INTEL_PRIM_EMIT_SIZE
,
323 dirty
= get_dirty(state
);
325 aper_array
[aper_count
++] = intel
->batch
->buf
;
326 if (dirty
& I915_UPLOAD_BUFFERS
) {
327 aper_array
[aper_count
++] = state
->draw_region
->buffer
;
328 if (state
->depth_region
)
329 aper_array
[aper_count
++] = state
->depth_region
->buffer
;
332 if (dirty
& I915_UPLOAD_TEX_ALL
) {
333 for (i
= 0; i
< I915_TEX_UNITS
; i
++) {
334 if (dirty
& I915_UPLOAD_TEX(i
)) {
335 if (state
->tex_buffer
[i
]) {
336 aper_array
[aper_count
++] = state
->tex_buffer
[i
];
342 if (dri_bufmgr_check_aperture_space(aper_array
, aper_count
)) {
345 intel_batchbuffer_flush(intel
->batch
);
348 _mesa_error(ctx
, GL_OUT_OF_MEMORY
, "i915 emit state");
353 /* work out list of buffers to emit */
355 /* Do this here as we may have flushed the batchbuffer above,
356 * causing more state to be dirty!
358 dirty
= get_dirty(state
);
359 state
->emitted
|= dirty
;
360 assert(get_dirty(state
) == 0);
362 if (INTEL_DEBUG
& DEBUG_STATE
)
363 fprintf(stderr
, "%s dirty: %x\n", __FUNCTION__
, dirty
);
365 if (dirty
& I915_UPLOAD_INVARIENT
) {
366 if (INTEL_DEBUG
& DEBUG_STATE
)
367 fprintf(stderr
, "I915_UPLOAD_INVARIENT:\n");
368 i915_emit_invarient_state(intel
);
371 if (dirty
& I915_UPLOAD_CTX
) {
372 if (INTEL_DEBUG
& DEBUG_STATE
)
373 fprintf(stderr
, "I915_UPLOAD_CTX:\n");
375 emit(intel
, state
->Ctx
, sizeof(state
->Ctx
));
378 if (dirty
& I915_UPLOAD_BUFFERS
) {
381 if (INTEL_DEBUG
& DEBUG_STATE
)
382 fprintf(stderr
, "I915_UPLOAD_BUFFERS:\n");
384 if (state
->depth_region
)
387 if (intel
->constant_cliprect
)
390 BEGIN_BATCH(count
, IGNORE_CLIPRECTS
);
391 OUT_BATCH(state
->Buffer
[I915_DESTREG_CBUFADDR0
]);
392 OUT_BATCH(state
->Buffer
[I915_DESTREG_CBUFADDR1
]);
393 OUT_RELOC(state
->draw_region
->buffer
,
394 I915_GEM_DOMAIN_RENDER
, I915_GEM_DOMAIN_RENDER
,
395 state
->draw_region
->draw_offset
);
397 if (state
->depth_region
) {
398 OUT_BATCH(state
->Buffer
[I915_DESTREG_DBUFADDR0
]);
399 OUT_BATCH(state
->Buffer
[I915_DESTREG_DBUFADDR1
]);
400 OUT_RELOC(state
->depth_region
->buffer
,
401 I915_GEM_DOMAIN_RENDER
, I915_GEM_DOMAIN_RENDER
,
402 state
->depth_region
->draw_offset
);
405 OUT_BATCH(state
->Buffer
[I915_DESTREG_DV0
]);
406 OUT_BATCH(state
->Buffer
[I915_DESTREG_DV1
]);
407 OUT_BATCH(state
->Buffer
[I915_DESTREG_SENABLE
]);
408 OUT_BATCH(state
->Buffer
[I915_DESTREG_SR0
]);
409 OUT_BATCH(state
->Buffer
[I915_DESTREG_SR1
]);
410 OUT_BATCH(state
->Buffer
[I915_DESTREG_SR2
]);
412 if (intel
->constant_cliprect
) {
413 assert(state
->Buffer
[I915_DESTREG_DRAWRECT0
] != MI_NOOP
);
414 OUT_BATCH(state
->Buffer
[I915_DESTREG_DRAWRECT0
]);
415 OUT_BATCH(state
->Buffer
[I915_DESTREG_DRAWRECT1
]);
416 OUT_BATCH(state
->Buffer
[I915_DESTREG_DRAWRECT2
]);
417 OUT_BATCH(state
->Buffer
[I915_DESTREG_DRAWRECT3
]);
418 OUT_BATCH(state
->Buffer
[I915_DESTREG_DRAWRECT4
]);
419 OUT_BATCH(state
->Buffer
[I915_DESTREG_DRAWRECT5
]);
425 if (dirty
& I915_UPLOAD_STIPPLE
) {
426 if (INTEL_DEBUG
& DEBUG_STATE
)
427 fprintf(stderr
, "I915_UPLOAD_STIPPLE:\n");
428 emit(intel
, state
->Stipple
, sizeof(state
->Stipple
));
431 if (dirty
& I915_UPLOAD_FOG
) {
432 if (INTEL_DEBUG
& DEBUG_STATE
)
433 fprintf(stderr
, "I915_UPLOAD_FOG:\n");
434 emit(intel
, state
->Fog
, sizeof(state
->Fog
));
437 /* Combine all the dirty texture state into a single command to
438 * avoid lockups on I915 hardware.
440 if (dirty
& I915_UPLOAD_TEX_ALL
) {
443 for (i
= 0; i
< I915_TEX_UNITS
; i
++)
444 if (dirty
& I915_UPLOAD_TEX(i
))
447 BEGIN_BATCH(2 + nr
* 3, IGNORE_CLIPRECTS
);
448 OUT_BATCH(_3DSTATE_MAP_STATE
| (3 * nr
));
449 OUT_BATCH((dirty
& I915_UPLOAD_TEX_ALL
) >> I915_UPLOAD_TEX_0_SHIFT
);
450 for (i
= 0; i
< I915_TEX_UNITS
; i
++)
451 if (dirty
& I915_UPLOAD_TEX(i
)) {
453 if (state
->tex_buffer
[i
]) {
454 OUT_RELOC(state
->tex_buffer
[i
],
455 I915_GEM_DOMAIN_SAMPLER
, 0,
456 state
->tex_offset
[i
]);
458 else if (state
== &i915
->meta
) {
463 OUT_BATCH(state
->tex_offset
[i
]);
466 OUT_BATCH(state
->Tex
[i
][I915_TEXREG_MS3
]);
467 OUT_BATCH(state
->Tex
[i
][I915_TEXREG_MS4
]);
471 BEGIN_BATCH(2 + nr
* 3, IGNORE_CLIPRECTS
);
472 OUT_BATCH(_3DSTATE_SAMPLER_STATE
| (3 * nr
));
473 OUT_BATCH((dirty
& I915_UPLOAD_TEX_ALL
) >> I915_UPLOAD_TEX_0_SHIFT
);
474 for (i
= 0; i
< I915_TEX_UNITS
; i
++)
475 if (dirty
& I915_UPLOAD_TEX(i
)) {
476 OUT_BATCH(state
->Tex
[i
][I915_TEXREG_SS2
]);
477 OUT_BATCH(state
->Tex
[i
][I915_TEXREG_SS3
]);
478 OUT_BATCH(state
->Tex
[i
][I915_TEXREG_SS4
]);
483 if (dirty
& I915_UPLOAD_CONSTANTS
) {
484 if (INTEL_DEBUG
& DEBUG_STATE
)
485 fprintf(stderr
, "I915_UPLOAD_CONSTANTS:\n");
486 emit(intel
, state
->Constant
, state
->ConstantSize
* sizeof(GLuint
));
489 if (dirty
& I915_UPLOAD_PROGRAM
) {
490 if (state
->ProgramSize
) {
491 if (INTEL_DEBUG
& DEBUG_STATE
)
492 fprintf(stderr
, "I915_UPLOAD_PROGRAM:\n");
494 assert((state
->Program
[0] & 0x1ff) + 2 == state
->ProgramSize
);
496 emit(intel
, state
->Program
, state
->ProgramSize
* sizeof(GLuint
));
497 if (INTEL_DEBUG
& DEBUG_STATE
)
498 i915_disassemble_program(state
->Program
, state
->ProgramSize
);
502 intel
->batch
->dirty_state
&= ~dirty
;
503 assert(get_dirty(state
) == 0);
504 assert((intel
->batch
->dirty_state
& (1<<1)) == 0);
508 i915_destroy_context(struct intel_context
*intel
)
511 struct i915_context
*i915
= i915_context(&intel
->ctx
);
513 intel_region_release(&i915
->state
.draw_region
);
514 intel_region_release(&i915
->state
.depth_region
);
515 intel_region_release(&i915
->meta
.draw_region
);
516 intel_region_release(&i915
->meta
.depth_region
);
517 intel_region_release(&i915
->initial
.draw_region
);
518 intel_region_release(&i915
->initial
.depth_region
);
520 for (i
= 0; i
< I915_TEX_UNITS
; i
++) {
521 if (i915
->state
.tex_buffer
[i
] != NULL
) {
522 dri_bo_unreference(i915
->state
.tex_buffer
[i
]);
523 i915
->state
.tex_buffer
[i
] = NULL
;
527 _tnl_free_vertices(&intel
->ctx
);
532 * Set the drawing regions for the color and depth/stencil buffers.
533 * This involves setting the pitch, cpp and buffer ID/location.
534 * Also set pixel format for color and Z rendering
535 * Used for setting both regular and meta state.
538 i915_state_draw_region(struct intel_context
*intel
,
539 struct i915_hw_state
*state
,
540 struct intel_region
*color_region
,
541 struct intel_region
*depth_region
)
543 struct i915_context
*i915
= i915_context(&intel
->ctx
);
544 GLcontext
*ctx
= &intel
->ctx
;
547 ASSERT(state
== &i915
->state
|| state
== &i915
->meta
);
549 if (state
->draw_region
!= color_region
) {
550 intel_region_release(&state
->draw_region
);
551 intel_region_reference(&state
->draw_region
, color_region
);
553 if (state
->depth_region
!= depth_region
) {
554 intel_region_release(&state
->depth_region
);
555 intel_region_reference(&state
->depth_region
, depth_region
);
559 * Set stride/cpp values
562 state
->Buffer
[I915_DESTREG_CBUFADDR0
] = _3DSTATE_BUF_INFO_CMD
;
563 state
->Buffer
[I915_DESTREG_CBUFADDR1
] =
564 (BUF_3D_ID_COLOR_BACK
|
565 BUF_3D_PITCH(color_region
->pitch
* color_region
->cpp
) |
570 state
->Buffer
[I915_DESTREG_DBUFADDR0
] = _3DSTATE_BUF_INFO_CMD
;
571 state
->Buffer
[I915_DESTREG_DBUFADDR1
] =
573 BUF_3D_PITCH(depth_region
->pitch
* depth_region
->cpp
) |
578 * Compute/set I915_DESTREG_DV1 value
580 value
= (DSTORG_HORT_BIAS(0x8) | /* .5 */
581 DSTORG_VERT_BIAS(0x8) | /* .5 */
582 LOD_PRECLAMP_OGL
| TEX_DEFAULT_COLOR_OGL
);
583 if (color_region
&& color_region
->cpp
== 4) {
587 value
|= (DITHER_FULL_ALWAYS
| DV_PF_565
);
589 if (depth_region
&& depth_region
->cpp
== 4) {
590 value
|= DEPTH_FRMT_24_FIXED_8_OTHER
;
593 value
|= DEPTH_FRMT_16_FIXED
;
595 state
->Buffer
[I915_DESTREG_DV1
] = value
;
597 if (intel
->constant_cliprect
) {
598 state
->Buffer
[I915_DESTREG_DRAWRECT0
] = _3DSTATE_DRAWRECT_INFO
;
599 state
->Buffer
[I915_DESTREG_DRAWRECT1
] = 0;
600 state
->Buffer
[I915_DESTREG_DRAWRECT2
] = 0; /* xmin, ymin */
601 state
->Buffer
[I915_DESTREG_DRAWRECT3
] =
602 (ctx
->DrawBuffer
->Width
& 0xffff) |
603 (ctx
->DrawBuffer
->Height
<< 16);
604 state
->Buffer
[I915_DESTREG_DRAWRECT4
] = 0; /* xoff, yoff */
605 state
->Buffer
[I915_DESTREG_DRAWRECT5
] = 0;
607 state
->Buffer
[I915_DESTREG_DRAWRECT0
] = MI_NOOP
;
608 state
->Buffer
[I915_DESTREG_DRAWRECT1
] = MI_NOOP
;
609 state
->Buffer
[I915_DESTREG_DRAWRECT2
] = MI_NOOP
;
610 state
->Buffer
[I915_DESTREG_DRAWRECT3
] = MI_NOOP
;
611 state
->Buffer
[I915_DESTREG_DRAWRECT4
] = MI_NOOP
;
612 state
->Buffer
[I915_DESTREG_DRAWRECT5
] = MI_NOOP
;
615 I915_STATECHANGE(i915
, I915_UPLOAD_BUFFERS
);
620 i915_set_draw_region(struct intel_context
*intel
,
621 struct intel_region
*color_regions
[],
622 struct intel_region
*depth_region
,
625 struct i915_context
*i915
= i915_context(&intel
->ctx
);
626 i915_state_draw_region(intel
, &i915
->state
, color_regions
[0], depth_region
);
632 i915_new_batch(struct intel_context
*intel
)
634 struct i915_context
*i915
= i915_context(&intel
->ctx
);
636 /* Mark all state as needing to be emitted when starting a new batchbuffer.
637 * Using hardware contexts would be an alternative, but they have some
638 * difficulties associated with them (physical address requirements).
640 i915
->state
.emitted
= 0;
642 /* Check that we didn't just wrap our batchbuffer at a bad time. */
643 assert(!intel
->no_batch_wrap
);
649 return MI_FLUSH
| FLUSH_MAP_CACHE
;
653 i915_assert_not_dirty( struct intel_context
*intel
)
655 struct i915_context
*i915
= i915_context(&intel
->ctx
);
656 struct i915_hw_state
*state
= i915
->current
;
657 GLuint dirty
= get_dirty(state
);
662 i915_note_unlock( struct intel_context
*intel
)
669 i915InitVtbl(struct i915_context
*i915
)
671 i915
->intel
.vtbl
.check_vertex_size
= i915_check_vertex_size
;
672 i915
->intel
.vtbl
.destroy
= i915_destroy_context
;
673 i915
->intel
.vtbl
.emit_state
= i915_emit_state
;
674 i915
->intel
.vtbl
.new_batch
= i915_new_batch
;
675 i915
->intel
.vtbl
.reduced_primitive_state
= i915_reduced_primitive_state
;
676 i915
->intel
.vtbl
.render_start
= i915_render_start
;
677 i915
->intel
.vtbl
.render_prevalidate
= i915_render_prevalidate
;
678 i915
->intel
.vtbl
.set_draw_region
= i915_set_draw_region
;
679 i915
->intel
.vtbl
.update_texture_state
= i915UpdateTextureState
;
680 i915
->intel
.vtbl
.flush_cmd
= i915_flush_cmd
;
681 i915
->intel
.vtbl
.assert_not_dirty
= i915_assert_not_dirty
;
682 i915
->intel
.vtbl
.note_unlock
= i915_note_unlock
;
683 i915
->intel
.vtbl
.finish_batch
= intel_finish_vb
;