i965: Update GS state for Broadwell.
[mesa.git] / src / mesa / drivers / dri / i965 / gen8_gs_state.c
1 /*
2 * Copyright © 2013 Intel Corporation
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
21 * DEALINGS IN THE SOFTWARE.
22 */
23
24 #include "brw_context.h"
25 #include "brw_state.h"
26 #include "brw_defines.h"
27 #include "intel_batchbuffer.h"
28
29 static void
30 gen8_upload_gs_state(struct brw_context *brw)
31 {
32 struct gl_context *ctx = &brw->ctx;
33 const struct brw_stage_state *stage_state = &brw->gs.base;
34 /* BRW_NEW_GEOMETRY_PROGRAM */
35 bool active = brw->geometry_program;
36 /* CACHE_NEW_GS_PROG */
37 const struct brw_vec4_prog_data *prog_data = &brw->gs.prog_data->base;
38
39 /* BRW_NEW_GS_BINDING_TABLE */
40 BEGIN_BATCH(2);
41 OUT_BATCH(_3DSTATE_BINDING_TABLE_POINTERS_GS << 16 | (2 - 2));
42 OUT_BATCH(stage_state->bind_bo_offset);
43 ADVANCE_BATCH();
44
45 /* CACHE_NEW_SAMPLER */
46 BEGIN_BATCH(2);
47 OUT_BATCH(_3DSTATE_SAMPLER_STATE_POINTERS_GS << 16 | (2 - 2));
48 OUT_BATCH(stage_state->sampler_offset);
49 ADVANCE_BATCH();
50
51 gen8_upload_constant_state(brw, stage_state, active, _3DSTATE_CONSTANT_GS);
52
53 if (active) {
54 int urb_entry_write_offset = 1;
55 uint32_t urb_entry_output_length =
56 ((prog_data->vue_map.num_slots + 1) / 2 - urb_entry_write_offset);
57
58 if (urb_entry_output_length == 0)
59 urb_entry_output_length = 1;
60
61 BEGIN_BATCH(10);
62 OUT_BATCH(_3DSTATE_GS << 16 | (10 - 2));
63 OUT_BATCH(stage_state->prog_offset);
64 OUT_BATCH(0);
65 OUT_BATCH(GEN6_GS_VECTOR_MASK_ENABLE |
66 brw->geometry_program->VerticesIn |
67 ((ALIGN(stage_state->sampler_count, 4)/4) <<
68 GEN6_GS_SAMPLER_COUNT_SHIFT) |
69 ((prog_data->base.binding_table.size_bytes / 4) <<
70 GEN6_GS_BINDING_TABLE_ENTRY_COUNT_SHIFT));
71
72 if (brw->gs.prog_data->base.total_scratch) {
73 OUT_RELOC64(stage_state->scratch_bo,
74 I915_GEM_DOMAIN_RENDER, I915_GEM_DOMAIN_RENDER,
75 ffs(brw->gs.prog_data->base.total_scratch) - 11);
76 WARN_ONCE(true,
77 "May need to implement a temporary workaround: GS Number of "
78 "URB Entries must be less than or equal to the GS Maximum "
79 "Number of Threads.\n");
80 } else {
81 OUT_BATCH(0);
82 OUT_BATCH(0);
83 }
84
85 /* DW6 */
86 OUT_BATCH(((brw->gs.prog_data->output_vertex_size_hwords * 2 - 1) <<
87 GEN7_GS_OUTPUT_VERTEX_SIZE_SHIFT) |
88 (brw->gs.prog_data->output_topology <<
89 GEN7_GS_OUTPUT_TOPOLOGY_SHIFT) |
90 (prog_data->urb_read_length <<
91 GEN6_GS_URB_READ_LENGTH_SHIFT) |
92 (0 << GEN6_GS_URB_ENTRY_READ_OFFSET_SHIFT) |
93 (prog_data->dispatch_grf_start_reg <<
94 GEN6_GS_DISPATCH_START_GRF_SHIFT));
95
96 /* DW7 */
97 OUT_BATCH(((brw->max_gs_threads / 2 - 1) << HSW_GS_MAX_THREADS_SHIFT) |
98 (brw->gs.prog_data->control_data_header_size_hwords <<
99 GEN7_GS_CONTROL_DATA_HEADER_SIZE_SHIFT) |
100 (brw->gs.prog_data->dual_instanced_dispatch ?
101 GEN7_GS_DISPATCH_MODE_DUAL_INSTANCE :
102 GEN7_GS_DISPATCH_MODE_DUAL_OBJECT) |
103 GEN6_GS_STATISTICS_ENABLE |
104 (brw->gs.prog_data->include_primitive_id ?
105 GEN7_GS_INCLUDE_PRIMITIVE_ID : 0) |
106 GEN7_GS_REORDER_TRAILING |
107 GEN7_GS_ENABLE);
108
109 /* DW8 */
110 OUT_BATCH(brw->gs.prog_data->control_data_format <<
111 HSW_GS_CONTROL_DATA_FORMAT_SHIFT);
112
113 /* DW9 / _NEW_TRANSFORM */
114 OUT_BATCH((ctx->Transform.ClipPlanesEnabled <<
115 GEN8_GS_USER_CLIP_DISTANCE_SHIFT) |
116 (urb_entry_output_length << GEN8_GS_URB_OUTPUT_LENGTH_SHIFT) |
117 (urb_entry_write_offset <<
118 GEN8_GS_URB_ENTRY_OUTPUT_OFFSET_SHIFT));
119 ADVANCE_BATCH();
120 } else {
121 BEGIN_BATCH(10);
122 OUT_BATCH(_3DSTATE_GS << 16 | (10 - 2));
123 OUT_BATCH(0); /* prog_bo */
124 OUT_BATCH(0);
125 OUT_BATCH(0);
126 OUT_BATCH(0); /* scratch space base offset */
127 OUT_BATCH(0);
128 OUT_BATCH(0);
129 OUT_BATCH(GEN6_GS_STATISTICS_ENABLE);
130 OUT_BATCH(0);
131 OUT_BATCH(0);
132 ADVANCE_BATCH();
133 }
134 }
135
136 const struct brw_tracked_state gen8_gs_state = {
137 .dirty = {
138 .mesa = _NEW_TRANSFORM | _NEW_PROGRAM_CONSTANTS,
139 .brw = (BRW_NEW_CONTEXT |
140 BRW_NEW_GEOMETRY_PROGRAM |
141 BRW_NEW_GS_BINDING_TABLE |
142 BRW_NEW_BATCH |
143 BRW_NEW_PUSH_CONSTANT_ALLOCATION),
144 .cache = CACHE_NEW_GS_PROG | CACHE_NEW_SAMPLER
145 },
146 .emit = gen8_upload_gs_state,
147 };