radeonsi: Handle position input parameter for pixel shaders v2
[mesa.git] / src / gallium / drivers / nv30 / nv30_vertprog.c
1 /*
2 * Copyright 2012 Red Hat Inc.
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice shall be included in
12 * all copies or substantial portions of the Software.
13 *
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
17 * THE AUTHORS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
18 * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF
19 * OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
20 * SOFTWARE.
21 *
22 * Authors: Ben Skeggs
23 *
24 */
25
26 #include "util/u_dynarray.h"
27 #include "tgsi/tgsi_parse.h"
28
29 #include "nouveau/nv_object.xml.h"
30 #include "nv30-40_3d.xml.h"
31 #include "nv30_context.h"
32 #include "nv30_state.h"
33
34 static void
35 nv30_vertprog_destroy(struct nv30_vertprog *vp)
36 {
37 util_dynarray_fini(&vp->branch_relocs);
38 nouveau_heap_free(&vp->exec);
39 FREE(vp->insns);
40 vp->insns = NULL;
41 vp->nr_insns = 0;
42
43 util_dynarray_fini(&vp->const_relocs);
44 nouveau_heap_free(&vp->data);
45 FREE(vp->consts);
46 vp->consts = NULL;
47 vp->nr_consts = 0;
48
49 vp->translated = FALSE;
50 }
51
52 void
53 nv30_vertprog_validate(struct nv30_context *nv30)
54 {
55 struct nouveau_pushbuf *push = nv30->base.pushbuf;
56 struct nouveau_object *eng3d = nv30->screen->eng3d;
57 struct nv30_vertprog *vp = nv30->vertprog.program;
58 struct nv30_fragprog *fp = nv30->fragprog.program;
59 boolean upload_code = FALSE;
60 boolean upload_data = FALSE;
61 unsigned i;
62
63 if (nv30->dirty & NV30_NEW_FRAGPROG) {
64 if (memcmp(vp->texcoord, fp->texcoord, sizeof(vp->texcoord))) {
65 if (vp->translated)
66 nv30_vertprog_destroy(vp);
67 memcpy(vp->texcoord, fp->texcoord, sizeof(vp->texcoord));
68 }
69 }
70
71 if (nv30->rast && nv30->rast->pipe.clip_plane_enable != vp->enabled_ucps) {
72 vp->enabled_ucps = nv30->rast->pipe.clip_plane_enable;
73 if (vp->translated)
74 nv30_vertprog_destroy(vp);
75 }
76
77 if (!vp->translated) {
78 vp->translated = _nvfx_vertprog_translate(nv30, vp);
79 if (!vp->translated) {
80 nv30->draw_flags |= NV30_NEW_VERTPROG;
81 return;
82 }
83 nv30->dirty |= NV30_NEW_VERTPROG;
84 }
85
86 if (!vp->exec) {
87 struct nouveau_heap *heap = nv30->screen->vp_exec_heap;
88 struct nv30_shader_reloc *reloc = vp->branch_relocs.data;
89 unsigned nr_reloc = vp->branch_relocs.size / sizeof(*reloc);
90 uint32_t *inst, target;
91
92 if (nouveau_heap_alloc(heap, vp->nr_insns, &vp->exec, &vp->exec)) {
93 while (heap->next && heap->size < vp->nr_insns) {
94 struct nouveau_heap **evict = heap->next->priv;
95 nouveau_heap_free(evict);
96 }
97
98 if (nouveau_heap_alloc(heap, vp->nr_insns, &vp->exec, &vp->exec)) {
99 nv30->draw_flags |= NV30_NEW_VERTPROG;
100 return;
101 }
102 }
103
104 if (eng3d->oclass < NV40_3D_CLASS) {
105 while (nr_reloc--) {
106 inst = vp->insns[reloc->location].data;
107 target = vp->exec->start + reloc->target;
108
109 inst[2] &= ~0x000007fc;
110 inst[2] |= target << 2;
111 reloc++;
112 }
113 } else {
114 while (nr_reloc--) {
115 inst = vp->insns[reloc->location].data;
116 target = vp->exec->start + reloc->target;
117
118 inst[2] &= ~0x0000003f;
119 inst[2] |= target >> 3;
120 inst[3] &= ~0xe0000000;
121 inst[3] |= target << 29;
122 reloc++;
123 }
124 }
125
126 upload_code = TRUE;
127 }
128
129 if (vp->nr_consts && !vp->data) {
130 struct nouveau_heap *heap = nv30->screen->vp_data_heap;
131 struct nv30_shader_reloc *reloc = vp->const_relocs.data;
132 unsigned nr_reloc = vp->const_relocs.size / sizeof(*reloc);
133 uint32_t *inst, target;
134
135 if (nouveau_heap_alloc(heap, vp->nr_consts, vp, &vp->data)) {
136 while (heap->next && heap->size < vp->nr_consts) {
137 struct nv30_vertprog *evp = heap->next->priv;
138 nouveau_heap_free(&evp->data);
139 }
140
141 if (nouveau_heap_alloc(heap, vp->nr_consts, vp, &vp->data)) {
142 nv30->draw_flags |= NV30_NEW_VERTPROG;
143 return;
144 }
145 }
146
147 if (eng3d->oclass < NV40_3D_CLASS) {
148 while (nr_reloc--) {
149 inst = vp->insns[reloc->location].data;
150 target = vp->data->start + reloc->target;
151
152 inst[1] &= ~0x0007fc000;
153 inst[1] |= (target & 0x1ff) << 14;
154 reloc++;
155 }
156 } else {
157 while (nr_reloc--) {
158 inst = vp->insns[reloc->location].data;
159 target = vp->data->start + reloc->target;
160
161 inst[1] &= ~0x0001ff000;
162 inst[1] |= (target & 0x1ff) << 12;
163 reloc++;
164 }
165 }
166
167 upload_code = TRUE;
168 upload_data = TRUE;
169 }
170
171 if (vp->nr_consts) {
172 struct nv04_resource *res = nv04_resource(nv30->vertprog.constbuf);
173
174 for (i = 0; i < vp->nr_consts; i++) {
175 struct nv30_vertprog_data *data = &vp->consts[i];
176
177 if (data->index < 0) {
178 if (!upload_data)
179 continue;
180 } else {
181 float *constbuf = (float *)res->data;
182 if (!upload_data &&
183 !memcmp(data->value, &constbuf[data->index * 4], 16))
184 continue;
185 memcpy(data->value, &constbuf[data->index * 4], 16);
186 }
187
188 BEGIN_NV04(push, NV30_3D(VP_UPLOAD_CONST_ID), 5);
189 PUSH_DATA (push, vp->data->start + i);
190 PUSH_DATAp(push, data->value, 4);
191 }
192 }
193
194 if (upload_code) {
195 BEGIN_NV04(push, NV30_3D(VP_UPLOAD_FROM_ID), 1);
196 PUSH_DATA (push, vp->exec->start);
197 for (i = 0; i < vp->nr_insns; i++) {
198 BEGIN_NV04(push, NV30_3D(VP_UPLOAD_INST(0)), 4);
199 PUSH_DATAp(push, vp->insns[i].data, 4);
200 }
201 }
202
203 if (nv30->dirty & (NV30_NEW_VERTPROG | NV30_NEW_FRAGPROG)) {
204 BEGIN_NV04(push, NV30_3D(VP_START_FROM_ID), 1);
205 PUSH_DATA (push, vp->exec->start);
206 if (eng3d->oclass < NV40_3D_CLASS) {
207 BEGIN_NV04(push, NV30_3D(ENGINE), 1);
208 PUSH_DATA (push, 0x00000013); /* vp instead of ff, somehow */
209 } else {
210 BEGIN_NV04(push, NV40_3D(VP_ATTRIB_EN), 2);
211 PUSH_DATA (push, vp->ir);
212 PUSH_DATA (push, vp->or | fp->vp_or);
213 BEGIN_NV04(push, NV30_3D(ENGINE), 1);
214 PUSH_DATA (push, 0x00000011);
215 }
216 }
217 }
218
219 static void *
220 nv30_vp_state_create(struct pipe_context *pipe,
221 const struct pipe_shader_state *cso)
222 {
223 struct nv30_vertprog *vp = CALLOC_STRUCT(nv30_vertprog);
224 if (!vp)
225 return NULL;
226
227 vp->pipe.tokens = tgsi_dup_tokens(cso->tokens);
228 tgsi_scan_shader(vp->pipe.tokens, &vp->info);
229 return vp;
230 }
231
232 static void
233 nv30_vp_state_delete(struct pipe_context *pipe, void *hwcso)
234 {
235 struct nv30_vertprog *vp = hwcso;
236
237 if (vp->translated)
238 nv30_vertprog_destroy(vp);
239 FREE((void *)vp->pipe.tokens);
240 FREE(vp);
241 }
242
243 static void
244 nv30_vp_state_bind(struct pipe_context *pipe, void *hwcso)
245 {
246 struct nv30_context *nv30 = nv30_context(pipe);
247
248 nv30->vertprog.program = hwcso;
249 nv30->dirty |= NV30_NEW_VERTPROG;
250 }
251
252 void
253 nv30_vertprog_init(struct pipe_context *pipe)
254 {
255 pipe->create_vs_state = nv30_vp_state_create;
256 pipe->bind_vs_state = nv30_vp_state_bind;
257 pipe->delete_vs_state = nv30_vp_state_delete;
258 }