nv50: support vertex program textures
[mesa.git] / src / gallium / drivers / nv50 / nv50_tex.c
1 /*
2 * Copyright 2008 Ben Skeggs
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice shall be included in
12 * all copies or substantial portions of the Software.
13 *
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
17 * THE AUTHORS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
18 * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF
19 * OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
20 * SOFTWARE.
21 */
22
23 #include "nv50_context.h"
24 #include "nv50_texture.h"
25
26 #include "nouveau/nouveau_stateobj.h"
27
28 #define _MIXED(pf, t0, t1, t2, t3, cr, cg, cb, ca, f) \
29 { \
30 PIPE_FORMAT_##pf, \
31 NV50TIC_0_0_MAPR_##cr | NV50TIC_0_0_TYPER_##t0 | \
32 NV50TIC_0_0_MAPG_##cg | NV50TIC_0_0_TYPEG_##t1 | \
33 NV50TIC_0_0_MAPB_##cb | NV50TIC_0_0_TYPEB_##t2 | \
34 NV50TIC_0_0_MAPA_##ca | NV50TIC_0_0_TYPEA_##t3 | \
35 NV50TIC_0_0_FMT_##f \
36 }
37
38 #define _(pf, t, cr, cg, cb, ca, f) _MIXED(pf, t, t, t, t, cr, cg, cb, ca, f)
39
40 struct nv50_texture_format {
41 enum pipe_format pf;
42 uint32_t hw;
43 };
44
45 #define NV50_TEX_FORMAT_LIST_SIZE \
46 (sizeof(nv50_tex_format_list) / sizeof(struct nv50_texture_format))
47
48 static const struct nv50_texture_format nv50_tex_format_list[] =
49 {
50 _(A8R8G8B8_UNORM, UNORM, C2, C1, C0, C3, 8_8_8_8),
51 _(A8R8G8B8_SRGB, UNORM, C2, C1, C0, C3, 8_8_8_8),
52 _(X8R8G8B8_UNORM, UNORM, C2, C1, C0, ONE, 8_8_8_8),
53 _(X8R8G8B8_SRGB, UNORM, C2, C1, C0, ONE, 8_8_8_8),
54 _(A1R5G5B5_UNORM, UNORM, C2, C1, C0, C3, 1_5_5_5),
55 _(A4R4G4B4_UNORM, UNORM, C2, C1, C0, C3, 4_4_4_4),
56
57 _(R5G6B5_UNORM, UNORM, C2, C1, C0, ONE, 5_6_5),
58
59 _(L8_UNORM, UNORM, C0, C0, C0, ONE, 8),
60 _(A8_UNORM, UNORM, ZERO, ZERO, ZERO, C0, 8),
61 _(I8_UNORM, UNORM, C0, C0, C0, C0, 8),
62
63 _(A8L8_UNORM, UNORM, C0, C0, C0, C1, 8_8),
64
65 _(DXT1_RGB, UNORM, C0, C1, C2, ONE, DXT1),
66 _(DXT1_RGBA, UNORM, C0, C1, C2, C3, DXT1),
67 _(DXT3_RGBA, UNORM, C0, C1, C2, C3, DXT3),
68 _(DXT5_RGBA, UNORM, C0, C1, C2, C3, DXT5),
69
70 _MIXED(Z24S8_UNORM, UINT, UNORM, UINT, UINT, C1, C1, C1, ONE, 24_8),
71
72 _(R16G16B16A16_SNORM, UNORM, C0, C1, C2, C3, 16_16_16_16),
73 _(R16G16B16A16_UNORM, SNORM, C0, C1, C2, C3, 16_16_16_16),
74 _(R32G32B32A32_FLOAT, FLOAT, C0, C1, C2, C3, 32_32_32_32),
75
76 _(R16G16_SNORM, SNORM, C0, C1, ZERO, ONE, 16_16),
77 _(R16G16_UNORM, UNORM, C0, C1, ZERO, ONE, 16_16),
78
79 _MIXED(Z32_FLOAT, FLOAT, UINT, UINT, UINT, C0, C0, C0, ONE, 32_DEPTH)
80
81 };
82
83 #undef _
84 #undef _MIXED
85
86 static int
87 nv50_tex_construct(struct nv50_context *nv50, struct nouveau_stateobj *so,
88 struct nv50_miptree *mt, int unit, unsigned p)
89 {
90 unsigned i;
91 uint32_t mode;
92
93 for (i = 0; i < NV50_TEX_FORMAT_LIST_SIZE; i++)
94 if (nv50_tex_format_list[i].pf == mt->base.base.format)
95 break;
96 if (i == NV50_TEX_FORMAT_LIST_SIZE)
97 return 1;
98
99 if (nv50->sampler[p][unit]->normalized)
100 mode = 0x50001000 | (1 << 31);
101 else {
102 mode = 0x50001000 | (7 << 14);
103 assert(mt->base.base.target == PIPE_TEXTURE_2D);
104 }
105
106 mode |= ((mt->base.bo->tile_mode & 0x0f) << 22) |
107 ((mt->base.bo->tile_mode & 0xf0) << 21);
108
109 if (pf_type(mt->base.base.format) == PIPE_FORMAT_TYPE_SRGB)
110 mode |= 0x0400;
111
112 switch (mt->base.base.target) {
113 case PIPE_TEXTURE_1D:
114 break;
115 case PIPE_TEXTURE_2D:
116 mode |= (1 << 14);
117 break;
118 case PIPE_TEXTURE_3D:
119 mode |= (2 << 14);
120 break;
121 case PIPE_TEXTURE_CUBE:
122 mode |= (3 << 14);
123 break;
124 default:
125 assert(!"unsupported texture target");
126 break;
127 }
128
129 so_data (so, nv50_tex_format_list[i].hw);
130 so_reloc(so, mt->base.bo, 0, NOUVEAU_BO_VRAM | NOUVEAU_BO_LOW |
131 NOUVEAU_BO_RD, 0, 0);
132 so_data (so, mode);
133 so_data (so, 0x00300000);
134 so_data (so, mt->base.base.width0 | (1 << 31));
135 so_data (so, (mt->base.base.last_level << 28) |
136 (mt->base.base.depth0 << 16) | mt->base.base.height0);
137 so_data (so, 0x03000000);
138 so_data (so, mt->base.base.last_level << 4);
139
140 return 0;
141 }
142
143 #ifndef NV50TCL_BIND_TIC
144 #define NV50TCL_BIND_TIC(n) (0x1448 + 8 * n)
145 #endif
146
147 static boolean
148 nv50_validate_textures(struct nv50_context *nv50, struct nouveau_stateobj *so,
149 unsigned p)
150 {
151 static const unsigned p_remap[PIPE_SHADER_TYPES] = { 0, 2 };
152
153 struct nouveau_grobj *eng2d = nv50->screen->eng2d;
154 struct nouveau_grobj *tesla = nv50->screen->tesla;
155 unsigned unit, j, p_hw = p_remap[p];
156
157 nv50_so_init_sifc(nv50, so, nv50->screen->tic, NOUVEAU_BO_VRAM,
158 p * (32 * 8 * 4), nv50->miptree_nr[p] * 8 * 4);
159
160 for (unit = 0; unit < nv50->miptree_nr[p]; ++unit) {
161 struct nv50_miptree *mt = nv50->miptree[p][unit];
162
163 so_method(so, eng2d, NV50_2D_SIFC_DATA | (2 << 29), 8);
164 if (mt) {
165 if (nv50_tex_construct(nv50, so, mt, unit, p))
166 return FALSE;
167 /* Set TEX insn $t src binding $unit in program type p
168 * to TIC, TSC entry (32 * p + unit), mark valid (1).
169 */
170 so_method(so, tesla, NV50TCL_BIND_TIC(p_hw), 1);
171 so_data (so, ((32 * p + unit) << 9) | (unit << 1) | 1);
172 } else {
173 for (j = 0; j < 8; ++j)
174 so_data(so, 0);
175 so_method(so, tesla, NV50TCL_BIND_TIC(p_hw), 1);
176 so_data (so, (unit << 1) | 0);
177 }
178 }
179
180 for (; unit < nv50->state.miptree_nr[p]; unit++) {
181 /* Make other bindings invalid. */
182 so_method(so, tesla, NV50TCL_BIND_TIC(p_hw), 1);
183 so_data (so, (unit << 1) | 0);
184 }
185
186 nv50->state.miptree_nr[p] = nv50->miptree_nr[p];
187 return TRUE;
188 }
189
190 void
191 nv50_tex_validate(struct nv50_context *nv50)
192 {
193 struct nouveau_stateobj *so;
194 struct nouveau_grobj *tesla = nv50->screen->tesla;
195 unsigned p, push, nrlc;
196
197 for (nrlc = 0, push = 0, p = 0; p < PIPE_SHADER_TYPES; ++p) {
198 push += MAX2(nv50->miptree_nr[p], nv50->state.miptree_nr[p]);
199 nrlc += nv50->miptree_nr[p];
200 }
201 push = push * 11 + 23 * PIPE_SHADER_TYPES + 4;
202 nrlc = nrlc * 2 + 2 * PIPE_SHADER_TYPES;
203
204 so = so_new(push, nrlc);
205
206 if (nv50_validate_textures(nv50, so, PIPE_SHADER_VERTEX) == FALSE ||
207 nv50_validate_textures(nv50, so, PIPE_SHADER_FRAGMENT) == FALSE) {
208 so_ref(NULL, &so);
209
210 NOUVEAU_ERR("failed tex validate\n");
211 return;
212 }
213
214 /* not sure if the following really do what I think: */
215 so_method(so, tesla, 0x1330, 1); /* flush TIC */
216 so_data (so, 0);
217 so_method(so, tesla, 0x1338, 1); /* flush texture caches */
218 so_data (so, 0x20);
219
220 so_ref(so, &nv50->state.tic_upload);
221 so_ref(NULL, &so);
222 }