2 * Copyright (C) 2016 Rob Clark <robclark@freedesktop.org>
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
24 * Rob Clark <robclark@freedesktop.org>
27 #include "pipe/p_state.h"
28 #include "util/u_string.h"
29 #include "util/u_memory.h"
30 #include "util/u_inlines.h"
31 #include "util/u_format.h"
33 #include "fd5_texture.h"
34 #include "fd5_format.h"
36 static enum a5xx_tex_clamp
37 tex_clamp(unsigned wrap
, bool clamp_to_edge
, bool *needs_border
)
39 /* Hardware does not support _CLAMP, but we emulate it: */
40 if (wrap
== PIPE_TEX_WRAP_CLAMP
) {
41 wrap
= (clamp_to_edge
) ?
42 PIPE_TEX_WRAP_CLAMP_TO_EDGE
: PIPE_TEX_WRAP_CLAMP_TO_BORDER
;
46 case PIPE_TEX_WRAP_REPEAT
:
47 return A5XX_TEX_REPEAT
;
48 case PIPE_TEX_WRAP_CLAMP_TO_EDGE
:
49 return A5XX_TEX_CLAMP_TO_EDGE
;
50 case PIPE_TEX_WRAP_CLAMP_TO_BORDER
:
52 return A5XX_TEX_CLAMP_TO_BORDER
;
53 case PIPE_TEX_WRAP_MIRROR_CLAMP_TO_EDGE
:
54 /* only works for PoT.. need to emulate otherwise! */
55 return A5XX_TEX_MIRROR_CLAMP
;
56 case PIPE_TEX_WRAP_MIRROR_REPEAT
:
57 return A5XX_TEX_MIRROR_REPEAT
;
58 case PIPE_TEX_WRAP_MIRROR_CLAMP
:
59 case PIPE_TEX_WRAP_MIRROR_CLAMP_TO_BORDER
:
60 /* these two we could perhaps emulate, but we currently
61 * just don't advertise PIPE_CAP_TEXTURE_MIRROR_CLAMP
64 DBG("invalid wrap: %u", wrap
);
69 static enum a5xx_tex_filter
70 tex_filter(unsigned filter
, bool aniso
)
73 case PIPE_TEX_FILTER_NEAREST
:
74 return A5XX_TEX_NEAREST
;
75 case PIPE_TEX_FILTER_LINEAR
:
76 return aniso
? A5XX_TEX_ANISO
: A5XX_TEX_LINEAR
;
78 DBG("invalid filter: %u", filter
);
84 fd5_sampler_state_create(struct pipe_context
*pctx
,
85 const struct pipe_sampler_state
*cso
)
87 struct fd5_sampler_stateobj
*so
= CALLOC_STRUCT(fd5_sampler_stateobj
);
88 unsigned aniso
= util_last_bit(MIN2(cso
->max_anisotropy
>> 1, 8));
89 bool miplinear
= false;
97 if (cso
->min_mip_filter
== PIPE_TEX_MIPFILTER_LINEAR
)
101 * For nearest filtering, _CLAMP means _CLAMP_TO_EDGE; for linear
102 * filtering, _CLAMP means _CLAMP_TO_BORDER while additionally
103 * clamping the texture coordinates to [0.0, 1.0].
105 * The clamping will be taken care of in the shaders. There are two
106 * filters here, but let the minification one has a say.
108 clamp_to_edge
= (cso
->min_img_filter
== PIPE_TEX_FILTER_NEAREST
);
109 if (!clamp_to_edge
) {
110 so
->saturate_s
= (cso
->wrap_s
== PIPE_TEX_WRAP_CLAMP
);
111 so
->saturate_t
= (cso
->wrap_t
== PIPE_TEX_WRAP_CLAMP
);
112 so
->saturate_r
= (cso
->wrap_r
== PIPE_TEX_WRAP_CLAMP
);
115 so
->needs_border
= false;
117 COND(miplinear
, A5XX_TEX_SAMP_0_MIPFILTER_LINEAR_NEAR
) |
118 A5XX_TEX_SAMP_0_XY_MAG(tex_filter(cso
->mag_img_filter
, aniso
)) |
119 A5XX_TEX_SAMP_0_XY_MIN(tex_filter(cso
->min_img_filter
, aniso
)) |
120 A5XX_TEX_SAMP_0_ANISO(aniso
) |
121 A5XX_TEX_SAMP_0_WRAP_S(tex_clamp(cso
->wrap_s
, clamp_to_edge
, &so
->needs_border
)) |
122 A5XX_TEX_SAMP_0_WRAP_T(tex_clamp(cso
->wrap_t
, clamp_to_edge
, &so
->needs_border
)) |
123 A5XX_TEX_SAMP_0_WRAP_R(tex_clamp(cso
->wrap_r
, clamp_to_edge
, &so
->needs_border
));
126 COND(!cso
->seamless_cube_map
, A5XX_TEX_SAMP_1_CUBEMAPSEAMLESSFILTOFF
) |
127 COND(!cso
->normalized_coords
, A5XX_TEX_SAMP_1_UNNORM_COORDS
);
129 if (cso
->min_mip_filter
!= PIPE_TEX_MIPFILTER_NONE
) {
130 so
->texsamp0
|= A5XX_TEX_SAMP_0_LOD_BIAS(cso
->lod_bias
);
132 A5XX_TEX_SAMP_1_MIN_LOD(cso
->min_lod
) |
133 A5XX_TEX_SAMP_1_MAX_LOD(cso
->max_lod
);
136 if (cso
->compare_mode
)
137 so
->texsamp1
|= A5XX_TEX_SAMP_1_COMPARE_FUNC(cso
->compare_func
); /* maps 1:1 */
143 fd5_sampler_states_bind(struct pipe_context
*pctx
,
144 enum pipe_shader_type shader
, unsigned start
,
145 unsigned nr
, void **hwcso
)
147 struct fd_context
*ctx
= fd_context(pctx
);
148 struct fd5_context
*fd5_ctx
= fd5_context(ctx
);
149 uint16_t saturate_s
= 0, saturate_t
= 0, saturate_r
= 0;
155 for (i
= 0; i
< nr
; i
++) {
157 struct fd5_sampler_stateobj
*sampler
=
158 fd5_sampler_stateobj(hwcso
[i
]);
159 if (sampler
->saturate_s
)
160 saturate_s
|= (1 << i
);
161 if (sampler
->saturate_t
)
162 saturate_t
|= (1 << i
);
163 if (sampler
->saturate_r
)
164 saturate_r
|= (1 << i
);
168 fd_sampler_states_bind(pctx
, shader
, start
, nr
, hwcso
);
170 if (shader
== PIPE_SHADER_FRAGMENT
) {
175 fd5_ctx
->fsaturate_s
= saturate_s
;
176 fd5_ctx
->fsaturate_t
= saturate_t
;
177 fd5_ctx
->fsaturate_r
= saturate_r
;
178 } else if (shader
== PIPE_SHADER_VERTEX
) {
183 fd5_ctx
->vsaturate_s
= saturate_s
;
184 fd5_ctx
->vsaturate_t
= saturate_t
;
185 fd5_ctx
->vsaturate_r
= saturate_r
;
190 use_astc_srgb_workaround(struct pipe_context
*pctx
, enum pipe_format format
)
192 return false; // TODO check if this is still needed on a5xx
195 static struct pipe_sampler_view
*
196 fd5_sampler_view_create(struct pipe_context
*pctx
, struct pipe_resource
*prsc
,
197 const struct pipe_sampler_view
*cso
)
199 struct fd5_pipe_sampler_view
*so
= CALLOC_STRUCT(fd5_pipe_sampler_view
);
200 struct fd_resource
*rsc
= fd_resource(prsc
);
201 enum pipe_format format
= cso
->format
;
202 unsigned lvl
, layers
;
207 if (format
== PIPE_FORMAT_X32_S8X24_UINT
) {
209 format
= rsc
->base
.format
;
213 pipe_reference(NULL
, &prsc
->reference
);
214 so
->base
.texture
= prsc
;
215 so
->base
.reference
.count
= 1;
216 so
->base
.context
= pctx
;
219 A5XX_TEX_CONST_0_FMT(fd5_pipe2tex(format
)) |
220 A5XX_TEX_CONST_0_SAMPLES(fd_msaa_samples(prsc
->nr_samples
)) |
221 fd5_tex_swiz(format
, cso
->swizzle_r
, cso
->swizzle_g
,
222 cso
->swizzle_b
, cso
->swizzle_a
);
224 /* NOTE: since we sample z24s8 using 8888_UINT format, the swizzle
225 * we get isn't quite right. Use SWAP(XYZW) as a cheap and cheerful
226 * way to re-arrange things so stencil component is where the swiz
229 * Note that gallium expects stencil sampler to return (s,s,s,s)
230 * which isn't quite true. To make that happen we'd have to massage
231 * the swizzle. But in practice only the .x component is used.
233 if (format
== PIPE_FORMAT_X24S8_UINT
) {
234 so
->texconst0
|= A5XX_TEX_CONST_0_SWAP(XYZW
);
237 if (util_format_is_srgb(format
)) {
238 if (use_astc_srgb_workaround(pctx
, format
))
239 so
->astc_srgb
= true;
240 so
->texconst0
|= A5XX_TEX_CONST_0_SRGB
;
243 if (cso
->target
== PIPE_BUFFER
) {
244 unsigned elements
= cso
->u
.buf
.size
/ util_format_get_blocksize(format
);
248 A5XX_TEX_CONST_1_WIDTH(elements
) |
249 A5XX_TEX_CONST_1_HEIGHT(1);
251 A5XX_TEX_CONST_2_FETCHSIZE(fd5_pipe2fetchsize(format
)) |
252 A5XX_TEX_CONST_2_PITCH(elements
* rsc
->cpp
);
253 so
->offset
= cso
->u
.buf
.offset
;
257 lvl
= fd_sampler_first_level(cso
);
258 miplevels
= fd_sampler_last_level(cso
) - lvl
;
259 layers
= cso
->u
.tex
.last_layer
- cso
->u
.tex
.first_layer
+ 1;
261 so
->texconst0
|= A5XX_TEX_CONST_0_MIPLVLS(miplevels
);
263 A5XX_TEX_CONST_1_WIDTH(u_minify(prsc
->width0
, lvl
)) |
264 A5XX_TEX_CONST_1_HEIGHT(u_minify(prsc
->height0
, lvl
));
266 A5XX_TEX_CONST_2_FETCHSIZE(fd5_pipe2fetchsize(format
)) |
267 A5XX_TEX_CONST_2_PITCH(
268 util_format_get_nblocksx(
269 format
, rsc
->slices
[lvl
].pitch
) * rsc
->cpp
);
270 so
->offset
= fd_resource_offset(rsc
, lvl
, cso
->u
.tex
.first_layer
);
273 so
->texconst2
|= A5XX_TEX_CONST_2_TYPE(fd5_tex_type(cso
->target
));
275 switch (cso
->target
) {
276 case PIPE_TEXTURE_RECT
:
277 case PIPE_TEXTURE_1D
:
278 case PIPE_TEXTURE_2D
:
280 A5XX_TEX_CONST_3_ARRAY_PITCH(rsc
->layer_size
);
282 A5XX_TEX_CONST_5_DEPTH(1);
284 case PIPE_TEXTURE_1D_ARRAY
:
285 case PIPE_TEXTURE_2D_ARRAY
:
287 A5XX_TEX_CONST_3_ARRAY_PITCH(rsc
->layer_size
);
289 A5XX_TEX_CONST_5_DEPTH(layers
);
291 case PIPE_TEXTURE_CUBE
:
292 case PIPE_TEXTURE_CUBE_ARRAY
:
294 A5XX_TEX_CONST_3_ARRAY_PITCH(rsc
->layer_size
);
296 A5XX_TEX_CONST_5_DEPTH(layers
/ 6);
298 case PIPE_TEXTURE_3D
:
300 A5XX_TEX_CONST_3_ARRAY_PITCH(rsc
->slices
[lvl
].size0
);
302 A5XX_TEX_CONST_5_DEPTH(u_minify(prsc
->depth0
, lvl
));
305 so
->texconst3
= 0x00000000;
313 fd5_set_sampler_views(struct pipe_context
*pctx
, enum pipe_shader_type shader
,
314 unsigned start
, unsigned nr
,
315 struct pipe_sampler_view
**views
)
317 struct fd_context
*ctx
= fd_context(pctx
);
318 struct fd5_context
*fd5_ctx
= fd5_context(ctx
);
319 uint16_t astc_srgb
= 0;
322 for (i
= 0; i
< nr
; i
++) {
324 struct fd5_pipe_sampler_view
*view
=
325 fd5_pipe_sampler_view(views
[i
]);
327 astc_srgb
|= (1 << i
);
331 fd_set_sampler_views(pctx
, shader
, start
, nr
, views
);
333 if (shader
== PIPE_SHADER_FRAGMENT
) {
334 fd5_ctx
->fastc_srgb
= astc_srgb
;
335 } else if (shader
== PIPE_SHADER_VERTEX
) {
336 fd5_ctx
->vastc_srgb
= astc_srgb
;
341 fd5_texture_init(struct pipe_context
*pctx
)
343 pctx
->create_sampler_state
= fd5_sampler_state_create
;
344 pctx
->bind_sampler_states
= fd5_sampler_states_bind
;
345 pctx
->create_sampler_view
= fd5_sampler_view_create
;
346 pctx
->set_sampler_views
= fd5_set_sampler_views
;