/*
 * Copyright (C) 2014 Rob Clark <robclark@freedesktop.org>
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 *
 * Authors:
 *    Rob Clark <robclark@freedesktop.org>
 */

#include "pipe/p_state.h"
#include "util/u_string.h"
#include "util/u_memory.h"
#include "util/u_inlines.h"
#include "util/format/u_format.h"

#include "fd4_texture.h"
#include "fd4_format.h"

36 static enum a4xx_tex_clamp
37 tex_clamp(unsigned wrap
, bool clamp_to_edge
, bool *needs_border
)
39 /* Hardware does not support _CLAMP, but we emulate it: */
40 if (wrap
== PIPE_TEX_WRAP_CLAMP
) {
41 wrap
= (clamp_to_edge
) ?
42 PIPE_TEX_WRAP_CLAMP_TO_EDGE
: PIPE_TEX_WRAP_CLAMP_TO_BORDER
;
46 case PIPE_TEX_WRAP_REPEAT
:
47 return A4XX_TEX_REPEAT
;
48 case PIPE_TEX_WRAP_CLAMP_TO_EDGE
:
49 return A4XX_TEX_CLAMP_TO_EDGE
;
50 case PIPE_TEX_WRAP_CLAMP_TO_BORDER
:
52 return A4XX_TEX_CLAMP_TO_BORDER
;
53 case PIPE_TEX_WRAP_MIRROR_CLAMP_TO_EDGE
:
54 /* only works for PoT.. need to emulate otherwise! */
55 return A4XX_TEX_MIRROR_CLAMP
;
56 case PIPE_TEX_WRAP_MIRROR_REPEAT
:
57 return A4XX_TEX_MIRROR_REPEAT
;
58 case PIPE_TEX_WRAP_MIRROR_CLAMP
:
59 case PIPE_TEX_WRAP_MIRROR_CLAMP_TO_BORDER
:
60 /* these two we could perhaps emulate, but we currently
61 * just don't advertise PIPE_CAP_TEXTURE_MIRROR_CLAMP
64 DBG("invalid wrap: %u", wrap
);
69 static enum a4xx_tex_filter
70 tex_filter(unsigned filter
, bool aniso
)
73 case PIPE_TEX_FILTER_NEAREST
:
74 return A4XX_TEX_NEAREST
;
75 case PIPE_TEX_FILTER_LINEAR
:
76 return aniso
? A4XX_TEX_ANISO
: A4XX_TEX_LINEAR
;
78 DBG("invalid filter: %u", filter
);
84 fd4_sampler_state_create(struct pipe_context
*pctx
,
85 const struct pipe_sampler_state
*cso
)
87 struct fd4_sampler_stateobj
*so
= CALLOC_STRUCT(fd4_sampler_stateobj
);
88 unsigned aniso
= util_last_bit(MIN2(cso
->max_anisotropy
>> 1, 8));
89 bool miplinear
= false;
95 if (cso
->min_mip_filter
== PIPE_TEX_MIPFILTER_LINEAR
)
101 * For nearest filtering, _CLAMP means _CLAMP_TO_EDGE; for linear
102 * filtering, _CLAMP means _CLAMP_TO_BORDER while additionally
103 * clamping the texture coordinates to [0.0, 1.0].
105 * The clamping will be taken care of in the shaders. There are two
106 * filters here, but let the minification one has a say.
108 clamp_to_edge
= (cso
->min_img_filter
== PIPE_TEX_FILTER_NEAREST
);
109 if (!clamp_to_edge
) {
110 so
->saturate_s
= (cso
->wrap_s
== PIPE_TEX_WRAP_CLAMP
);
111 so
->saturate_t
= (cso
->wrap_t
== PIPE_TEX_WRAP_CLAMP
);
112 so
->saturate_r
= (cso
->wrap_r
== PIPE_TEX_WRAP_CLAMP
);
115 so
->needs_border
= false;
117 COND(miplinear
, A4XX_TEX_SAMP_0_MIPFILTER_LINEAR_NEAR
) |
118 A4XX_TEX_SAMP_0_XY_MAG(tex_filter(cso
->mag_img_filter
, aniso
)) |
119 A4XX_TEX_SAMP_0_XY_MIN(tex_filter(cso
->min_img_filter
, aniso
)) |
120 A4XX_TEX_SAMP_0_ANISO(aniso
) |
121 A4XX_TEX_SAMP_0_WRAP_S(tex_clamp(cso
->wrap_s
, clamp_to_edge
, &so
->needs_border
)) |
122 A4XX_TEX_SAMP_0_WRAP_T(tex_clamp(cso
->wrap_t
, clamp_to_edge
, &so
->needs_border
)) |
123 A4XX_TEX_SAMP_0_WRAP_R(tex_clamp(cso
->wrap_r
, clamp_to_edge
, &so
->needs_border
));
126 // COND(miplinear, A4XX_TEX_SAMP_1_MIPFILTER_LINEAR_FAR) |
127 COND(!cso
->seamless_cube_map
, A4XX_TEX_SAMP_1_CUBEMAPSEAMLESSFILTOFF
) |
128 COND(!cso
->normalized_coords
, A4XX_TEX_SAMP_1_UNNORM_COORDS
);
130 if (cso
->min_mip_filter
!= PIPE_TEX_MIPFILTER_NONE
) {
131 so
->texsamp0
|= A4XX_TEX_SAMP_0_LOD_BIAS(cso
->lod_bias
);
133 A4XX_TEX_SAMP_1_MIN_LOD(cso
->min_lod
) |
134 A4XX_TEX_SAMP_1_MAX_LOD(cso
->max_lod
);
137 if (cso
->compare_mode
)
138 so
->texsamp1
|= A4XX_TEX_SAMP_1_COMPARE_FUNC(cso
->compare_func
); /* maps 1:1 */
144 fd4_sampler_states_bind(struct pipe_context
*pctx
,
145 enum pipe_shader_type shader
, unsigned start
,
146 unsigned nr
, void **hwcso
)
148 struct fd_context
*ctx
= fd_context(pctx
);
149 struct fd4_context
*fd4_ctx
= fd4_context(ctx
);
150 uint16_t saturate_s
= 0, saturate_t
= 0, saturate_r
= 0;
156 for (i
= 0; i
< nr
; i
++) {
158 struct fd4_sampler_stateobj
*sampler
=
159 fd4_sampler_stateobj(hwcso
[i
]);
160 if (sampler
->saturate_s
)
161 saturate_s
|= (1 << i
);
162 if (sampler
->saturate_t
)
163 saturate_t
|= (1 << i
);
164 if (sampler
->saturate_r
)
165 saturate_r
|= (1 << i
);
169 fd_sampler_states_bind(pctx
, shader
, start
, nr
, hwcso
);
171 if (shader
== PIPE_SHADER_FRAGMENT
) {
176 fd4_ctx
->fsaturate_s
= saturate_s
;
177 fd4_ctx
->fsaturate_t
= saturate_t
;
178 fd4_ctx
->fsaturate_r
= saturate_r
;
179 } else if (shader
== PIPE_SHADER_VERTEX
) {
184 fd4_ctx
->vsaturate_s
= saturate_s
;
185 fd4_ctx
->vsaturate_t
= saturate_t
;
186 fd4_ctx
->vsaturate_r
= saturate_r
;
190 static enum a4xx_tex_type
191 tex_type(unsigned target
)
197 case PIPE_TEXTURE_1D
:
198 case PIPE_TEXTURE_1D_ARRAY
:
200 case PIPE_TEXTURE_RECT
:
201 case PIPE_TEXTURE_2D
:
202 case PIPE_TEXTURE_2D_ARRAY
:
204 case PIPE_TEXTURE_3D
:
206 case PIPE_TEXTURE_CUBE
:
207 case PIPE_TEXTURE_CUBE_ARRAY
:
208 return A4XX_TEX_CUBE
;
213 use_astc_srgb_workaround(struct pipe_context
*pctx
, enum pipe_format format
)
215 return (fd_screen(pctx
->screen
)->gpu_id
== 420) &&
216 (util_format_description(format
)->layout
== UTIL_FORMAT_LAYOUT_ASTC
);
219 static struct pipe_sampler_view
*
220 fd4_sampler_view_create(struct pipe_context
*pctx
, struct pipe_resource
*prsc
,
221 const struct pipe_sampler_view
*cso
)
223 struct fd4_pipe_sampler_view
*so
= CALLOC_STRUCT(fd4_pipe_sampler_view
);
224 struct fd_resource
*rsc
= fd_resource(prsc
);
225 enum pipe_format format
= cso
->format
;
226 unsigned lvl
, layers
= 0;
231 if (format
== PIPE_FORMAT_X32_S8X24_UINT
) {
233 format
= rsc
->base
.format
;
237 pipe_reference(NULL
, &prsc
->reference
);
238 so
->base
.texture
= prsc
;
239 so
->base
.reference
.count
= 1;
240 so
->base
.context
= pctx
;
243 A4XX_TEX_CONST_0_TYPE(tex_type(cso
->target
)) |
244 A4XX_TEX_CONST_0_FMT(fd4_pipe2tex(format
)) |
245 fd4_tex_swiz(format
, cso
->swizzle_r
, cso
->swizzle_g
,
246 cso
->swizzle_b
, cso
->swizzle_a
);
248 if (util_format_is_srgb(format
)) {
249 if (use_astc_srgb_workaround(pctx
, format
))
250 so
->astc_srgb
= true;
251 so
->texconst0
|= A4XX_TEX_CONST_0_SRGB
;
254 if (cso
->target
== PIPE_BUFFER
) {
255 unsigned elements
= cso
->u
.buf
.size
/ util_format_get_blocksize(format
);
259 A4XX_TEX_CONST_1_WIDTH(elements
) |
260 A4XX_TEX_CONST_1_HEIGHT(1);
262 A4XX_TEX_CONST_2_PITCH(elements
* rsc
->layout
.cpp
);
263 so
->offset
= cso
->u
.buf
.offset
;
267 lvl
= fd_sampler_first_level(cso
);
268 miplevels
= fd_sampler_last_level(cso
) - lvl
;
269 layers
= cso
->u
.tex
.last_layer
- cso
->u
.tex
.first_layer
+ 1;
271 so
->texconst0
|= A4XX_TEX_CONST_0_MIPLVLS(miplevels
);
273 A4XX_TEX_CONST_1_WIDTH(u_minify(prsc
->width0
, lvl
)) |
274 A4XX_TEX_CONST_1_HEIGHT(u_minify(prsc
->height0
, lvl
));
276 A4XX_TEX_CONST_2_PITCHALIGN(rsc
->layout
.pitchalign
- 5) |
277 A4XX_TEX_CONST_2_PITCH(fd_resource_pitch(rsc
, lvl
));
278 so
->offset
= fd_resource_offset(rsc
, lvl
, cso
->u
.tex
.first_layer
);
281 /* NOTE: since we sample z24s8 using 8888_UINT format, the swizzle
282 * we get isn't quite right. Use SWAP(XYZW) as a cheap and cheerful
283 * way to re-arrange things so stencil component is where the swiz
286 * Note that gallium expects stencil sampler to return (s,s,s,s)
287 * which isn't quite true. To make that happen we'd have to massage
288 * the swizzle. But in practice only the .x component is used.
290 if (format
== PIPE_FORMAT_X24S8_UINT
)
291 so
->texconst2
|= A4XX_TEX_CONST_2_SWAP(XYZW
);
293 switch (cso
->target
) {
294 case PIPE_TEXTURE_1D_ARRAY
:
295 case PIPE_TEXTURE_2D_ARRAY
:
297 A4XX_TEX_CONST_3_DEPTH(layers
) |
298 A4XX_TEX_CONST_3_LAYERSZ(rsc
->layout
.layer_size
);
300 case PIPE_TEXTURE_CUBE
:
301 case PIPE_TEXTURE_CUBE_ARRAY
:
303 A4XX_TEX_CONST_3_DEPTH(layers
/ 6) |
304 A4XX_TEX_CONST_3_LAYERSZ(rsc
->layout
.layer_size
);
306 case PIPE_TEXTURE_3D
:
308 A4XX_TEX_CONST_3_DEPTH(u_minify(prsc
->depth0
, lvl
)) |
309 A4XX_TEX_CONST_3_LAYERSZ(fd_resource_slice(rsc
, lvl
)->size0
);
310 so
->texconst4
= A4XX_TEX_CONST_4_LAYERSZ(
311 fd_resource_slice(rsc
, prsc
->last_level
)->size0
);
314 so
->texconst3
= 0x00000000;
322 fd4_set_sampler_views(struct pipe_context
*pctx
, enum pipe_shader_type shader
,
323 unsigned start
, unsigned nr
,
324 struct pipe_sampler_view
**views
)
326 struct fd_context
*ctx
= fd_context(pctx
);
327 struct fd4_context
*fd4_ctx
= fd4_context(ctx
);
328 uint16_t astc_srgb
= 0;
331 for (i
= 0; i
< nr
; i
++) {
333 struct fd4_pipe_sampler_view
*view
=
334 fd4_pipe_sampler_view(views
[i
]);
336 astc_srgb
|= (1 << i
);
340 fd_set_sampler_views(pctx
, shader
, start
, nr
, views
);
342 if (shader
== PIPE_SHADER_FRAGMENT
) {
343 fd4_ctx
->fastc_srgb
= astc_srgb
;
344 } else if (shader
== PIPE_SHADER_VERTEX
) {
345 fd4_ctx
->vastc_srgb
= astc_srgb
;
350 fd4_texture_init(struct pipe_context
*pctx
)
352 pctx
->create_sampler_state
= fd4_sampler_state_create
;
353 pctx
->bind_sampler_states
= fd4_sampler_states_bind
;
354 pctx
->create_sampler_view
= fd4_sampler_view_create
;
355 pctx
->set_sampler_views
= fd4_set_sampler_views
;