/*
 * Copyright (C) 2014 Rob Clark <robclark@freedesktop.org>
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 *
 * Authors:
 *    Rob Clark <robclark@freedesktop.org>
 */
27 #include "pipe/p_state.h"
28 #include "util/u_string.h"
29 #include "util/u_memory.h"
30 #include "util/u_inlines.h"
31 #include "util/format/u_format.h"
33 #include "fd4_texture.h"
34 #include "fd4_format.h"
36 static enum a4xx_tex_clamp
37 tex_clamp(unsigned wrap
, bool clamp_to_edge
, bool *needs_border
)
39 /* Hardware does not support _CLAMP, but we emulate it: */
40 if (wrap
== PIPE_TEX_WRAP_CLAMP
) {
41 wrap
= (clamp_to_edge
) ?
42 PIPE_TEX_WRAP_CLAMP_TO_EDGE
: PIPE_TEX_WRAP_CLAMP_TO_BORDER
;
46 case PIPE_TEX_WRAP_REPEAT
:
47 return A4XX_TEX_REPEAT
;
48 case PIPE_TEX_WRAP_CLAMP_TO_EDGE
:
49 return A4XX_TEX_CLAMP_TO_EDGE
;
50 case PIPE_TEX_WRAP_CLAMP_TO_BORDER
:
52 return A4XX_TEX_CLAMP_TO_BORDER
;
53 case PIPE_TEX_WRAP_MIRROR_CLAMP_TO_EDGE
:
54 /* only works for PoT.. need to emulate otherwise! */
55 return A4XX_TEX_MIRROR_CLAMP
;
56 case PIPE_TEX_WRAP_MIRROR_REPEAT
:
57 return A4XX_TEX_MIRROR_REPEAT
;
58 case PIPE_TEX_WRAP_MIRROR_CLAMP
:
59 case PIPE_TEX_WRAP_MIRROR_CLAMP_TO_BORDER
:
60 /* these two we could perhaps emulate, but we currently
61 * just don't advertise PIPE_CAP_TEXTURE_MIRROR_CLAMP
64 DBG("invalid wrap: %u", wrap
);
69 static enum a4xx_tex_filter
70 tex_filter(unsigned filter
, bool aniso
)
73 case PIPE_TEX_FILTER_NEAREST
:
74 return A4XX_TEX_NEAREST
;
75 case PIPE_TEX_FILTER_LINEAR
:
76 return aniso
? A4XX_TEX_ANISO
: A4XX_TEX_LINEAR
;
78 DBG("invalid filter: %u", filter
);
84 fd4_sampler_state_create(struct pipe_context
*pctx
,
85 const struct pipe_sampler_state
*cso
)
87 struct fd4_sampler_stateobj
*so
= CALLOC_STRUCT(fd4_sampler_stateobj
);
88 unsigned aniso
= util_last_bit(MIN2(cso
->max_anisotropy
>> 1, 8));
89 bool miplinear
= false;
95 if (cso
->min_mip_filter
== PIPE_TEX_MIPFILTER_LINEAR
)
101 * For nearest filtering, _CLAMP means _CLAMP_TO_EDGE; for linear
102 * filtering, _CLAMP means _CLAMP_TO_BORDER while additionally
103 * clamping the texture coordinates to [0.0, 1.0].
105 * The clamping will be taken care of in the shaders. There are two
106 * filters here, but let the minification one has a say.
108 clamp_to_edge
= (cso
->min_img_filter
== PIPE_TEX_FILTER_NEAREST
);
109 if (!clamp_to_edge
) {
110 so
->saturate_s
= (cso
->wrap_s
== PIPE_TEX_WRAP_CLAMP
);
111 so
->saturate_t
= (cso
->wrap_t
== PIPE_TEX_WRAP_CLAMP
);
112 so
->saturate_r
= (cso
->wrap_r
== PIPE_TEX_WRAP_CLAMP
);
115 so
->needs_border
= false;
117 COND(miplinear
, A4XX_TEX_SAMP_0_MIPFILTER_LINEAR_NEAR
) |
118 A4XX_TEX_SAMP_0_XY_MAG(tex_filter(cso
->mag_img_filter
, aniso
)) |
119 A4XX_TEX_SAMP_0_XY_MIN(tex_filter(cso
->min_img_filter
, aniso
)) |
120 A4XX_TEX_SAMP_0_ANISO(aniso
) |
121 A4XX_TEX_SAMP_0_WRAP_S(tex_clamp(cso
->wrap_s
, clamp_to_edge
, &so
->needs_border
)) |
122 A4XX_TEX_SAMP_0_WRAP_T(tex_clamp(cso
->wrap_t
, clamp_to_edge
, &so
->needs_border
)) |
123 A4XX_TEX_SAMP_0_WRAP_R(tex_clamp(cso
->wrap_r
, clamp_to_edge
, &so
->needs_border
));
126 // COND(miplinear, A4XX_TEX_SAMP_1_MIPFILTER_LINEAR_FAR) |
127 COND(!cso
->seamless_cube_map
, A4XX_TEX_SAMP_1_CUBEMAPSEAMLESSFILTOFF
) |
128 COND(!cso
->normalized_coords
, A4XX_TEX_SAMP_1_UNNORM_COORDS
);
130 if (cso
->min_mip_filter
!= PIPE_TEX_MIPFILTER_NONE
) {
131 so
->texsamp0
|= A4XX_TEX_SAMP_0_LOD_BIAS(cso
->lod_bias
);
133 A4XX_TEX_SAMP_1_MIN_LOD(cso
->min_lod
) |
134 A4XX_TEX_SAMP_1_MAX_LOD(cso
->max_lod
);
137 if (cso
->compare_mode
)
138 so
->texsamp1
|= A4XX_TEX_SAMP_1_COMPARE_FUNC(cso
->compare_func
); /* maps 1:1 */
144 fd4_sampler_states_bind(struct pipe_context
*pctx
,
145 enum pipe_shader_type shader
, unsigned start
,
146 unsigned nr
, void **hwcso
)
148 struct fd_context
*ctx
= fd_context(pctx
);
149 struct fd4_context
*fd4_ctx
= fd4_context(ctx
);
150 uint16_t saturate_s
= 0, saturate_t
= 0, saturate_r
= 0;
156 for (i
= 0; i
< nr
; i
++) {
158 struct fd4_sampler_stateobj
*sampler
=
159 fd4_sampler_stateobj(hwcso
[i
]);
160 if (sampler
->saturate_s
)
161 saturate_s
|= (1 << i
);
162 if (sampler
->saturate_t
)
163 saturate_t
|= (1 << i
);
164 if (sampler
->saturate_r
)
165 saturate_r
|= (1 << i
);
169 fd_sampler_states_bind(pctx
, shader
, start
, nr
, hwcso
);
171 if (shader
== PIPE_SHADER_FRAGMENT
) {
176 fd4_ctx
->fsaturate_s
= saturate_s
;
177 fd4_ctx
->fsaturate_t
= saturate_t
;
178 fd4_ctx
->fsaturate_r
= saturate_r
;
179 } else if (shader
== PIPE_SHADER_VERTEX
) {
184 fd4_ctx
->vsaturate_s
= saturate_s
;
185 fd4_ctx
->vsaturate_t
= saturate_t
;
186 fd4_ctx
->vsaturate_r
= saturate_r
;
190 static enum a4xx_tex_type
191 tex_type(unsigned target
)
197 case PIPE_TEXTURE_1D
:
198 case PIPE_TEXTURE_1D_ARRAY
:
200 case PIPE_TEXTURE_RECT
:
201 case PIPE_TEXTURE_2D
:
202 case PIPE_TEXTURE_2D_ARRAY
:
204 case PIPE_TEXTURE_3D
:
206 case PIPE_TEXTURE_CUBE
:
207 case PIPE_TEXTURE_CUBE_ARRAY
:
208 return A4XX_TEX_CUBE
;
213 use_astc_srgb_workaround(struct pipe_context
*pctx
, enum pipe_format format
)
215 return (fd_screen(pctx
->screen
)->gpu_id
== 420) &&
216 (util_format_description(format
)->layout
== UTIL_FORMAT_LAYOUT_ASTC
);
219 static struct pipe_sampler_view
*
220 fd4_sampler_view_create(struct pipe_context
*pctx
, struct pipe_resource
*prsc
,
221 const struct pipe_sampler_view
*cso
)
223 struct fd4_pipe_sampler_view
*so
= CALLOC_STRUCT(fd4_pipe_sampler_view
);
224 struct fd_resource
*rsc
= fd_resource(prsc
);
225 struct fdl_slice
*slice
= NULL
;
226 enum pipe_format format
= cso
->format
;
227 unsigned lvl
, layers
= 0;
232 if (format
== PIPE_FORMAT_X32_S8X24_UINT
) {
234 format
= rsc
->base
.format
;
238 pipe_reference(NULL
, &prsc
->reference
);
239 so
->base
.texture
= prsc
;
240 so
->base
.reference
.count
= 1;
241 so
->base
.context
= pctx
;
244 A4XX_TEX_CONST_0_TYPE(tex_type(cso
->target
)) |
245 A4XX_TEX_CONST_0_FMT(fd4_pipe2tex(format
)) |
246 fd4_tex_swiz(format
, cso
->swizzle_r
, cso
->swizzle_g
,
247 cso
->swizzle_b
, cso
->swizzle_a
);
249 if (util_format_is_srgb(format
)) {
250 if (use_astc_srgb_workaround(pctx
, format
))
251 so
->astc_srgb
= true;
252 so
->texconst0
|= A4XX_TEX_CONST_0_SRGB
;
255 if (cso
->target
== PIPE_BUFFER
) {
256 unsigned elements
= cso
->u
.buf
.size
/ util_format_get_blocksize(format
);
260 A4XX_TEX_CONST_1_WIDTH(elements
) |
261 A4XX_TEX_CONST_1_HEIGHT(1);
263 A4XX_TEX_CONST_2_FETCHSIZE(fd4_pipe2fetchsize(format
)) |
264 A4XX_TEX_CONST_2_PITCH(elements
* rsc
->layout
.cpp
);
265 so
->offset
= cso
->u
.buf
.offset
;
269 lvl
= fd_sampler_first_level(cso
);
270 slice
= fd_resource_slice(rsc
, lvl
);
271 miplevels
= fd_sampler_last_level(cso
) - lvl
;
272 layers
= cso
->u
.tex
.last_layer
- cso
->u
.tex
.first_layer
+ 1;
274 so
->texconst0
|= A4XX_TEX_CONST_0_MIPLVLS(miplevels
);
276 A4XX_TEX_CONST_1_WIDTH(u_minify(prsc
->width0
, lvl
)) |
277 A4XX_TEX_CONST_1_HEIGHT(u_minify(prsc
->height0
, lvl
));
279 A4XX_TEX_CONST_2_FETCHSIZE(fd4_pipe2fetchsize(format
)) |
280 A4XX_TEX_CONST_2_PITCH(slice
->pitch
);
281 so
->offset
= fd_resource_offset(rsc
, lvl
, cso
->u
.tex
.first_layer
);
284 /* NOTE: since we sample z24s8 using 8888_UINT format, the swizzle
285 * we get isn't quite right. Use SWAP(XYZW) as a cheap and cheerful
286 * way to re-arrange things so stencil component is where the swiz
289 * Note that gallium expects stencil sampler to return (s,s,s,s)
290 * which isn't quite true. To make that happen we'd have to massage
291 * the swizzle. But in practice only the .x component is used.
293 if (format
== PIPE_FORMAT_X24S8_UINT
)
294 so
->texconst2
|= A4XX_TEX_CONST_2_SWAP(XYZW
);
296 switch (cso
->target
) {
297 case PIPE_TEXTURE_1D_ARRAY
:
298 case PIPE_TEXTURE_2D_ARRAY
:
300 A4XX_TEX_CONST_3_DEPTH(layers
) |
301 A4XX_TEX_CONST_3_LAYERSZ(rsc
->layout
.layer_size
);
303 case PIPE_TEXTURE_CUBE
:
304 case PIPE_TEXTURE_CUBE_ARRAY
:
306 A4XX_TEX_CONST_3_DEPTH(layers
/ 6) |
307 A4XX_TEX_CONST_3_LAYERSZ(rsc
->layout
.layer_size
);
309 case PIPE_TEXTURE_3D
:
311 A4XX_TEX_CONST_3_DEPTH(u_minify(prsc
->depth0
, lvl
)) |
312 A4XX_TEX_CONST_3_LAYERSZ(slice
->size0
);
313 so
->texconst4
= A4XX_TEX_CONST_4_LAYERSZ(
314 fd_resource_slice(rsc
, prsc
->last_level
)->size0
);
317 so
->texconst3
= 0x00000000;
325 fd4_set_sampler_views(struct pipe_context
*pctx
, enum pipe_shader_type shader
,
326 unsigned start
, unsigned nr
,
327 struct pipe_sampler_view
**views
)
329 struct fd_context
*ctx
= fd_context(pctx
);
330 struct fd4_context
*fd4_ctx
= fd4_context(ctx
);
331 uint16_t astc_srgb
= 0;
334 for (i
= 0; i
< nr
; i
++) {
336 struct fd4_pipe_sampler_view
*view
=
337 fd4_pipe_sampler_view(views
[i
]);
339 astc_srgb
|= (1 << i
);
343 fd_set_sampler_views(pctx
, shader
, start
, nr
, views
);
345 if (shader
== PIPE_SHADER_FRAGMENT
) {
346 fd4_ctx
->fastc_srgb
= astc_srgb
;
347 } else if (shader
== PIPE_SHADER_VERTEX
) {
348 fd4_ctx
->vastc_srgb
= astc_srgb
;
353 fd4_texture_init(struct pipe_context
*pctx
)
355 pctx
->create_sampler_state
= fd4_sampler_state_create
;
356 pctx
->bind_sampler_states
= fd4_sampler_states_bind
;
357 pctx
->create_sampler_view
= fd4_sampler_view_create
;
358 pctx
->set_sampler_views
= fd4_set_sampler_views
;