2 /**************************************************************************
4 * Copyright 2003 Tungsten Graphics, Inc., Cedar Park, Texas.
7 * Permission is hereby granted, free of charge, to any person obtaining a
8 * copy of this software and associated documentation files (the
9 * "Software"), to deal in the Software without restriction, including
10 * without limitation the rights to use, copy, modify, merge, publish,
11 * distribute, sub license, and/or sell copies of the Software, and to
12 * permit persons to whom the Software is furnished to do so, subject to
13 * the following conditions:
15 * The above copyright notice and this permission notice (including the
16 * next paragraph) shall be included in all copies or substantial portions
19 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
20 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
21 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
22 * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
23 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
24 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
25 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
27 **************************************************************************/
29 #include "pipe/p_context.h"
30 #include "pipe/p_format.h"
31 #include "util/u_format.h"
32 #include "util/u_math.h"
33 #include "util/u_memory.h"
34 #include "util/u_pack_color.h"
35 #include "util/u_blitter.h"
36 #include "util/u_surface.h"
38 #include "nouveau/nouveau_winsys.h"
39 #include "nouveau/nouveau_screen.h"
40 #include "nvfx_context.h"
41 #include "nvfx_screen.h"
42 #include "nvfx_resource.h"
45 #include <nouveau/nouveau_bo.h>
/*
 * Apply format-dependent adjustments to a 2D-engine region.
 *
 * Visible here: the block size of `format` in bits is read with
 * util_format_get_blocksizebits(), the format is tested against
 * PIPE_FORMAT_B5G5R5X1_UNORM and against the two 32-bit X-channel formats
 * (R8G8B8X8 / B8G8R8X8), and rgn->x / rgn->y are converted to block counts
 * with util_format_get_nblocksx()/util_format_get_nblocksy(); x is
 * additionally shifted left by `shift`.
 *
 * NOTE(review): the bodies of the two format tests and the computation of
 * `shift` are not visible in this extract — confirm against the full file.
 */
48 nvfx_region_set_format(struct nv04_region
* rgn
, enum pipe_format format
)
50 unsigned bits
= util_format_get_blocksizebits(format
);
61 if(format
== PIPE_FORMAT_B5G5R5X1_UNORM
)
66 if(format
== PIPE_FORMAT_R8G8B8X8_UNORM
|| format
== PIPE_FORMAT_B8G8R8X8_UNORM
)
80 rgn
->x
= util_format_get_nblocksx(format
, rgn
->x
) << shift
;
81 rgn
->y
= util_format_get_nblocksy(format
, rgn
->y
);
/*
 * Fill in a 2D-engine region descriptor from an nvfx surface.
 *
 * Visible here: rgn->bo / rgn->pitch are assigned from the surface's
 * temporary (surf->temp) and the surface is marked dirty with
 * util_dirty_surface_set_dirty(); rgn->bo is also assigned from the backing
 * texture's buffer object together with rgn->offset = surf->offset, and
 * rgn->pitch = surf->pitch when the texture carries
 * NOUVEAU_RESOURCE_FLAG_LINEAR. z, w, h and d are taken from the surface
 * (first layer, width, height, depth0 minified by the surface level), then
 * nvfx_region_set_format() and nv04_region_try_to_linearize() are called.
 *
 * NOTE(review): the conditions selecting between the temp and the texture
 * paths, and how x, y and for_write are consumed, are not visible in this
 * extract — presumably for_write gates the dirty marking; confirm.
 */
87 nvfx_region_init_for_surface(struct nv04_region
* rgn
, struct nvfx_surface
* surf
, unsigned x
, unsigned y
, boolean for_write
)
95 rgn
->bo
= surf
->temp
->base
.bo
;
97 rgn
->pitch
= surf
->temp
->linear_pitch
;
100 util_dirty_surface_set_dirty(nvfx_surface_get_dirty_surfaces(&surf
->base
.base
), &surf
->base
);
102 rgn
->bo
= ((struct nvfx_resource
*)surf
->base
.base
.texture
)->bo
;
103 rgn
->offset
= surf
->offset
;
105 if(surf
->base
.base
.texture
->flags
& NOUVEAU_RESOURCE_FLAG_LINEAR
)
106 rgn
->pitch
= surf
->pitch
;
110 rgn
->z
= surf
->base
.base
.u
.tex
.first_layer
;
111 rgn
->w
= surf
->base
.base
.width
;
112 rgn
->h
= surf
->base
.base
.height
;
113 rgn
->d
= u_minify(surf
->base
.base
.texture
->depth0
, surf
->base
.base
.u
.tex
.level
);
117 nvfx_region_set_format(rgn
, surf
->base
.base
.format
);
119 nv04_region_try_to_linearize(rgn
);
/*
 * Fill in a 2D-engine region descriptor for one subresource (level / layer z)
 * of a pipe_resource.
 *
 * Visible here: for non-buffer resources an existing surface for
 * (level, z) is looked up with util_surfaces_peek(); if one exists and is
 * dirty, the work is delegated to nvfx_region_init_for_surface(). Otherwise
 * the region uses the resource's own buffer object, the offset returned by
 * nvfx_subresource_offset(pt, z, level, z), the pitch from
 * nvfx_subresource_pitch() when the resource has
 * NOUVEAU_RESOURCE_FLAG_LINEAR, and w/h/d minified from the base dimensions.
 * nvfx_region_set_format() and nv04_region_try_to_linearize() follow.
 *
 * NOTE(review): the early return after the delegation, the assignments of
 * x/y/z and the non-linear branch are not visible in this extract — confirm
 * against the full file.
 */
123 nvfx_region_init_for_subresource(struct nv04_region
* rgn
, struct pipe_resource
* pt
, unsigned level
, unsigned x
, unsigned y
, unsigned z
, boolean for_write
)
125 if(pt
->target
!= PIPE_BUFFER
)
127 struct nvfx_surface
* ns
= (struct nvfx_surface
*)util_surfaces_peek(&((struct nvfx_miptree
*)pt
)->surfaces
, pt
, level
, z
);
128 if(ns
&& util_dirty_surface_is_dirty(&ns
->base
))
130 nvfx_region_init_for_surface(rgn
, ns
, x
, y
, for_write
);
135 rgn
->bo
= ((struct nvfx_resource
*)pt
)->bo
;
136 rgn
->offset
= nvfx_subresource_offset(pt
, z
, level
, z
);
140 if(pt
->flags
& NOUVEAU_RESOURCE_FLAG_LINEAR
)
142 rgn
->pitch
= nvfx_subresource_pitch(pt
, level
);
149 rgn
->w
= u_minify(pt
->width0
, level
);
150 rgn
->h
= u_minify(pt
->height0
, level
);
151 rgn
->d
= u_minify(pt
->depth0
, level
);
154 nvfx_region_set_format(rgn
, pt
->format
);
156 nv04_region_try_to_linearize(rgn
);
159 // don't save index buffer because blitter doesn't set it
/*
 * Hand out the next blitter_context slot of this context with the current
 * pipe state saved into it.
 *
 * Visible here: the slot index is nvfx->blitters_in_use (asserted to be
 * below Elements(nvfx->blitter)) and is post-incremented; a blitter is
 * created with util_blitter_create() and stored in that slot; blend,
 * depth/stencil/alpha, stencil ref, rasterizer, fragment and vertex shaders,
 * viewport, framebuffer, vertex elements, vertex buffers, fragment sampler
 * states and fragment sampler views are saved into the blitter. When a query
 * is active and no blitter was in use yet, an NV30_3D_QUERY_ENABLE method of
 * length 1 is started on the 3D engine.
 *
 * NOTE(review): the guard around util_blitter_create(), the value emitted
 * after BEGIN_RING, the use of `copy` and the return statement are not
 * visible in this extract — presumably the blitter is created lazily and
 * returned to the caller; confirm against the full file.
 */
160 static struct blitter_context
*
161 nvfx_get_blitter(struct pipe_context
* pipe
, int copy
)
163 struct nvfx_context
* nvfx
= nvfx_context(pipe
);
164 struct blitter_context
** pblitter
;
165 struct blitter_context
* blitter
;
167 assert(nvfx
->blitters_in_use
< Elements(nvfx
->blitter
));
169 if(nvfx
->query
&& !nvfx
->blitters_in_use
)
171 struct nouveau_channel
* chan
= nvfx
->screen
->base
.channel
;
172 struct nouveau_grobj
*eng3d
= nvfx
->screen
->eng3d
;
173 BEGIN_RING(chan
, eng3d
, NV30_3D_QUERY_ENABLE
, 1);
177 pblitter
= &nvfx
->blitter
[nvfx
->blitters_in_use
++];
179 *pblitter
= util_blitter_create(pipe
);
182 util_blitter_save_blend(blitter
, nvfx
->blend
);
183 util_blitter_save_depth_stencil_alpha(blitter
, nvfx
->zsa
);
184 util_blitter_save_stencil_ref(blitter
, &nvfx
->stencil_ref
);
185 util_blitter_save_rasterizer(blitter
, nvfx
->rasterizer
);
186 util_blitter_save_fragment_shader(blitter
, nvfx
->fragprog
);
187 util_blitter_save_vertex_shader(blitter
, nvfx
->vertprog
);
188 util_blitter_save_viewport(blitter
, &nvfx
->viewport
);
189 util_blitter_save_framebuffer(blitter
, &nvfx
->framebuffer
);
190 util_blitter_save_vertex_elements(blitter
, nvfx
->vtxelt
);
191 util_blitter_save_vertex_buffers(blitter
, nvfx
->vtxbuf_nr
, nvfx
->vtxbuf
);
195 util_blitter_save_fragment_sampler_states(blitter
, nvfx
->nr_samplers
, (void**)nvfx
->tex_sampler
);
196 util_blitter_save_fragment_sampler_views(blitter
, nvfx
->nr_textures
, nvfx
->fragment_sampler_views
);
/*
 * Release a blitter slot previously taken with nvfx_get_blitter().
 *
 * Decrements nvfx->blitters_in_use (asserting it stays non-negative) and,
 * when a query is active and no blitter remains in use, starts an
 * NV30_3D_QUERY_ENABLE method of length 1 on the 3D engine.
 *
 * NOTE(review): the value emitted after BEGIN_RING is not visible in this
 * extract, and `blitter` is not referenced in the visible lines.
 */
203 nvfx_put_blitter(struct pipe_context
* pipe
, struct blitter_context
* blitter
)
205 struct nvfx_context
* nvfx
= nvfx_context(pipe
);
206 --nvfx
->blitters_in_use
;
207 assert(nvfx
->blitters_in_use
>= 0);
209 if(nvfx
->query
&& !nvfx
->blitters_in_use
)
211 struct nouveau_channel
* chan
= nvfx
->screen
->base
.channel
;
212 struct nouveau_grobj
*eng3d
= nvfx
->screen
->eng3d
;
213 BEGIN_RING(chan
, eng3d
, NV30_3D_QUERY_ENABLE
, 1);
/*
 * Redirect a region to a freshly allocated, CPU-mappable GART buffer object
 * covering the byte range [begin, end) that a w x h access to the region
 * touches (as reported by nv04_region_begin()/nv04_region_end()).
 *
 * The new buffer is allocated with nouveau_bo_new() (flags
 * NOUVEAU_BO_MAP | NOUVEAU_BO_GART, alignment 256). The existing contents
 * are copied into it with nv04_memcpy() when for_read is set, or when the
 * byte range is larger than (w * h) << rgn->bpps. rgn->offset is then set
 * to -begin.
 *
 * NOTE(review): the result of nouveau_bo_new() is not checked in the
 * visible lines. The assignment of the new bo to rgn->bo and the return
 * statement are not visible in this extract — callers store the return
 * value in `dstbegin`, so presumably `begin` is returned; confirm.
 */
219 nvfx_region_clone(struct nv04_2d_context
* ctx
, struct nv04_region
* rgn
, unsigned w
, unsigned h
, boolean for_read
)
221 unsigned begin
= nv04_region_begin(rgn
, w
, h
);
222 unsigned end
= nv04_region_end(rgn
, w
, h
);
223 unsigned size
= end
- begin
;
224 struct nouveau_bo
* bo
= 0;
225 nouveau_bo_new(rgn
->bo
->device
, NOUVEAU_BO_MAP
| NOUVEAU_BO_GART
, 256, size
, &bo
);
227 if(for_read
|| (size
> ((w
* h
) << rgn
->bpps
)))
228 nv04_memcpy(ctx
, bo
, 0, rgn
->bo
, rgn
->offset
+ begin
, size
);
231 rgn
->offset
= -begin
;
/*
 * Copy a box from one resource subresource to another; installed as
 * pipe_context::resource_copy_region by nvfx_init_surface_functions().
 *
 * Visible here:
 *  - buffer-to-buffer copies are handed to util_resource_copy_region();
 *  - copy_threshold is a function-static cache of the
 *    NOUVEAU_COPY_THRESHOLD debug option (default 4), read on first use;
 *  - dst_to_gpu is true unless the destination usage is DYNAMIC or STAGING,
 *    src_on_gpu comes from nvfx_resource_on_gpu();
 *  - both regions are initialised with nvfx_region_init_for_subresource(),
 *    and w/h are converted with util_format_get_stride() >> dst.bpps and
 *    util_format_get_nblocksy();
 *  - when the copy is small (w * h <= copy_threshold) and either side is
 *    not on the GPU, ret is set to -1 to select the CPU; otherwise
 *    nv04_region_copy_2d() is tried;
 *  - a blitter copy (util_blitter_copy_texture) is used when the
 *    destination is bindable as render target / depth-stencil and the
 *    source as sampler view;
 *  - the remaining path clones regions with nvfx_region_clone(), copies
 *    with nv04_region_copy_cpu(), releases temporary buffer objects and
 *    copies a cloned destination back with nv04_memcpy().
 *
 * NOTE(review): the declarations of dst_to_gpu / src_on_gpu / small / ret,
 * the else/return structure between these paths, the first operand of the
 * blitter condition and the conditions guarding the two clone calls are
 * not visible in this extract — confirm against the full file.
 */
236 nvfx_resource_copy_region(struct pipe_context
*pipe
,
237 struct pipe_resource
*dstr
, unsigned dst_level
,
238 unsigned dstx
, unsigned dsty
, unsigned dstz
,
239 struct pipe_resource
*srcr
, unsigned src_level
,
240 const struct pipe_box
*src_box
)
242 static int copy_threshold
= -1;
243 struct nv04_2d_context
*ctx
= nvfx_screen(pipe
->screen
)->eng2d
;
244 struct nv04_region dst
, src
;
249 unsigned w
= src_box
->width
;
250 unsigned h
= src_box
->height
;
255 /* Fallback for buffers. */
256 if (dstr
->target
== PIPE_BUFFER
&& srcr
->target
== PIPE_BUFFER
) {
257 util_resource_copy_region(pipe
, dstr
, dst_level
, dstx
, dsty
, dstz
,
258 srcr
, src_level
, src_box
);
262 if(copy_threshold
< 0)
263 copy_threshold
= debug_get_num_option("NOUVEAU_COPY_THRESHOLD", 4);
265 dst_to_gpu
= dstr
->usage
!= PIPE_USAGE_DYNAMIC
&& dstr
->usage
!= PIPE_USAGE_STAGING
;
266 src_on_gpu
= nvfx_resource_on_gpu(srcr
);
268 nvfx_region_init_for_subresource(&dst
, dstr
, dst_level
, dstx
, dsty
, dstz
, TRUE
);
269 nvfx_region_init_for_subresource(&src
, srcr
, src_level
, src_box
->x
, src_box
->y
, src_box
->z
, FALSE
);
270 w
= util_format_get_stride(dstr
->format
, w
) >> dst
.bpps
;
271 h
= util_format_get_nblocksy(dstr
->format
, h
);
273 small
= (w
* h
<= copy_threshold
);
274 if((!dst_to_gpu
|| !src_on_gpu
) && small
)
275 ret
= -1; /* use the CPU */
277 ret
= nv04_region_copy_2d(ctx
, &dst
, &src
, w
, h
, dst_to_gpu
, src_on_gpu
);
281 && dstr
->bind
& (PIPE_BIND_RENDER_TARGET
| PIPE_BIND_DEPTH_STENCIL
)
282 && srcr
->bind
& PIPE_BIND_SAMPLER_VIEW
)
284 /* this currently works because we hack the bind flags on resource creation to be
285 * the maximum set that the resource type actually supports
287 * TODO: perhaps support reinterpreting the formats
289 struct blitter_context
* blitter
= nvfx_get_blitter(pipe
, 1);
290 util_blitter_copy_texture(blitter
, dstr
, dst_level
, dstx
, dsty
, dstz
, srcr
, src_level
, src_box
, TRUE
);
291 nvfx_put_blitter(pipe
, blitter
);
295 struct nv04_region dstt
= dst
;
296 struct nv04_region srct
= src
;
297 unsigned dstbegin
= 0;
302 nvfx_region_clone(ctx
, &srct
, w
, h
, TRUE
);
305 dstbegin
= nvfx_region_clone(ctx
, &dstt
, w
, h
, FALSE
);
308 nv04_region_copy_cpu(&dstt
, &srct
, w
, h
);
310 if(srct
.bo
!= src
.bo
)
311 nouveau_screen_bo_release(pipe
->screen
, srct
.bo
);
313 if(dstt
.bo
!= dst
.bo
)
315 nv04_memcpy(ctx
, dst
.bo
, dst
.offset
+ dstbegin
, dstt
.bo
, 0, dstt
.bo
->size
);
316 nouveau_screen_bo_release(pipe
->screen
, dstt
.bo
);
/*
 * Fill a w x h rectangle at (dx, dy) of a surface with a packed 32-bit
 * value.
 *
 * Visible here: the destination region is initialised for writing, w/h are
 * converted with util_format_get_stride() >> dst.bpps and
 * util_format_get_nblocksy(), and nv04_region_fill_2d() is tried first.
 * A positive result on a texture bindable as render target is tested for
 * separately. The remaining path fills on the CPU with
 * nv04_region_fill_cpu(), first cloning the region with
 * nvfx_region_clone() when the resource is on the GPU, then copying the
 * clone back with nv04_memcpy() and releasing it.
 *
 * The clear entry points in this file treat a non-zero return value as
 * "not filled, fall back to the blitter".
 *
 * NOTE(review): the declaration of `ret`, the body of the
 * `ret > 0 && RENDER_TARGET` test and the return statements are not
 * visible in this extract — confirm against the full file.
 */
322 nvfx_surface_fill(struct pipe_context
* pipe
, struct pipe_surface
*dsts
,
323 unsigned dx
, unsigned dy
, unsigned w
, unsigned h
, unsigned value
)
325 struct nv04_2d_context
*ctx
= nvfx_screen(pipe
->screen
)->eng2d
;
326 struct nv04_region dst
;
328 /* Always try to use the GPU right now, if possible
329 * If the user wanted the surface data on the CPU, he would have cleared with memset (hopefully) */
331 // we don't care about interior pixel order since we set them all to the same value
332 nvfx_region_init_for_surface(&dst
, (struct nvfx_surface
*)dsts
, dx
, dy
, TRUE
);
334 w
= util_format_get_stride(dsts
->format
, w
) >> dst
.bpps
;
335 h
= util_format_get_nblocksy(dsts
->format
, h
);
337 ret
= nv04_region_fill_2d(ctx
, &dst
, w
, h
, value
);
338 if(ret
> 0 && dsts
->texture
->bind
& PIPE_BIND_RENDER_TARGET
)
342 struct nv04_region dstt
= dst
;
343 unsigned dstbegin
= 0;
345 if(nvfx_resource_on_gpu(dsts
->texture
))
346 dstbegin
= nvfx_region_clone(ctx
, &dstt
, w
, h
, FALSE
);
348 nv04_region_fill_cpu(&dstt
, w
, h
, value
);
350 if(dstt
.bo
!= dst
.bo
)
352 nv04_memcpy(ctx
, dst
.bo
, dst
.offset
+ dstbegin
, dstt
.bo
, 0, dstt
.bo
->size
);
353 nouveau_screen_bo_release(pipe
->screen
, dstt
.bo
);
/*
 * Tear down the screen's 2D engine context with nv04_2d_context_takedown()
 * and clear the screen's eng2d pointer.
 */
362 nvfx_screen_surface_takedown(struct pipe_screen
*pscreen
)
364 nv04_2d_context_takedown(nvfx_screen(pscreen
)->eng2d
);
365 nvfx_screen(pscreen
)->eng2d
= 0;
/*
 * Create the 2D engine context for the screen's channel with
 * nv04_2d_context_init() and store it in the screen's eng2d pointer.
 *
 * NOTE(review): any check of `ctx` between creation and the store, and the
 * return statement, are not visible in this extract — confirm against the
 * full file.
 */
369 nvfx_screen_surface_init(struct pipe_screen
*pscreen
)
371 struct nv04_2d_context
* ctx
= nv04_2d_context_init(nouveau_screen(pscreen
)->channel
);
374 nvfx_screen(pscreen
)->eng2d
= ctx
;
/*
 * Copy the contents of a surface to or from its temporary resource.
 *
 * Visible here: the context's use_vertex_buffers, use_index_buffer and
 * base_vertex are saved before the copy and restored afterwards, and
 * NVFX_NEW_ARRAYS is set in both nvfx->dirty and nvfx->draw_dirty. The
 * surface must cover a single layer (asserted). A box of the surface's
 * width/height at z = first_layer is copied with
 * nvfx_resource_copy_region() either from the texture level into the temp
 * (level 0, origin 0,0,0) or from the temp back into the texture level.
 *
 * NOTE(review): the declaration and remaining fields of `box`, the
 * detaching/re-attaching of ns->temp, the test on `to_temp` selecting the
 * copy direction and the check described by the trailing comment are not
 * visible in this extract — confirm against the full file.
 */
379 nvfx_surface_copy_temp(struct pipe_context
* pipe
, struct pipe_surface
* surf
, int to_temp
)
381 struct nvfx_surface
* ns
= (struct nvfx_surface
*)surf
;
383 struct nvfx_context
* nvfx
= nvfx_context(pipe
);
384 struct nvfx_miptree
* temp
;
385 unsigned use_vertex_buffers
;
386 boolean use_index_buffer
;
387 unsigned base_vertex
;
389 /* temporarily detach the temp, so it isn't used in place of the actual resource */
393 // TODO: we really should do this validation before setting these variables in draw calls
394 use_vertex_buffers
= nvfx
->use_vertex_buffers
;
395 use_index_buffer
= nvfx
->use_index_buffer
;
396 base_vertex
= nvfx
->base_vertex
;
399 assert(surf
->u
.tex
.first_layer
== surf
->u
.tex
.last_layer
);
400 box
.width
= surf
->width
;
401 box
.height
= surf
->height
;
405 box
.z
= surf
->u
.tex
.first_layer
;
406 nvfx_resource_copy_region(pipe
, &temp
->base
.base
, 0, 0, 0, 0, surf
->texture
, surf
->u
.tex
.level
, &box
);
410 nvfx_resource_copy_region(pipe
, surf
->texture
, surf
->u
.tex
.level
, 0, 0, surf
->u
.tex
.first_layer
, &temp
->base
.base
, 0, &box
);
413 /* If this triggers, it probably means we attempted to use the blitter
414 * but failed due to non-renderability of the target.
415 * Obviously, this would lead to infinite recursion if supported. */
420 nvfx
->use_vertex_buffers
= use_vertex_buffers
;
421 nvfx
->use_index_buffer
= use_index_buffer
;
422 nvfx
->base_vertex
= base_vertex
;
424 nvfx
->dirty
|= NVFX_NEW_ARRAYS
;
425 nvfx
->draw_dirty
|= NVFX_NEW_ARRAYS
;
/*
 * Create the temporary resource for a surface and populate it.
 *
 * A zeroed pipe_resource template is filled in as a PIPE_TEXTURE_2D with
 * the surface's format, width and height, the texture's nr_samples and
 * NOUVEAU_RESOURCE_FLAG_LINEAR. The surface must not already have a temp
 * and must not be dirty (asserted). The miptree returned by
 * nvfx_miptree_create() is stored in ns->temp and
 * nvfx_surface_copy_temp() is called with to_temp = 1.
 *
 * NOTE(review): the result of nvfx_miptree_create() is not checked in the
 * visible lines, and at least one template field assignment is not visible
 * in this extract — confirm against the full file.
 */
429 nvfx_surface_create_temp(struct pipe_context
* pipe
, struct pipe_surface
* surf
)
431 struct nvfx_surface
* ns
= (struct nvfx_surface
*)surf
;
432 struct pipe_resource
template;
433 memset(&template, 0, sizeof(struct pipe_resource
));
434 template.target
= PIPE_TEXTURE_2D
;
435 template.format
= surf
->format
;
436 template.width0
= surf
->width
;
437 template.height0
= surf
->height
;
439 template.nr_samples
= surf
->texture
->nr_samples
;
440 template.flags
= NOUVEAU_RESOURCE_FLAG_LINEAR
;
442 assert(!ns
->temp
&& !util_dirty_surface_is_dirty(&ns
->base
));
444 ns
->temp
= (struct nvfx_miptree
*)nvfx_miptree_create(pipe
->screen
, &template);
445 nvfx_surface_copy_temp(pipe
, surf
, 1);
/*
 * Flush a surface's temporary resource and drop it.
 *
 * Calls nvfx_surface_copy_temp() with to_temp = 0, marks the surface clean
 * with util_dirty_surface_set_clean(), checks whether the surface is the
 * current framebuffer's zsbuf or one of its cbufs, and finally releases the
 * reference held in ns->temp with pipe_resource_reference(..., 0).
 *
 * NOTE(review): what is done when the surface is found bound (the bodies
 * of the zsbuf / cbufs tests and the use of `bound`) and any condition on
 * the final release are not visible in this extract — confirm.
 */
449 nvfx_surface_flush(struct pipe_context
* pipe
, struct pipe_surface
* surf
)
451 struct nvfx_context
* nvfx
= (struct nvfx_context
*)pipe
;
452 struct nvfx_surface
* ns
= (struct nvfx_surface
*)surf
;
453 boolean bound
= FALSE
;
455 nvfx_surface_copy_temp(pipe
, surf
, 0);
457 util_dirty_surface_set_clean(nvfx_surface_get_dirty_surfaces(surf
), &ns
->base
);
459 if(nvfx
->framebuffer
.zsbuf
== surf
)
463 for(unsigned i
= 0; i
< nvfx
->framebuffer
.nr_cbufs
; ++i
)
465 if(nvfx
->framebuffer
.cbufs
[i
] == surf
)
474 pipe_resource_reference((struct pipe_resource
**)&ns
->temp
, 0);
/*
 * Clear a rectangle of a colour surface; installed as
 * pipe_context::clear_render_target by nvfx_init_surface_functions().
 *
 * The colour is packed for the surface format with util_pack_color(). If
 * the format's block size exceeds 32 bits, or nvfx_surface_fill() returns
 * non-zero, the clear is done through the blitter
 * (util_blitter_clear_render_target) instead.
 *
 * NOTE(review): the declaration of `uc` is not visible in this extract.
 */
478 nvfx_clear_render_target(struct pipe_context
*pipe
,
479 struct pipe_surface
*dst
,
480 const union pipe_color_union
*color
,
481 unsigned dstx
, unsigned dsty
,
482 unsigned width
, unsigned height
)
485 util_pack_color(color
->f
, dst
->format
, &uc
);
487 if(util_format_get_blocksizebits(dst
->format
) > 32
488 || nvfx_surface_fill(pipe
, dst
, dstx
, dsty
, width
, height
, uc
.ui
))
490 // TODO: probably should use hardware clear here instead if possible
491 struct blitter_context
* blitter
= nvfx_get_blitter(pipe
, 0);
492 util_blitter_clear_render_target(blitter
, dst
, color
, dstx
, dsty
, width
, height
);
493 nvfx_put_blitter(pipe
, blitter
);
/*
 * Clear a rectangle of a depth/stencil surface; installed as
 * pipe_context::clear_depth_stencil by nvfx_init_surface_functions().
 *
 * If the format's block size exceeds 32 bits, or nvfx_surface_fill() with
 * the value from util_pack_z_stencil(format, depth, stencil) returns
 * non-zero, the clear is done through the blitter
 * (util_blitter_clear_depth_stencil) instead.
 *
 * NOTE(review): the `depth` and `stencil` parameter declarations are not
 * visible in this extract. clear_flags is only passed to the blitter path
 * in the visible lines.
 */
498 nvfx_clear_depth_stencil(struct pipe_context
*pipe
,
499 struct pipe_surface
*dst
,
500 unsigned clear_flags
,
503 unsigned dstx
, unsigned dsty
,
504 unsigned width
, unsigned height
)
506 if(util_format_get_blocksizebits(dst
->format
) > 32
507 || nvfx_surface_fill(pipe
, dst
, dstx
, dsty
, width
, height
, util_pack_z_stencil(dst
->format
, depth
, stencil
)))
509 // TODO: probably should use hardware clear here instead if possible
510 struct blitter_context
* blitter
= nvfx_get_blitter(pipe
, 0);
511 util_blitter_clear_depth_stencil(blitter
, dst
, clear_flags
, depth
, stencil
, dstx
, dsty
, width
, height
);
512 nvfx_put_blitter(pipe
, blitter
);
/*
 * Install this file's surface entry points into the context's pipe_context:
 * resource_copy_region, clear_render_target and clear_depth_stencil.
 */
518 nvfx_init_surface_functions(struct nvfx_context
*nvfx
)
520 nvfx
->pipe
.resource_copy_region
= nvfx_resource_copy_region
;
521 nvfx
->pipe
.clear_render_target
= nvfx_clear_render_target
;
522 nvfx
->pipe
.clear_depth_stencil
= nvfx_clear_depth_stencil
;