2 * Copyright 2010 Jerome Glisse <glisse@freedesktop.org>
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * on the rights to use, copy, modify, merge, publish, distribute, sub
8 * license, and/or sell copies of the Software, and to permit persons to whom
9 * the Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
19 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
20 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
21 * USE OR OTHER DEALINGS IN THE SOFTWARE.
25 #include "pipe/p_defines.h"
26 #include "pipe/p_state.h"
27 #include "pipe/p_context.h"
28 #include "tgsi/tgsi_scan.h"
29 #include "tgsi/tgsi_parse.h"
30 #include "tgsi/tgsi_util.h"
31 #include "util/u_blitter.h"
32 #include "util/u_double_list.h"
33 #include "util/u_format.h"
34 #include "util/u_format_s3tc.h"
35 #include "util/u_transfer.h"
36 #include "util/u_surface.h"
37 #include "util/u_pack_color.h"
38 #include "util/u_memory.h"
39 #include "util/u_inlines.h"
40 #include "util/u_simple_shaders.h"
41 #include "util/u_upload_mgr.h"
42 #include "vl/vl_decoder.h"
43 #include "vl/vl_video_buffer.h"
44 #include "os/os_time.h"
45 #include "pipebuffer/pb_buffer.h"
46 #include "radeonsi_pipe.h"
47 #include "radeon/radeon_uvd.h"
50 #include "r600_resource.h"
51 #include "radeonsi_pipe.h"
52 #include "r600_hw_context_priv.h"
/*
 * Allocate a fence slot and emit the fence into rctx's command stream.
 *
 * Runs under rscreen->fences.mutex. On first use the shared fence buffer
 * object is created and mapped into rscreen->fences.data. A pooled fence
 * whose data slot is already non-zero is unlinked from the pool; a new
 * index is taken from rscreen->fences.next_index (an error is logged once
 * next_index + 1 reaches 1024), with a fresh r600_fence_block allocated
 * whenever that index is a multiple of FENCE_BLOCK_SIZE.
 *
 * The fence gets a reference count of 1, its data slot is cleared to 0 and
 * si_context_emit_fence() is called for that slot with value 1. A sleep_bo
 * is also created and added to the context as a relocation.
 *
 * NOTE(review): the embedded source line numbers in this excerpt have gaps
 * (e.g. 86-92 and 132-135), so the error paths, the else branches and the
 * return statement are not visible here -- confirm against the full file.
 */
58 static struct r600_fence
*r600_create_fence(struct r600_context
*rctx
)
60 struct r600_screen
*rscreen
= rctx
->screen
;
61 struct r600_fence
*fence
= NULL
;
63 pipe_mutex_lock(rscreen
->fences
.mutex
);
65 if (!rscreen
->fences
.bo
) {
66 /* Create the shared buffer object */
67 rscreen
->fences
.bo
= si_resource_create_custom(&rscreen
->screen
,
70 if (!rscreen
->fences
.bo
) {
71 R600_ERR("r600: failed to create bo for fence objects\n");
/* Map the fence BO; the mapping is kept in rscreen->fences.data */
74 rscreen
->fences
.data
= rctx
->ws
->buffer_map(rscreen
->fences
.bo
->cs_buf
,
76 PIPE_TRANSFER_READ_WRITE
);
79 if (!LIST_IS_EMPTY(&rscreen
->fences
.pool
)) {
80 struct r600_fence
*entry
;
82 /* Try to find a freed fence that has been signalled */
83 LIST_FOR_EACH_ENTRY(entry
, &rscreen
->fences
.pool
, head
) {
84 if (rscreen
->fences
.data
[entry
->index
] != 0) {
85 LIST_DELINIT(&entry
->head
);
93 /* Allocate a new fence */
94 struct r600_fence_block
*block
;
97 if ((rscreen
->fences
.next_index
+ 1) >= 1024) {
98 R600_ERR("r600: too many concurrent fences\n");
102 index
= rscreen
->fences
.next_index
++;
104 if (!(index
% FENCE_BLOCK_SIZE
)) {
105 /* Allocate a new block */
106 block
= CALLOC_STRUCT(r600_fence_block
);
110 LIST_ADD(&block
->head
, &rscreen
->fences
.blocks
);
/* Take the block that rscreen->fences.blocks.next points to */
112 block
= LIST_ENTRY(struct r600_fence_block
, rscreen
->fences
.blocks
.next
, head
);
115 fence
= &block
->fences
[index
% FENCE_BLOCK_SIZE
];
116 fence
->index
= index
;
119 pipe_reference_init(&fence
->reference
, 1);
/* Clear the slot first: elsewhere in this file a non-zero slot means "signalled" */
121 rscreen
->fences
.data
[fence
->index
] = 0;
122 si_context_emit_fence(rctx
, rscreen
->fences
.bo
, fence
->index
, 1);
124 /* Create a dummy BO so that fence_finish without a timeout can sleep waiting for completion */
125 fence
->sleep_bo
= si_resource_create_custom(&rctx
->screen
->screen
, PIPE_USAGE_STAGING
, 1);
127 /* Add the fence as a dummy relocation. */
128 r600_context_bo_reloc(rctx
, fence
->sleep_bo
, RADEON_USAGE_READWRITE
);
131 pipe_mutex_unlock(rscreen
->fences
.mutex
);
/*
 * Flush the context's command stream, optionally handing back a fence.
 *
 * A fence created by r600_create_fence() is stored through the fence
 * pointer. Any active render condition is saved and disabled before
 * si_context_flush() runs, and restored through ctx->render_condition()
 * afterwards.
 *
 * NOTE(review): r600_flush_from_winsys() passes NULL for fence. The guard
 * that must protect the "*rfence = ..." store (and the one around the
 * render-condition restore) is not visible in this excerpt; embedded lines
 * 144-145 and 159 are missing -- confirm against the full file. The flags
 * parameter declaration (embedded line 137) is likewise not visible.
 */
136 void radeonsi_flush(struct pipe_context
*ctx
, struct pipe_fence_handle
**fence
,
139 struct r600_context
*rctx
= (struct r600_context
*)ctx
;
140 struct r600_fence
**rfence
= (struct r600_fence
**)fence
;
/* Saved render-condition state, restored after the flush */
141 struct pipe_query
*render_cond
= NULL
;
142 boolean render_cond_cond
= FALSE
;
143 unsigned render_cond_mode
= 0;
146 *rfence
= r600_create_fence(rctx
);
148 /* Disable render condition. */
149 if (rctx
->current_render_cond
) {
150 render_cond
= rctx
->current_render_cond
;
151 render_cond_cond
= rctx
->current_render_cond_cond
;
152 render_cond_mode
= rctx
->current_render_cond_mode
;
153 ctx
->render_condition(ctx
, NULL
, FALSE
, 0);
156 si_context_flush(rctx
, flags
);
158 /* Re-enable render condition. */
160 ctx
->render_condition(ctx
, render_cond
, render_cond_cond
, render_cond_mode
);
/*
 * pipe_context::flush hook (installed in r600_create_context()).
 *
 * Forwards to radeonsi_flush(), passing RADEON_FLUSH_END_OF_FRAME when the
 * PIPE_FLUSH_END_OF_FRAME bit is set in flags and 0 otherwise.
 *
 * NOTE(review): the declaration of the flags parameter (embedded line 166)
 * is not visible in this excerpt.
 */
164 static void r600_flush_from_st(struct pipe_context
*ctx
,
165 struct pipe_fence_handle
**fence
,
168 radeonsi_flush(ctx
, fence
,
169 flags
& PIPE_FLUSH_END_OF_FRAME
? RADEON_FLUSH_END_OF_FRAME
: 0);
/*
 * Flush callback registered with the winsys through cs_set_flush_callback()
 * in r600_create_context(). ctx is the pointer supplied at registration
 * time; it is cast to a pipe_context and flushed with the given flags,
 * without requesting a fence (NULL is passed).
 */
172 static void r600_flush_from_winsys(void *ctx
, unsigned flags
)
174 radeonsi_flush((struct pipe_context
*)ctx
, NULL
, flags
);
/*
 * pipe_context::destroy hook: tear down the state owned by an r600_context.
 *
 * Releases all descriptors and the border color table, deletes the dummy
 * pixel shader if one exists, deletes the custom depth/stencil/alpha and
 * blend states through the context's own delete hooks, drops the
 * framebuffer references, and destroys the blitter, the uploader (if any)
 * and the transfer slab pool.
 *
 * NOTE(review): this is also called from the failure paths of
 * r600_create_context(), where some members may not have been set up yet.
 * Freeing of rctx itself is not visible in this excerpt (embedded lines
 * 204-205 are missing).
 */
177 static void r600_destroy_context(struct pipe_context
*context
)
179 struct r600_context
*rctx
= (struct r600_context
*)context
;
181 si_release_all_descriptors(rctx
);
183 si_resource_reference(&rctx
->border_color_table
, NULL
);
185 if (rctx
->dummy_pixel_shader
) {
186 rctx
->context
.delete_fs_state(&rctx
->context
, rctx
->dummy_pixel_shader
);
/* Each of the three flush DSA arrays is walked for indices 0..7 */
188 for (int i
= 0; i
< 8; i
++) {
189 rctx
->context
.delete_depth_stencil_alpha_state(&rctx
->context
, rctx
->custom_dsa_flush_depth_stencil
[i
]);
190 rctx
->context
.delete_depth_stencil_alpha_state(&rctx
->context
, rctx
->custom_dsa_flush_depth
[i
]);
191 rctx
->context
.delete_depth_stencil_alpha_state(&rctx
->context
, rctx
->custom_dsa_flush_stencil
[i
]);
193 rctx
->context
.delete_depth_stencil_alpha_state(&rctx
->context
, rctx
->custom_dsa_flush_inplace
);
194 rctx
->context
.delete_blend_state(&rctx
->context
, rctx
->custom_blend_resolve
);
195 rctx
->context
.delete_blend_state(&rctx
->context
, rctx
->custom_blend_decompress
);
196 util_unreference_framebuffer_state(&rctx
->framebuffer
);
198 util_blitter_destroy(rctx
->blitter
);
200 if (rctx
->uploader
) {
201 u_upload_destroy(rctx
->uploader
);
203 util_slab_destroy(&rctx
->pool_transfers
);
/*
 * pipe_screen::context_create hook: allocate and initialise an r600_context.
 *
 * Fills in the destroy/flush hooks, caches screen, winsys, family and chip
 * class on the context, installs the blit/query/resource/surface/compute
 * function tables, selects UVD or generic vl video hooks depending on
 * rscreen->info.has_uvd, creates the GFX command stream, initialises the
 * descriptors and per-chip-class state, registers the winsys flush
 * callback, and creates the transfer slab, the uploader and the blitter.
 * Finally a dummy pixel shader is created and bound.
 *
 * Returns &rctx->context on success. When the uploader or blitter cannot be
 * created, or the chip class is unsupported, r600_destroy_context() is
 * called on the partially built context.
 *
 * NOTE(review): the allocation check for rctx, the case labels of the
 * chip-class switch and the return statements of the failure paths are not
 * visible in this excerpt (gaps in the embedded line numbers) -- confirm
 * against the full file.
 */
207 static struct pipe_context
*r600_create_context(struct pipe_screen
*screen
, void *priv
)
209 struct r600_context
*rctx
= CALLOC_STRUCT(r600_context
);
210 struct r600_screen
* rscreen
= (struct r600_screen
*)screen
;
215 rctx
->context
.screen
= screen
;
216 rctx
->context
.priv
= priv
;
217 rctx
->context
.destroy
= r600_destroy_context
;
218 rctx
->context
.flush
= r600_flush_from_st
;
220 /* Easy accessing of screen/winsys. */
221 rctx
->screen
= rscreen
;
222 rctx
->ws
= rscreen
->ws
;
223 rctx
->family
= rscreen
->family
;
224 rctx
->chip_class
= rscreen
->chip_class
;
226 si_init_blit_functions(rctx
);
227 r600_init_query_functions(rctx
);
228 r600_init_context_resource_functions(rctx
);
229 si_init_surface_functions(rctx
);
230 si_init_compute_functions(rctx
);
/* Video hooks: UVD-backed when the winsys reports has_uvd, generic vl otherwise */
232 if (rscreen
->info
.has_uvd
) {
233 rctx
->context
.create_video_codec
= radeonsi_uvd_create_decoder
;
234 rctx
->context
.create_video_buffer
= radeonsi_video_buffer_create
;
236 rctx
->context
.create_video_codec
= vl_create_decoder
;
237 rctx
->context
.create_video_buffer
= vl_video_buffer_create
;
240 rctx
->cs
= rctx
->ws
->cs_create(rctx
->ws
, RING_GFX
, NULL
);
242 si_init_all_descriptors(rctx
);
244 switch (rctx
->chip_class
) {
247 si_init_state_functions(rctx
);
248 LIST_INITHEAD(&rctx
->active_nontimer_query_list
);
250 si_init_config(rctx
);
253 R600_ERR("Unsupported chip class %d.\n", rctx
->chip_class
);
254 r600_destroy_context(&rctx
->context
);
/* The winsys calls r600_flush_from_winsys with rctx as its argument */
258 rctx
->ws
->cs_set_flush_callback(rctx
->cs
, r600_flush_from_winsys
, rctx
);
260 util_slab_create(&rctx
->pool_transfers
,
261 sizeof(struct pipe_transfer
), 64,
262 UTIL_SLAB_SINGLETHREADED
);
264 rctx
->uploader
= u_upload_create(&rctx
->context
, 1024 * 1024, 256,
265 PIPE_BIND_INDEX_BUFFER
|
266 PIPE_BIND_CONSTANT_BUFFER
);
267 if (!rctx
->uploader
) {
268 r600_destroy_context(&rctx
->context
);
272 rctx
->blitter
= util_blitter_create(&rctx
->context
);
273 if (rctx
->blitter
== NULL
) {
274 r600_destroy_context(&rctx
->context
);
278 si_get_backend_mask(rctx
); /* this emits commands and must be last */
280 rctx
->dummy_pixel_shader
=
281 util_make_fragment_cloneinput_shader(&rctx
->context
, 0,
282 TGSI_SEMANTIC_GENERIC
,
283 TGSI_INTERPOLATE_CONSTANT
);
284 rctx
->context
.bind_fs_state(&rctx
->context
, rctx
->dummy_pixel_shader
);
286 return &rctx
->context
;
/*
 * pipe_screen::get_vendor hook (installed in radeonsi_screen_create()).
 *
 * NOTE(review): only the signature is visible in this excerpt; the body
 * (embedded lines 293-295) is missing, so the returned string cannot be
 * documented from here.
 */
292 static const char* r600_get_vendor(struct pipe_screen
* pscreen
)
/*
 * Map a radeon_family value to the lowercase processor name string used
 * when building the compute IR target (see r600_get_compute_param()).
 *
 * NOTE(review): the switch header and whatever is returned for families
 * not listed below are not visible in this excerpt.
 */
297 const char *r600_get_llvm_processor_name(enum radeon_family family
)
300 case CHIP_TAHITI
: return "tahiti";
301 case CHIP_PITCAIRN
: return "pitcairn";
302 case CHIP_VERDE
: return "verde";
303 case CHIP_OLAND
: return "oland";
304 case CHIP_HAINAN
: return "hainan";
305 case CHIP_BONAIRE
: return "bonaire";
306 case CHIP_KABINI
: return "kabini";
307 case CHIP_KAVERI
: return "kaveri";
/*
 * Map a radeon_family value to a human-readable "AMD <NAME>" string.
 * Families without an explicit case yield "AMD unknown".
 */
312 static const char *r600_get_family_name(enum radeon_family family
)
315 case CHIP_TAHITI
: return "AMD TAHITI";
316 case CHIP_PITCAIRN
: return "AMD PITCAIRN";
317 case CHIP_VERDE
: return "AMD CAPE VERDE";
318 case CHIP_OLAND
: return "AMD OLAND";
319 case CHIP_HAINAN
: return "AMD HAINAN";
320 case CHIP_BONAIRE
: return "AMD BONAIRE";
321 case CHIP_KAVERI
: return "AMD KAVERI";
322 case CHIP_KABINI
: return "AMD KABINI";
323 default: return "AMD unknown";
/*
 * pipe_screen::get_name hook: return the family name string for the
 * screen's chip family, as produced by r600_get_family_name().
 */
327 static const char* r600_get_name(struct pipe_screen
* pscreen
)
329 struct r600_screen
*rscreen
= (struct r600_screen
*)pscreen
;
331 return r600_get_family_name(rscreen
->family
);
/*
 * pipe_screen::get_param hook: report integer/boolean capabilities.
 *
 * Return values that are visible in this excerpt:
 *  - PIPE_CAP_TEXTURE_MULTISAMPLE: true only when HAVE_LLVM >= 0x0304 and
 *    the screen's chip class is SI.
 *  - PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS / PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME:
 *    4 / 1 when the R600_STREAMOUT debug option is set, 0 otherwise.
 *  - PIPE_CAP_QUERY_TIMESTAMP / PIPE_CAP_QUERY_TIME_ELAPSED: true when
 *    rscreen->info.r600_clock_crystal_freq is non-zero.
 *  - PIPE_CAP_ENDIANNESS: PIPE_ENDIAN_LITTLE.
 *
 * NOTE(review): the switch header and the return statements of most case
 * groups are missing from this excerpt (gaps in the embedded line numbers),
 * so their values are not documented here. The stream-output case labels
 * appear twice; presumably the two groups sit in different preprocessor
 * branches that are not visible -- confirm against the full file.
 */
334 static int r600_get_param(struct pipe_screen
* pscreen
, enum pipe_cap param
)
336 struct r600_screen
*rscreen
= (struct r600_screen
*)pscreen
;
339 /* Supported features (boolean caps). */
340 case PIPE_CAP_TWO_SIDED_STENCIL
:
341 case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS
:
342 case PIPE_CAP_ANISOTROPIC_FILTER
:
343 case PIPE_CAP_POINT_SPRITE
:
344 case PIPE_CAP_OCCLUSION_QUERY
:
345 case PIPE_CAP_TEXTURE_SHADOW_MAP
:
346 case PIPE_CAP_TEXTURE_MIRROR_CLAMP
:
347 case PIPE_CAP_BLEND_EQUATION_SEPARATE
:
348 case PIPE_CAP_TEXTURE_SWIZZLE
:
349 case PIPE_CAP_DEPTH_CLIP_DISABLE
:
350 case PIPE_CAP_SHADER_STENCIL_EXPORT
:
351 case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR
:
352 case PIPE_CAP_MIXED_COLORBUFFER_FORMATS
:
353 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT
:
354 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER
:
356 case PIPE_CAP_SEAMLESS_CUBE_MAP
:
357 case PIPE_CAP_PRIMITIVE_RESTART
:
358 case PIPE_CAP_CONDITIONAL_RENDER
:
359 case PIPE_CAP_TEXTURE_BARRIER
:
360 case PIPE_CAP_INDEP_BLEND_ENABLE
:
361 case PIPE_CAP_INDEP_BLEND_FUNC
:
362 case PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE
:
363 case PIPE_CAP_VERTEX_COLOR_UNCLAMPED
:
364 case PIPE_CAP_VERTEX_BUFFER_OFFSET_4BYTE_ALIGNED_ONLY
:
365 case PIPE_CAP_VERTEX_BUFFER_STRIDE_4BYTE_ALIGNED_ONLY
:
366 case PIPE_CAP_VERTEX_ELEMENT_SRC_OFFSET_4BYTE_ALIGNED_ONLY
:
367 case PIPE_CAP_USER_INDEX_BUFFERS
:
368 case PIPE_CAP_USER_CONSTANT_BUFFERS
:
369 case PIPE_CAP_START_INSTANCE
:
370 case PIPE_CAP_NPOT_TEXTURES
:
371 case PIPE_CAP_PREFER_BLIT_BASED_TEXTURE_TRANSFER
:
372 case PIPE_CAP_TGSI_INSTANCEID
:
373 case PIPE_CAP_COMPUTE
:
/* Multisample textures depend on both the LLVM version and the chip class */
376 case PIPE_CAP_TEXTURE_MULTISAMPLE
:
377 return HAVE_LLVM
>= 0x0304 && rscreen
->chip_class
== SI
;
379 case PIPE_CAP_TGSI_TEXCOORD
:
382 case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT
:
385 case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT
:
388 case PIPE_CAP_GLSL_FEATURE_LEVEL
:
391 /* Unsupported features. */
392 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT
:
393 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER
:
394 case PIPE_CAP_SCALED_RESOLVE
:
395 case PIPE_CAP_TGSI_CAN_COMPACT_CONSTANTS
:
396 case PIPE_CAP_FRAGMENT_COLOR_CLAMPED
:
397 case PIPE_CAP_VERTEX_COLOR_CLAMPED
:
398 case PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION
:
399 case PIPE_CAP_USER_VERTEX_BUFFERS
:
400 case PIPE_CAP_QUERY_PIPELINE_STATISTICS
:
401 case PIPE_CAP_CUBE_MAP_ARRAY
:
402 case PIPE_CAP_TEXTURE_BUFFER_OBJECTS
:
403 case PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT
:
404 case PIPE_CAP_TEXTURE_BORDER_COLOR_QUIRK
:
405 case PIPE_CAP_MAX_TEXTURE_BUFFER_SIZE
:
/* Stream output is only advertised when the R600_STREAMOUT debug option is enabled */
410 case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS
:
411 return debug_get_bool_option("R600_STREAMOUT", FALSE
) ? 4 : 0;
412 case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME
:
413 return debug_get_bool_option("R600_STREAMOUT", FALSE
) ? 1 : 0;
414 case PIPE_CAP_MAX_STREAM_OUTPUT_SEPARATE_COMPONENTS
:
415 case PIPE_CAP_MAX_STREAM_OUTPUT_INTERLEAVED_COMPONENTS
:
418 case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS
:
419 case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME
:
420 case PIPE_CAP_MAX_STREAM_OUTPUT_SEPARATE_COMPONENTS
:
421 case PIPE_CAP_MAX_STREAM_OUTPUT_INTERLEAVED_COMPONENTS
:
425 case PIPE_CAP_MAX_TEXTURE_2D_LEVELS
:
426 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS
:
427 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS
:
429 case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS
:
431 case PIPE_CAP_MAX_COMBINED_SAMPLERS
:
434 /* Render targets. */
435 case PIPE_CAP_MAX_RENDER_TARGETS
:
436 /* FIXME some r6xx are buggy and can only do 4 */
439 /* Timer queries, present when the clock frequency is non zero. */
440 case PIPE_CAP_QUERY_TIMESTAMP
:
441 case PIPE_CAP_QUERY_TIME_ELAPSED
:
442 return rscreen
->info
.r600_clock_crystal_freq
!= 0;
444 case PIPE_CAP_MIN_TEXEL_OFFSET
:
447 case PIPE_CAP_MAX_TEXEL_OFFSET
:
449 case PIPE_CAP_ENDIANNESS
:
450 return PIPE_ENDIAN_LITTLE
;
/*
 * pipe_screen::get_paramf hook: report floating-point capabilities.
 *
 * The cases are grouped as: line/point widths, maximum texture anisotropy,
 * maximum LOD bias, and the four guard-band edges.
 *
 * NOTE(review): the switch header and every return statement are missing
 * from this excerpt, so the reported values are not documented here.
 */
455 static float r600_get_paramf(struct pipe_screen
* pscreen
,
456 enum pipe_capf param
)
459 case PIPE_CAPF_MAX_LINE_WIDTH
:
460 case PIPE_CAPF_MAX_LINE_WIDTH_AA
:
461 case PIPE_CAPF_MAX_POINT_WIDTH
:
462 case PIPE_CAPF_MAX_POINT_WIDTH_AA
:
464 case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY
:
466 case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS
:
468 case PIPE_CAPF_GUARD_BAND_LEFT
:
469 case PIPE_CAPF_GUARD_BAND_TOP
:
470 case PIPE_CAPF_GUARD_BAND_RIGHT
:
471 case PIPE_CAPF_GUARD_BAND_BOTTOM
:
/*
 * pipe_screen::get_shader_param hook: report per-shader-stage limits.
 *
 * The first group of case labels dispatches on the shader stage; the second
 * on the requested capability. Values visible in this excerpt:
 *  - PIPE_SHADER_CAP_PREFERRED_IR: PIPE_SHADER_IR_LLVM in the block that
 *    follows the PIPE_SHADER_COMPUTE label, PIPE_SHADER_IR_TGSI in the
 *    general capability switch.
 *  - PIPE_SHADER_CAP_MAX_TEMPS: 256.
 *  - PIPE_SHADER_CAP_MAX_ADDRS: 1.
 *  - PIPE_SHADER_CAP_MAX_CONSTS: 4096.
 *  - PIPE_SHADER_CAP_MAX_PREDS: 0.
 *
 * NOTE(review): both switch headers and the remaining return statements
 * are missing from this excerpt (gaps in the embedded line numbers), so how
 * the stage switch treats geometry and other stages cannot be confirmed
 * from here.
 */
477 static int r600_get_shader_param(struct pipe_screen
* pscreen
, unsigned shader
, enum pipe_shader_cap param
)
481 case PIPE_SHADER_FRAGMENT
:
482 case PIPE_SHADER_VERTEX
:
484 case PIPE_SHADER_GEOMETRY
:
485 /* TODO: support and enable geometry programs */
487 case PIPE_SHADER_COMPUTE
:
489 case PIPE_SHADER_CAP_PREFERRED_IR
:
490 return PIPE_SHADER_IR_LLVM
;
495 /* TODO: support tessellation */
500 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS
:
501 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS
:
502 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS
:
503 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS
:
505 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH
:
507 case PIPE_SHADER_CAP_MAX_INPUTS
:
509 case PIPE_SHADER_CAP_MAX_TEMPS
:
510 return 256; /* Max native temporaries. */
511 case PIPE_SHADER_CAP_MAX_ADDRS
:
512 /* FIXME Isn't this equal to TEMPS? */
513 return 1; /* Max native address registers */
514 case PIPE_SHADER_CAP_MAX_CONSTS
:
515 return 4096; /* actually only memory limits this */
516 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS
:
518 case PIPE_SHADER_CAP_MAX_PREDS
:
519 return 0; /* FIXME */
520 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED
:
522 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED
:
524 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR
:
525 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR
:
526 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR
:
527 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR
:
529 case PIPE_SHADER_CAP_INTEGERS
:
531 case PIPE_SHADER_CAP_SUBROUTINES
:
533 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS
:
535 case PIPE_SHADER_CAP_PREFERRED_IR
:
536 return PIPE_SHADER_IR_TGSI
;
/*
 * pipe_screen::get_video_param hook used when the winsys does not report
 * UVD (see radeonsi_screen_create()). Answers are delegated to the generic
 * vl helpers:
 *  - PIPE_VIDEO_CAP_SUPPORTED: vl_profile_supported().
 *  - PIPE_VIDEO_CAP_MAX_WIDTH / MAX_HEIGHT: vl_video_buffer_max_size().
 *  - PIPE_VIDEO_CAP_PREFERED_FORMAT: PIPE_FORMAT_NV12.
 *  - PIPE_VIDEO_CAP_MAX_LEVEL: vl_level_supported().
 *
 * NOTE(review): the switch header, the value returned for
 * PIPE_VIDEO_CAP_NPOT_TEXTURES and the default case are not visible in this
 * excerpt.
 */
541 static int r600_get_video_param(struct pipe_screen
*screen
,
542 enum pipe_video_profile profile
,
543 enum pipe_video_entrypoint entrypoint
,
544 enum pipe_video_cap param
)
547 case PIPE_VIDEO_CAP_SUPPORTED
:
548 return vl_profile_supported(screen
, profile
, entrypoint
);
549 case PIPE_VIDEO_CAP_NPOT_TEXTURES
:
551 case PIPE_VIDEO_CAP_MAX_WIDTH
:
552 case PIPE_VIDEO_CAP_MAX_HEIGHT
:
553 return vl_video_buffer_max_size(screen
);
554 case PIPE_VIDEO_CAP_PREFERED_FORMAT
:
555 return PIPE_FORMAT_NV12
;
556 case PIPE_VIDEO_CAP_MAX_LEVEL
:
557 return vl_level_supported(screen
, profile
);
/*
 * pipe_screen::get_compute_param hook.
 *
 * Each capability writes its answer through ret and returns the size in
 * bytes of that answer:
 *  - IR_TARGET: the string "<gpu>-r600--", where <gpu> comes from
 *    r600_get_llvm_processor_name(); returns 8 + strlen(gpu).
 *  - GRID_DIMENSION: one uint64_t, value 3.
 *  - MAX_GRID_SIZE / MAX_BLOCK_SIZE: three uint64_t values each.
 *  - MAX_THREADS_PER_BLOCK: 256.
 *  - MAX_GLOBAL_SIZE: 2000000000.
 *  - MAX_LOCAL_SIZE: 32768.
 *  - MAX_INPUT_SIZE: 1024.
 *  - MAX_MEM_ALLOC_SIZE: a quarter of MAX_GLOBAL_SIZE, obtained by calling
 *    this function recursively.
 * Unknown capabilities are reported on stderr.
 *
 * NOTE(review): the declaration of ret, the switch header, any NULL checks
 * on ret, and some of the array stores (e.g. the third grid size and all
 * block sizes) are missing from this excerpt -- confirm against the full
 * file before relying on ret being optional.
 */
563 static int r600_get_compute_param(struct pipe_screen
*screen
,
564 enum pipe_compute_cap param
,
567 struct r600_screen
*rscreen
= (struct r600_screen
*)screen
;
568 //TODO: select these params by asic
570 case PIPE_COMPUTE_CAP_IR_TARGET
: {
571 const char *gpu
= r600_get_llvm_processor_name(rscreen
->family
);
573 sprintf(ret
, "%s-r600--", gpu
);
/* 8 == strlen("-r600--") plus the terminating NUL */
575 return (8 + strlen(gpu
)) * sizeof(char);
577 case PIPE_COMPUTE_CAP_GRID_DIMENSION
:
579 uint64_t * grid_dimension
= ret
;
580 grid_dimension
[0] = 3;
582 return 1 * sizeof(uint64_t);
583 case PIPE_COMPUTE_CAP_MAX_GRID_SIZE
:
585 uint64_t * grid_size
= ret
;
586 grid_size
[0] = 65535;
587 grid_size
[1] = 65535;
590 return 3 * sizeof(uint64_t) ;
592 case PIPE_COMPUTE_CAP_MAX_BLOCK_SIZE
:
594 uint64_t * block_size
= ret
;
599 return 3 * sizeof(uint64_t);
600 case PIPE_COMPUTE_CAP_MAX_THREADS_PER_BLOCK
:
602 uint64_t * max_threads_per_block
= ret
;
603 *max_threads_per_block
= 256;
605 return sizeof(uint64_t);
607 case PIPE_COMPUTE_CAP_MAX_GLOBAL_SIZE
:
609 uint64_t *max_global_size
= ret
;
610 /* XXX: Not sure what to put here. */
611 *max_global_size
= 2000000000;
613 return sizeof(uint64_t);
614 case PIPE_COMPUTE_CAP_MAX_LOCAL_SIZE
:
616 uint64_t *max_local_size
= ret
;
617 /* Value reported by the closed source driver. */
618 *max_local_size
= 32768;
620 return sizeof(uint64_t);
621 case PIPE_COMPUTE_CAP_MAX_INPUT_SIZE
:
623 uint64_t *max_input_size
= ret
;
624 /* Value reported by the closed source driver. */
625 *max_input_size
= 1024;
627 return sizeof(uint64_t);
628 case PIPE_COMPUTE_CAP_MAX_MEM_ALLOC_SIZE
:
630 uint64_t max_global_size
;
631 uint64_t *max_mem_alloc_size
= ret
;
/* Derive the allocation limit from the global size reported above */
632 r600_get_compute_param(screen
, PIPE_COMPUTE_CAP_MAX_GLOBAL_SIZE
, &max_global_size
);
633 *max_mem_alloc_size
= max_global_size
/ 4;
635 return sizeof(uint64_t);
637 fprintf(stderr
, "unknown PIPE_COMPUTE_CAP %d\n", param
);
/*
 * pipe_screen::destroy hook.
 *
 * When the fence buffer object exists, every r600_fence_block is unlinked
 * from rscreen->fences.blocks, and the fence BO is unmapped and
 * unreferenced. The trace BO, if present, is unmapped and unreferenced as
 * well. Finally the fences mutex and the winsys are destroyed.
 *
 * NOTE(review): freeing of the unlinked blocks and of rscreen itself is not
 * visible in this excerpt (gaps in the embedded line numbers) -- confirm
 * against the full file.
 */
642 static void r600_destroy_screen(struct pipe_screen
* pscreen
)
644 struct r600_screen
*rscreen
= (struct r600_screen
*)pscreen
;
649 if (rscreen
->fences
.bo
) {
650 struct r600_fence_block
*entry
, *tmp
;
/* The _SAFE variant is used because entries are unlinked while iterating */
652 LIST_FOR_EACH_ENTRY_SAFE(entry
, tmp
, &rscreen
->fences
.blocks
, head
) {
653 LIST_DEL(&entry
->head
);
657 rscreen
->ws
->buffer_unmap(rscreen
->fences
.bo
->cs_buf
);
658 si_resource_reference(&rscreen
->fences
.bo
, NULL
);
662 if (rscreen
->trace_bo
) {
663 rscreen
->ws
->buffer_unmap(rscreen
->trace_bo
->cs_buf
);
664 pipe_resource_reference((struct pipe_resource
**)&rscreen
->trace_bo
, NULL
);
668 pipe_mutex_destroy(rscreen
->fences
.mutex
);
670 rscreen
->ws
->destroy(rscreen
->ws
);
/*
 * pipe_screen::fence_reference hook: make *ptr refer to fence.
 *
 * pipe_reference() updates the reference counts of the old and new fences.
 * When it reports that the old fence should be destroyed, the old fence's
 * sleep_bo is released and the fence is appended to the tail of
 * rscreen->fences.pool, both under rscreen->fences.mutex, so that
 * r600_create_fence() can pick it up again.
 *
 * NOTE(review): the final store of the new fence into *ptr is not visible
 * in this excerpt (embedded lines 687-690 are missing).
 */
674 static void r600_fence_reference(struct pipe_screen
*pscreen
,
675 struct pipe_fence_handle
**ptr
,
676 struct pipe_fence_handle
*fence
)
678 struct r600_fence
**oldf
= (struct r600_fence
**)ptr
;
679 struct r600_fence
*newf
= (struct r600_fence
*)fence
;
681 if (pipe_reference(&(*oldf
)->reference
, &newf
->reference
)) {
682 struct r600_screen
*rscreen
= (struct r600_screen
*)pscreen
;
683 pipe_mutex_lock(rscreen
->fences
.mutex
);
684 si_resource_reference(&(*oldf
)->sleep_bo
, NULL
);
685 LIST_ADDTAIL(&(*oldf
)->head
, &rscreen
->fences
.pool
);
686 pipe_mutex_unlock(rscreen
->fences
.mutex
);
/*
 * pipe_screen::fence_signalled hook: a fence counts as signalled once its
 * slot in the mapped fence buffer (rscreen->fences.data) is non-zero.
 * This only reads the slot; it does not wait.
 */
692 static boolean
r600_fence_signalled(struct pipe_screen
*pscreen
,
693 struct pipe_fence_handle
*fence
)
695 struct r600_screen
*rscreen
= (struct r600_screen
*)pscreen
;
696 struct r600_fence
*rfence
= (struct r600_fence
*)fence
;
698 return rscreen
->fences
.data
[rfence
->index
] != 0;
/*
 * pipe_screen::fence_finish hook: wait for a fence, with optional timeout.
 *
 * Loops while the fence's slot in rscreen->fences.data is still 0. With
 * timeout == PIPE_TIMEOUT_INFINITE the loop waits on the fence's sleep_bo
 * through the winsys buffer_wait(); it also checks buffer_is_busy() on
 * that BO (see the comment in the loop). For a finite timeout the time
 * elapsed since start_time is compared against timeout. The return value is
 * whether the slot is non-zero when the loop ends.
 *
 * NOTE(review): the declaration of timeout, its unit conversion, and the
 * statements executed when the BO is idle or the timeout expires are
 * missing from this excerpt (gaps in the embedded line numbers).
 */
701 static boolean
r600_fence_finish(struct pipe_screen
*pscreen
,
702 struct pipe_fence_handle
*fence
,
705 struct r600_screen
*rscreen
= (struct r600_screen
*)pscreen
;
706 struct r600_fence
*rfence
= (struct r600_fence
*)fence
;
707 int64_t start_time
= 0;
710 if (timeout
!= PIPE_TIMEOUT_INFINITE
) {
711 start_time
= os_time_get();
713 /* Convert to microseconds. */
717 while (rscreen
->fences
.data
[rfence
->index
] == 0) {
718 /* Special-case infinite timeout - wait for the dummy BO to become idle */
719 if (timeout
== PIPE_TIMEOUT_INFINITE
) {
720 rscreen
->ws
->buffer_wait(rfence
->sleep_bo
->buf
, RADEON_USAGE_READWRITE
);
724 /* The dummy BO will be busy until the CS including the fence has completed, or
725 * the GPU is reset. Don't bother continuing to spin when the BO is idle. */
726 if (!rscreen
->ws
->buffer_is_busy(rfence
->sleep_bo
->buf
, RADEON_USAGE_READWRITE
))
736 if (timeout
!= PIPE_TIMEOUT_INFINITE
&&
737 os_time_get() - start_time
>= timeout
) {
742 return rscreen
->fences
.data
[rfence
->index
] != 0;
/*
 * Decode the packed tiling_config word into rscreen->tiling_info.
 *
 * Three bit fields are decoded:
 *  - bits 0-3  select num_channels (1, 2, 4 or 8),
 *  - bits 4-7  select num_banks (4, 8 or 16),
 *  - bits 8-11 select group_bytes (256 or 512).
 *
 * NOTE(review): the case labels, the default branches and the return
 * values are missing from this excerpt. r600_init_tiling() returns this
 * function's result and radeonsi_screen_create() tests that for non-zero,
 * so presumably non-zero signals an undecodable field -- confirm against
 * the full file.
 */
745 static int evergreen_interpret_tiling(struct r600_screen
*rscreen
, uint32_t tiling_config
)
747 switch (tiling_config
& 0xf) {
749 rscreen
->tiling_info
.num_channels
= 1;
752 rscreen
->tiling_info
.num_channels
= 2;
755 rscreen
->tiling_info
.num_channels
= 4;
758 rscreen
->tiling_info
.num_channels
= 8;
764 switch ((tiling_config
& 0xf0) >> 4) {
766 rscreen
->tiling_info
.num_banks
= 4;
769 rscreen
->tiling_info
.num_banks
= 8;
772 rscreen
->tiling_info
.num_banks
= 16;
778 switch ((tiling_config
& 0xf00) >> 8) {
780 rscreen
->tiling_info
.group_bytes
= 256;
783 rscreen
->tiling_info
.group_bytes
= 512;
/*
 * Initialise rscreen->tiling_info from the winsys-reported tiling config.
 *
 * group_bytes is first set to a default of 512, then
 * evergreen_interpret_tiling() decodes rscreen->info.r600_tiling_config and
 * its result is returned.
 *
 * NOTE(review): embedded lines 797-800 are missing from this excerpt, so
 * any early-out between the default and the decode call is not visible.
 */
791 static int r600_init_tiling(struct r600_screen
*rscreen
)
793 uint32_t tiling_config
= rscreen
->info
.r600_tiling_config
;
795 /* set default group bytes, overridden by tiling info ioctl */
796 rscreen
->tiling_info
.group_bytes
= 512;
801 return evergreen_interpret_tiling(rscreen
, tiling_config
);
/*
 * pipe_screen::get_timestamp hook.
 *
 * Returns the winsys RADEON_TIMESTAMP query value multiplied by 1000000
 * and divided by rscreen->info.r600_clock_crystal_freq.
 *
 * NOTE(review): the multiplication happens before the division; whether it
 * can overflow depends on the return type of query_value(), which is not
 * visible here. A zero r600_clock_crystal_freq would divide by zero;
 * r600_get_param() only advertises timer queries when it is non-zero.
 */
804 static uint64_t r600_get_timestamp(struct pipe_screen
*screen
)
806 struct r600_screen
*rscreen
= (struct r600_screen
*)screen
;
808 return 1000000 * rscreen
->ws
->query_value(rscreen
->ws
, RADEON_TIMESTAMP
) /
809 rscreen
->info
.r600_clock_crystal_freq
;
/*
 * Translate a PCI device id into a CHIP_* family value.
 *
 * The CHIPSET() macro turns every entry of the included PCI id table into
 * a "case <pciid>: return CHIP_<family>;" label.
 *
 * NOTE(review): the enclosing switch and the fallback return are missing
 * from this excerpt; radeonsi_screen_create() compares the result against
 * CHIP_UNKNOWN, so presumably that is the fallback -- confirm.
 */
812 static unsigned radeon_family_from_device(unsigned device
)
815 #define CHIPSET(pciid, name, family) case pciid: return CHIP_##family;
816 #include "pci_ids/radeonsi_pci_ids.h"
/*
 * Create the radeonsi pipe_screen on top of the given winsys.
 *
 * Steps visible in this excerpt:
 *  1. Allocate the r600_screen and query device info from the winsys.
 *  2. Derive the chip family from the PCI id (unknown ids are reported on
 *     stderr) and the chip class from the family: CIK for
 *     family >= CHIP_BONAIRE, SI for family >= CHIP_TAHITI, anything else
 *     is reported as unsupported.
 *  3. Initialise the tiling info.
 *  4. Install the pipe_screen hooks, choosing the UVD or the generic vl
 *     video hooks depending on rscreen->info.has_uvd.
 *  5. Initialise S3TC support and the fence bookkeeping (no BO yet, empty
 *     pool and block lists, mutex).
 *  6. For drm_minor >= 28, create the trace buffer and map it into
 *     rscreen->trace_ptr.
 * Returns &rscreen->screen on success.
 *
 * NOTE(review): the failure-path cleanups and returns, the assignment of
 * rscreen->ws, and the arguments of the trace buffer creation are missing
 * from this excerpt (gaps in the embedded line numbers) -- confirm against
 * the full file.
 */
823 struct pipe_screen
*radeonsi_screen_create(struct radeon_winsys
*ws
)
825 struct r600_screen
*rscreen
= CALLOC_STRUCT(r600_screen
);
826 if (rscreen
== NULL
) {
831 ws
->query_info(ws
, &rscreen
->info
);
833 rscreen
->family
= radeon_family_from_device(rscreen
->info
.pci_id
);
834 if (rscreen
->family
== CHIP_UNKNOWN
) {
835 fprintf(stderr
, "r600: Unknown chipset 0x%04X\n", rscreen
->info
.pci_id
);
/* Chip class follows from the family's position in the radeon_family enum */
841 if (rscreen
->family
>= CHIP_BONAIRE
) {
842 rscreen
->chip_class
= CIK
;
843 } else if (rscreen
->family
>= CHIP_TAHITI
) {
844 rscreen
->chip_class
= SI
;
846 fprintf(stderr
, "r600: Unsupported family %d\n", rscreen
->family
);
851 if (r600_init_tiling(rscreen
)) {
/* Install the pipe_screen entry points */
856 rscreen
->screen
.destroy
= r600_destroy_screen
;
857 rscreen
->screen
.get_name
= r600_get_name
;
858 rscreen
->screen
.get_vendor
= r600_get_vendor
;
859 rscreen
->screen
.get_param
= r600_get_param
;
860 rscreen
->screen
.get_shader_param
= r600_get_shader_param
;
861 rscreen
->screen
.get_paramf
= r600_get_paramf
;
862 rscreen
->screen
.get_compute_param
= r600_get_compute_param
;
863 rscreen
->screen
.get_timestamp
= r600_get_timestamp
;
864 rscreen
->screen
.is_format_supported
= si_is_format_supported
;
865 rscreen
->screen
.context_create
= r600_create_context
;
866 rscreen
->screen
.fence_reference
= r600_fence_reference
;
867 rscreen
->screen
.fence_signalled
= r600_fence_signalled
;
868 rscreen
->screen
.fence_finish
= r600_fence_finish
;
869 r600_init_screen_resource_functions(&rscreen
->screen
);
871 if (rscreen
->info
.has_uvd
) {
872 rscreen
->screen
.get_video_param
= ruvd_get_video_param
;
873 rscreen
->screen
.is_video_format_supported
= ruvd_is_format_supported
;
875 rscreen
->screen
.get_video_param
= r600_get_video_param
;
876 rscreen
->screen
.is_video_format_supported
= vl_video_buffer_is_format_supported
;
879 util_format_s3tc_init();
/* Fence state starts empty; the fence BO is created on first use in r600_create_fence() */
881 rscreen
->fences
.bo
= NULL
;
882 rscreen
->fences
.data
= NULL
;
883 rscreen
->fences
.next_index
= 0;
884 LIST_INITHEAD(&rscreen
->fences
.pool
);
885 LIST_INITHEAD(&rscreen
->fences
.blocks
);
886 pipe_mutex_init(rscreen
->fences
.mutex
);
889 rscreen
->cs_count
= 0;
890 if (rscreen
->info
.drm_minor
>= 28) {
891 rscreen
->trace_bo
= (struct si_resource
*)pipe_buffer_create(&rscreen
->screen
,
895 if (rscreen
->trace_bo
) {
896 rscreen
->trace_ptr
= rscreen
->ws
->buffer_map(rscreen
->trace_bo
->cs_buf
, NULL
,
897 PIPE_TRANSFER_UNSYNCHRONIZED
);
902 return &rscreen
->screen
;