X-Git-Url: https://git.libre-soc.org/?a=blobdiff_plain;f=src%2Fgallium%2Fdrivers%2Fradeonsi%2Fsi_pm4.c;h=22c4a5b6e6efca1f90d14f65574cb0b5f260b363;hb=ae2cb7280436ab3fe24afef510d30201e54b795c;hp=bf923ec1eb686e3f6ff89afa4b71680eee2393a0;hpb=3e3d4f5e1def09f05deb9b94f3ec5862271312d2;p=mesa.git diff --git a/src/gallium/drivers/radeonsi/si_pm4.c b/src/gallium/drivers/radeonsi/si_pm4.c index bf923ec1eb6..22c4a5b6e6e 100644 --- a/src/gallium/drivers/radeonsi/si_pm4.c +++ b/src/gallium/drivers/radeonsi/si_pm4.c @@ -1,5 +1,6 @@ /* * Copyright 2012 Advanced Micro Devices, Inc. + * All Rights Reserved. * * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the "Software"), @@ -19,12 +20,8 @@ * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE * USE OR OTHER DEALINGS IN THE SOFTWARE. - * - * Authors: - * Christian König */ -#include "radeon/r600_cs.h" #include "util/u_memory.h" #include "si_pipe.h" #include "sid.h" @@ -45,8 +42,7 @@ void si_pm4_cmd_end(struct si_pm4_state *state, bool predicate) unsigned count; count = state->ndw - state->last_pm4 - 2; state->pm4[state->last_pm4] = - PKT3(state->last_opcode, count, predicate) - | PKT3_SHADER_TYPE_S(state->compute_pkt); + PKT3(state->last_opcode, count, predicate); assert(state->ndw <= SI_PM4_MAX_DW); } @@ -72,7 +68,7 @@ void si_pm4_set_reg(struct si_pm4_state *state, unsigned reg, uint32_t val) reg -= CIK_UCONFIG_REG_OFFSET; } else { - R600_ERR("Invalid register offset %08x!\n", reg); + PRINT_ERR("Invalid register offset %08x!\n", reg); return; } @@ -89,14 +85,14 @@ void si_pm4_set_reg(struct si_pm4_state *state, unsigned reg, uint32_t val) } void si_pm4_add_bo(struct si_pm4_state *state, - struct r600_resource *bo, + struct si_resource *bo, enum radeon_bo_usage usage, enum radeon_bo_priority priority) { unsigned idx = state->nbo++; assert(idx < SI_PM4_MAX_BO); - r600_resource_reference(&state->bo[idx], bo); + si_resource_reference(&state->bo[idx], bo); state->bo_usage[idx] = usage; state->bo_priority[idx] = priority; } @@ -104,18 +100,12 @@ void si_pm4_add_bo(struct si_pm4_state *state, void si_pm4_clear_state(struct si_pm4_state *state) { for (int i = 0; i < state->nbo; ++i) - r600_resource_reference(&state->bo[i], NULL); - r600_resource_reference(&state->indirect_buffer, NULL); + si_resource_reference(&state->bo[i], NULL); + si_resource_reference(&state->indirect_buffer, NULL); state->nbo = 0; state->ndw = 0; } -void si_pm4_free_state_simple(struct si_pm4_state *state) -{ - si_pm4_clear_state(state); - FREE(state); -} - void si_pm4_free_state(struct si_context *sctx, struct si_pm4_state *state, unsigned idx) @@ -127,24 +117,25 @@ void si_pm4_free_state(struct si_context *sctx, sctx->emitted.array[idx] = NULL; } - si_pm4_free_state_simple(state); + si_pm4_clear_state(state); + FREE(state); } void si_pm4_emit(struct si_context *sctx, struct si_pm4_state *state) { - struct radeon_winsys_cs *cs = sctx->b.gfx.cs; + struct radeon_cmdbuf *cs = sctx->gfx_cs; for (int i = 0; i < state->nbo; ++i) { - radeon_add_to_buffer_list(&sctx->b, &sctx->b.gfx, state->bo[i], + radeon_add_to_buffer_list(sctx, sctx->gfx_cs, state->bo[i], state->bo_usage[i], state->bo_priority[i]); } if (!state->indirect_buffer) { radeon_emit_array(cs, state->pm4, state->ndw); } else { - struct r600_resource *ib = state->indirect_buffer; + struct si_resource *ib = state->indirect_buffer; - radeon_add_to_buffer_list(&sctx->b, &sctx->b.gfx, ib, + radeon_add_to_buffer_list(sctx, sctx->gfx_cs, ib, RADEON_USAGE_READ, RADEON_PRIO_IB2); @@ -153,6 +144,9 @@ void si_pm4_emit(struct si_context *sctx, struct si_pm4_state *state) radeon_emit(cs, ib->gpu_address >> 32); radeon_emit(cs, (ib->b.b.width0 >> 2) & 0xfffff); } + + if (state->atom.emit) + state->atom.emit(sctx); } void si_pm4_reset_emitted(struct si_context *sctx) @@ -164,25 +158,27 @@ void si_pm4_reset_emitted(struct si_context *sctx) void si_pm4_upload_indirect_buffer(struct si_context *sctx, struct si_pm4_state *state) { - struct pipe_screen *screen = sctx->b.b.screen; + struct pipe_screen *screen = sctx->b.screen; unsigned aligned_ndw = align(state->ndw, 8); /* only supported on CIK and later */ - if (sctx->b.chip_class < CIK) + if (sctx->chip_class < CIK) return; assert(state->ndw); assert(aligned_ndw <= SI_PM4_MAX_DW); - r600_resource_reference(&state->indirect_buffer, NULL); - state->indirect_buffer = (struct r600_resource*) - pipe_buffer_create(screen, 0, - PIPE_USAGE_DEFAULT, aligned_ndw * 4); + si_resource_reference(&state->indirect_buffer, NULL); + /* TODO: this hangs with 1024 or higher alignment on GFX9. */ + state->indirect_buffer = + si_aligned_buffer_create(screen, 0, + PIPE_USAGE_DEFAULT, aligned_ndw * 4, + 256); if (!state->indirect_buffer) return; /* Pad the IB to 8 DWs to meet CP fetch alignment requirements. */ - if (sctx->screen->b.info.gfx_ib_pad_with_type2) { + if (sctx->screen->info.gfx_ib_pad_with_type2) { for (int i = state->ndw; i < aligned_ndw; i++) state->pm4[i] = 0x80000000; /* type2 nop packet */ } else { @@ -190,6 +186,6 @@ void si_pm4_upload_indirect_buffer(struct si_context *sctx, state->pm4[i] = 0xffff1000; /* type3 nop packet */ } - pipe_buffer_write(&sctx->b.b, &state->indirect_buffer->b.b, + pipe_buffer_write(&sctx->b, &state->indirect_buffer->b.b, 0, aligned_ndw *4, state->pm4); }