X-Git-Url: https://git.libre-soc.org/?a=blobdiff_plain;f=src%2Fmesa%2Fdrivers%2Fdri%2Fi965%2Fgen8_vec4_generator.cpp;h=0c54e6ddd749d5aa9a865b74853bb91bb7be564e;hb=4a2f0e305ce30ac4dfc2ad3c380711a7aff3f63b;hp=b854db542d03f19f0e5cde50d46f3e199f082e82;hpb=a76e5dce4fc8d50f8699c108833f24e80167d706;p=mesa.git diff --git a/src/mesa/drivers/dri/i965/gen8_vec4_generator.cpp b/src/mesa/drivers/dri/i965/gen8_vec4_generator.cpp index b854db542d0..0c54e6ddd74 100644 --- a/src/mesa/drivers/dri/i965/gen8_vec4_generator.cpp +++ b/src/mesa/drivers/dri/i965/gen8_vec4_generator.cpp @@ -48,15 +48,6 @@ gen8_vec4_generator::~gen8_vec4_generator() { } -void -gen8_vec4_generator::mark_surface_used(unsigned surf_index) -{ - assert(surf_index < BRW_MAX_SURFACES); - - prog_data->base.binding_table.size_bytes = - MAX2(prog_data->base.binding_table.size_bytes, (surf_index + 1) * 4); -} - void gen8_vec4_generator::generate_tex(vec4_instruction *ir, struct brw_reg dst) { @@ -157,7 +148,7 @@ gen8_vec4_generator::generate_tex(vec4_instruction *ir, struct brw_reg dst) ir->header_present, BRW_SAMPLER_SIMD_MODE_SIMD4X2); - mark_surface_used(surf_index); + brw_mark_surface_used(&prog_data->base, surf_index); } void @@ -461,9 +452,66 @@ gen8_vec4_generator::generate_pull_constant_load(vec4_instruction *inst, false, /* no header */ false); /* EOT */ - mark_surface_used(surf_index); + brw_mark_surface_used(&prog_data->base, surf_index); } +void +gen8_vec4_generator::generate_untyped_atomic(vec4_instruction *ir, + struct brw_reg dst, + struct brw_reg atomic_op, + struct brw_reg surf_index) +{ + assert(atomic_op.file == BRW_IMMEDIATE_VALUE && + atomic_op.type == BRW_REGISTER_TYPE_UD && + surf_index.file == BRW_IMMEDIATE_VALUE && + surf_index.type == BRW_REGISTER_TYPE_UD); + assert((atomic_op.dw1.ud & ~0xf) == 0); + + unsigned msg_control = + atomic_op.dw1.ud | /* Atomic Operation Type: BRW_AOP_* */ + (1 << 5); /* Return data expected */ + + gen8_instruction *inst = next_inst(BRW_OPCODE_SEND); + gen8_set_dst(brw, inst, retype(dst, BRW_REGISTER_TYPE_UD)); + gen8_set_src0(brw, inst, brw_message_reg(ir->base_mrf)); + gen8_set_dp_message(brw, inst, HSW_SFID_DATAPORT_DATA_CACHE_1, + surf_index.dw1.ud, + HSW_DATAPORT_DC_PORT1_UNTYPED_ATOMIC_OP_SIMD4X2, + msg_control, + ir->mlen, + 1, + ir->header_present, + false); + + brw_mark_surface_used(&prog_data->base, surf_index.dw1.ud); +} + + + +void +gen8_vec4_generator::generate_untyped_surface_read(vec4_instruction *ir, + struct brw_reg dst, + struct brw_reg surf_index) +{ + assert(surf_index.file == BRW_IMMEDIATE_VALUE && + surf_index.type == BRW_REGISTER_TYPE_UD); + + gen8_instruction *inst = next_inst(BRW_OPCODE_SEND); + gen8_set_dst(brw, inst, retype(dst, BRW_REGISTER_TYPE_UD)); + gen8_set_src0(brw, inst, brw_message_reg(ir->base_mrf)); + gen8_set_dp_message(brw, inst, HSW_SFID_DATAPORT_DATA_CACHE_1, + surf_index.dw1.ud, + HSW_DATAPORT_DC_PORT1_UNTYPED_SURFACE_READ, + 0xe, /* enable only the R channel */ + ir->mlen, + 1, + ir->header_present, + false); + + brw_mark_surface_used(&prog_data->base, surf_index.dw1.ud); +} + + void gen8_vec4_generator::generate_vec4_instruction(vec4_instruction *instruction, struct brw_reg dst, @@ -770,11 +818,11 @@ gen8_vec4_generator::generate_vec4_instruction(vec4_instruction *instruction, break; case SHADER_OPCODE_UNTYPED_ATOMIC: - assert(!"XXX: Missing Gen8 vec4 support for UNTYPED_ATOMIC"); + generate_untyped_atomic(ir, dst, src[0], src[1]); break; case SHADER_OPCODE_UNTYPED_SURFACE_READ: - assert(!"XXX: Missing Gen8 vec4 support for UNTYPED_SURFACE_READ"); + generate_untyped_surface_read(ir, dst, src[0]); break; case VS_OPCODE_UNPACK_FLAGS_SIMD4X2: @@ -862,7 +910,7 @@ gen8_vec4_generator::generate_code(exec_list *instructions) } if (unlikely(debug_flag)) { - disassemble(stderr, last_native_inst_offset, next_inst_offset); + gen8_dump_compile(brw, store, last_native_inst_offset, next_inst_offset, stderr); } last_native_inst_offset = next_inst_offset; @@ -880,7 +928,7 @@ gen8_vec4_generator::generate_code(exec_list *instructions) * case you're doing that. */ if (0 && unlikely(debug_flag)) { - disassemble(stderr, 0, next_inst_offset); + gen8_dump_compile(brw, store, 0, next_inst_offset, stderr); } }