intel/fs: Implement nir_intrinsic_{load,store}_ssbo_block_intel
Reviewed-by: Jason Ekstrand <jason@jlekstrand.net>
Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/7448>
This commit is contained in:
parent
d372abe397
commit
9fe158e1d1
|
@ -4003,7 +4003,10 @@ fs_visitor::get_nir_ssbo_intrinsic_index(const brw::fs_builder &bld,
|
|||
nir_intrinsic_instr *instr)
|
||||
{
|
||||
/* SSBO stores are weird in that their index is in src[1] */
|
||||
const unsigned src = instr->intrinsic == nir_intrinsic_store_ssbo ? 1 : 0;
|
||||
const bool is_store =
|
||||
instr->intrinsic == nir_intrinsic_store_ssbo ||
|
||||
instr->intrinsic == nir_intrinsic_store_ssbo_block_intel;
|
||||
const unsigned src = is_store ? 1 : 0;
|
||||
|
||||
if (nir_src_is_const(instr->src[src])) {
|
||||
unsigned index = stage_prog_data->binding_table.ssbo_start +
|
||||
|
@ -5421,6 +5424,80 @@ fs_visitor::nir_emit_intrinsic(const fs_builder &bld, nir_intrinsic_instr *instr
|
|||
break;
|
||||
}
|
||||
|
||||
case nir_intrinsic_load_ssbo_block_intel: {
|
||||
assert(nir_dest_bit_size(instr->dest) == 32);
|
||||
|
||||
fs_reg address = bld.emit_uniformize(get_nir_src(instr->src[1]));
|
||||
|
||||
fs_reg srcs[SURFACE_LOGICAL_NUM_SRCS];
|
||||
srcs[SURFACE_LOGICAL_SRC_SURFACE] = get_nir_ssbo_intrinsic_index(bld, instr);
|
||||
srcs[SURFACE_LOGICAL_SRC_ADDRESS] = address;
|
||||
|
||||
const fs_builder ubld1 = bld.exec_all().group(1, 0);
|
||||
const fs_builder ubld8 = bld.exec_all().group(8, 0);
|
||||
const fs_builder ubld16 = bld.exec_all().group(16, 0);
|
||||
|
||||
const unsigned total = instr->num_components * dispatch_width;
|
||||
unsigned loaded = 0;
|
||||
|
||||
while (loaded < total) {
|
||||
const unsigned block =
|
||||
choose_oword_block_size_dwords(total - loaded);
|
||||
const unsigned block_bytes = block * 4;
|
||||
|
||||
srcs[SURFACE_LOGICAL_SRC_IMM_ARG] = brw_imm_ud(block);
|
||||
|
||||
const fs_builder &ubld = block == 8 ? ubld8 : ubld16;
|
||||
ubld.emit(SHADER_OPCODE_UNALIGNED_OWORD_BLOCK_READ_LOGICAL,
|
||||
retype(byte_offset(dest, loaded * 4), BRW_REGISTER_TYPE_UD),
|
||||
srcs, SURFACE_LOGICAL_NUM_SRCS)->size_written = block_bytes;
|
||||
|
||||
ubld1.ADD(address, address, brw_imm_ud(block_bytes));
|
||||
loaded += block;
|
||||
}
|
||||
|
||||
assert(loaded == total);
|
||||
break;
|
||||
}
|
||||
|
||||
case nir_intrinsic_store_ssbo_block_intel: {
|
||||
assert(nir_src_bit_size(instr->src[0]) == 32);
|
||||
|
||||
fs_reg address = bld.emit_uniformize(get_nir_src(instr->src[2]));
|
||||
fs_reg src = get_nir_src(instr->src[0]);
|
||||
|
||||
fs_reg srcs[SURFACE_LOGICAL_NUM_SRCS];
|
||||
srcs[SURFACE_LOGICAL_SRC_SURFACE] = get_nir_ssbo_intrinsic_index(bld, instr);
|
||||
srcs[SURFACE_LOGICAL_SRC_ADDRESS] = address;
|
||||
|
||||
const fs_builder ubld1 = bld.exec_all().group(1, 0);
|
||||
const fs_builder ubld8 = bld.exec_all().group(8, 0);
|
||||
const fs_builder ubld16 = bld.exec_all().group(16, 0);
|
||||
|
||||
const unsigned total = instr->num_components * dispatch_width;
|
||||
unsigned written = 0;
|
||||
|
||||
while (written < total) {
|
||||
const unsigned block =
|
||||
choose_oword_block_size_dwords(total - written);
|
||||
|
||||
srcs[SURFACE_LOGICAL_SRC_IMM_ARG] = brw_imm_ud(block);
|
||||
srcs[SURFACE_LOGICAL_SRC_DATA] =
|
||||
retype(byte_offset(src, written * 4), BRW_REGISTER_TYPE_UD);
|
||||
|
||||
const fs_builder &ubld = block == 8 ? ubld8 : ubld16;
|
||||
ubld.emit(SHADER_OPCODE_OWORD_BLOCK_WRITE_LOGICAL,
|
||||
fs_reg(), srcs, SURFACE_LOGICAL_NUM_SRCS);
|
||||
|
||||
const unsigned block_bytes = block * 4;
|
||||
ubld1.ADD(address, address, brw_imm_ud(block_bytes));
|
||||
written += block;
|
||||
}
|
||||
|
||||
assert(written == total);
|
||||
break;
|
||||
}
|
||||
|
||||
default:
|
||||
unreachable("unknown intrinsic");
|
||||
}
|
||||
|
|
Loading…
Reference in New Issue