i965/vec4: emit correctly load_inputs for 64bit data
For dvec3 and dvec4 types, a single GRF do not have enough space to allocate two inputs from two different vertices (SIMD4x2). So the GRF only contains first two components for the two vertices, and the next GRF has the remaining components. We want to put all the components for the same vertex in the same register. Thus, we do a shuffle to reorder the data. Reviewed-by: Jordan Justen <jordan.l.justen@intel.com>
This commit is contained in:
parent
58fdb85f0f
commit
f51a5b51ab
|
@ -417,15 +417,24 @@ vec4_visitor::nir_emit_intrinsic(nir_intrinsic_instr *instr)
|
|||
/* We set EmitNoIndirectInput for VS */
|
||||
assert(const_offset);
|
||||
|
||||
src = src_reg(ATTR, instr->const_index[0] + const_offset->u32[0],
|
||||
glsl_type::uvec4_type);
|
||||
/* Swizzle source based on component layout qualifier */
|
||||
src.swizzle = BRW_SWZ_COMP_INPUT(nir_intrinsic_component(instr));
|
||||
|
||||
dest = get_nir_dest(instr->dest, src.type);
|
||||
dest = get_nir_dest(instr->dest);
|
||||
dest.writemask = brw_writemask_for_size(instr->num_components);
|
||||
|
||||
emit(MOV(dest, src));
|
||||
src = src_reg(ATTR, instr->const_index[0] + const_offset->u32[0],
|
||||
glsl_type::uvec4_type);
|
||||
src = retype(src, dest.type);
|
||||
|
||||
bool is_64bit = nir_dest_bit_size(instr->dest) == 64;
|
||||
if (is_64bit) {
|
||||
dst_reg tmp = dst_reg(this, glsl_type::dvec4_type);
|
||||
src.swizzle = BRW_SWIZZLE_XYZW;
|
||||
shuffle_64bit_data(tmp, src, false);
|
||||
emit(MOV(dest, src_reg(tmp)));
|
||||
} else {
|
||||
/* Swizzle source based on component layout qualifier */
|
||||
src.swizzle = BRW_SWZ_COMP_INPUT(nir_intrinsic_component(instr));
|
||||
emit(MOV(dest, src));
|
||||
}
|
||||
break;
|
||||
}
|
||||
|
||||
|
|
Loading…
Reference in New Issue