intel/nir: Lower loads and stores with > 4 components in lower_mem_access_bit_sizes
Reviewed-by: Lionel Landwerlin <lionel.g.landwerlin@intel.com>
Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/6502>
diff --git a/src/intel/compiler/brw_nir_lower_mem_access_bit_sizes.c b/src/intel/compiler/brw_nir_lower_mem_access_bit_sizes.c
index c26ea0b..4ea20fe 100644
--- a/src/intel/compiler/brw_nir_lower_mem_access_bit_sizes.c
+++ b/src/intel/compiler/brw_nir_lower_mem_access_bit_sizes.c
@@ -86,7 +86,7 @@
const unsigned bytes_read = num_components * (bit_size / 8);
const unsigned align = nir_intrinsic_align(intrin);
- if (bit_size == 32 && align >= 32 &&
+ if (bit_size == 32 && align >= 32 && intrin->num_components <= 4 &&
(!needs_scalar || intrin->num_components == 1))
return false;
@@ -169,7 +169,7 @@
assert(writemask < (1 << num_components));
if ((value->bit_size <= 32 && num_components == 1) ||
- (value->bit_size == 32 && align >= 32 &&
+ (value->bit_size == 32 && num_components <= 4 && align >= 32 &&
writemask == (1 << num_components) - 1 &&
!needs_scalar))
return false;