aco: workaround disassembler bug of v_writelane_b32 with literal

Signed-off-by: Rhys Perry <pendingchaos02@gmail.com>
Reviewed-by: Daniel Schürmann <daniel@schuermann.dev>
Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/6662>
diff --git a/src/amd/compiler/aco_print_asm.cpp b/src/amd/compiler/aco_print_asm.cpp
index ce12aac..b9a6226 100644
--- a/src/amd/compiler/aco_print_asm.cpp
+++ b/src/amd/compiler/aco_print_asm.cpp
@@ -153,6 +153,13 @@
                                        (exec_size - pos) * sizeof(uint32_t), pos * 4,
                                        outline, sizeof(outline));
 
+      if (program->chip_class >= GFX10 && l == 8 &&
+          ((binary[pos] & 0xffff0000) == 0xd7610000) &&
+          ((binary[pos + 1] & 0x1ff) == 0xff)) {
+         /* v_writelane with literal uses 3 dwords but llvm consumes only 2 */
+         l += 4;
+      }
+
       size_t new_pos;
       if (!l &&
           ((program->chip_class >= GFX9 && (binary[pos] & 0xffff8000) == 0xd1348000) || /* v_add_u32_e64 + clamp */