# Disassembler tests for image instruction encodings on tonga and gfx810.
# RUN: llvm-mc -arch=amdgcn -mcpu=tonga -disassemble -show-encoding < %s | FileCheck %s -check-prefix=VI -check-prefix=GFX80
|
|
# RUN: llvm-mc -arch=amdgcn -mcpu=gfx810 -disassemble -show-encoding < %s | FileCheck %s -check-prefix=VI -check-prefix=GFX81
|
|
|
|
#===------------------------------------------------------------------------===#
|
|
# Image load/store
|
|
#===------------------------------------------------------------------------===#
|
|
|
|
# VI: image_load v[0:3], v4, s[8:15] dmask:0xf unorm ; encoding: [0x00,0x1f,0x00,0xf0,0x04,0x00,0x02,0x00]
|
|
0x00 0x1f 0x00 0xf0 0x04 0x00 0x02 0x00
|
|
|
|
# VI: image_load v[0:2], v4, s[8:15] dmask:0xe unorm ; encoding: [0x00,0x1e,0x00,0xf0,0x04,0x00,0x02,0x00]
|
|
0x00 0x1e 0x00 0xf0 0x04 0x00 0x02 0x00
|
|
|
|
# VI: image_load v[0:1], v0, s[0:7] dmask:0x3 unorm ; encoding: [0x00,0x13,0x00,0xf0,0x00,0x00,0x00,0x00]
|
|
0x00 0x13 0x00 0xf0 0x00 0x00 0x00 0x00
|
|
|
|
# VI: image_load v0, v0, s[0:7] dmask:0x1 unorm ; encoding: [0x00,0x11,0x00,0xf0,0x00,0x00,0x00,0x00]
|
|
0x00 0x11 0x00 0xf0 0x00 0x00 0x00 0x00
|
|
|
|
# VI: image_store v[0:3], v4, s[0:7] dmask:0xf unorm ; encoding: [0x00,0x1f,0x20,0xf0,0x04,0x00,0x00,0x00]
|
|
0x00 0x1f 0x20 0xf0 0x04 0x00 0x00 0x00
|
|
|
|
# VI: image_store v[0:2], v4, s[0:7] dmask:0xe unorm ; encoding: [0x00,0x1e,0x20,0xf0,0x04,0x00,0x00,0x00]
|
|
0x00 0x1e 0x20 0xf0 0x04 0x00 0x00 0x00
|
|
|
|
# VI: image_store v[0:1], v2, s[0:7] dmask:0x3 unorm ; encoding: [0x00,0x13,0x20,0xf0,0x02,0x00,0x00,0x00]
|
|
0x00 0x13 0x20 0xf0 0x02 0x00 0x00 0x00
|
|
|
|
# VI: image_store v0, v1, s[0:7] dmask:0x1 unorm ; encoding: [0x00,0x11,0x20,0xf0,0x01,0x00,0x00,0x00]
|
|
0x00 0x11 0x20 0xf0 0x01 0x00 0x00 0x00
|
|
|
|
# Test all modifiers
|
|
# FIXME: This test is incorrect: r128 assumes a 128-bit SRSRC, but the expected output below still prints a 256-bit s[8:15].
|
|
# VI: image_load v[5:6], v1, s[8:15] dmask:0x1 unorm glc slc r128 tfe lwe da d16 ; encoding: [0x00,0xf1,0x03,0xf2,0x01,0x05,0x02,0x80]
|
|
0x00,0xf1,0x03,0xf2,0x01,0x05,0x02,0x80
|
|
|
|
# Test dmask == 0: a single vdata register is still expected, and no dmask operand is printed.
|
|
# VI: image_load v0, v4, s[8:15] unorm ; encoding: [0x00,0x10,0x00,0xf0,0x04,0x00,0x02,0x00]
|
|
0x00 0x10 0x00 0xf0 0x04 0x00 0x02 0x00
|
|
|
|
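# Test out-of-bounds register width: where dmask implies a vdata tuple running past v255, the expected output names only the starting register.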
|
|
# VI: image_load v254, v0, s[0:7] dmask:0x7 unorm ; encoding: [0x00,0x17,0x00,0xf0,0x00,0xfe,0x00,0x00]
|
|
0x00 0x17 0x00 0xf0 0x00 0xfe 0x00 0x00
|
|
|
|
# VI: image_load v255, v0, s[0:7] dmask:0x1 unorm ; encoding: [0x00,0x11,0x00,0xf0,0x00,0xff,0x00,0x00]
|
|
0x00 0x11 0x00 0xf0 0x00 0xff 0x00 0x00
|
|
|
|
# VI: image_load v255, v0, s[0:7] dmask:0x3 unorm ; encoding: [0x00,0x13,0x00,0xf0,0x00,0xff,0x00,0x00]
|
|
0x00 0x13 0x00 0xf0 0x00 0xff 0x00 0x00
|
|
|
|
#===------------------------------------------------------------------------===#
|
|
# Image load/store: packed/unpacked d16
|
|
#===------------------------------------------------------------------------===#
|
|
|
|
# GFX80: image_load v[0:1], v4, s[8:15] dmask:0x3 d16 ; encoding: [0x00,0x03,0x00,0xf0,0x04,0x00,0x02,0x80]
|
|
# GFX81: image_load v0, v4, s[8:15] dmask:0x3 d16 ; encoding: [0x00,0x03,0x00,0xf0,0x04,0x00,0x02,0x80]
|
|
0x00,0x03,0x00,0xf0,0x04,0x00,0x02,0x80
|
|
|
|
# GFX80: image_load v[0:2], v4, s[8:15] dmask:0x7 d16 ; encoding: [0x00,0x07,0x00,0xf0,0x04,0x00,0x02,0x80]
|
|
# GFX81: image_load v[0:1], v4, s[8:15] dmask:0x7 d16 ; encoding: [0x00,0x07,0x00,0xf0,0x04,0x00,0x02,0x80]
|
|
0x00,0x07,0x00,0xf0,0x04,0x00,0x02,0x80
|
|
|
|
# GFX80: image_load v[0:3], v4, s[8:15] dmask:0xf d16 ; encoding: [0x00,0x0f,0x00,0xf0,0x04,0x00,0x02,0x80]
|
|
# GFX81: image_load v[0:1], v4, s[8:15] dmask:0xf d16 ; encoding: [0x00,0x0f,0x00,0xf0,0x04,0x00,0x02,0x80]
|
|
0x00,0x0f,0x00,0xf0,0x04,0x00,0x02,0x80
|
|
|
|
# GFX80: image_store v[0:1], v4, s[8:15] dmask:0x3 d16 ; encoding: [0x00,0x03,0x20,0xf0,0x04,0x00,0x02,0x80]
|
|
# GFX81: image_store v0, v4, s[8:15] dmask:0x3 d16 ; encoding: [0x00,0x03,0x20,0xf0,0x04,0x00,0x02,0x80]
|
|
0x00,0x03,0x20,0xf0,0x04,0x00,0x02,0x80
|
|
|
|
# GFX80: image_store v[0:2], v4, s[8:15] dmask:0x7 d16 ; encoding: [0x00,0x07,0x20,0xf0,0x04,0x00,0x02,0x80]
|
|
# GFX81: image_store v[0:1], v4, s[8:15] dmask:0x7 d16 ; encoding: [0x00,0x07,0x20,0xf0,0x04,0x00,0x02,0x80]
|
|
0x00,0x07,0x20,0xf0,0x04,0x00,0x02,0x80
|
|
|
|
# GFX80: image_store v[0:3], v4, s[8:15] dmask:0xf d16 ; encoding: [0x00,0x0f,0x20,0xf0,0x04,0x00,0x02,0x80]
|
|
# GFX81: image_store v[0:1], v4, s[8:15] dmask:0xf d16 ; encoding: [0x00,0x0f,0x20,0xf0,0x04,0x00,0x02,0x80]
|
|
0x00,0x0f,0x20,0xf0,0x04,0x00,0x02,0x80
|
|
|
|
# GFX80: image_load v[0:2], v4, s[8:15] dmask:0x3 tfe d16 ; encoding: [0x00,0x03,0x01,0xf0,0x04,0x00,0x02,0x80]
|
|
# GFX81: image_load v[0:1], v4, s[8:15] dmask:0x3 tfe d16 ; encoding: [0x00,0x03,0x01,0xf0,0x04,0x00,0x02,0x80]
|
|
0x00,0x03,0x01,0xf0,0x04,0x00,0x02,0x80
|
|
|
|
# GFX80: image_load v[0:3], v4, s[8:15] dmask:0x7 tfe d16 ; encoding: [0x00,0x07,0x01,0xf0,0x04,0x00,0x02,0x80]
|
|
# GFX81: image_load v[0:2], v4, s[8:15] dmask:0x7 tfe d16 ; encoding: [0x00,0x07,0x01,0xf0,0x04,0x00,0x02,0x80]
|
|
0x00,0x07,0x01,0xf0,0x04,0x00,0x02,0x80
|
|
|
|
# GFX80: image_load v[0:4], v4, s[8:15] dmask:0xf tfe d16 ; encoding: [0x00,0x0f,0x01,0xf0,0x04,0x00,0x02,0x80]
|
|
# GFX81: image_load v[0:2], v4, s[8:15] dmask:0xf tfe d16 ; encoding: [0x00,0x0f,0x01,0xf0,0x04,0x00,0x02,0x80]
|
|
0x00,0x0f,0x01,0xf0,0x04,0x00,0x02,0x80
|
|
|
|
# GFX80: image_store v[0:2], v4, s[8:15] dmask:0x3 tfe d16 ; encoding: [0x00,0x03,0x21,0xf0,0x04,0x00,0x02,0x80]
|
|
# GFX81: image_store v[0:1], v4, s[8:15] dmask:0x3 tfe d16 ; encoding: [0x00,0x03,0x21,0xf0,0x04,0x00,0x02,0x80]
|
|
0x00,0x03,0x21,0xf0,0x04,0x00,0x02,0x80
|
|
|
|
# GFX80: image_store v[0:3], v4, s[8:15] dmask:0x7 tfe d16 ; encoding: [0x00,0x07,0x21,0xf0,0x04,0x00,0x02,0x80]
|
|
# GFX81: image_store v[0:2], v4, s[8:15] dmask:0x7 tfe d16 ; encoding: [0x00,0x07,0x21,0xf0,0x04,0x00,0x02,0x80]
|
|
0x00,0x07,0x21,0xf0,0x04,0x00,0x02,0x80
|
|
|
|
# GFX80: image_store v[0:4], v4, s[8:15] dmask:0xf tfe d16 ; encoding: [0x00,0x0f,0x21,0xf0,0x04,0x00,0x02,0x80]
|
|
# GFX81: image_store v[0:2], v4, s[8:15] dmask:0xf tfe d16 ; encoding: [0x00,0x0f,0x21,0xf0,0x04,0x00,0x02,0x80]
|
|
0x00,0x0f,0x21,0xf0,0x04,0x00,0x02,0x80
|
|
#===------------------------------------------------------------------------===#
|
|
# Image load/store: PCK variants
|
|
#===------------------------------------------------------------------------===#
|
|
|
|
# VI: image_load_mip_pck v5, v1, s[8:15] dmask:0x1 ; encoding: [0x00,0x01,0x10,0xf0,0x01,0x05,0x02,0x00]
|
|
0x00,0x01,0x10,0xf0,0x01,0x05,0x02,0x00
|
|
|
|
# VI: image_load_mip_pck v[5:6], v1, s[8:15] dmask:0x3 ; encoding: [0x00,0x03,0x10,0xf0,0x01,0x05,0x02,0x00]
|
|
0x00,0x03,0x10,0xf0,0x01,0x05,0x02,0x00
|
|
|
|
# VI: image_load_mip_pck_sgn v[5:6], v1, s[8:15] dmask:0x5 ; encoding: [0x00,0x05,0x14,0xf0,0x01,0x05,0x02,0x00]
|
|
0x00,0x05,0x14,0xf0,0x01,0x05,0x02,0x00
|
|
|
|
# VI: image_load_pck v5, v1, s[8:15] dmask:0x1 glc ; encoding: [0x00,0x21,0x08,0xf0,0x01,0x05,0x02,0x00]
|
|
0x00,0x21,0x08,0xf0,0x01,0x05,0x02,0x00
|
|
|
|
# VI: image_load_pck_sgn v5, v1, s[8:15] dmask:0x1 lwe ; encoding: [0x00,0x01,0x0e,0xf0,0x01,0x05,0x02,0x00]
|
|
0x00,0x01,0x0e,0xf0,0x01,0x05,0x02,0x00
|
|
|
|
# VI: image_store_mip_pck v252, v2, s[12:19] dmask:0x1 unorm ; encoding: [0x00,0x11,0x2c,0xf0,0x02,0xfc,0x03,0x00]
|
|
0x00,0x11,0x2c,0xf0,0x02,0xfc,0x03,0x00
|
|
|
|
# VI: image_store_mip_pck v1, v2, s[12:19] dmask:0x1 unorm glc slc lwe da ; encoding: [0x00,0x71,0x2e,0xf2,0x02,0x01,0x03,0x00]
|
|
0x00,0x71,0x2e,0xf2,0x02,0x01,0x03,0x00
|
|
|
|
# VI: image_store_pck v1, v2, s[12:19] dmask:0x1 unorm da ; encoding: [0x00,0x51,0x28,0xf0,0x02,0x01,0x03,0x00]
|
|
0x00,0x51,0x28,0xf0,0x02,0x01,0x03,0x00
|
|
|
|
#===------------------------------------------------------------------------===#
|
|
# Image sample
|
|
#===------------------------------------------------------------------------===#
|
|
|
|
# VI: image_sample v[193:195], v237, s[28:35], s[4:7] dmask:0x7 unorm ; encoding: [0x00,0x17,0x80,0xf0,0xed,0xc1,0x27,0x00]
|
|
0x00,0x17,0x80,0xf0,0xed,0xc1,0x27,0x00
|
|
|
|
# GFX80: image_sample v[193:194], v237, s[28:35], s[4:7] dmask:0x3 d16 ; encoding: [0x00,0x03,0x80,0xf0,0xed,0xc1,0x27,0x80]
|
|
# GFX81: image_sample v193, v237, s[28:35], s[4:7] dmask:0x3 d16 ; encoding: [0x00,0x03,0x80,0xf0,0xed,0xc1,0x27,0x80]
|
|
0x00,0x03,0x80,0xf0,0xed,0xc1,0x27,0x80
|
|
|
|
# GFX80: image_sample v[193:195], v237, s[28:35], s[4:7] dmask:0x7 d16 ; encoding: [0x00,0x07,0x80,0xf0,0xed,0xc1,0x27,0x80]
|
|
# GFX81: image_sample v[193:194], v237, s[28:35], s[4:7] dmask:0x7 d16 ; encoding: [0x00,0x07,0x80,0xf0,0xed,0xc1,0x27,0x80]
|
|
0x00,0x07,0x80,0xf0,0xed,0xc1,0x27,0x80
|
|
|
|
# GFX80: image_sample v[193:196], v237, s[28:35], s[4:7] dmask:0xf d16 ; encoding: [0x00,0x0f,0x80,0xf0,0xed,0xc1,0x27,0x80]
|
|
# GFX81: image_sample v[193:194], v237, s[28:35], s[4:7] dmask:0xf d16 ; encoding: [0x00,0x0f,0x80,0xf0,0xed,0xc1,0x27,0x80]
|
|
0x00,0x0f,0x80,0xf0,0xed,0xc1,0x27,0x80
|
|
|
|
#===------------------------------------------------------------------------===#
|
|
# Image atomics
|
|
#===------------------------------------------------------------------------===#
|
|
|
|
# VI: image_atomic_add v5, v1, s[8:15] dmask:0x1 unorm ; encoding: [0x00,0x11,0x48,0xf0,0x01,0x05,0x02,0x00]
|
|
0x00,0x11,0x48,0xf0,0x01,0x05,0x02,0x00
|
|
|
|
# VI: image_atomic_add v252, v1, s[8:15] dmask:0x1 unorm ; encoding: [0x00,0x11,0x48,0xf0,0x01,0xfc,0x02,0x00]
|
|
0x00,0x11,0x48,0xf0,0x01,0xfc,0x02,0x00
|
|
|
|
# VI: image_atomic_add v5, v255, s[8:15] dmask:0x1 unorm ; encoding: [0x00,0x11,0x48,0xf0,0xff,0x05,0x02,0x00]
|
|
0x00,0x11,0x48,0xf0,0xff,0x05,0x02,0x00
|
|
|
|
# VI: image_atomic_add v5, v1, s[92:99] dmask:0x1 unorm ; encoding: [0x00,0x11,0x48,0xf0,0x01,0x05,0x17,0x00]
|
|
0x00,0x11,0x48,0xf0,0x01,0x05,0x17,0x00
|
|
|
|
# VI: image_atomic_add v5, v1, s[8:15] dmask:0x1 unorm glc ; encoding: [0x00,0x31,0x48,0xf0,0x01,0x05,0x02,0x00]
|
|
0x00,0x31,0x48,0xf0,0x01,0x05,0x02,0x00
|
|
|
|
# VI: image_atomic_add v5, v1, s[8:15] dmask:0x1 unorm slc ; encoding: [0x00,0x11,0x48,0xf2,0x01,0x05,0x02,0x00]
|
|
0x00,0x11,0x48,0xf2,0x01,0x05,0x02,0x00
|
|
|
|
# VI: image_atomic_add v5, v1, s[8:15] dmask:0x1 unorm lwe ; encoding: [0x00,0x11,0x4a,0xf0,0x01,0x05,0x02,0x00]
|
|
0x00,0x11,0x4a,0xf0,0x01,0x05,0x02,0x00
|
|
|
|
# VI: image_atomic_add v5, v1, s[8:15] dmask:0x1 unorm da ; encoding: [0x00,0x51,0x48,0xf0,0x01,0x05,0x02,0x00]
|
|
0x00,0x51,0x48,0xf0,0x01,0x05,0x02,0x00
|
|
|
|
# VI: image_atomic_add v[5:6], v1, s[8:15] dmask:0x3 unorm ; encoding: [0x00,0x13,0x48,0xf0,0x01,0x05,0x02,0x00]
|
|
0x00,0x13,0x48,0xf0,0x01,0x05,0x02,0x00
|
|
|
|
# VI: image_atomic_cmpswap v[5:6], v1, s[8:15] dmask:0x3 unorm ; encoding: [0x00,0x13,0x44,0xf0,0x01,0x05,0x02,0x00]
|
|
0x00,0x13,0x44,0xf0,0x01,0x05,0x02,0x00
|
|
|
|
# VI: image_atomic_cmpswap v[5:8], v1, s[8:15] dmask:0xf unorm ; encoding: [0x00,0x1f,0x44,0xf0,0x01,0x05,0x02,0x00]
|
|
0x00,0x1f,0x44,0xf0,0x01,0x05,0x02,0x00
|
|
|
|
#===------------------------------------------------------------------------===#
|
|
# Invalid image atomics (incorrect dmask value; the valid tests above use 0x1/0x3 for image_atomic_add and 0x3/0xf for image_atomic_cmpswap).
|
|
# Disassembler may produce a partially incorrect instruction but should not fail.
|
|
#===------------------------------------------------------------------------===#
|
|
|
|
# VI: image_atomic_add v5, v1, s[8:15] dmask:0x2 unorm ; encoding: [0x00,0x12,0x48,0xf0,0x01,0x05,0x02,0x00]
|
|
0x00,0x12,0x48,0xf0,0x01,0x05,0x02,0x00
|
|
|
|
# VI: image_atomic_add v5, v1, s[8:15] dmask:0x7 unorm ; encoding: [0x00,0x17,0x48,0xf0,0x01,0x05,0x02,0x00]
|
|
0x00,0x17,0x48,0xf0,0x01,0x05,0x02,0x00
|
|
|
|
# VI: image_atomic_add v5, v1, s[8:15] dmask:0xf unorm ; encoding: [0x00,0x1f,0x48,0xf0,0x01,0x05,0x02,0x00]
|
|
0x00,0x1f,0x48,0xf0,0x01,0x05,0x02,0x00
|
|
|
|
# VI: image_atomic_cmpswap v[5:6], v1, s[8:15] unorm ; encoding: [0x00,0x10,0x44,0xf0,0x01,0x05,0x02,0x00]
|
|
0x00,0x10,0x44,0xf0,0x01,0x05,0x02,0x00
|
|
|
|
# VI: image_atomic_cmpswap v[5:6], v1, s[8:15] dmask:0x1 unorm ; encoding: [0x00,0x11,0x44,0xf0,0x01,0x05,0x02,0x00]
|
|
0x00,0x11,0x44,0xf0,0x01,0x05,0x02,0x00
|
|
|
|
# VI: image_atomic_cmpswap v[5:6], v1, s[8:15] dmask:0xe unorm ; encoding: [0x00,0x1e,0x44,0xf0,0x01,0x05,0x02,0x00]
|
|
0x00,0x1e,0x44,0xf0,0x01,0x05,0x02,0x00
|
|
|
|
#===------------------------------------------------------------------------===#
|
|
# Image gather
|
|
#===------------------------------------------------------------------------===#
|
|
|
|
# VI: image_gather4 v[252:255], v1, s[8:15], s[12:15] dmask:0x1 ; encoding: [0x00,0x01,0x00,0xf1,0x01,0xfc,0x62,0x00]
|
|
0x00,0x01,0x00,0xf1,0x01,0xfc,0x62,0x00
|
|
|
|
# VI: image_gather4 v[5:8], v1, s[8:15], s[12:15] dmask:0x2 ; encoding: [0x00,0x02,0x00,0xf1,0x01,0x05,0x62,0x00]
|
|
0x00,0x02,0x00,0xf1,0x01,0x05,0x62,0x00
|
|
|
|
# VI: image_gather4 v[5:8], v1, s[8:15], s[12:15] dmask:0x4 ; encoding: [0x00,0x04,0x00,0xf1,0x01,0x05,0x62,0x00]
|
|
0x00,0x04,0x00,0xf1,0x01,0x05,0x62,0x00
|
|
|
|
# VI: image_gather4 v[5:8], v1, s[8:15], s[12:15] dmask:0x8 ; encoding: [0x00,0x08,0x00,0xf1,0x01,0x05,0x62,0x00]
|
|
0x00,0x08,0x00,0xf1,0x01,0x05,0x62,0x00
|
|
|
|
# GFX80: image_gather4 v[252:255], v1, s[8:15], s[12:15] dmask:0x1 unorm glc slc lwe da d16 ; encoding: [0x00,0x71,0x02,0xf3,0x01,0xfc,0x62,0x80]
|
|
# GFX81: image_gather4 v[252:253], v1, s[8:15], s[12:15] dmask:0x1 unorm glc slc lwe da d16 ; encoding: [0x00,0x71,0x02,0xf3,0x01,0xfc,0x62,0x80]
|
|
0x00,0x71,0x02,0xf3,0x01,0xfc,0x62,0x80
|
|
|
|
#===------------------------------------------------------------------------===#
|
|
# Invalid image gather (dmask with more than one bit set, or tfe).
|
|
# Disassembler may produce a partially incorrect instruction but should not fail.
|
|
#===------------------------------------------------------------------------===#
|
|
|
|
# VI: image_gather4 v[252:255], v1, s[8:15], s[12:15] dmask:0x3 ; encoding: [0x00,0x03,0x00,0xf1,0x01,0xfc,0x62,0x00]
|
|
0x00,0x03,0x00,0xf1,0x01,0xfc,0x62,0x00
|
|
|
|
# VI: image_gather4 v[252:255], v1, s[8:15], s[12:15] dmask:0x1 unorm glc slc tfe lwe da ; encoding: [0x00,0x71,0x03,0xf3,0x01,0xfc,0x62,0x00]
|
|
0x00,0x71,0x03,0xf3,0x01,0xfc,0x62,0x00
|