; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc -global-isel -march=amdgcn -mcpu=verde -verify-machineinstrs -show-mc-encoding < %s | FileCheck -check-prefixes=GFX6 %s
; RUN: llc -global-isel -march=amdgcn -mcpu=tonga -verify-machineinstrs -show-mc-encoding < %s | FileCheck -check-prefixes=GFX789 %s
; RUN: llc -global-isel -march=amdgcn -mcpu=gfx900 -verify-machineinstrs -show-mc-encoding < %s | FileCheck -check-prefixes=GFX789 %s
; RUN: llc -global-isel -march=amdgcn -mcpu=gfx1010 -verify-machineinstrs -show-mc-encoding < %s | FileCheck -check-prefixes=GFX10 %s
|
|
|
|
; FIXME: This test has a DAG duplicate

; Immediate values (first operand of llvm.amdgcn.s.setreg):
;   (mode register ID = 1) | (Offset << 6) | ((Width - 1) << 11)
; Offset: fp_round = 0, fp_denorm = 4, dx10_clamp = 8, ieee_mode = 9
; Example: 2049 = 1 | (0 << 6) | ((2 - 1) << 11), i.e. offset 0, width 2.
|
|
|
|
|
|
; FP32 rounding: write the constant 3 (round to zero) into the two-bit
; field at offset 0 of the MODE register.
; Immediate 2049 = 1 | (0 << 6) | ((2 - 1) << 11).
define amdgpu_kernel void @test_setreg_f32_round_mode_rtz() {
; GFX6-LABEL: test_setreg_f32_round_mode_rtz:
; GFX6:       ; %bb.0:
; GFX6-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 2), 3 ; encoding: [0x01,0x08,0x80,0xba,0x03,0x00,0x00,0x00]
; GFX6-NEXT:    ;;#ASMSTART
; GFX6-NEXT:    ;;#ASMEND
; GFX6-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_f32_round_mode_rtz:
; GFX789:       ; %bb.0:
; GFX789-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 2), 3 ; encoding: [0x01,0x08,0x00,0xba,0x03,0x00,0x00,0x00]
; GFX789-NEXT:    ;;#ASMSTART
; GFX789-NEXT:    ;;#ASMEND
; GFX789-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_f32_round_mode_rtz:
; GFX10:       ; %bb.0:
; GFX10-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 2), 3 ; encoding: [0x01,0x08,0x80,0xba,0x03,0x00,0x00,0x00]
; GFX10-NEXT:    ;;#ASMSTART
; GFX10-NEXT:    ;;#ASMEND
; GFX10-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 2049, i32 3)
  ; Empty side-effecting asm: the expected output places the markers after the setreg.
  call void asm sideeffect "", ""()
  ret void
}
|
|
|
|
; FP64/FP16 rounding: write the constant 3 (round to zero) into the
; two-bit field at offset 2 of the MODE register.
; Immediate 2177 = 1 | (2 << 6) | ((2 - 1) << 11).
define amdgpu_kernel void @test_setreg_f64_round_mode_rtz() {
; GFX6-LABEL: test_setreg_f64_round_mode_rtz:
; GFX6:       ; %bb.0:
; GFX6-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 2, 2), 3 ; encoding: [0x81,0x08,0x80,0xba,0x03,0x00,0x00,0x00]
; GFX6-NEXT:    ;;#ASMSTART
; GFX6-NEXT:    ;;#ASMEND
; GFX6-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_f64_round_mode_rtz:
; GFX789:       ; %bb.0:
; GFX789-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 2, 2), 3 ; encoding: [0x81,0x08,0x00,0xba,0x03,0x00,0x00,0x00]
; GFX789-NEXT:    ;;#ASMSTART
; GFX789-NEXT:    ;;#ASMEND
; GFX789-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_f64_round_mode_rtz:
; GFX10:       ; %bb.0:
; GFX10-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 2, 2), 3 ; encoding: [0x81,0x08,0x80,0xba,0x03,0x00,0x00,0x00]
; GFX10-NEXT:    ;;#ASMSTART
; GFX10-NEXT:    ;;#ASMEND
; GFX10-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 2177, i32 3)
  ; Empty side-effecting asm: the expected output places the markers after the setreg.
  call void asm sideeffect "", ""()
  ret void
}
|
|
|
|
; Set the whole fp_round field (offset 0, width 4: both the FP32 pair and
; the FP64/FP16 pair) with a single constant write.
; Immediate 6145 = 1 | (0 << 6) | ((4 - 1) << 11).
; The previous immediate, 6273, decoded to offset 2 / width 4, which spans
; the FP64/FP16 round bits and the FP32 denorm bits rather than "all
; fp_round".
; NOTE(review): the value 7 is 0b0111, so only the low pair is 0b11; confirm
; whether 15 was intended for "round to zero" in both pairs.
define amdgpu_kernel void @test_setreg_all_round_mode_rtz() {
; GFX6-LABEL: test_setreg_all_round_mode_rtz:
; GFX6:       ; %bb.0:
; GFX6-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 4), 7 ; encoding: [0x01,0x18,0x80,0xba,0x07,0x00,0x00,0x00]
; GFX6-NEXT:    ;;#ASMSTART
; GFX6-NEXT:    ;;#ASMEND
; GFX6-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_all_round_mode_rtz:
; GFX789:       ; %bb.0:
; GFX789-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 4), 7 ; encoding: [0x01,0x18,0x00,0xba,0x07,0x00,0x00,0x00]
; GFX789-NEXT:    ;;#ASMSTART
; GFX789-NEXT:    ;;#ASMEND
; GFX789-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_all_round_mode_rtz:
; GFX10:       ; %bb.0:
; GFX10-NEXT:    s_round_mode 0x7 ; encoding: [0x07,0x00,0xa4,0xbf]
; GFX10-NEXT:    ;;#ASMSTART
; GFX10-NEXT:    ;;#ASMEND
; GFX10-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 6145, i32 7)
  ; Empty side-effecting asm: the expected output places the markers after the mode write.
  call void asm sideeffect "", ""()
  ret void
}
|
|
|
|
; FP32 rounding from a runtime value: %var.mode is an inreg argument and the
; expected output feeds it to s_setreg_b32 as s0 (non-immediate form).
; Immediate 2049 = 1 | (0 << 6) | ((2 - 1) << 11).
define amdgpu_cs void @test_setreg_roundingmode_var(i32 inreg %var.mode) {
; GFX6-LABEL: test_setreg_roundingmode_var:
; GFX6:       ; %bb.0:
; GFX6-NEXT:    s_setreg_b32 hwreg(HW_REG_MODE, 0, 2), s0 ; encoding: [0x01,0x08,0x80,0xb9]
; GFX6-NEXT:    ;;#ASMSTART
; GFX6-NEXT:    ;;#ASMEND
; GFX6-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_roundingmode_var:
; GFX789:       ; %bb.0:
; GFX789-NEXT:    s_setreg_b32 hwreg(HW_REG_MODE, 0, 2), s0 ; encoding: [0x01,0x08,0x00,0xb9]
; GFX789-NEXT:    ;;#ASMSTART
; GFX789-NEXT:    ;;#ASMEND
; GFX789-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_roundingmode_var:
; GFX10:       ; %bb.0:
; GFX10-NEXT:    s_setreg_b32 hwreg(HW_REG_MODE, 0, 2), s0 ; encoding: [0x01,0x08,0x80,0xb9]
; GFX10-NEXT:    ;;#ASMSTART
; GFX10-NEXT:    ;;#ASMEND
; GFX10-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 2049, i32 %var.mode)
  ; Empty side-effecting asm: the expected output places the markers after the setreg.
  call void asm sideeffect "", ""()
  ret void
}
|
|
|
|
; Clear the one-bit ieee_mode field (offset 9) with a constant 0.
; Immediate 577 = 1 | (9 << 6) | ((1 - 1) << 11).
define amdgpu_kernel void @test_setreg_ieee_mode_off() {
; GFX6-LABEL: test_setreg_ieee_mode_off:
; GFX6:       ; %bb.0:
; GFX6-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 9, 1), 0 ; encoding: [0x41,0x02,0x80,0xba,0x00,0x00,0x00,0x00]
; GFX6-NEXT:    ;;#ASMSTART
; GFX6-NEXT:    ;;#ASMEND
; GFX6-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_ieee_mode_off:
; GFX789:       ; %bb.0:
; GFX789-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 9, 1), 0 ; encoding: [0x41,0x02,0x00,0xba,0x00,0x00,0x00,0x00]
; GFX789-NEXT:    ;;#ASMSTART
; GFX789-NEXT:    ;;#ASMEND
; GFX789-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_ieee_mode_off:
; GFX10:       ; %bb.0:
; GFX10-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 9, 1), 0 ; encoding: [0x41,0x02,0x80,0xba,0x00,0x00,0x00,0x00]
; GFX10-NEXT:    ;;#ASMSTART
; GFX10-NEXT:    ;;#ASMEND
; GFX10-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 577, i32 0)
  ; Empty side-effecting asm: the expected output places the markers after the setreg.
  call void asm sideeffect "", ""()
  ret void
}
|
|
|
|
; Set the one-bit ieee_mode field (offset 9) with a constant 1.
; Immediate 577 = 1 | (9 << 6) | ((1 - 1) << 11).
define amdgpu_kernel void @test_setreg_ieee_mode_on() {
; GFX6-LABEL: test_setreg_ieee_mode_on:
; GFX6:       ; %bb.0:
; GFX6-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 9, 1), 1 ; encoding: [0x41,0x02,0x80,0xba,0x01,0x00,0x00,0x00]
; GFX6-NEXT:    ;;#ASMSTART
; GFX6-NEXT:    ;;#ASMEND
; GFX6-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_ieee_mode_on:
; GFX789:       ; %bb.0:
; GFX789-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 9, 1), 1 ; encoding: [0x41,0x02,0x00,0xba,0x01,0x00,0x00,0x00]
; GFX789-NEXT:    ;;#ASMSTART
; GFX789-NEXT:    ;;#ASMEND
; GFX789-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_ieee_mode_on:
; GFX10:       ; %bb.0:
; GFX10-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 9, 1), 1 ; encoding: [0x41,0x02,0x80,0xba,0x01,0x00,0x00,0x00]
; GFX10-NEXT:    ;;#ASMSTART
; GFX10-NEXT:    ;;#ASMEND
; GFX10-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 577, i32 1)
  ; Empty side-effecting asm: the expected output places the markers after the setreg.
  call void asm sideeffect "", ""()
  ret void
}
|
|
|
|
; Clear the one-bit dx10_clamp field (offset 8) with a constant 0.
; Immediate 513 = 1 | (8 << 6) | ((1 - 1) << 11).
define amdgpu_kernel void @test_setreg_dx10_clamp_off() {
; GFX6-LABEL: test_setreg_dx10_clamp_off:
; GFX6:       ; %bb.0:
; GFX6-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 8, 1), 0 ; encoding: [0x01,0x02,0x80,0xba,0x00,0x00,0x00,0x00]
; GFX6-NEXT:    ;;#ASMSTART
; GFX6-NEXT:    ;;#ASMEND
; GFX6-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_dx10_clamp_off:
; GFX789:       ; %bb.0:
; GFX789-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 8, 1), 0 ; encoding: [0x01,0x02,0x00,0xba,0x00,0x00,0x00,0x00]
; GFX789-NEXT:    ;;#ASMSTART
; GFX789-NEXT:    ;;#ASMEND
; GFX789-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_dx10_clamp_off:
; GFX10:       ; %bb.0:
; GFX10-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 8, 1), 0 ; encoding: [0x01,0x02,0x80,0xba,0x00,0x00,0x00,0x00]
; GFX10-NEXT:    ;;#ASMSTART
; GFX10-NEXT:    ;;#ASMEND
; GFX10-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 513, i32 0)
  ; Empty side-effecting asm: the expected output places the markers after the setreg.
  call void asm sideeffect "", ""()
  ret void
}
|
|
|
|
; Set the one-bit dx10_clamp field (offset 8) with a constant 1.
; Immediate 513 = 1 | (8 << 6) | ((1 - 1) << 11).
define amdgpu_kernel void @test_setreg_dx10_clamp_on() {
; GFX6-LABEL: test_setreg_dx10_clamp_on:
; GFX6:       ; %bb.0:
; GFX6-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 8, 1), 1 ; encoding: [0x01,0x02,0x80,0xba,0x01,0x00,0x00,0x00]
; GFX6-NEXT:    ;;#ASMSTART
; GFX6-NEXT:    ;;#ASMEND
; GFX6-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_dx10_clamp_on:
; GFX789:       ; %bb.0:
; GFX789-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 8, 1), 1 ; encoding: [0x01,0x02,0x00,0xba,0x01,0x00,0x00,0x00]
; GFX789-NEXT:    ;;#ASMSTART
; GFX789-NEXT:    ;;#ASMEND
; GFX789-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_dx10_clamp_on:
; GFX10:       ; %bb.0:
; GFX10-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 8, 1), 1 ; encoding: [0x01,0x02,0x80,0xba,0x01,0x00,0x00,0x00]
; GFX10-NEXT:    ;;#ASMSTART
; GFX10-NEXT:    ;;#ASMEND
; GFX10-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 513, i32 1)
  ; Empty side-effecting asm: the expected output places the markers after the setreg.
  call void asm sideeffect "", ""()
  ret void
}
|
|
|
|
; Runtime write covering both the fp_round and fp_denorm fields in one go
; (offset 0, width 8). %mode arrives inreg and is expected in s0.
; Immediate 14337 = 1 | (0 << 6) | ((8 - 1) << 11).
define amdgpu_cs void @test_setreg_full_both_round_mode_and_denorm_mode(i32 inreg %mode) {
; GFX6-LABEL: test_setreg_full_both_round_mode_and_denorm_mode:
; GFX6:       ; %bb.0:
; GFX6-NEXT:    s_setreg_b32 hwreg(HW_REG_MODE, 0, 8), s0 ; encoding: [0x01,0x38,0x80,0xb9]
; GFX6-NEXT:    ;;#ASMSTART
; GFX6-NEXT:    ;;#ASMEND
; GFX6-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_full_both_round_mode_and_denorm_mode:
; GFX789:       ; %bb.0:
; GFX789-NEXT:    s_setreg_b32 hwreg(HW_REG_MODE, 0, 8), s0 ; encoding: [0x01,0x38,0x00,0xb9]
; GFX789-NEXT:    ;;#ASMSTART
; GFX789-NEXT:    ;;#ASMEND
; GFX789-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_full_both_round_mode_and_denorm_mode:
; GFX10:       ; %bb.0:
; GFX10-NEXT:    s_setreg_b32 hwreg(HW_REG_MODE, 0, 8), s0 ; encoding: [0x01,0x38,0x80,0xb9]
; GFX10-NEXT:    ;;#ASMSTART
; GFX10-NEXT:    ;;#ASMEND
; GFX10-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 14337, i32 inreg %mode)
  ; Empty side-effecting asm: the expected output places the markers after the setreg.
  call void asm sideeffect "", ""()
  ret void
}
|
|
|
|
; Constant write of width 7 from offset 0: one bit short of the combined
; round + denorm range, so the last denorm bit is left out. All three
; expectation groups keep the s_setreg_imm32_b32 form.
; Immediate 12289 = 1 | (0 << 6) | ((7 - 1) << 11).
define amdgpu_cs void @test_setreg_most_both_round_mode_and_denorm_mode() {
; GFX6-LABEL: test_setreg_most_both_round_mode_and_denorm_mode:
; GFX6:       ; %bb.0:
; GFX6-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 7), 6 ; encoding: [0x01,0x30,0x80,0xba,0x06,0x00,0x00,0x00]
; GFX6-NEXT:    ;;#ASMSTART
; GFX6-NEXT:    ;;#ASMEND
; GFX6-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_most_both_round_mode_and_denorm_mode:
; GFX789:       ; %bb.0:
; GFX789-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 7), 6 ; encoding: [0x01,0x30,0x00,0xba,0x06,0x00,0x00,0x00]
; GFX789-NEXT:    ;;#ASMSTART
; GFX789-NEXT:    ;;#ASMEND
; GFX789-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_most_both_round_mode_and_denorm_mode:
; GFX10:       ; %bb.0:
; GFX10-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 7), 6 ; encoding: [0x01,0x30,0x80,0xba,0x06,0x00,0x00,0x00]
; GFX10-NEXT:    ;;#ASMSTART
; GFX10-NEXT:    ;;#ASMEND
; GFX10-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 12289, i32 6)
  ; Empty side-effecting asm: the expected output places the markers after the setreg.
  call void asm sideeffect "", ""()
  ret void
}
|
|
|
|
; Constant write of width 3 starting at offset 1, i.e. MODE bits [3:1].
; The range skips bit 0 and ends before offset 4, where the file's offset
; legend places fp_denorm.
; NOTE(review): the previous comment said "does not cover first bit of
; denorm field", but this range never reaches the denorm field; confirm
; the intended coverage.
; Immediate 4161 = 1 | (1 << 6) | ((3 - 1) << 11).
define amdgpu_cs void @test_setreg_most_both_round_mode_and_denorm_mode_6() {
; GFX6-LABEL: test_setreg_most_both_round_mode_and_denorm_mode_6:
; GFX6:       ; %bb.0:
; GFX6-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 1, 3), 6 ; encoding: [0x41,0x10,0x80,0xba,0x06,0x00,0x00,0x00]
; GFX6-NEXT:    ;;#ASMSTART
; GFX6-NEXT:    ;;#ASMEND
; GFX6-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_most_both_round_mode_and_denorm_mode_6:
; GFX789:       ; %bb.0:
; GFX789-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 1, 3), 6 ; encoding: [0x41,0x10,0x00,0xba,0x06,0x00,0x00,0x00]
; GFX789-NEXT:    ;;#ASMSTART
; GFX789-NEXT:    ;;#ASMEND
; GFX789-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_most_both_round_mode_and_denorm_mode_6:
; GFX10:       ; %bb.0:
; GFX10-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 1, 3), 6 ; encoding: [0x41,0x10,0x80,0xba,0x06,0x00,0x00,0x00]
; GFX10-NEXT:    ;;#ASMSTART
; GFX10-NEXT:    ;;#ASMEND
; GFX10-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 4161, i32 6)
  ; Empty side-effecting asm: the expected output places the markers after the setreg.
  call void asm sideeffect "", ""()
  ret void
}
|
|
|
|
; Runtime write to the two-bit field at offset 4 (start of fp_denorm).
; %val arrives inreg and is expected in s0.
; Immediate 2305 = 1 | (4 << 6) | ((2 - 1) << 11).
define amdgpu_cs void @test_setreg_f32_denorm_mode(i32 inreg %val) {
; GFX6-LABEL: test_setreg_f32_denorm_mode:
; GFX6:       ; %bb.0:
; GFX6-NEXT:    s_setreg_b32 hwreg(HW_REG_MODE, 4, 2), s0 ; encoding: [0x01,0x09,0x80,0xb9]
; GFX6-NEXT:    ;;#ASMSTART
; GFX6-NEXT:    ;;#ASMEND
; GFX6-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_f32_denorm_mode:
; GFX789:       ; %bb.0:
; GFX789-NEXT:    s_setreg_b32 hwreg(HW_REG_MODE, 4, 2), s0 ; encoding: [0x01,0x09,0x00,0xb9]
; GFX789-NEXT:    ;;#ASMSTART
; GFX789-NEXT:    ;;#ASMEND
; GFX789-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_f32_denorm_mode:
; GFX10:       ; %bb.0:
; GFX10-NEXT:    s_setreg_b32 hwreg(HW_REG_MODE, 4, 2), s0 ; encoding: [0x01,0x09,0x80,0xb9]
; GFX10-NEXT:    ;;#ASMSTART
; GFX10-NEXT:    ;;#ASMEND
; GFX10-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 2305, i32 %val)
  ; Empty side-effecting asm: the expected output places the markers after the setreg.
  call void asm sideeffect "", ""()
  ret void
}
|
|
|
|
; Runtime write to the two-bit field at offset 6 (upper half of fp_denorm).
; %val arrives inreg and is expected in s0.
; Immediate 2433 = 1 | (6 << 6) | ((2 - 1) << 11).
define amdgpu_cs void @test_setreg_f64_denorm_mode(i32 inreg %val) {
; GFX6-LABEL: test_setreg_f64_denorm_mode:
; GFX6:       ; %bb.0:
; GFX6-NEXT:    s_setreg_b32 hwreg(HW_REG_MODE, 6, 2), s0 ; encoding: [0x81,0x09,0x80,0xb9]
; GFX6-NEXT:    ;;#ASMSTART
; GFX6-NEXT:    ;;#ASMEND
; GFX6-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_f64_denorm_mode:
; GFX789:       ; %bb.0:
; GFX789-NEXT:    s_setreg_b32 hwreg(HW_REG_MODE, 6, 2), s0 ; encoding: [0x81,0x09,0x00,0xb9]
; GFX789-NEXT:    ;;#ASMSTART
; GFX789-NEXT:    ;;#ASMEND
; GFX789-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_f64_denorm_mode:
; GFX10:       ; %bb.0:
; GFX10-NEXT:    s_setreg_b32 hwreg(HW_REG_MODE, 6, 2), s0 ; encoding: [0x81,0x09,0x80,0xb9]
; GFX10-NEXT:    ;;#ASMSTART
; GFX10-NEXT:    ;;#ASMEND
; GFX10-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 2433, i32 %val)
  ; Empty side-effecting asm: the expected output places the markers after the setreg.
  call void asm sideeffect "", ""()
  ret void
}
|
|
|
|
; Runtime four-bit write; %val arrives inreg and is expected in s0.
; Immediate 6145 = 1 | (0 << 6) | ((4 - 1) << 11), i.e. offset 0, width 4.
; NOTE(review): despite the "denorm" in the name, offset 0 is where the
; file's offset legend places fp_round; the full denorm field would be
; 6401 (offset 4, width 4). Confirm which field this test is meant to cover.
define amdgpu_cs void @test_setreg_full_denorm_mode(i32 inreg %val) {
; GFX6-LABEL: test_setreg_full_denorm_mode:
; GFX6:       ; %bb.0:
; GFX6-NEXT:    s_setreg_b32 hwreg(HW_REG_MODE, 0, 4), s0 ; encoding: [0x01,0x18,0x80,0xb9]
; GFX6-NEXT:    ;;#ASMSTART
; GFX6-NEXT:    ;;#ASMEND
; GFX6-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_full_denorm_mode:
; GFX789:       ; %bb.0:
; GFX789-NEXT:    s_setreg_b32 hwreg(HW_REG_MODE, 0, 4), s0 ; encoding: [0x01,0x18,0x00,0xb9]
; GFX789-NEXT:    ;;#ASMSTART
; GFX789-NEXT:    ;;#ASMEND
; GFX789-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_full_denorm_mode:
; GFX10:       ; %bb.0:
; GFX10-NEXT:    s_setreg_b32 hwreg(HW_REG_MODE, 0, 4), s0 ; encoding: [0x01,0x18,0x80,0xb9]
; GFX10-NEXT:    ;;#ASMSTART
; GFX10-NEXT:    ;;#ASMEND
; GFX10-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 6145, i32 %val)
  ; Empty side-effecting asm: the expected output places the markers after the setreg.
  call void asm sideeffect "", ""()
  ret void
}
|
|
|
|
; Constant 0 written to the full fp_round field (offset 0, width 4).
; The gfx10 expectations use the dedicated s_round_mode instruction; the
; older targets keep s_setreg_imm32_b32.
; Immediate 6145 = 1 | (0 << 6) | ((4 - 1) << 11).
define amdgpu_kernel void @test_setreg_full_round_mode_0() {
; GFX6-LABEL: test_setreg_full_round_mode_0:
; GFX6:       ; %bb.0:
; GFX6-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 4), 0 ; encoding: [0x01,0x18,0x80,0xba,0x00,0x00,0x00,0x00]
; GFX6-NEXT:    ;;#ASMSTART
; GFX6-NEXT:    ;;#ASMEND
; GFX6-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_full_round_mode_0:
; GFX789:       ; %bb.0:
; GFX789-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 4), 0 ; encoding: [0x01,0x18,0x00,0xba,0x00,0x00,0x00,0x00]
; GFX789-NEXT:    ;;#ASMSTART
; GFX789-NEXT:    ;;#ASMEND
; GFX789-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_full_round_mode_0:
; GFX10:       ; %bb.0:
; GFX10-NEXT:    s_round_mode 0x0 ; encoding: [0x00,0x00,0xa4,0xbf]
; GFX10-NEXT:    ;;#ASMSTART
; GFX10-NEXT:    ;;#ASMEND
; GFX10-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 6145, i32 0)
  ; Empty side-effecting asm: the expected output places the markers after the mode write.
  call void asm sideeffect "", ""()
  ret void
}
|
|
|
|
; Constant 1 written to the full fp_round field (offset 0, width 4).
; The gfx10 expectations use the dedicated s_round_mode instruction; the
; older targets keep s_setreg_imm32_b32.
; Immediate 6145 = 1 | (0 << 6) | ((4 - 1) << 11).
define amdgpu_kernel void @test_setreg_full_round_mode_1() {
; GFX6-LABEL: test_setreg_full_round_mode_1:
; GFX6:       ; %bb.0:
; GFX6-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 4), 1 ; encoding: [0x01,0x18,0x80,0xba,0x01,0x00,0x00,0x00]
; GFX6-NEXT:    ;;#ASMSTART
; GFX6-NEXT:    ;;#ASMEND
; GFX6-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_full_round_mode_1:
; GFX789:       ; %bb.0:
; GFX789-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 4), 1 ; encoding: [0x01,0x18,0x00,0xba,0x01,0x00,0x00,0x00]
; GFX789-NEXT:    ;;#ASMSTART
; GFX789-NEXT:    ;;#ASMEND
; GFX789-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_full_round_mode_1:
; GFX10:       ; %bb.0:
; GFX10-NEXT:    s_round_mode 0x1 ; encoding: [0x01,0x00,0xa4,0xbf]
; GFX10-NEXT:    ;;#ASMSTART
; GFX10-NEXT:    ;;#ASMEND
; GFX10-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 6145, i32 1)
  ; Empty side-effecting asm: the expected output places the markers after the mode write.
  call void asm sideeffect "", ""()
  ret void
}
|
|
|
|
; Constant 2 written to the full fp_round field (offset 0, width 4).
; The gfx10 expectations use the dedicated s_round_mode instruction; the
; older targets keep s_setreg_imm32_b32.
; Immediate 6145 = 1 | (0 << 6) | ((4 - 1) << 11).
define amdgpu_kernel void @test_setreg_full_round_mode_2() {
; GFX6-LABEL: test_setreg_full_round_mode_2:
; GFX6:       ; %bb.0:
; GFX6-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 4), 2 ; encoding: [0x01,0x18,0x80,0xba,0x02,0x00,0x00,0x00]
; GFX6-NEXT:    ;;#ASMSTART
; GFX6-NEXT:    ;;#ASMEND
; GFX6-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_full_round_mode_2:
; GFX789:       ; %bb.0:
; GFX789-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 4), 2 ; encoding: [0x01,0x18,0x00,0xba,0x02,0x00,0x00,0x00]
; GFX789-NEXT:    ;;#ASMSTART
; GFX789-NEXT:    ;;#ASMEND
; GFX789-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_full_round_mode_2:
; GFX10:       ; %bb.0:
; GFX10-NEXT:    s_round_mode 0x2 ; encoding: [0x02,0x00,0xa4,0xbf]
; GFX10-NEXT:    ;;#ASMSTART
; GFX10-NEXT:    ;;#ASMEND
; GFX10-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 6145, i32 2)
  ; Empty side-effecting asm: the expected output places the markers after the mode write.
  call void asm sideeffect "", ""()
  ret void
}
|
|
|
|
; Constant 4 written to the full fp_round field (offset 0, width 4).
; The gfx10 expectations use the dedicated s_round_mode instruction; the
; older targets keep s_setreg_imm32_b32.
; Immediate 6145 = 1 | (0 << 6) | ((4 - 1) << 11).
define amdgpu_kernel void @test_setreg_full_round_mode_4() {
; GFX6-LABEL: test_setreg_full_round_mode_4:
; GFX6:       ; %bb.0:
; GFX6-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 4), 4 ; encoding: [0x01,0x18,0x80,0xba,0x04,0x00,0x00,0x00]
; GFX6-NEXT:    ;;#ASMSTART
; GFX6-NEXT:    ;;#ASMEND
; GFX6-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_full_round_mode_4:
; GFX789:       ; %bb.0:
; GFX789-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 4), 4 ; encoding: [0x01,0x18,0x00,0xba,0x04,0x00,0x00,0x00]
; GFX789-NEXT:    ;;#ASMSTART
; GFX789-NEXT:    ;;#ASMEND
; GFX789-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_full_round_mode_4:
; GFX10:       ; %bb.0:
; GFX10-NEXT:    s_round_mode 0x4 ; encoding: [0x04,0x00,0xa4,0xbf]
; GFX10-NEXT:    ;;#ASMSTART
; GFX10-NEXT:    ;;#ASMEND
; GFX10-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 6145, i32 4)
  ; Empty side-effecting asm: the expected output places the markers after the mode write.
  call void asm sideeffect "", ""()
  ret void
}
|
|
|
|
; Constant 8 written to the full fp_round field (offset 0, width 4).
; The gfx10 expectations use the dedicated s_round_mode instruction; the
; older targets keep s_setreg_imm32_b32.
; Immediate 6145 = 1 | (0 << 6) | ((4 - 1) << 11).
define amdgpu_kernel void @test_setreg_full_round_mode_8() {
; GFX6-LABEL: test_setreg_full_round_mode_8:
; GFX6:       ; %bb.0:
; GFX6-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 4), 8 ; encoding: [0x01,0x18,0x80,0xba,0x08,0x00,0x00,0x00]
; GFX6-NEXT:    ;;#ASMSTART
; GFX6-NEXT:    ;;#ASMEND
; GFX6-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_full_round_mode_8:
; GFX789:       ; %bb.0:
; GFX789-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 4), 8 ; encoding: [0x01,0x18,0x00,0xba,0x08,0x00,0x00,0x00]
; GFX789-NEXT:    ;;#ASMSTART
; GFX789-NEXT:    ;;#ASMEND
; GFX789-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_full_round_mode_8:
; GFX10:       ; %bb.0:
; GFX10-NEXT:    s_round_mode 0x8 ; encoding: [0x08,0x00,0xa4,0xbf]
; GFX10-NEXT:    ;;#ASMSTART
; GFX10-NEXT:    ;;#ASMEND
; GFX10-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 6145, i32 8)
  ; Empty side-effecting asm: the expected output places the markers after the mode write.
  call void asm sideeffect "", ""()
  ret void
}
|
|
|
|
; Constant 15 (all four bits set) written to the full fp_round field
; (offset 0, width 4). The gfx10 expectations use the dedicated
; s_round_mode instruction; the older targets keep s_setreg_imm32_b32.
; Immediate 6145 = 1 | (0 << 6) | ((4 - 1) << 11).
define amdgpu_kernel void @test_setreg_full_round_mode_15() {
; GFX6-LABEL: test_setreg_full_round_mode_15:
; GFX6:       ; %bb.0:
; GFX6-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 4), 15 ; encoding: [0x01,0x18,0x80,0xba,0x0f,0x00,0x00,0x00]
; GFX6-NEXT:    ;;#ASMSTART
; GFX6-NEXT:    ;;#ASMEND
; GFX6-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_full_round_mode_15:
; GFX789:       ; %bb.0:
; GFX789-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 4), 15 ; encoding: [0x01,0x18,0x00,0xba,0x0f,0x00,0x00,0x00]
; GFX789-NEXT:    ;;#ASMSTART
; GFX789-NEXT:    ;;#ASMEND
; GFX789-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_full_round_mode_15:
; GFX10:       ; %bb.0:
; GFX10-NEXT:    s_round_mode 0xf ; encoding: [0x0f,0x00,0xa4,0xbf]
; GFX10-NEXT:    ;;#ASMSTART
; GFX10-NEXT:    ;;#ASMEND
; GFX10-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 6145, i32 15)
  ; Empty side-effecting asm: the expected output places the markers after the mode write.
  call void asm sideeffect "", ""()
  ret void
}
|
|
|
|
; The value 42 (0x2a) is wider than the four-bit fp_round field. The gfx10
; expectations show it truncated to 0xa in s_round_mode, while the
; s_setreg_imm32_b32 form on older targets keeps the literal 42.
; Immediate 6145 = 1 | (0 << 6) | ((4 - 1) << 11).
define amdgpu_kernel void @test_setreg_full_round_mode_42() {
; GFX6-LABEL: test_setreg_full_round_mode_42:
; GFX6:       ; %bb.0:
; GFX6-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 4), 42 ; encoding: [0x01,0x18,0x80,0xba,0x2a,0x00,0x00,0x00]
; GFX6-NEXT:    ;;#ASMSTART
; GFX6-NEXT:    ;;#ASMEND
; GFX6-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_full_round_mode_42:
; GFX789:       ; %bb.0:
; GFX789-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 4), 42 ; encoding: [0x01,0x18,0x00,0xba,0x2a,0x00,0x00,0x00]
; GFX789-NEXT:    ;;#ASMSTART
; GFX789-NEXT:    ;;#ASMEND
; GFX789-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_full_round_mode_42:
; GFX10:       ; %bb.0:
; GFX10-NEXT:    s_round_mode 0xa ; encoding: [0x0a,0x00,0xa4,0xbf]
; GFX10-NEXT:    ;;#ASMSTART
; GFX10-NEXT:    ;;#ASMEND
; GFX10-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 6145, i32 42)
  ; Empty side-effecting asm: the expected output places the markers after the mode write.
  call void asm sideeffect "", ""()
  ret void
}
|
|
|
|
; Constant 0 written to the full fp_denorm field (offset 4, width 4).
; The gfx10 expectations use the dedicated s_denorm_mode instruction; the
; older targets keep s_setreg_imm32_b32.
; Immediate 6401 = 1 | (4 << 6) | ((4 - 1) << 11).
define amdgpu_kernel void @test_setreg_full_denorm_mode_0() {
; GFX6-LABEL: test_setreg_full_denorm_mode_0:
; GFX6:       ; %bb.0:
; GFX6-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 4, 4), 0 ; encoding: [0x01,0x19,0x80,0xba,0x00,0x00,0x00,0x00]
; GFX6-NEXT:    ;;#ASMSTART
; GFX6-NEXT:    ;;#ASMEND
; GFX6-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_full_denorm_mode_0:
; GFX789:       ; %bb.0:
; GFX789-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 4, 4), 0 ; encoding: [0x01,0x19,0x00,0xba,0x00,0x00,0x00,0x00]
; GFX789-NEXT:    ;;#ASMSTART
; GFX789-NEXT:    ;;#ASMEND
; GFX789-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_full_denorm_mode_0:
; GFX10:       ; %bb.0:
; GFX10-NEXT:    s_denorm_mode 0 ; encoding: [0x00,0x00,0xa5,0xbf]
; GFX10-NEXT:    ;;#ASMSTART
; GFX10-NEXT:    ;;#ASMEND
; GFX10-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 6401, i32 0)
  ; Empty side-effecting asm: the expected output places the markers after the mode write.
  call void asm sideeffect "", ""()
  ret void
}
|
|
|
|
; Constant 1 written to the full fp_denorm field (offset 4, width 4).
; The gfx10 expectations use the dedicated s_denorm_mode instruction; the
; older targets keep s_setreg_imm32_b32.
; Immediate 6401 = 1 | (4 << 6) | ((4 - 1) << 11).
define amdgpu_kernel void @test_setreg_full_denorm_mode_1() {
; GFX6-LABEL: test_setreg_full_denorm_mode_1:
; GFX6:       ; %bb.0:
; GFX6-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 4, 4), 1 ; encoding: [0x01,0x19,0x80,0xba,0x01,0x00,0x00,0x00]
; GFX6-NEXT:    ;;#ASMSTART
; GFX6-NEXT:    ;;#ASMEND
; GFX6-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_full_denorm_mode_1:
; GFX789:       ; %bb.0:
; GFX789-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 4, 4), 1 ; encoding: [0x01,0x19,0x00,0xba,0x01,0x00,0x00,0x00]
; GFX789-NEXT:    ;;#ASMSTART
; GFX789-NEXT:    ;;#ASMEND
; GFX789-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_full_denorm_mode_1:
; GFX10:       ; %bb.0:
; GFX10-NEXT:    s_denorm_mode 1 ; encoding: [0x01,0x00,0xa5,0xbf]
; GFX10-NEXT:    ;;#ASMSTART
; GFX10-NEXT:    ;;#ASMEND
; GFX10-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 6401, i32 1)
  ; Empty side-effecting asm: the expected output places the markers after the mode write.
  call void asm sideeffect "", ""()
  ret void
}
|
|
|
|
|
|
; Constant 2 written to the full fp_denorm field (offset 4, width 4).
; The gfx10 expectations use the dedicated s_denorm_mode instruction; the
; older targets keep s_setreg_imm32_b32.
; Immediate 6401 = 1 | (4 << 6) | ((4 - 1) << 11).
define amdgpu_kernel void @test_setreg_full_denorm_mode_2() {
; GFX6-LABEL: test_setreg_full_denorm_mode_2:
; GFX6:       ; %bb.0:
; GFX6-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 4, 4), 2 ; encoding: [0x01,0x19,0x80,0xba,0x02,0x00,0x00,0x00]
; GFX6-NEXT:    ;;#ASMSTART
; GFX6-NEXT:    ;;#ASMEND
; GFX6-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_full_denorm_mode_2:
; GFX789:       ; %bb.0:
; GFX789-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 4, 4), 2 ; encoding: [0x01,0x19,0x00,0xba,0x02,0x00,0x00,0x00]
; GFX789-NEXT:    ;;#ASMSTART
; GFX789-NEXT:    ;;#ASMEND
; GFX789-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_full_denorm_mode_2:
; GFX10:       ; %bb.0:
; GFX10-NEXT:    s_denorm_mode 2 ; encoding: [0x02,0x00,0xa5,0xbf]
; GFX10-NEXT:    ;;#ASMSTART
; GFX10-NEXT:    ;;#ASMEND
; GFX10-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 6401, i32 2)
  ; Empty side-effecting asm: the expected output places the markers after the mode write.
  call void asm sideeffect "", ""()
  ret void
}
|
|
|
|
; Constant 4 written to the full fp_denorm field (offset 4, width 4).
; The gfx10 expectations use the dedicated s_denorm_mode instruction; the
; older targets keep s_setreg_imm32_b32.
; Immediate 6401 = 1 | (4 << 6) | ((4 - 1) << 11).
define amdgpu_kernel void @test_setreg_full_denorm_mode_4() {
; GFX6-LABEL: test_setreg_full_denorm_mode_4:
; GFX6:       ; %bb.0:
; GFX6-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 4, 4), 4 ; encoding: [0x01,0x19,0x80,0xba,0x04,0x00,0x00,0x00]
; GFX6-NEXT:    ;;#ASMSTART
; GFX6-NEXT:    ;;#ASMEND
; GFX6-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_full_denorm_mode_4:
; GFX789:       ; %bb.0:
; GFX789-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 4, 4), 4 ; encoding: [0x01,0x19,0x00,0xba,0x04,0x00,0x00,0x00]
; GFX789-NEXT:    ;;#ASMSTART
; GFX789-NEXT:    ;;#ASMEND
; GFX789-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_full_denorm_mode_4:
; GFX10:       ; %bb.0:
; GFX10-NEXT:    s_denorm_mode 4 ; encoding: [0x04,0x00,0xa5,0xbf]
; GFX10-NEXT:    ;;#ASMSTART
; GFX10-NEXT:    ;;#ASMEND
; GFX10-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 6401, i32 4)
  ; Empty side-effecting asm: the expected output places the markers after the mode write.
  call void asm sideeffect "", ""()
  ret void
}
|
|
|
|
; Constant 8 written to the full fp_denorm field (offset 4, width 4).
; The gfx10 expectations use the dedicated s_denorm_mode instruction; the
; older targets keep s_setreg_imm32_b32.
; Immediate 6401 = 1 | (4 << 6) | ((4 - 1) << 11).
define amdgpu_kernel void @test_setreg_full_denorm_mode_8() {
; GFX6-LABEL: test_setreg_full_denorm_mode_8:
; GFX6:       ; %bb.0:
; GFX6-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 4, 4), 8 ; encoding: [0x01,0x19,0x80,0xba,0x08,0x00,0x00,0x00]
; GFX6-NEXT:    ;;#ASMSTART
; GFX6-NEXT:    ;;#ASMEND
; GFX6-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_full_denorm_mode_8:
; GFX789:       ; %bb.0:
; GFX789-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 4, 4), 8 ; encoding: [0x01,0x19,0x00,0xba,0x08,0x00,0x00,0x00]
; GFX789-NEXT:    ;;#ASMSTART
; GFX789-NEXT:    ;;#ASMEND
; GFX789-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_full_denorm_mode_8:
; GFX10:       ; %bb.0:
; GFX10-NEXT:    s_denorm_mode 8 ; encoding: [0x08,0x00,0xa5,0xbf]
; GFX10-NEXT:    ;;#ASMSTART
; GFX10-NEXT:    ;;#ASMEND
; GFX10-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 6401, i32 8)
  ; Empty side-effecting asm: the expected output places the markers after the mode write.
  call void asm sideeffect "", ""()
  ret void
}
|
|
|
|
; Constant 15 (all four bits set) written to the full fp_denorm field
; (offset 4, width 4). The gfx10 expectations use the dedicated
; s_denorm_mode instruction; the older targets keep s_setreg_imm32_b32.
; Immediate 6401 = 1 | (4 << 6) | ((4 - 1) << 11).
define amdgpu_kernel void @test_setreg_full_denorm_mode_15() {
; GFX6-LABEL: test_setreg_full_denorm_mode_15:
; GFX6:       ; %bb.0:
; GFX6-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 4, 4), 15 ; encoding: [0x01,0x19,0x80,0xba,0x0f,0x00,0x00,0x00]
; GFX6-NEXT:    ;;#ASMSTART
; GFX6-NEXT:    ;;#ASMEND
; GFX6-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_full_denorm_mode_15:
; GFX789:       ; %bb.0:
; GFX789-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 4, 4), 15 ; encoding: [0x01,0x19,0x00,0xba,0x0f,0x00,0x00,0x00]
; GFX789-NEXT:    ;;#ASMSTART
; GFX789-NEXT:    ;;#ASMEND
; GFX789-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_full_denorm_mode_15:
; GFX10:       ; %bb.0:
; GFX10-NEXT:    s_denorm_mode 15 ; encoding: [0x0f,0x00,0xa5,0xbf]
; GFX10-NEXT:    ;;#ASMSTART
; GFX10-NEXT:    ;;#ASMEND
; GFX10-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 6401, i32 15)
  ; Empty side-effecting asm: the expected output places the markers after the mode write.
  call void asm sideeffect "", ""()
  ret void
}
|
|
|
|
; The value 42 (0x2a) is wider than the four-bit fp_denorm field. The gfx10
; expectations show it truncated to 10 in s_denorm_mode, while the
; s_setreg_imm32_b32 form on older targets keeps the literal 42.
; Immediate 6401 = 1 | (4 << 6) | ((4 - 1) << 11).
define amdgpu_kernel void @test_setreg_full_denorm_mode_42() {
; GFX6-LABEL: test_setreg_full_denorm_mode_42:
; GFX6:       ; %bb.0:
; GFX6-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 4, 4), 42 ; encoding: [0x01,0x19,0x80,0xba,0x2a,0x00,0x00,0x00]
; GFX6-NEXT:    ;;#ASMSTART
; GFX6-NEXT:    ;;#ASMEND
; GFX6-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_full_denorm_mode_42:
; GFX789:       ; %bb.0:
; GFX789-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 4, 4), 42 ; encoding: [0x01,0x19,0x00,0xba,0x2a,0x00,0x00,0x00]
; GFX789-NEXT:    ;;#ASMSTART
; GFX789-NEXT:    ;;#ASMEND
; GFX789-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_full_denorm_mode_42:
; GFX10:       ; %bb.0:
; GFX10-NEXT:    s_denorm_mode 10 ; encoding: [0x0a,0x00,0xa5,0xbf]
; GFX10-NEXT:    ;;#ASMSTART
; GFX10-NEXT:    ;;#ASMEND
; GFX10-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 6401, i32 42)
  ; Empty side-effecting asm: the expected output places the markers after the mode write.
  call void asm sideeffect "", ""()
  ret void
}
|
|
|
|
; Constant 0 written across both the fp_round and fp_denorm fields
; (offset 0, width 8). Older targets use one s_setreg_imm32_b32; the gfx10
; expectations split the write into s_round_mode + s_denorm_mode.
; Immediate 14337 = 1 | (0 << 6) | ((8 - 1) << 11).
;
; Both gfx10 mode instructions come from the single setreg call, which
; precedes the inline asm in the IR, so both must be expected before the
; asm markers. The earlier expectations had s_denorm_mode after the end
; marker.
define amdgpu_kernel void @test_setreg_full_both_round_mode_and_denorm_mode_0() {
; GFX6-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_0:
; GFX6:       ; %bb.0:
; GFX6-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 8), 0 ; encoding: [0x01,0x38,0x80,0xba,0x00,0x00,0x00,0x00]
; GFX6-NEXT:    ;;#ASMSTART
; GFX6-NEXT:    ;;#ASMEND
; GFX6-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_0:
; GFX789:       ; %bb.0:
; GFX789-NEXT:    s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 8), 0 ; encoding: [0x01,0x38,0x00,0xba,0x00,0x00,0x00,0x00]
; GFX789-NEXT:    ;;#ASMSTART
; GFX789-NEXT:    ;;#ASMEND
; GFX789-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_0:
; GFX10:       ; %bb.0:
; GFX10-NEXT:    s_round_mode 0x0 ; encoding: [0x00,0x00,0xa4,0xbf]
; GFX10-NEXT:    s_denorm_mode 0 ; encoding: [0x00,0x00,0xa5,0xbf]
; GFX10-NEXT:    ;;#ASMSTART
; GFX10-NEXT:    ;;#ASMEND
; GFX10-NEXT:    s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 14337, i32 0)
  ; Empty side-effecting asm: the markers are expected after both mode writes.
  call void asm sideeffect "", ""()
  ret void
}
|
|
|
|
; Write 1 to the combined 8-bit fp_round/fp_denorm range.
; 14337 = 1 | (0 << 6) | ((8 - 1) << 11) selects hwreg(HW_REG_MODE, 0, 8).
; Only bit 0 (in the fp_round nibble) is set. On GFX10 the checks expect
; s_round_mode 0x1 and, after the inline asm markers, s_denorm_mode 0.
define amdgpu_kernel void @test_setreg_full_both_round_mode_and_denorm_mode_1() {
; GFX6-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_1:
; GFX6: ; %bb.0:
; GFX6-NEXT: s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 8), 1 ; encoding: [0x01,0x38,0x80,0xba,0x01,0x00,0x00,0x00]
; GFX6-NEXT: ;;#ASMSTART
; GFX6-NEXT: ;;#ASMEND
; GFX6-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_1:
; GFX789: ; %bb.0:
; GFX789-NEXT: s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 8), 1 ; encoding: [0x01,0x38,0x00,0xba,0x01,0x00,0x00,0x00]
; GFX789-NEXT: ;;#ASMSTART
; GFX789-NEXT: ;;#ASMEND
; GFX789-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_1:
; GFX10: ; %bb.0:
; GFX10-NEXT: s_round_mode 0x1 ; encoding: [0x01,0x00,0xa4,0xbf]
; GFX10-NEXT: ;;#ASMSTART
; GFX10-NEXT: ;;#ASMEND
; GFX10-NEXT: s_denorm_mode 0 ; encoding: [0x00,0x00,0xa5,0xbf]
; GFX10-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 14337, i32 1)
  call void asm sideeffect "", ""()
  ret void
}

; Write 2 to the combined 8-bit fp_round/fp_denorm range.
; 14337 = 1 | (0 << 6) | ((8 - 1) << 11) selects hwreg(HW_REG_MODE, 0, 8).
; Only bit 1 (in the fp_round nibble) is set. On GFX10 the checks expect
; s_round_mode 0x2 and, after the inline asm markers, s_denorm_mode 0.
define amdgpu_kernel void @test_setreg_full_both_round_mode_and_denorm_mode_2() {
; GFX6-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_2:
; GFX6: ; %bb.0:
; GFX6-NEXT: s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 8), 2 ; encoding: [0x01,0x38,0x80,0xba,0x02,0x00,0x00,0x00]
; GFX6-NEXT: ;;#ASMSTART
; GFX6-NEXT: ;;#ASMEND
; GFX6-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_2:
; GFX789: ; %bb.0:
; GFX789-NEXT: s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 8), 2 ; encoding: [0x01,0x38,0x00,0xba,0x02,0x00,0x00,0x00]
; GFX789-NEXT: ;;#ASMSTART
; GFX789-NEXT: ;;#ASMEND
; GFX789-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_2:
; GFX10: ; %bb.0:
; GFX10-NEXT: s_round_mode 0x2 ; encoding: [0x02,0x00,0xa4,0xbf]
; GFX10-NEXT: ;;#ASMSTART
; GFX10-NEXT: ;;#ASMEND
; GFX10-NEXT: s_denorm_mode 0 ; encoding: [0x00,0x00,0xa5,0xbf]
; GFX10-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 14337, i32 2)
  call void asm sideeffect "", ""()
  ret void
}

; Write 4 to the combined 8-bit fp_round/fp_denorm range.
; 14337 = 1 | (0 << 6) | ((8 - 1) << 11) selects hwreg(HW_REG_MODE, 0, 8).
; Only bit 2 (in the fp_round nibble) is set. On GFX10 the checks expect
; s_round_mode 0x4 and, after the inline asm markers, s_denorm_mode 0.
define amdgpu_kernel void @test_setreg_full_both_round_mode_and_denorm_mode_4() {
; GFX6-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_4:
; GFX6: ; %bb.0:
; GFX6-NEXT: s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 8), 4 ; encoding: [0x01,0x38,0x80,0xba,0x04,0x00,0x00,0x00]
; GFX6-NEXT: ;;#ASMSTART
; GFX6-NEXT: ;;#ASMEND
; GFX6-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_4:
; GFX789: ; %bb.0:
; GFX789-NEXT: s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 8), 4 ; encoding: [0x01,0x38,0x00,0xba,0x04,0x00,0x00,0x00]
; GFX789-NEXT: ;;#ASMSTART
; GFX789-NEXT: ;;#ASMEND
; GFX789-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_4:
; GFX10: ; %bb.0:
; GFX10-NEXT: s_round_mode 0x4 ; encoding: [0x04,0x00,0xa4,0xbf]
; GFX10-NEXT: ;;#ASMSTART
; GFX10-NEXT: ;;#ASMEND
; GFX10-NEXT: s_denorm_mode 0 ; encoding: [0x00,0x00,0xa5,0xbf]
; GFX10-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 14337, i32 4)
  call void asm sideeffect "", ""()
  ret void
}

; Write 8 to the combined 8-bit fp_round/fp_denorm range.
; 14337 = 1 | (0 << 6) | ((8 - 1) << 11) selects hwreg(HW_REG_MODE, 0, 8).
; Only bit 3 (top bit of the fp_round nibble) is set. On GFX10 the checks
; expect s_round_mode 0x8 and, after the inline asm markers, s_denorm_mode 0.
define amdgpu_kernel void @test_setreg_full_both_round_mode_and_denorm_mode_8() {
; GFX6-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_8:
; GFX6: ; %bb.0:
; GFX6-NEXT: s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 8), 8 ; encoding: [0x01,0x38,0x80,0xba,0x08,0x00,0x00,0x00]
; GFX6-NEXT: ;;#ASMSTART
; GFX6-NEXT: ;;#ASMEND
; GFX6-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_8:
; GFX789: ; %bb.0:
; GFX789-NEXT: s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 8), 8 ; encoding: [0x01,0x38,0x00,0xba,0x08,0x00,0x00,0x00]
; GFX789-NEXT: ;;#ASMSTART
; GFX789-NEXT: ;;#ASMEND
; GFX789-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_8:
; GFX10: ; %bb.0:
; GFX10-NEXT: s_round_mode 0x8 ; encoding: [0x08,0x00,0xa4,0xbf]
; GFX10-NEXT: ;;#ASMSTART
; GFX10-NEXT: ;;#ASMEND
; GFX10-NEXT: s_denorm_mode 0 ; encoding: [0x00,0x00,0xa5,0xbf]
; GFX10-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 14337, i32 8)
  call void asm sideeffect "", ""()
  ret void
}

; Write 16 to the combined 8-bit fp_round/fp_denorm range.
; 14337 = 1 | (0 << 6) | ((8 - 1) << 11) selects hwreg(HW_REG_MODE, 0, 8).
; Only bit 4 (lowest bit of the fp_denorm nibble) is set. On GFX10 the checks
; expect s_round_mode 0x0 and, after the inline asm markers, s_denorm_mode 1.
define amdgpu_kernel void @test_setreg_full_both_round_mode_and_denorm_mode_16() {
; GFX6-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_16:
; GFX6: ; %bb.0:
; GFX6-NEXT: s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 8), 16 ; encoding: [0x01,0x38,0x80,0xba,0x10,0x00,0x00,0x00]
; GFX6-NEXT: ;;#ASMSTART
; GFX6-NEXT: ;;#ASMEND
; GFX6-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_16:
; GFX789: ; %bb.0:
; GFX789-NEXT: s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 8), 16 ; encoding: [0x01,0x38,0x00,0xba,0x10,0x00,0x00,0x00]
; GFX789-NEXT: ;;#ASMSTART
; GFX789-NEXT: ;;#ASMEND
; GFX789-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_16:
; GFX10: ; %bb.0:
; GFX10-NEXT: s_round_mode 0x0 ; encoding: [0x00,0x00,0xa4,0xbf]
; GFX10-NEXT: ;;#ASMSTART
; GFX10-NEXT: ;;#ASMEND
; GFX10-NEXT: s_denorm_mode 1 ; encoding: [0x01,0x00,0xa5,0xbf]
; GFX10-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 14337, i32 16)
  call void asm sideeffect "", ""()
  ret void
}

; Write 32 to the combined 8-bit fp_round/fp_denorm range.
; 14337 = 1 | (0 << 6) | ((8 - 1) << 11) selects hwreg(HW_REG_MODE, 0, 8).
; Only bit 5 (in the fp_denorm nibble) is set. On GFX10 the checks expect
; s_round_mode 0x0 and, after the inline asm markers, s_denorm_mode 2.
define amdgpu_kernel void @test_setreg_full_both_round_mode_and_denorm_mode_32() {
; GFX6-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_32:
; GFX6: ; %bb.0:
; GFX6-NEXT: s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 8), 32 ; encoding: [0x01,0x38,0x80,0xba,0x20,0x00,0x00,0x00]
; GFX6-NEXT: ;;#ASMSTART
; GFX6-NEXT: ;;#ASMEND
; GFX6-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_32:
; GFX789: ; %bb.0:
; GFX789-NEXT: s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 8), 32 ; encoding: [0x01,0x38,0x00,0xba,0x20,0x00,0x00,0x00]
; GFX789-NEXT: ;;#ASMSTART
; GFX789-NEXT: ;;#ASMEND
; GFX789-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_32:
; GFX10: ; %bb.0:
; GFX10-NEXT: s_round_mode 0x0 ; encoding: [0x00,0x00,0xa4,0xbf]
; GFX10-NEXT: ;;#ASMSTART
; GFX10-NEXT: ;;#ASMEND
; GFX10-NEXT: s_denorm_mode 2 ; encoding: [0x02,0x00,0xa5,0xbf]
; GFX10-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 14337, i32 32)
  call void asm sideeffect "", ""()
  ret void
}

; Write 64 to the combined 8-bit fp_round/fp_denorm range.
; 14337 = 1 | (0 << 6) | ((8 - 1) << 11) selects hwreg(HW_REG_MODE, 0, 8).
; Only bit 6 (in the fp_denorm nibble) is set. On GFX10 the checks expect
; s_round_mode 0x0 and, after the inline asm markers, s_denorm_mode 4.
define amdgpu_kernel void @test_setreg_full_both_round_mode_and_denorm_mode_64() {
; GFX6-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_64:
; GFX6: ; %bb.0:
; GFX6-NEXT: s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 8), 64 ; encoding: [0x01,0x38,0x80,0xba,0x40,0x00,0x00,0x00]
; GFX6-NEXT: ;;#ASMSTART
; GFX6-NEXT: ;;#ASMEND
; GFX6-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_64:
; GFX789: ; %bb.0:
; GFX789-NEXT: s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 8), 64 ; encoding: [0x01,0x38,0x00,0xba,0x40,0x00,0x00,0x00]
; GFX789-NEXT: ;;#ASMSTART
; GFX789-NEXT: ;;#ASMEND
; GFX789-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_64:
; GFX10: ; %bb.0:
; GFX10-NEXT: s_round_mode 0x0 ; encoding: [0x00,0x00,0xa4,0xbf]
; GFX10-NEXT: ;;#ASMSTART
; GFX10-NEXT: ;;#ASMEND
; GFX10-NEXT: s_denorm_mode 4 ; encoding: [0x04,0x00,0xa5,0xbf]
; GFX10-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 14337, i32 64)
  call void asm sideeffect "", ""()
  ret void
}

; Write 128 to the combined 8-bit fp_round/fp_denorm range.
; 14337 = 1 | (0 << 6) | ((8 - 1) << 11) selects hwreg(HW_REG_MODE, 0, 8).
; Only bit 7 (top bit of the fp_denorm nibble) is set. On GFX10 the checks
; expect s_round_mode 0x0 and, after the inline asm markers, s_denorm_mode 8.
define amdgpu_kernel void @test_setreg_full_both_round_mode_and_denorm_mode_128() {
; GFX6-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_128:
; GFX6: ; %bb.0:
; GFX6-NEXT: s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 8), 0x80 ; encoding: [0x01,0x38,0x80,0xba,0x80,0x00,0x00,0x00]
; GFX6-NEXT: ;;#ASMSTART
; GFX6-NEXT: ;;#ASMEND
; GFX6-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_128:
; GFX789: ; %bb.0:
; GFX789-NEXT: s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 8), 0x80 ; encoding: [0x01,0x38,0x00,0xba,0x80,0x00,0x00,0x00]
; GFX789-NEXT: ;;#ASMSTART
; GFX789-NEXT: ;;#ASMEND
; GFX789-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_128:
; GFX10: ; %bb.0:
; GFX10-NEXT: s_round_mode 0x0 ; encoding: [0x00,0x00,0xa4,0xbf]
; GFX10-NEXT: ;;#ASMSTART
; GFX10-NEXT: ;;#ASMEND
; GFX10-NEXT: s_denorm_mode 8 ; encoding: [0x08,0x00,0xa5,0xbf]
; GFX10-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 14337, i32 128)
  call void asm sideeffect "", ""()
  ret void
}

; Write 15 to the combined 8-bit fp_round/fp_denorm range.
; 14337 = 1 | (0 << 6) | ((8 - 1) << 11) selects hwreg(HW_REG_MODE, 0, 8).
; All four fp_round bits are set and the fp_denorm nibble is zero. On GFX10
; the checks expect s_round_mode 0xf and, after the inline asm markers,
; s_denorm_mode 0.
define amdgpu_kernel void @test_setreg_full_both_round_mode_and_denorm_mode_15() {
; GFX6-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_15:
; GFX6: ; %bb.0:
; GFX6-NEXT: s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 8), 15 ; encoding: [0x01,0x38,0x80,0xba,0x0f,0x00,0x00,0x00]
; GFX6-NEXT: ;;#ASMSTART
; GFX6-NEXT: ;;#ASMEND
; GFX6-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_15:
; GFX789: ; %bb.0:
; GFX789-NEXT: s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 8), 15 ; encoding: [0x01,0x38,0x00,0xba,0x0f,0x00,0x00,0x00]
; GFX789-NEXT: ;;#ASMSTART
; GFX789-NEXT: ;;#ASMEND
; GFX789-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_15:
; GFX10: ; %bb.0:
; GFX10-NEXT: s_round_mode 0xf ; encoding: [0x0f,0x00,0xa4,0xbf]
; GFX10-NEXT: ;;#ASMSTART
; GFX10-NEXT: ;;#ASMEND
; GFX10-NEXT: s_denorm_mode 0 ; encoding: [0x00,0x00,0xa5,0xbf]
; GFX10-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 14337, i32 15)
  call void asm sideeffect "", ""()
  ret void
}

; Write 255 to the combined 8-bit fp_round/fp_denorm range.
; 14337 = 1 | (0 << 6) | ((8 - 1) << 11) selects hwreg(HW_REG_MODE, 0, 8).
; Every bit of both fields is set. On GFX10 the checks expect
; s_round_mode 0xf and, after the inline asm markers, s_denorm_mode 15.
define amdgpu_kernel void @test_setreg_full_both_round_mode_and_denorm_mode_255() {
; GFX6-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_255:
; GFX6: ; %bb.0:
; GFX6-NEXT: s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 8), 0xff ; encoding: [0x01,0x38,0x80,0xba,0xff,0x00,0x00,0x00]
; GFX6-NEXT: ;;#ASMSTART
; GFX6-NEXT: ;;#ASMEND
; GFX6-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_255:
; GFX789: ; %bb.0:
; GFX789-NEXT: s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 8), 0xff ; encoding: [0x01,0x38,0x00,0xba,0xff,0x00,0x00,0x00]
; GFX789-NEXT: ;;#ASMSTART
; GFX789-NEXT: ;;#ASMEND
; GFX789-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_255:
; GFX10: ; %bb.0:
; GFX10-NEXT: s_round_mode 0xf ; encoding: [0x0f,0x00,0xa4,0xbf]
; GFX10-NEXT: ;;#ASMSTART
; GFX10-NEXT: ;;#ASMEND
; GFX10-NEXT: s_denorm_mode 15 ; encoding: [0x0f,0x00,0xa5,0xbf]
; GFX10-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 14337, i32 255)
  call void asm sideeffect "", ""()
  ret void
}

; Truncate extra high bits.
; 14337 = 1 | (0 << 6) | ((8 - 1) << 11) selects hwreg(HW_REG_MODE, 0, 8),
; but 597 (0x255) needs 10 bits. On GFX10 the checks expect only the low
; 8 bits (0x55) to be used: s_round_mode 0x5 and, after the inline asm
; markers, s_denorm_mode 5. GFX6 and GFX789 keep the full 0x255 immediate on
; s_setreg_imm32_b32.
define amdgpu_kernel void @test_setreg_full_both_round_mode_and_denorm_mode_597() {
; GFX6-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_597:
; GFX6: ; %bb.0:
; GFX6-NEXT: s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 8), 0x255 ; encoding: [0x01,0x38,0x80,0xba,0x55,0x02,0x00,0x00]
; GFX6-NEXT: ;;#ASMSTART
; GFX6-NEXT: ;;#ASMEND
; GFX6-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_597:
; GFX789: ; %bb.0:
; GFX789-NEXT: s_setreg_imm32_b32 hwreg(HW_REG_MODE, 0, 8), 0x255 ; encoding: [0x01,0x38,0x00,0xba,0x55,0x02,0x00,0x00]
; GFX789-NEXT: ;;#ASMSTART
; GFX789-NEXT: ;;#ASMEND
; GFX789-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_full_both_round_mode_and_denorm_mode_597:
; GFX10: ; %bb.0:
; GFX10-NEXT: s_round_mode 0x5 ; encoding: [0x05,0x00,0xa4,0xbf]
; GFX10-NEXT: ;;#ASMSTART
; GFX10-NEXT: ;;#ASMEND
; GFX10-NEXT: s_denorm_mode 5 ; encoding: [0x05,0x00,0xa5,0xbf]
; GFX10-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 14337, i32 597)
  call void asm sideeffect "", ""()
  ret void
}

; Write an 8-bit range that is not aligned to the fp_round/fp_denorm fields.
; 14465 = 1 | (2 << 6) | ((8 - 1) << 11) selects hwreg(HW_REG_MODE, 2, 8),
; i.e. bits 2..9: it starts inside fp_round (offset 0) and runs past
; fp_denorm (offset 4) into the bits at offsets 8 and 9.
; On GFX10 the checks expect the plain s_setreg_imm32_b32 to be kept, with no
; s_round_mode / s_denorm_mode split.
define amdgpu_kernel void @test_setreg_set_8_bits_straddles_round_and_denorm() {
; GFX6-LABEL: test_setreg_set_8_bits_straddles_round_and_denorm:
; GFX6: ; %bb.0:
; GFX6-NEXT: s_setreg_imm32_b32 hwreg(HW_REG_MODE, 2, 8), 0xff ; encoding: [0x81,0x38,0x80,0xba,0xff,0x00,0x00,0x00]
; GFX6-NEXT: ;;#ASMSTART
; GFX6-NEXT: ;;#ASMEND
; GFX6-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_set_8_bits_straddles_round_and_denorm:
; GFX789: ; %bb.0:
; GFX789-NEXT: s_setreg_imm32_b32 hwreg(HW_REG_MODE, 2, 8), 0xff ; encoding: [0x81,0x38,0x00,0xba,0xff,0x00,0x00,0x00]
; GFX789-NEXT: ;;#ASMSTART
; GFX789-NEXT: ;;#ASMEND
; GFX789-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_set_8_bits_straddles_round_and_denorm:
; GFX10: ; %bb.0:
; GFX10-NEXT: s_setreg_imm32_b32 hwreg(HW_REG_MODE, 2, 8), 0xff ; encoding: [0x81,0x38,0x80,0xba,0xff,0x00,0x00,0x00]
; GFX10-NEXT: ;;#ASMSTART
; GFX10-NEXT: ;;#ASMEND
; GFX10-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 14465, i32 255)
  call void asm sideeffect "", ""()
  ret void
}

; Write a 4-bit range that is not aligned to the fp_round/fp_denorm fields.
; 6273 = 1 | (2 << 6) | ((4 - 1) << 11) selects hwreg(HW_REG_MODE, 2, 4),
; i.e. bits 2..5: the upper half of fp_round (offset 0) and the lower half
; of fp_denorm (offset 4).
; On GFX10 the checks expect the plain s_setreg_imm32_b32 to be kept, with no
; s_round_mode / s_denorm_mode split.
define amdgpu_kernel void @test_setreg_set_4_bits_straddles_round_and_denorm() {
; GFX6-LABEL: test_setreg_set_4_bits_straddles_round_and_denorm:
; GFX6: ; %bb.0:
; GFX6-NEXT: s_setreg_imm32_b32 hwreg(HW_REG_MODE, 2, 4), 15 ; encoding: [0x81,0x18,0x80,0xba,0x0f,0x00,0x00,0x00]
; GFX6-NEXT: ;;#ASMSTART
; GFX6-NEXT: ;;#ASMEND
; GFX6-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX789-LABEL: test_setreg_set_4_bits_straddles_round_and_denorm:
; GFX789: ; %bb.0:
; GFX789-NEXT: s_setreg_imm32_b32 hwreg(HW_REG_MODE, 2, 4), 15 ; encoding: [0x81,0x18,0x00,0xba,0x0f,0x00,0x00,0x00]
; GFX789-NEXT: ;;#ASMSTART
; GFX789-NEXT: ;;#ASMEND
; GFX789-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
;
; GFX10-LABEL: test_setreg_set_4_bits_straddles_round_and_denorm:
; GFX10: ; %bb.0:
; GFX10-NEXT: s_setreg_imm32_b32 hwreg(HW_REG_MODE, 2, 4), 15 ; encoding: [0x81,0x18,0x80,0xba,0x0f,0x00,0x00,0x00]
; GFX10-NEXT: ;;#ASMSTART
; GFX10-NEXT: ;;#ASMEND
; GFX10-NEXT: s_endpgm ; encoding: [0x00,0x00,0x81,0xbf]
  call void @llvm.amdgcn.s.setreg(i32 6273, i32 15)
  call void asm sideeffect "", ""()
  ret void
}

; FIXME: Broken for DAG
; Write a non-constant value taken from a function argument.
; 4097 = 1 | (0 << 6) | ((3 - 1) << 11) selects hwreg(HW_REG_MODE, 0, 3).
; This is a regular (non-kernel) function, so the checks end in s_setpc_b64.
; The checks expect the argument in v0 to be copied to an SGPR with
; v_readfirstlane_b32 and written with the register form s_setreg_b32.
; NOTE(review): the GFX10 checks place s_setreg_b32 after the inline asm
; markers, unlike GFX6 and GFX789; confirm this ordering is intended when
; regenerating the checks.
define void @test_setreg_roundingmode_var_vgpr(i32 %var.mode) {
; GFX6-LABEL: test_setreg_roundingmode_var_vgpr:
; GFX6: ; %bb.0:
; GFX6-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0) ; encoding: [0x00,0x00,0x8c,0xbf]
; GFX6-NEXT: v_readfirstlane_b32 s4, v0 ; encoding: [0x00,0x05,0x08,0x7e]
; GFX6-NEXT: s_setreg_b32 hwreg(HW_REG_MODE, 0, 3), s4 ; encoding: [0x01,0x10,0x84,0xb9]
; GFX6-NEXT: ;;#ASMSTART
; GFX6-NEXT: ;;#ASMEND
; GFX6-NEXT: s_setpc_b64 s[30:31] ; encoding: [0x1e,0x20,0x80,0xbe]
;
; GFX789-LABEL: test_setreg_roundingmode_var_vgpr:
; GFX789: ; %bb.0:
; GFX789-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0) ; encoding: [0x00,0x00,0x8c,0xbf]
; GFX789-NEXT: v_readfirstlane_b32 s4, v0 ; encoding: [0x00,0x05,0x08,0x7e]
; GFX789-NEXT: s_setreg_b32 hwreg(HW_REG_MODE, 0, 3), s4 ; encoding: [0x01,0x10,0x04,0xb9]
; GFX789-NEXT: ;;#ASMSTART
; GFX789-NEXT: ;;#ASMEND
; GFX789-NEXT: s_setpc_b64 s[30:31] ; encoding: [0x1e,0x1d,0x80,0xbe]
;
; GFX10-LABEL: test_setreg_roundingmode_var_vgpr:
; GFX10: ; %bb.0:
; GFX10-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0) ; encoding: [0x00,0x00,0x8c,0xbf]
; GFX10-NEXT: s_waitcnt_vscnt null, 0x0 ; encoding: [0x00,0x00,0xfd,0xbb]
; GFX10-NEXT: v_readfirstlane_b32 s4, v0 ; encoding: [0x00,0x05,0x08,0x7e]
; GFX10-NEXT: ;;#ASMSTART
; GFX10-NEXT: ;;#ASMEND
; GFX10-NEXT: s_setreg_b32 hwreg(HW_REG_MODE, 0, 3), s4 ; encoding: [0x01,0x10,0x84,0xb9]
; GFX10-NEXT: s_setpc_b64 s[30:31] ; encoding: [0x1e,0x20,0x80,0xbe]
  call void @llvm.amdgcn.s.setreg(i32 4097, i32 %var.mode)
  call void asm sideeffect "", ""()
  ret void
}

; Intrinsic under test. The first operand is marked immarg, so each call
; passes the hwreg encoding as a constant; the second operand is the value
; to write and may be a constant or a variable.
declare void @llvm.amdgcn.s.setreg(i32 immarg, i32) #0

; Attribute group applied to the intrinsic declaration.
attributes #0 = { nounwind }