diff options
Diffstat (limited to 'test/CodeGen/R600/v_cndmask.ll')
-rw-r--r-- | test/CodeGen/R600/v_cndmask.ll | 42 |
1 files changed, 33 insertions, 9 deletions
diff --git a/test/CodeGen/R600/v_cndmask.ll b/test/CodeGen/R600/v_cndmask.ll index 84087ee..a24dcc7 100644 --- a/test/CodeGen/R600/v_cndmask.ll +++ b/test/CodeGen/R600/v_cndmask.ll @@ -1,14 +1,38 @@ -; RUN: llc < %s -march=r600 -mcpu=SI -verify-machineinstrs | FileCheck --check-prefix=SI %s +; RUN: llc -march=r600 -mcpu=SI -verify-machineinstrs < %s | FileCheck -check-prefix=SI %s -; SI: @v_cnd_nan -; SI: V_CNDMASK_B32_e64 v{{[0-9]}}, +declare i32 @llvm.r600.read.tidig.x() #1 + +; SI-LABEL: {{^}}v_cnd_nan_nosgpr: +; SI: v_cndmask_b32_e64 v{{[0-9]}}, v{{[0-9]}}, -1, s{{\[[0-9]+:[0-9]+\]}} ; SI-DAG: v{{[0-9]}} ; All nan values are converted to 0xffffffff -; SI-DAG: -1 -define void @v_cnd_nan(float addrspace(1)* %out, i32 %c, float %f) { -entry: - %0 = icmp ne i32 %c, 0 - %1 = select i1 %0, float 0xFFFFFFFFE0000000, float %f - store float %1, float addrspace(1)* %out +; SI: s_endpgm +define void @v_cnd_nan_nosgpr(float addrspace(1)* %out, i32 %c, float addrspace(1)* %fptr) #0 { + %idx = call i32 @llvm.r600.read.tidig.x() #1 + %f.gep = getelementptr float addrspace(1)* %fptr, i32 %idx + %f = load float addrspace(1)* %fptr + %setcc = icmp ne i32 %c, 0 + %select = select i1 %setcc, float 0xFFFFFFFFE0000000, float %f + store float %select, float addrspace(1)* %out ret void } + + +; This requires slightly trickier SGPR operand legalization since the +; single constant bus SGPR usage is the last operand, and it should +; never be moved. + +; SI-LABEL: {{^}}v_cnd_nan: +; SI: v_cndmask_b32_e64 v{{[0-9]}}, v{{[0-9]}}, -1, s{{\[[0-9]+:[0-9]+\]}} +; SI-DAG: v{{[0-9]}} +; All nan values are converted to 0xffffffff +; SI: s_endpgm +define void @v_cnd_nan(float addrspace(1)* %out, i32 %c, float %f) #0 { + %setcc = icmp ne i32 %c, 0 + %select = select i1 %setcc, float 0xFFFFFFFFE0000000, float %f + store float %select, float addrspace(1)* %out + ret void +} + +attributes #0 = { nounwind } +attributes #1 = { nounwind readnone } |