; RUN: llc -march=amdgcn -verify-machineinstrs < %s | FileCheck -check-prefix=SI %s
; RUN: llc -march=amdgcn -mcpu=tonga -verify-machineinstrs < %s | FileCheck -check-prefix=SI %s

; An i1 phi whose incoming values are the constants true and false feeds a
; conditional branch. The expectations below require the phi value to live in
; a single 64-bit SGPR pair: set to 0 in %bb, overwritten with exec in %bb2,
; and consumed by s_and_saveexec_b64 in %bb3.

; SI-LABEL: {{^}}br_i1_phi:

; SI: ; %bb
; SI: s_mov_b64 [[TMP:s\[[0-9]+:[0-9]+\]]], 0

; SI: ; %bb2
; SI: s_mov_b64 [[TMP]], exec

; SI: ; %bb3
; SI: s_and_saveexec_b64 {{s\[[0-9]+:[0-9]+\]}}, [[TMP]]

define amdgpu_kernel void @br_i1_phi(i32 %arg) {
bb:
  ; Branch on the low bit of the x work-item id.
  %tidig = call i32 @llvm.amdgcn.workitem.id.x()
  %cmp = trunc i32 %tidig to i1
  br i1 %cmp, label %bb2, label %bb3

bb2:                                              ; preds = %bb
  br label %bb3

bb3:                                              ; preds = %bb2, %bb
  ; true when reached through %bb2, false when reached directly from %bb.
  %tmp = phi i1 [ true, %bb2 ], [ false, %bb ]
  br i1 %tmp, label %bb4, label %bb6

bb4:                                              ; preds = %bb3
  ; The load is volatile, so it must be kept even though %tmp5 is never used.
  %val = load volatile i32, i32 addrspace(1)* undef
  %tmp5 = mul i32 %val, %arg
  br label %bb6

bb6:                                              ; preds = %bb4, %bb3
  ret void
}

; Intrinsic called by @br_i1_phi to obtain the x work-item id.
declare i32 @llvm.amdgcn.workitem.id.x() #0

attributes #0 = { nounwind readnone }

; Make sure this won't crash.
; The <2 x i1> phi in %exit receives undef from %entry and the fcmp result
; from %false, then drives a vector select. The expectations require two
; v_cndmask_b32_e64 instructions (presumably one per vector element).
; SI-LABEL: {{^}}vcopy_i1_undef:
; SI: v_cndmask_b32_e64
; SI: v_cndmask_b32_e64
define <2 x float> @vcopy_i1_undef(<2 x float> addrspace(1)* %p) {
entry:
  ; The branch condition is undef on purpose; either successor may be taken.
  br i1 undef, label %exit, label %false

false:
  %x = load <2 x float>, <2 x float> addrspace(1)* %p
  %cmp = fcmp one <2 x float> %x, zeroinitializer
  br label %exit

exit:
  %c = phi <2 x i1> [ undef, %entry ], [ %cmp, %false ]
  %ret = select <2 x i1> %c, <2 x float> <float 2.0, float 2.0>, <2 x float> <float 4.0, float 4.0>
  ret <2 x float> %ret
}