Mercurial > hg > CbC > CbC_llvm
diff llvm/test/CodeGen/AMDGPU/llvm.amdgcn.rcp.legacy.ll @ 150:1d019706d866
LLVM10
author | anatofuz |
---|---|
date | Thu, 13 Feb 2020 15:10:13 +0900 |
parents | |
children | 1f2b6ac9f198 |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/llvm/test/CodeGen/AMDGPU/llvm.amdgcn.rcp.legacy.ll Thu Feb 13 15:10:13 2020 +0900 @@ -0,0 +1,42 @@ +; RUN: llc -march=amdgcn -verify-machineinstrs < %s | FileCheck -check-prefix=GCN %s +; RUN: not llc -march=amdgcn -mcpu=fiji -verify-machineinstrs < %s 2>&1 | FileCheck -check-prefix=ERROR %s + +; ERROR: error: <unknown>:0:0: in function rcp_legacy_f32 void (float addrspace(1)*, float): intrinsic not supported on subtarget + +declare float @llvm.amdgcn.rcp.legacy(float) #0 + +; GCN-LABEL: {{^}}rcp_legacy_f32: +; GCN: v_rcp_legacy_f32_e32 {{v[0-9]+}}, {{s[0-9]+}} +define amdgpu_kernel void @rcp_legacy_f32(float addrspace(1)* %out, float %src) #1 { + %rcp = call float @llvm.amdgcn.rcp.legacy(float %src) #0 + store float %rcp, float addrspace(1)* %out, align 4 + ret void +} + +; TODO: Really these should be constant folded +; GCN-LABEL: {{^}}rcp_legacy_f32_constant_4.0 +; GCN: v_rcp_legacy_f32_e32 {{v[0-9]+}}, 4.0 +define amdgpu_kernel void @rcp_legacy_f32_constant_4.0(float addrspace(1)* %out) #1 { + %rcp = call float @llvm.amdgcn.rcp.legacy(float 4.0) #0 + store float %rcp, float addrspace(1)* %out, align 4 + ret void +} + +; GCN-LABEL: {{^}}rcp_legacy_f32_constant_100.0 +; GCN: v_rcp_legacy_f32_e32 {{v[0-9]+}}, 0x42c80000 +define amdgpu_kernel void @rcp_legacy_f32_constant_100.0(float addrspace(1)* %out) #1 { + %rcp = call float @llvm.amdgcn.rcp.legacy(float 100.0) #0 + store float %rcp, float addrspace(1)* %out, align 4 + ret void +} + +; GCN-LABEL: {{^}}rcp_legacy_undef_f32: +; GCN-NOT: v_rcp_legacy_f32 +define amdgpu_kernel void @rcp_legacy_undef_f32(float addrspace(1)* %out) #1 { + %rcp = call float @llvm.amdgcn.rcp.legacy(float undef) + store float %rcp, float addrspace(1)* %out, align 4 + ret void +} + +attributes #0 = { nounwind readnone } +attributes #1 = { nounwind }