Mercurial > hg > CbC > CbC_llvm
view llvm/test/CodeGen/AMDGPU/rcp_iflag.ll @ 223:5f17cb93ff66 llvm-original
LLVM13 (2021/7/18)
author | Shinji KONO <kono@ie.u-ryukyu.ac.jp> |
---|---|
date | Sun, 18 Jul 2021 22:43:00 +0900 |
parents | 0572611fdcc8 |
children | 1f2b6ac9f198 |
line wrap: on
line source
; RUN: llc -march=amdgcn -verify-machineinstrs < %s | FileCheck --check-prefix=GCN %s ; GCN-LABEL: {{^}}rcp_uint: ; GCN: v_rcp_iflag_f32_e32 define amdgpu_kernel void @rcp_uint(i32 addrspace(1)* %in, float addrspace(1)* %out) #0 { %load = load i32, i32 addrspace(1)* %in, align 4 %cvt = uitofp i32 %load to float %div = fdiv float 1.000000e+00, %cvt, !fpmath !0 store float %div, float addrspace(1)* %out, align 4 ret void } ; GCN-LABEL: {{^}}rcp_sint: ; GCN: v_rcp_iflag_f32_e32 define amdgpu_kernel void @rcp_sint(i32 addrspace(1)* %in, float addrspace(1)* %out) #0 { %load = load i32, i32 addrspace(1)* %in, align 4 %cvt = sitofp i32 %load to float %div = fdiv float 1.000000e+00, %cvt, !fpmath !0 store float %div, float addrspace(1)* %out, align 4 ret void } ; GCN-LABEL: {{^}}rcp_uint_denorm: ; GCN-NOT: v_rcp_iflag_f32 define amdgpu_kernel void @rcp_uint_denorm(i32 addrspace(1)* %in, float addrspace(1)* %out) #1 { %load = load i32, i32 addrspace(1)* %in, align 4 %cvt = uitofp i32 %load to float %div = fdiv float 1.000000e+00, %cvt store float %div, float addrspace(1)* %out, align 4 ret void } ; GCN-LABEL: {{^}}rcp_sint_denorm: ; GCN-NOT: v_rcp_iflag_f32 define amdgpu_kernel void @rcp_sint_denorm(i32 addrspace(1)* %in, float addrspace(1)* %out) #1 { %load = load i32, i32 addrspace(1)* %in, align 4 %cvt = sitofp i32 %load to float %div = fdiv float 1.000000e+00, %cvt store float %div, float addrspace(1)* %out, align 4 ret void } !0 = !{float 2.500000e+00} attributes #0 = { "denormal-fp-math-f32"="preserve-sign,preserve-sign" } attributes #1 = { "denormal-fp-math-f32"="ieee,ieee" }