comparison test/CodeGen/AMDGPU/fpext.f16.ll @ 134:3a76565eade5 LLVM5.0.1

update 5.0.1
author mir3636
date Sat, 17 Feb 2018 09:57:20 +0900
parents 803732b1fca8
children c2174574ed3a
comparison
Legend: equal | deleted | inserted | replaced
Left column: 133:c60214abe0e8 (before) | Right column: 134:3a76565eade5 (after)
1 ; RUN: llc -amdgpu-scalarize-global-loads=false -march=amdgcn -mcpu=tahiti -verify-machineinstrs -enable-unsafe-fp-math < %s | FileCheck -check-prefix=GCN -check-prefix=SI -check-prefix=SIVI %s 1 ; RUN: llc -amdgpu-scalarize-global-loads=false -march=amdgcn -mcpu=tahiti -verify-machineinstrs -enable-unsafe-fp-math < %s | FileCheck -enable-var-scope -check-prefix=GCN -check-prefix=SI -check-prefix=SIVI %s
2 ; RUN: llc -amdgpu-scalarize-global-loads=false -march=amdgcn -mcpu=fiji -mattr=-flat-for-global -verify-machineinstrs -enable-unsafe-fp-math < %s | FileCheck -check-prefix=GCN -check-prefix=VI -check-prefix=GFX89 %s 2 ; RUN: llc -amdgpu-scalarize-global-loads=false -march=amdgcn -mcpu=fiji -mattr=-flat-for-global -verify-machineinstrs -enable-unsafe-fp-math < %s | FileCheck -enable-var-scope -check-prefix=GCN -check-prefix=VI -check-prefix=GFX89 %s
3 ; RUN: llc -amdgpu-scalarize-global-loads=false -march=amdgcn -mcpu=gfx901 -mattr=-flat-for-global -verify-machineinstrs -enable-unsafe-fp-math < %s | FileCheck -check-prefix=GCN -check-prefix=GFX9 -check-prefix=GFX89 %s 3 ; RUN: llc -amdgpu-scalarize-global-loads=false -march=amdgcn -mcpu=gfx900 -mattr=-flat-for-global -verify-machineinstrs -enable-unsafe-fp-math < %s | FileCheck -enable-var-scope -check-prefix=GCN -check-prefix=GFX9 -check-prefix=GFX89 %s
4 4
5 ; GCN-LABEL: {{^}}fpext_f16_to_f32 5 ; GCN-LABEL: {{^}}fpext_f16_to_f32
6 ; GCN: buffer_load_ushort v[[A_F16:[0-9]+]] 6 ; GCN: buffer_load_ushort v[[A_F16:[0-9]+]]
7 ; GCN: v_cvt_f32_f16_e32 v[[R_F32:[0-9]+]], v[[A_F16]] 7 ; GCN: v_cvt_f32_f16_e32 v[[R_F32:[0-9]+]], v[[A_F16]]
8 ; GCN: buffer_store_dword v[[R_F32]] 8 ; GCN: buffer_store_dword v[[R_F32]]
178 ; GCN-LABEL: {{^}}fabs_multi_use_fpext_f16_to_f32: 178 ; GCN-LABEL: {{^}}fabs_multi_use_fpext_f16_to_f32:
179 ; GCN: {{buffer|flat}}_load_ushort [[A:v[0-9]+]] 179 ; GCN: {{buffer|flat}}_load_ushort [[A:v[0-9]+]]
180 ; GCN-DAG: v_and_b32_e32 [[XOR:v[0-9]+]], 0x7fff, [[A]] 180 ; GCN-DAG: v_and_b32_e32 [[XOR:v[0-9]+]], 0x7fff, [[A]]
181 181
182 ; SI-DAG: v_cvt_f32_f16_e32 [[CVT:v[0-9]+]], [[A]] 182 ; SI-DAG: v_cvt_f32_f16_e32 [[CVT:v[0-9]+]], [[A]]
183 ; VI-DAG: v_cvt_f32_f16_e64 [[CVT:v[0-9]+]], |[[A]]| 183 ; GFX89-DAG: v_cvt_f32_f16_e64 [[CVT:v[0-9]+]], |[[A]]|
184 184
185 ; GCN: store_dword [[CVT]] 185 ; GCN: store_dword [[CVT]]
186 ; GCN: store_short [[XOR]] 186 ; GCN: store_short [[XOR]]
187 define amdgpu_kernel void @fabs_multi_use_fpext_f16_to_f32( 187 define amdgpu_kernel void @fabs_multi_use_fpext_f16_to_f32(
188 float addrspace(1)* %r, 188 float addrspace(1)* %r,
224 ; GCN-LABEL: {{^}}fabs_fneg_multi_use_fpext_f16_to_f32: 224 ; GCN-LABEL: {{^}}fabs_fneg_multi_use_fpext_f16_to_f32:
225 ; GCN: {{buffer|flat}}_load_ushort [[A:v[0-9]+]] 225 ; GCN: {{buffer|flat}}_load_ushort [[A:v[0-9]+]]
226 ; GCN-DAG: v_or_b32_e32 [[OR:v[0-9]+]], 0x8000, [[A]] 226 ; GCN-DAG: v_or_b32_e32 [[OR:v[0-9]+]], 0x8000, [[A]]
227 227
228 ; SI: v_cvt_f32_f16_e32 [[CVT:v[0-9]+]], [[OR]] 228 ; SI: v_cvt_f32_f16_e32 [[CVT:v[0-9]+]], [[OR]]
229 ; VI-DAG: v_cvt_f32_f16_e64 [[CVT:v[0-9]+]], -|[[OR]]| 229 ; GFX89-DAG: v_cvt_f32_f16_e64 [[CVT:v[0-9]+]], -|[[OR]]|
230 230
231 ; GCN: buffer_store_dword [[CVT]] 231 ; GCN: buffer_store_dword [[CVT]]
232 ; GCN: buffer_store_short [[OR]] 232 ; GCN: buffer_store_short [[OR]]
233 define amdgpu_kernel void @fabs_fneg_multi_use_fpext_f16_to_f32( 233 define amdgpu_kernel void @fabs_fneg_multi_use_fpext_f16_to_f32(
234 float addrspace(1)* %r, 234 float addrspace(1)* %r,