Mercurial > hg > CbC > CbC_llvm
comparison test/CodeGen/AMDGPU/fpext.f16.ll @ 134:3a76565eade5 LLVM5.0.1
update 5.0.1
author | mir3636 |
---|---|
date | Sat, 17 Feb 2018 09:57:20 +0900 |
parents | 803732b1fca8 |
children | c2174574ed3a |
comparison
equal
deleted
inserted
replaced
133:c60214abe0e8 | 134:3a76565eade5 |
---|---|
1 ; RUN: llc -amdgpu-scalarize-global-loads=false -march=amdgcn -mcpu=tahiti -verify-machineinstrs -enable-unsafe-fp-math < %s | FileCheck -check-prefix=GCN -check-prefix=SI -check-prefix=SIVI %s | 1 ; RUN: llc -amdgpu-scalarize-global-loads=false -march=amdgcn -mcpu=tahiti -verify-machineinstrs -enable-unsafe-fp-math < %s | FileCheck -enable-var-scope -check-prefix=GCN -check-prefix=SI -check-prefix=SIVI %s |
2 ; RUN: llc -amdgpu-scalarize-global-loads=false -march=amdgcn -mcpu=fiji -mattr=-flat-for-global -verify-machineinstrs -enable-unsafe-fp-math < %s | FileCheck -check-prefix=GCN -check-prefix=VI -check-prefix=GFX89 %s | 2 ; RUN: llc -amdgpu-scalarize-global-loads=false -march=amdgcn -mcpu=fiji -mattr=-flat-for-global -verify-machineinstrs -enable-unsafe-fp-math < %s | FileCheck -enable-var-scope -check-prefix=GCN -check-prefix=VI -check-prefix=GFX89 %s |
3 ; RUN: llc -amdgpu-scalarize-global-loads=false -march=amdgcn -mcpu=gfx901 -mattr=-flat-for-global -verify-machineinstrs -enable-unsafe-fp-math < %s | FileCheck -check-prefix=GCN -check-prefix=GFX9 -check-prefix=GFX89 %s | 3 ; RUN: llc -amdgpu-scalarize-global-loads=false -march=amdgcn -mcpu=gfx900 -mattr=-flat-for-global -verify-machineinstrs -enable-unsafe-fp-math < %s | FileCheck -enable-var-scope -check-prefix=GCN -check-prefix=GFX9 -check-prefix=GFX89 %s |
4 | 4 |
5 ; GCN-LABEL: {{^}}fpext_f16_to_f32 | 5 ; GCN-LABEL: {{^}}fpext_f16_to_f32 |
6 ; GCN: buffer_load_ushort v[[A_F16:[0-9]+]] | 6 ; GCN: buffer_load_ushort v[[A_F16:[0-9]+]] |
7 ; GCN: v_cvt_f32_f16_e32 v[[R_F32:[0-9]+]], v[[A_F16]] | 7 ; GCN: v_cvt_f32_f16_e32 v[[R_F32:[0-9]+]], v[[A_F16]] |
8 ; GCN: buffer_store_dword v[[R_F32]] | 8 ; GCN: buffer_store_dword v[[R_F32]] |
178 ; GCN-LABEL: {{^}}fabs_multi_use_fpext_f16_to_f32: | 178 ; GCN-LABEL: {{^}}fabs_multi_use_fpext_f16_to_f32: |
179 ; GCN: {{buffer|flat}}_load_ushort [[A:v[0-9]+]] | 179 ; GCN: {{buffer|flat}}_load_ushort [[A:v[0-9]+]] |
180 ; GCN-DAG: v_and_b32_e32 [[XOR:v[0-9]+]], 0x7fff, [[A]] | 180 ; GCN-DAG: v_and_b32_e32 [[XOR:v[0-9]+]], 0x7fff, [[A]] |
181 | 181 |
182 ; SI-DAG: v_cvt_f32_f16_e32 [[CVT:v[0-9]+]], [[A]] | 182 ; SI-DAG: v_cvt_f32_f16_e32 [[CVT:v[0-9]+]], [[A]] |
183 ; VI-DAG: v_cvt_f32_f16_e64 [[CVT:v[0-9]+]], |[[A]]| | 183 ; GFX89-DAG: v_cvt_f32_f16_e64 [[CVT:v[0-9]+]], |[[A]]| |
184 | 184 |
185 ; GCN: store_dword [[CVT]] | 185 ; GCN: store_dword [[CVT]] |
186 ; GCN: store_short [[XOR]] | 186 ; GCN: store_short [[XOR]] |
187 define amdgpu_kernel void @fabs_multi_use_fpext_f16_to_f32( | 187 define amdgpu_kernel void @fabs_multi_use_fpext_f16_to_f32( |
188 float addrspace(1)* %r, | 188 float addrspace(1)* %r, |
224 ; GCN-LABEL: {{^}}fabs_fneg_multi_use_fpext_f16_to_f32: | 224 ; GCN-LABEL: {{^}}fabs_fneg_multi_use_fpext_f16_to_f32: |
225 ; GCN: {{buffer|flat}}_load_ushort [[A:v[0-9]+]] | 225 ; GCN: {{buffer|flat}}_load_ushort [[A:v[0-9]+]] |
226 ; GCN-DAG: v_or_b32_e32 [[OR:v[0-9]+]], 0x8000, [[A]] | 226 ; GCN-DAG: v_or_b32_e32 [[OR:v[0-9]+]], 0x8000, [[A]] |
227 | 227 |
228 ; SI: v_cvt_f32_f16_e32 [[CVT:v[0-9]+]], [[OR]] | 228 ; SI: v_cvt_f32_f16_e32 [[CVT:v[0-9]+]], [[OR]] |
229 ; VI-DAG: v_cvt_f32_f16_e64 [[CVT:v[0-9]+]], -|[[OR]]| | 229 ; GFX89-DAG: v_cvt_f32_f16_e64 [[CVT:v[0-9]+]], -|[[OR]]| |
230 | 230 |
231 ; GCN: buffer_store_dword [[CVT]] | 231 ; GCN: buffer_store_dword [[CVT]] |
232 ; GCN: buffer_store_short [[OR]] | 232 ; GCN: buffer_store_short [[OR]] |
233 define amdgpu_kernel void @fabs_fneg_multi_use_fpext_f16_to_f32( | 233 define amdgpu_kernel void @fabs_fneg_multi_use_fpext_f16_to_f32( |
234 float addrspace(1)* %r, | 234 float addrspace(1)* %r, |