annotate clang/test/CodeGenOpenCL/amdgpu-alignment.cl @ 236:c4bab56944e8 llvm-original

LLVM 16
author kono
date Wed, 09 Nov 2022 17:45:10 +0900
parents 1d019706d866
children 1f2b6ac9f198
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
150
anatofuz
parents:
diff changeset
1 // REQUIRES: amdgpu-registered-target
236
c4bab56944e8 LLVM 16
kono
parents: 150
diff changeset
2 // RUN: %clang_cc1 -no-opaque-pointers -triple amdgcn-unknown-unknown -S -disable-llvm-passes -emit-llvm -o - %s | FileCheck %s
c4bab56944e8 LLVM 16
kono
parents: 150
diff changeset
3 // RUN: %clang_cc1 -no-opaque-pointers -triple amdgcn-unknown-unknown-opencl -S -disable-llvm-passes -emit-llvm -o - %s | FileCheck %s
150
anatofuz
parents:
diff changeset
4
anatofuz
parents:
diff changeset
// Enable the cl_khr_fp64 and cl_khr_fp16 extensions; the double and half
// types are used by the typedefs and kernels that follow.
5 #pragma OPENCL EXTENSION cl_khr_fp64 : enable
anatofuz
parents:
diff changeset
6 #pragma OPENCL EXTENSION cl_khr_fp16 : enable
anatofuz
parents:
diff changeset
7
anatofuz
parents:
diff changeset
// Vector typedefs built with the ext_vector_type attribute: for every element
// type (char, short, int, long, half, float, double) a 2-, 3-, 4-, 8- and
// 16-element vector type is defined. The kernels below declare one object (or
// one pointer parameter) of each of these types.
8 typedef char __attribute__((ext_vector_type(2))) char2;
anatofuz
parents:
diff changeset
9 typedef char __attribute__((ext_vector_type(3))) char3;
anatofuz
parents:
diff changeset
10 typedef char __attribute__((ext_vector_type(4))) char4;
anatofuz
parents:
diff changeset
11 typedef char __attribute__((ext_vector_type(8))) char8;
anatofuz
parents:
diff changeset
12 typedef char __attribute__((ext_vector_type(16))) char16;
anatofuz
parents:
diff changeset
13
anatofuz
parents:
diff changeset
14 typedef short __attribute__((ext_vector_type(2))) short2;
anatofuz
parents:
diff changeset
15 typedef short __attribute__((ext_vector_type(3))) short3;
anatofuz
parents:
diff changeset
16 typedef short __attribute__((ext_vector_type(4))) short4;
anatofuz
parents:
diff changeset
17 typedef short __attribute__((ext_vector_type(8))) short8;
anatofuz
parents:
diff changeset
18 typedef short __attribute__((ext_vector_type(16))) short16;
anatofuz
parents:
diff changeset
19
anatofuz
parents:
diff changeset
20 typedef int __attribute__((ext_vector_type(2))) int2;
anatofuz
parents:
diff changeset
21 typedef int __attribute__((ext_vector_type(3))) int3;
anatofuz
parents:
diff changeset
22 typedef int __attribute__((ext_vector_type(4))) int4;
anatofuz
parents:
diff changeset
23 typedef int __attribute__((ext_vector_type(8))) int8;
anatofuz
parents:
diff changeset
24 typedef int __attribute__((ext_vector_type(16))) int16;
anatofuz
parents:
diff changeset
25
anatofuz
parents:
diff changeset
26 typedef long __attribute__((ext_vector_type(2))) long2;
anatofuz
parents:
diff changeset
27 typedef long __attribute__((ext_vector_type(3))) long3;
anatofuz
parents:
diff changeset
28 typedef long __attribute__((ext_vector_type(4))) long4;
anatofuz
parents:
diff changeset
29 typedef long __attribute__((ext_vector_type(8))) long8;
anatofuz
parents:
diff changeset
30 typedef long __attribute__((ext_vector_type(16))) long16;
anatofuz
parents:
diff changeset
31
anatofuz
parents:
diff changeset
32 typedef half __attribute__((ext_vector_type(2))) half2;
anatofuz
parents:
diff changeset
33 typedef half __attribute__((ext_vector_type(3))) half3;
anatofuz
parents:
diff changeset
34 typedef half __attribute__((ext_vector_type(4))) half4;
anatofuz
parents:
diff changeset
35 typedef half __attribute__((ext_vector_type(8))) half8;
anatofuz
parents:
diff changeset
36 typedef half __attribute__((ext_vector_type(16))) half16;
anatofuz
parents:
diff changeset
37
anatofuz
parents:
diff changeset
38 typedef float __attribute__((ext_vector_type(2))) float2;
anatofuz
parents:
diff changeset
39 typedef float __attribute__((ext_vector_type(3))) float3;
anatofuz
parents:
diff changeset
40 typedef float __attribute__((ext_vector_type(4))) float4;
anatofuz
parents:
diff changeset
41 typedef float __attribute__((ext_vector_type(8))) float8;
anatofuz
parents:
diff changeset
42 typedef float __attribute__((ext_vector_type(16))) float16;
anatofuz
parents:
diff changeset
43
anatofuz
parents:
diff changeset
44 typedef double __attribute__((ext_vector_type(2))) double2;
anatofuz
parents:
diff changeset
45 typedef double __attribute__((ext_vector_type(3))) double3;
anatofuz
parents:
diff changeset
46 typedef double __attribute__((ext_vector_type(4))) double4;
anatofuz
parents:
diff changeset
47 typedef double __attribute__((ext_vector_type(8))) double8;
anatofuz
parents:
diff changeset
48 typedef double __attribute__((ext_vector_type(16))) double16;
anatofuz
parents:
diff changeset
49
anatofuz
parents:
diff changeset
50 // CHECK: @local_memory_alignment_global.lds_i8 = internal addrspace(3) global [4 x i8] undef, align 1
anatofuz
parents:
diff changeset
51 // CHECK: @local_memory_alignment_global.lds_v2i8 = internal addrspace(3) global [4 x <2 x i8>] undef, align 2
anatofuz
parents:
diff changeset
52 // CHECK: @local_memory_alignment_global.lds_v3i8 = internal addrspace(3) global [4 x <3 x i8>] undef, align 4
anatofuz
parents:
diff changeset
53 // CHECK: @local_memory_alignment_global.lds_v4i8 = internal addrspace(3) global [4 x <4 x i8>] undef, align 4
anatofuz
parents:
diff changeset
54 // CHECK: @local_memory_alignment_global.lds_v8i8 = internal addrspace(3) global [4 x <8 x i8>] undef, align 8
anatofuz
parents:
diff changeset
55 // CHECK: @local_memory_alignment_global.lds_v16i8 = internal addrspace(3) global [4 x <16 x i8>] undef, align 16
anatofuz
parents:
diff changeset
56 // CHECK: @local_memory_alignment_global.lds_i16 = internal addrspace(3) global [4 x i16] undef, align 2
anatofuz
parents:
diff changeset
57 // CHECK: @local_memory_alignment_global.lds_v2i16 = internal addrspace(3) global [4 x <2 x i16>] undef, align 4
anatofuz
parents:
diff changeset
58 // CHECK: @local_memory_alignment_global.lds_v3i16 = internal addrspace(3) global [4 x <3 x i16>] undef, align 8
anatofuz
parents:
diff changeset
59 // CHECK: @local_memory_alignment_global.lds_v4i16 = internal addrspace(3) global [4 x <4 x i16>] undef, align 8
anatofuz
parents:
diff changeset
60 // CHECK: @local_memory_alignment_global.lds_v8i16 = internal addrspace(3) global [4 x <8 x i16>] undef, align 16
anatofuz
parents:
diff changeset
61 // CHECK: @local_memory_alignment_global.lds_v16i16 = internal addrspace(3) global [4 x <16 x i16>] undef, align 32
anatofuz
parents:
diff changeset
62 // CHECK: @local_memory_alignment_global.lds_i32 = internal addrspace(3) global [4 x i32] undef, align 4
anatofuz
parents:
diff changeset
63 // CHECK: @local_memory_alignment_global.lds_v2i32 = internal addrspace(3) global [4 x <2 x i32>] undef, align 8
anatofuz
parents:
diff changeset
64 // CHECK: @local_memory_alignment_global.lds_v3i32 = internal addrspace(3) global [4 x <3 x i32>] undef, align 16
anatofuz
parents:
diff changeset
65 // CHECK: @local_memory_alignment_global.lds_v4i32 = internal addrspace(3) global [4 x <4 x i32>] undef, align 16
anatofuz
parents:
diff changeset
66 // CHECK: @local_memory_alignment_global.lds_v8i32 = internal addrspace(3) global [4 x <8 x i32>] undef, align 32
anatofuz
parents:
diff changeset
67 // CHECK: @local_memory_alignment_global.lds_v16i32 = internal addrspace(3) global [4 x <16 x i32>] undef, align 64
anatofuz
parents:
diff changeset
68 // CHECK: @local_memory_alignment_global.lds_i64 = internal addrspace(3) global [4 x i64] undef, align 8
anatofuz
parents:
diff changeset
69 // CHECK: @local_memory_alignment_global.lds_v2i64 = internal addrspace(3) global [4 x <2 x i64>] undef, align 16
anatofuz
parents:
diff changeset
70 // CHECK: @local_memory_alignment_global.lds_v3i64 = internal addrspace(3) global [4 x <3 x i64>] undef, align 32
anatofuz
parents:
diff changeset
71 // CHECK: @local_memory_alignment_global.lds_v4i64 = internal addrspace(3) global [4 x <4 x i64>] undef, align 32
anatofuz
parents:
diff changeset
72 // CHECK: @local_memory_alignment_global.lds_v8i64 = internal addrspace(3) global [4 x <8 x i64>] undef, align 64
anatofuz
parents:
diff changeset
73 // CHECK: @local_memory_alignment_global.lds_v16i64 = internal addrspace(3) global [4 x <16 x i64>] undef, align 128
anatofuz
parents:
diff changeset
74 // CHECK: @local_memory_alignment_global.lds_f16 = internal addrspace(3) global [4 x half] undef, align 2
anatofuz
parents:
diff changeset
75 // CHECK: @local_memory_alignment_global.lds_v2f16 = internal addrspace(3) global [4 x <2 x half>] undef, align 4
anatofuz
parents:
diff changeset
76 // CHECK: @local_memory_alignment_global.lds_v3f16 = internal addrspace(3) global [4 x <3 x half>] undef, align 8
anatofuz
parents:
diff changeset
77 // CHECK: @local_memory_alignment_global.lds_v4f16 = internal addrspace(3) global [4 x <4 x half>] undef, align 8
anatofuz
parents:
diff changeset
78 // CHECK: @local_memory_alignment_global.lds_v8f16 = internal addrspace(3) global [4 x <8 x half>] undef, align 16
anatofuz
parents:
diff changeset
79 // CHECK: @local_memory_alignment_global.lds_v16f16 = internal addrspace(3) global [4 x <16 x half>] undef, align 32
anatofuz
parents:
diff changeset
80 // CHECK: @local_memory_alignment_global.lds_f32 = internal addrspace(3) global [4 x float] undef, align 4
anatofuz
parents:
diff changeset
81 // CHECK: @local_memory_alignment_global.lds_v2f32 = internal addrspace(3) global [4 x <2 x float>] undef, align 8
anatofuz
parents:
diff changeset
82 // CHECK: @local_memory_alignment_global.lds_v3f32 = internal addrspace(3) global [4 x <3 x float>] undef, align 16
anatofuz
parents:
diff changeset
83 // CHECK: @local_memory_alignment_global.lds_v4f32 = internal addrspace(3) global [4 x <4 x float>] undef, align 16
anatofuz
parents:
diff changeset
84 // CHECK: @local_memory_alignment_global.lds_v8f32 = internal addrspace(3) global [4 x <8 x float>] undef, align 32
anatofuz
parents:
diff changeset
85 // CHECK: @local_memory_alignment_global.lds_v16f32 = internal addrspace(3) global [4 x <16 x float>] undef, align 64
anatofuz
parents:
diff changeset
86 // CHECK: @local_memory_alignment_global.lds_f64 = internal addrspace(3) global [4 x double] undef, align 8
anatofuz
parents:
diff changeset
87 // CHECK: @local_memory_alignment_global.lds_v2f64 = internal addrspace(3) global [4 x <2 x double>] undef, align 16
anatofuz
parents:
diff changeset
88 // CHECK: @local_memory_alignment_global.lds_v3f64 = internal addrspace(3) global [4 x <3 x double>] undef, align 32
anatofuz
parents:
diff changeset
89 // CHECK: @local_memory_alignment_global.lds_v4f64 = internal addrspace(3) global [4 x <4 x double>] undef, align 32
anatofuz
parents:
diff changeset
90 // CHECK: @local_memory_alignment_global.lds_v8f64 = internal addrspace(3) global [4 x <8 x double>] undef, align 64
anatofuz
parents:
diff changeset
91 // CHECK: @local_memory_alignment_global.lds_v16f64 = internal addrspace(3) global [4 x <16 x double>] undef, align 128
anatofuz
parents:
diff changeset
92
anatofuz
parents:
diff changeset
93
anatofuz
parents:
diff changeset
94 // CHECK-LABEL: @local_memory_alignment_global(
anatofuz
parents:
diff changeset
95 // CHECK: store volatile i8 0, i8 addrspace(3)* getelementptr inbounds ([4 x i8], [4 x i8] addrspace(3)* @local_memory_alignment_global.lds_i8, i64 0, i64 0), align 1
anatofuz
parents:
diff changeset
96 // CHECK: store volatile <2 x i8> zeroinitializer, <2 x i8> addrspace(3)* getelementptr inbounds ([4 x <2 x i8>], [4 x <2 x i8>] addrspace(3)* @local_memory_alignment_global.lds_v2i8, i64 0, i64 0), align 2
anatofuz
parents:
diff changeset
97 // CHECK: store volatile <4 x i8> <i8 0, i8 0, i8 0, i8 undef>, <4 x i8> addrspace(3)* bitcast ([4 x <3 x i8>] addrspace(3)* @local_memory_alignment_global.lds_v3i8 to <4 x i8> addrspace(3)*), align 4
anatofuz
parents:
diff changeset
98 // CHECK: store volatile <4 x i8> zeroinitializer, <4 x i8> addrspace(3)* getelementptr inbounds ([4 x <4 x i8>], [4 x <4 x i8>] addrspace(3)* @local_memory_alignment_global.lds_v4i8, i64 0, i64 0), align 4
anatofuz
parents:
diff changeset
99 // CHECK: store volatile <8 x i8> zeroinitializer, <8 x i8> addrspace(3)* getelementptr inbounds ([4 x <8 x i8>], [4 x <8 x i8>] addrspace(3)* @local_memory_alignment_global.lds_v8i8, i64 0, i64 0), align 8
anatofuz
parents:
diff changeset
100 // CHECK: store volatile <16 x i8> zeroinitializer, <16 x i8> addrspace(3)* getelementptr inbounds ([4 x <16 x i8>], [4 x <16 x i8>] addrspace(3)* @local_memory_alignment_global.lds_v16i8, i64 0, i64 0), align 16
anatofuz
parents:
diff changeset
101 // CHECK: store volatile i16 0, i16 addrspace(3)* getelementptr inbounds ([4 x i16], [4 x i16] addrspace(3)* @local_memory_alignment_global.lds_i16, i64 0, i64 0), align 2
anatofuz
parents:
diff changeset
102 // CHECK: store volatile <2 x i16> zeroinitializer, <2 x i16> addrspace(3)* getelementptr inbounds ([4 x <2 x i16>], [4 x <2 x i16>] addrspace(3)* @local_memory_alignment_global.lds_v2i16, i64 0, i64 0), align 4
anatofuz
parents:
diff changeset
103 // CHECK: store volatile <4 x i16> <i16 0, i16 0, i16 0, i16 undef>, <4 x i16> addrspace(3)* bitcast ([4 x <3 x i16>] addrspace(3)* @local_memory_alignment_global.lds_v3i16 to <4 x i16> addrspace(3)*), align 8
anatofuz
parents:
diff changeset
104 // CHECK: store volatile <4 x i16> zeroinitializer, <4 x i16> addrspace(3)* getelementptr inbounds ([4 x <4 x i16>], [4 x <4 x i16>] addrspace(3)* @local_memory_alignment_global.lds_v4i16, i64 0, i64 0), align 8
anatofuz
parents:
diff changeset
105 // CHECK: store volatile <8 x i16> zeroinitializer, <8 x i16> addrspace(3)* getelementptr inbounds ([4 x <8 x i16>], [4 x <8 x i16>] addrspace(3)* @local_memory_alignment_global.lds_v8i16, i64 0, i64 0), align 16
anatofuz
parents:
diff changeset
106 // CHECK: store volatile <16 x i16> zeroinitializer, <16 x i16> addrspace(3)* getelementptr inbounds ([4 x <16 x i16>], [4 x <16 x i16>] addrspace(3)* @local_memory_alignment_global.lds_v16i16, i64 0, i64 0), align 32
anatofuz
parents:
diff changeset
107 // CHECK: store volatile i32 0, i32 addrspace(3)* getelementptr inbounds ([4 x i32], [4 x i32] addrspace(3)* @local_memory_alignment_global.lds_i32, i64 0, i64 0), align 4
anatofuz
parents:
diff changeset
108 // CHECK: store volatile <2 x i32> zeroinitializer, <2 x i32> addrspace(3)* getelementptr inbounds ([4 x <2 x i32>], [4 x <2 x i32>] addrspace(3)* @local_memory_alignment_global.lds_v2i32, i64 0, i64 0), align 8
anatofuz
parents:
diff changeset
109 // CHECK: store volatile <4 x i32> <i32 0, i32 0, i32 0, i32 undef>, <4 x i32> addrspace(3)* bitcast ([4 x <3 x i32>] addrspace(3)* @local_memory_alignment_global.lds_v3i32 to <4 x i32> addrspace(3)*), align 16
anatofuz
parents:
diff changeset
110 // CHECK: store volatile <4 x i32> zeroinitializer, <4 x i32> addrspace(3)* getelementptr inbounds ([4 x <4 x i32>], [4 x <4 x i32>] addrspace(3)* @local_memory_alignment_global.lds_v4i32, i64 0, i64 0), align 16
anatofuz
parents:
diff changeset
111 // CHECK: store volatile <8 x i32> zeroinitializer, <8 x i32> addrspace(3)* getelementptr inbounds ([4 x <8 x i32>], [4 x <8 x i32>] addrspace(3)* @local_memory_alignment_global.lds_v8i32, i64 0, i64 0), align 32
anatofuz
parents:
diff changeset
112 // CHECK: store volatile <16 x i32> zeroinitializer, <16 x i32> addrspace(3)* getelementptr inbounds ([4 x <16 x i32>], [4 x <16 x i32>] addrspace(3)* @local_memory_alignment_global.lds_v16i32, i64 0, i64 0), align 64
anatofuz
parents:
diff changeset
113 // CHECK: store volatile i64 0, i64 addrspace(3)* getelementptr inbounds ([4 x i64], [4 x i64] addrspace(3)* @local_memory_alignment_global.lds_i64, i64 0, i64 0), align 8
anatofuz
parents:
diff changeset
114 // CHECK: store volatile <2 x i64> zeroinitializer, <2 x i64> addrspace(3)* getelementptr inbounds ([4 x <2 x i64>], [4 x <2 x i64>] addrspace(3)* @local_memory_alignment_global.lds_v2i64, i64 0, i64 0), align 16
anatofuz
parents:
diff changeset
115 // CHECK: store volatile <4 x i64> <i64 0, i64 0, i64 0, i64 undef>, <4 x i64> addrspace(3)* bitcast ([4 x <3 x i64>] addrspace(3)* @local_memory_alignment_global.lds_v3i64 to <4 x i64> addrspace(3)*), align 32
anatofuz
parents:
diff changeset
116 // CHECK: store volatile <4 x i64> zeroinitializer, <4 x i64> addrspace(3)* getelementptr inbounds ([4 x <4 x i64>], [4 x <4 x i64>] addrspace(3)* @local_memory_alignment_global.lds_v4i64, i64 0, i64 0), align 32
anatofuz
parents:
diff changeset
117 // CHECK: store volatile <8 x i64> zeroinitializer, <8 x i64> addrspace(3)* getelementptr inbounds ([4 x <8 x i64>], [4 x <8 x i64>] addrspace(3)* @local_memory_alignment_global.lds_v8i64, i64 0, i64 0), align 64
anatofuz
parents:
diff changeset
118 // CHECK: store volatile <16 x i64> zeroinitializer, <16 x i64> addrspace(3)* getelementptr inbounds ([4 x <16 x i64>], [4 x <16 x i64>] addrspace(3)* @local_memory_alignment_global.lds_v16i64, i64 0, i64 0), align 128
anatofuz
parents:
diff changeset
119 // CHECK: store volatile half 0xH0000, half addrspace(3)* getelementptr inbounds ([4 x half], [4 x half] addrspace(3)* @local_memory_alignment_global.lds_f16, i64 0, i64 0), align 2
anatofuz
parents:
diff changeset
120 // CHECK: store volatile <2 x half> zeroinitializer, <2 x half> addrspace(3)* getelementptr inbounds ([4 x <2 x half>], [4 x <2 x half>] addrspace(3)* @local_memory_alignment_global.lds_v2f16, i64 0, i64 0), align 4
anatofuz
parents:
diff changeset
121 // CHECK: store volatile <4 x half> <half 0xH0000, half 0xH0000, half 0xH0000, half undef>, <4 x half> addrspace(3)* bitcast ([4 x <3 x half>] addrspace(3)* @local_memory_alignment_global.lds_v3f16 to <4 x half> addrspace(3)*), align 8
anatofuz
parents:
diff changeset
122 // CHECK: store volatile <4 x half> zeroinitializer, <4 x half> addrspace(3)* getelementptr inbounds ([4 x <4 x half>], [4 x <4 x half>] addrspace(3)* @local_memory_alignment_global.lds_v4f16, i64 0, i64 0), align 8
anatofuz
parents:
diff changeset
123 // CHECK: store volatile <8 x half> zeroinitializer, <8 x half> addrspace(3)* getelementptr inbounds ([4 x <8 x half>], [4 x <8 x half>] addrspace(3)* @local_memory_alignment_global.lds_v8f16, i64 0, i64 0), align 16
anatofuz
parents:
diff changeset
124 // CHECK: store volatile <16 x half> zeroinitializer, <16 x half> addrspace(3)* getelementptr inbounds ([4 x <16 x half>], [4 x <16 x half>] addrspace(3)* @local_memory_alignment_global.lds_v16f16, i64 0, i64 0), align 32
anatofuz
parents:
diff changeset
125 // CHECK: store volatile float 0.000000e+00, float addrspace(3)* getelementptr inbounds ([4 x float], [4 x float] addrspace(3)* @local_memory_alignment_global.lds_f32, i64 0, i64 0), align 4
anatofuz
parents:
diff changeset
126 // CHECK: store volatile <2 x float> zeroinitializer, <2 x float> addrspace(3)* getelementptr inbounds ([4 x <2 x float>], [4 x <2 x float>] addrspace(3)* @local_memory_alignment_global.lds_v2f32, i64 0, i64 0), align 8
anatofuz
parents:
diff changeset
127 // CHECK: store volatile <4 x float> <float 0.000000e+00, float 0.000000e+00, float 0.000000e+00, float undef>, <4 x float> addrspace(3)* bitcast ([4 x <3 x float>] addrspace(3)* @local_memory_alignment_global.lds_v3f32 to <4 x float> addrspace(3)*), align 16
anatofuz
parents:
diff changeset
128 // CHECK: store volatile <4 x float> zeroinitializer, <4 x float> addrspace(3)* getelementptr inbounds ([4 x <4 x float>], [4 x <4 x float>] addrspace(3)* @local_memory_alignment_global.lds_v4f32, i64 0, i64 0), align 16
anatofuz
parents:
diff changeset
129 // CHECK: store volatile <8 x float> zeroinitializer, <8 x float> addrspace(3)* getelementptr inbounds ([4 x <8 x float>], [4 x <8 x float>] addrspace(3)* @local_memory_alignment_global.lds_v8f32, i64 0, i64 0), align 32
anatofuz
parents:
diff changeset
130 // CHECK: store volatile <16 x float> zeroinitializer, <16 x float> addrspace(3)* getelementptr inbounds ([4 x <16 x float>], [4 x <16 x float>] addrspace(3)* @local_memory_alignment_global.lds_v16f32, i64 0, i64 0), align 64
anatofuz
parents:
diff changeset
131 // CHECK: store volatile double 0.000000e+00, double addrspace(3)* getelementptr inbounds ([4 x double], [4 x double] addrspace(3)* @local_memory_alignment_global.lds_f64, i64 0, i64 0), align 8
anatofuz
parents:
diff changeset
132 // CHECK: store volatile <2 x double> zeroinitializer, <2 x double> addrspace(3)* getelementptr inbounds ([4 x <2 x double>], [4 x <2 x double>] addrspace(3)* @local_memory_alignment_global.lds_v2f64, i64 0, i64 0), align 16
anatofuz
parents:
diff changeset
133 // CHECK: store volatile <4 x double> <double 0.000000e+00, double 0.000000e+00, double 0.000000e+00, double undef>, <4 x double> addrspace(3)* bitcast ([4 x <3 x double>] addrspace(3)* @local_memory_alignment_global.lds_v3f64 to <4 x double> addrspace(3)*), align 32
anatofuz
parents:
diff changeset
134 // CHECK: store volatile <4 x double> zeroinitializer, <4 x double> addrspace(3)* getelementptr inbounds ([4 x <4 x double>], [4 x <4 x double>] addrspace(3)* @local_memory_alignment_global.lds_v4f64, i64 0, i64 0), align 32
anatofuz
parents:
diff changeset
135 // CHECK: store volatile <8 x double> zeroinitializer, <8 x double> addrspace(3)* getelementptr inbounds ([4 x <8 x double>], [4 x <8 x double>] addrspace(3)* @local_memory_alignment_global.lds_v8f64, i64 0, i64 0), align 64
anatofuz
parents:
diff changeset
136 // CHECK: store volatile <16 x double> zeroinitializer, <16 x double> addrspace(3)* getelementptr inbounds ([4 x <16 x double>], [4 x <16 x double>] addrspace(3)* @local_memory_alignment_global.lds_v16f64, i64 0, i64 0), align 128
anatofuz
parents:
diff changeset
// Kernel that declares one 4-element `volatile local` array for every scalar
// and vector type defined above, then stores 0 through each array name (that
// is, to element 0 of each array).
//
// The FileCheck directives that precede this kernel list the expected
// addrspace(3) globals and the expected volatile stores, with their
// alignments, in the same order as the declarations and assignments below and
// using the same variable names. Keep the names and the statement order in
// step with those directives when editing.
137 kernel void local_memory_alignment_global()
anatofuz
parents:
diff changeset
138 {
anatofuz
parents:
diff changeset
// One array per type. The variable names spell the element type the
// directives expect in the IR (for example lds_v3i8 is an array of char3,
// matched as <3 x i8>).
139 volatile local char lds_i8[4];
anatofuz
parents:
diff changeset
140 volatile local char2 lds_v2i8[4];
anatofuz
parents:
diff changeset
141 volatile local char3 lds_v3i8[4];
anatofuz
parents:
diff changeset
142 volatile local char4 lds_v4i8[4];
anatofuz
parents:
diff changeset
143 volatile local char8 lds_v8i8[4];
anatofuz
parents:
diff changeset
144 volatile local char16 lds_v16i8[4];
anatofuz
parents:
diff changeset
145
anatofuz
parents:
diff changeset
146 volatile local short lds_i16[4];
anatofuz
parents:
diff changeset
147 volatile local short2 lds_v2i16[4];
anatofuz
parents:
diff changeset
148 volatile local short3 lds_v3i16[4];
anatofuz
parents:
diff changeset
149 volatile local short4 lds_v4i16[4];
anatofuz
parents:
diff changeset
150 volatile local short8 lds_v8i16[4];
anatofuz
parents:
diff changeset
151 volatile local short16 lds_v16i16[4];
anatofuz
parents:
diff changeset
152
anatofuz
parents:
diff changeset
153 volatile local int lds_i32[4];
anatofuz
parents:
diff changeset
154 volatile local int2 lds_v2i32[4];
anatofuz
parents:
diff changeset
155 volatile local int3 lds_v3i32[4];
anatofuz
parents:
diff changeset
156 volatile local int4 lds_v4i32[4];
anatofuz
parents:
diff changeset
157 volatile local int8 lds_v8i32[4];
anatofuz
parents:
diff changeset
158 volatile local int16 lds_v16i32[4];
anatofuz
parents:
diff changeset
159
anatofuz
parents:
diff changeset
160 volatile local long lds_i64[4];
anatofuz
parents:
diff changeset
161 volatile local long2 lds_v2i64[4];
anatofuz
parents:
diff changeset
162 volatile local long3 lds_v3i64[4];
anatofuz
parents:
diff changeset
163 volatile local long4 lds_v4i64[4];
anatofuz
parents:
diff changeset
164 volatile local long8 lds_v8i64[4];
anatofuz
parents:
diff changeset
165 volatile local long16 lds_v16i64[4];
anatofuz
parents:
diff changeset
166
anatofuz
parents:
diff changeset
167 volatile local half lds_f16[4];
anatofuz
parents:
diff changeset
168 volatile local half2 lds_v2f16[4];
anatofuz
parents:
diff changeset
169 volatile local half3 lds_v3f16[4];
anatofuz
parents:
diff changeset
170 volatile local half4 lds_v4f16[4];
anatofuz
parents:
diff changeset
171 volatile local half8 lds_v8f16[4];
anatofuz
parents:
diff changeset
172 volatile local half16 lds_v16f16[4];
anatofuz
parents:
diff changeset
173
anatofuz
parents:
diff changeset
174 volatile local float lds_f32[4];
anatofuz
parents:
diff changeset
175 volatile local float2 lds_v2f32[4];
anatofuz
parents:
diff changeset
176 volatile local float3 lds_v3f32[4];
anatofuz
parents:
diff changeset
177 volatile local float4 lds_v4f32[4];
anatofuz
parents:
diff changeset
178 volatile local float8 lds_v8f32[4];
anatofuz
parents:
diff changeset
179 volatile local float16 lds_v16f32[4];
anatofuz
parents:
diff changeset
180
anatofuz
parents:
diff changeset
181 volatile local double lds_f64[4];
anatofuz
parents:
diff changeset
182 volatile local double2 lds_v2f64[4];
anatofuz
parents:
diff changeset
183 volatile local double3 lds_v3f64[4];
anatofuz
parents:
diff changeset
184 volatile local double4 lds_v4f64[4];
anatofuz
parents:
diff changeset
185 volatile local double8 lds_v8f64[4];
anatofuz
parents:
diff changeset
186 volatile local double16 lds_v16f64[4];
anatofuz
parents:
diff changeset
187
anatofuz
parents:
diff changeset
// Store 0 to the first element of every array, in declaration order. Per the
// expected output above, the 3-element vector stores are matched as
// 4-element vector stores whose last lane is undef.
188 *lds_i8 = 0;
anatofuz
parents:
diff changeset
189 *lds_v2i8 = 0;
anatofuz
parents:
diff changeset
190 *lds_v3i8 = 0;
anatofuz
parents:
diff changeset
191 *lds_v4i8 = 0;
anatofuz
parents:
diff changeset
192 *lds_v8i8 = 0;
anatofuz
parents:
diff changeset
193 *lds_v16i8 = 0;
anatofuz
parents:
diff changeset
194
anatofuz
parents:
diff changeset
195 *lds_i16 = 0;
anatofuz
parents:
diff changeset
196 *lds_v2i16 = 0;
anatofuz
parents:
diff changeset
197 *lds_v3i16 = 0;
anatofuz
parents:
diff changeset
198 *lds_v4i16 = 0;
anatofuz
parents:
diff changeset
199 *lds_v8i16 = 0;
anatofuz
parents:
diff changeset
200 *lds_v16i16 = 0;
anatofuz
parents:
diff changeset
201
anatofuz
parents:
diff changeset
202 *lds_i32 = 0;
anatofuz
parents:
diff changeset
203 *lds_v2i32 = 0;
anatofuz
parents:
diff changeset
204 *lds_v3i32 = 0;
anatofuz
parents:
diff changeset
205 *lds_v4i32 = 0;
anatofuz
parents:
diff changeset
206 *lds_v8i32 = 0;
anatofuz
parents:
diff changeset
207 *lds_v16i32 = 0;
anatofuz
parents:
diff changeset
208
anatofuz
parents:
diff changeset
209 *lds_i64 = 0;
anatofuz
parents:
diff changeset
210 *lds_v2i64 = 0;
anatofuz
parents:
diff changeset
211 *lds_v3i64 = 0;
anatofuz
parents:
diff changeset
212 *lds_v4i64 = 0;
anatofuz
parents:
diff changeset
213 *lds_v8i64 = 0;
anatofuz
parents:
diff changeset
214 *lds_v16i64 = 0;
anatofuz
parents:
diff changeset
215
anatofuz
parents:
diff changeset
216 *lds_f16 = 0;
anatofuz
parents:
diff changeset
217 *lds_v2f16 = 0;
anatofuz
parents:
diff changeset
218 *lds_v3f16 = 0;
anatofuz
parents:
diff changeset
219 *lds_v4f16 = 0;
anatofuz
parents:
diff changeset
220 *lds_v8f16 = 0;
anatofuz
parents:
diff changeset
221 *lds_v16f16 = 0;
anatofuz
parents:
diff changeset
222
anatofuz
parents:
diff changeset
223 *lds_f32 = 0;
anatofuz
parents:
diff changeset
224 *lds_v2f32 = 0;
anatofuz
parents:
diff changeset
225 *lds_v3f32 = 0;
anatofuz
parents:
diff changeset
226 *lds_v4f32 = 0;
anatofuz
parents:
diff changeset
227 *lds_v8f32 = 0;
anatofuz
parents:
diff changeset
228 *lds_v16f32 = 0;
anatofuz
parents:
diff changeset
229
anatofuz
parents:
diff changeset
230 *lds_f64 = 0;
anatofuz
parents:
diff changeset
231 *lds_v2f64 = 0;
anatofuz
parents:
diff changeset
232 *lds_v3f64 = 0;
anatofuz
parents:
diff changeset
233 *lds_v4f64 = 0;
anatofuz
parents:
diff changeset
234 *lds_v8f64 = 0;
anatofuz
parents:
diff changeset
235 *lds_v16f64 = 0;
anatofuz
parents:
diff changeset
236 }
anatofuz
parents:
diff changeset
237
anatofuz
parents:
diff changeset
// Kernel that takes one `volatile local` pointer parameter for every scalar
// and vector type defined above and stores 0 through each pointer. It uses
// the same parameter names and the same sequence of stores as the variables
// in local_memory_alignment_global, but the memory is supplied by the caller
// instead of being declared inside the kernel.
//
// NOTE(review): no FileCheck directives naming this kernel are visible in
// this part of the file -- confirm whether its stores are meant to be
// checked.
238 kernel void local_memory_alignment_arg(
anatofuz
parents:
diff changeset
239 volatile local char* lds_i8,
anatofuz
parents:
diff changeset
240 volatile local char2* lds_v2i8,
anatofuz
parents:
diff changeset
241 volatile local char3* lds_v3i8,
anatofuz
parents:
diff changeset
242 volatile local char4* lds_v4i8,
anatofuz
parents:
diff changeset
243 volatile local char8* lds_v8i8,
anatofuz
parents:
diff changeset
244 volatile local char16* lds_v16i8,
anatofuz
parents:
diff changeset
245
anatofuz
parents:
diff changeset
246 volatile local short* lds_i16,
anatofuz
parents:
diff changeset
247 volatile local short2* lds_v2i16,
anatofuz
parents:
diff changeset
248 volatile local short3* lds_v3i16,
anatofuz
parents:
diff changeset
249 volatile local short4* lds_v4i16,
anatofuz
parents:
diff changeset
250 volatile local short8* lds_v8i16,
anatofuz
parents:
diff changeset
251 volatile local short16* lds_v16i16,
anatofuz
parents:
diff changeset
252
anatofuz
parents:
diff changeset
253 volatile local int* lds_i32,
anatofuz
parents:
diff changeset
254 volatile local int2* lds_v2i32,
anatofuz
parents:
diff changeset
255 volatile local int3* lds_v3i32,
anatofuz
parents:
diff changeset
256 volatile local int4* lds_v4i32,
anatofuz
parents:
diff changeset
257 volatile local int8* lds_v8i32,
anatofuz
parents:
diff changeset
258 volatile local int16* lds_v16i32,
anatofuz
parents:
diff changeset
259
anatofuz
parents:
diff changeset
260 volatile local long* lds_i64,
anatofuz
parents:
diff changeset
261 volatile local long2* lds_v2i64,
anatofuz
parents:
diff changeset
262 volatile local long3* lds_v3i64,
anatofuz
parents:
diff changeset
263 volatile local long4* lds_v4i64,
anatofuz
parents:
diff changeset
264 volatile local long8* lds_v8i64,
anatofuz
parents:
diff changeset
265 volatile local long16* lds_v16i64,
anatofuz
parents:
diff changeset
266
anatofuz
parents:
diff changeset
267 volatile local half* lds_f16,
anatofuz
parents:
diff changeset
268 volatile local half2* lds_v2f16,
anatofuz
parents:
diff changeset
269 volatile local half3* lds_v3f16,
anatofuz
parents:
diff changeset
270 volatile local half4* lds_v4f16,
anatofuz
parents:
diff changeset
271 volatile local half8* lds_v8f16,
anatofuz
parents:
diff changeset
272 volatile local half16* lds_v16f16,
anatofuz
parents:
diff changeset
273
anatofuz
parents:
diff changeset
274 volatile local float* lds_f32,
anatofuz
parents:
diff changeset
275 volatile local float2* lds_v2f32,
anatofuz
parents:
diff changeset
276 volatile local float3* lds_v3f32,
anatofuz
parents:
diff changeset
277 volatile local float4* lds_v4f32,
anatofuz
parents:
diff changeset
278 volatile local float8* lds_v8f32,
anatofuz
parents:
diff changeset
279 volatile local float16* lds_v16f32,
anatofuz
parents:
diff changeset
280
anatofuz
parents:
diff changeset
281 volatile local double* lds_f64,
anatofuz
parents:
diff changeset
282 volatile local double2* lds_v2f64,
anatofuz
parents:
diff changeset
283 volatile local double3* lds_v3f64,
anatofuz
parents:
diff changeset
284 volatile local double4* lds_v4f64,
anatofuz
parents:
diff changeset
285 volatile local double8* lds_v8f64,
anatofuz
parents:
diff changeset
286 volatile local double16* lds_v16f64)
anatofuz
parents:
diff changeset
287 {
anatofuz
parents:
diff changeset
// Store 0 through every pointer parameter, in parameter order.
288 *lds_i8 = 0;
anatofuz
parents:
diff changeset
289 *lds_v2i8 = 0;
anatofuz
parents:
diff changeset
290 *lds_v3i8 = 0;
anatofuz
parents:
diff changeset
291 *lds_v4i8 = 0;
anatofuz
parents:
diff changeset
292 *lds_v8i8 = 0;
anatofuz
parents:
diff changeset
293 *lds_v16i8 = 0;
anatofuz
parents:
diff changeset
294
anatofuz
parents:
diff changeset
295 *lds_i16 = 0;
anatofuz
parents:
diff changeset
296 *lds_v2i16 = 0;
anatofuz
parents:
diff changeset
297 *lds_v3i16 = 0;
anatofuz
parents:
diff changeset
298 *lds_v4i16 = 0;
anatofuz
parents:
diff changeset
299 *lds_v8i16 = 0;
anatofuz
parents:
diff changeset
300 *lds_v16i16 = 0;
anatofuz
parents:
diff changeset
301
anatofuz
parents:
diff changeset
302 *lds_i32 = 0;
anatofuz
parents:
diff changeset
303 *lds_v2i32 = 0;
anatofuz
parents:
diff changeset
304 *lds_v3i32 = 0;
anatofuz
parents:
diff changeset
305 *lds_v4i32 = 0;
anatofuz
parents:
diff changeset
306 *lds_v8i32 = 0;
anatofuz
parents:
diff changeset
307 *lds_v16i32 = 0;
anatofuz
parents:
diff changeset
308
anatofuz
parents:
diff changeset
309 *lds_i64 = 0;
anatofuz
parents:
diff changeset
310 *lds_v2i64 = 0;
anatofuz
parents:
diff changeset
311 *lds_v3i64 = 0;
anatofuz
parents:
diff changeset
312 *lds_v4i64 = 0;
anatofuz
parents:
diff changeset
313 *lds_v8i64 = 0;
anatofuz
parents:
diff changeset
314 *lds_v16i64 = 0;
anatofuz
parents:
diff changeset
315
anatofuz
parents:
diff changeset
316 *lds_f16 = 0;
anatofuz
parents:
diff changeset
317 *lds_v2f16 = 0;
anatofuz
parents:
diff changeset
318 *lds_v3f16 = 0;
anatofuz
parents:
diff changeset
319 *lds_v4f16 = 0;
anatofuz
parents:
diff changeset
320 *lds_v8f16 = 0;
anatofuz
parents:
diff changeset
321 *lds_v16f16 = 0;
anatofuz
parents:
diff changeset
322
anatofuz
parents:
diff changeset
323 *lds_f32 = 0;
anatofuz
parents:
diff changeset
324 *lds_v2f32 = 0;
anatofuz
parents:
diff changeset
325 *lds_v3f32 = 0;
anatofuz
parents:
diff changeset
326 *lds_v4f32 = 0;
anatofuz
parents:
diff changeset
327 *lds_v8f32 = 0;
anatofuz
parents:
diff changeset
328 *lds_v16f32 = 0;
anatofuz
parents:
diff changeset
329
anatofuz
parents:
diff changeset
330 *lds_f64 = 0;
anatofuz
parents:
diff changeset
331 *lds_v2f64 = 0;
anatofuz
parents:
diff changeset
332 *lds_v3f64 = 0;
anatofuz
parents:
diff changeset
333 *lds_v4f64 = 0;
anatofuz
parents:
diff changeset
334 *lds_v8f64 = 0;
anatofuz
parents:
diff changeset
335 *lds_v16f64 = 0;
anatofuz
parents:
diff changeset
336 }
anatofuz
parents:
diff changeset
337
anatofuz
parents:
diff changeset
338 // CHECK-LABEL: @private_memory_alignment_alloca(
anatofuz
parents:
diff changeset
339 // CHECK: %private_i8 = alloca [4 x i8], align 1, addrspace(5)
anatofuz
parents:
diff changeset
340 // CHECK: %private_v2i8 = alloca [4 x <2 x i8>], align 2, addrspace(5)
anatofuz
parents:
diff changeset
341 // CHECK: %private_v3i8 = alloca [4 x <3 x i8>], align 4, addrspace(5)
anatofuz
parents:
diff changeset
342 // CHECK: %private_v4i8 = alloca [4 x <4 x i8>], align 4, addrspace(5)
anatofuz
parents:
diff changeset
343 // CHECK: %private_v8i8 = alloca [4 x <8 x i8>], align 8, addrspace(5)
anatofuz
parents:
diff changeset
344 // CHECK: %private_v16i8 = alloca [4 x <16 x i8>], align 16, addrspace(5)
anatofuz
parents:
diff changeset
345 // CHECK: %private_i16 = alloca [4 x i16], align 2, addrspace(5)
anatofuz
parents:
diff changeset
346 // CHECK: %private_v2i16 = alloca [4 x <2 x i16>], align 4, addrspace(5)
anatofuz
parents:
diff changeset
347 // CHECK: %private_v3i16 = alloca [4 x <3 x i16>], align 8, addrspace(5)
anatofuz
parents:
diff changeset
348 // CHECK: %private_v4i16 = alloca [4 x <4 x i16>], align 8, addrspace(5)
anatofuz
parents:
diff changeset
349 // CHECK: %private_v8i16 = alloca [4 x <8 x i16>], align 16, addrspace(5)
anatofuz
parents:
diff changeset
350 // CHECK: %private_v16i16 = alloca [4 x <16 x i16>], align 32, addrspace(5)
anatofuz
parents:
diff changeset
351 // CHECK: %private_i32 = alloca [4 x i32], align 4, addrspace(5)
anatofuz
parents:
diff changeset
352 // CHECK: %private_v2i32 = alloca [4 x <2 x i32>], align 8, addrspace(5)
anatofuz
parents:
diff changeset
353 // CHECK: %private_v3i32 = alloca [4 x <3 x i32>], align 16, addrspace(5)
anatofuz
parents:
diff changeset
354 // CHECK: %private_v4i32 = alloca [4 x <4 x i32>], align 16, addrspace(5)
anatofuz
parents:
diff changeset
355 // CHECK: %private_v8i32 = alloca [4 x <8 x i32>], align 32, addrspace(5)
anatofuz
parents:
diff changeset
356 // CHECK: %private_v16i32 = alloca [4 x <16 x i32>], align 64, addrspace(5)
anatofuz
parents:
diff changeset
357 // CHECK: %private_i64 = alloca [4 x i64], align 8, addrspace(5)
anatofuz
parents:
diff changeset
358 // CHECK: %private_v2i64 = alloca [4 x <2 x i64>], align 16, addrspace(5)
anatofuz
parents:
diff changeset
359 // CHECK: %private_v3i64 = alloca [4 x <3 x i64>], align 32, addrspace(5)
anatofuz
parents:
diff changeset
360 // CHECK: %private_v4i64 = alloca [4 x <4 x i64>], align 32, addrspace(5)
anatofuz
parents:
diff changeset
361 // CHECK: %private_v8i64 = alloca [4 x <8 x i64>], align 64, addrspace(5)
anatofuz
parents:
diff changeset
362 // CHECK: %private_v16i64 = alloca [4 x <16 x i64>], align 128, addrspace(5)
anatofuz
parents:
diff changeset
363 // CHECK: %private_f16 = alloca [4 x half], align 2, addrspace(5)
anatofuz
parents:
diff changeset
364 // CHECK: %private_v2f16 = alloca [4 x <2 x half>], align 4, addrspace(5)
anatofuz
parents:
diff changeset
365 // CHECK: %private_v3f16 = alloca [4 x <3 x half>], align 8, addrspace(5)
anatofuz
parents:
diff changeset
366 // CHECK: %private_v4f16 = alloca [4 x <4 x half>], align 8, addrspace(5)
anatofuz
parents:
diff changeset
367 // CHECK: %private_v8f16 = alloca [4 x <8 x half>], align 16, addrspace(5)
anatofuz
parents:
diff changeset
368 // CHECK: %private_v16f16 = alloca [4 x <16 x half>], align 32, addrspace(5)
anatofuz
parents:
diff changeset
369 // CHECK: %private_f32 = alloca [4 x float], align 4, addrspace(5)
anatofuz
parents:
diff changeset
370 // CHECK: %private_v2f32 = alloca [4 x <2 x float>], align 8, addrspace(5)
anatofuz
parents:
diff changeset
371 // CHECK: %private_v3f32 = alloca [4 x <3 x float>], align 16, addrspace(5)
anatofuz
parents:
diff changeset
372 // CHECK: %private_v4f32 = alloca [4 x <4 x float>], align 16, addrspace(5)
anatofuz
parents:
diff changeset
373 // CHECK: %private_v8f32 = alloca [4 x <8 x float>], align 32, addrspace(5)
anatofuz
parents:
diff changeset
374 // CHECK: %private_v16f32 = alloca [4 x <16 x float>], align 64, addrspace(5)
anatofuz
parents:
diff changeset
375 // CHECK: %private_f64 = alloca [4 x double], align 8, addrspace(5)
anatofuz
parents:
diff changeset
376 // CHECK: %private_v2f64 = alloca [4 x <2 x double>], align 16, addrspace(5)
anatofuz
parents:
diff changeset
377 // CHECK: %private_v3f64 = alloca [4 x <3 x double>], align 32, addrspace(5)
anatofuz
parents:
diff changeset
378 // CHECK: %private_v4f64 = alloca [4 x <4 x double>], align 32, addrspace(5)
anatofuz
parents:
diff changeset
379 // CHECK: %private_v8f64 = alloca [4 x <8 x double>], align 64, addrspace(5)
anatofuz
parents:
diff changeset
380 // CHECK: %private_v16f64 = alloca [4 x <16 x double>], align 128, addrspace(5)
anatofuz
parents:
diff changeset
381
anatofuz
parents:
diff changeset
382 // CHECK: store volatile i8 0, i8 addrspace(5)* %arraydecay, align 1
anatofuz
parents:
diff changeset
383 // CHECK: store volatile <2 x i8> zeroinitializer, <2 x i8> addrspace(5)* %arraydecay{{[0-9]+}}, align 2
anatofuz
parents:
diff changeset
384 // CHECK: store volatile <4 x i8> <i8 0, i8 0, i8 0, i8 undef>, <4 x i8> addrspace(5)* %storetmp, align 4
anatofuz
parents:
diff changeset
385 // CHECK: store volatile <4 x i8> zeroinitializer, <4 x i8> addrspace(5)* %arraydecay{{[0-9]+}}, align 4
anatofuz
parents:
diff changeset
386 // CHECK: store volatile <8 x i8> zeroinitializer, <8 x i8> addrspace(5)* %arraydecay{{[0-9]+}}, align 8
anatofuz
parents:
diff changeset
387 // CHECK: store volatile <16 x i8> zeroinitializer, <16 x i8> addrspace(5)* %arraydecay{{[0-9]+}}, align 16
anatofuz
parents:
diff changeset
388 // CHECK: store volatile i16 0, i16 addrspace(5)* %arraydecay{{[0-9]+}}, align 2
anatofuz
parents:
diff changeset
389 // CHECK: store volatile <2 x i16> zeroinitializer, <2 x i16> addrspace(5)* %arraydecay{{[0-9]+}}, align 4
anatofuz
parents:
diff changeset
390 // CHECK: store volatile <4 x i16> <i16 0, i16 0, i16 0, i16 undef>, <4 x i16> addrspace(5)* %storetmp{{[0-9]+}}, align 8
anatofuz
parents:
diff changeset
391 // CHECK: store volatile <4 x i16> zeroinitializer, <4 x i16> addrspace(5)* %arraydecay{{[0-9]+}}, align 8
anatofuz
parents:
diff changeset
392 // CHECK: store volatile <8 x i16> zeroinitializer, <8 x i16> addrspace(5)* %arraydecay{{[0-9]+}}, align 16
anatofuz
parents:
diff changeset
393 // CHECK: store volatile <16 x i16> zeroinitializer, <16 x i16> addrspace(5)* %arraydecay{{[0-9]+}}, align 32
anatofuz
parents:
diff changeset
394 // CHECK: store volatile i32 0, i32 addrspace(5)* %arraydecay{{[0-9]+}}, align 4
anatofuz
parents:
diff changeset
395 // CHECK: store volatile <2 x i32> zeroinitializer, <2 x i32> addrspace(5)* %arraydecay{{[0-9]+}}, align 8
anatofuz
parents:
diff changeset
396 // CHECK: store volatile <4 x i32> <i32 0, i32 0, i32 0, i32 undef>, <4 x i32> addrspace(5)* %storetmp16, align 16
anatofuz
parents:
diff changeset
397 // CHECK: store volatile <4 x i32> zeroinitializer, <4 x i32> addrspace(5)* %arraydecay{{[0-9]+}}, align 16
anatofuz
parents:
diff changeset
398 // CHECK: store volatile <8 x i32> zeroinitializer, <8 x i32> addrspace(5)* %arraydecay{{[0-9]+}}, align 32
anatofuz
parents:
diff changeset
399 // CHECK: store volatile <16 x i32> zeroinitializer, <16 x i32> addrspace(5)* %arraydecay{{[0-9]+}}, align 64
anatofuz
parents:
diff changeset
400 // CHECK: store volatile i64 0, i64 addrspace(5)* %arraydecay{{[0-9]+}}, align 8
anatofuz
parents:
diff changeset
401 // CHECK: store volatile <2 x i64> zeroinitializer, <2 x i64> addrspace(5)* %arraydecay{{[0-9]+}}, align 16
anatofuz
parents:
diff changeset
402 // CHECK: store volatile <4 x i64> <i64 0, i64 0, i64 0, i64 undef>, <4 x i64> addrspace(5)* %storetmp23, align 32
anatofuz
parents:
diff changeset
403 // CHECK: store volatile <4 x i64> zeroinitializer, <4 x i64> addrspace(5)* %arraydecay{{[0-9]+}}, align 32
anatofuz
parents:
diff changeset
404 // CHECK: store volatile <8 x i64> zeroinitializer, <8 x i64> addrspace(5)* %arraydecay{{[0-9]+}}, align 64
anatofuz
parents:
diff changeset
405 // CHECK: store volatile <16 x i64> zeroinitializer, <16 x i64> addrspace(5)* %arraydecay{{[0-9]+}}, align 128
anatofuz
parents:
diff changeset
406 // CHECK: store volatile half 0xH0000, half addrspace(5)* %arraydecay{{[0-9]+}}, align 2
anatofuz
parents:
diff changeset
407 // CHECK: store volatile <2 x half> zeroinitializer, <2 x half> addrspace(5)* %arraydecay{{[0-9]+}}, align 4
anatofuz
parents:
diff changeset
408 // CHECK: store volatile <4 x half> <half 0xH0000, half 0xH0000, half 0xH0000, half undef>, <4 x half> addrspace(5)* %storetmp{{[0-9]+}}, align 8
anatofuz
parents:
diff changeset
409 // CHECK: store volatile <4 x half> zeroinitializer, <4 x half> addrspace(5)* %arraydecay{{[0-9]+}}, align 8
anatofuz
parents:
diff changeset
410 // CHECK: store volatile <8 x half> zeroinitializer, <8 x half> addrspace(5)* %arraydecay{{[0-9]+}}, align 16
anatofuz
parents:
diff changeset
411 // CHECK: store volatile <16 x half> zeroinitializer, <16 x half> addrspace(5)* %arraydecay{{[0-9]+}}, align 32
anatofuz
parents:
diff changeset
412 // CHECK: store volatile float 0.000000e+00, float addrspace(5)* %arraydecay34, align 4
anatofuz
parents:
diff changeset
413 // CHECK: store volatile <2 x float> zeroinitializer, <2 x float> addrspace(5)* %arraydecay{{[0-9]+}}, align 8
anatofuz
parents:
diff changeset
414 // CHECK: store volatile <4 x float> <float 0.000000e+00, float 0.000000e+00, float 0.000000e+00, float undef>, <4 x float> addrspace(5)* %storetmp{{[0-9]+}}, align 16
anatofuz
parents:
diff changeset
415 // CHECK: store volatile <4 x float> zeroinitializer, <4 x float> addrspace(5)* %arraydecay{{[0-9]+}}, align 16
anatofuz
parents:
diff changeset
416 // CHECK: store volatile <8 x float> zeroinitializer, <8 x float> addrspace(5)* %arraydecay{{[0-9]+}}, align 32
anatofuz
parents:
diff changeset
417 // CHECK: store volatile <16 x float> zeroinitializer, <16 x float> addrspace(5)* %arraydecay{{[0-9]+}}, align 64
anatofuz
parents:
diff changeset
418 // CHECK: store volatile double 0.000000e+00, double addrspace(5)* %arraydecay{{[0-9]+}}, align 8
anatofuz
parents:
diff changeset
419 // CHECK: store volatile <2 x double> zeroinitializer, <2 x double> addrspace(5)* %arraydecay{{[0-9]+}}, align 16
anatofuz
parents:
diff changeset
420 // CHECK: store volatile <4 x double> <double 0.000000e+00, double 0.000000e+00, double 0.000000e+00, double undef>, <4 x double> addrspace(5)* %storetmp{{[0-9]+}}, align 32
anatofuz
parents:
diff changeset
421 // CHECK: store volatile <4 x double> zeroinitializer, <4 x double> addrspace(5)* %arraydecay{{[0-9]+}}, align 32
anatofuz
parents:
diff changeset
422 // CHECK: store volatile <8 x double> zeroinitializer, <8 x double> addrspace(5)* %arraydecay{{[0-9]+}}, align 64
anatofuz
parents:
diff changeset
423 // CHECK: store volatile <16 x double> zeroinitializer, <16 x double> addrspace(5)* %arraydecay{{[0-9]+}}, align 128
anatofuz
parents:
diff changeset
// Kernel matched by the CHECK-LABEL/CHECK lines directly above.
// It declares one 4-element volatile private array for each element type
// (char, short, int, long, half, float, double) at widths 1, 2, 3, 4, 8 and 16,
// then assigns 0 through each array name, i.e. to element 0 of each array.
// The CHECK lines expect one alloca per array in addrspace(5) with the listed
// alignment, and one `store volatile` per assignment. For the 3-element
// vectors they expect the alignment of the matching 4-element vector and a
// <4 x T> store with an undef last lane through a %storetmp value.
424 kernel void private_memory_alignment_alloca()
anatofuz
parents:
diff changeset
425 {
anatofuz
parents:
diff changeset
// 8-bit integer element type: scalar plus 2/3/4/8/16-wide vectors.
426 volatile private char private_i8[4];
anatofuz
parents:
diff changeset
427 volatile private char2 private_v2i8[4];
anatofuz
parents:
diff changeset
428 volatile private char3 private_v3i8[4];
anatofuz
parents:
diff changeset
429 volatile private char4 private_v4i8[4];
anatofuz
parents:
diff changeset
430 volatile private char8 private_v8i8[4];
anatofuz
parents:
diff changeset
431 volatile private char16 private_v16i8[4];
anatofuz
parents:
diff changeset
432
anatofuz
parents:
diff changeset
// 16-bit integer element type.
433 volatile private short private_i16[4];
anatofuz
parents:
diff changeset
434 volatile private short2 private_v2i16[4];
anatofuz
parents:
diff changeset
435 volatile private short3 private_v3i16[4];
anatofuz
parents:
diff changeset
436 volatile private short4 private_v4i16[4];
anatofuz
parents:
diff changeset
437 volatile private short8 private_v8i16[4];
anatofuz
parents:
diff changeset
438 volatile private short16 private_v16i16[4];
anatofuz
parents:
diff changeset
439
anatofuz
parents:
diff changeset
// 32-bit integer element type.
440 volatile private int private_i32[4];
anatofuz
parents:
diff changeset
441 volatile private int2 private_v2i32[4];
anatofuz
parents:
diff changeset
442 volatile private int3 private_v3i32[4];
anatofuz
parents:
diff changeset
443 volatile private int4 private_v4i32[4];
anatofuz
parents:
diff changeset
444 volatile private int8 private_v8i32[4];
anatofuz
parents:
diff changeset
445 volatile private int16 private_v16i32[4];
anatofuz
parents:
diff changeset
446
anatofuz
parents:
diff changeset
// 64-bit integer element type.
447 volatile private long private_i64[4];
anatofuz
parents:
diff changeset
448 volatile private long2 private_v2i64[4];
anatofuz
parents:
diff changeset
449 volatile private long3 private_v3i64[4];
anatofuz
parents:
diff changeset
450 volatile private long4 private_v4i64[4];
anatofuz
parents:
diff changeset
451 volatile private long8 private_v8i64[4];
anatofuz
parents:
diff changeset
452 volatile private long16 private_v16i64[4];
anatofuz
parents:
diff changeset
453
anatofuz
parents:
diff changeset
// Half-precision floating-point element type.
454 volatile private half private_f16[4];
anatofuz
parents:
diff changeset
455 volatile private half2 private_v2f16[4];
anatofuz
parents:
diff changeset
456 volatile private half3 private_v3f16[4];
anatofuz
parents:
diff changeset
457 volatile private half4 private_v4f16[4];
anatofuz
parents:
diff changeset
458 volatile private half8 private_v8f16[4];
anatofuz
parents:
diff changeset
459 volatile private half16 private_v16f16[4];
anatofuz
parents:
diff changeset
460
anatofuz
parents:
diff changeset
// Single-precision floating-point element type.
461 volatile private float private_f32[4];
anatofuz
parents:
diff changeset
462 volatile private float2 private_v2f32[4];
anatofuz
parents:
diff changeset
463 volatile private float3 private_v3f32[4];
anatofuz
parents:
diff changeset
464 volatile private float4 private_v4f32[4];
anatofuz
parents:
diff changeset
465 volatile private float8 private_v8f32[4];
anatofuz
parents:
diff changeset
466 volatile private float16 private_v16f32[4];
anatofuz
parents:
diff changeset
467
anatofuz
parents:
diff changeset
// Double-precision floating-point element type.
468 volatile private double private_f64[4];
anatofuz
parents:
diff changeset
469 volatile private double2 private_v2f64[4];
anatofuz
parents:
diff changeset
470 volatile private double3 private_v3f64[4];
anatofuz
parents:
diff changeset
471 volatile private double4 private_v4f64[4];
anatofuz
parents:
diff changeset
472 volatile private double8 private_v8f64[4];
anatofuz
parents:
diff changeset
473 volatile private double16 private_v16f64[4];
anatofuz
parents:
diff changeset
474
anatofuz
parents:
diff changeset
// One store of 0 per array, in the same order as the declarations; each is
// matched by a `store volatile` CHECK line above.
// NOTE(review): some CHECK lines hard-code numbered value names
// (%storetmp16, %storetmp23, %arraydecay34), which presumably depend on the
// order of these statements -- confirm before reordering or inserting stores.
475 *private_i8 = 0;
anatofuz
parents:
diff changeset
476 *private_v2i8 = 0;
anatofuz
parents:
diff changeset
477 *private_v3i8 = 0;
anatofuz
parents:
diff changeset
478 *private_v4i8 = 0;
anatofuz
parents:
diff changeset
479 *private_v8i8 = 0;
anatofuz
parents:
diff changeset
480 *private_v16i8 = 0;
anatofuz
parents:
diff changeset
481
anatofuz
parents:
diff changeset
482 *private_i16 = 0;
anatofuz
parents:
diff changeset
483 *private_v2i16 = 0;
anatofuz
parents:
diff changeset
484 *private_v3i16 = 0;
anatofuz
parents:
diff changeset
485 *private_v4i16 = 0;
anatofuz
parents:
diff changeset
486 *private_v8i16 = 0;
anatofuz
parents:
diff changeset
487 *private_v16i16 = 0;
anatofuz
parents:
diff changeset
488
anatofuz
parents:
diff changeset
489 *private_i32 = 0;
anatofuz
parents:
diff changeset
490 *private_v2i32 = 0;
anatofuz
parents:
diff changeset
491 *private_v3i32 = 0;
anatofuz
parents:
diff changeset
492 *private_v4i32 = 0;
anatofuz
parents:
diff changeset
493 *private_v8i32 = 0;
anatofuz
parents:
diff changeset
494 *private_v16i32 = 0;
anatofuz
parents:
diff changeset
495
anatofuz
parents:
diff changeset
496 *private_i64 = 0;
anatofuz
parents:
diff changeset
497 *private_v2i64 = 0;
anatofuz
parents:
diff changeset
498 *private_v3i64 = 0;
anatofuz
parents:
diff changeset
499 *private_v4i64 = 0;
anatofuz
parents:
diff changeset
500 *private_v8i64 = 0;
anatofuz
parents:
diff changeset
501 *private_v16i64 = 0;
anatofuz
parents:
diff changeset
502
anatofuz
parents:
diff changeset
503 *private_f16 = 0;
anatofuz
parents:
diff changeset
504 *private_v2f16 = 0;
anatofuz
parents:
diff changeset
505 *private_v3f16 = 0;
anatofuz
parents:
diff changeset
506 *private_v4f16 = 0;
anatofuz
parents:
diff changeset
507 *private_v8f16 = 0;
anatofuz
parents:
diff changeset
508 *private_v16f16 = 0;
anatofuz
parents:
diff changeset
509
anatofuz
parents:
diff changeset
510 *private_f32 = 0;
anatofuz
parents:
diff changeset
511 *private_v2f32 = 0;
anatofuz
parents:
diff changeset
512 *private_v3f32 = 0;
anatofuz
parents:
diff changeset
513 *private_v4f32 = 0;
anatofuz
parents:
diff changeset
514 *private_v8f32 = 0;
anatofuz
parents:
diff changeset
515 *private_v16f32 = 0;
anatofuz
parents:
diff changeset
516
anatofuz
parents:
diff changeset
517 *private_f64 = 0;
anatofuz
parents:
diff changeset
518 *private_v2f64 = 0;
anatofuz
parents:
diff changeset
519 *private_v3f64 = 0;
anatofuz
parents:
diff changeset
520 *private_v4f64 = 0;
anatofuz
parents:
diff changeset
521 *private_v8f64 = 0;
anatofuz
parents:
diff changeset
522 *private_v16f64 = 0;
anatofuz
parents:
diff changeset
523 }