|
1 | 1 | // RUN: %clang_cc1 -finclude-default-header -x hlsl -triple \
|
2 | 2 | // RUN: dxil-pc-shadermodel6.3-library %s -fnative-half-type \
|
3 | 3 | // RUN: -emit-llvm -disable-llvm-passes -o - | FileCheck %s \
|
4 |
| -// RUN: --check-prefixes=CHECK,NATIVE_HALF |
| 4 | +// RUN: --check-prefixes=CHECK,DXCHECK,NATIVE_HALF |
5 | 5 | // RUN: %clang_cc1 -finclude-default-header -x hlsl -triple \
|
6 | 6 | // RUN: dxil-pc-shadermodel6.3-library %s -emit-llvm -disable-llvm-passes \
|
7 |
| -// RUN: -o - | FileCheck %s --check-prefixes=CHECK,NO_HALF |
| 7 | +// RUN: -o - | FileCheck %s --check-prefixes=CHECK,DXCHECK,NO_HALF |
8 | 8 |
|
9 |
| -#ifdef __HLSL_ENABLE_16_BIT |
10 |
| -// NATIVE_HALF: %dx.dot = mul i16 %0, %1 |
11 |
| -// NATIVE_HALF: ret i16 %dx.dot |
12 |
| -int16_t test_dot_short(int16_t p0, int16_t p1) { return dot(p0, p1); } |
13 |
| - |
14 |
| -// NATIVE_HALF: %dx.dot = call i16 @llvm.dx.sdot.v2i16(<2 x i16> %0, <2 x i16> %1) |
15 |
| -// NATIVE_HALF: ret i16 %dx.dot |
16 |
| -int16_t test_dot_short2(int16_t2 p0, int16_t2 p1) { return dot(p0, p1); } |
17 |
| - |
18 |
| -// NATIVE_HALF: %dx.dot = call i16 @llvm.dx.sdot.v3i16(<3 x i16> %0, <3 x i16> %1) |
19 |
| -// NATIVE_HALF: ret i16 %dx.dot |
20 |
| -int16_t test_dot_short3(int16_t3 p0, int16_t3 p1) { return dot(p0, p1); } |
21 |
| - |
22 |
| -// NATIVE_HALF: %dx.dot = call i16 @llvm.dx.sdot.v4i16(<4 x i16> %0, <4 x i16> %1) |
23 |
| -// NATIVE_HALF: ret i16 %dx.dot |
24 |
| -int16_t test_dot_short4(int16_t4 p0, int16_t4 p1) { return dot(p0, p1); } |
25 |
| - |
26 |
| -// NATIVE_HALF: %dx.dot = mul i16 %0, %1 |
27 |
| -// NATIVE_HALF: ret i16 %dx.dot |
28 |
| -uint16_t test_dot_ushort(uint16_t p0, uint16_t p1) { return dot(p0, p1); } |
29 |
| - |
30 |
| -// NATIVE_HALF: %dx.dot = call i16 @llvm.dx.udot.v2i16(<2 x i16> %0, <2 x i16> %1) |
31 |
| -// NATIVE_HALF: ret i16 %dx.dot |
32 |
| -uint16_t test_dot_ushort2(uint16_t2 p0, uint16_t2 p1) { return dot(p0, p1); } |
33 |
| - |
34 |
| -// NATIVE_HALF: %dx.dot = call i16 @llvm.dx.udot.v3i16(<3 x i16> %0, <3 x i16> %1) |
35 |
| -// NATIVE_HALF: ret i16 %dx.dot |
36 |
| -uint16_t test_dot_ushort3(uint16_t3 p0, uint16_t3 p1) { return dot(p0, p1); } |
| 9 | +// RUN: %clang_cc1 -finclude-default-header -x hlsl -triple \ |
| 10 | +// RUN: spirv-unknown-vulkan-compute %s -fnative-half-type \ |
| 11 | +// RUN: -emit-llvm -disable-llvm-passes -o - | FileCheck %s \ |
| 12 | +// RUN: --check-prefixes=CHECK,SPVCHECK,NATIVE_HALF |
| 13 | +// RUN: %clang_cc1 -finclude-default-header -x hlsl -triple \ |
| 14 | +// RUN: spirv-unknown-vulkan-compute %s -emit-llvm -disable-llvm-passes \ |
| 15 | +// RUN: -o - | FileCheck %s --check-prefixes=CHECK,SPVCHECK,NO_HALF |
37 | 16 |
|
38 |
| -// NATIVE_HALF: %dx.dot = call i16 @llvm.dx.udot.v4i16(<4 x i16> %0, <4 x i16> %1) |
39 |
| -// NATIVE_HALF: ret i16 %dx.dot |
40 |
| -uint16_t test_dot_ushort4(uint16_t4 p0, uint16_t4 p1) { return dot(p0, p1); } |
41 |
| -#endif |
42 | 17 |
|
43 |
| -// CHECK: %dx.dot = mul i32 %0, %1 |
44 |
| -// CHECK: ret i32 %dx.dot |
| 18 | +// CHECK: %hlsl.dot = mul i32 |
| 19 | +// CHECK: ret i32 %hlsl.dot |
45 | 20 | int test_dot_int(int p0, int p1) { return dot(p0, p1); }
|
46 | 21 |
|
47 |
| -// CHECK: %dx.dot = call i32 @llvm.dx.sdot.v2i32(<2 x i32> %0, <2 x i32> %1) |
48 |
| -// CHECK: ret i32 %dx.dot |
| 22 | +// Capture the expected interchange format prefix (dx or spv) in the variable ICF so the later checks can be shared by both targets instead of being duplicated |
| 23 | +// DXCHECK: %hlsl.dot = call i32 @llvm.[[ICF:dx]].sdot.v2i32(<2 x i32> |
| 24 | +// SPVCHECK: %hlsl.dot = call i32 @llvm.[[ICF:spv]].sdot.v2i32(<2 x i32> |
| 25 | +// CHECK: ret i32 %hlsl.dot |
49 | 26 | int test_dot_int2(int2 p0, int2 p1) { return dot(p0, p1); }
|
50 | 27 |
|
51 |
| -// CHECK: %dx.dot = call i32 @llvm.dx.sdot.v3i32(<3 x i32> %0, <3 x i32> %1) |
52 |
| -// CHECK: ret i32 %dx.dot |
| 28 | +// CHECK: %hlsl.dot = call i32 @llvm.[[ICF]].sdot.v3i32(<3 x i32> |
| 29 | +// CHECK: ret i32 %hlsl.dot |
53 | 30 | int test_dot_int3(int3 p0, int3 p1) { return dot(p0, p1); }
|
54 | 31 |
|
55 |
| -// CHECK: %dx.dot = call i32 @llvm.dx.sdot.v4i32(<4 x i32> %0, <4 x i32> %1) |
56 |
| -// CHECK: ret i32 %dx.dot |
| 32 | +// CHECK: %hlsl.dot = call i32 @llvm.[[ICF]].sdot.v4i32(<4 x i32> |
| 33 | +// CHECK: ret i32 %hlsl.dot |
57 | 34 | int test_dot_int4(int4 p0, int4 p1) { return dot(p0, p1); }
|
58 | 35 |
|
59 |
| -// CHECK: %dx.dot = mul i32 %0, %1 |
60 |
| -// CHECK: ret i32 %dx.dot |
| 36 | +// CHECK: %hlsl.dot = mul i32 |
| 37 | +// CHECK: ret i32 %hlsl.dot |
61 | 38 | uint test_dot_uint(uint p0, uint p1) { return dot(p0, p1); }
|
62 | 39 |
|
63 |
| -// CHECK: %dx.dot = call i32 @llvm.dx.udot.v2i32(<2 x i32> %0, <2 x i32> %1) |
64 |
| -// CHECK: ret i32 %dx.dot |
| 40 | +// CHECK: %hlsl.dot = call i32 @llvm.[[ICF]].udot.v2i32(<2 x i32> |
| 41 | +// CHECK: ret i32 %hlsl.dot |
65 | 42 | uint test_dot_uint2(uint2 p0, uint2 p1) { return dot(p0, p1); }
|
66 | 43 |
|
67 |
| -// CHECK: %dx.dot = call i32 @llvm.dx.udot.v3i32(<3 x i32> %0, <3 x i32> %1) |
68 |
| -// CHECK: ret i32 %dx.dot |
| 44 | +// CHECK: %hlsl.dot = call i32 @llvm.[[ICF]].udot.v3i32(<3 x i32> |
| 45 | +// CHECK: ret i32 %hlsl.dot |
69 | 46 | uint test_dot_uint3(uint3 p0, uint3 p1) { return dot(p0, p1); }
|
70 | 47 |
|
71 |
| -// CHECK: %dx.dot = call i32 @llvm.dx.udot.v4i32(<4 x i32> %0, <4 x i32> %1) |
72 |
| -// CHECK: ret i32 %dx.dot |
| 48 | +// CHECK: %hlsl.dot = call i32 @llvm.[[ICF]].udot.v4i32(<4 x i32> |
| 49 | +// CHECK: ret i32 %hlsl.dot |
73 | 50 | uint test_dot_uint4(uint4 p0, uint4 p1) { return dot(p0, p1); }
|
74 | 51 |
|
75 |
| -// CHECK: %dx.dot = mul i64 %0, %1 |
76 |
| -// CHECK: ret i64 %dx.dot |
| 52 | +// CHECK: %hlsl.dot = mul i64 |
| 53 | +// CHECK: ret i64 %hlsl.dot |
77 | 54 | int64_t test_dot_long(int64_t p0, int64_t p1) { return dot(p0, p1); }
|
78 | 55 |
|
79 |
| -// CHECK: %dx.dot = call i64 @llvm.dx.sdot.v2i64(<2 x i64> %0, <2 x i64> %1) |
80 |
| -// CHECK: ret i64 %dx.dot |
| 56 | +// CHECK: %hlsl.dot = call i64 @llvm.[[ICF]].sdot.v2i64(<2 x i64> |
| 57 | +// CHECK: ret i64 %hlsl.dot |
81 | 58 | int64_t test_dot_long2(int64_t2 p0, int64_t2 p1) { return dot(p0, p1); }
|
82 | 59 |
|
83 |
| -// CHECK: %dx.dot = call i64 @llvm.dx.sdot.v3i64(<3 x i64> %0, <3 x i64> %1) |
84 |
| -// CHECK: ret i64 %dx.dot |
| 60 | +// CHECK: %hlsl.dot = call i64 @llvm.[[ICF]].sdot.v3i64(<3 x i64> |
| 61 | +// CHECK: ret i64 %hlsl.dot |
85 | 62 | int64_t test_dot_long3(int64_t3 p0, int64_t3 p1) { return dot(p0, p1); }
|
86 | 63 |
|
87 |
| -// CHECK: %dx.dot = call i64 @llvm.dx.sdot.v4i64(<4 x i64> %0, <4 x i64> %1) |
88 |
| -// CHECK: ret i64 %dx.dot |
| 64 | +// CHECK: %hlsl.dot = call i64 @llvm.[[ICF]].sdot.v4i64(<4 x i64> |
| 65 | +// CHECK: ret i64 %hlsl.dot |
89 | 66 | int64_t test_dot_long4(int64_t4 p0, int64_t4 p1) { return dot(p0, p1); }
|
90 | 67 |
|
91 |
| -// CHECK: %dx.dot = mul i64 %0, %1 |
92 |
| -// CHECK: ret i64 %dx.dot |
| 68 | +// CHECK: %hlsl.dot = mul i64 |
| 69 | +// CHECK: ret i64 %hlsl.dot |
93 | 70 | uint64_t test_dot_ulong(uint64_t p0, uint64_t p1) { return dot(p0, p1); }
|
94 | 71 |
|
95 |
| -// CHECK: %dx.dot = call i64 @llvm.dx.udot.v2i64(<2 x i64> %0, <2 x i64> %1) |
96 |
| -// CHECK: ret i64 %dx.dot |
| 72 | +// CHECK: %hlsl.dot = call i64 @llvm.[[ICF]].udot.v2i64(<2 x i64> |
| 73 | +// CHECK: ret i64 %hlsl.dot |
97 | 74 | uint64_t test_dot_ulong2(uint64_t2 p0, uint64_t2 p1) { return dot(p0, p1); }
|
98 | 75 |
|
99 |
| -// CHECK: %dx.dot = call i64 @llvm.dx.udot.v3i64(<3 x i64> %0, <3 x i64> %1) |
100 |
| -// CHECK: ret i64 %dx.dot |
| 76 | +// CHECK: %hlsl.dot = call i64 @llvm.[[ICF]].udot.v3i64(<3 x i64> |
| 77 | +// CHECK: ret i64 %hlsl.dot |
101 | 78 | uint64_t test_dot_ulong3(uint64_t3 p0, uint64_t3 p1) { return dot(p0, p1); }
|
102 | 79 |
|
103 |
| -// CHECK: %dx.dot = call i64 @llvm.dx.udot.v4i64(<4 x i64> %0, <4 x i64> %1) |
104 |
| -// CHECK: ret i64 %dx.dot |
| 80 | +// CHECK: %hlsl.dot = call i64 @llvm.[[ICF]].udot.v4i64(<4 x i64> |
| 81 | +// CHECK: ret i64 %hlsl.dot |
105 | 82 | uint64_t test_dot_ulong4(uint64_t4 p0, uint64_t4 p1) { return dot(p0, p1); }
|
106 | 83 |
|
107 |
| -// NATIVE_HALF: %dx.dot = fmul half %0, %1 |
108 |
| -// NATIVE_HALF: ret half %dx.dot |
109 |
| -// NO_HALF: %dx.dot = fmul float %0, %1 |
110 |
| -// NO_HALF: ret float %dx.dot |
| 84 | +#ifdef __HLSL_ENABLE_16_BIT |
| 85 | +// NATIVE_HALF: %hlsl.dot = mul i16 |
| 86 | +// NATIVE_HALF: ret i16 %hlsl.dot |
| 87 | +int16_t test_dot_short(int16_t p0, int16_t p1) { return dot(p0, p1); } |
| 88 | + |
| 89 | +// NATIVE_HALF: %hlsl.dot = call i16 @llvm.[[ICF]].sdot.v2i16(<2 x i16> |
| 90 | +// NATIVE_HALF: ret i16 %hlsl.dot |
| 91 | +int16_t test_dot_short2(int16_t2 p0, int16_t2 p1) { return dot(p0, p1); } |
| 92 | + |
| 93 | +// NATIVE_HALF: %hlsl.dot = call i16 @llvm.[[ICF]].sdot.v3i16(<3 x i16> |
| 94 | +// NATIVE_HALF: ret i16 %hlsl.dot |
| 95 | +int16_t test_dot_short3(int16_t3 p0, int16_t3 p1) { return dot(p0, p1); } |
| 96 | + |
| 97 | +// NATIVE_HALF: %hlsl.dot = call i16 @llvm.[[ICF]].sdot.v4i16(<4 x i16> |
| 98 | +// NATIVE_HALF: ret i16 %hlsl.dot |
| 99 | +int16_t test_dot_short4(int16_t4 p0, int16_t4 p1) { return dot(p0, p1); } |
| 100 | + |
| 101 | +// NATIVE_HALF: %hlsl.dot = mul i16 |
| 102 | +// NATIVE_HALF: ret i16 %hlsl.dot |
| 103 | +uint16_t test_dot_ushort(uint16_t p0, uint16_t p1) { return dot(p0, p1); } |
| 104 | + |
| 105 | +// NATIVE_HALF: %hlsl.dot = call i16 @llvm.[[ICF]].udot.v2i16(<2 x i16> |
| 106 | +// NATIVE_HALF: ret i16 %hlsl.dot |
| 107 | +uint16_t test_dot_ushort2(uint16_t2 p0, uint16_t2 p1) { return dot(p0, p1); } |
| 108 | + |
| 109 | +// NATIVE_HALF: %hlsl.dot = call i16 @llvm.[[ICF]].udot.v3i16(<3 x i16> |
| 110 | +// NATIVE_HALF: ret i16 %hlsl.dot |
| 111 | +uint16_t test_dot_ushort3(uint16_t3 p0, uint16_t3 p1) { return dot(p0, p1); } |
| 112 | + |
| 113 | +// NATIVE_HALF: %hlsl.dot = call i16 @llvm.[[ICF]].udot.v4i16(<4 x i16> |
| 114 | +// NATIVE_HALF: ret i16 %hlsl.dot |
| 115 | +uint16_t test_dot_ushort4(uint16_t4 p0, uint16_t4 p1) { return dot(p0, p1); } |
| 116 | +#endif |
| 117 | + |
| 118 | +// NATIVE_HALF: %hlsl.dot = fmul half |
| 119 | +// NATIVE_HALF: ret half %hlsl.dot |
| 120 | +// NO_HALF: %hlsl.dot = fmul float |
| 121 | +// NO_HALF: ret float %hlsl.dot |
111 | 122 | half test_dot_half(half p0, half p1) { return dot(p0, p1); }
|
112 | 123 |
|
113 |
| -// NATIVE_HALF: %dx.dot = call half @llvm.dx.dot2.v2f16(<2 x half> %0, <2 x half> %1) |
114 |
| -// NATIVE_HALF: ret half %dx.dot |
115 |
| -// NO_HALF: %dx.dot = call float @llvm.dx.dot2.v2f32(<2 x float> %0, <2 x float> %1) |
116 |
| -// NO_HALF: ret float %dx.dot |
| 124 | +// NATIVE_HALF: %hlsl.dot = call half @llvm.[[ICF]].fdot.v2f16(<2 x half> |
| 125 | +// NATIVE_HALF: ret half %hlsl.dot |
| 126 | +// NO_HALF: %hlsl.dot = call float @llvm.[[ICF]].fdot.v2f32(<2 x float> |
| 127 | +// NO_HALF: ret float %hlsl.dot |
117 | 128 | half test_dot_half2(half2 p0, half2 p1) { return dot(p0, p1); }
|
118 | 129 |
|
119 |
| -// NATIVE_HALF: %dx.dot = call half @llvm.dx.dot3.v3f16(<3 x half> %0, <3 x half> %1) |
120 |
| -// NATIVE_HALF: ret half %dx.dot |
121 |
| -// NO_HALF: %dx.dot = call float @llvm.dx.dot3.v3f32(<3 x float> %0, <3 x float> %1) |
122 |
| -// NO_HALF: ret float %dx.dot |
| 130 | +// NATIVE_HALF: %hlsl.dot = call half @llvm.[[ICF]].fdot.v3f16(<3 x half> |
| 131 | +// NATIVE_HALF: ret half %hlsl.dot |
| 132 | +// NO_HALF: %hlsl.dot = call float @llvm.[[ICF]].fdot.v3f32(<3 x float> |
| 133 | +// NO_HALF: ret float %hlsl.dot |
123 | 134 | half test_dot_half3(half3 p0, half3 p1) { return dot(p0, p1); }
|
124 | 135 |
|
125 |
| -// NATIVE_HALF: %dx.dot = call half @llvm.dx.dot4.v4f16(<4 x half> %0, <4 x half> %1) |
126 |
| -// NATIVE_HALF: ret half %dx.dot |
127 |
| -// NO_HALF: %dx.dot = call float @llvm.dx.dot4.v4f32(<4 x float> %0, <4 x float> %1) |
128 |
| -// NO_HALF: ret float %dx.dot |
| 136 | +// NATIVE_HALF: %hlsl.dot = call half @llvm.[[ICF]].fdot.v4f16(<4 x half> |
| 137 | +// NATIVE_HALF: ret half %hlsl.dot |
| 138 | +// NO_HALF: %hlsl.dot = call float @llvm.[[ICF]].fdot.v4f32(<4 x float> |
| 139 | +// NO_HALF: ret float %hlsl.dot |
129 | 140 | half test_dot_half4(half4 p0, half4 p1) { return dot(p0, p1); }
|
130 | 141 |
|
131 |
| -// CHECK: %dx.dot = fmul float %0, %1 |
132 |
| -// CHECK: ret float %dx.dot |
| 142 | +// CHECK: %hlsl.dot = fmul float |
| 143 | +// CHECK: ret float %hlsl.dot |
133 | 144 | float test_dot_float(float p0, float p1) { return dot(p0, p1); }
|
134 | 145 |
|
135 |
| -// CHECK: %dx.dot = call float @llvm.dx.dot2.v2f32(<2 x float> %0, <2 x float> %1) |
136 |
| -// CHECK: ret float %dx.dot |
| 146 | +// CHECK: %hlsl.dot = call float @llvm.[[ICF]].fdot.v2f32(<2 x float> |
| 147 | +// CHECK: ret float %hlsl.dot |
137 | 148 | float test_dot_float2(float2 p0, float2 p1) { return dot(p0, p1); }
|
138 | 149 |
|
139 |
| -// CHECK: %dx.dot = call float @llvm.dx.dot3.v3f32(<3 x float> %0, <3 x float> %1) |
140 |
| -// CHECK: ret float %dx.dot |
| 150 | +// CHECK: %hlsl.dot = call float @llvm.[[ICF]].fdot.v3f32(<3 x float> |
| 151 | +// CHECK: ret float %hlsl.dot |
141 | 152 | float test_dot_float3(float3 p0, float3 p1) { return dot(p0, p1); }
|
142 | 153 |
|
143 |
| -// CHECK: %dx.dot = call float @llvm.dx.dot4.v4f32(<4 x float> %0, <4 x float> %1) |
144 |
| -// CHECK: ret float %dx.dot |
| 154 | +// CHECK: %hlsl.dot = call float @llvm.[[ICF]].fdot.v4f32(<4 x float> |
| 155 | +// CHECK: ret float %hlsl.dot |
145 | 156 | float test_dot_float4(float4 p0, float4 p1) { return dot(p0, p1); }
|
146 | 157 |
|
147 |
| -// CHECK: %dx.dot = call float @llvm.dx.dot2.v2f32(<2 x float> %splat.splat, <2 x float> %1) |
148 |
| -// CHECK: ret float %dx.dot |
| 158 | +// CHECK: %hlsl.dot = call float @llvm.[[ICF]].fdot.v2f32(<2 x float> %splat.splat, <2 x float> |
| 159 | +// CHECK: ret float %hlsl.dot |
149 | 160 | float test_dot_float2_splat(float p0, float2 p1) { return dot(p0, p1); }
|
150 | 161 |
|
151 |
| -// CHECK: %dx.dot = call float @llvm.dx.dot3.v3f32(<3 x float> %splat.splat, <3 x float> %1) |
152 |
| -// CHECK: ret float %dx.dot |
| 162 | +// CHECK: %hlsl.dot = call float @llvm.[[ICF]].fdot.v3f32(<3 x float> %splat.splat, <3 x float> |
| 163 | +// CHECK: ret float %hlsl.dot |
153 | 164 | float test_dot_float3_splat(float p0, float3 p1) { return dot(p0, p1); }
|
154 | 165 |
|
155 |
| -// CHECK: %dx.dot = call float @llvm.dx.dot4.v4f32(<4 x float> %splat.splat, <4 x float> %1) |
156 |
| -// CHECK: ret float %dx.dot |
| 166 | +// CHECK: %hlsl.dot = call float @llvm.[[ICF]].fdot.v4f32(<4 x float> %splat.splat, <4 x float> |
| 167 | +// CHECK: ret float %hlsl.dot |
157 | 168 | float test_dot_float4_splat(float p0, float4 p1) { return dot(p0, p1); }
|
158 | 169 |
|
159 |
| -// CHECK: %dx.dot = fmul double %0, %1 |
160 |
| -// CHECK: ret double %dx.dot |
| 170 | +// CHECK: %hlsl.dot = fmul double |
| 171 | +// CHECK: ret double %hlsl.dot |
161 | 172 | double test_dot_double(double p0, double p1) { return dot(p0, p1); }
|
0 commit comments