|
7 | 7 | // RUN: -o - | FileCheck %s --check-prefixes=CHECK,NO_HALF |
8 | 8 |
|
9 | 9 | #ifdef __HLSL_ENABLE_16_BIT |
10 | | -// NATIVE_HALF: %dx.dot = mul i16 %0, %1 |
11 | | -// NATIVE_HALF: ret i16 %dx.dot |
| 10 | +// NATIVE_HALF: %dot = mul i16 %0, %1 |
| 11 | +// NATIVE_HALF: ret i16 %dot |
12 | 12 | int16_t test_dot_short(int16_t p0, int16_t p1) { return dot(p0, p1); } |
13 | 13 |
|
14 | | -// NATIVE_HALF: %dx.dot = call i16 @llvm.dx.sdot.v2i16(<2 x i16> %0, <2 x i16> %1) |
15 | | -// NATIVE_HALF: ret i16 %dx.dot |
| 14 | +// NATIVE_HALF: %dot = call i16 @llvm.sdot.v2i16(<2 x i16> %0, <2 x i16> %1) |
| 15 | +// NATIVE_HALF: ret i16 %dot |
16 | 16 | int16_t test_dot_short2(int16_t2 p0, int16_t2 p1) { return dot(p0, p1); } |
17 | 17 |
|
18 | | -// NATIVE_HALF: %dx.dot = call i16 @llvm.dx.sdot.v3i16(<3 x i16> %0, <3 x i16> %1) |
19 | | -// NATIVE_HALF: ret i16 %dx.dot |
| 18 | +// NATIVE_HALF: %dot = call i16 @llvm.sdot.v3i16(<3 x i16> %0, <3 x i16> %1) |
| 19 | +// NATIVE_HALF: ret i16 %dot |
20 | 20 | int16_t test_dot_short3(int16_t3 p0, int16_t3 p1) { return dot(p0, p1); } |
21 | 21 |
|
22 | | -// NATIVE_HALF: %dx.dot = call i16 @llvm.dx.sdot.v4i16(<4 x i16> %0, <4 x i16> %1) |
23 | | -// NATIVE_HALF: ret i16 %dx.dot |
| 22 | +// NATIVE_HALF: %dot = call i16 @llvm.sdot.v4i16(<4 x i16> %0, <4 x i16> %1) |
| 23 | +// NATIVE_HALF: ret i16 %dot |
24 | 24 | int16_t test_dot_short4(int16_t4 p0, int16_t4 p1) { return dot(p0, p1); } |
25 | 25 |
|
26 | | -// NATIVE_HALF: %dx.dot = mul i16 %0, %1 |
27 | | -// NATIVE_HALF: ret i16 %dx.dot |
| 26 | +// NATIVE_HALF: %dot = mul i16 %0, %1 |
| 27 | +// NATIVE_HALF: ret i16 %dot |
28 | 28 | uint16_t test_dot_ushort(uint16_t p0, uint16_t p1) { return dot(p0, p1); } |
29 | 29 |
|
30 | | -// NATIVE_HALF: %dx.dot = call i16 @llvm.dx.udot.v2i16(<2 x i16> %0, <2 x i16> %1) |
31 | | -// NATIVE_HALF: ret i16 %dx.dot |
| 30 | +// NATIVE_HALF: %dot = call i16 @llvm.udot.v2i16(<2 x i16> %0, <2 x i16> %1) |
| 31 | +// NATIVE_HALF: ret i16 %dot |
32 | 32 | uint16_t test_dot_ushort2(uint16_t2 p0, uint16_t2 p1) { return dot(p0, p1); } |
33 | 33 |
|
34 | | -// NATIVE_HALF: %dx.dot = call i16 @llvm.dx.udot.v3i16(<3 x i16> %0, <3 x i16> %1) |
35 | | -// NATIVE_HALF: ret i16 %dx.dot |
| 34 | +// NATIVE_HALF: %dot = call i16 @llvm.udot.v3i16(<3 x i16> %0, <3 x i16> %1) |
| 35 | +// NATIVE_HALF: ret i16 %dot |
36 | 36 | uint16_t test_dot_ushort3(uint16_t3 p0, uint16_t3 p1) { return dot(p0, p1); } |
37 | 37 |
|
38 | | -// NATIVE_HALF: %dx.dot = call i16 @llvm.dx.udot.v4i16(<4 x i16> %0, <4 x i16> %1) |
39 | | -// NATIVE_HALF: ret i16 %dx.dot |
| 38 | +// NATIVE_HALF: %dot = call i16 @llvm.udot.v4i16(<4 x i16> %0, <4 x i16> %1) |
| 39 | +// NATIVE_HALF: ret i16 %dot |
40 | 40 | uint16_t test_dot_ushort4(uint16_t4 p0, uint16_t4 p1) { return dot(p0, p1); } |
41 | 41 | #endif |
42 | 42 |
|
43 | | -// CHECK: %dx.dot = mul i32 %0, %1 |
44 | | -// CHECK: ret i32 %dx.dot |
| 43 | +// CHECK: %dot = mul i32 %0, %1 |
| 44 | +// CHECK: ret i32 %dot |
45 | 45 | int test_dot_int(int p0, int p1) { return dot(p0, p1); } |
46 | 46 |
|
47 | | -// CHECK: %dx.dot = call i32 @llvm.dx.sdot.v2i32(<2 x i32> %0, <2 x i32> %1) |
48 | | -// CHECK: ret i32 %dx.dot |
| 47 | +// CHECK: %dot = call i32 @llvm.sdot.v2i32(<2 x i32> %0, <2 x i32> %1) |
| 48 | +// CHECK: ret i32 %dot |
49 | 49 | int test_dot_int2(int2 p0, int2 p1) { return dot(p0, p1); } |
50 | 50 |
|
51 | | -// CHECK: %dx.dot = call i32 @llvm.dx.sdot.v3i32(<3 x i32> %0, <3 x i32> %1) |
52 | | -// CHECK: ret i32 %dx.dot |
| 51 | +// CHECK: %dot = call i32 @llvm.sdot.v3i32(<3 x i32> %0, <3 x i32> %1) |
| 52 | +// CHECK: ret i32 %dot |
53 | 53 | int test_dot_int3(int3 p0, int3 p1) { return dot(p0, p1); } |
54 | 54 |
|
55 | | -// CHECK: %dx.dot = call i32 @llvm.dx.sdot.v4i32(<4 x i32> %0, <4 x i32> %1) |
56 | | -// CHECK: ret i32 %dx.dot |
| 55 | +// CHECK: %dot = call i32 @llvm.sdot.v4i32(<4 x i32> %0, <4 x i32> %1) |
| 56 | +// CHECK: ret i32 %dot |
57 | 57 | int test_dot_int4(int4 p0, int4 p1) { return dot(p0, p1); } |
58 | 58 |
|
59 | | -// CHECK: %dx.dot = mul i32 %0, %1 |
60 | | -// CHECK: ret i32 %dx.dot |
| 59 | +// CHECK: %dot = mul i32 %0, %1 |
| 60 | +// CHECK: ret i32 %dot |
61 | 61 | uint test_dot_uint(uint p0, uint p1) { return dot(p0, p1); } |
62 | 62 |
|
63 | | -// CHECK: %dx.dot = call i32 @llvm.dx.udot.v2i32(<2 x i32> %0, <2 x i32> %1) |
64 | | -// CHECK: ret i32 %dx.dot |
| 63 | +// CHECK: %dot = call i32 @llvm.udot.v2i32(<2 x i32> %0, <2 x i32> %1) |
| 64 | +// CHECK: ret i32 %dot |
65 | 65 | uint test_dot_uint2(uint2 p0, uint2 p1) { return dot(p0, p1); } |
66 | 66 |
|
67 | | -// CHECK: %dx.dot = call i32 @llvm.dx.udot.v3i32(<3 x i32> %0, <3 x i32> %1) |
68 | | -// CHECK: ret i32 %dx.dot |
| 67 | +// CHECK: %dot = call i32 @llvm.udot.v3i32(<3 x i32> %0, <3 x i32> %1) |
| 68 | +// CHECK: ret i32 %dot |
69 | 69 | uint test_dot_uint3(uint3 p0, uint3 p1) { return dot(p0, p1); } |
70 | 70 |
|
71 | | -// CHECK: %dx.dot = call i32 @llvm.dx.udot.v4i32(<4 x i32> %0, <4 x i32> %1) |
72 | | -// CHECK: ret i32 %dx.dot |
| 71 | +// CHECK: %dot = call i32 @llvm.udot.v4i32(<4 x i32> %0, <4 x i32> %1) |
| 72 | +// CHECK: ret i32 %dot |
73 | 73 | uint test_dot_uint4(uint4 p0, uint4 p1) { return dot(p0, p1); } |
74 | 74 |
|
75 | | -// CHECK: %dx.dot = mul i64 %0, %1 |
76 | | -// CHECK: ret i64 %dx.dot |
| 75 | +// CHECK: %dot = mul i64 %0, %1 |
| 76 | +// CHECK: ret i64 %dot |
77 | 77 | int64_t test_dot_long(int64_t p0, int64_t p1) { return dot(p0, p1); } |
78 | 78 |
|
79 | | -// CHECK: %dx.dot = call i64 @llvm.dx.sdot.v2i64(<2 x i64> %0, <2 x i64> %1) |
80 | | -// CHECK: ret i64 %dx.dot |
| 79 | +// CHECK: %dot = call i64 @llvm.sdot.v2i64(<2 x i64> %0, <2 x i64> %1) |
| 80 | +// CHECK: ret i64 %dot |
81 | 81 | int64_t test_dot_long2(int64_t2 p0, int64_t2 p1) { return dot(p0, p1); } |
82 | 82 |
|
83 | | -// CHECK: %dx.dot = call i64 @llvm.dx.sdot.v3i64(<3 x i64> %0, <3 x i64> %1) |
84 | | -// CHECK: ret i64 %dx.dot |
| 83 | +// CHECK: %dot = call i64 @llvm.sdot.v3i64(<3 x i64> %0, <3 x i64> %1) |
| 84 | +// CHECK: ret i64 %dot |
85 | 85 | int64_t test_dot_long3(int64_t3 p0, int64_t3 p1) { return dot(p0, p1); } |
86 | 86 |
|
87 | | -// CHECK: %dx.dot = call i64 @llvm.dx.sdot.v4i64(<4 x i64> %0, <4 x i64> %1) |
88 | | -// CHECK: ret i64 %dx.dot |
| 87 | +// CHECK: %dot = call i64 @llvm.sdot.v4i64(<4 x i64> %0, <4 x i64> %1) |
| 88 | +// CHECK: ret i64 %dot |
89 | 89 | int64_t test_dot_long4(int64_t4 p0, int64_t4 p1) { return dot(p0, p1); } |
90 | 90 |
|
91 | | -// CHECK: %dx.dot = mul i64 %0, %1 |
92 | | -// CHECK: ret i64 %dx.dot |
| 91 | +// CHECK: %dot = mul i64 %0, %1 |
| 92 | +// CHECK: ret i64 %dot |
93 | 93 | uint64_t test_dot_ulong(uint64_t p0, uint64_t p1) { return dot(p0, p1); } |
94 | 94 |
|
95 | | -// CHECK: %dx.dot = call i64 @llvm.dx.udot.v2i64(<2 x i64> %0, <2 x i64> %1) |
96 | | -// CHECK: ret i64 %dx.dot |
| 95 | +// CHECK: %dot = call i64 @llvm.udot.v2i64(<2 x i64> %0, <2 x i64> %1) |
| 96 | +// CHECK: ret i64 %dot |
97 | 97 | uint64_t test_dot_ulong2(uint64_t2 p0, uint64_t2 p1) { return dot(p0, p1); } |
98 | 98 |
|
99 | | -// CHECK: %dx.dot = call i64 @llvm.dx.udot.v3i64(<3 x i64> %0, <3 x i64> %1) |
100 | | -// CHECK: ret i64 %dx.dot |
| 99 | +// CHECK: %dot = call i64 @llvm.udot.v3i64(<3 x i64> %0, <3 x i64> %1) |
| 100 | +// CHECK: ret i64 %dot |
101 | 101 | uint64_t test_dot_ulong3(uint64_t3 p0, uint64_t3 p1) { return dot(p0, p1); } |
102 | 102 |
|
103 | | -// CHECK: %dx.dot = call i64 @llvm.dx.udot.v4i64(<4 x i64> %0, <4 x i64> %1) |
104 | | -// CHECK: ret i64 %dx.dot |
| 103 | +// CHECK: %dot = call i64 @llvm.udot.v4i64(<4 x i64> %0, <4 x i64> %1) |
| 104 | +// CHECK: ret i64 %dot |
105 | 105 | uint64_t test_dot_ulong4(uint64_t4 p0, uint64_t4 p1) { return dot(p0, p1); } |
106 | 106 |
|
107 | | -// NATIVE_HALF: %dx.dot = fmul half %0, %1 |
108 | | -// NATIVE_HALF: ret half %dx.dot |
109 | | -// NO_HALF: %dx.dot = fmul float %0, %1 |
110 | | -// NO_HALF: ret float %dx.dot |
| 107 | +// NATIVE_HALF: %dot = fmul half %0, %1 |
| 108 | +// NATIVE_HALF: ret half %dot |
| 109 | +// NO_HALF: %dot = fmul float %0, %1 |
| 110 | +// NO_HALF: ret float %dot |
111 | 111 | half test_dot_half(half p0, half p1) { return dot(p0, p1); } |
112 | 112 |
|
113 | | -// NATIVE_HALF: %dx.dot = call half @llvm.dx.dot2.v2f16(<2 x half> %0, <2 x half> %1) |
114 | | -// NATIVE_HALF: ret half %dx.dot |
115 | | -// NO_HALF: %dx.dot = call float @llvm.dx.dot2.v2f32(<2 x float> %0, <2 x float> %1) |
116 | | -// NO_HALF: ret float %dx.dot |
| 113 | +// NATIVE_HALF: %dot = call half @llvm.fdot.v2f16(<2 x half> %0, <2 x half> %1) |
| 114 | +// NATIVE_HALF: ret half %dot |
| 115 | +// NO_HALF: %dot = call float @llvm.fdot.v2f32(<2 x float> %0, <2 x float> %1) |
| 116 | +// NO_HALF: ret float %dot |
117 | 117 | half test_dot_half2(half2 p0, half2 p1) { return dot(p0, p1); } |
118 | 118 |
|
119 | | -// NATIVE_HALF: %dx.dot = call half @llvm.dx.dot3.v3f16(<3 x half> %0, <3 x half> %1) |
120 | | -// NATIVE_HALF: ret half %dx.dot |
121 | | -// NO_HALF: %dx.dot = call float @llvm.dx.dot3.v3f32(<3 x float> %0, <3 x float> %1) |
122 | | -// NO_HALF: ret float %dx.dot |
| 119 | +// NATIVE_HALF: %dot = call half @llvm.fdot.v3f16(<3 x half> %0, <3 x half> %1) |
| 120 | +// NATIVE_HALF: ret half %dot |
| 121 | +// NO_HALF: %dot = call float @llvm.fdot.v3f32(<3 x float> %0, <3 x float> %1) |
| 122 | +// NO_HALF: ret float %dot |
123 | 123 | half test_dot_half3(half3 p0, half3 p1) { return dot(p0, p1); } |
124 | 124 |
|
125 | | -// NATIVE_HALF: %dx.dot = call half @llvm.dx.dot4.v4f16(<4 x half> %0, <4 x half> %1) |
126 | | -// NATIVE_HALF: ret half %dx.dot |
127 | | -// NO_HALF: %dx.dot = call float @llvm.dx.dot4.v4f32(<4 x float> %0, <4 x float> %1) |
128 | | -// NO_HALF: ret float %dx.dot |
| 125 | +// NATIVE_HALF: %dot = call half @llvm.fdot.v4f16(<4 x half> %0, <4 x half> %1) |
| 126 | +// NATIVE_HALF: ret half %dot |
| 127 | +// NO_HALF: %dot = call float @llvm.fdot.v4f32(<4 x float> %0, <4 x float> %1) |
| 128 | +// NO_HALF: ret float %dot |
129 | 129 | half test_dot_half4(half4 p0, half4 p1) { return dot(p0, p1); } |
130 | 130 |
|
131 | | -// CHECK: %dx.dot = fmul float %0, %1 |
132 | | -// CHECK: ret float %dx.dot |
| 131 | +// CHECK: %dot = fmul float %0, %1 |
| 132 | +// CHECK: ret float %dot |
133 | 133 | float test_dot_float(float p0, float p1) { return dot(p0, p1); } |
134 | 134 |
|
135 | | -// CHECK: %dx.dot = call float @llvm.dx.dot2.v2f32(<2 x float> %0, <2 x float> %1) |
136 | | -// CHECK: ret float %dx.dot |
| 135 | +// CHECK: %dot = call float @llvm.fdot.v2f32(<2 x float> %0, <2 x float> %1) |
| 136 | +// CHECK: ret float %dot |
137 | 137 | float test_dot_float2(float2 p0, float2 p1) { return dot(p0, p1); } |
138 | 138 |
|
139 | | -// CHECK: %dx.dot = call float @llvm.dx.dot3.v3f32(<3 x float> %0, <3 x float> %1) |
140 | | -// CHECK: ret float %dx.dot |
| 139 | +// CHECK: %dot = call float @llvm.fdot.v3f32(<3 x float> %0, <3 x float> %1) |
| 140 | +// CHECK: ret float %dot |
141 | 141 | float test_dot_float3(float3 p0, float3 p1) { return dot(p0, p1); } |
142 | 142 |
|
143 | | -// CHECK: %dx.dot = call float @llvm.dx.dot4.v4f32(<4 x float> %0, <4 x float> %1) |
144 | | -// CHECK: ret float %dx.dot |
| 143 | +// CHECK: %dot = call float @llvm.fdot.v4f32(<4 x float> %0, <4 x float> %1) |
| 144 | +// CHECK: ret float %dot |
145 | 145 | float test_dot_float4(float4 p0, float4 p1) { return dot(p0, p1); } |
146 | 146 |
|
147 | | -// CHECK: %dx.dot = call float @llvm.dx.dot2.v2f32(<2 x float> %splat.splat, <2 x float> %1) |
148 | | -// CHECK: ret float %dx.dot |
| 147 | +// CHECK: %dot = call float @llvm.fdot.v2f32(<2 x float> %splat.splat, <2 x float> %1) |
| 148 | +// CHECK: ret float %dot |
149 | 149 | float test_dot_float2_splat(float p0, float2 p1) { return dot(p0, p1); } |
150 | 150 |
|
151 | | -// CHECK: %dx.dot = call float @llvm.dx.dot3.v3f32(<3 x float> %splat.splat, <3 x float> %1) |
152 | | -// CHECK: ret float %dx.dot |
| 151 | +// CHECK: %dot = call float @llvm.fdot.v3f32(<3 x float> %splat.splat, <3 x float> %1) |
| 152 | +// CHECK: ret float %dot |
153 | 153 | float test_dot_float3_splat(float p0, float3 p1) { return dot(p0, p1); } |
154 | 154 |
|
155 | | -// CHECK: %dx.dot = call float @llvm.dx.dot4.v4f32(<4 x float> %splat.splat, <4 x float> %1) |
156 | | -// CHECK: ret float %dx.dot |
| 155 | +// CHECK: %dot = call float @llvm.fdot.v4f32(<4 x float> %splat.splat, <4 x float> %1) |
| 156 | +// CHECK: ret float %dot |
157 | 157 | float test_dot_float4_splat(float p0, float4 p1) { return dot(p0, p1); } |
158 | 158 |
|
159 | | -// CHECK: %dx.dot = fmul double %0, %1 |
160 | | -// CHECK: ret double %dx.dot |
| 159 | +// CHECK: %dot = fmul double %0, %1 |
| 160 | +// CHECK: ret double %dot |
161 | 161 | double test_dot_double(double p0, double p1) { return dot(p0, p1); } |
0 commit comments