@@ -213,17 +213,17 @@ __CLC_SUBGROUP_COLLECTIVE(FAdd, __CLC_ADD, half, 0)
213
213
__CLC_SUBGROUP_COLLECTIVE (FAdd , __CLC_ADD , float , 0 )
214
214
__CLC_SUBGROUP_COLLECTIVE (FAdd , __CLC_ADD , double , 0 )
215
215
216
- __CLC_SUBGROUP_COLLECTIVE (IMul , __CLC_MUL , char , 1 )
217
- __CLC_SUBGROUP_COLLECTIVE (IMul , __CLC_MUL , uchar , 1 )
218
- __CLC_SUBGROUP_COLLECTIVE (IMul , __CLC_MUL , short , 1 )
219
- __CLC_SUBGROUP_COLLECTIVE (IMul , __CLC_MUL , ushort , 1 )
220
- __CLC_SUBGROUP_COLLECTIVE (IMul , __CLC_MUL , int , 1 )
221
- __CLC_SUBGROUP_COLLECTIVE (IMul , __CLC_MUL , uint , 1 )
222
- __CLC_SUBGROUP_COLLECTIVE (IMul , __CLC_MUL , long , 1 )
223
- __CLC_SUBGROUP_COLLECTIVE (IMul , __CLC_MUL , ulong , 1 )
224
- __CLC_SUBGROUP_COLLECTIVE (FMul , __CLC_MUL , half , 1 )
225
- __CLC_SUBGROUP_COLLECTIVE (FMul , __CLC_MUL , float , 1 )
226
- __CLC_SUBGROUP_COLLECTIVE (FMul , __CLC_MUL , double , 1 )
216
+ __CLC_SUBGROUP_COLLECTIVE (IMulKHR , __CLC_MUL , char , 1 )
217
+ __CLC_SUBGROUP_COLLECTIVE (IMulKHR , __CLC_MUL , uchar , 1 )
218
+ __CLC_SUBGROUP_COLLECTIVE (IMulKHR , __CLC_MUL , short , 1 )
219
+ __CLC_SUBGROUP_COLLECTIVE (IMulKHR , __CLC_MUL , ushort , 1 )
220
+ __CLC_SUBGROUP_COLLECTIVE (IMulKHR , __CLC_MUL , int , 1 )
221
+ __CLC_SUBGROUP_COLLECTIVE (IMulKHR , __CLC_MUL , uint , 1 )
222
+ __CLC_SUBGROUP_COLLECTIVE (IMulKHR , __CLC_MUL , long , 1 )
223
+ __CLC_SUBGROUP_COLLECTIVE (IMulKHR , __CLC_MUL , ulong , 1 )
224
+ __CLC_SUBGROUP_COLLECTIVE (FMulKHR , __CLC_MUL , half , 1 )
225
+ __CLC_SUBGROUP_COLLECTIVE (FMulKHR , __CLC_MUL , float , 1 )
226
+ __CLC_SUBGROUP_COLLECTIVE (FMulKHR , __CLC_MUL , double , 1 )
227
227
228
228
__CLC_SUBGROUP_COLLECTIVE (SMin , __CLC_MIN , char , CHAR_MAX )
229
229
__CLC_SUBGROUP_COLLECTIVE (UMin , __CLC_MIN , uchar , UCHAR_MAX )
@@ -249,12 +249,12 @@ __CLC_SUBGROUP_COLLECTIVE(FMax, __CLC_MAX, half, -HALF_MAX)
249
249
__CLC_SUBGROUP_COLLECTIVE (FMax , __CLC_MAX , float , - FLT_MAX )
250
250
__CLC_SUBGROUP_COLLECTIVE (FMax , __CLC_MAX , double , - DBL_MAX )
251
251
252
- __CLC_SUBGROUP_COLLECTIVE_REDUX (NonUniformBitwiseAnd , __CLC_AND , and , uint , ~0 )
253
- __CLC_SUBGROUP_COLLECTIVE_REDUX (NonUniformBitwiseOr , __CLC_OR , or , uint , 0 )
254
- __CLC_SUBGROUP_COLLECTIVE_REDUX (NonUniformBitwiseXor , __CLC_XOR , xor , uint , 0 )
255
- __CLC_SUBGROUP_COLLECTIVE_REDUX (NonUniformBitwiseAnd , __CLC_AND , and , int , ~0 )
256
- __CLC_SUBGROUP_COLLECTIVE_REDUX (NonUniformBitwiseOr , __CLC_OR , or , int , 0 )
257
- __CLC_SUBGROUP_COLLECTIVE_REDUX (NonUniformBitwiseXor , __CLC_XOR , xor , int , 0 )
252
+ __CLC_SUBGROUP_COLLECTIVE_REDUX (BitwiseAndKHR , __CLC_AND , and , uint , ~0 )
253
+ __CLC_SUBGROUP_COLLECTIVE_REDUX (BitwiseOrKHR , __CLC_OR , or , uint , 0 )
254
+ __CLC_SUBGROUP_COLLECTIVE_REDUX (BitwiseXorKHR , __CLC_XOR , xor , uint , 0 )
255
+ __CLC_SUBGROUP_COLLECTIVE_REDUX (BitwiseAndKHR , __CLC_AND , and , int , ~0 )
256
+ __CLC_SUBGROUP_COLLECTIVE_REDUX (BitwiseOrKHR , __CLC_OR , or , int , 0 )
257
+ __CLC_SUBGROUP_COLLECTIVE_REDUX (BitwiseXorKHR , __CLC_XOR , xor , int , 0 )
258
258
259
259
#undef __CLC_SUBGROUP_COLLECTIVE_BODY
260
260
#undef __CLC_SUBGROUP_COLLECTIVE
@@ -340,18 +340,17 @@ __CLC_GROUP_COLLECTIVE(FAdd, __CLC_ADD, half, 0)
340
340
__CLC_GROUP_COLLECTIVE (FAdd , __CLC_ADD , float , 0 )
341
341
__CLC_GROUP_COLLECTIVE (FAdd , __CLC_ADD , double , 0 )
342
342
343
- // There is no Mul group op in SPIR-V, use non-uniform variant instead.
344
- __CLC_GROUP_COLLECTIVE (NonUniformIMul , IMul , __CLC_MUL , char , 1 )
345
- __CLC_GROUP_COLLECTIVE (NonUniformIMul , IMul , __CLC_MUL , uchar , 1 )
346
- __CLC_GROUP_COLLECTIVE (NonUniformIMul , IMul , __CLC_MUL , short , 1 )
347
- __CLC_GROUP_COLLECTIVE (NonUniformIMul , IMul , __CLC_MUL , ushort , 1 )
348
- __CLC_GROUP_COLLECTIVE (NonUniformIMul , IMul , __CLC_MUL , int , 1 )
349
- __CLC_GROUP_COLLECTIVE (NonUniformIMul , IMul , __CLC_MUL , uint , 1 )
350
- __CLC_GROUP_COLLECTIVE (NonUniformIMul , IMul , __CLC_MUL , long , 1 )
351
- __CLC_GROUP_COLLECTIVE (NonUniformIMul , IMul , __CLC_MUL , ulong , 1 )
352
- __CLC_GROUP_COLLECTIVE (NonUniformFMul , FMul , __CLC_MUL , half , 1 )
353
- __CLC_GROUP_COLLECTIVE (NonUniformFMul , FMul , __CLC_MUL , float , 1 )
354
- __CLC_GROUP_COLLECTIVE (NonUniformFMul , FMul , __CLC_MUL , double , 1 )
343
+ __CLC_GROUP_COLLECTIVE (IMulKHR , __CLC_MUL , char , 1 )
344
+ __CLC_GROUP_COLLECTIVE (IMulKHR , __CLC_MUL , uchar , 1 )
345
+ __CLC_GROUP_COLLECTIVE (IMulKHR , __CLC_MUL , short , 1 )
346
+ __CLC_GROUP_COLLECTIVE (IMulKHR , __CLC_MUL , ushort , 1 )
347
+ __CLC_GROUP_COLLECTIVE (IMulKHR , __CLC_MUL , int , 1 )
348
+ __CLC_GROUP_COLLECTIVE (IMulKHR , __CLC_MUL , uint , 1 )
349
+ __CLC_GROUP_COLLECTIVE (IMulKHR , __CLC_MUL , long , 1 )
350
+ __CLC_GROUP_COLLECTIVE (IMulKHR , __CLC_MUL , ulong , 1 )
351
+ __CLC_GROUP_COLLECTIVE (FMulKHR , __CLC_MUL , half , 1 )
352
+ __CLC_GROUP_COLLECTIVE (FMulKHR , __CLC_MUL , float , 1 )
353
+ __CLC_GROUP_COLLECTIVE (FMulKHR , __CLC_MUL , double , 1 )
355
354
356
355
__CLC_GROUP_COLLECTIVE (SMin , __CLC_MIN , char , CHAR_MAX )
357
356
__CLC_GROUP_COLLECTIVE (UMin , __CLC_MIN , uchar , UCHAR_MAX )
@@ -377,12 +376,12 @@ __CLC_GROUP_COLLECTIVE(FMax, __CLC_MAX, half, -HALF_MAX)
377
376
__CLC_GROUP_COLLECTIVE (FMax , __CLC_MAX , float , - FLT_MAX )
378
377
__CLC_GROUP_COLLECTIVE (FMax , __CLC_MAX , double , - DBL_MAX )
379
378
380
- __CLC_GROUP_COLLECTIVE (NonUniformBitwiseAnd , __CLC_AND , uint , ~0 )
381
- __CLC_GROUP_COLLECTIVE (NonUniformBitwiseOr , __CLC_OR , uint , 0 )
382
- __CLC_GROUP_COLLECTIVE (NonUniformBitwiseXor , __CLC_XOR , uint , 0 )
383
- __CLC_GROUP_COLLECTIVE (NonUniformBitwiseAnd , __CLC_AND , int , ~0 )
384
- __CLC_GROUP_COLLECTIVE (NonUniformBitwiseOr , __CLC_OR , int , 0 )
385
- __CLC_GROUP_COLLECTIVE (NonUniformBitwiseXor , __CLC_XOR , int , 0 )
379
+ __CLC_GROUP_COLLECTIVE (BitwiseAndKHR , __CLC_AND , uint , ~0 )
380
+ __CLC_GROUP_COLLECTIVE (BitwiseOrKHR , __CLC_OR , uint , 0 )
381
+ __CLC_GROUP_COLLECTIVE (BitwiseXorKHR , __CLC_XOR , uint , 0 )
382
+ __CLC_GROUP_COLLECTIVE (BitwiseAndKHR , __CLC_AND , int , ~0 )
383
+ __CLC_GROUP_COLLECTIVE (BitwiseOrKHR , __CLC_OR , int , 0 )
384
+ __CLC_GROUP_COLLECTIVE (BitwiseXorKHR , __CLC_XOR , int , 0 )
386
385
387
386
// half requires additional mangled entry points
388
387
_CLC_DEF _CLC_CONVERGENT half _Z17__spirv_GroupFAddjjDF16_ (uint scope , uint op ,
0 commit comments