Skip to content

Commit 261fde4

Browse files
committed
[SYCL][CUDA][HIP][libclc] Rename libclc NonUniform binops to KHR extensions
#5705 switched the group binary operators from the NonUniform variants to the KHR extension operators. This commit renames the corresponding libclc implementations for both amdgcn and PTX to match the new naming. Signed-off-by: Larsen, Steffen <[email protected]>
1 parent c0e36bd commit 261fde4

File tree

2 files changed

+33
-34
lines changed

2 files changed

+33
-34
lines changed

libclc/amdgcn-amdhsa/libspirv/group/collectives.cl

Lines changed: 10 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -235,16 +235,16 @@ __CLC_GROUP_COLLECTIVE(FAdd, __CLC_ADD, float, 0)
235235
__CLC_GROUP_COLLECTIVE(FAdd, __CLC_ADD, double, 0)
236236

237237
// There is no Mul group op in core SPIR-V, use the KHR extension variant instead.
238-
__CLC_GROUP_COLLECTIVE(NonUniformIMul, IMul, __CLC_MUL, char, 1)
239-
__CLC_GROUP_COLLECTIVE(NonUniformIMul, IMul, __CLC_MUL, uchar, 1)
240-
__CLC_GROUP_COLLECTIVE(NonUniformIMul, IMul, __CLC_MUL, short, 1)
241-
__CLC_GROUP_COLLECTIVE(NonUniformIMul, IMul, __CLC_MUL, ushort, 1)
242-
__CLC_GROUP_COLLECTIVE(NonUniformIMul, IMul, __CLC_MUL, int, 1)
243-
__CLC_GROUP_COLLECTIVE(NonUniformIMul, IMul, __CLC_MUL, uint, 1)
244-
__CLC_GROUP_COLLECTIVE(NonUniformIMul, IMul, __CLC_MUL, long, 1)
245-
__CLC_GROUP_COLLECTIVE(NonUniformIMul, IMul, __CLC_MUL, ulong, 1)
246-
__CLC_GROUP_COLLECTIVE(NonUniformFMul, FMul, __CLC_MUL, float, 1)
247-
__CLC_GROUP_COLLECTIVE(NonUniformFMul, FMul, __CLC_MUL, double, 1)
238+
__CLC_GROUP_COLLECTIVE(IMulKHR, IMul, __CLC_MUL, char, 1)
239+
__CLC_GROUP_COLLECTIVE(IMulKHR, IMul, __CLC_MUL, uchar, 1)
240+
__CLC_GROUP_COLLECTIVE(IMulKHR, IMul, __CLC_MUL, short, 1)
241+
__CLC_GROUP_COLLECTIVE(IMulKHR, IMul, __CLC_MUL, ushort, 1)
242+
__CLC_GROUP_COLLECTIVE(IMulKHR, IMul, __CLC_MUL, int, 1)
243+
__CLC_GROUP_COLLECTIVE(IMulKHR, IMul, __CLC_MUL, uint, 1)
244+
__CLC_GROUP_COLLECTIVE(IMulKHR, IMul, __CLC_MUL, long, 1)
245+
__CLC_GROUP_COLLECTIVE(IMulKHR, IMul, __CLC_MUL, ulong, 1)
246+
__CLC_GROUP_COLLECTIVE(FMulKHR, FMul, __CLC_MUL, float, 1)
247+
__CLC_GROUP_COLLECTIVE(FMulKHR, FMul, __CLC_MUL, double, 1)
248248

249249
__CLC_GROUP_COLLECTIVE(SMin, __CLC_MIN, char, CHAR_MAX)
250250
__CLC_GROUP_COLLECTIVE(UMin, __CLC_MIN, uchar, UCHAR_MAX)

libclc/ptx-nvidiacl/libspirv/group/collectives.cl

Lines changed: 23 additions & 24 deletions
Original file line numberDiff line numberDiff line change
@@ -249,12 +249,12 @@ __CLC_SUBGROUP_COLLECTIVE(FMax, __CLC_MAX, half, -HALF_MAX)
249249
__CLC_SUBGROUP_COLLECTIVE(FMax, __CLC_MAX, float, -FLT_MAX)
250250
__CLC_SUBGROUP_COLLECTIVE(FMax, __CLC_MAX, double, -DBL_MAX)
251251

252-
__CLC_SUBGROUP_COLLECTIVE_REDUX(NonUniformBitwiseAnd, __CLC_AND, and, uint, ~0)
253-
__CLC_SUBGROUP_COLLECTIVE_REDUX(NonUniformBitwiseOr, __CLC_OR, or, uint, 0)
254-
__CLC_SUBGROUP_COLLECTIVE_REDUX(NonUniformBitwiseXor, __CLC_XOR, xor, uint, 0)
255-
__CLC_SUBGROUP_COLLECTIVE_REDUX(NonUniformBitwiseAnd, __CLC_AND, and, int, ~0)
256-
__CLC_SUBGROUP_COLLECTIVE_REDUX(NonUniformBitwiseOr, __CLC_OR, or, int, 0)
257-
__CLC_SUBGROUP_COLLECTIVE_REDUX(NonUniformBitwiseXor, __CLC_XOR, xor, int, 0)
252+
__CLC_SUBGROUP_COLLECTIVE_REDUX(BitwiseAndKHR, __CLC_AND, and, uint, ~0)
253+
__CLC_SUBGROUP_COLLECTIVE_REDUX(BitwiseOrKHR, __CLC_OR, or, uint, 0)
254+
__CLC_SUBGROUP_COLLECTIVE_REDUX(BitwiseXorKHR, __CLC_XOR, xor, uint, 0)
255+
__CLC_SUBGROUP_COLLECTIVE_REDUX(BitwiseAndKHR, __CLC_AND, and, int, ~0)
256+
__CLC_SUBGROUP_COLLECTIVE_REDUX(BitwiseOrKHR, __CLC_OR, or, int, 0)
257+
__CLC_SUBGROUP_COLLECTIVE_REDUX(BitwiseXorKHR, __CLC_XOR, xor, int, 0)
258258

259259
#undef __CLC_SUBGROUP_COLLECTIVE_BODY
260260
#undef __CLC_SUBGROUP_COLLECTIVE
@@ -340,18 +340,17 @@ __CLC_GROUP_COLLECTIVE(FAdd, __CLC_ADD, half, 0)
340340
__CLC_GROUP_COLLECTIVE(FAdd, __CLC_ADD, float, 0)
341341
__CLC_GROUP_COLLECTIVE(FAdd, __CLC_ADD, double, 0)
342342

343-
// There is no Mul group op in SPIR-V, use non-uniform variant instead.
344-
__CLC_GROUP_COLLECTIVE(NonUniformIMul, IMul, __CLC_MUL, char, 1)
345-
__CLC_GROUP_COLLECTIVE(NonUniformIMul, IMul, __CLC_MUL, uchar, 1)
346-
__CLC_GROUP_COLLECTIVE(NonUniformIMul, IMul, __CLC_MUL, short, 1)
347-
__CLC_GROUP_COLLECTIVE(NonUniformIMul, IMul, __CLC_MUL, ushort, 1)
348-
__CLC_GROUP_COLLECTIVE(NonUniformIMul, IMul, __CLC_MUL, int, 1)
349-
__CLC_GROUP_COLLECTIVE(NonUniformIMul, IMul, __CLC_MUL, uint, 1)
350-
__CLC_GROUP_COLLECTIVE(NonUniformIMul, IMul, __CLC_MUL, long, 1)
351-
__CLC_GROUP_COLLECTIVE(NonUniformIMul, IMul, __CLC_MUL, ulong, 1)
352-
__CLC_GROUP_COLLECTIVE(NonUniformFMul, FMul, __CLC_MUL, half, 1)
353-
__CLC_GROUP_COLLECTIVE(NonUniformFMul, FMul, __CLC_MUL, float, 1)
354-
__CLC_GROUP_COLLECTIVE(NonUniformFMul, FMul, __CLC_MUL, double, 1)
343+
__CLC_GROUP_COLLECTIVE(IMulKHR, IMul, __CLC_MUL, char, 1)
344+
__CLC_GROUP_COLLECTIVE(IMulKHR, IMul, __CLC_MUL, uchar, 1)
345+
__CLC_GROUP_COLLECTIVE(IMulKHR, IMul, __CLC_MUL, short, 1)
346+
__CLC_GROUP_COLLECTIVE(IMulKHR, IMul, __CLC_MUL, ushort, 1)
347+
__CLC_GROUP_COLLECTIVE(IMulKHR, IMul, __CLC_MUL, int, 1)
348+
__CLC_GROUP_COLLECTIVE(IMulKHR, IMul, __CLC_MUL, uint, 1)
349+
__CLC_GROUP_COLLECTIVE(IMulKHR, IMul, __CLC_MUL, long, 1)
350+
__CLC_GROUP_COLLECTIVE(IMulKHR, IMul, __CLC_MUL, ulong, 1)
351+
__CLC_GROUP_COLLECTIVE(FMulKHR, FMul, __CLC_MUL, half, 1)
352+
__CLC_GROUP_COLLECTIVE(FMulKHR, FMul, __CLC_MUL, float, 1)
353+
__CLC_GROUP_COLLECTIVE(FMulKHR, FMul, __CLC_MUL, double, 1)
355354

356355
__CLC_GROUP_COLLECTIVE(SMin, __CLC_MIN, char, CHAR_MAX)
357356
__CLC_GROUP_COLLECTIVE(UMin, __CLC_MIN, uchar, UCHAR_MAX)
@@ -377,12 +376,12 @@ __CLC_GROUP_COLLECTIVE(FMax, __CLC_MAX, half, -HALF_MAX)
377376
__CLC_GROUP_COLLECTIVE(FMax, __CLC_MAX, float, -FLT_MAX)
378377
__CLC_GROUP_COLLECTIVE(FMax, __CLC_MAX, double, -DBL_MAX)
379378

380-
__CLC_GROUP_COLLECTIVE(NonUniformBitwiseAnd, __CLC_AND, uint, ~0)
381-
__CLC_GROUP_COLLECTIVE(NonUniformBitwiseOr, __CLC_OR, uint, 0)
382-
__CLC_GROUP_COLLECTIVE(NonUniformBitwiseXor, __CLC_XOR, uint, 0)
383-
__CLC_GROUP_COLLECTIVE(NonUniformBitwiseAnd, __CLC_AND, int, ~0)
384-
__CLC_GROUP_COLLECTIVE(NonUniformBitwiseOr, __CLC_OR, int, 0)
385-
__CLC_GROUP_COLLECTIVE(NonUniformBitwiseXor, __CLC_XOR, int, 0)
379+
__CLC_GROUP_COLLECTIVE(BitwiseAndKHR, __CLC_AND, uint, ~0)
380+
__CLC_GROUP_COLLECTIVE(BitwiseOrKHR, __CLC_OR, uint, 0)
381+
__CLC_GROUP_COLLECTIVE(BitwiseXorKHR, __CLC_XOR, uint, 0)
382+
__CLC_GROUP_COLLECTIVE(BitwiseAndKHR, __CLC_AND, int, ~0)
383+
__CLC_GROUP_COLLECTIVE(BitwiseOrKHR, __CLC_OR, int, 0)
384+
__CLC_GROUP_COLLECTIVE(BitwiseXorKHR, __CLC_XOR, int, 0)
386385

387386
// half requires additional mangled entry points
388387
_CLC_DEF _CLC_CONVERGENT half _Z17__spirv_GroupFAddjjDF16_(uint scope, uint op,

0 commit comments

Comments
 (0)