@@ -206,10 +206,11 @@ UR_APIEXPORT ur_result_t UR_APICALL urDeviceGetInfo(ur_device_handle_t hDevice,
206
206
return ReturnValue (Atomic64);
207
207
}
208
208
case UR_DEVICE_INFO_ATOMIC_MEMORY_ORDER_CAPABILITIES: {
209
- uint64_t Capabilities = UR_MEMORY_ORDER_CAPABILITY_FLAG_RELAXED |
210
- UR_MEMORY_ORDER_CAPABILITY_FLAG_ACQUIRE |
211
- UR_MEMORY_ORDER_CAPABILITY_FLAG_RELEASE |
212
- UR_MEMORY_ORDER_CAPABILITY_FLAG_ACQ_REL;
209
+ ur_memory_order_capability_flags_t Capabilities =
210
+ UR_MEMORY_ORDER_CAPABILITY_FLAG_RELAXED |
211
+ UR_MEMORY_ORDER_CAPABILITY_FLAG_ACQUIRE |
212
+ UR_MEMORY_ORDER_CAPABILITY_FLAG_RELEASE |
213
+ UR_MEMORY_ORDER_CAPABILITY_FLAG_ACQ_REL;
213
214
return ReturnValue (Capabilities);
214
215
}
215
216
case UR_DEVICE_INFO_ATOMIC_MEMORY_SCOPE_CAPABILITIES: {
@@ -315,7 +316,7 @@ UR_APIEXPORT ur_result_t UR_APICALL urDeviceGetInfo(ur_device_handle_t hDevice,
315
316
" runtime." );
316
317
}
317
318
318
- return ReturnValue (uint32_t { Enabled} );
319
+ return ReturnValue (Enabled);
319
320
}
320
321
case UR_DEVICE_INFO_MAX_READ_IMAGE_ARGS: {
321
322
// This call doesn't match to CUDA as it doesn't have images, but instead
@@ -473,7 +474,7 @@ UR_APIEXPORT ur_result_t UR_APICALL urDeviceGetInfo(ur_device_handle_t hDevice,
473
474
}
474
475
case UR_DEVICE_INFO_SINGLE_FP_CONFIG: {
475
476
// TODO: is this config consistent across all NVIDIA GPUs?
476
- uint64_t Config =
477
+ ur_device_fp_capability_flags_t Config =
477
478
UR_DEVICE_FP_CAPABILITY_FLAG_DENORM |
478
479
UR_DEVICE_FP_CAPABILITY_FLAG_INF_NAN |
479
480
UR_DEVICE_FP_CAPABILITY_FLAG_ROUND_TO_NEAREST |
@@ -485,12 +486,13 @@ UR_APIEXPORT ur_result_t UR_APICALL urDeviceGetInfo(ur_device_handle_t hDevice,
485
486
}
486
487
case UR_DEVICE_INFO_DOUBLE_FP_CONFIG: {
487
488
// TODO: is this config consistent across all NVIDIA GPUs?
488
- uint64_t Config = UR_DEVICE_FP_CAPABILITY_FLAG_DENORM |
489
- UR_DEVICE_FP_CAPABILITY_FLAG_INF_NAN |
490
- UR_DEVICE_FP_CAPABILITY_FLAG_ROUND_TO_NEAREST |
491
- UR_DEVICE_FP_CAPABILITY_FLAG_ROUND_TO_ZERO |
492
- UR_DEVICE_FP_CAPABILITY_FLAG_ROUND_TO_INF |
493
- UR_DEVICE_FP_CAPABILITY_FLAG_FMA;
489
+ ur_device_fp_capability_flags_t Config =
490
+ UR_DEVICE_FP_CAPABILITY_FLAG_DENORM |
491
+ UR_DEVICE_FP_CAPABILITY_FLAG_INF_NAN |
492
+ UR_DEVICE_FP_CAPABILITY_FLAG_ROUND_TO_NEAREST |
493
+ UR_DEVICE_FP_CAPABILITY_FLAG_ROUND_TO_ZERO |
494
+ UR_DEVICE_FP_CAPABILITY_FLAG_ROUND_TO_INF |
495
+ UR_DEVICE_FP_CAPABILITY_FLAG_FMA;
494
496
return ReturnValue (Config);
495
497
}
496
498
case UR_DEVICE_INFO_GLOBAL_MEM_CACHE_TYPE: {
@@ -600,13 +602,13 @@ UR_APIEXPORT ur_result_t UR_APICALL urDeviceGetInfo(ur_device_handle_t hDevice,
600
602
UR_QUEUE_FLAG_PROFILING_ENABLE));
601
603
case UR_DEVICE_INFO_QUEUE_ON_DEVICE_PROPERTIES: {
602
604
// The mandated minimum capability:
603
- uint64_t Capability = UR_QUEUE_FLAG_PROFILING_ENABLE |
604
- UR_QUEUE_FLAG_OUT_OF_ORDER_EXEC_MODE_ENABLE;
605
+ ur_queue_flags_t Capability = UR_QUEUE_FLAG_PROFILING_ENABLE |
606
+ UR_QUEUE_FLAG_OUT_OF_ORDER_EXEC_MODE_ENABLE;
605
607
return ReturnValue (Capability);
606
608
}
607
609
case UR_DEVICE_INFO_QUEUE_ON_HOST_PROPERTIES: {
608
610
// The mandated minimum capability:
609
- uint64_t Capability = UR_QUEUE_FLAG_PROFILING_ENABLE;
611
+ ur_queue_flags_t Capability = UR_QUEUE_FLAG_PROFILING_ENABLE;
610
612
return ReturnValue (Capability);
611
613
}
612
614
case UR_DEVICE_INFO_BUILT_IN_KERNELS: {
@@ -934,7 +936,7 @@ UR_APIEXPORT ur_result_t UR_APICALL urDeviceGetInfo(ur_device_handle_t hDevice,
934
936
hDevice->get ()) == CUDA_SUCCESS);
935
937
}
936
938
937
- uint64_t MemoryBandwidth = uint64_t ( MemoryClockKHz) * MemoryBusWidth * 250 ;
939
+ uint32_t MemoryBandwidth = MemoryClockKHz * MemoryBusWidth * 250 ;
938
940
939
941
return ReturnValue (MemoryBandwidth);
940
942
}
@@ -996,13 +998,14 @@ UR_APIEXPORT ur_result_t UR_APICALL urDeviceGetInfo(ur_device_handle_t hDevice,
996
998
case UR_DEVICE_INFO_KERNEL_SET_SPECIALIZATION_CONSTANTS:
997
999
return ReturnValue (false );
998
1000
// TODO: Investigate if this information is available on CUDA.
1001
+ case UR_DEVICE_INFO_MAX_READ_WRITE_IMAGE_ARGS:
999
1002
case UR_DEVICE_INFO_GPU_EU_COUNT:
1000
1003
case UR_DEVICE_INFO_GPU_EU_SIMD_WIDTH:
1001
1004
case UR_DEVICE_INFO_GPU_EU_SLICES:
1002
1005
case UR_DEVICE_INFO_GPU_SUBSLICES_PER_SLICE:
1003
1006
case UR_DEVICE_INFO_GPU_EU_COUNT_PER_SUBSLICE:
1004
1007
case UR_DEVICE_INFO_GPU_HW_THREADS_PER_EU:
1005
- return UR_RESULT_ERROR_INVALID_ENUMERATION ;
1008
+ return UR_RESULT_ERROR_UNSUPPORTED_ENUMERATION ;
1006
1009
1007
1010
default :
1008
1011
break ;
0 commit comments