File tree Expand file tree Collapse file tree 1 file changed +4
-3
lines changed Expand file tree Collapse file tree 1 file changed +4
-3
lines changed Original file line number Diff line number Diff line change @@ -55,9 +55,10 @@ __SYCL_EXPORT uint32_t reduGetMaxNumConcurrentWorkGroups(
55
55
std::shared_ptr<sycl::detail::queue_impl> Queue) {
56
56
device Dev = Queue->get_device ();
57
57
uint32_t NumThreads = Dev.get_info <info::device::max_compute_units>();
58
- // The heuristics require additional tuning for various devices and vendors.
59
- // For now assuming that each of execution units have about 8 working threads
60
- // gives good results on some known/supported GPU devices.
58
+ // TODO: The heuristics here require additional tuning for various devices
59
+ // and vendors. For now this code assumes that execution units have about
60
+ // 8 working threads, which gives good results on some known/supported
61
+ // GPU devices.
61
62
if (Dev.is_gpu ())
62
63
NumThreads *= 8 ;
63
64
return NumThreads;
You can’t perform that action at this time.
0 commit comments