Skip to content

Commit ad65f36

Browse files
authored
Remove unused class templates from __parallel_for_large_submitter (#2124)
Signed-off-by: Matthew Michel <[email protected]>
1 parent 6392c4a commit ad65f36

File tree

1 file changed

+4
-4
lines changed

1 file changed

+4
-4
lines changed

include/oneapi/dpl/pstl/hetero/dpcpp/parallel_backend_sycl_for.h

+4 -4
Original file line number | Diff line number | Diff line change
@@ -77,11 +77,11 @@ struct __parallel_for_small_submitter<__internal::__optional_kernel_name<_Name..
7777
}
7878
};
7979

80-
template <typename _KernelName, typename... _RangeTypes>
80+
template <typename _KernelName>
8181
struct __parallel_for_large_submitter;
8282

83-
template <typename... _Name, typename... _RangeTypes>
84-
struct __parallel_for_large_submitter<__internal::__optional_kernel_name<_Name...>, _RangeTypes...>
83+
template <typename... _Name>
84+
struct __parallel_for_large_submitter<__internal::__optional_kernel_name<_Name...>>
8585
{
8686
// Limit the work-group size to 512 which has empirically yielded the best results across different architectures.
8787
static constexpr std::uint16_t __max_work_group_size = 512;
@@ -186,7 +186,7 @@ __parallel_for(oneapi::dpl::__internal::__device_backend_tag, _ExecutionPolicy&&
186186
oneapi::dpl::__par_backend_hetero::__internal::__kernel_name_provider<__parallel_for_large_kernel<_CustomName>>;
187187

188188
using __small_submitter = __parallel_for_small_submitter<_ForKernelSmall>;
189-
using __large_submitter = __parallel_for_large_submitter<_ForKernelLarge, _Ranges...>;
189+
using __large_submitter = __parallel_for_large_submitter<_ForKernelLarge>;
190190
// Compile two kernels: one for small-to-medium inputs and a second for large. This avoids runtime checks within a
191191
// single kernel that worsen performance for small cases. If the number of iterations of the large submitter is 1,
192192
// then only compile the basic kernel as the two versions are effectively the same.

0 commit comments

Comments
 (0)