Skip to content

Commit

Permalink
Pass sg_size for Intel PVC
Browse files Browse the repository at this point in the history
  • Loading branch information
muhammad-tanvir-1211 committed May 15, 2024
1 parent c3ec983 commit a602f78
Showing 1 changed file with 4 additions and 0 deletions.
4 changes: 4 additions & 0 deletions include/cutlass/gemm/device/gemm_universal_adapter.h
Original file line number Diff line number Diff line change
Expand Up @@ -402,7 +402,11 @@ class GemmUniversalAdapter<
// Repackage the launch dimensions (block/grid x, y, z) as syclcompat::dim3 values
// for the SYCL launch calls below.
const auto sycl_block = syclcompat::dim3(block.x, block.y, block.z);
const auto sycl_grid = syclcompat::dim3(grid.x, grid.y, grid.z);

// When SYCL_INTEL_TARGET is defined, use the experimental launch entry point, which
// takes an extra compile-time argument (16) after the kernel.
// NOTE(review): 16 is presumably the sub-group size (sg_size) required on Intel PVC --
// confirm it is valid for every device this macro covers.
#if defined (SYCL_INTEL_TARGET)
syclcompat::experimental::launch<device_kernel<GemmKernel>, 16>(sycl_grid, sycl_block, smem_size, params);
#else
// All other SYCL targets: regular launch with no explicit compile-time size argument.
syclcompat::launch<device_kernel<GemmKernel>>(sycl_grid, sycl_block, smem_size, params);
#endif
#else
device_kernel<GemmKernel><<<grid, block, smem_size, stream>>>(params);
#endif
Expand Down

0 comments on commit a602f78

Please sign in to comment.