Fix for public issue #211
- Add a slice-K tile size to the profiler
- Fix the warp-count calculation in the implicit GEMM header
This commit is contained in:
@@ -74,7 +74,8 @@ public:
|
||||
|
||||
 static int const kWarpCount =
   (ThreadblockShape::kM / WarpShape::kM) *
-  (ThreadblockShape::kN / WarpShape::kN);
+  (ThreadblockShape::kN / WarpShape::kN) *
+  (ThreadblockShape::kK / WarpShape::kK);
|
||||
|
||||
/// Argument structure
|
||||
using Arguments = typename ImplicitGemmKernel::Arguments;
|
||||
|
||||
Reference in New Issue
Block a user