[BugFix] Illegal Memory Access in the blockwise cutlass fp8 GEMMs (#14396)
This commit is contained in:
parent
e1744502c2
commit
e5e03c2c1b
@@ -402,7 +402,7 @@ struct CollectiveMma<
|
|||||||
|
|
||||||
// TODO: test `scale_copy_a` with `ScaleMsPerTile` < 128
|
// TODO: test `scale_copy_a` with `ScaleMsPerTile` < 128
|
||||||
TiledCopy scale_copy_a = make_tiled_copy(SmemBlockScalingCopyAtomA{},
|
TiledCopy scale_copy_a = make_tiled_copy(SmemBlockScalingCopyAtomA{},
|
||||||
Layout<Shape<_32, _1>>{}, Layout<Shape<_4, _1>>{}); // (1,1,1)
|
Layout<Shape<_32>>{}, Layout<Shape<_1>>{}); // (1,1,1)
|
||||||
TiledCopy scale_copy_b = make_tiled_copy(SmemBlockScalingCopyAtomB{},
|
TiledCopy scale_copy_b = make_tiled_copy(SmemBlockScalingCopyAtomB{},
|
||||||
Layout<Shape<_1>>{}, Layout<Shape<_1>>{}); // (1,1,1)
|
Layout<Shape<_1>>{}, Layout<Shape<_1>>{}); // (1,1,1)
|
||||||
ThrCopy thr_scale_copy_a = scale_copy_a.get_slice(threadIdx.x);
|
ThrCopy thr_scale_copy_a = scale_copy_a.get_slice(threadIdx.x);
|
||||||
|
Loading…
x
Reference in New Issue
Block a user