@@ -406,11 +406,12 @@ struct ABTransferThreadTiles
406406 // KPack / KRow / K1 - MNRepeat - K0 / KRow - MNWaves - KRow - MNPerWmma - K1
407407 return transform_tensor_descriptor (
408408 BlockDesc{},
409- make_tuple (make_unmerge_transform (make_tuple (
410- Number<ABK0 / (KPack / ABK1)>{}, KRow, Number<KPack / KRow / ABK1>{})),
411- make_unmerge_transform (make_tuple (
412- Number<MNRepeat>{}, Number<MNWaves>{}, Number<MNPerWmma>{})),
413- make_pass_through_transform (Number<ABK1>{})),
409+ make_tuple (
410+ make_unmerge_transform (make_tuple (
411+ Number<ABK0 / (KPack / ABK1)>{}, KRow, Number<KPack / KRow / ABK1>{})),
412+ make_unmerge_transform (
413+ make_tuple (Number<MNRepeat>{}, Number<MNWaves>{}, Number<MNPerWmma>{})),
414+ make_pass_through_transform (Number<ABK1>{})),
414415 make_tuple (Sequence<0 >{}, Sequence<1 >{}, Sequence<2 >{}),
415416 make_tuple (Sequence<2 , 4 , 0 >{}, Sequence<1 , 3 , 5 >{}, Sequence<6 >{}));
416417 }
@@ -439,13 +440,14 @@ struct ABTransferThreadTiles
439440
440441 return transform_tensor_descriptor (
441442 desc1,
442- make_tuple (make_pass_through_transform (Number<KPack / KPerWmmaBlk / KRow>{}),
443- make_pass_through_transform (Number<MNRepeat>{}),
444- make_merge_transform (make_tuple (Number<ABK0>{}, Number<ABK1 / KPack>{})),
445- make_pass_through_transform (Number<MNWaves>{}),
446- make_pass_through_transform (Number<KRow>{}),
447- make_pass_through_transform (Number<MNPerWmma>{}),
448- make_pass_through_transform (Number<KPerWmmaBlk>{})),
443+ make_tuple (
444+ make_pass_through_transform (Number<KPack / KPerWmmaBlk / KRow>{}),
445+ make_pass_through_transform (Number<MNRepeat>{}),
446+ make_merge_transform (make_tuple (Number<ABK0>{}, Number<ABK1 / KPack>{})),
447+ make_pass_through_transform (Number<MNWaves>{}),
448+ make_pass_through_transform (Number<KRow>{}),
449+ make_pass_through_transform (Number<MNPerWmma>{}),
450+ make_pass_through_transform (Number<KPerWmmaBlk>{})),
449451 make_tuple (Sequence<0 >{},
450452 Sequence<1 >{},
451453 Sequence<2 , 3 >{},
0 commit comments