Skip to content

Commit

Permalink
Fix copy operation and mma tile definition
Browse files Browse the repository at this point in the history
  • Loading branch information
aacostadiaz committed Oct 25, 2024
1 parent e0c3ceb commit 421e168
Show file tree
Hide file tree
Showing 2 changed files with 5 additions and 5 deletions.
2 changes: 1 addition & 1 deletion examples/sycl/pvc/pvc_collective_builder.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -321,7 +321,7 @@ int main(int argc, const char** argv)
using LayoutD = cutlass::layout::RowMajor;

// Workgroup-level tile
- using TileShape = Shape<_256, _256, _32>;
+ using TileShape = Shape<_256, _128, _16>;

using CollectiveMainloop = cutlass::gemm::collective::CollectiveBuilder<
cutlass::arch::IntelPVC, cutlass::arch::OpClassTensorOp,
Expand Down
8 changes: 4 additions & 4 deletions include/cutlass/gemm/collective/builders/xe_mma_builder.inl
Original file line number Diff line number Diff line change
Expand Up @@ -86,14 +86,14 @@ struct CollectiveBuilder<
//Prepare Template arguments required of CollectiveMainLoop

using TiledMma = TiledMMA<MMA_Atom<XE_8x16x16_F32BF16BF16F32_TT>,
- Layout<Shape<_1,_1,_1>>,
- Tile<_32,_64,_32>>; // Subgroup level-tile
+ Layout<Shape<_8,_2,_1>>,
+ Tile<_64,_32,_16>>; // Subgroup level-tile

static constexpr int PipelineStages = 3;
using DispatchPolicy = cutlass::gemm::MainloopIntelPVC<PipelineStages>;

- using GmemTiledCopyA = XE_2D_U16x8x16x4x2_LD_N;
- using GmemTiledCopyB = XE_2D_U16x16x16x2x2_V;
+ using GmemTiledCopyA = XE_2D_U16x8x16_LD_N;
+ using GmemTiledCopyB = XE_2D_U16x16x16_LD_V;

//PVC pipeline does not use shared memory
using SmemLayoutAtomA = void;
Expand Down

0 comments on commit 421e168

Please sign in to comment.