Home
last modified time | relevance | path

Searched defs:AccumLambdaIteratorSm80 (Results 1 – 1 of 1) sorted by relevance

/aosp_15_r20/external/pytorch/aten/src/ATen/native/transformers/cuda/mem_eff_attention/gemm/
H A Dmma_accum_lambda_iterator.h23 struct AccumLambdaIteratorSm80 { struct
29 using Policy = typename T::Policy;
30 using InstructionShape = typename T::InstructionShape;
31 using OpDelta = typename T::OpDelta;
32 using Shape = typename T::Shape;
33 static int const kElementsPerAccess = InstructionShape::kN / 4;
34 static int const kRowsPerTile = 8;
35 static int const kAccumulatorRows = InstructionShape::kM / kRowsPerTile;
37 static cutlass::MatrixCoord CUTLASS_DEVICE get_lane_offset( in get_lane_offset()
50 CUTLASS_DEVICE static void iterateRows( in iterateRows()
[all …]