Skip to content

Commit 056783a

Browse files
committed
pre-commit
1 parent 49975c1 commit 056783a

File tree

1 file changed

+6
-4
lines changed

1 file changed

+6
-4
lines changed

lib/Dialect/TritonGPU/Transforms/BF16DotTC.cpp

Lines changed: 6 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -39,8 +39,8 @@ auto SplitF32(Value input, unsigned N, PatternRewriter &rewriter)
3939

4040
Value IEEEDot(PatternRewriter &rewriter, Value lhs, Value rhs, Value acc) {
4141
return rewriter.create<DotOp>(lhs.getLoc(), lhs, rhs, acc,
42-
/*inputPrecision=*/InputPrecision::IEEE,
43-
/*maxNumImpreciseAcc=*/0);
42+
/*inputPrecision=*/InputPrecision::IEEE,
43+
/*maxNumImpreciseAcc=*/0);
4444
}
4545

4646
auto getBF16Count(triton::InputPrecision precision) -> unsigned {
@@ -58,8 +58,10 @@ auto getBF16Count(triton::InputPrecision precision) -> unsigned {
5858
}
5959

6060
// Implements 3xBF16 https://arxiv.org/abs/1904.06376
61-
// See also https://github.com/openxla/xla/blob/e33f93fb7220d408811afdc926cf10baaf49c64e/xla/backends/gpu/codegen/triton/dot_algorithms.cc#L152
62-
// As well as https://github.com/ROCm/rocm-libraries/blob/develop/projects/hipblaslt/tensilelite/Tensile/Components/LocalRead.py#L288-L330
61+
// See also
62+
// https://github.com/openxla/xla/blob/e33f93fb7220d408811afdc926cf10baaf49c64e/xla/backends/gpu/codegen/triton/dot_algorithms.cc#L152
63+
// As well as
64+
// https://github.com/ROCm/rocm-libraries/blob/develop/projects/hipblaslt/tensilelite/Tensile/Components/LocalRead.py#L288-L330
6365
struct BF16xN : public OpRewritePattern<DotOp> {
6466
using OpRewritePattern::OpRewritePattern;
6567

0 commit comments

Comments
 (0)