Skip to content

Commit ed35a37

Browse files
authored
Add fast path in generic matmul (#1202)
This manually adds the critical optimisation investigated in JuliaLang/julia#56954. While we could rely on LLVM to continue doing this optimisation, it's more robust to add it manually.
1 parent 2a1696a commit ed35a37

File tree

2 files changed

+2
-0
lines changed

2 files changed

+2
-0
lines changed

src/matmul.jl

+1
Original file line numberDiff line numberDiff line change
@@ -1021,6 +1021,7 @@ function _generic_matmatmul_nonadjtrans!(C, A, B, alpha, beta)
10211021
@inbounds for n in axes(B, 2), k in axes(B, 1)
10221022
# Balpha = B[k,n] * alpha, but we skip the multiplication in case isone(alpha)
10231023
Balpha = @stable_muladdmul MulAddMul(alpha, false)(B[k,n])
1024+
!ismissing(Balpha) && iszero(Balpha) && continue
10241025
@simd for m in axes(A, 1)
10251026
C[m,n] = muladd(A[m,k], Balpha, C[m,n])
10261027
end

test/matmul.jl

+1
Original file line numberDiff line numberDiff line change
@@ -767,6 +767,7 @@ import LinearAlgebra: Adjoint, Transpose
767767
(*)(x::RootInt, y::Integer) = x.i * y
768768
adjoint(x::RootInt) = x
769769
transpose(x::RootInt) = x
770+
Base.zero(::RootInt) = RootInt(0)
770771

771772
@test Base.promote_op(*, RootInt, RootInt) === Int
772773

0 commit comments

Comments
 (0)