You signed in with another tab or window. Reload to refresh your session.You signed out in another tab or window. Reload to refresh your session.You switched accounts on another tab or window. Reload to refresh your session.Dismiss alert
Copy file name to clipboardExpand all lines: src/TriangularSolve.jl
+11-11Lines changed: 11 additions & 11 deletions
Original file line number
Diff line number
Diff line change
@@ -139,7 +139,7 @@ end
139
139
end
140
140
@inlinestore_small_kern!(spa, ::Nothing, v, spu, i, n, ::Val{false}) =vstore!(spa, v /vload(spu, (n,n)), i)
141
141
142
-
functionBdivU_small_kern!(spa::AbstractStridedPointer{T}, sp, spb::AbstractStridedPointer{T}, spu::AbstractStridedPointer{T}, N, mask::AbstractMask{W}, ::Val{UNIT}) where {T,UNIT,W}
142
+
@inlinefunctionBdivU_small_kern!(spa::AbstractStridedPointer{T}, sp, spb::AbstractStridedPointer{T}, spu::AbstractStridedPointer{T}, N, mask::AbstractMask{W}, ::Val{UNIT}) where {T,UNIT,W}
143
143
# W = VectorizationBase.pick_vector_width(T)
144
144
for n ∈CloseOpen(N)
145
145
Amn =vload(spb, (MM{W}(StaticInt(0)),n), mask)
@@ -149,7 +149,7 @@ function BdivU_small_kern!(spa::AbstractStridedPointer{T}, sp, spb::AbstractStri
149
149
store_small_kern!(spa, sp, Amn, spu, (MM{W}(StaticInt(0)),n), n, mask, Val{UNIT}())
150
150
end
151
151
end
152
-
functionBdivU_small_kern_u!(spa::AbstractStridedPointer{T}, sp, spb::AbstractStridedPointer{T}, spu::AbstractStridedPointer{T}, N, ::StaticInt{U}, ::Val{UNIT}) where {T,U,UNIT}
152
+
@inlinefunctionBdivU_small_kern_u!(spa::AbstractStridedPointer{T}, sp, spb::AbstractStridedPointer{T}, spu::AbstractStridedPointer{T}, N, ::StaticInt{U}, ::Val{UNIT}) where {T,U,UNIT}
functionrdiv_U!(spc::AbstractStridedPointer{T}, spa::AbstractStridedPointer, spu::AbstractStridedPointer, M, N, ::StaticInt{1}, ::Val{UNIT}) where {T,UNIT}
243
+
@inlinefunctionrdiv_U!(spc::AbstractStridedPointer{T}, spa::AbstractStridedPointer, spu::AbstractStridedPointer, M, N, ::StaticInt{1}, ::Val{UNIT}) where {T,UNIT}
244
244
WS =pick_vector_width(T)
245
245
W =Int(WS)
246
246
UF =unroll_factor(WS)
@@ -381,7 +381,6 @@ function rdiv_block_N!(
381
381
# println("Solve with N_temp = $N_temp and n = $n")
382
382
rdiv_U!(spc, spa_rdiv, gesp(spu, (n,StaticInt{0}())), M, N_temp, StaticInt{X}(), Val(UNIT))
383
383
repeat ||break
384
-
385
384
spa =gesp(spa, (StaticInt(0), B_normalized))
386
385
spc =gesp(spc, (StaticInt(0), B_normalized))
387
386
spu =gesp(spu, (StaticInt(0), B_normalized))
@@ -439,20 +438,21 @@ end
439
438
functionmultithread_rdiv!(
440
439
spc::AbstractStridedPointer{T}, spa, spu, M, N, mtb, ::Val{UNIT}, ::StaticInt{X}
0 commit comments