Skip to content
This repository was archived by the owner on Nov 4, 2024. It is now read-only.

Commit 26f4889

Browse files
committed
perf: upperbound LV usage
1 parent 4c1daf3 commit 26f4889

File tree

1 file changed

+2
-0
lines changed

1 file changed

+2
-0
lines changed

src/impl/matmul.jl

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -33,6 +33,7 @@ end
3333
function matmuladd!(C::AbstractMatrix, ::LoopedArrayOp, A::AbstractMatrix,
3434
B::AbstractMatrix, bias::AbstractVector)
3535
if unrolled_any(≤(256), (size(C, 1), size(A, 2), size(B, 2))) &&
36+
unrolled_all(≤(1024), (size(C, 1), size(A, 2), size(B, 2))) &&
3637
LoopVectorization.check_args(C, A, B)
3738
__matmuladd_loopvec!(C, A, B, bias)
3839
return
@@ -92,6 +93,7 @@ function matmul!(C::AbstractMatrix, ::AbstractInternalArrayOpMode,
9293
end
9394
function matmul!(C::AbstractMatrix, ::LoopedArrayOp, A::AbstractMatrix, B::AbstractMatrix)
9495
if unrolled_any(≤(256), (size(C, 1), size(A, 2), size(B, 2))) &&
96+
unrolled_all(≤(1024), (size(C, 1), size(A, 2), size(B, 2))) &&
9597
LoopVectorization.check_args(C, A, B)
9698
__matmul_loopvec!(C, A, B)
9799
return

0 commit comments

Comments
 (0)