Skip to content

Commit ef1ba23

Browse files
committed
14 -> 12 for loopmul decisions.
1 parent 960beb6 commit ef1ba23

File tree

1 file changed

+3
-3
lines changed

1 file changed

+3
-3
lines changed

src/matrix_multiply.jl

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -89,7 +89,7 @@ end
8989
@_inline_meta
9090
return mul_unrolled(Sa, Sb, a, b)
9191
end
92-
elseif sa[1] <= 14 && sa[2] <= 14 && sb[2] <= 14
92+
elseif sa[1] <= 12 && sa[2] <= 12 && sb[2] <= 12
9393
return quote
9494
@_inline_meta
9595
return mul_unrolled_chunks(Sa, Sb, a, b)
@@ -106,7 +106,7 @@ end
106106
S = Size(sa[1], sb[2])
107107

108108
# Heuristic choice between BLAS and explicit unrolling (or chunk-based unrolling)
109-
if sa[1]*sa[2]*sb[2] >= 14*14*14
109+
if sa[1]*sa[2]*sb[2] >= 12*12*12
110110
Sa = TSize{size(S),false}()
111111
Sb = TSize{sa,false}()
112112
Sc = TSize{sb,false}()
@@ -122,7 +122,7 @@ end
122122
@_inline_meta
123123
return mul_unrolled(Sa, Sb, a, b)
124124
end
125-
elseif sa[1] <= 14 && sa[2] <= 14 && sb[2] <= 14
125+
elseif sa[1] <= 12 && sa[2] <= 12 && sb[2] <= 12
126126
return quote
127127
@_inline_meta
128128
return similar_type(a, T, $S)(mul_unrolled_chunks(Sa, Sb, a, b))

0 commit comments

Comments
 (0)