Gemv microoptimization

This commit is contained in:
Charles Schlosser 2023-11-20 17:26:39 +00:00 committed by Rasmus Munk Larsen
parent 3cf6bb6f1c
commit d1b03fb5c9

View File

@@ -362,9 +362,9 @@ EIGEN_DEVICE_FUNC EIGEN_DONT_INLINE void general_matrix_vector_product<Index,Lhs
HasQuarter = (int)ResPacketSizeQuarter < (int)ResPacketSizeHalf
};
-const Index fullColBlockEnd = LhsPacketSize * (cols / LhsPacketSize);
-const Index halfColBlockEnd = LhsPacketSizeHalf * (cols / LhsPacketSizeHalf);
-const Index quarterColBlockEnd = LhsPacketSizeQuarter * (cols / LhsPacketSizeQuarter);
+const Index fullColBlockEnd = cols & (-LhsPacketSize);
+const Index halfColBlockEnd = cols & (-LhsPacketSizeHalf);
+const Index quarterColBlockEnd = cols & (-LhsPacketSizeQuarter);
Index i=0;
for(; i<n8; i+=8)