mirror of
https://gitlab.com/libeigen/eigen.git
synced 2025-01-12 14:25:16 +08:00
Fix asm comments in 1pX1 kernel
This commit is contained in:
parent
5d2fd64a1a
commit
2aa09e6b4e
@ -1481,17 +1481,17 @@ void gebp_kernel<LhsScalar,RhsScalar,Index,DataMapper,mr,nr,ConjugateLhs,Conjuga
|
|||||||
|
|
||||||
for(Index k=0; k<peeled_kc; k+=pk)
|
for(Index k=0; k<peeled_kc; k+=pk)
|
||||||
{
|
{
|
||||||
EIGEN_ASM_COMMENT("begin gebp micro kernel 2pX1");
|
EIGEN_ASM_COMMENT("begin gebp micro kernel 1pX1");
|
||||||
RhsPacket B_0;
|
RhsPacket B_0;
|
||||||
|
|
||||||
#define EIGEN_GEBGP_ONESTEP(K) \
|
#define EIGEN_GEBGP_ONESTEP(K) \
|
||||||
do { \
|
do { \
|
||||||
EIGEN_ASM_COMMENT("begin step of gebp micro kernel 2pX1"); \
|
EIGEN_ASM_COMMENT("begin step of gebp micro kernel 1pX1"); \
|
||||||
EIGEN_ASM_COMMENT("Note: these asm comments work around bug 935!"); \
|
EIGEN_ASM_COMMENT("Note: these asm comments work around bug 935!"); \
|
||||||
traits.loadLhs(&blA[(0+1*K)*LhsProgress], A0); \
|
traits.loadLhs(&blA[(0+1*K)*LhsProgress], A0); \
|
||||||
traits.loadRhs(&blB[(0+K)*RhsProgress], B_0); \
|
traits.loadRhs(&blB[(0+K)*RhsProgress], B_0); \
|
||||||
traits.madd(A0, B_0, C0, B_0); \
|
traits.madd(A0, B_0, C0, B_0); \
|
||||||
EIGEN_ASM_COMMENT("end step of gebp micro kernel 2pX1"); \
|
EIGEN_ASM_COMMENT("end step of gebp micro kernel 1pX1"); \
|
||||||
} while(false);
|
} while(false);
|
||||||
|
|
||||||
EIGEN_GEBGP_ONESTEP(0);
|
EIGEN_GEBGP_ONESTEP(0);
|
||||||
@ -1506,7 +1506,7 @@ void gebp_kernel<LhsScalar,RhsScalar,Index,DataMapper,mr,nr,ConjugateLhs,Conjuga
|
|||||||
blB += pk*RhsProgress;
|
blB += pk*RhsProgress;
|
||||||
blA += pk*1*Traits::LhsProgress;
|
blA += pk*1*Traits::LhsProgress;
|
||||||
|
|
||||||
EIGEN_ASM_COMMENT("end gebp micro kernel 2pX1");
|
EIGEN_ASM_COMMENT("end gebp micro kernel 1pX1");
|
||||||
}
|
}
|
||||||
|
|
||||||
// process remaining peeled loop
|
// process remaining peeled loop
|
||||||
|
Loading…
Reference in New Issue
Block a user