mirror of
https://gitlab.com/libeigen/eigen.git
synced 2025-05-01 08:14:10 +08:00
Product kernel: skip loop on columns if there is no remaining rows
This commit is contained in:
parent
6f64b0b487
commit
f9d2f3903e
@ -1255,6 +1255,7 @@ void gebp_kernel<LhsScalar,RhsScalar,Index,mr,nr,ConjugateLhs,ConjugateRhs>
|
||||
}
|
||||
}
|
||||
//---------- Process remaining rows, 1 at once ----------
|
||||
if(peeled_mc1<rows)
|
||||
{
|
||||
// loop on each panel of the rhs
|
||||
for(Index j2=0; j2<packet_cols4; j2+=nr)
|
||||
@ -1288,13 +1289,11 @@ void gebp_kernel<LhsScalar,RhsScalar,Index,mr,nr,ConjugateLhs,ConjugateRhs>
|
||||
straits.loadLhsUnaligned(blB+0*SwappedTraits::LhsProgress, A0);
|
||||
straits.loadLhsUnaligned(blB+1*SwappedTraits::LhsProgress, A1);
|
||||
|
||||
|
||||
straits.loadRhsQuad(blA+0*spk, B_0);
|
||||
straits.loadRhsQuad(blA+1*spk, B_1);
|
||||
straits.madd(A0,B_0,C0,B_0);
|
||||
straits.madd(A1,B_1,C1,B_1);
|
||||
|
||||
|
||||
straits.loadLhsUnaligned(blB+2*SwappedTraits::LhsProgress, A0);
|
||||
straits.loadLhsUnaligned(blB+3*SwappedTraits::LhsProgress, A1);
|
||||
straits.loadRhsQuad(blA+2*spk, B_0);
|
||||
|
Loading…
x
Reference in New Issue
Block a user