Mirror of https://gitlab.com/libeigen/eigen.git (synced 2026-04-10 11:34:33 +08:00)
Revert "Fix GEBP half/quarter-packet loops for nr>=8 RHS packing on ARM64"
This reverts commit 888d708dcd.
This commit is contained in:
@@ -1496,16 +1496,7 @@ EIGEN_DONT_INLINE void gebp_kernel<LhsScalar, RhsScalar, Index, DataMapper, mr,
 EIGEN_IF_CONSTEXPR((LhsProgressHalf < LhsProgress) && mr >= LhsProgressHalf) {
 HalfTraits half_traits;
 for (Index i = peeled_mc1; i < peeled_mc_half; i += LhsProgressHalf) {
-#if EIGEN_ARCH_ARM64 || EIGEN_ARCH_LOONGARCH64
-EIGEN_IF_CONSTEXPR(nr >= 8) {
-for (Index j2 = 0; j2 < packet_cols8; j2 += 8) {
-gebp_micro_panel_impl<1, 8, HalfTraits, LhsScalar, RhsScalar, ResScalar, Index, DataMapper, LinearMapper,
-LhsPacket>(half_traits, res, blockA, blockB, alpha, i, j2, depth, strideA, strideB,
-offsetA, offsetB, prefetch_res_offset, peeled_kc, pk);
-}
-}
-#endif
-for (Index j2 = packet_cols8; j2 < packet_cols4; j2 += 4) {
+for (Index j2 = 0; j2 < packet_cols4; j2 += 4) {
 gebp_micro_panel_impl<1, 4, HalfTraits, LhsScalar, RhsScalar, ResScalar, Index, DataMapper, LinearMapper,
 LhsPacket>(half_traits, res, blockA, blockB, alpha, i, j2, depth, strideA, strideB,
 offsetA, offsetB, prefetch_res_offset, peeled_kc, pk);
@@ -1522,16 +1513,7 @@ EIGEN_DONT_INLINE void gebp_kernel<LhsScalar, RhsScalar, Index, DataMapper, mr,
 EIGEN_IF_CONSTEXPR((LhsProgressQuarter < LhsProgressHalf) && mr >= LhsProgressQuarter) {
 QuarterTraits quarter_traits;
 for (Index i = peeled_mc_half; i < peeled_mc_quarter; i += LhsProgressQuarter) {
-#if EIGEN_ARCH_ARM64 || EIGEN_ARCH_LOONGARCH64
-EIGEN_IF_CONSTEXPR(nr >= 8) {
-for (Index j2 = 0; j2 < packet_cols8; j2 += 8) {
-gebp_micro_panel_impl<1, 8, QuarterTraits, LhsScalar, RhsScalar, ResScalar, Index, DataMapper, LinearMapper,
-LhsPacket>(quarter_traits, res, blockA, blockB, alpha, i, j2, depth, strideA, strideB,
-offsetA, offsetB, prefetch_res_offset, peeled_kc, pk);
-}
-}
-#endif
-for (Index j2 = packet_cols8; j2 < packet_cols4; j2 += 4) {
+for (Index j2 = 0; j2 < packet_cols4; j2 += 4) {
 gebp_micro_panel_impl<1, 4, QuarterTraits, LhsScalar, RhsScalar, ResScalar, Index, DataMapper, LinearMapper,
 LhsPacket>(quarter_traits, res, blockA, blockB, alpha, i, j2, depth, strideA, strideB,
 offsetA, offsetB, prefetch_res_offset, peeled_kc, pk);
Reference in New Issue
Block a user