/* Horizontal sum of the eight signed 16-bit lanes of vec using widening
 * pairwise adds, so the intermediate totals are not limited to 16 bits. */
int32x4_t pairSums32 = vpaddlq_s16(vec);        /* 8 x s16 -> 4 x s32 */
int64x2_t quadSums64 = vpaddlq_s32(pairSums32); /* 4 x s32 -> 2 x s64 */
/* Combine the two remaining 64-bit lanes in scalar code. */
int64_t lowerTotal = vgetq_lane_s64(quadSums64, 0);
int64_t upperTotal = vgetq_lane_s64(quadSums64, 1);
/* The final cast narrows the full total back to 16 bits. */
int16_t sum = (int16_t)(lowerTotal + upperTotal);
/* Horizontal sum of the eight signed 16-bit lanes of vec: first fold the
 * upper half onto the lower half, then reduce the four remaining lanes
 * with widening pairwise adds. */
int16x4_t lowerLanes = vget_low_s16(vec);
int16x4_t upperLanes = vget_high_s16(vec);
/* This add stays in 16-bit lanes; the result is narrowed to int16_t at the
 * end anyway. */
int16x4_t foldedHalves = vadd_s16(lowerLanes, upperLanes);
int32x2_t foldedPairs32 = vpaddl_s16(foldedHalves); /* 4 x s16 -> 2 x s32 */
int64x1_t foldedTotal64 = vpaddl_s32(foldedPairs32); /* 2 x s32 -> 1 x s64 */
int16_t sum = (int16_t)vget_lane_s64(foldedTotal64, 0);
/* Horizontal sum of the eight signed 16-bit lanes of vec, kept entirely in
 * vector registers until the single final lane extract. */
int32x4_t stage1Sums32 = vpaddlq_s16(vec);          /* 8 x s16 -> 4 x s32 */
int64x2_t stage2Sums64 = vpaddlq_s32(stage1Sums32); /* 4 x s32 -> 2 x s64 */
/* Each 64-bit lane holds a sum of four int16 values, so it fits in 32 bits
 * and the narrowing below discards nothing. */
int32x2_t stage2Sums32 = vmovn_s64(stage2Sums64);
int64x1_t stage3Total64 = vpaddl_s32(stage2Sums32); /* 2 x s32 -> 1 x s64 */
int16_t sum = (int16_t)vget_lane_s64(stage3Total64, 0);