*mn = __uhadd8(*mn,__uadd8(*pq,*co)); But my doubt is how to avoid the overflow (e.g. 255 + 2): is there any such instruction that takes care of saturation?
/* Combines *pq and *co with __uadd8, then combines that result with *mn via
 * __uhadd8 and stores it back into *mn.
 * NOTE(review): assuming the ARM ACLE/CMSIS SIMD32 semantics, __uadd8 is a
 * per-byte add that wraps on overflow (no saturation) and __uhadd8 is a
 * per-byte halving add -- confirm against the toolchain headers. */
*mn = __uhadd8(*mn,__uadd8(*pq,*co));
/*
 * qadd - update the packed word at mnx4 from the words at pqx4 and cox4.
 *
 * Step 1: __uqadd8(*mnx4, *pqx4)
 * Step 2: __uhadd8(<step 1 result>, *cox4)
 * The step 2 result is written back to *mnx4.
 *
 * NOTE(review): assuming the ARM ACLE/CMSIS SIMD32 intrinsics, each uint32_t
 * is treated as four unsigned 8-bit lanes, __uqadd8 is a saturating per-lane
 * add and __uhadd8 is a halving per-lane add -- confirm against the
 * toolchain headers.
 *
 * mnx4: read, then overwritten with the result.
 * pqx4: read only.
 * cox4: read only.
 */
void qadd(uint32_t *mnx4, uint32_t *pqx4, uint32_t *cox4)
{
    const uint32_t saturated_sum = __uqadd8(*mnx4, *pqx4);

    *mnx4 = __uhadd8(saturated_sum, *cox4);
}