cen64/arch/x86_64/rsp/vadd.h
2014-12-26 14:19:46 -05:00

25 lines
703 B
C

//
// arch/x86_64/rsp/vadd.h
//
// This file is subject to the terms and conditions defined in
// 'LICENSE', which is part of this source code package.
//
#include "common.h"
static inline __m128i rsp_vadd(__m128i vs, __m128i vt,
__m128i carry, __m128i *acc_lo) {
__m128i vd, minimum, maximum;
// VCC uses unsaturated arithmetic.
vd = _mm_add_epi16(vs, vt);
*acc_lo = _mm_sub_epi16(vd, carry);
// VD is the signed sum of the two sources and the carry. Since we
// have to saturate the sum of all three, we have to be clever.
minimum = _mm_min_epi16(vs, vt);
maximum = _mm_max_epi16(vs, vt);
minimum = _mm_subs_epi16(minimum, carry);
return _mm_adds_epi16(minimum, maximum);
}