cen64/arch/x86_64/rsp/vrcpsq.c
2015-01-02 23:51:20 -05:00

81 lines
1.8 KiB
C

//
// arch/x86_64/rsp/vrcpsq.c
//
// This file is subject to the terms and conditions defined in
// 'LICENSE', which is part of this source code package.
//
#include "common.h"
#include "common/reciprocal.h"
#include "rsp/cpu.h"
#include "rsp/rsp.h"
#include <string.h>
__m128i rsp_vrcp_vrsq(struct rsp *rsp, uint32_t iw, int dp,
unsigned src, unsigned e, unsigned dest, unsigned de) {
uint32_t dp_input, sp_input;
int32_t input, result;
int16_t vt;
int32_t input_mask, data;
unsigned shift, idx;
// Get the element from VT.
vt = rsp->cp2.regs[src].e[e & 0x7];
dp_input = ((uint32_t) rsp->cp2.div_in << 16) | (uint16_t) vt;
sp_input = vt;
input = (dp) ? dp_input : sp_input;
input_mask = input >> 31;
data = input ^ input_mask;
if (input > -32768)
data -= input_mask;
// Handle edge cases.
if (data == 0)
result = 0x7fffFFFFU;
else if (input == -32768)
result = 0xffff0000U;
// Main case: compute the reciprocal.
else {
// TODO: Clean this up.
#ifdef _MSC_VER
unsigned long bsf_index;
_BitScanReverse(&bsf_index, data);
shift = 31 - bsf_index;
#else
shift = __builtin_clz(data);
#endif
// VRSQ
if (iw & 0x4) {
idx = (((unsigned long long) data << shift) & 0x7FC00000U) >> 22;
idx = (idx | 0x200) & 0x3FE | (shift % 2);
result = rsp_reciprocal_rom[idx];
result = ((0x10000 | result) << 14) >> ((31 - shift) >> 1);
}
// VRCP
else {
idx = (((unsigned long long) data << shift) & 0x7FC00000U) >> 22;
result = rsp_reciprocal_rom[idx];
result = ((0x10000 | result) << 14) >> (31 - shift);
}
result = result ^ input_mask;
}
// Write out the results.
rsp->cp2.div_out = result >> 16;
rsp->cp2.regs[dest].e[de & 0x7] = result;
return rsp_vect_load_unshuffled_operand(rsp->cp2.regs[dest].e);
}