#pragma ident "%Z%%M% %I% %E% SMI"
#include <sys/fpu/fpu_simulator.h>
#include <sys/fpu/globals.h>
static int
overflow_to_infinity(
fp_simd_type *pfpsd,
int sign)
{
int inf;
switch (pfpsd->fp_direction) {
case fp_nearest:
inf = 1;
break;
case fp_tozero:
inf = 0;
break;
case fp_positive:
inf = !sign;
break;
case fp_negative:
inf = sign;
break;
}
return (inf);
}
static void
round(
fp_simd_type *pfpsd,
unpacked *pu)
{
int increment;
int sr;
sr = pu->sticky|pu->rounded;
if (sr == 0)
return;
fpu_set_exception(pfpsd, fp_inexact);
switch (pfpsd->fp_direction) {
case fp_nearest:
increment = pu->rounded;
break;
case fp_tozero:
increment = 0;
break;
case fp_positive:
increment = (pu->sign == 0) & (sr != 0);
break;
case fp_negative:
increment = (pu->sign != 0) & (sr != 0);
break;
}
if (increment) {
pu->significand[3]++;
if (pu->significand[3] == 0) {
pu->significand[2]++;
if (pu->significand[2] == 0) {
pu->significand[1]++;
if (pu->significand[1] == 0) {
pu->significand[0]++;
if (pu->significand[0] == 0x20000) {
pu->exponent++;
pu->significand[0] = 0x10000;
}
}
}
}
}
if ((pfpsd->fp_direction == fp_nearest) &&
(pu->sticky == 0) && increment != 0) {
pu->significand[3] &= 0xfffffffe;
}
}
static void
packint32(
fp_simd_type *pfpsd,
unpacked *pu,
int32_t *px)
{
switch (pu->fpclass) {
case fp_zero:
*px = 0;
break;
case fp_normal:
if (pu->exponent >= 32)
goto overflow;
fpu_rightshift(pu, 112 - pu->exponent);
round(pfpsd, pu);
if (pu->significand[3] >= 0x80000000)
if ((pu->sign == 0)||(pu->significand[3] > 0x80000000))
goto overflow;
*px = pu->significand[3];
if (pu->sign)
*px = -*px;
break;
case fp_infinity:
case fp_quiet:
case fp_signaling:
overflow:
if (pu->sign)
*px = 0x80000000;
else
*px = 0x7fffffff;
pfpsd->fp_current_exceptions &= ~(1 << (int)fp_inexact);
fpu_set_exception(pfpsd, fp_invalid);
break;
}
}
static void
packint64(
fp_simd_type *pfpsd,
unpacked *pu,
int64_t *px)
{
union {
uint64_t ll;
uint32_t i[2];
} x;
switch (pu->fpclass) {
case fp_zero:
*px = 0;
break;
case fp_normal:
if (pu->exponent >= 64)
goto overflow;
fpu_rightshift(pu, 112 - pu->exponent);
round(pfpsd, pu);
if (pu->significand[2] >= 0x80000000)
if ((pu->sign == 0) ||
(pu->significand[2] > 0x80000000) ||
(((pu->significand[2] == 0x80000000) &&
(pu->significand[3] > 0))))
goto overflow;
x.i[0] = pu->significand[2];
x.i[1] = pu->significand[3];
*px = x.ll;
if (pu->sign)
*px = -*px;
break;
case fp_infinity:
case fp_quiet:
case fp_signaling:
overflow:
if (pu->sign)
*px = (int64_t)0x8000000000000000;
else
*px = (int64_t)0x7fffffffffffffff;
pfpsd->fp_current_exceptions &= ~(1 << (int)fp_inexact);
fpu_set_exception(pfpsd, fp_invalid);
break;
}
}
static void
packsingle(
fp_simd_type *pfpsd,
unpacked *pu,
single_type *px)
{
px->sign = pu->sign;
switch (pu->fpclass) {
case fp_zero:
px->exponent = 0;
px->significand = 0;
break;
case fp_infinity:
infinity:
px->exponent = 0xff;
px->significand = 0;
break;
case fp_quiet:
case fp_signaling:
fpu_rightshift(pu, 113-24);
px->exponent = 0xff;
px->significand = 0x400000|(0x3fffff&pu->significand[3]);
break;
case fp_normal:
fpu_rightshift(pu, 113-24);
pu->exponent += SINGLE_BIAS;
if (pu->exponent <= 0) {
px->exponent = 0;
fpu_rightshift(pu, 1 - pu->exponent);
round(pfpsd, pu);
if (pu->significand[3] == 0x800000) {
px->exponent = 1;
px->significand = 0;
fpu_set_exception(pfpsd, fp_inexact);
} else
px->significand = 0x7fffff & pu->significand[3];
if (pfpsd->fp_current_exceptions & (1 << fp_inexact))
fpu_set_exception(pfpsd, fp_underflow);
if (pfpsd->fp_fsrtem & (1<<fp_underflow)) {
fpu_set_exception(pfpsd, fp_underflow);
pfpsd->fp_current_exceptions &=
~(1 << (int)fp_inexact);
}
return;
}
round(pfpsd, pu);
if (pu->significand[3] == 0x1000000) {
pu->significand[3] = 0x800000;
pu->exponent += 1;
}
if (pu->exponent >= 0xff) {
fpu_set_exception(pfpsd, fp_overflow);
fpu_set_exception(pfpsd, fp_inexact);
if (pfpsd->fp_fsrtem & (1<<fp_overflow)) {
pfpsd->fp_current_exceptions &=
~(1 << (int)fp_inexact);
}
if (overflow_to_infinity(pfpsd, pu->sign))
goto infinity;
px->exponent = 0xfe;
px->significand = 0x7fffff;
return;
}
px->exponent = pu->exponent;
px->significand = 0x7fffff & pu->significand[3];
}
}
static void
packdouble(
fp_simd_type *pfpsd,
unpacked *pu,
double_type *px,
uint_t *py)
{
px->sign = pu->sign;
switch (pu->fpclass) {
case fp_zero:
px->exponent = 0;
px->significand = 0;
*py = 0;
break;
case fp_infinity:
infinity:
px->exponent = 0x7ff;
px->significand = 0;
*py = 0;
break;
case fp_quiet:
case fp_signaling:
fpu_rightshift(pu, 113-53);
px->exponent = 0x7ff;
px->significand = 0x80000 | (0x7ffff & pu->significand[2]);
*py = pu->significand[3];
break;
case fp_normal:
fpu_rightshift(pu, 113-53);
pu->exponent += DOUBLE_BIAS;
if (pu->exponent <= 0) {
px->exponent = 0;
fpu_rightshift(pu, 1 - pu->exponent);
round(pfpsd, pu);
if (pu->significand[2] == 0x100000) {
px->exponent = 1;
px->significand = 0;
*py = 0;
fpu_set_exception(pfpsd, fp_inexact);
} else {
px->exponent = 0;
px->significand = 0xfffff & pu->significand[2];
*py = pu->significand[3];
}
if (pfpsd->fp_current_exceptions & (1 << fp_inexact))
fpu_set_exception(pfpsd, fp_underflow);
if (pfpsd->fp_fsrtem & (1<<fp_underflow)) {
fpu_set_exception(pfpsd, fp_underflow);
pfpsd->fp_current_exceptions &=
~(1 << (int)fp_inexact);
}
return;
}
round(pfpsd, pu);
if (pu->significand[2] == 0x200000) {
pu->significand[2] = 0x100000;
pu->exponent += 1;
}
if (pu->exponent >= 0x7ff) {
fpu_set_exception(pfpsd, fp_overflow);
fpu_set_exception(pfpsd, fp_inexact);
if (pfpsd->fp_fsrtem & (1<<fp_overflow)) {
pfpsd->fp_current_exceptions &=
~(1 << (int)fp_inexact);
}
if (overflow_to_infinity(pfpsd, pu->sign))
goto infinity;
px->exponent = 0x7fe;
px->significand = 0xfffff;
*py = 0xffffffffU;
return;
}
px->exponent = pu->exponent;
px->significand = 0xfffff & pu->significand[2];
*py = pu->significand[3];
break;
}
}
static void
packextended(
fp_simd_type *pfpsd,
unpacked *pu,
extended_type *px,
uint_t *py,
uint_t *pz,
uint_t *pw)
{
px->sign = pu->sign;
switch (pu->fpclass) {
case fp_zero:
px->exponent = 0;
px->significand = 0;
*pz = 0;
*py = 0;
*pw = 0;
break;
case fp_infinity:
infinity:
px->exponent = 0x7fff;
px->significand = 0;
*pz = 0;
*py = 0;
*pw = 0;
break;
case fp_quiet:
case fp_signaling:
px->exponent = 0x7fff;
px->significand = 0x8000 | pu->significand[0];
*py = pu->significand[1];
*pz = pu->significand[2];
*pw = pu->significand[3];
break;
case fp_normal:
pu->exponent += EXTENDED_BIAS;
if (pu->exponent <= 0) {
fpu_rightshift(pu, 1-pu->exponent);
round(pfpsd, pu);
if (pu->significand[0] < 0x00010000) {
px->exponent = 0;
} else {
px->exponent = 1;
fpu_set_exception(pfpsd, fp_inexact);
}
if (pfpsd->fp_current_exceptions & (1 << fp_inexact))
fpu_set_exception(pfpsd, fp_underflow);
if (pfpsd->fp_fsrtem & (1<<fp_underflow)) {
fpu_set_exception(pfpsd, fp_underflow);
pfpsd->fp_current_exceptions &=
~(1 << (int)fp_inexact);
}
px->significand = pu->significand[0];
*py = pu->significand[1];
*pz = pu->significand[2];
*pw = pu->significand[3];
return;
}
round(pfpsd, pu);
if (pu->exponent >= 0x7fff) {
fpu_set_exception(pfpsd, fp_overflow);
fpu_set_exception(pfpsd, fp_inexact);
if (pfpsd->fp_fsrtem & (1<<fp_overflow)) {
pfpsd->fp_current_exceptions &=
~(1 << (int)fp_inexact);
}
if (overflow_to_infinity(pfpsd, pu->sign))
goto infinity;
px->exponent = 0x7ffe;
px->significand = 0xffff;
*py = 0xffffffffU;
*pz = 0xffffffffU;
*pw = 0xffffffffU;
return;
}
px->exponent = pu->exponent;
px->significand = pu->significand[0];
*py = pu->significand[1];
*pz = pu->significand[2];
*pw = pu->significand[3];
break;
}
}
void
_fp_pack(
fp_simd_type *pfpsd,
unpacked *pu,
uint_t n,
enum fp_op_type type)
{
switch (type) {
case fp_op_int32:
{
int32_t x;
packint32(pfpsd, pu, &x);
if (!(pfpsd->fp_current_exceptions & pfpsd->fp_fsrtem))
pfpsd->fp_current_write_freg(&x, n, pfpsd);
break;
}
case fp_op_int64:
{
int64_t x;
packint64(pfpsd, pu, &x);
if ((n & 0x1) == 1)
n = (n & 0x1e) | 0x20;
if (!(pfpsd->fp_current_exceptions & pfpsd->fp_fsrtem))
pfpsd->fp_current_write_dreg(&x, DOUBLE(n), pfpsd);
break;
}
case fp_op_single:
{
single_type x;
packsingle(pfpsd, pu, &x);
if (!(pfpsd->fp_current_exceptions & pfpsd->fp_fsrtem))
pfpsd->fp_current_write_freg(&x, n, pfpsd);
break;
}
case fp_op_double:
{
union {
double_type x[2];
uint32_t y[2];
uint64_t ll;
} db;
packdouble(pfpsd, pu, &db.x[0], &db.y[1]);
if (!(pfpsd->fp_current_exceptions &
pfpsd->fp_fsrtem)) {
if ((n & 0x1) == 1)
n = (n & 0x1e) | 0x20;
pfpsd->fp_current_write_dreg(&db.ll, DOUBLE(n),
pfpsd);
}
break;
}
case fp_op_extended:
{
union {
extended_type x;
uint32_t y[4];
uint64_t ll[2];
} ex;
unpacked U;
int k;
switch (pfpsd->fp_precision) {
case fp_single:
{
single_type tx;
packsingle(pfpsd, pu, &tx);
pu = &U;
unpacksingle(pfpsd, pu, tx);
break;
}
case fp_double:
{
double_type tx;
uint_t ty;
packdouble(pfpsd, pu, &tx, &ty);
pu = &U;
unpackdouble(pfpsd, pu, tx, ty);
break;
}
case fp_precision_3:
{
k = pu->exponent + EXTENDED_BIAS;
if (k >= 0) k = 113-64;
else k = 113-64-k;
fpu_rightshift(pu, 113-64);
round(pfpsd, pu);
pu->sticky = pu->rounded = 0;
pu->exponent += k;
fpu_normalize(pu);
break;
}
}
packextended(pfpsd, pu, &ex.x, &ex.y[1],
&ex.y[2], &ex.y[3]);
if (!(pfpsd->fp_current_exceptions &
pfpsd->fp_fsrtem)) {
if ((n & 0x1) == 1)
n = (n & 0x1e) | 0x20;
pfpsd->fp_current_write_dreg(&ex.ll[0],
QUAD_E(n), pfpsd);
pfpsd->fp_current_write_dreg(&ex.ll[1],
QUAD_F(n), pfpsd);
}
break;
}
}
}
void
_fp_pack_word(
fp_simd_type *pfpsd,
uint32_t *pu,
uint_t n)
{
pfpsd->fp_current_write_freg(pu, n, pfpsd);
}
void
_fp_pack_extword(
fp_simd_type *pfpsd,
uint64_t *pu,
uint_t n)
{
if ((n & 1) == 1)
n = (n & 0x1e) | 0x20;
pfpsd->fp_current_write_dreg(pu, DOUBLE(n), pfpsd);
}