* Copyright (c) 1995 Ken Nakata

/* $NetBSD: fpu_rem.c,v 1.18 2023/11/19 03:58:15 isaki Exp $ */

/*
* Copyright (c) 1995 Ken Nakata
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
* 3. Neither the name of the author nor the names of its contributors
* may be used to endorse or promote products derived from this software
* without specific prior written permission.
*
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*
* @(#)fpu_rem.c 10/24/95
*/

#include <sys/cdefs.h>
__KERNEL_RCSID(0, "$NetBSD: fpu_rem.c,v 1.18 2023/11/19 03:58:15 isaki Exp $");

#include <sys/types.h>
#include <sys/signal.h>
#include <machine/frame.h>

#include "fpu_emulate.h"

/*
* ALGORITHM
*
* Step 1. Save and strip signs of X and Y: signX := sign(X),
* signY := sign(Y), X := *X*, Y := *Y*,
* signQ := signX EOR signY. Record whether MOD or REM
* is requested.
*
* Step 2. Set L := expo(X)-expo(Y), Q := 0.
* If (L < 0) then
* R := X, go to Step 4.
* else
* R := 2^(-L)X, j := L.
* endif
*
* Step 3. Perform MOD(X,Y)
* 3.1 If R = Y, then { Q := Q + 1, R := 0, go to Step 7. }
* 3.2 If R > Y, then { R := R - Y, Q := Q + 1}
* 3.3 If j = 0, go to Step 4.
* 3.4 j := j - 1, Q := 2Q, R := 2R. Go to Step 3.1.
*
* Step 4. R := signX*R.
*
* Step 5. If MOD is requested, go to Step 7.
*
* Step 6. Now, R = MOD(X,Y), convert to REM(X,Y) is requested.
* Do banker's rounding.
* If abs(R) > Y/2
* || (abs(R) == Y/2 && Q % 2 == 1) then
* { Q := Q + 1, R := R - signX * Y }.
*
* Step 7. Return signQ, last 7 bits of Q, and R as required.
*/

static struct fpn * __fpu_modrem(struct fpemu *fe, int is_mod);
static int abscmp3(const struct fpn *a, const struct fpn *b);

/* Absolute FORTRAN Compare */
static int
abscmp3(const struct fpn *a, const struct fpn *b)
{
int i;

if (a->fp_exp < b->fp_exp) {
return -1;
} else if (a->fp_exp > b->fp_exp) {
return 1;
} else {
for (i = 0; i < 3; i++) {
if (a->fp_mant[i] < b->fp_mant[i])
return -1;
else if (a->fp_mant[i] > b->fp_mant[i])
return 1;
}
}
return 0;
}

static struct fpn *
__fpu_modrem(struct fpemu *fe, int is_mod)
{
static struct fpn X, Y;
struct fpn *x, *y, *r;
uint32_t signX, signY, signQ;
int j, l, q;
int cmp;

if (ISNAN(&fe->fe_f1) || ISNAN(&fe->fe_f2))
return fpu_newnan(fe);
if (ISINF(&fe->fe_f1) || ISZERO(&fe->fe_f2))
return fpu_newnan(fe);

CPYFPN(&X, &fe->fe_f1);
CPYFPN(&Y, &fe->fe_f2);
x = &X;
y = &Y;
q = 0;
r = &fe->fe_f2;

/*
* Step 1
*/
signX = x->fp_sign;
signY = y->fp_sign;
signQ = (signX ^ signY);
x->fp_sign = y->fp_sign = 0;

/* Special treatment that just return input value but Q is necessary */
if (ISZERO(x) || ISINF(y)) {
r = &fe->fe_f1;
goto Step7;
}

/*
* Step 2
*/
l = x->fp_exp - y->fp_exp;
CPYFPN(r, x);
if (l >= 0) {
r->fp_exp -= l;
j = l;

/*
* Step 3
*/
for (;;) {
cmp = abscmp3(r, y);

/* Step 3.1 */
if (cmp == 0)
break;

/* Step 3.2 */
if (cmp > 0) {
CPYFPN(&fe->fe_f1, r);
CPYFPN(&fe->fe_f2, y);
fe->fe_f2.fp_sign = 1;
r = fpu_add(fe);
q++;
}

/* Step 3.3 */
if (j == 0)
goto Step4;

/* Step 3.4 */
j--;
q += q;
r->fp_exp++;
}
/* R == Y */
q++;
r->fp_class = FPC_ZERO;
goto Step7;
}
Step4:
r->fp_sign = signX;

/*
* Step 5
*/
if (is_mod)
goto Step7;

/*
* Step 6
*/
/* y = y / 2 */
y->fp_exp--;
/* abscmp3 ignore sign */
cmp = abscmp3(r, y);
/* revert y */
y->fp_exp++;

if (cmp > 0 || (cmp == 0 && q % 2)) {
q++;
CPYFPN(&fe->fe_f1, r);
CPYFPN(&fe->fe_f2, y);
fe->fe_f2.fp_sign = !signX;
r = fpu_add(fe);
}

/*
* Step 7
*/
Step7:
q &= 0x7f;
q |= (signQ << 7);
fe->fe_fpframe->fpf_fpsr =
fe->fe_fpsr =
(fe->fe_fpsr & ~FPSR_QTT) | (q << 16);
return r;
}

struct fpn *
fpu_rem(struct fpemu *fe)
{
return __fpu_modrem(fe, 0);
}

struct fpn *
fpu_mod(struct fpemu *fe)
{
return __fpu_modrem(fe, 1);
}