fpu_trig.c - cachepc-linux - Fork of AMDESE/linux with modifications for CachePC side-channel attack

	cachepc-linux Fork of AMDESE/linux with modifications for CachePC side-channel attack
	git clone https://git.sinitax.com/sinitax/cachepc-linux
	Log \| Files \| Refs \| README \| LICENSE \| sfeed.txt
fpu_trig.c (39259B)
      1// SPDX-License-Identifier: GPL-2.0
      2/*---------------------------------------------------------------------------+
      3 |  fpu_trig.c                                                               |
      4 |                                                                           |
      5 | Implementation of the FPU "transcendental" functions.                     |
      6 |                                                                           |
      7 | Copyright (C) 1992,1993,1994,1997,1999                                    |
      8 |                       W. Metzenthen, 22 Parker St, Ormond, Vic 3163,      |
      9 |                       Australia.  E-mail   billm@melbpc.org.au            |
     10 |                                                                           |
     11 |                                                                           |
     12 +---------------------------------------------------------------------------*/
     13
     14#include "fpu_system.h"
     15#include "exception.h"
     16#include "fpu_emu.h"
     17#include "status_w.h"
     18#include "control_w.h"
     19#include "reg_constant.h"
     20
     21static void rem_kernel(unsigned long long st0, unsigned long long *y,
     22		       unsigned long long st1, unsigned long long q, int n);
     23
     24#define BETTER_THAN_486
     25
     26#define FCOS  4
     27
     28/* Used only by fptan, fsin, fcos, and fsincos. */
     29/* This routine produces very accurate results, similar to
     30   using a value of pi with more than 128 bits precision. */
     31/* Limited measurements show no results worse than 64 bit precision
     32   except for the results for arguments close to 2^63, where the
     33   precision of the result sometimes degrades to about 63.9 bits */
     34static int trig_arg(FPU_REG *st0_ptr, int even)
     35{
     36	FPU_REG tmp;
     37	u_char tmptag;
     38	unsigned long long q;
     39	int old_cw = control_word, saved_status = partial_status;
     40	int tag, st0_tag = TAG_Valid;
     41
     42	if (exponent(st0_ptr) >= 63) {
     43		partial_status |= SW_C2;	/* Reduction incomplete. */
     44		return -1;
     45	}
     46
     47	control_word &= ~CW_RC;
     48	control_word |= RC_CHOP;
     49
     50	setpositive(st0_ptr);
     51	tag = FPU_u_div(st0_ptr, &CONST_PI2, &tmp, PR_64_BITS | RC_CHOP | 0x3f,
     52			SIGN_POS);
     53
     54	FPU_round_to_int(&tmp, tag);	/* Fortunately, this can't overflow
     55					   to 2^64 */
     56	q = significand(&tmp);
     57	if (q) {
     58		rem_kernel(significand(st0_ptr),
     59			   &significand(&tmp),
     60			   significand(&CONST_PI2),
     61			   q, exponent(st0_ptr) - exponent(&CONST_PI2));
     62		setexponent16(&tmp, exponent(&CONST_PI2));
     63		st0_tag = FPU_normalize(&tmp);
     64		FPU_copy_to_reg0(&tmp, st0_tag);
     65	}
     66
     67	if ((even && !(q & 1)) || (!even && (q & 1))) {
     68		st0_tag =
     69		    FPU_sub(REV | LOADED | TAG_Valid, (int)&CONST_PI2,
     70			    FULL_PRECISION);
     71
     72#ifdef BETTER_THAN_486
     73		/* So far, the results are exact but based upon a 64 bit
     74		   precision approximation to pi/2. The technique used
     75		   now is equivalent to using an approximation to pi/2 which
     76		   is accurate to about 128 bits. */
     77		if ((exponent(st0_ptr) <= exponent(&CONST_PI2extra) + 64)
     78		    || (q > 1)) {
     79			/* This code gives the effect of having pi/2 to better than
     80			   128 bits precision. */
     81
     82			significand(&tmp) = q + 1;
     83			setexponent16(&tmp, 63);
     84			FPU_normalize(&tmp);
     85			tmptag =
     86			    FPU_u_mul(&CONST_PI2extra, &tmp, &tmp,
     87				      FULL_PRECISION, SIGN_POS,
     88				      exponent(&CONST_PI2extra) +
     89				      exponent(&tmp));
     90			setsign(&tmp, getsign(&CONST_PI2extra));
     91			st0_tag = FPU_add(&tmp, tmptag, 0, FULL_PRECISION);
     92			if (signnegative(st0_ptr)) {
     93				/* CONST_PI2extra is negative, so the result of the addition
     94				   can be negative. This means that the argument is actually
     95				   in a different quadrant. The correction is always < pi/2,
     96				   so it can't overflow into yet another quadrant. */
     97				setpositive(st0_ptr);
     98				q++;
     99			}
    100		}
    101#endif /* BETTER_THAN_486 */
    102	}
    103#ifdef BETTER_THAN_486
    104	else {
    105		/* So far, the results are exact but based upon a 64 bit
    106		   precision approximation to pi/2. The technique used
    107		   now is equivalent to using an approximation to pi/2 which
    108		   is accurate to about 128 bits. */
    109		if (((q > 0)
    110		     && (exponent(st0_ptr) <= exponent(&CONST_PI2extra) + 64))
    111		    || (q > 1)) {
    112			/* This code gives the effect of having p/2 to better than
    113			   128 bits precision. */
    114
    115			significand(&tmp) = q;
    116			setexponent16(&tmp, 63);
    117			FPU_normalize(&tmp);	/* This must return TAG_Valid */
    118			tmptag =
    119			    FPU_u_mul(&CONST_PI2extra, &tmp, &tmp,
    120				      FULL_PRECISION, SIGN_POS,
    121				      exponent(&CONST_PI2extra) +
    122				      exponent(&tmp));
    123			setsign(&tmp, getsign(&CONST_PI2extra));
    124			st0_tag = FPU_sub(LOADED | (tmptag & 0x0f), (int)&tmp,
    125					  FULL_PRECISION);
    126			if ((exponent(st0_ptr) == exponent(&CONST_PI2)) &&
    127			    ((st0_ptr->sigh > CONST_PI2.sigh)
    128			     || ((st0_ptr->sigh == CONST_PI2.sigh)
    129				 && (st0_ptr->sigl > CONST_PI2.sigl)))) {
    130				/* CONST_PI2extra is negative, so the result of the
    131				   subtraction can be larger than pi/2. This means
    132				   that the argument is actually in a different quadrant.
    133				   The correction is always < pi/2, so it can't overflow
    134				   into yet another quadrant. */
    135				st0_tag =
    136				    FPU_sub(REV | LOADED | TAG_Valid,
    137					    (int)&CONST_PI2, FULL_PRECISION);
    138				q++;
    139			}
    140		}
    141	}
    142#endif /* BETTER_THAN_486 */
    143
    144	FPU_settag0(st0_tag);
    145	control_word = old_cw;
    146	partial_status = saved_status & ~SW_C2;	/* Reduction complete. */
    147
    148	return (q & 3) | even;
    149}
    150
    151/* Convert a long to register */
    152static void convert_l2reg(long const *arg, int deststnr)
    153{
    154	int tag;
    155	long num = *arg;
    156	u_char sign;
    157	FPU_REG *dest = &st(deststnr);
    158
    159	if (num == 0) {
    160		FPU_copy_to_regi(&CONST_Z, TAG_Zero, deststnr);
    161		return;
    162	}
    163
    164	if (num > 0) {
    165		sign = SIGN_POS;
    166	} else {
    167		num = -num;
    168		sign = SIGN_NEG;
    169	}
    170
    171	dest->sigh = num;
    172	dest->sigl = 0;
    173	setexponent16(dest, 31);
    174	tag = FPU_normalize(dest);
    175	FPU_settagi(deststnr, tag);
    176	setsign(dest, sign);
    177	return;
    178}
    179
    180static void single_arg_error(FPU_REG *st0_ptr, u_char st0_tag)
    181{
    182	if (st0_tag == TAG_Empty)
    183		FPU_stack_underflow();	/* Puts a QNaN in st(0) */
    184	else if (st0_tag == TW_NaN)
    185		real_1op_NaN(st0_ptr);	/* return with a NaN in st(0) */
    186#ifdef PARANOID
    187	else
    188		EXCEPTION(EX_INTERNAL | 0x0112);
    189#endif /* PARANOID */
    190}
    191
    192static void single_arg_2_error(FPU_REG *st0_ptr, u_char st0_tag)
    193{
    194	int isNaN;
    195
    196	switch (st0_tag) {
    197	case TW_NaN:
    198		isNaN = (exponent(st0_ptr) == EXP_OVER)
    199		    && (st0_ptr->sigh & 0x80000000);
    200		if (isNaN && !(st0_ptr->sigh & 0x40000000)) {	/* Signaling ? */
    201			EXCEPTION(EX_Invalid);
    202			if (control_word & CW_Invalid) {
    203				/* The masked response */
    204				/* Convert to a QNaN */
    205				st0_ptr->sigh |= 0x40000000;
    206				push();
    207				FPU_copy_to_reg0(st0_ptr, TAG_Special);
    208			}
    209		} else if (isNaN) {
    210			/* A QNaN */
    211			push();
    212			FPU_copy_to_reg0(st0_ptr, TAG_Special);
    213		} else {
    214			/* pseudoNaN or other unsupported */
    215			EXCEPTION(EX_Invalid);
    216			if (control_word & CW_Invalid) {
    217				/* The masked response */
    218				FPU_copy_to_reg0(&CONST_QNaN, TAG_Special);
    219				push();
    220				FPU_copy_to_reg0(&CONST_QNaN, TAG_Special);
    221			}
    222		}
    223		break;		/* return with a NaN in st(0) */
    224#ifdef PARANOID
    225	default:
    226		EXCEPTION(EX_INTERNAL | 0x0112);
    227#endif /* PARANOID */
    228	}
    229}
    230
    231/*---------------------------------------------------------------------------*/
    232
    233static void f2xm1(FPU_REG *st0_ptr, u_char tag)
    234{
    235	FPU_REG a;
    236
    237	clear_C1();
    238
    239	if (tag == TAG_Valid) {
    240		/* For an 80486 FPU, the result is undefined if the arg is >= 1.0 */
    241		if (exponent(st0_ptr) < 0) {
    242		      denormal_arg:
    243
    244			FPU_to_exp16(st0_ptr, &a);
    245
    246			/* poly_2xm1(x) requires 0 < st(0) < 1. */
    247			poly_2xm1(getsign(st0_ptr), &a, st0_ptr);
    248		}
    249		set_precision_flag_up();	/* 80486 appears to always do this */
    250		return;
    251	}
    252
    253	if (tag == TAG_Zero)
    254		return;
    255
    256	if (tag == TAG_Special)
    257		tag = FPU_Special(st0_ptr);
    258
    259	switch (tag) {
    260	case TW_Denormal:
    261		if (denormal_operand() < 0)
    262			return;
    263		goto denormal_arg;
    264	case TW_Infinity:
    265		if (signnegative(st0_ptr)) {
    266			/* -infinity gives -1 (p16-10) */
    267			FPU_copy_to_reg0(&CONST_1, TAG_Valid);
    268			setnegative(st0_ptr);
    269		}
    270		return;
    271	default:
    272		single_arg_error(st0_ptr, tag);
    273	}
    274}
    275
    276static void fptan(FPU_REG *st0_ptr, u_char st0_tag)
    277{
    278	FPU_REG *st_new_ptr;
    279	int q;
    280	u_char arg_sign = getsign(st0_ptr);
    281
    282	/* Stack underflow has higher priority */
    283	if (st0_tag == TAG_Empty) {
    284		FPU_stack_underflow();	/* Puts a QNaN in st(0) */
    285		if (control_word & CW_Invalid) {
    286			st_new_ptr = &st(-1);
    287			push();
    288			FPU_stack_underflow();	/* Puts a QNaN in the new st(0) */
    289		}
    290		return;
    291	}
    292
    293	if (STACK_OVERFLOW) {
    294		FPU_stack_overflow();
    295		return;
    296	}
    297
    298	if (st0_tag == TAG_Valid) {
    299		if (exponent(st0_ptr) > -40) {
    300			if ((q = trig_arg(st0_ptr, 0)) == -1) {
    301				/* Operand is out of range */
    302				return;
    303			}
    304
    305			poly_tan(st0_ptr);
    306			setsign(st0_ptr, (q & 1) ^ (arg_sign != 0));
    307			set_precision_flag_up();	/* We do not really know if up or down */
    308		} else {
    309			/* For a small arg, the result == the argument */
    310			/* Underflow may happen */
    311
    312		      denormal_arg:
    313
    314			FPU_to_exp16(st0_ptr, st0_ptr);
    315
    316			st0_tag =
    317			    FPU_round(st0_ptr, 1, 0, FULL_PRECISION, arg_sign);
    318			FPU_settag0(st0_tag);
    319		}
    320		push();
    321		FPU_copy_to_reg0(&CONST_1, TAG_Valid);
    322		return;
    323	}
    324
    325	if (st0_tag == TAG_Zero) {
    326		push();
    327		FPU_copy_to_reg0(&CONST_1, TAG_Valid);
    328		setcc(0);
    329		return;
    330	}
    331
    332	if (st0_tag == TAG_Special)
    333		st0_tag = FPU_Special(st0_ptr);
    334
    335	if (st0_tag == TW_Denormal) {
    336		if (denormal_operand() < 0)
    337			return;
    338
    339		goto denormal_arg;
    340	}
    341
    342	if (st0_tag == TW_Infinity) {
    343		/* The 80486 treats infinity as an invalid operand */
    344		if (arith_invalid(0) >= 0) {
    345			st_new_ptr = &st(-1);
    346			push();
    347			arith_invalid(0);
    348		}
    349		return;
    350	}
    351
    352	single_arg_2_error(st0_ptr, st0_tag);
    353}
    354
    355static void fxtract(FPU_REG *st0_ptr, u_char st0_tag)
    356{
    357	FPU_REG *st_new_ptr;
    358	u_char sign;
    359	register FPU_REG *st1_ptr = st0_ptr;	/* anticipate */
    360
    361	if (STACK_OVERFLOW) {
    362		FPU_stack_overflow();
    363		return;
    364	}
    365
    366	clear_C1();
    367
    368	if (st0_tag == TAG_Valid) {
    369		long e;
    370
    371		push();
    372		sign = getsign(st1_ptr);
    373		reg_copy(st1_ptr, st_new_ptr);
    374		setexponent16(st_new_ptr, exponent(st_new_ptr));
    375
    376	      denormal_arg:
    377
    378		e = exponent16(st_new_ptr);
    379		convert_l2reg(&e, 1);
    380		setexponentpos(st_new_ptr, 0);
    381		setsign(st_new_ptr, sign);
    382		FPU_settag0(TAG_Valid);	/* Needed if arg was a denormal */
    383		return;
    384	} else if (st0_tag == TAG_Zero) {
    385		sign = getsign(st0_ptr);
    386
    387		if (FPU_divide_by_zero(0, SIGN_NEG) < 0)
    388			return;
    389
    390		push();
    391		FPU_copy_to_reg0(&CONST_Z, TAG_Zero);
    392		setsign(st_new_ptr, sign);
    393		return;
    394	}
    395
    396	if (st0_tag == TAG_Special)
    397		st0_tag = FPU_Special(st0_ptr);
    398
    399	if (st0_tag == TW_Denormal) {
    400		if (denormal_operand() < 0)
    401			return;
    402
    403		push();
    404		sign = getsign(st1_ptr);
    405		FPU_to_exp16(st1_ptr, st_new_ptr);
    406		goto denormal_arg;
    407	} else if (st0_tag == TW_Infinity) {
    408		sign = getsign(st0_ptr);
    409		setpositive(st0_ptr);
    410		push();
    411		FPU_copy_to_reg0(&CONST_INF, TAG_Special);
    412		setsign(st_new_ptr, sign);
    413		return;
    414	} else if (st0_tag == TW_NaN) {
    415		if (real_1op_NaN(st0_ptr) < 0)
    416			return;
    417
    418		push();
    419		FPU_copy_to_reg0(st0_ptr, TAG_Special);
    420		return;
    421	} else if (st0_tag == TAG_Empty) {
    422		/* Is this the correct behaviour? */
    423		if (control_word & EX_Invalid) {
    424			FPU_stack_underflow();
    425			push();
    426			FPU_stack_underflow();
    427		} else
    428			EXCEPTION(EX_StackUnder);
    429	}
    430#ifdef PARANOID
    431	else
    432		EXCEPTION(EX_INTERNAL | 0x119);
    433#endif /* PARANOID */
    434}
    435
    436static void fdecstp(void)
    437{
    438	clear_C1();
    439	top--;
    440}
    441
    442static void fincstp(void)
    443{
    444	clear_C1();
    445	top++;
    446}
    447
    448static void fsqrt_(FPU_REG *st0_ptr, u_char st0_tag)
    449{
    450	int expon;
    451
    452	clear_C1();
    453
    454	if (st0_tag == TAG_Valid) {
    455		u_char tag;
    456
    457		if (signnegative(st0_ptr)) {
    458			arith_invalid(0);	/* sqrt(negative) is invalid */
    459			return;
    460		}
    461
    462		/* make st(0) in  [1.0 .. 4.0) */
    463		expon = exponent(st0_ptr);
    464
    465	      denormal_arg:
    466
    467		setexponent16(st0_ptr, (expon & 1));
    468
    469		/* Do the computation, the sign of the result will be positive. */
    470		tag = wm_sqrt(st0_ptr, 0, 0, control_word, SIGN_POS);
    471		addexponent(st0_ptr, expon >> 1);
    472		FPU_settag0(tag);
    473		return;
    474	}
    475
    476	if (st0_tag == TAG_Zero)
    477		return;
    478
    479	if (st0_tag == TAG_Special)
    480		st0_tag = FPU_Special(st0_ptr);
    481
    482	if (st0_tag == TW_Infinity) {
    483		if (signnegative(st0_ptr))
    484			arith_invalid(0);	/* sqrt(-Infinity) is invalid */
    485		return;
    486	} else if (st0_tag == TW_Denormal) {
    487		if (signnegative(st0_ptr)) {
    488			arith_invalid(0);	/* sqrt(negative) is invalid */
    489			return;
    490		}
    491
    492		if (denormal_operand() < 0)
    493			return;
    494
    495		FPU_to_exp16(st0_ptr, st0_ptr);
    496
    497		expon = exponent16(st0_ptr);
    498
    499		goto denormal_arg;
    500	}
    501
    502	single_arg_error(st0_ptr, st0_tag);
    503
    504}
    505
    506static void frndint_(FPU_REG *st0_ptr, u_char st0_tag)
    507{
    508	int flags, tag;
    509
    510	if (st0_tag == TAG_Valid) {
    511		u_char sign;
    512
    513	      denormal_arg:
    514
    515		sign = getsign(st0_ptr);
    516
    517		if (exponent(st0_ptr) > 63)
    518			return;
    519
    520		if (st0_tag == TW_Denormal) {
    521			if (denormal_operand() < 0)
    522				return;
    523		}
    524
    525		/* Fortunately, this can't overflow to 2^64 */
    526		if ((flags = FPU_round_to_int(st0_ptr, st0_tag)))
    527			set_precision_flag(flags);
    528
    529		setexponent16(st0_ptr, 63);
    530		tag = FPU_normalize(st0_ptr);
    531		setsign(st0_ptr, sign);
    532		FPU_settag0(tag);
    533		return;
    534	}
    535
    536	if (st0_tag == TAG_Zero)
    537		return;
    538
    539	if (st0_tag == TAG_Special)
    540		st0_tag = FPU_Special(st0_ptr);
    541
    542	if (st0_tag == TW_Denormal)
    543		goto denormal_arg;
    544	else if (st0_tag == TW_Infinity)
    545		return;
    546	else
    547		single_arg_error(st0_ptr, st0_tag);
    548}
    549
    550static int f_sin(FPU_REG *st0_ptr, u_char tag)
    551{
    552	u_char arg_sign = getsign(st0_ptr);
    553
    554	if (tag == TAG_Valid) {
    555		int q;
    556
    557		if (exponent(st0_ptr) > -40) {
    558			if ((q = trig_arg(st0_ptr, 0)) == -1) {
    559				/* Operand is out of range */
    560				return 1;
    561			}
    562
    563			poly_sine(st0_ptr);
    564
    565			if (q & 2)
    566				changesign(st0_ptr);
    567
    568			setsign(st0_ptr, getsign(st0_ptr) ^ arg_sign);
    569
    570			/* We do not really know if up or down */
    571			set_precision_flag_up();
    572			return 0;
    573		} else {
    574			/* For a small arg, the result == the argument */
    575			set_precision_flag_up();	/* Must be up. */
    576			return 0;
    577		}
    578	}
    579
    580	if (tag == TAG_Zero) {
    581		setcc(0);
    582		return 0;
    583	}
    584
    585	if (tag == TAG_Special)
    586		tag = FPU_Special(st0_ptr);
    587
    588	if (tag == TW_Denormal) {
    589		if (denormal_operand() < 0)
    590			return 1;
    591
    592		/* For a small arg, the result == the argument */
    593		/* Underflow may happen */
    594		FPU_to_exp16(st0_ptr, st0_ptr);
    595
    596		tag = FPU_round(st0_ptr, 1, 0, FULL_PRECISION, arg_sign);
    597
    598		FPU_settag0(tag);
    599
    600		return 0;
    601	} else if (tag == TW_Infinity) {
    602		/* The 80486 treats infinity as an invalid operand */
    603		arith_invalid(0);
    604		return 1;
    605	} else {
    606		single_arg_error(st0_ptr, tag);
    607		return 1;
    608	}
    609}
    610
    611static void fsin(FPU_REG *st0_ptr, u_char tag)
    612{
    613	f_sin(st0_ptr, tag);
    614}
    615
    616static int f_cos(FPU_REG *st0_ptr, u_char tag)
    617{
    618	u_char st0_sign;
    619
    620	st0_sign = getsign(st0_ptr);
    621
    622	if (tag == TAG_Valid) {
    623		int q;
    624
    625		if (exponent(st0_ptr) > -40) {
    626			if ((exponent(st0_ptr) < 0)
    627			    || ((exponent(st0_ptr) == 0)
    628				&& (significand(st0_ptr) <=
    629				    0xc90fdaa22168c234LL))) {
    630				poly_cos(st0_ptr);
    631
    632				/* We do not really know if up or down */
    633				set_precision_flag_down();
    634
    635				return 0;
    636			} else if ((q = trig_arg(st0_ptr, FCOS)) != -1) {
    637				poly_sine(st0_ptr);
    638
    639				if ((q + 1) & 2)
    640					changesign(st0_ptr);
    641
    642				/* We do not really know if up or down */
    643				set_precision_flag_down();
    644
    645				return 0;
    646			} else {
    647				/* Operand is out of range */
    648				return 1;
    649			}
    650		} else {
    651		      denormal_arg:
    652
    653			setcc(0);
    654			FPU_copy_to_reg0(&CONST_1, TAG_Valid);
    655#ifdef PECULIAR_486
    656			set_precision_flag_down();	/* 80486 appears to do this. */
    657#else
    658			set_precision_flag_up();	/* Must be up. */
    659#endif /* PECULIAR_486 */
    660			return 0;
    661		}
    662	} else if (tag == TAG_Zero) {
    663		FPU_copy_to_reg0(&CONST_1, TAG_Valid);
    664		setcc(0);
    665		return 0;
    666	}
    667
    668	if (tag == TAG_Special)
    669		tag = FPU_Special(st0_ptr);
    670
    671	if (tag == TW_Denormal) {
    672		if (denormal_operand() < 0)
    673			return 1;
    674
    675		goto denormal_arg;
    676	} else if (tag == TW_Infinity) {
    677		/* The 80486 treats infinity as an invalid operand */
    678		arith_invalid(0);
    679		return 1;
    680	} else {
    681		single_arg_error(st0_ptr, tag);	/* requires st0_ptr == &st(0) */
    682		return 1;
    683	}
    684}
    685
    686static void fcos(FPU_REG *st0_ptr, u_char st0_tag)
    687{
    688	f_cos(st0_ptr, st0_tag);
    689}
    690
    691static void fsincos(FPU_REG *st0_ptr, u_char st0_tag)
    692{
    693	FPU_REG *st_new_ptr;
    694	FPU_REG arg;
    695	u_char tag;
    696
    697	/* Stack underflow has higher priority */
    698	if (st0_tag == TAG_Empty) {
    699		FPU_stack_underflow();	/* Puts a QNaN in st(0) */
    700		if (control_word & CW_Invalid) {
    701			st_new_ptr = &st(-1);
    702			push();
    703			FPU_stack_underflow();	/* Puts a QNaN in the new st(0) */
    704		}
    705		return;
    706	}
    707
    708	if (STACK_OVERFLOW) {
    709		FPU_stack_overflow();
    710		return;
    711	}
    712
    713	if (st0_tag == TAG_Special)
    714		tag = FPU_Special(st0_ptr);
    715	else
    716		tag = st0_tag;
    717
    718	if (tag == TW_NaN) {
    719		single_arg_2_error(st0_ptr, TW_NaN);
    720		return;
    721	} else if (tag == TW_Infinity) {
    722		/* The 80486 treats infinity as an invalid operand */
    723		if (arith_invalid(0) >= 0) {
    724			/* Masked response */
    725			push();
    726			arith_invalid(0);
    727		}
    728		return;
    729	}
    730
    731	reg_copy(st0_ptr, &arg);
    732	if (!f_sin(st0_ptr, st0_tag)) {
    733		push();
    734		FPU_copy_to_reg0(&arg, st0_tag);
    735		f_cos(&st(0), st0_tag);
    736	} else {
    737		/* An error, so restore st(0) */
    738		FPU_copy_to_reg0(&arg, st0_tag);
    739	}
    740}
    741
    742/*---------------------------------------------------------------------------*/
    743/* The following all require two arguments: st(0) and st(1) */
    744
    745/* A lean, mean kernel for the fprem instructions. This relies upon
    746   the division and rounding to an integer in do_fprem giving an
    747   exact result. Because of this, rem_kernel() needs to deal only with
    748   the least significant 64 bits, the more significant bits of the
    749   result must be zero.
    750 */
    751static void rem_kernel(unsigned long long st0, unsigned long long *y,
    752		       unsigned long long st1, unsigned long long q, int n)
    753{
    754	int dummy;
    755	unsigned long long x;
    756
    757	x = st0 << n;
    758
    759	/* Do the required multiplication and subtraction in the one operation */
    760
    761	/* lsw x -= lsw st1 * lsw q */
    762	asm volatile ("mull %4; subl %%eax,%0; sbbl %%edx,%1":"=m"
    763		      (((unsigned *)&x)[0]), "=m"(((unsigned *)&x)[1]),
    764		      "=a"(dummy)
    765		      :"2"(((unsigned *)&st1)[0]), "m"(((unsigned *)&q)[0])
    766		      :"%dx");
    767	/* msw x -= msw st1 * lsw q */
    768	asm volatile ("mull %3; subl %%eax,%0":"=m" (((unsigned *)&x)[1]),
    769		      "=a"(dummy)
    770		      :"1"(((unsigned *)&st1)[1]), "m"(((unsigned *)&q)[0])
    771		      :"%dx");
    772	/* msw x -= lsw st1 * msw q */
    773	asm volatile ("mull %3; subl %%eax,%0":"=m" (((unsigned *)&x)[1]),
    774		      "=a"(dummy)
    775		      :"1"(((unsigned *)&st1)[0]), "m"(((unsigned *)&q)[1])
    776		      :"%dx");
    777
    778	*y = x;
    779}
    780
    781/* Remainder of st(0) / st(1) */
    782/* This routine produces exact results, i.e. there is never any
    783   rounding or truncation, etc of the result. */
    784static void do_fprem(FPU_REG *st0_ptr, u_char st0_tag, int round)
    785{
    786	FPU_REG *st1_ptr = &st(1);
    787	u_char st1_tag = FPU_gettagi(1);
    788
    789	if (!((st0_tag ^ TAG_Valid) | (st1_tag ^ TAG_Valid))) {
    790		FPU_REG tmp, st0, st1;
    791		u_char st0_sign, st1_sign;
    792		u_char tmptag;
    793		int tag;
    794		int old_cw;
    795		int expdif;
    796		long long q;
    797		unsigned short saved_status;
    798		int cc;
    799
    800	      fprem_valid:
    801		/* Convert registers for internal use. */
    802		st0_sign = FPU_to_exp16(st0_ptr, &st0);
    803		st1_sign = FPU_to_exp16(st1_ptr, &st1);
    804		expdif = exponent16(&st0) - exponent16(&st1);
    805
    806		old_cw = control_word;
    807		cc = 0;
    808
    809		/* We want the status following the denorm tests, but don't want
    810		   the status changed by the arithmetic operations. */
    811		saved_status = partial_status;
    812		control_word &= ~CW_RC;
    813		control_word |= RC_CHOP;
    814
    815		if (expdif < 64) {
    816			/* This should be the most common case */
    817
    818			if (expdif > -2) {
    819				u_char sign = st0_sign ^ st1_sign;
    820				tag = FPU_u_div(&st0, &st1, &tmp,
    821						PR_64_BITS | RC_CHOP | 0x3f,
    822						sign);
    823				setsign(&tmp, sign);
    824
    825				if (exponent(&tmp) >= 0) {
    826					FPU_round_to_int(&tmp, tag);	/* Fortunately, this can't
    827									   overflow to 2^64 */
    828					q = significand(&tmp);
    829
    830					rem_kernel(significand(&st0),
    831						   &significand(&tmp),
    832						   significand(&st1),
    833						   q, expdif);
    834
    835					setexponent16(&tmp, exponent16(&st1));
    836				} else {
    837					reg_copy(&st0, &tmp);
    838					q = 0;
    839				}
    840
    841				if ((round == RC_RND)
    842				    && (tmp.sigh & 0xc0000000)) {
    843					/* We may need to subtract st(1) once more,
    844					   to get a result <= 1/2 of st(1). */
    845					unsigned long long x;
    846					expdif =
    847					    exponent16(&st1) - exponent16(&tmp);
    848					if (expdif <= 1) {
    849						if (expdif == 0)
    850							x = significand(&st1) -
    851							    significand(&tmp);
    852						else	/* expdif is 1 */
    853							x = (significand(&st1)
    854							     << 1) -
    855							    significand(&tmp);
    856						if ((x < significand(&tmp)) ||
    857						    /* or equi-distant (from 0 & st(1)) and q is odd */
    858						    ((x == significand(&tmp))
    859						     && (q & 1))) {
    860							st0_sign = !st0_sign;
    861							significand(&tmp) = x;
    862							q++;
    863						}
    864					}
    865				}
    866
    867				if (q & 4)
    868					cc |= SW_C0;
    869				if (q & 2)
    870					cc |= SW_C3;
    871				if (q & 1)
    872					cc |= SW_C1;
    873			} else {
    874				control_word = old_cw;
    875				setcc(0);
    876				return;
    877			}
    878		} else {
    879			/* There is a large exponent difference ( >= 64 ) */
    880			/* To make much sense, the code in this section should
    881			   be done at high precision. */
    882			int exp_1, N;
    883			u_char sign;
    884
    885			/* prevent overflow here */
    886			/* N is 'a number between 32 and 63' (p26-113) */
    887			reg_copy(&st0, &tmp);
    888			tmptag = st0_tag;
    889			N = (expdif & 0x0000001f) + 32;	/* This choice gives results
    890							   identical to an AMD 486 */
    891			setexponent16(&tmp, N);
    892			exp_1 = exponent16(&st1);
    893			setexponent16(&st1, 0);
    894			expdif -= N;
    895
    896			sign = getsign(&tmp) ^ st1_sign;
    897			tag =
    898			    FPU_u_div(&tmp, &st1, &tmp,
    899				      PR_64_BITS | RC_CHOP | 0x3f, sign);
    900			setsign(&tmp, sign);
    901
    902			FPU_round_to_int(&tmp, tag);	/* Fortunately, this can't
    903							   overflow to 2^64 */
    904
    905			rem_kernel(significand(&st0),
    906				   &significand(&tmp),
    907				   significand(&st1),
    908				   significand(&tmp), exponent(&tmp)
    909			    );
    910			setexponent16(&tmp, exp_1 + expdif);
    911
    912			/* It is possible for the operation to be complete here.
    913			   What does the IEEE standard say? The Intel 80486 manual
    914			   implies that the operation will never be completed at this
    915			   point, and the behaviour of a real 80486 confirms this.
    916			 */
    917			if (!(tmp.sigh | tmp.sigl)) {
    918				/* The result is zero */
    919				control_word = old_cw;
    920				partial_status = saved_status;
    921				FPU_copy_to_reg0(&CONST_Z, TAG_Zero);
    922				setsign(&st0, st0_sign);
    923#ifdef PECULIAR_486
    924				setcc(SW_C2);
    925#else
    926				setcc(0);
    927#endif /* PECULIAR_486 */
    928				return;
    929			}
    930			cc = SW_C2;
    931		}
    932
    933		control_word = old_cw;
    934		partial_status = saved_status;
    935		tag = FPU_normalize_nuo(&tmp);
    936		reg_copy(&tmp, st0_ptr);
    937
    938		/* The only condition to be looked for is underflow,
    939		   and it can occur here only if underflow is unmasked. */
    940		if ((exponent16(&tmp) <= EXP_UNDER) && (tag != TAG_Zero)
    941		    && !(control_word & CW_Underflow)) {
    942			setcc(cc);
    943			tag = arith_underflow(st0_ptr);
    944			setsign(st0_ptr, st0_sign);
    945			FPU_settag0(tag);
    946			return;
    947		} else if ((exponent16(&tmp) > EXP_UNDER) || (tag == TAG_Zero)) {
    948			stdexp(st0_ptr);
    949			setsign(st0_ptr, st0_sign);
    950		} else {
    951			tag =
    952			    FPU_round(st0_ptr, 0, 0, FULL_PRECISION, st0_sign);
    953		}
    954		FPU_settag0(tag);
    955		setcc(cc);
    956
    957		return;
    958	}
    959
    960	if (st0_tag == TAG_Special)
    961		st0_tag = FPU_Special(st0_ptr);
    962	if (st1_tag == TAG_Special)
    963		st1_tag = FPU_Special(st1_ptr);
    964
    965	if (((st0_tag == TAG_Valid) && (st1_tag == TW_Denormal))
    966	    || ((st0_tag == TW_Denormal) && (st1_tag == TAG_Valid))
    967	    || ((st0_tag == TW_Denormal) && (st1_tag == TW_Denormal))) {
    968		if (denormal_operand() < 0)
    969			return;
    970		goto fprem_valid;
    971	} else if ((st0_tag == TAG_Empty) || (st1_tag == TAG_Empty)) {
    972		FPU_stack_underflow();
    973		return;
    974	} else if (st0_tag == TAG_Zero) {
    975		if (st1_tag == TAG_Valid) {
    976			setcc(0);
    977			return;
    978		} else if (st1_tag == TW_Denormal) {
    979			if (denormal_operand() < 0)
    980				return;
    981			setcc(0);
    982			return;
    983		} else if (st1_tag == TAG_Zero) {
    984			arith_invalid(0);
    985			return;
    986		} /* fprem(?,0) always invalid */
    987		else if (st1_tag == TW_Infinity) {
    988			setcc(0);
    989			return;
    990		}
    991	} else if ((st0_tag == TAG_Valid) || (st0_tag == TW_Denormal)) {
    992		if (st1_tag == TAG_Zero) {
    993			arith_invalid(0);	/* fprem(Valid,Zero) is invalid */
    994			return;
    995		} else if (st1_tag != TW_NaN) {
    996			if (((st0_tag == TW_Denormal)
    997			     || (st1_tag == TW_Denormal))
    998			    && (denormal_operand() < 0))
    999				return;
   1000
   1001			if (st1_tag == TW_Infinity) {
   1002				/* fprem(Valid,Infinity) is o.k. */
   1003				setcc(0);
   1004				return;
   1005			}
   1006		}
   1007	} else if (st0_tag == TW_Infinity) {
   1008		if (st1_tag != TW_NaN) {
   1009			arith_invalid(0);	/* fprem(Infinity,?) is invalid */
   1010			return;
   1011		}
   1012	}
   1013
   1014	/* One of the registers must contain a NaN if we got here. */
   1015
   1016#ifdef PARANOID
   1017	if ((st0_tag != TW_NaN) && (st1_tag != TW_NaN))
   1018		EXCEPTION(EX_INTERNAL | 0x118);
   1019#endif /* PARANOID */
   1020
   1021	real_2op_NaN(st1_ptr, st1_tag, 0, st1_ptr);
   1022
   1023}
   1024
   1025/* ST(1) <- ST(1) * log ST;  pop ST */
   1026static void fyl2x(FPU_REG *st0_ptr, u_char st0_tag)
   1027{
   1028	FPU_REG *st1_ptr = &st(1), exponent;
   1029	u_char st1_tag = FPU_gettagi(1);
   1030	u_char sign;
   1031	int e, tag;
   1032
   1033	clear_C1();
   1034
   1035	if ((st0_tag == TAG_Valid) && (st1_tag == TAG_Valid)) {
   1036	      both_valid:
   1037		/* Both regs are Valid or Denormal */
   1038		if (signpositive(st0_ptr)) {
   1039			if (st0_tag == TW_Denormal)
   1040				FPU_to_exp16(st0_ptr, st0_ptr);
   1041			else
   1042				/* Convert st(0) for internal use. */
   1043				setexponent16(st0_ptr, exponent(st0_ptr));
   1044
   1045			if ((st0_ptr->sigh == 0x80000000)
   1046			    && (st0_ptr->sigl == 0)) {
   1047				/* Special case. The result can be precise. */
   1048				u_char esign;
   1049				e = exponent16(st0_ptr);
   1050				if (e >= 0) {
   1051					exponent.sigh = e;
   1052					esign = SIGN_POS;
   1053				} else {
   1054					exponent.sigh = -e;
   1055					esign = SIGN_NEG;
   1056				}
   1057				exponent.sigl = 0;
   1058				setexponent16(&exponent, 31);
   1059				tag = FPU_normalize_nuo(&exponent);
   1060				stdexp(&exponent);
   1061				setsign(&exponent, esign);
   1062				tag =
   1063				    FPU_mul(&exponent, tag, 1, FULL_PRECISION);
   1064				if (tag >= 0)
   1065					FPU_settagi(1, tag);
   1066			} else {
   1067				/* The usual case */
   1068				sign = getsign(st1_ptr);
   1069				if (st1_tag == TW_Denormal)
   1070					FPU_to_exp16(st1_ptr, st1_ptr);
   1071				else
   1072					/* Convert st(1) for internal use. */
   1073					setexponent16(st1_ptr,
   1074						      exponent(st1_ptr));
   1075				poly_l2(st0_ptr, st1_ptr, sign);
   1076			}
   1077		} else {
   1078			/* negative */
   1079			if (arith_invalid(1) < 0)
   1080				return;
   1081		}
   1082
   1083		FPU_pop();
   1084
   1085		return;
   1086	}
   1087
   1088	if (st0_tag == TAG_Special)
   1089		st0_tag = FPU_Special(st0_ptr);
   1090	if (st1_tag == TAG_Special)
   1091		st1_tag = FPU_Special(st1_ptr);
   1092
   1093	if ((st0_tag == TAG_Empty) || (st1_tag == TAG_Empty)) {
   1094		FPU_stack_underflow_pop(1);
   1095		return;
   1096	} else if ((st0_tag <= TW_Denormal) && (st1_tag <= TW_Denormal)) {
   1097		if (st0_tag == TAG_Zero) {
   1098			if (st1_tag == TAG_Zero) {
   1099				/* Both args zero is invalid */
   1100				if (arith_invalid(1) < 0)
   1101					return;
   1102			} else {
   1103				u_char sign;
   1104				sign = getsign(st1_ptr) ^ SIGN_NEG;
   1105				if (FPU_divide_by_zero(1, sign) < 0)
   1106					return;
   1107
   1108				setsign(st1_ptr, sign);
   1109			}
   1110		} else if (st1_tag == TAG_Zero) {
   1111			/* st(1) contains zero, st(0) valid <> 0 */
   1112			/* Zero is the valid answer */
   1113			sign = getsign(st1_ptr);
   1114
   1115			if (signnegative(st0_ptr)) {
   1116				/* log(negative) */
   1117				if (arith_invalid(1) < 0)
   1118					return;
   1119			} else if ((st0_tag == TW_Denormal)
   1120				   && (denormal_operand() < 0))
   1121				return;
   1122			else {
   1123				if (exponent(st0_ptr) < 0)
   1124					sign ^= SIGN_NEG;
   1125
   1126				FPU_copy_to_reg1(&CONST_Z, TAG_Zero);
   1127				setsign(st1_ptr, sign);
   1128			}
   1129		} else {
   1130			/* One or both operands are denormals. */
   1131			if (denormal_operand() < 0)
   1132				return;
   1133			goto both_valid;
   1134		}
   1135	} else if ((st0_tag == TW_NaN) || (st1_tag == TW_NaN)) {
   1136		if (real_2op_NaN(st0_ptr, st0_tag, 1, st0_ptr) < 0)
   1137			return;
   1138	}
   1139	/* One or both arg must be an infinity */
   1140	else if (st0_tag == TW_Infinity) {
   1141		if ((signnegative(st0_ptr)) || (st1_tag == TAG_Zero)) {
   1142			/* log(-infinity) or 0*log(infinity) */
   1143			if (arith_invalid(1) < 0)
   1144				return;
   1145		} else {
   1146			u_char sign = getsign(st1_ptr);
   1147
   1148			if ((st1_tag == TW_Denormal)
   1149			    && (denormal_operand() < 0))
   1150				return;
   1151
   1152			FPU_copy_to_reg1(&CONST_INF, TAG_Special);
   1153			setsign(st1_ptr, sign);
   1154		}
   1155	}
   1156	/* st(1) must be infinity here */
   1157	else if (((st0_tag == TAG_Valid) || (st0_tag == TW_Denormal))
   1158		 && (signpositive(st0_ptr))) {
   1159		if (exponent(st0_ptr) >= 0) {
   1160			if ((exponent(st0_ptr) == 0) &&
   1161			    (st0_ptr->sigh == 0x80000000) &&
   1162			    (st0_ptr->sigl == 0)) {
   1163				/* st(0) holds 1.0 */
   1164				/* infinity*log(1) */
   1165				if (arith_invalid(1) < 0)
   1166					return;
   1167			}
   1168			/* else st(0) is positive and > 1.0 */
   1169		} else {
   1170			/* st(0) is positive and < 1.0 */
   1171
   1172			if ((st0_tag == TW_Denormal)
   1173			    && (denormal_operand() < 0))
   1174				return;
   1175
   1176			changesign(st1_ptr);
   1177		}
   1178	} else {
   1179		/* st(0) must be zero or negative */
   1180		if (st0_tag == TAG_Zero) {
   1181			/* This should be invalid, but a real 80486 is happy with it. */
   1182
   1183#ifndef PECULIAR_486
   1184			sign = getsign(st1_ptr);
   1185			if (FPU_divide_by_zero(1, sign) < 0)
   1186				return;
   1187#endif /* PECULIAR_486 */
   1188
   1189			changesign(st1_ptr);
   1190		} else if (arith_invalid(1) < 0)	/* log(negative) */
   1191			return;
   1192	}
   1193
   1194	FPU_pop();
   1195}
   1196
   1197static void fpatan(FPU_REG *st0_ptr, u_char st0_tag)
   1198{
   1199	FPU_REG *st1_ptr = &st(1);
   1200	u_char st1_tag = FPU_gettagi(1);
   1201	int tag;
   1202
   1203	clear_C1();
   1204	if (!((st0_tag ^ TAG_Valid) | (st1_tag ^ TAG_Valid))) {
   1205	      valid_atan:
   1206
   1207		poly_atan(st0_ptr, st0_tag, st1_ptr, st1_tag);
   1208
   1209		FPU_pop();
   1210
   1211		return;
   1212	}
   1213
   1214	if (st0_tag == TAG_Special)
   1215		st0_tag = FPU_Special(st0_ptr);
   1216	if (st1_tag == TAG_Special)
   1217		st1_tag = FPU_Special(st1_ptr);
   1218
   1219	if (((st0_tag == TAG_Valid) && (st1_tag == TW_Denormal))
   1220	    || ((st0_tag == TW_Denormal) && (st1_tag == TAG_Valid))
   1221	    || ((st0_tag == TW_Denormal) && (st1_tag == TW_Denormal))) {
   1222		if (denormal_operand() < 0)
   1223			return;
   1224
   1225		goto valid_atan;
   1226	} else if ((st0_tag == TAG_Empty) || (st1_tag == TAG_Empty)) {
   1227		FPU_stack_underflow_pop(1);
   1228		return;
   1229	} else if ((st0_tag == TW_NaN) || (st1_tag == TW_NaN)) {
   1230		if (real_2op_NaN(st0_ptr, st0_tag, 1, st0_ptr) >= 0)
   1231			FPU_pop();
   1232		return;
   1233	} else if ((st0_tag == TW_Infinity) || (st1_tag == TW_Infinity)) {
   1234		u_char sign = getsign(st1_ptr);
   1235		if (st0_tag == TW_Infinity) {
   1236			if (st1_tag == TW_Infinity) {
   1237				if (signpositive(st0_ptr)) {
   1238					FPU_copy_to_reg1(&CONST_PI4, TAG_Valid);
   1239				} else {
   1240					setpositive(st1_ptr);
   1241					tag =
   1242					    FPU_u_add(&CONST_PI4, &CONST_PI2,
   1243						      st1_ptr, FULL_PRECISION,
   1244						      SIGN_POS,
   1245						      exponent(&CONST_PI4),
   1246						      exponent(&CONST_PI2));
   1247					if (tag >= 0)
   1248						FPU_settagi(1, tag);
   1249				}
   1250			} else {
   1251				if ((st1_tag == TW_Denormal)
   1252				    && (denormal_operand() < 0))
   1253					return;
   1254
   1255				if (signpositive(st0_ptr)) {
   1256					FPU_copy_to_reg1(&CONST_Z, TAG_Zero);
   1257					setsign(st1_ptr, sign);	/* An 80486 preserves the sign */
   1258					FPU_pop();
   1259					return;
   1260				} else {
   1261					FPU_copy_to_reg1(&CONST_PI, TAG_Valid);
   1262				}
   1263			}
   1264		} else {
   1265			/* st(1) is infinity, st(0) not infinity */
   1266			if ((st0_tag == TW_Denormal)
   1267			    && (denormal_operand() < 0))
   1268				return;
   1269
   1270			FPU_copy_to_reg1(&CONST_PI2, TAG_Valid);
   1271		}
   1272		setsign(st1_ptr, sign);
   1273	} else if (st1_tag == TAG_Zero) {
   1274		/* st(0) must be valid or zero */
   1275		u_char sign = getsign(st1_ptr);
   1276
   1277		if ((st0_tag == TW_Denormal) && (denormal_operand() < 0))
   1278			return;
   1279
   1280		if (signpositive(st0_ptr)) {
   1281			/* An 80486 preserves the sign */
   1282			FPU_pop();
   1283			return;
   1284		}
   1285
   1286		FPU_copy_to_reg1(&CONST_PI, TAG_Valid);
   1287		setsign(st1_ptr, sign);
   1288	} else if (st0_tag == TAG_Zero) {
   1289		/* st(1) must be TAG_Valid here */
   1290		u_char sign = getsign(st1_ptr);
   1291
   1292		if ((st1_tag == TW_Denormal) && (denormal_operand() < 0))
   1293			return;
   1294
   1295		FPU_copy_to_reg1(&CONST_PI2, TAG_Valid);
   1296		setsign(st1_ptr, sign);
   1297	}
   1298#ifdef PARANOID
   1299	else
   1300		EXCEPTION(EX_INTERNAL | 0x125);
   1301#endif /* PARANOID */
   1302
   1303	FPU_pop();
   1304	set_precision_flag_up();	/* We do not really know if up or down */
   1305}
   1306
   1307static void fprem(FPU_REG *st0_ptr, u_char st0_tag)
   1308{
   1309	do_fprem(st0_ptr, st0_tag, RC_CHOP);
   1310}
   1311
   1312static void fprem1(FPU_REG *st0_ptr, u_char st0_tag)
   1313{
   1314	do_fprem(st0_ptr, st0_tag, RC_RND);
   1315}
   1316
   1317static void fyl2xp1(FPU_REG *st0_ptr, u_char st0_tag)
   1318{
   1319	u_char sign, sign1;
   1320	FPU_REG *st1_ptr = &st(1), a, b;
   1321	u_char st1_tag = FPU_gettagi(1);
   1322
   1323	clear_C1();
   1324	if (!((st0_tag ^ TAG_Valid) | (st1_tag ^ TAG_Valid))) {
   1325	      valid_yl2xp1:
   1326
   1327		sign = getsign(st0_ptr);
   1328		sign1 = getsign(st1_ptr);
   1329
   1330		FPU_to_exp16(st0_ptr, &a);
   1331		FPU_to_exp16(st1_ptr, &b);
   1332
   1333		if (poly_l2p1(sign, sign1, &a, &b, st1_ptr))
   1334			return;
   1335
   1336		FPU_pop();
   1337		return;
   1338	}
   1339
   1340	if (st0_tag == TAG_Special)
   1341		st0_tag = FPU_Special(st0_ptr);
   1342	if (st1_tag == TAG_Special)
   1343		st1_tag = FPU_Special(st1_ptr);
   1344
   1345	if (((st0_tag == TAG_Valid) && (st1_tag == TW_Denormal))
   1346	    || ((st0_tag == TW_Denormal) && (st1_tag == TAG_Valid))
   1347	    || ((st0_tag == TW_Denormal) && (st1_tag == TW_Denormal))) {
   1348		if (denormal_operand() < 0)
   1349			return;
   1350
   1351		goto valid_yl2xp1;
   1352	} else if ((st0_tag == TAG_Empty) | (st1_tag == TAG_Empty)) {
   1353		FPU_stack_underflow_pop(1);
   1354		return;
   1355	} else if (st0_tag == TAG_Zero) {
   1356		switch (st1_tag) {
   1357		case TW_Denormal:
   1358			if (denormal_operand() < 0)
   1359				return;
   1360			fallthrough;
   1361		case TAG_Zero:
   1362		case TAG_Valid:
   1363			setsign(st0_ptr, getsign(st0_ptr) ^ getsign(st1_ptr));
   1364			FPU_copy_to_reg1(st0_ptr, st0_tag);
   1365			break;
   1366
   1367		case TW_Infinity:
   1368			/* Infinity*log(1) */
   1369			if (arith_invalid(1) < 0)
   1370				return;
   1371			break;
   1372
   1373		case TW_NaN:
   1374			if (real_2op_NaN(st0_ptr, st0_tag, 1, st0_ptr) < 0)
   1375				return;
   1376			break;
   1377
   1378		default:
   1379#ifdef PARANOID
   1380			EXCEPTION(EX_INTERNAL | 0x116);
   1381			return;
   1382#endif /* PARANOID */
   1383			break;
   1384		}
   1385	} else if ((st0_tag == TAG_Valid) || (st0_tag == TW_Denormal)) {
   1386		switch (st1_tag) {
   1387		case TAG_Zero:
   1388			if (signnegative(st0_ptr)) {
   1389				if (exponent(st0_ptr) >= 0) {
   1390					/* st(0) holds <= -1.0 */
   1391#ifdef PECULIAR_486		/* Stupid 80486 doesn't worry about log(negative). */
   1392					changesign(st1_ptr);
   1393#else
   1394					if (arith_invalid(1) < 0)
   1395						return;
   1396#endif /* PECULIAR_486 */
   1397				} else if ((st0_tag == TW_Denormal)
   1398					   && (denormal_operand() < 0))
   1399					return;
   1400				else
   1401					changesign(st1_ptr);
   1402			} else if ((st0_tag == TW_Denormal)
   1403				   && (denormal_operand() < 0))
   1404				return;
   1405			break;
   1406
   1407		case TW_Infinity:
   1408			if (signnegative(st0_ptr)) {
   1409				if ((exponent(st0_ptr) >= 0) &&
   1410				    !((st0_ptr->sigh == 0x80000000) &&
   1411				      (st0_ptr->sigl == 0))) {
   1412					/* st(0) holds < -1.0 */
   1413#ifdef PECULIAR_486		/* Stupid 80486 doesn't worry about log(negative). */
   1414					changesign(st1_ptr);
   1415#else
   1416					if (arith_invalid(1) < 0)
   1417						return;
   1418#endif /* PECULIAR_486 */
   1419				} else if ((st0_tag == TW_Denormal)
   1420					   && (denormal_operand() < 0))
   1421					return;
   1422				else
   1423					changesign(st1_ptr);
   1424			} else if ((st0_tag == TW_Denormal)
   1425				   && (denormal_operand() < 0))
   1426				return;
   1427			break;
   1428
   1429		case TW_NaN:
   1430			if (real_2op_NaN(st0_ptr, st0_tag, 1, st0_ptr) < 0)
   1431				return;
   1432		}
   1433
   1434	} else if (st0_tag == TW_NaN) {
   1435		if (real_2op_NaN(st0_ptr, st0_tag, 1, st0_ptr) < 0)
   1436			return;
   1437	} else if (st0_tag == TW_Infinity) {
   1438		if (st1_tag == TW_NaN) {
   1439			if (real_2op_NaN(st0_ptr, st0_tag, 1, st0_ptr) < 0)
   1440				return;
   1441		} else if (signnegative(st0_ptr)) {
   1442#ifndef PECULIAR_486
   1443			/* This should have higher priority than denormals, but... */
   1444			if (arith_invalid(1) < 0)	/* log(-infinity) */
   1445				return;
   1446#endif /* PECULIAR_486 */
   1447			if ((st1_tag == TW_Denormal)
   1448			    && (denormal_operand() < 0))
   1449				return;
   1450#ifdef PECULIAR_486
   1451			/* Denormal operands actually get higher priority */
   1452			if (arith_invalid(1) < 0)	/* log(-infinity) */
   1453				return;
   1454#endif /* PECULIAR_486 */
   1455		} else if (st1_tag == TAG_Zero) {
   1456			/* log(infinity) */
   1457			if (arith_invalid(1) < 0)
   1458				return;
   1459		}
   1460
   1461		/* st(1) must be valid here. */
   1462
   1463		else if ((st1_tag == TW_Denormal) && (denormal_operand() < 0))
   1464			return;
   1465
   1466		/* The Manual says that log(Infinity) is invalid, but a real
   1467		   80486 sensibly says that it is o.k. */
   1468		else {
   1469			u_char sign = getsign(st1_ptr);
   1470			FPU_copy_to_reg1(&CONST_INF, TAG_Special);
   1471			setsign(st1_ptr, sign);
   1472		}
   1473	}
   1474#ifdef PARANOID
   1475	else {
   1476		EXCEPTION(EX_INTERNAL | 0x117);
   1477		return;
   1478	}
   1479#endif /* PARANOID */
   1480
   1481	FPU_pop();
   1482	return;
   1483
   1484}
   1485
   1486static void fscale(FPU_REG *st0_ptr, u_char st0_tag)
   1487{
   1488	FPU_REG *st1_ptr = &st(1);
   1489	u_char st1_tag = FPU_gettagi(1);
   1490	int old_cw = control_word;
   1491	u_char sign = getsign(st0_ptr);
   1492
   1493	clear_C1();
   1494	if (!((st0_tag ^ TAG_Valid) | (st1_tag ^ TAG_Valid))) {
   1495		long scale;
   1496		FPU_REG tmp;
   1497
   1498		/* Convert register for internal use. */
   1499		setexponent16(st0_ptr, exponent(st0_ptr));
   1500
   1501	      valid_scale:
   1502
   1503		if (exponent(st1_ptr) > 30) {
   1504			/* 2^31 is far too large, would require 2^(2^30) or 2^(-2^30) */
   1505
   1506			if (signpositive(st1_ptr)) {
   1507				EXCEPTION(EX_Overflow);
   1508				FPU_copy_to_reg0(&CONST_INF, TAG_Special);
   1509			} else {
   1510				EXCEPTION(EX_Underflow);
   1511				FPU_copy_to_reg0(&CONST_Z, TAG_Zero);
   1512			}
   1513			setsign(st0_ptr, sign);
   1514			return;
   1515		}
   1516
   1517		control_word &= ~CW_RC;
   1518		control_word |= RC_CHOP;
   1519		reg_copy(st1_ptr, &tmp);
   1520		FPU_round_to_int(&tmp, st1_tag);	/* This can never overflow here */
   1521		control_word = old_cw;
   1522		scale = signnegative(st1_ptr) ? -tmp.sigl : tmp.sigl;
   1523		scale += exponent16(st0_ptr);
   1524
   1525		setexponent16(st0_ptr, scale);
   1526
   1527		/* Use FPU_round() to properly detect under/overflow etc */
   1528		FPU_round(st0_ptr, 0, 0, control_word, sign);
   1529
   1530		return;
   1531	}
   1532
   1533	if (st0_tag == TAG_Special)
   1534		st0_tag = FPU_Special(st0_ptr);
   1535	if (st1_tag == TAG_Special)
   1536		st1_tag = FPU_Special(st1_ptr);
   1537
   1538	if ((st0_tag == TAG_Valid) || (st0_tag == TW_Denormal)) {
   1539		switch (st1_tag) {
   1540		case TAG_Valid:
   1541			/* st(0) must be a denormal */
   1542			if ((st0_tag == TW_Denormal)
   1543			    && (denormal_operand() < 0))
   1544				return;
   1545
   1546			FPU_to_exp16(st0_ptr, st0_ptr);	/* Will not be left on stack */
   1547			goto valid_scale;
   1548
   1549		case TAG_Zero:
   1550			if (st0_tag == TW_Denormal)
   1551				denormal_operand();
   1552			return;
   1553
   1554		case TW_Denormal:
   1555			denormal_operand();
   1556			return;
   1557
   1558		case TW_Infinity:
   1559			if ((st0_tag == TW_Denormal)
   1560			    && (denormal_operand() < 0))
   1561				return;
   1562
   1563			if (signpositive(st1_ptr))
   1564				FPU_copy_to_reg0(&CONST_INF, TAG_Special);
   1565			else
   1566				FPU_copy_to_reg0(&CONST_Z, TAG_Zero);
   1567			setsign(st0_ptr, sign);
   1568			return;
   1569
   1570		case TW_NaN:
   1571			real_2op_NaN(st1_ptr, st1_tag, 0, st0_ptr);
   1572			return;
   1573		}
   1574	} else if (st0_tag == TAG_Zero) {
   1575		switch (st1_tag) {
   1576		case TAG_Valid:
   1577		case TAG_Zero:
   1578			return;
   1579
   1580		case TW_Denormal:
   1581			denormal_operand();
   1582			return;
   1583
   1584		case TW_Infinity:
   1585			if (signpositive(st1_ptr))
   1586				arith_invalid(0);	/* Zero scaled by +Infinity */
   1587			return;
   1588
   1589		case TW_NaN:
   1590			real_2op_NaN(st1_ptr, st1_tag, 0, st0_ptr);
   1591			return;
   1592		}
   1593	} else if (st0_tag == TW_Infinity) {
   1594		switch (st1_tag) {
   1595		case TAG_Valid:
   1596		case TAG_Zero:
   1597			return;
   1598
   1599		case TW_Denormal:
   1600			denormal_operand();
   1601			return;
   1602
   1603		case TW_Infinity:
   1604			if (signnegative(st1_ptr))
   1605				arith_invalid(0);	/* Infinity scaled by -Infinity */
   1606			return;
   1607
   1608		case TW_NaN:
   1609			real_2op_NaN(st1_ptr, st1_tag, 0, st0_ptr);
   1610			return;
   1611		}
   1612	} else if (st0_tag == TW_NaN) {
   1613		if (st1_tag != TAG_Empty) {
   1614			real_2op_NaN(st1_ptr, st1_tag, 0, st0_ptr);
   1615			return;
   1616		}
   1617	}
   1618#ifdef PARANOID
   1619	if (!((st0_tag == TAG_Empty) || (st1_tag == TAG_Empty))) {
   1620		EXCEPTION(EX_INTERNAL | 0x115);
   1621		return;
   1622	}
   1623#endif
   1624
   1625	/* At least one of st(0), st(1) must be empty */
   1626	FPU_stack_underflow();
   1627
   1628}
   1629
   1630/*---------------------------------------------------------------------------*/
   1631
   1632static FUNC_ST0 const trig_table_a[] = {
   1633	f2xm1, fyl2x, fptan, fpatan,
   1634	fxtract, fprem1, (FUNC_ST0) fdecstp, (FUNC_ST0) fincstp
   1635};
   1636
   1637void FPU_triga(void)
   1638{
   1639	(trig_table_a[FPU_rm]) (&st(0), FPU_gettag0());
   1640}
   1641
   1642static FUNC_ST0 const trig_table_b[] = {
   1643	fprem, fyl2xp1, fsqrt_, fsincos, frndint_, fscale, fsin, fcos
   1644};
   1645
   1646void FPU_trigb(void)
   1647{
   1648	(trig_table_b[FPU_rm]) (&st(0), FPU_gettag0());
   1649}