xref: /linux/arch/x86/math-emu/fpu_trig.c (revision eb01fe7abbe2d0b38824d2a93fdb4cc3eaf2ccc1)
1 // SPDX-License-Identifier: GPL-2.0
2 /*---------------------------------------------------------------------------+
3  |  fpu_trig.c                                                               |
4  |                                                                           |
5  | Implementation of the FPU "transcendental" functions.                     |
6  |                                                                           |
7  | Copyright (C) 1992,1993,1994,1997,1999                                    |
8  |                       W. Metzenthen, 22 Parker St, Ormond, Vic 3163,      |
9  |                       Australia.  E-mail   billm@melbpc.org.au            |
10  |                                                                           |
11  |                                                                           |
12  +---------------------------------------------------------------------------*/
13 
14 #include "fpu_system.h"
15 #include "exception.h"
16 #include "fpu_emu.h"
17 #include "status_w.h"
18 #include "control_w.h"
19 #include "reg_constant.h"
20 
/* Forward declaration: rem_kernel() is defined further down in this file
   but is already called by trig_arg() below. */
21 static void rem_kernel(unsigned long long st0, unsigned long long *y,
22 		       unsigned long long st1, unsigned long long q, int n);
23 
/* When defined, trig_arg() applies an extra correction term based on
   CONST_PI2extra after the basic pi/2 reduction. */
24 #define BETTER_THAN_486
25 
/* Value passed by f_cos() as the `even` argument of trig_arg(). */
26 #define FCOS  4
27 
28 /* Used only by fptan, fsin, fcos, and fsincos. */
29 /* This routine produces very accurate results, similar to
30    using a value of pi with more than 128 bits precision. */
31 /* Limited measurements show no results worse than 64 bit precision
32    except for the results for arguments close to 2^63, where the
33    precision of the result sometimes degrades to about 63.9 bits */
34 static int trig_arg(FPU_REG *st0_ptr, int even)
35 {
36 	FPU_REG tmp;
37 	u_char tmptag;
38 	unsigned long long q;
39 	int old_cw = control_word, saved_status = partial_status;
40 	int tag, st0_tag = TAG_Valid;
41 
42 	if (exponent(st0_ptr) >= 63) {
43 		partial_status |= SW_C2;	/* Reduction incomplete. */
44 		return -1;
45 	}
46 
47 	control_word &= ~CW_RC;
48 	control_word |= RC_CHOP;
49 
50 	setpositive(st0_ptr);
51 	tag = FPU_u_div(st0_ptr, &CONST_PI2, &tmp, PR_64_BITS | RC_CHOP | 0x3f,
52 			SIGN_POS);
53 
54 	FPU_round_to_int(&tmp, tag);	/* Fortunately, this can't overflow
55 					   to 2^64 */
56 	q = significand(&tmp);
57 	if (q) {
58 		rem_kernel(significand(st0_ptr),
59 			   &significand(&tmp),
60 			   significand(&CONST_PI2),
61 			   q, exponent(st0_ptr) - exponent(&CONST_PI2));
62 		setexponent16(&tmp, exponent(&CONST_PI2));
63 		st0_tag = FPU_normalize(&tmp);
64 		FPU_copy_to_reg0(&tmp, st0_tag);
65 	}
66 
67 	if ((even && !(q & 1)) || (!even && (q & 1))) {
68 		st0_tag =
69 		    FPU_sub(REV | LOADED | TAG_Valid, (int)&CONST_PI2,
70 			    FULL_PRECISION);
71 
72 #ifdef BETTER_THAN_486
73 		/* So far, the results are exact but based upon a 64 bit
74 		   precision approximation to pi/2. The technique used
75 		   now is equivalent to using an approximation to pi/2 which
76 		   is accurate to about 128 bits. */
77 		if ((exponent(st0_ptr) <= exponent(&CONST_PI2extra) + 64)
78 		    || (q > 1)) {
79 			/* This code gives the effect of having pi/2 to better than
80 			   128 bits precision. */
81 
82 			significand(&tmp) = q + 1;
83 			setexponent16(&tmp, 63);
84 			FPU_normalize(&tmp);
85 			tmptag =
86 			    FPU_u_mul(&CONST_PI2extra, &tmp, &tmp,
87 				      FULL_PRECISION, SIGN_POS,
88 				      exponent(&CONST_PI2extra) +
89 				      exponent(&tmp));
90 			setsign(&tmp, getsign(&CONST_PI2extra));
91 			st0_tag = FPU_add(&tmp, tmptag, 0, FULL_PRECISION);
92 			if (signnegative(st0_ptr)) {
93 				/* CONST_PI2extra is negative, so the result of the addition
94 				   can be negative. This means that the argument is actually
95 				   in a different quadrant. The correction is always < pi/2,
96 				   so it can't overflow into yet another quadrant. */
97 				setpositive(st0_ptr);
98 				q++;
99 			}
100 		}
101 #endif /* BETTER_THAN_486 */
102 	}
103 #ifdef BETTER_THAN_486
104 	else {
105 		/* So far, the results are exact but based upon a 64 bit
106 		   precision approximation to pi/2. The technique used
107 		   now is equivalent to using an approximation to pi/2 which
108 		   is accurate to about 128 bits. */
109 		if (((q > 0)
110 		     && (exponent(st0_ptr) <= exponent(&CONST_PI2extra) + 64))
111 		    || (q > 1)) {
112 			/* This code gives the effect of having p/2 to better than
113 			   128 bits precision. */
114 
115 			significand(&tmp) = q;
116 			setexponent16(&tmp, 63);
117 			FPU_normalize(&tmp);	/* This must return TAG_Valid */
118 			tmptag =
119 			    FPU_u_mul(&CONST_PI2extra, &tmp, &tmp,
120 				      FULL_PRECISION, SIGN_POS,
121 				      exponent(&CONST_PI2extra) +
122 				      exponent(&tmp));
123 			setsign(&tmp, getsign(&CONST_PI2extra));
124 			st0_tag = FPU_sub(LOADED | (tmptag & 0x0f), (int)&tmp,
125 					  FULL_PRECISION);
126 			if ((exponent(st0_ptr) == exponent(&CONST_PI2)) &&
127 			    ((st0_ptr->sigh > CONST_PI2.sigh)
128 			     || ((st0_ptr->sigh == CONST_PI2.sigh)
129 				 && (st0_ptr->sigl > CONST_PI2.sigl)))) {
130 				/* CONST_PI2extra is negative, so the result of the
131 				   subtraction can be larger than pi/2. This means
132 				   that the argument is actually in a different quadrant.
133 				   The correction is always < pi/2, so it can't overflow
134 				   into yet another quadrant. */
135 				st0_tag =
136 				    FPU_sub(REV | LOADED | TAG_Valid,
137 					    (int)&CONST_PI2, FULL_PRECISION);
138 				q++;
139 			}
140 		}
141 	}
142 #endif /* BETTER_THAN_486 */
143 
144 	FPU_settag0(st0_tag);
145 	control_word = old_cw;
146 	partial_status = saved_status & ~SW_C2;	/* Reduction complete. */
147 
148 	return (q & 3) | even;
149 }
150 
151 /* Convert a long to register */
152 static void convert_l2reg(long const *arg, int deststnr)
153 {
154 	int tag;
155 	long num = *arg;
156 	u_char sign;
157 	FPU_REG *dest = &st(deststnr);
158 
159 	if (num == 0) {
160 		FPU_copy_to_regi(&CONST_Z, TAG_Zero, deststnr);
161 		return;
162 	}
163 
164 	if (num > 0) {
165 		sign = SIGN_POS;
166 	} else {
167 		num = -num;
168 		sign = SIGN_NEG;
169 	}
170 
171 	dest->sigh = num;
172 	dest->sigl = 0;
173 	setexponent16(dest, 31);
174 	tag = FPU_normalize(dest);
175 	FPU_settagi(deststnr, tag);
176 	setsign(dest, sign);
177 	return;
178 }
179 
180 static void single_arg_error(FPU_REG *st0_ptr, u_char st0_tag)
181 {
182 	if (st0_tag == TAG_Empty)
183 		FPU_stack_underflow();	/* Puts a QNaN in st(0) */
184 	else if (st0_tag == TW_NaN)
185 		real_1op_NaN(st0_ptr);	/* return with a NaN in st(0) */
186 #ifdef PARANOID
187 	else
188 		EXCEPTION(EX_INTERNAL | 0x0112);
189 #endif /* PARANOID */
190 }
191 
192 static void single_arg_2_error(FPU_REG *st0_ptr, u_char st0_tag)
193 {
194 	int isNaN;
195 
196 	switch (st0_tag) {
197 	case TW_NaN:
198 		isNaN = (exponent(st0_ptr) == EXP_OVER)
199 		    && (st0_ptr->sigh & 0x80000000);
200 		if (isNaN && !(st0_ptr->sigh & 0x40000000)) {	/* Signaling ? */
201 			EXCEPTION(EX_Invalid);
202 			if (control_word & CW_Invalid) {
203 				/* The masked response */
204 				/* Convert to a QNaN */
205 				st0_ptr->sigh |= 0x40000000;
206 				push();
207 				FPU_copy_to_reg0(st0_ptr, TAG_Special);
208 			}
209 		} else if (isNaN) {
210 			/* A QNaN */
211 			push();
212 			FPU_copy_to_reg0(st0_ptr, TAG_Special);
213 		} else {
214 			/* pseudoNaN or other unsupported */
215 			EXCEPTION(EX_Invalid);
216 			if (control_word & CW_Invalid) {
217 				/* The masked response */
218 				FPU_copy_to_reg0(&CONST_QNaN, TAG_Special);
219 				push();
220 				FPU_copy_to_reg0(&CONST_QNaN, TAG_Special);
221 			}
222 		}
223 		break;		/* return with a NaN in st(0) */
224 #ifdef PARANOID
225 	default:
226 		EXCEPTION(EX_INTERNAL | 0x0112);
227 #endif /* PARANOID */
228 	}
229 }
230 
231 /*---------------------------------------------------------------------------*/
232 
233 static void f2xm1(FPU_REG *st0_ptr, u_char tag)
234 {
235 	FPU_REG a;
236 
237 	clear_C1();
238 
239 	if (tag == TAG_Valid) {
240 		/* For an 80486 FPU, the result is undefined if the arg is >= 1.0 */
241 		if (exponent(st0_ptr) < 0) {
242 		      denormal_arg:
243 
244 			FPU_to_exp16(st0_ptr, &a);
245 
246 			/* poly_2xm1(x) requires 0 < st(0) < 1. */
247 			poly_2xm1(getsign(st0_ptr), &a, st0_ptr);
248 		}
249 		set_precision_flag_up();	/* 80486 appears to always do this */
250 		return;
251 	}
252 
253 	if (tag == TAG_Zero)
254 		return;
255 
256 	if (tag == TAG_Special)
257 		tag = FPU_Special(st0_ptr);
258 
259 	switch (tag) {
260 	case TW_Denormal:
261 		if (denormal_operand() < 0)
262 			return;
263 		goto denormal_arg;
264 	case TW_Infinity:
265 		if (signnegative(st0_ptr)) {
266 			/* -infinity gives -1 (p16-10) */
267 			FPU_copy_to_reg0(&CONST_1, TAG_Valid);
268 			setnegative(st0_ptr);
269 		}
270 		return;
271 	default:
272 		single_arg_error(st0_ptr, tag);
273 	}
274 }
275 
276 static void fptan(FPU_REG *st0_ptr, u_char st0_tag)
277 {
278 	FPU_REG *st_new_ptr;
279 	int q;
280 	u_char arg_sign = getsign(st0_ptr);
281 
282 	/* Stack underflow has higher priority */
283 	if (st0_tag == TAG_Empty) {
284 		FPU_stack_underflow();	/* Puts a QNaN in st(0) */
285 		if (control_word & CW_Invalid) {
286 			st_new_ptr = &st(-1);
287 			push();
288 			FPU_stack_underflow();	/* Puts a QNaN in the new st(0) */
289 		}
290 		return;
291 	}
292 
293 	if (STACK_OVERFLOW) {
294 		FPU_stack_overflow();
295 		return;
296 	}
297 
298 	if (st0_tag == TAG_Valid) {
299 		if (exponent(st0_ptr) > -40) {
300 			if ((q = trig_arg(st0_ptr, 0)) == -1) {
301 				/* Operand is out of range */
302 				return;
303 			}
304 
305 			poly_tan(st0_ptr);
306 			setsign(st0_ptr, (q & 1) ^ (arg_sign != 0));
307 			set_precision_flag_up();	/* We do not really know if up or down */
308 		} else {
309 			/* For a small arg, the result == the argument */
310 			/* Underflow may happen */
311 
312 		      denormal_arg:
313 
314 			FPU_to_exp16(st0_ptr, st0_ptr);
315 
316 			st0_tag =
317 			    FPU_round(st0_ptr, 1, 0, FULL_PRECISION, arg_sign);
318 			FPU_settag0(st0_tag);
319 		}
320 		push();
321 		FPU_copy_to_reg0(&CONST_1, TAG_Valid);
322 		return;
323 	}
324 
325 	if (st0_tag == TAG_Zero) {
326 		push();
327 		FPU_copy_to_reg0(&CONST_1, TAG_Valid);
328 		setcc(0);
329 		return;
330 	}
331 
332 	if (st0_tag == TAG_Special)
333 		st0_tag = FPU_Special(st0_ptr);
334 
335 	if (st0_tag == TW_Denormal) {
336 		if (denormal_operand() < 0)
337 			return;
338 
339 		goto denormal_arg;
340 	}
341 
342 	if (st0_tag == TW_Infinity) {
343 		/* The 80486 treats infinity as an invalid operand */
344 		if (arith_invalid(0) >= 0) {
345 			st_new_ptr = &st(-1);
346 			push();
347 			arith_invalid(0);
348 		}
349 		return;
350 	}
351 
352 	single_arg_2_error(st0_ptr, st0_tag);
353 }
354 
355 static void fxtract(FPU_REG *st0_ptr, u_char st0_tag)
356 {
357 	FPU_REG *st_new_ptr;
358 	u_char sign;
359 	register FPU_REG *st1_ptr = st0_ptr;	/* anticipate */
360 
361 	if (STACK_OVERFLOW) {
362 		FPU_stack_overflow();
363 		return;
364 	}
365 
366 	clear_C1();
367 
368 	if (st0_tag == TAG_Valid) {
369 		long e;
370 
371 		push();
372 		sign = getsign(st1_ptr);
373 		reg_copy(st1_ptr, st_new_ptr);
374 		setexponent16(st_new_ptr, exponent(st_new_ptr));
375 
376 	      denormal_arg:
377 
378 		e = exponent16(st_new_ptr);
379 		convert_l2reg(&e, 1);
380 		setexponentpos(st_new_ptr, 0);
381 		setsign(st_new_ptr, sign);
382 		FPU_settag0(TAG_Valid);	/* Needed if arg was a denormal */
383 		return;
384 	} else if (st0_tag == TAG_Zero) {
385 		sign = getsign(st0_ptr);
386 
387 		if (FPU_divide_by_zero(0, SIGN_NEG) < 0)
388 			return;
389 
390 		push();
391 		FPU_copy_to_reg0(&CONST_Z, TAG_Zero);
392 		setsign(st_new_ptr, sign);
393 		return;
394 	}
395 
396 	if (st0_tag == TAG_Special)
397 		st0_tag = FPU_Special(st0_ptr);
398 
399 	if (st0_tag == TW_Denormal) {
400 		if (denormal_operand() < 0)
401 			return;
402 
403 		push();
404 		sign = getsign(st1_ptr);
405 		FPU_to_exp16(st1_ptr, st_new_ptr);
406 		goto denormal_arg;
407 	} else if (st0_tag == TW_Infinity) {
408 		sign = getsign(st0_ptr);
409 		setpositive(st0_ptr);
410 		push();
411 		FPU_copy_to_reg0(&CONST_INF, TAG_Special);
412 		setsign(st_new_ptr, sign);
413 		return;
414 	} else if (st0_tag == TW_NaN) {
415 		if (real_1op_NaN(st0_ptr) < 0)
416 			return;
417 
418 		push();
419 		FPU_copy_to_reg0(st0_ptr, TAG_Special);
420 		return;
421 	} else if (st0_tag == TAG_Empty) {
422 		/* Is this the correct behaviour? */
423 		if (control_word & EX_Invalid) {
424 			FPU_stack_underflow();
425 			push();
426 			FPU_stack_underflow();
427 		} else
428 			EXCEPTION(EX_StackUnder);
429 	}
430 #ifdef PARANOID
431 	else
432 		EXCEPTION(EX_INTERNAL | 0x119);
433 #endif /* PARANOID */
434 }
435 
436 static void fdecstp(void)
437 {
438 	clear_C1();
439 	top--;
440 }
441 
442 static void fincstp(void)
443 {
444 	clear_C1();
445 	top++;
446 }
447 
448 static void fsqrt_(FPU_REG *st0_ptr, u_char st0_tag)
449 {
450 	int expon;
451 
452 	clear_C1();
453 
454 	if (st0_tag == TAG_Valid) {
455 		u_char tag;
456 
457 		if (signnegative(st0_ptr)) {
458 			arith_invalid(0);	/* sqrt(negative) is invalid */
459 			return;
460 		}
461 
462 		/* make st(0) in  [1.0 .. 4.0) */
463 		expon = exponent(st0_ptr);
464 
465 	      denormal_arg:
466 
467 		setexponent16(st0_ptr, (expon & 1));
468 
469 		/* Do the computation, the sign of the result will be positive. */
470 		tag = wm_sqrt(st0_ptr, 0, 0, control_word, SIGN_POS);
471 		addexponent(st0_ptr, expon >> 1);
472 		FPU_settag0(tag);
473 		return;
474 	}
475 
476 	if (st0_tag == TAG_Zero)
477 		return;
478 
479 	if (st0_tag == TAG_Special)
480 		st0_tag = FPU_Special(st0_ptr);
481 
482 	if (st0_tag == TW_Infinity) {
483 		if (signnegative(st0_ptr))
484 			arith_invalid(0);	/* sqrt(-Infinity) is invalid */
485 		return;
486 	} else if (st0_tag == TW_Denormal) {
487 		if (signnegative(st0_ptr)) {
488 			arith_invalid(0);	/* sqrt(negative) is invalid */
489 			return;
490 		}
491 
492 		if (denormal_operand() < 0)
493 			return;
494 
495 		FPU_to_exp16(st0_ptr, st0_ptr);
496 
497 		expon = exponent16(st0_ptr);
498 
499 		goto denormal_arg;
500 	}
501 
502 	single_arg_error(st0_ptr, st0_tag);
503 
504 }
505 
506 static void frndint_(FPU_REG *st0_ptr, u_char st0_tag)
507 {
508 	int flags, tag;
509 
510 	if (st0_tag == TAG_Valid) {
511 		u_char sign;
512 
513 	      denormal_arg:
514 
515 		sign = getsign(st0_ptr);
516 
517 		if (exponent(st0_ptr) > 63)
518 			return;
519 
520 		if (st0_tag == TW_Denormal) {
521 			if (denormal_operand() < 0)
522 				return;
523 		}
524 
525 		/* Fortunately, this can't overflow to 2^64 */
526 		if ((flags = FPU_round_to_int(st0_ptr, st0_tag)))
527 			set_precision_flag(flags);
528 
529 		setexponent16(st0_ptr, 63);
530 		tag = FPU_normalize(st0_ptr);
531 		setsign(st0_ptr, sign);
532 		FPU_settag0(tag);
533 		return;
534 	}
535 
536 	if (st0_tag == TAG_Zero)
537 		return;
538 
539 	if (st0_tag == TAG_Special)
540 		st0_tag = FPU_Special(st0_ptr);
541 
542 	if (st0_tag == TW_Denormal)
543 		goto denormal_arg;
544 	else if (st0_tag == TW_Infinity)
545 		return;
546 	else
547 		single_arg_error(st0_ptr, st0_tag);
548 }
549 
550 static int f_sin(FPU_REG *st0_ptr, u_char tag)
551 {
552 	u_char arg_sign = getsign(st0_ptr);
553 
554 	if (tag == TAG_Valid) {
555 		int q;
556 
557 		if (exponent(st0_ptr) > -40) {
558 			if ((q = trig_arg(st0_ptr, 0)) == -1) {
559 				/* Operand is out of range */
560 				return 1;
561 			}
562 
563 			poly_sine(st0_ptr);
564 
565 			if (q & 2)
566 				changesign(st0_ptr);
567 
568 			setsign(st0_ptr, getsign(st0_ptr) ^ arg_sign);
569 
570 			/* We do not really know if up or down */
571 			set_precision_flag_up();
572 			return 0;
573 		} else {
574 			/* For a small arg, the result == the argument */
575 			set_precision_flag_up();	/* Must be up. */
576 			return 0;
577 		}
578 	}
579 
580 	if (tag == TAG_Zero) {
581 		setcc(0);
582 		return 0;
583 	}
584 
585 	if (tag == TAG_Special)
586 		tag = FPU_Special(st0_ptr);
587 
588 	if (tag == TW_Denormal) {
589 		if (denormal_operand() < 0)
590 			return 1;
591 
592 		/* For a small arg, the result == the argument */
593 		/* Underflow may happen */
594 		FPU_to_exp16(st0_ptr, st0_ptr);
595 
596 		tag = FPU_round(st0_ptr, 1, 0, FULL_PRECISION, arg_sign);
597 
598 		FPU_settag0(tag);
599 
600 		return 0;
601 	} else if (tag == TW_Infinity) {
602 		/* The 80486 treats infinity as an invalid operand */
603 		arith_invalid(0);
604 		return 1;
605 	} else {
606 		single_arg_error(st0_ptr, tag);
607 		return 1;
608 	}
609 }
610 
611 static void fsin(FPU_REG *st0_ptr, u_char tag)
612 {
613 	f_sin(st0_ptr, tag);
614 }
615 
616 static int f_cos(FPU_REG *st0_ptr, u_char tag)
617 {
618 	u_char st0_sign;
619 
620 	st0_sign = getsign(st0_ptr);
621 
622 	if (tag == TAG_Valid) {
623 		int q;
624 
625 		if (exponent(st0_ptr) > -40) {
626 			if ((exponent(st0_ptr) < 0)
627 			    || ((exponent(st0_ptr) == 0)
628 				&& (significand(st0_ptr) <=
629 				    0xc90fdaa22168c234LL))) {
630 				poly_cos(st0_ptr);
631 
632 				/* We do not really know if up or down */
633 				set_precision_flag_down();
634 
635 				return 0;
636 			} else if ((q = trig_arg(st0_ptr, FCOS)) != -1) {
637 				poly_sine(st0_ptr);
638 
639 				if ((q + 1) & 2)
640 					changesign(st0_ptr);
641 
642 				/* We do not really know if up or down */
643 				set_precision_flag_down();
644 
645 				return 0;
646 			} else {
647 				/* Operand is out of range */
648 				return 1;
649 			}
650 		} else {
651 		      denormal_arg:
652 
653 			setcc(0);
654 			FPU_copy_to_reg0(&CONST_1, TAG_Valid);
655 #ifdef PECULIAR_486
656 			set_precision_flag_down();	/* 80486 appears to do this. */
657 #else
658 			set_precision_flag_up();	/* Must be up. */
659 #endif /* PECULIAR_486 */
660 			return 0;
661 		}
662 	} else if (tag == TAG_Zero) {
663 		FPU_copy_to_reg0(&CONST_1, TAG_Valid);
664 		setcc(0);
665 		return 0;
666 	}
667 
668 	if (tag == TAG_Special)
669 		tag = FPU_Special(st0_ptr);
670 
671 	if (tag == TW_Denormal) {
672 		if (denormal_operand() < 0)
673 			return 1;
674 
675 		goto denormal_arg;
676 	} else if (tag == TW_Infinity) {
677 		/* The 80486 treats infinity as an invalid operand */
678 		arith_invalid(0);
679 		return 1;
680 	} else {
681 		single_arg_error(st0_ptr, tag);	/* requires st0_ptr == &st(0) */
682 		return 1;
683 	}
684 }
685 
686 static void fcos(FPU_REG *st0_ptr, u_char st0_tag)
687 {
688 	f_cos(st0_ptr, st0_tag);
689 }
690 
691 static void fsincos(FPU_REG *st0_ptr, u_char st0_tag)
692 {
693 	FPU_REG *st_new_ptr;
694 	FPU_REG arg;
695 	u_char tag;
696 
697 	/* Stack underflow has higher priority */
698 	if (st0_tag == TAG_Empty) {
699 		FPU_stack_underflow();	/* Puts a QNaN in st(0) */
700 		if (control_word & CW_Invalid) {
701 			st_new_ptr = &st(-1);
702 			push();
703 			FPU_stack_underflow();	/* Puts a QNaN in the new st(0) */
704 		}
705 		return;
706 	}
707 
708 	if (STACK_OVERFLOW) {
709 		FPU_stack_overflow();
710 		return;
711 	}
712 
713 	if (st0_tag == TAG_Special)
714 		tag = FPU_Special(st0_ptr);
715 	else
716 		tag = st0_tag;
717 
718 	if (tag == TW_NaN) {
719 		single_arg_2_error(st0_ptr, TW_NaN);
720 		return;
721 	} else if (tag == TW_Infinity) {
722 		/* The 80486 treats infinity as an invalid operand */
723 		if (arith_invalid(0) >= 0) {
724 			/* Masked response */
725 			push();
726 			arith_invalid(0);
727 		}
728 		return;
729 	}
730 
731 	reg_copy(st0_ptr, &arg);
732 	if (!f_sin(st0_ptr, st0_tag)) {
733 		push();
734 		FPU_copy_to_reg0(&arg, st0_tag);
735 		f_cos(&st(0), st0_tag);
736 	} else {
737 		/* An error, so restore st(0) */
738 		FPU_copy_to_reg0(&arg, st0_tag);
739 	}
740 }
741 
742 /*---------------------------------------------------------------------------*/
743 /* The following all require two arguments: st(0) and st(1) */
744 
/*
 * rem_kernel() - 64 bit multiply-and-subtract kernel for the remainder
 * computations.
 *
 * Stores (st0 << n) - st1 * q, evaluated modulo 2^64, in *y.
 *
 * This relies upon the division and rounding to an integer done by the
 * caller giving an exact quotient q.  Because of this only the least
 * significant 64 bits need to be computed; the more significant bits of
 * the true result must be zero.
 *
 * @st0: significand of the dividend
 * @y:   receives the significand of the remainder
 * @st1: significand of the divisor
 * @q:   integer quotient
 * @n:   left shift applied to @st0; the caller must ensure 0 <= n < 64
 *
 * Written as plain unsigned arithmetic, which wraps modulo 2^64 and is
 * exactly what the three 32x32 multiply/subtract steps of a hand-coded
 * version produce, without depending on inline assembly operand
 * constraints or on type-punning the 64 bit values.
 */
static void rem_kernel(unsigned long long st0, unsigned long long *y,
		       unsigned long long st1, unsigned long long q, int n)
{
	*y = (st0 << n) - st1 * q;
}
780 
781 /* Remainder of st(0) / st(1) */
782 /* This routine produces exact results, i.e. there is never any
783    rounding or truncation, etc of the result. */
784 static void do_fprem(FPU_REG *st0_ptr, u_char st0_tag, int round)
785 {
786 	FPU_REG *st1_ptr = &st(1);
787 	u_char st1_tag = FPU_gettagi(1);
788 
789 	if (!((st0_tag ^ TAG_Valid) | (st1_tag ^ TAG_Valid))) {
790 		FPU_REG tmp, st0, st1;
791 		u_char st0_sign, st1_sign;
792 		u_char tmptag;
793 		int tag;
794 		int old_cw;
795 		int expdif;
796 		long long q;
797 		unsigned short saved_status;
798 		int cc;
799 
800 	      fprem_valid:
801 		/* Convert registers for internal use. */
802 		st0_sign = FPU_to_exp16(st0_ptr, &st0);
803 		st1_sign = FPU_to_exp16(st1_ptr, &st1);
804 		expdif = exponent16(&st0) - exponent16(&st1);
805 
806 		old_cw = control_word;
807 		cc = 0;
808 
809 		/* We want the status following the denorm tests, but don't want
810 		   the status changed by the arithmetic operations. */
811 		saved_status = partial_status;
812 		control_word &= ~CW_RC;
813 		control_word |= RC_CHOP;
814 
815 		if (expdif < 64) {
816 			/* This should be the most common case */
817 
818 			if (expdif > -2) {
819 				u_char sign = st0_sign ^ st1_sign;
820 				tag = FPU_u_div(&st0, &st1, &tmp,
821 						PR_64_BITS | RC_CHOP | 0x3f,
822 						sign);
823 				setsign(&tmp, sign);
824 
825 				if (exponent(&tmp) >= 0) {
826 					FPU_round_to_int(&tmp, tag);	/* Fortunately, this can't
827 									   overflow to 2^64 */
828 					q = significand(&tmp);
829 
830 					rem_kernel(significand(&st0),
831 						   &significand(&tmp),
832 						   significand(&st1),
833 						   q, expdif);
834 
835 					setexponent16(&tmp, exponent16(&st1));
836 				} else {
837 					reg_copy(&st0, &tmp);
838 					q = 0;
839 				}
840 
841 				if ((round == RC_RND)
842 				    && (tmp.sigh & 0xc0000000)) {
843 					/* We may need to subtract st(1) once more,
844 					   to get a result <= 1/2 of st(1). */
845 					unsigned long long x;
846 					expdif =
847 					    exponent16(&st1) - exponent16(&tmp);
848 					if (expdif <= 1) {
849 						if (expdif == 0)
850 							x = significand(&st1) -
851 							    significand(&tmp);
852 						else	/* expdif is 1 */
853 							x = (significand(&st1)
854 							     << 1) -
855 							    significand(&tmp);
856 						if ((x < significand(&tmp)) ||
857 						    /* or equi-distant (from 0 & st(1)) and q is odd */
858 						    ((x == significand(&tmp))
859 						     && (q & 1))) {
860 							st0_sign = !st0_sign;
861 							significand(&tmp) = x;
862 							q++;
863 						}
864 					}
865 				}
866 
867 				if (q & 4)
868 					cc |= SW_C0;
869 				if (q & 2)
870 					cc |= SW_C3;
871 				if (q & 1)
872 					cc |= SW_C1;
873 			} else {
874 				control_word = old_cw;
875 				setcc(0);
876 				return;
877 			}
878 		} else {
879 			/* There is a large exponent difference ( >= 64 ) */
880 			/* To make much sense, the code in this section should
881 			   be done at high precision. */
882 			int exp_1, N;
883 			u_char sign;
884 
885 			/* prevent overflow here */
886 			/* N is 'a number between 32 and 63' (p26-113) */
887 			reg_copy(&st0, &tmp);
888 			tmptag = st0_tag;
889 			N = (expdif & 0x0000001f) + 32;	/* This choice gives results
890 							   identical to an AMD 486 */
891 			setexponent16(&tmp, N);
892 			exp_1 = exponent16(&st1);
893 			setexponent16(&st1, 0);
894 			expdif -= N;
895 
896 			sign = getsign(&tmp) ^ st1_sign;
897 			tag =
898 			    FPU_u_div(&tmp, &st1, &tmp,
899 				      PR_64_BITS | RC_CHOP | 0x3f, sign);
900 			setsign(&tmp, sign);
901 
902 			FPU_round_to_int(&tmp, tag);	/* Fortunately, this can't
903 							   overflow to 2^64 */
904 
905 			rem_kernel(significand(&st0),
906 				   &significand(&tmp),
907 				   significand(&st1),
908 				   significand(&tmp), exponent(&tmp)
909 			    );
910 			setexponent16(&tmp, exp_1 + expdif);
911 
912 			/* It is possible for the operation to be complete here.
913 			   What does the IEEE standard say? The Intel 80486 manual
914 			   implies that the operation will never be completed at this
915 			   point, and the behaviour of a real 80486 confirms this.
916 			 */
917 			if (!(tmp.sigh | tmp.sigl)) {
918 				/* The result is zero */
919 				control_word = old_cw;
920 				partial_status = saved_status;
921 				FPU_copy_to_reg0(&CONST_Z, TAG_Zero);
922 				setsign(&st0, st0_sign);
923 #ifdef PECULIAR_486
924 				setcc(SW_C2);
925 #else
926 				setcc(0);
927 #endif /* PECULIAR_486 */
928 				return;
929 			}
930 			cc = SW_C2;
931 		}
932 
933 		control_word = old_cw;
934 		partial_status = saved_status;
935 		tag = FPU_normalize_nuo(&tmp);
936 		reg_copy(&tmp, st0_ptr);
937 
938 		/* The only condition to be looked for is underflow,
939 		   and it can occur here only if underflow is unmasked. */
940 		if ((exponent16(&tmp) <= EXP_UNDER) && (tag != TAG_Zero)
941 		    && !(control_word & CW_Underflow)) {
942 			setcc(cc);
943 			tag = arith_underflow(st0_ptr);
944 			setsign(st0_ptr, st0_sign);
945 			FPU_settag0(tag);
946 			return;
947 		} else if ((exponent16(&tmp) > EXP_UNDER) || (tag == TAG_Zero)) {
948 			stdexp(st0_ptr);
949 			setsign(st0_ptr, st0_sign);
950 		} else {
951 			tag =
952 			    FPU_round(st0_ptr, 0, 0, FULL_PRECISION, st0_sign);
953 		}
954 		FPU_settag0(tag);
955 		setcc(cc);
956 
957 		return;
958 	}
959 
960 	if (st0_tag == TAG_Special)
961 		st0_tag = FPU_Special(st0_ptr);
962 	if (st1_tag == TAG_Special)
963 		st1_tag = FPU_Special(st1_ptr);
964 
965 	if (((st0_tag == TAG_Valid) && (st1_tag == TW_Denormal))
966 	    || ((st0_tag == TW_Denormal) && (st1_tag == TAG_Valid))
967 	    || ((st0_tag == TW_Denormal) && (st1_tag == TW_Denormal))) {
968 		if (denormal_operand() < 0)
969 			return;
970 		goto fprem_valid;
971 	} else if ((st0_tag == TAG_Empty) || (st1_tag == TAG_Empty)) {
972 		FPU_stack_underflow();
973 		return;
974 	} else if (st0_tag == TAG_Zero) {
975 		if (st1_tag == TAG_Valid) {
976 			setcc(0);
977 			return;
978 		} else if (st1_tag == TW_Denormal) {
979 			if (denormal_operand() < 0)
980 				return;
981 			setcc(0);
982 			return;
983 		} else if (st1_tag == TAG_Zero) {
984 			arith_invalid(0);
985 			return;
986 		} /* fprem(?,0) always invalid */
987 		else if (st1_tag == TW_Infinity) {
988 			setcc(0);
989 			return;
990 		}
991 	} else if ((st0_tag == TAG_Valid) || (st0_tag == TW_Denormal)) {
992 		if (st1_tag == TAG_Zero) {
993 			arith_invalid(0);	/* fprem(Valid,Zero) is invalid */
994 			return;
995 		} else if (st1_tag != TW_NaN) {
996 			if (((st0_tag == TW_Denormal)
997 			     || (st1_tag == TW_Denormal))
998 			    && (denormal_operand() < 0))
999 				return;
1000 
1001 			if (st1_tag == TW_Infinity) {
1002 				/* fprem(Valid,Infinity) is o.k. */
1003 				setcc(0);
1004 				return;
1005 			}
1006 		}
1007 	} else if (st0_tag == TW_Infinity) {
1008 		if (st1_tag != TW_NaN) {
1009 			arith_invalid(0);	/* fprem(Infinity,?) is invalid */
1010 			return;
1011 		}
1012 	}
1013 
1014 	/* One of the registers must contain a NaN if we got here. */
1015 
1016 #ifdef PARANOID
1017 	if ((st0_tag != TW_NaN) && (st1_tag != TW_NaN))
1018 		EXCEPTION(EX_INTERNAL | 0x118);
1019 #endif /* PARANOID */
1020 
1021 	real_2op_NaN(st1_ptr, st1_tag, 0, st1_ptr);
1022 
1023 }
1024 
1025 /* ST(1) <- ST(1) * log ST;  pop ST */
1026 static void fyl2x(FPU_REG *st0_ptr, u_char st0_tag)
1027 {
1028 	FPU_REG *st1_ptr = &st(1), exponent;
1029 	u_char st1_tag = FPU_gettagi(1);
1030 	u_char sign;
1031 	int e, tag;
1032 
1033 	clear_C1();
1034 
1035 	if ((st0_tag == TAG_Valid) && (st1_tag == TAG_Valid)) {
1036 	      both_valid:
1037 		/* Both regs are Valid or Denormal */
1038 		if (signpositive(st0_ptr)) {
1039 			if (st0_tag == TW_Denormal)
1040 				FPU_to_exp16(st0_ptr, st0_ptr);
1041 			else
1042 				/* Convert st(0) for internal use. */
1043 				setexponent16(st0_ptr, exponent(st0_ptr));
1044 
1045 			if ((st0_ptr->sigh == 0x80000000)
1046 			    && (st0_ptr->sigl == 0)) {
1047 				/* Special case. The result can be precise. */
1048 				u_char esign;
1049 				e = exponent16(st0_ptr);
1050 				if (e >= 0) {
1051 					exponent.sigh = e;
1052 					esign = SIGN_POS;
1053 				} else {
1054 					exponent.sigh = -e;
1055 					esign = SIGN_NEG;
1056 				}
1057 				exponent.sigl = 0;
1058 				setexponent16(&exponent, 31);
1059 				tag = FPU_normalize_nuo(&exponent);
1060 				stdexp(&exponent);
1061 				setsign(&exponent, esign);
1062 				tag =
1063 				    FPU_mul(&exponent, tag, 1, FULL_PRECISION);
1064 				if (tag >= 0)
1065 					FPU_settagi(1, tag);
1066 			} else {
1067 				/* The usual case */
1068 				sign = getsign(st1_ptr);
1069 				if (st1_tag == TW_Denormal)
1070 					FPU_to_exp16(st1_ptr, st1_ptr);
1071 				else
1072 					/* Convert st(1) for internal use. */
1073 					setexponent16(st1_ptr,
1074 						      exponent(st1_ptr));
1075 				poly_l2(st0_ptr, st1_ptr, sign);
1076 			}
1077 		} else {
1078 			/* negative */
1079 			if (arith_invalid(1) < 0)
1080 				return;
1081 		}
1082 
1083 		FPU_pop();
1084 
1085 		return;
1086 	}
1087 
1088 	if (st0_tag == TAG_Special)
1089 		st0_tag = FPU_Special(st0_ptr);
1090 	if (st1_tag == TAG_Special)
1091 		st1_tag = FPU_Special(st1_ptr);
1092 
1093 	if ((st0_tag == TAG_Empty) || (st1_tag == TAG_Empty)) {
1094 		FPU_stack_underflow_pop(1);
1095 		return;
1096 	} else if ((st0_tag <= TW_Denormal) && (st1_tag <= TW_Denormal)) {
1097 		if (st0_tag == TAG_Zero) {
1098 			if (st1_tag == TAG_Zero) {
1099 				/* Both args zero is invalid */
1100 				if (arith_invalid(1) < 0)
1101 					return;
1102 			} else {
1103 				u_char sign;
1104 				sign = getsign(st1_ptr) ^ SIGN_NEG;
1105 				if (FPU_divide_by_zero(1, sign) < 0)
1106 					return;
1107 
1108 				setsign(st1_ptr, sign);
1109 			}
1110 		} else if (st1_tag == TAG_Zero) {
1111 			/* st(1) contains zero, st(0) valid <> 0 */
1112 			/* Zero is the valid answer */
1113 			sign = getsign(st1_ptr);
1114 
1115 			if (signnegative(st0_ptr)) {
1116 				/* log(negative) */
1117 				if (arith_invalid(1) < 0)
1118 					return;
1119 			} else if ((st0_tag == TW_Denormal)
1120 				   && (denormal_operand() < 0))
1121 				return;
1122 			else {
1123 				if (exponent(st0_ptr) < 0)
1124 					sign ^= SIGN_NEG;
1125 
1126 				FPU_copy_to_reg1(&CONST_Z, TAG_Zero);
1127 				setsign(st1_ptr, sign);
1128 			}
1129 		} else {
1130 			/* One or both operands are denormals. */
1131 			if (denormal_operand() < 0)
1132 				return;
1133 			goto both_valid;
1134 		}
1135 	} else if ((st0_tag == TW_NaN) || (st1_tag == TW_NaN)) {
1136 		if (real_2op_NaN(st0_ptr, st0_tag, 1, st0_ptr) < 0)
1137 			return;
1138 	}
1139 	/* One or both arg must be an infinity */
1140 	else if (st0_tag == TW_Infinity) {
1141 		if ((signnegative(st0_ptr)) || (st1_tag == TAG_Zero)) {
1142 			/* log(-infinity) or 0*log(infinity) */
1143 			if (arith_invalid(1) < 0)
1144 				return;
1145 		} else {
1146 			u_char sign = getsign(st1_ptr);
1147 
1148 			if ((st1_tag == TW_Denormal)
1149 			    && (denormal_operand() < 0))
1150 				return;
1151 
1152 			FPU_copy_to_reg1(&CONST_INF, TAG_Special);
1153 			setsign(st1_ptr, sign);
1154 		}
1155 	}
1156 	/* st(1) must be infinity here */
1157 	else if (((st0_tag == TAG_Valid) || (st0_tag == TW_Denormal))
1158 		 && (signpositive(st0_ptr))) {
1159 		if (exponent(st0_ptr) >= 0) {
1160 			if ((exponent(st0_ptr) == 0) &&
1161 			    (st0_ptr->sigh == 0x80000000) &&
1162 			    (st0_ptr->sigl == 0)) {
1163 				/* st(0) holds 1.0 */
1164 				/* infinity*log(1) */
1165 				if (arith_invalid(1) < 0)
1166 					return;
1167 			}
1168 			/* else st(0) is positive and > 1.0 */
1169 		} else {
1170 			/* st(0) is positive and < 1.0 */
1171 
1172 			if ((st0_tag == TW_Denormal)
1173 			    && (denormal_operand() < 0))
1174 				return;
1175 
1176 			changesign(st1_ptr);
1177 		}
1178 	} else {
1179 		/* st(0) must be zero or negative */
1180 		if (st0_tag == TAG_Zero) {
1181 			/* This should be invalid, but a real 80486 is happy with it. */
1182 
1183 #ifndef PECULIAR_486
1184 			sign = getsign(st1_ptr);
1185 			if (FPU_divide_by_zero(1, sign) < 0)
1186 				return;
1187 #endif /* PECULIAR_486 */
1188 
1189 			changesign(st1_ptr);
1190 		} else if (arith_invalid(1) < 0)	/* log(negative) */
1191 			return;
1192 	}
1193 
1194 	FPU_pop();
1195 }
1196 
1197 static void fpatan(FPU_REG *st0_ptr, u_char st0_tag)
1198 {
1199 	FPU_REG *st1_ptr = &st(1);
1200 	u_char st1_tag = FPU_gettagi(1);
1201 	int tag;
1202 
1203 	clear_C1();
1204 	if (!((st0_tag ^ TAG_Valid) | (st1_tag ^ TAG_Valid))) {
1205 	      valid_atan:
1206 
1207 		poly_atan(st0_ptr, st0_tag, st1_ptr, st1_tag);
1208 
1209 		FPU_pop();
1210 
1211 		return;
1212 	}
1213 
1214 	if (st0_tag == TAG_Special)
1215 		st0_tag = FPU_Special(st0_ptr);
1216 	if (st1_tag == TAG_Special)
1217 		st1_tag = FPU_Special(st1_ptr);
1218 
1219 	if (((st0_tag == TAG_Valid) && (st1_tag == TW_Denormal))
1220 	    || ((st0_tag == TW_Denormal) && (st1_tag == TAG_Valid))
1221 	    || ((st0_tag == TW_Denormal) && (st1_tag == TW_Denormal))) {
1222 		if (denormal_operand() < 0)
1223 			return;
1224 
1225 		goto valid_atan;
1226 	} else if ((st0_tag == TAG_Empty) || (st1_tag == TAG_Empty)) {
1227 		FPU_stack_underflow_pop(1);
1228 		return;
1229 	} else if ((st0_tag == TW_NaN) || (st1_tag == TW_NaN)) {
1230 		if (real_2op_NaN(st0_ptr, st0_tag, 1, st0_ptr) >= 0)
1231 			FPU_pop();
1232 		return;
1233 	} else if ((st0_tag == TW_Infinity) || (st1_tag == TW_Infinity)) {
1234 		u_char sign = getsign(st1_ptr);
1235 		if (st0_tag == TW_Infinity) {
1236 			if (st1_tag == TW_Infinity) {
1237 				if (signpositive(st0_ptr)) {
1238 					FPU_copy_to_reg1(&CONST_PI4, TAG_Valid);
1239 				} else {
1240 					setpositive(st1_ptr);
1241 					tag =
1242 					    FPU_u_add(&CONST_PI4, &CONST_PI2,
1243 						      st1_ptr, FULL_PRECISION,
1244 						      SIGN_POS,
1245 						      exponent(&CONST_PI4),
1246 						      exponent(&CONST_PI2));
1247 					if (tag >= 0)
1248 						FPU_settagi(1, tag);
1249 				}
1250 			} else {
1251 				if ((st1_tag == TW_Denormal)
1252 				    && (denormal_operand() < 0))
1253 					return;
1254 
1255 				if (signpositive(st0_ptr)) {
1256 					FPU_copy_to_reg1(&CONST_Z, TAG_Zero);
1257 					setsign(st1_ptr, sign);	/* An 80486 preserves the sign */
1258 					FPU_pop();
1259 					return;
1260 				} else {
1261 					FPU_copy_to_reg1(&CONST_PI, TAG_Valid);
1262 				}
1263 			}
1264 		} else {
1265 			/* st(1) is infinity, st(0) not infinity */
1266 			if ((st0_tag == TW_Denormal)
1267 			    && (denormal_operand() < 0))
1268 				return;
1269 
1270 			FPU_copy_to_reg1(&CONST_PI2, TAG_Valid);
1271 		}
1272 		setsign(st1_ptr, sign);
1273 	} else if (st1_tag == TAG_Zero) {
1274 		/* st(0) must be valid or zero */
1275 		u_char sign = getsign(st1_ptr);
1276 
1277 		if ((st0_tag == TW_Denormal) && (denormal_operand() < 0))
1278 			return;
1279 
1280 		if (signpositive(st0_ptr)) {
1281 			/* An 80486 preserves the sign */
1282 			FPU_pop();
1283 			return;
1284 		}
1285 
1286 		FPU_copy_to_reg1(&CONST_PI, TAG_Valid);
1287 		setsign(st1_ptr, sign);
1288 	} else if (st0_tag == TAG_Zero) {
1289 		/* st(1) must be TAG_Valid here */
1290 		u_char sign = getsign(st1_ptr);
1291 
1292 		if ((st1_tag == TW_Denormal) && (denormal_operand() < 0))
1293 			return;
1294 
1295 		FPU_copy_to_reg1(&CONST_PI2, TAG_Valid);
1296 		setsign(st1_ptr, sign);
1297 	}
1298 #ifdef PARANOID
1299 	else
1300 		EXCEPTION(EX_INTERNAL | 0x125);
1301 #endif /* PARANOID */
1302 
1303 	FPU_pop();
1304 	set_precision_flag_up();	/* We do not really know if up or down */
1305 }
1306 
1307 static void fprem(FPU_REG *st0_ptr, u_char st0_tag)
1308 {
1309 	do_fprem(st0_ptr, st0_tag, RC_CHOP);
1310 }
1311 
1312 static void fprem1(FPU_REG *st0_ptr, u_char st0_tag)
1313 {
1314 	do_fprem(st0_ptr, st0_tag, RC_RND);
1315 }
1316 
1317 static void fyl2xp1(FPU_REG *st0_ptr, u_char st0_tag)
1318 {
1319 	u_char sign, sign1;
1320 	FPU_REG *st1_ptr = &st(1), a, b;
1321 	u_char st1_tag = FPU_gettagi(1);
1322 
1323 	clear_C1();
1324 	if (!((st0_tag ^ TAG_Valid) | (st1_tag ^ TAG_Valid))) {
1325 	      valid_yl2xp1:
1326 
1327 		sign = getsign(st0_ptr);
1328 		sign1 = getsign(st1_ptr);
1329 
1330 		FPU_to_exp16(st0_ptr, &a);
1331 		FPU_to_exp16(st1_ptr, &b);
1332 
1333 		if (poly_l2p1(sign, sign1, &a, &b, st1_ptr))
1334 			return;
1335 
1336 		FPU_pop();
1337 		return;
1338 	}
1339 
1340 	if (st0_tag == TAG_Special)
1341 		st0_tag = FPU_Special(st0_ptr);
1342 	if (st1_tag == TAG_Special)
1343 		st1_tag = FPU_Special(st1_ptr);
1344 
1345 	if (((st0_tag == TAG_Valid) && (st1_tag == TW_Denormal))
1346 	    || ((st0_tag == TW_Denormal) && (st1_tag == TAG_Valid))
1347 	    || ((st0_tag == TW_Denormal) && (st1_tag == TW_Denormal))) {
1348 		if (denormal_operand() < 0)
1349 			return;
1350 
1351 		goto valid_yl2xp1;
1352 	} else if ((st0_tag == TAG_Empty) | (st1_tag == TAG_Empty)) {
1353 		FPU_stack_underflow_pop(1);
1354 		return;
1355 	} else if (st0_tag == TAG_Zero) {
1356 		switch (st1_tag) {
1357 		case TW_Denormal:
1358 			if (denormal_operand() < 0)
1359 				return;
1360 			fallthrough;
1361 		case TAG_Zero:
1362 		case TAG_Valid:
1363 			setsign(st0_ptr, getsign(st0_ptr) ^ getsign(st1_ptr));
1364 			FPU_copy_to_reg1(st0_ptr, st0_tag);
1365 			break;
1366 
1367 		case TW_Infinity:
1368 			/* Infinity*log(1) */
1369 			if (arith_invalid(1) < 0)
1370 				return;
1371 			break;
1372 
1373 		case TW_NaN:
1374 			if (real_2op_NaN(st0_ptr, st0_tag, 1, st0_ptr) < 0)
1375 				return;
1376 			break;
1377 
1378 		default:
1379 #ifdef PARANOID
1380 			EXCEPTION(EX_INTERNAL | 0x116);
1381 			return;
1382 #endif /* PARANOID */
1383 			break;
1384 		}
1385 	} else if ((st0_tag == TAG_Valid) || (st0_tag == TW_Denormal)) {
1386 		switch (st1_tag) {
1387 		case TAG_Zero:
1388 			if (signnegative(st0_ptr)) {
1389 				if (exponent(st0_ptr) >= 0) {
1390 					/* st(0) holds <= -1.0 */
1391 #ifdef PECULIAR_486		/* Stupid 80486 doesn't worry about log(negative). */
1392 					changesign(st1_ptr);
1393 #else
1394 					if (arith_invalid(1) < 0)
1395 						return;
1396 #endif /* PECULIAR_486 */
1397 				} else if ((st0_tag == TW_Denormal)
1398 					   && (denormal_operand() < 0))
1399 					return;
1400 				else
1401 					changesign(st1_ptr);
1402 			} else if ((st0_tag == TW_Denormal)
1403 				   && (denormal_operand() < 0))
1404 				return;
1405 			break;
1406 
1407 		case TW_Infinity:
1408 			if (signnegative(st0_ptr)) {
1409 				if ((exponent(st0_ptr) >= 0) &&
1410 				    !((st0_ptr->sigh == 0x80000000) &&
1411 				      (st0_ptr->sigl == 0))) {
1412 					/* st(0) holds < -1.0 */
1413 #ifdef PECULIAR_486		/* Stupid 80486 doesn't worry about log(negative). */
1414 					changesign(st1_ptr);
1415 #else
1416 					if (arith_invalid(1) < 0)
1417 						return;
1418 #endif /* PECULIAR_486 */
1419 				} else if ((st0_tag == TW_Denormal)
1420 					   && (denormal_operand() < 0))
1421 					return;
1422 				else
1423 					changesign(st1_ptr);
1424 			} else if ((st0_tag == TW_Denormal)
1425 				   && (denormal_operand() < 0))
1426 				return;
1427 			break;
1428 
1429 		case TW_NaN:
1430 			if (real_2op_NaN(st0_ptr, st0_tag, 1, st0_ptr) < 0)
1431 				return;
1432 		}
1433 
1434 	} else if (st0_tag == TW_NaN) {
1435 		if (real_2op_NaN(st0_ptr, st0_tag, 1, st0_ptr) < 0)
1436 			return;
1437 	} else if (st0_tag == TW_Infinity) {
1438 		if (st1_tag == TW_NaN) {
1439 			if (real_2op_NaN(st0_ptr, st0_tag, 1, st0_ptr) < 0)
1440 				return;
1441 		} else if (signnegative(st0_ptr)) {
1442 #ifndef PECULIAR_486
1443 			/* This should have higher priority than denormals, but... */
1444 			if (arith_invalid(1) < 0)	/* log(-infinity) */
1445 				return;
1446 #endif /* PECULIAR_486 */
1447 			if ((st1_tag == TW_Denormal)
1448 			    && (denormal_operand() < 0))
1449 				return;
1450 #ifdef PECULIAR_486
1451 			/* Denormal operands actually get higher priority */
1452 			if (arith_invalid(1) < 0)	/* log(-infinity) */
1453 				return;
1454 #endif /* PECULIAR_486 */
1455 		} else if (st1_tag == TAG_Zero) {
1456 			/* log(infinity) */
1457 			if (arith_invalid(1) < 0)
1458 				return;
1459 		}
1460 
1461 		/* st(1) must be valid here. */
1462 
1463 		else if ((st1_tag == TW_Denormal) && (denormal_operand() < 0))
1464 			return;
1465 
1466 		/* The Manual says that log(Infinity) is invalid, but a real
1467 		   80486 sensibly says that it is o.k. */
1468 		else {
1469 			u_char sign = getsign(st1_ptr);
1470 			FPU_copy_to_reg1(&CONST_INF, TAG_Special);
1471 			setsign(st1_ptr, sign);
1472 		}
1473 	}
1474 #ifdef PARANOID
1475 	else {
1476 		EXCEPTION(EX_INTERNAL | 0x117);
1477 		return;
1478 	}
1479 #endif /* PARANOID */
1480 
1481 	FPU_pop();
1482 	return;
1483 
1484 }
1485 
1486 static void fscale(FPU_REG *st0_ptr, u_char st0_tag)
1487 {
1488 	FPU_REG *st1_ptr = &st(1);
1489 	u_char st1_tag = FPU_gettagi(1);
1490 	int old_cw = control_word;
1491 	u_char sign = getsign(st0_ptr);
1492 
1493 	clear_C1();
1494 	if (!((st0_tag ^ TAG_Valid) | (st1_tag ^ TAG_Valid))) {
1495 		long scale;
1496 		FPU_REG tmp;
1497 
1498 		/* Convert register for internal use. */
1499 		setexponent16(st0_ptr, exponent(st0_ptr));
1500 
1501 	      valid_scale:
1502 
1503 		if (exponent(st1_ptr) > 30) {
1504 			/* 2^31 is far too large, would require 2^(2^30) or 2^(-2^30) */
1505 
1506 			if (signpositive(st1_ptr)) {
1507 				EXCEPTION(EX_Overflow);
1508 				FPU_copy_to_reg0(&CONST_INF, TAG_Special);
1509 			} else {
1510 				EXCEPTION(EX_Underflow);
1511 				FPU_copy_to_reg0(&CONST_Z, TAG_Zero);
1512 			}
1513 			setsign(st0_ptr, sign);
1514 			return;
1515 		}
1516 
1517 		control_word &= ~CW_RC;
1518 		control_word |= RC_CHOP;
1519 		reg_copy(st1_ptr, &tmp);
1520 		FPU_round_to_int(&tmp, st1_tag);	/* This can never overflow here */
1521 		control_word = old_cw;
1522 		scale = signnegative(st1_ptr) ? -tmp.sigl : tmp.sigl;
1523 		scale += exponent16(st0_ptr);
1524 
1525 		setexponent16(st0_ptr, scale);
1526 
1527 		/* Use FPU_round() to properly detect under/overflow etc */
1528 		FPU_round(st0_ptr, 0, 0, control_word, sign);
1529 
1530 		return;
1531 	}
1532 
1533 	if (st0_tag == TAG_Special)
1534 		st0_tag = FPU_Special(st0_ptr);
1535 	if (st1_tag == TAG_Special)
1536 		st1_tag = FPU_Special(st1_ptr);
1537 
1538 	if ((st0_tag == TAG_Valid) || (st0_tag == TW_Denormal)) {
1539 		switch (st1_tag) {
1540 		case TAG_Valid:
1541 			/* st(0) must be a denormal */
1542 			if ((st0_tag == TW_Denormal)
1543 			    && (denormal_operand() < 0))
1544 				return;
1545 
1546 			FPU_to_exp16(st0_ptr, st0_ptr);	/* Will not be left on stack */
1547 			goto valid_scale;
1548 
1549 		case TAG_Zero:
1550 			if (st0_tag == TW_Denormal)
1551 				denormal_operand();
1552 			return;
1553 
1554 		case TW_Denormal:
1555 			denormal_operand();
1556 			return;
1557 
1558 		case TW_Infinity:
1559 			if ((st0_tag == TW_Denormal)
1560 			    && (denormal_operand() < 0))
1561 				return;
1562 
1563 			if (signpositive(st1_ptr))
1564 				FPU_copy_to_reg0(&CONST_INF, TAG_Special);
1565 			else
1566 				FPU_copy_to_reg0(&CONST_Z, TAG_Zero);
1567 			setsign(st0_ptr, sign);
1568 			return;
1569 
1570 		case TW_NaN:
1571 			real_2op_NaN(st1_ptr, st1_tag, 0, st0_ptr);
1572 			return;
1573 		}
1574 	} else if (st0_tag == TAG_Zero) {
1575 		switch (st1_tag) {
1576 		case TAG_Valid:
1577 		case TAG_Zero:
1578 			return;
1579 
1580 		case TW_Denormal:
1581 			denormal_operand();
1582 			return;
1583 
1584 		case TW_Infinity:
1585 			if (signpositive(st1_ptr))
1586 				arith_invalid(0);	/* Zero scaled by +Infinity */
1587 			return;
1588 
1589 		case TW_NaN:
1590 			real_2op_NaN(st1_ptr, st1_tag, 0, st0_ptr);
1591 			return;
1592 		}
1593 	} else if (st0_tag == TW_Infinity) {
1594 		switch (st1_tag) {
1595 		case TAG_Valid:
1596 		case TAG_Zero:
1597 			return;
1598 
1599 		case TW_Denormal:
1600 			denormal_operand();
1601 			return;
1602 
1603 		case TW_Infinity:
1604 			if (signnegative(st1_ptr))
1605 				arith_invalid(0);	/* Infinity scaled by -Infinity */
1606 			return;
1607 
1608 		case TW_NaN:
1609 			real_2op_NaN(st1_ptr, st1_tag, 0, st0_ptr);
1610 			return;
1611 		}
1612 	} else if (st0_tag == TW_NaN) {
1613 		if (st1_tag != TAG_Empty) {
1614 			real_2op_NaN(st1_ptr, st1_tag, 0, st0_ptr);
1615 			return;
1616 		}
1617 	}
1618 #ifdef PARANOID
1619 	if (!((st0_tag == TAG_Empty) || (st1_tag == TAG_Empty))) {
1620 		EXCEPTION(EX_INTERNAL | 0x115);
1621 		return;
1622 	}
1623 #endif
1624 
1625 	/* At least one of st(0), st(1) must be empty */
1626 	FPU_stack_underflow();
1627 
1628 }
1629 
1630 /*---------------------------------------------------------------------------*/
1631 
1632 static FUNC_ST0 const trig_table_a[] = {
1633 	f2xm1, fyl2x, fptan, fpatan,
1634 	fxtract, fprem1, (FUNC_ST0) fdecstp, (FUNC_ST0) fincstp
1635 };
1636 
1637 void FPU_triga(void)
1638 {
1639 	(trig_table_a[FPU_rm]) (&st(0), FPU_gettag0());
1640 }
1641 
1642 static FUNC_ST0 const trig_table_b[] = {
1643 	fprem, fyl2xp1, fsqrt_, fsincos, frndint_, fscale, fsin, fcos
1644 };
1645 
1646 void FPU_trigb(void)
1647 {
1648 	(trig_table_b[FPU_rm]) (&st(0), FPU_gettag0());
1649 }
1650