CoCalc -- fpu

GitHub Repository: torvalds/linux
Path: blob/master/arch/x86/math-emu/fpu_trig.c
²⁶⁴²⁴ views
1
// SPDX-License-Identifier: GPL-2.0
2
/*---------------------------------------------------------------------------+
3
 |  fpu_trig.c                                                               |
4
 |                                                                           |
5
 | Implementation of the FPU "transcendental" functions.                     |
6
 |                                                                           |
7
 | Copyright (C) 1992,1993,1994,1997,1999                                    |
8
 |                       W. Metzenthen, 22 Parker St, Ormond, Vic 3163,      |
9
 |                       Australia.  E-mail   [email protected]            |
10
 |                                                                           |
11
 |                                                                           |
12
 +---------------------------------------------------------------------------*/
13

14
#include "fpu_system.h"
15
#include "exception.h"
16
#include "fpu_emu.h"
17
#include "status_w.h"
18
#include "control_w.h"
19
#include "reg_constant.h"
20

21
static void rem_kernel(unsigned long long st0, unsigned long long *y,
22
		       unsigned long long st1, unsigned long long q, int n);
23

24
#define BETTER_THAN_486
25

26
#define FCOS  4
27

28
/* Used only by fptan, fsin, fcos, and fsincos. */
29
/* This routine produces very accurate results, similar to
30
   using a value of pi with more than 128 bits precision. */
31
/* Limited measurements show no results worse than 64 bit precision
32
   except for the results for arguments close to 2^63, where the
33
   precision of the result sometimes degrades to about 63.9 bits */
34
static int trig_arg(FPU_REG *st0_ptr, int even)
35
{
36
	FPU_REG tmp;
37
	u_char tmptag;
38
	unsigned long long q;
39
	int old_cw = control_word, saved_status = partial_status;
40
	int tag, st0_tag = TAG_Valid;
41

42
	if (exponent(st0_ptr) >= 63) {
43
		partial_status |= SW_C2;	/* Reduction incomplete. */
44
		return -1;
45
	}
46

47
	control_word &= ~CW_RC;
48
	control_word |= RC_CHOP;
49

50
	setpositive(st0_ptr);
51
	tag = FPU_u_div(st0_ptr, &CONST_PI2, &tmp, PR_64_BITS | RC_CHOP | 0x3f,
52
			SIGN_POS);
53

54
	FPU_round_to_int(&tmp, tag);	/* Fortunately, this can't overflow
55
					   to 2^64 */
56
	q = significand(&tmp);
57
	if (q) {
58
		rem_kernel(significand(st0_ptr),
59
			   &significand(&tmp),
60
			   significand(&CONST_PI2),
61
			   q, exponent(st0_ptr) - exponent(&CONST_PI2));
62
		setexponent16(&tmp, exponent(&CONST_PI2));
63
		st0_tag = FPU_normalize(&tmp);
64
		FPU_copy_to_reg0(&tmp, st0_tag);
65
	}
66

67
	if ((even && !(q & 1)) || (!even && (q & 1))) {
68
		st0_tag =
69
		    FPU_sub(REV | LOADED | TAG_Valid, (int)&CONST_PI2,
70
			    FULL_PRECISION);
71

72
#ifdef BETTER_THAN_486
73
		/* So far, the results are exact but based upon a 64 bit
74
		   precision approximation to pi/2. The technique used
75
		   now is equivalent to using an approximation to pi/2 which
76
		   is accurate to about 128 bits. */
77
		if ((exponent(st0_ptr) <= exponent(&CONST_PI2extra) + 64)
78
		    || (q > 1)) {
79
			/* This code gives the effect of having pi/2 to better than
80
			   128 bits precision. */
81

82
			significand(&tmp) = q + 1;
83
			setexponent16(&tmp, 63);
84
			FPU_normalize(&tmp);
85
			tmptag =
86
			    FPU_u_mul(&CONST_PI2extra, &tmp, &tmp,
87
				      FULL_PRECISION, SIGN_POS,
88
				      exponent(&CONST_PI2extra) +
89
				      exponent(&tmp));
90
			setsign(&tmp, getsign(&CONST_PI2extra));
91
			st0_tag = FPU_add(&tmp, tmptag, 0, FULL_PRECISION);
92
			if (signnegative(st0_ptr)) {
93
				/* CONST_PI2extra is negative, so the result of the addition
94
				   can be negative. This means that the argument is actually
95
				   in a different quadrant. The correction is always < pi/2,
96
				   so it can't overflow into yet another quadrant. */
97
				setpositive(st0_ptr);
98
				q++;
99
			}
100
		}
101
#endif /* BETTER_THAN_486 */
102
	}
103
#ifdef BETTER_THAN_486
104
	else {
105
		/* So far, the results are exact but based upon a 64 bit
106
		   precision approximation to pi/2. The technique used
107
		   now is equivalent to using an approximation to pi/2 which
108
		   is accurate to about 128 bits. */
109
		if (((q > 0)
110
		     && (exponent(st0_ptr) <= exponent(&CONST_PI2extra) + 64))
111
		    || (q > 1)) {
112
			/* This code gives the effect of having p/2 to better than
113
			   128 bits precision. */
114

115
			significand(&tmp) = q;
116
			setexponent16(&tmp, 63);
117
			FPU_normalize(&tmp);	/* This must return TAG_Valid */
118
			tmptag =
119
			    FPU_u_mul(&CONST_PI2extra, &tmp, &tmp,
120
				      FULL_PRECISION, SIGN_POS,
121
				      exponent(&CONST_PI2extra) +
122
				      exponent(&tmp));
123
			setsign(&tmp, getsign(&CONST_PI2extra));
124
			st0_tag = FPU_sub(LOADED | (tmptag & 0x0f), (int)&tmp,
125
					  FULL_PRECISION);
126
			if ((exponent(st0_ptr) == exponent(&CONST_PI2)) &&
127
			    ((st0_ptr->sigh > CONST_PI2.sigh)
128
			     || ((st0_ptr->sigh == CONST_PI2.sigh)
129
				 && (st0_ptr->sigl > CONST_PI2.sigl)))) {
130
				/* CONST_PI2extra is negative, so the result of the
131
				   subtraction can be larger than pi/2. This means
132
				   that the argument is actually in a different quadrant.
133
				   The correction is always < pi/2, so it can't overflow
134
				   into yet another quadrant. */
135
				st0_tag =
136
				    FPU_sub(REV | LOADED | TAG_Valid,
137
					    (int)&CONST_PI2, FULL_PRECISION);
138
				q++;
139
			}
140
		}
141
	}
142
#endif /* BETTER_THAN_486 */
143

144
	FPU_settag0(st0_tag);
145
	control_word = old_cw;
146
	partial_status = saved_status & ~SW_C2;	/* Reduction complete. */
147

148
	return (q & 3) | even;
149
}
150

151
/* Convert a long to register */
152
static void convert_l2reg(long const *arg, int deststnr)
153
{
154
	int tag;
155
	long num = *arg;
156
	u_char sign;
157
	FPU_REG *dest = &st(deststnr);
158

159
	if (num == 0) {
160
		FPU_copy_to_regi(&CONST_Z, TAG_Zero, deststnr);
161
		return;
162
	}
163

164
	if (num > 0) {
165
		sign = SIGN_POS;
166
	} else {
167
		num = -num;
168
		sign = SIGN_NEG;
169
	}
170

171
	dest->sigh = num;
172
	dest->sigl = 0;
173
	setexponent16(dest, 31);
174
	tag = FPU_normalize(dest);
175
	FPU_settagi(deststnr, tag);
176
	setsign(dest, sign);
177
	return;
178
}
179

180
static void single_arg_error(FPU_REG *st0_ptr, u_char st0_tag)
181
{
182
	if (st0_tag == TAG_Empty)
183
		FPU_stack_underflow();	/* Puts a QNaN in st(0) */
184
	else if (st0_tag == TW_NaN)
185
		real_1op_NaN(st0_ptr);	/* return with a NaN in st(0) */
186
#ifdef PARANOID
187
	else
188
		EXCEPTION(EX_INTERNAL | 0x0112);
189
#endif /* PARANOID */
190
}
191

192
static void single_arg_2_error(FPU_REG *st0_ptr, u_char st0_tag)
193
{
194
	int isNaN;
195

196
	switch (st0_tag) {
197
	case TW_NaN:
198
		isNaN = (exponent(st0_ptr) == EXP_OVER)
199
		    && (st0_ptr->sigh & 0x80000000);
200
		if (isNaN && !(st0_ptr->sigh & 0x40000000)) {	/* Signaling ? */
201
			EXCEPTION(EX_Invalid);
202
			if (control_word & CW_Invalid) {
203
				/* The masked response */
204
				/* Convert to a QNaN */
205
				st0_ptr->sigh |= 0x40000000;
206
				push();
207
				FPU_copy_to_reg0(st0_ptr, TAG_Special);
208
			}
209
		} else if (isNaN) {
210
			/* A QNaN */
211
			push();
212
			FPU_copy_to_reg0(st0_ptr, TAG_Special);
213
		} else {
214
			/* pseudoNaN or other unsupported */
215
			EXCEPTION(EX_Invalid);
216
			if (control_word & CW_Invalid) {
217
				/* The masked response */
218
				FPU_copy_to_reg0(&CONST_QNaN, TAG_Special);
219
				push();
220
				FPU_copy_to_reg0(&CONST_QNaN, TAG_Special);
221
			}
222
		}
223
		break;		/* return with a NaN in st(0) */
224
#ifdef PARANOID
225
	default:
226
		EXCEPTION(EX_INTERNAL | 0x0112);
227
#endif /* PARANOID */
228
	}
229
}
230

231
/*---------------------------------------------------------------------------*/
232

233
static void f2xm1(FPU_REG *st0_ptr, u_char tag)
234
{
235
	FPU_REG a;
236

237
	clear_C1();
238

239
	if (tag == TAG_Valid) {
240
		/* For an 80486 FPU, the result is undefined if the arg is >= 1.0 */
241
		if (exponent(st0_ptr) < 0) {
242
		      denormal_arg:
243

244
			FPU_to_exp16(st0_ptr, &a);
245

246
			/* poly_2xm1(x) requires 0 < st(0) < 1. */
247
			poly_2xm1(getsign(st0_ptr), &a, st0_ptr);
248
		}
249
		set_precision_flag_up();	/* 80486 appears to always do this */
250
		return;
251
	}
252

253
	if (tag == TAG_Zero)
254
		return;
255

256
	if (tag == TAG_Special)
257
		tag = FPU_Special(st0_ptr);
258

259
	switch (tag) {
260
	case TW_Denormal:
261
		if (denormal_operand() < 0)
262
			return;
263
		goto denormal_arg;
264
	case TW_Infinity:
265
		if (signnegative(st0_ptr)) {
266
			/* -infinity gives -1 (p16-10) */
267
			FPU_copy_to_reg0(&CONST_1, TAG_Valid);
268
			setnegative(st0_ptr);
269
		}
270
		return;
271
	default:
272
		single_arg_error(st0_ptr, tag);
273
	}
274
}
275

276
static void fptan(FPU_REG *st0_ptr, u_char st0_tag)
277
{
278
	FPU_REG *st_new_ptr;
279
	int q;
280
	u_char arg_sign = getsign(st0_ptr);
281

282
	/* Stack underflow has higher priority */
283
	if (st0_tag == TAG_Empty) {
284
		FPU_stack_underflow();	/* Puts a QNaN in st(0) */
285
		if (control_word & CW_Invalid) {
286
			st_new_ptr = &st(-1);
287
			push();
288
			FPU_stack_underflow();	/* Puts a QNaN in the new st(0) */
289
		}
290
		return;
291
	}
292

293
	if (STACK_OVERFLOW) {
294
		FPU_stack_overflow();
295
		return;
296
	}
297

298
	if (st0_tag == TAG_Valid) {
299
		if (exponent(st0_ptr) > -40) {
300
			if ((q = trig_arg(st0_ptr, 0)) == -1) {
301
				/* Operand is out of range */
302
				return;
303
			}
304

305
			poly_tan(st0_ptr);
306
			setsign(st0_ptr, (q & 1) ^ (arg_sign != 0));
307
			set_precision_flag_up();	/* We do not really know if up or down */
308
		} else {
309
			/* For a small arg, the result == the argument */
310
			/* Underflow may happen */
311

312
		      denormal_arg:
313

314
			FPU_to_exp16(st0_ptr, st0_ptr);
315

316
			st0_tag =
317
			    FPU_round(st0_ptr, 1, 0, FULL_PRECISION, arg_sign);
318
			FPU_settag0(st0_tag);
319
		}
320
		push();
321
		FPU_copy_to_reg0(&CONST_1, TAG_Valid);
322
		return;
323
	}
324

325
	if (st0_tag == TAG_Zero) {
326
		push();
327
		FPU_copy_to_reg0(&CONST_1, TAG_Valid);
328
		setcc(0);
329
		return;
330
	}
331

332
	if (st0_tag == TAG_Special)
333
		st0_tag = FPU_Special(st0_ptr);
334

335
	if (st0_tag == TW_Denormal) {
336
		if (denormal_operand() < 0)
337
			return;
338

339
		goto denormal_arg;
340
	}
341

342
	if (st0_tag == TW_Infinity) {
343
		/* The 80486 treats infinity as an invalid operand */
344
		if (arith_invalid(0) >= 0) {
345
			st_new_ptr = &st(-1);
346
			push();
347
			arith_invalid(0);
348
		}
349
		return;
350
	}
351

352
	single_arg_2_error(st0_ptr, st0_tag);
353
}
354

355
static void fxtract(FPU_REG *st0_ptr, u_char st0_tag)
356
{
357
	FPU_REG *st_new_ptr;
358
	u_char sign;
359
	register FPU_REG *st1_ptr = st0_ptr;	/* anticipate */
360

361
	if (STACK_OVERFLOW) {
362
		FPU_stack_overflow();
363
		return;
364
	}
365

366
	clear_C1();
367

368
	if (st0_tag == TAG_Valid) {
369
		long e;
370

371
		push();
372
		sign = getsign(st1_ptr);
373
		reg_copy(st1_ptr, st_new_ptr);
374
		setexponent16(st_new_ptr, exponent(st_new_ptr));
375

376
	      denormal_arg:
377

378
		e = exponent16(st_new_ptr);
379
		convert_l2reg(&e, 1);
380
		setexponentpos(st_new_ptr, 0);
381
		setsign(st_new_ptr, sign);
382
		FPU_settag0(TAG_Valid);	/* Needed if arg was a denormal */
383
		return;
384
	} else if (st0_tag == TAG_Zero) {
385
		sign = getsign(st0_ptr);
386

387
		if (FPU_divide_by_zero(0, SIGN_NEG) < 0)
388
			return;
389

390
		push();
391
		FPU_copy_to_reg0(&CONST_Z, TAG_Zero);
392
		setsign(st_new_ptr, sign);
393
		return;
394
	}
395

396
	if (st0_tag == TAG_Special)
397
		st0_tag = FPU_Special(st0_ptr);
398

399
	if (st0_tag == TW_Denormal) {
400
		if (denormal_operand() < 0)
401
			return;
402

403
		push();
404
		sign = getsign(st1_ptr);
405
		FPU_to_exp16(st1_ptr, st_new_ptr);
406
		goto denormal_arg;
407
	} else if (st0_tag == TW_Infinity) {
408
		sign = getsign(st0_ptr);
409
		setpositive(st0_ptr);
410
		push();
411
		FPU_copy_to_reg0(&CONST_INF, TAG_Special);
412
		setsign(st_new_ptr, sign);
413
		return;
414
	} else if (st0_tag == TW_NaN) {
415
		if (real_1op_NaN(st0_ptr) < 0)
416
			return;
417

418
		push();
419
		FPU_copy_to_reg0(st0_ptr, TAG_Special);
420
		return;
421
	} else if (st0_tag == TAG_Empty) {
422
		/* Is this the correct behaviour? */
423
		if (control_word & EX_Invalid) {
424
			FPU_stack_underflow();
425
			push();
426
			FPU_stack_underflow();
427
		} else
428
			EXCEPTION(EX_StackUnder);
429
	}
430
#ifdef PARANOID
431
	else
432
		EXCEPTION(EX_INTERNAL | 0x119);
433
#endif /* PARANOID */
434
}
435

436
static void fdecstp(FPU_REG *st0_ptr, u_char st0_tag)
437
{
438
	clear_C1();
439
	top--;
440
}
441

442
static void fincstp(FPU_REG *st0_ptr, u_char st0_tag)
443
{
444
	clear_C1();
445
	top++;
446
}
447

448
static void fsqrt_(FPU_REG *st0_ptr, u_char st0_tag)
449
{
450
	int expon;
451

452
	clear_C1();
453

454
	if (st0_tag == TAG_Valid) {
455
		u_char tag;
456

457
		if (signnegative(st0_ptr)) {
458
			arith_invalid(0);	/* sqrt(negative) is invalid */
459
			return;
460
		}
461

462
		/* make st(0) in  [1.0 .. 4.0) */
463
		expon = exponent(st0_ptr);
464

465
	      denormal_arg:
466

467
		setexponent16(st0_ptr, (expon & 1));
468

469
		/* Do the computation, the sign of the result will be positive. */
470
		tag = wm_sqrt(st0_ptr, 0, 0, control_word, SIGN_POS);
471
		addexponent(st0_ptr, expon >> 1);
472
		FPU_settag0(tag);
473
		return;
474
	}
475

476
	if (st0_tag == TAG_Zero)
477
		return;
478

479
	if (st0_tag == TAG_Special)
480
		st0_tag = FPU_Special(st0_ptr);
481

482
	if (st0_tag == TW_Infinity) {
483
		if (signnegative(st0_ptr))
484
			arith_invalid(0);	/* sqrt(-Infinity) is invalid */
485
		return;
486
	} else if (st0_tag == TW_Denormal) {
487
		if (signnegative(st0_ptr)) {
488
			arith_invalid(0);	/* sqrt(negative) is invalid */
489
			return;
490
		}
491

492
		if (denormal_operand() < 0)
493
			return;
494

495
		FPU_to_exp16(st0_ptr, st0_ptr);
496

497
		expon = exponent16(st0_ptr);
498

499
		goto denormal_arg;
500
	}
501

502
	single_arg_error(st0_ptr, st0_tag);
503

504
}
505

506
static void frndint_(FPU_REG *st0_ptr, u_char st0_tag)
507
{
508
	int flags, tag;
509

510
	if (st0_tag == TAG_Valid) {
511
		u_char sign;
512

513
	      denormal_arg:
514

515
		sign = getsign(st0_ptr);
516

517
		if (exponent(st0_ptr) > 63)
518
			return;
519

520
		if (st0_tag == TW_Denormal) {
521
			if (denormal_operand() < 0)
522
				return;
523
		}
524

525
		/* Fortunately, this can't overflow to 2^64 */
526
		if ((flags = FPU_round_to_int(st0_ptr, st0_tag)))
527
			set_precision_flag(flags);
528

529
		setexponent16(st0_ptr, 63);
530
		tag = FPU_normalize(st0_ptr);
531
		setsign(st0_ptr, sign);
532
		FPU_settag0(tag);
533
		return;
534
	}
535

536
	if (st0_tag == TAG_Zero)
537
		return;
538

539
	if (st0_tag == TAG_Special)
540
		st0_tag = FPU_Special(st0_ptr);
541

542
	if (st0_tag == TW_Denormal)
543
		goto denormal_arg;
544
	else if (st0_tag == TW_Infinity)
545
		return;
546
	else
547
		single_arg_error(st0_ptr, st0_tag);
548
}
549

550
static int f_sin(FPU_REG *st0_ptr, u_char tag)
551
{
552
	u_char arg_sign = getsign(st0_ptr);
553

554
	if (tag == TAG_Valid) {
555
		int q;
556

557
		if (exponent(st0_ptr) > -40) {
558
			if ((q = trig_arg(st0_ptr, 0)) == -1) {
559
				/* Operand is out of range */
560
				return 1;
561
			}
562

563
			poly_sine(st0_ptr);
564

565
			if (q & 2)
566
				changesign(st0_ptr);
567

568
			setsign(st0_ptr, getsign(st0_ptr) ^ arg_sign);
569

570
			/* We do not really know if up or down */
571
			set_precision_flag_up();
572
			return 0;
573
		} else {
574
			/* For a small arg, the result == the argument */
575
			set_precision_flag_up();	/* Must be up. */
576
			return 0;
577
		}
578
	}
579

580
	if (tag == TAG_Zero) {
581
		setcc(0);
582
		return 0;
583
	}
584

585
	if (tag == TAG_Special)
586
		tag = FPU_Special(st0_ptr);
587

588
	if (tag == TW_Denormal) {
589
		if (denormal_operand() < 0)
590
			return 1;
591

592
		/* For a small arg, the result == the argument */
593
		/* Underflow may happen */
594
		FPU_to_exp16(st0_ptr, st0_ptr);
595

596
		tag = FPU_round(st0_ptr, 1, 0, FULL_PRECISION, arg_sign);
597

598
		FPU_settag0(tag);
599

600
		return 0;
601
	} else if (tag == TW_Infinity) {
602
		/* The 80486 treats infinity as an invalid operand */
603
		arith_invalid(0);
604
		return 1;
605
	} else {
606
		single_arg_error(st0_ptr, tag);
607
		return 1;
608
	}
609
}
610

611
static void fsin(FPU_REG *st0_ptr, u_char tag)
612
{
613
	f_sin(st0_ptr, tag);
614
}
615

616
static int f_cos(FPU_REG *st0_ptr, u_char tag)
617
{
618
	u_char st0_sign;
619

620
	st0_sign = getsign(st0_ptr);
621

622
	if (tag == TAG_Valid) {
623
		int q;
624

625
		if (exponent(st0_ptr) > -40) {
626
			if ((exponent(st0_ptr) < 0)
627
			    || ((exponent(st0_ptr) == 0)
628
				&& (significand(st0_ptr) <=
629
				    0xc90fdaa22168c234LL))) {
630
				poly_cos(st0_ptr);
631

632
				/* We do not really know if up or down */
633
				set_precision_flag_down();
634

635
				return 0;
636
			} else if ((q = trig_arg(st0_ptr, FCOS)) != -1) {
637
				poly_sine(st0_ptr);
638

639
				if ((q + 1) & 2)
640
					changesign(st0_ptr);
641

642
				/* We do not really know if up or down */
643
				set_precision_flag_down();
644

645
				return 0;
646
			} else {
647
				/* Operand is out of range */
648
				return 1;
649
			}
650
		} else {
651
		      denormal_arg:
652

653
			setcc(0);
654
			FPU_copy_to_reg0(&CONST_1, TAG_Valid);
655
#ifdef PECULIAR_486
656
			set_precision_flag_down();	/* 80486 appears to do this. */
657
#else
658
			set_precision_flag_up();	/* Must be up. */
659
#endif /* PECULIAR_486 */
660
			return 0;
661
		}
662
	} else if (tag == TAG_Zero) {
663
		FPU_copy_to_reg0(&CONST_1, TAG_Valid);
664
		setcc(0);
665
		return 0;
666
	}
667

668
	if (tag == TAG_Special)
669
		tag = FPU_Special(st0_ptr);
670

671
	if (tag == TW_Denormal) {
672
		if (denormal_operand() < 0)
673
			return 1;
674

675
		goto denormal_arg;
676
	} else if (tag == TW_Infinity) {
677
		/* The 80486 treats infinity as an invalid operand */
678
		arith_invalid(0);
679
		return 1;
680
	} else {
681
		single_arg_error(st0_ptr, tag);	/* requires st0_ptr == &st(0) */
682
		return 1;
683
	}
684
}
685

686
static void fcos(FPU_REG *st0_ptr, u_char st0_tag)
687
{
688
	f_cos(st0_ptr, st0_tag);
689
}
690

691
static void fsincos(FPU_REG *st0_ptr, u_char st0_tag)
692
{
693
	FPU_REG *st_new_ptr;
694
	FPU_REG arg;
695
	u_char tag;
696

697
	/* Stack underflow has higher priority */
698
	if (st0_tag == TAG_Empty) {
699
		FPU_stack_underflow();	/* Puts a QNaN in st(0) */
700
		if (control_word & CW_Invalid) {
701
			st_new_ptr = &st(-1);
702
			push();
703
			FPU_stack_underflow();	/* Puts a QNaN in the new st(0) */
704
		}
705
		return;
706
	}
707

708
	if (STACK_OVERFLOW) {
709
		FPU_stack_overflow();
710
		return;
711
	}
712

713
	if (st0_tag == TAG_Special)
714
		tag = FPU_Special(st0_ptr);
715
	else
716
		tag = st0_tag;
717

718
	if (tag == TW_NaN) {
719
		single_arg_2_error(st0_ptr, TW_NaN);
720
		return;
721
	} else if (tag == TW_Infinity) {
722
		/* The 80486 treats infinity as an invalid operand */
723
		if (arith_invalid(0) >= 0) {
724
			/* Masked response */
725
			push();
726
			arith_invalid(0);
727
		}
728
		return;
729
	}
730

731
	reg_copy(st0_ptr, &arg);
732
	if (!f_sin(st0_ptr, st0_tag)) {
733
		push();
734
		FPU_copy_to_reg0(&arg, st0_tag);
735
		f_cos(&st(0), st0_tag);
736
	} else {
737
		/* An error, so restore st(0) */
738
		FPU_copy_to_reg0(&arg, st0_tag);
739
	}
740
}
741

742
/*---------------------------------------------------------------------------*/
743
/* The following all require two arguments: st(0) and st(1) */
744

745
/* A lean, mean kernel for the fprem instructions. This relies upon
746
   the division and rounding to an integer in do_fprem giving an
747
   exact result. Because of this, rem_kernel() needs to deal only with
748
   the least significant 64 bits, the more significant bits of the
749
   result must be zero.
750
 */
751
static void rem_kernel(unsigned long long st0, unsigned long long *y,
752
		       unsigned long long st1, unsigned long long q, int n)
753
{
754
	int dummy;
755
	unsigned long long x;
756

757
	x = st0 << n;
758

759
	/* Do the required multiplication and subtraction in the one operation */
760

761
	/* lsw x -= lsw st1 * lsw q */
762
	asm volatile ("mull %4; subl %%eax,%0; sbbl %%edx,%1":"=m"
763
		      (((unsigned *)&x)[0]), "=m"(((unsigned *)&x)[1]),
764
		      "=a"(dummy)
765
		      :"2"(((unsigned *)&st1)[0]), "m"(((unsigned *)&q)[0])
766
		      :"%dx");
767
	/* msw x -= msw st1 * lsw q */
768
	asm volatile ("mull %3; subl %%eax,%0":"=m" (((unsigned *)&x)[1]),
769
		      "=a"(dummy)
770
		      :"1"(((unsigned *)&st1)[1]), "m"(((unsigned *)&q)[0])
771
		      :"%dx");
772
	/* msw x -= lsw st1 * msw q */
773
	asm volatile ("mull %3; subl %%eax,%0":"=m" (((unsigned *)&x)[1]),
774
		      "=a"(dummy)
775
		      :"1"(((unsigned *)&st1)[0]), "m"(((unsigned *)&q)[1])
776
		      :"%dx");
777

778
	*y = x;
779
}
780

781
/* Remainder of st(0) / st(1) */
782
/* This routine produces exact results, i.e. there is never any
783
   rounding or truncation, etc of the result. */
784
static void do_fprem(FPU_REG *st0_ptr, u_char st0_tag, int round)
785
{
786
	FPU_REG *st1_ptr = &st(1);
787
	u_char st1_tag = FPU_gettagi(1);
788

789
	if (!((st0_tag ^ TAG_Valid) | (st1_tag ^ TAG_Valid))) {
790
		FPU_REG tmp, st0, st1;
791
		u_char st0_sign, st1_sign;
792
		u_char tmptag;
793
		int tag;
794
		int old_cw;
795
		int expdif;
796
		long long q;
797
		unsigned short saved_status;
798
		int cc;
799

800
	      fprem_valid:
801
		/* Convert registers for internal use. */
802
		st0_sign = FPU_to_exp16(st0_ptr, &st0);
803
		st1_sign = FPU_to_exp16(st1_ptr, &st1);
804
		expdif = exponent16(&st0) - exponent16(&st1);
805

806
		old_cw = control_word;
807
		cc = 0;
808

809
		/* We want the status following the denorm tests, but don't want
810
		   the status changed by the arithmetic operations. */
811
		saved_status = partial_status;
812
		control_word &= ~CW_RC;
813
		control_word |= RC_CHOP;
814

815
		if (expdif < 64) {
816
			/* This should be the most common case */
817

818
			if (expdif > -2) {
819
				u_char sign = st0_sign ^ st1_sign;
820
				tag = FPU_u_div(&st0, &st1, &tmp,
821
						PR_64_BITS | RC_CHOP | 0x3f,
822
						sign);
823
				setsign(&tmp, sign);
824

825
				if (exponent(&tmp) >= 0) {
826
					FPU_round_to_int(&tmp, tag);	/* Fortunately, this can't
827
									   overflow to 2^64 */
828
					q = significand(&tmp);
829

830
					rem_kernel(significand(&st0),
831
						   &significand(&tmp),
832
						   significand(&st1),
833
						   q, expdif);
834

835
					setexponent16(&tmp, exponent16(&st1));
836
				} else {
837
					reg_copy(&st0, &tmp);
838
					q = 0;
839
				}
840

841
				if ((round == RC_RND)
842
				    && (tmp.sigh & 0xc0000000)) {
843
					/* We may need to subtract st(1) once more,
844
					   to get a result <= 1/2 of st(1). */
845
					unsigned long long x;
846
					expdif =
847
					    exponent16(&st1) - exponent16(&tmp);
848
					if (expdif <= 1) {
849
						if (expdif == 0)
850
							x = significand(&st1) -
851
							    significand(&tmp);
852
						else	/* expdif is 1 */
853
							x = (significand(&st1)
854
							     << 1) -
855
							    significand(&tmp);
856
						if ((x < significand(&tmp)) ||
857
						    /* or equi-distant (from 0 & st(1)) and q is odd */
858
						    ((x == significand(&tmp))
859
						     && (q & 1))) {
860
							st0_sign = !st0_sign;
861
							significand(&tmp) = x;
862
							q++;
863
						}
864
					}
865
				}
866

867
				if (q & 4)
868
					cc |= SW_C0;
869
				if (q & 2)
870
					cc |= SW_C3;
871
				if (q & 1)
872
					cc |= SW_C1;
873
			} else {
874
				control_word = old_cw;
875
				setcc(0);
876
				return;
877
			}
878
		} else {
879
			/* There is a large exponent difference ( >= 64 ) */
880
			/* To make much sense, the code in this section should
881
			   be done at high precision. */
882
			int exp_1, N;
883
			u_char sign;
884

885
			/* prevent overflow here */
886
			/* N is 'a number between 32 and 63' (p26-113) */
887
			reg_copy(&st0, &tmp);
888
			tmptag = st0_tag;
889
			N = (expdif & 0x0000001f) + 32;	/* This choice gives results
890
							   identical to an AMD 486 */
891
			setexponent16(&tmp, N);
892
			exp_1 = exponent16(&st1);
893
			setexponent16(&st1, 0);
894
			expdif -= N;
895

896
			sign = getsign(&tmp) ^ st1_sign;
897
			tag =
898
			    FPU_u_div(&tmp, &st1, &tmp,
899
				      PR_64_BITS | RC_CHOP | 0x3f, sign);
900
			setsign(&tmp, sign);
901

902
			FPU_round_to_int(&tmp, tag);	/* Fortunately, this can't
903
							   overflow to 2^64 */
904

905
			rem_kernel(significand(&st0),
906
				   &significand(&tmp),
907
				   significand(&st1),
908
				   significand(&tmp), exponent(&tmp)
909
			    );
910
			setexponent16(&tmp, exp_1 + expdif);
911

912
			/* It is possible for the operation to be complete here.
913
			   What does the IEEE standard say? The Intel 80486 manual
914
			   implies that the operation will never be completed at this
915
			   point, and the behaviour of a real 80486 confirms this.
916
			 */
917
			if (!(tmp.sigh | tmp.sigl)) {
918
				/* The result is zero */
919
				control_word = old_cw;
920
				partial_status = saved_status;
921
				FPU_copy_to_reg0(&CONST_Z, TAG_Zero);
922
				setsign(&st0, st0_sign);
923
#ifdef PECULIAR_486
924
				setcc(SW_C2);
925
#else
926
				setcc(0);
927
#endif /* PECULIAR_486 */
928
				return;
929
			}
930
			cc = SW_C2;
931
		}
932

933
		control_word = old_cw;
934
		partial_status = saved_status;
935
		tag = FPU_normalize_nuo(&tmp);
936
		reg_copy(&tmp, st0_ptr);
937

938
		/* The only condition to be looked for is underflow,
939
		   and it can occur here only if underflow is unmasked. */
940
		if ((exponent16(&tmp) <= EXP_UNDER) && (tag != TAG_Zero)
941
		    && !(control_word & CW_Underflow)) {
942
			setcc(cc);
943
			tag = arith_underflow(st0_ptr);
944
			setsign(st0_ptr, st0_sign);
945
			FPU_settag0(tag);
946
			return;
947
		} else if ((exponent16(&tmp) > EXP_UNDER) || (tag == TAG_Zero)) {
948
			stdexp(st0_ptr);
949
			setsign(st0_ptr, st0_sign);
950
		} else {
951
			tag =
952
			    FPU_round(st0_ptr, 0, 0, FULL_PRECISION, st0_sign);
953
		}
954
		FPU_settag0(tag);
955
		setcc(cc);
956

957
		return;
958
	}
959

960
	if (st0_tag == TAG_Special)
961
		st0_tag = FPU_Special(st0_ptr);
962
	if (st1_tag == TAG_Special)
963
		st1_tag = FPU_Special(st1_ptr);
964

965
	if (((st0_tag == TAG_Valid) && (st1_tag == TW_Denormal))
966
	    || ((st0_tag == TW_Denormal) && (st1_tag == TAG_Valid))
967
	    || ((st0_tag == TW_Denormal) && (st1_tag == TW_Denormal))) {
968
		if (denormal_operand() < 0)
969
			return;
970
		goto fprem_valid;
971
	} else if ((st0_tag == TAG_Empty) || (st1_tag == TAG_Empty)) {
972
		FPU_stack_underflow();
973
		return;
974
	} else if (st0_tag == TAG_Zero) {
975
		if (st1_tag == TAG_Valid) {
976
			setcc(0);
977
			return;
978
		} else if (st1_tag == TW_Denormal) {
979
			if (denormal_operand() < 0)
980
				return;
981
			setcc(0);
982
			return;
983
		} else if (st1_tag == TAG_Zero) {
984
			arith_invalid(0);
985
			return;
986
		} /* fprem(?,0) always invalid */
987
		else if (st1_tag == TW_Infinity) {
988
			setcc(0);
989
			return;
990
		}
991
	} else if ((st0_tag == TAG_Valid) || (st0_tag == TW_Denormal)) {
992
		if (st1_tag == TAG_Zero) {
993
			arith_invalid(0);	/* fprem(Valid,Zero) is invalid */
994
			return;
995
		} else if (st1_tag != TW_NaN) {
996
			if (((st0_tag == TW_Denormal)
997
			     || (st1_tag == TW_Denormal))
998
			    && (denormal_operand() < 0))
999
				return;
1000

1001
			if (st1_tag == TW_Infinity) {
1002
				/* fprem(Valid,Infinity) is o.k. */
1003
				setcc(0);
1004
				return;
1005
			}
1006
		}
1007
	} else if (st0_tag == TW_Infinity) {
1008
		if (st1_tag != TW_NaN) {
1009
			arith_invalid(0);	/* fprem(Infinity,?) is invalid */
1010
			return;
1011
		}
1012
	}
1013

1014
	/* One of the registers must contain a NaN if we got here. */
1015

1016
#ifdef PARANOID
1017
	if ((st0_tag != TW_NaN) && (st1_tag != TW_NaN))
1018
		EXCEPTION(EX_INTERNAL | 0x118);
1019
#endif /* PARANOID */
1020

1021
	real_2op_NaN(st1_ptr, st1_tag, 0, st1_ptr);
1022

1023
}
1024

1025
/* ST(1) <- ST(1) * log ST;  pop ST */
1026
static void fyl2x(FPU_REG *st0_ptr, u_char st0_tag)
1027
{
1028
	FPU_REG *st1_ptr = &st(1), exponent;
1029
	u_char st1_tag = FPU_gettagi(1);
1030
	u_char sign;
1031
	int e, tag;
1032

1033
	clear_C1();
1034

1035
	if ((st0_tag == TAG_Valid) && (st1_tag == TAG_Valid)) {
1036
	      both_valid:
1037
		/* Both regs are Valid or Denormal */
1038
		if (signpositive(st0_ptr)) {
1039
			if (st0_tag == TW_Denormal)
1040
				FPU_to_exp16(st0_ptr, st0_ptr);
1041
			else
1042
				/* Convert st(0) for internal use. */
1043
				setexponent16(st0_ptr, exponent(st0_ptr));
1044

1045
			if ((st0_ptr->sigh == 0x80000000)
1046
			    && (st0_ptr->sigl == 0)) {
1047
				/* Special case. The result can be precise. */
1048
				u_char esign;
1049
				e = exponent16(st0_ptr);
1050
				if (e >= 0) {
1051
					exponent.sigh = e;
1052
					esign = SIGN_POS;
1053
				} else {
1054
					exponent.sigh = -e;
1055
					esign = SIGN_NEG;
1056
				}
1057
				exponent.sigl = 0;
1058
				setexponent16(&exponent, 31);
1059
				tag = FPU_normalize_nuo(&exponent);
1060
				stdexp(&exponent);
1061
				setsign(&exponent, esign);
1062
				tag =
1063
				    FPU_mul(&exponent, tag, 1, FULL_PRECISION);
1064
				if (tag >= 0)
1065
					FPU_settagi(1, tag);
1066
			} else {
1067
				/* The usual case */
1068
				sign = getsign(st1_ptr);
1069
				if (st1_tag == TW_Denormal)
1070
					FPU_to_exp16(st1_ptr, st1_ptr);
1071
				else
1072
					/* Convert st(1) for internal use. */
1073
					setexponent16(st1_ptr,
1074
						      exponent(st1_ptr));
1075
				poly_l2(st0_ptr, st1_ptr, sign);
1076
			}
1077
		} else {
1078
			/* negative */
1079
			if (arith_invalid(1) < 0)
1080
				return;
1081
		}
1082

1083
		FPU_pop();
1084

1085
		return;
1086
	}
1087

1088
	if (st0_tag == TAG_Special)
1089
		st0_tag = FPU_Special(st0_ptr);
1090
	if (st1_tag == TAG_Special)
1091
		st1_tag = FPU_Special(st1_ptr);
1092

1093
	if ((st0_tag == TAG_Empty) || (st1_tag == TAG_Empty)) {
1094
		FPU_stack_underflow_pop(1);
1095
		return;
1096
	} else if ((st0_tag <= TW_Denormal) && (st1_tag <= TW_Denormal)) {
1097
		if (st0_tag == TAG_Zero) {
1098
			if (st1_tag == TAG_Zero) {
1099
				/* Both args zero is invalid */
1100
				if (arith_invalid(1) < 0)
1101
					return;
1102
			} else {
1103
				u_char sign;
1104
				sign = getsign(st1_ptr) ^ SIGN_NEG;
1105
				if (FPU_divide_by_zero(1, sign) < 0)
1106
					return;
1107

1108
				setsign(st1_ptr, sign);
1109
			}
1110
		} else if (st1_tag == TAG_Zero) {
1111
			/* st(1) contains zero, st(0) valid <> 0 */
1112
			/* Zero is the valid answer */
1113
			sign = getsign(st1_ptr);
1114

1115
			if (signnegative(st0_ptr)) {
1116
				/* log(negative) */
1117
				if (arith_invalid(1) < 0)
1118
					return;
1119
			} else if ((st0_tag == TW_Denormal)
1120
				   && (denormal_operand() < 0))
1121
				return;
1122
			else {
1123
				if (exponent(st0_ptr) < 0)
1124
					sign ^= SIGN_NEG;
1125

1126
				FPU_copy_to_reg1(&CONST_Z, TAG_Zero);
1127
				setsign(st1_ptr, sign);
1128
			}
1129
		} else {
1130
			/* One or both operands are denormals. */
1131
			if (denormal_operand() < 0)
1132
				return;
1133
			goto both_valid;
1134
		}
1135
	} else if ((st0_tag == TW_NaN) || (st1_tag == TW_NaN)) {
1136
		if (real_2op_NaN(st0_ptr, st0_tag, 1, st0_ptr) < 0)
1137
			return;
1138
	}
1139
	/* One or both arg must be an infinity */
1140
	else if (st0_tag == TW_Infinity) {
1141
		if ((signnegative(st0_ptr)) || (st1_tag == TAG_Zero)) {
1142
			/* log(-infinity) or 0*log(infinity) */
1143
			if (arith_invalid(1) < 0)
1144
				return;
1145
		} else {
1146
			u_char sign = getsign(st1_ptr);
1147

1148
			if ((st1_tag == TW_Denormal)
1149
			    && (denormal_operand() < 0))
1150
				return;
1151

1152
			FPU_copy_to_reg1(&CONST_INF, TAG_Special);
1153
			setsign(st1_ptr, sign);
1154
		}
1155
	}
1156
	/* st(1) must be infinity here */
1157
	else if (((st0_tag == TAG_Valid) || (st0_tag == TW_Denormal))
1158
		 && (signpositive(st0_ptr))) {
1159
		if (exponent(st0_ptr) >= 0) {
1160
			if ((exponent(st0_ptr) == 0) &&
1161
			    (st0_ptr->sigh == 0x80000000) &&
1162
			    (st0_ptr->sigl == 0)) {
1163
				/* st(0) holds 1.0 */
1164
				/* infinity*log(1) */
1165
				if (arith_invalid(1) < 0)
1166
					return;
1167
			}
1168
			/* else st(0) is positive and > 1.0 */
1169
		} else {
1170
			/* st(0) is positive and < 1.0 */
1171

1172
			if ((st0_tag == TW_Denormal)
1173
			    && (denormal_operand() < 0))
1174
				return;
1175

1176
			changesign(st1_ptr);
1177
		}
1178
	} else {
1179
		/* st(0) must be zero or negative */
1180
		if (st0_tag == TAG_Zero) {
1181
			/* This should be invalid, but a real 80486 is happy with it. */
1182

1183
#ifndef PECULIAR_486
1184
			sign = getsign(st1_ptr);
1185
			if (FPU_divide_by_zero(1, sign) < 0)
1186
				return;
1187
#endif /* PECULIAR_486 */
1188

1189
			changesign(st1_ptr);
1190
		} else if (arith_invalid(1) < 0)	/* log(negative) */
1191
			return;
1192
	}
1193

1194
	FPU_pop();
1195
}
1196

1197
static void fpatan(FPU_REG *st0_ptr, u_char st0_tag)
1198
{
1199
	FPU_REG *st1_ptr = &st(1);
1200
	u_char st1_tag = FPU_gettagi(1);
1201
	int tag;
1202

1203
	clear_C1();
1204
	if (!((st0_tag ^ TAG_Valid) | (st1_tag ^ TAG_Valid))) {
1205
	      valid_atan:
1206

1207
		poly_atan(st0_ptr, st0_tag, st1_ptr, st1_tag);
1208

1209
		FPU_pop();
1210

1211
		return;
1212
	}
1213

1214
	if (st0_tag == TAG_Special)
1215
		st0_tag = FPU_Special(st0_ptr);
1216
	if (st1_tag == TAG_Special)
1217
		st1_tag = FPU_Special(st1_ptr);
1218

1219
	if (((st0_tag == TAG_Valid) && (st1_tag == TW_Denormal))
1220
	    || ((st0_tag == TW_Denormal) && (st1_tag == TAG_Valid))
1221
	    || ((st0_tag == TW_Denormal) && (st1_tag == TW_Denormal))) {
1222
		if (denormal_operand() < 0)
1223
			return;
1224

1225
		goto valid_atan;
1226
	} else if ((st0_tag == TAG_Empty) || (st1_tag == TAG_Empty)) {
1227
		FPU_stack_underflow_pop(1);
1228
		return;
1229
	} else if ((st0_tag == TW_NaN) || (st1_tag == TW_NaN)) {
1230
		if (real_2op_NaN(st0_ptr, st0_tag, 1, st0_ptr) >= 0)
1231
			FPU_pop();
1232
		return;
1233
	} else if ((st0_tag == TW_Infinity) || (st1_tag == TW_Infinity)) {
1234
		u_char sign = getsign(st1_ptr);
1235
		if (st0_tag == TW_Infinity) {
1236
			if (st1_tag == TW_Infinity) {
1237
				if (signpositive(st0_ptr)) {
1238
					FPU_copy_to_reg1(&CONST_PI4, TAG_Valid);
1239
				} else {
1240
					setpositive(st1_ptr);
1241
					tag =
1242
					    FPU_u_add(&CONST_PI4, &CONST_PI2,
1243
						      st1_ptr, FULL_PRECISION,
1244
						      SIGN_POS,
1245
						      exponent(&CONST_PI4),
1246
						      exponent(&CONST_PI2));
1247
					if (tag >= 0)
1248
						FPU_settagi(1, tag);
1249
				}
1250
			} else {
1251
				if ((st1_tag == TW_Denormal)
1252
				    && (denormal_operand() < 0))
1253
					return;
1254

1255
				if (signpositive(st0_ptr)) {
1256
					FPU_copy_to_reg1(&CONST_Z, TAG_Zero);
1257
					setsign(st1_ptr, sign);	/* An 80486 preserves the sign */
1258
					FPU_pop();
1259
					return;
1260
				} else {
1261
					FPU_copy_to_reg1(&CONST_PI, TAG_Valid);
1262
				}
1263
			}
1264
		} else {
1265
			/* st(1) is infinity, st(0) not infinity */
1266
			if ((st0_tag == TW_Denormal)
1267
			    && (denormal_operand() < 0))
1268
				return;
1269

1270
			FPU_copy_to_reg1(&CONST_PI2, TAG_Valid);
1271
		}
1272
		setsign(st1_ptr, sign);
1273
	} else if (st1_tag == TAG_Zero) {
1274
		/* st(0) must be valid or zero */
1275
		u_char sign = getsign(st1_ptr);
1276

1277
		if ((st0_tag == TW_Denormal) && (denormal_operand() < 0))
1278
			return;
1279

1280
		if (signpositive(st0_ptr)) {
1281
			/* An 80486 preserves the sign */
1282
			FPU_pop();
1283
			return;
1284
		}
1285

1286
		FPU_copy_to_reg1(&CONST_PI, TAG_Valid);
1287
		setsign(st1_ptr, sign);
1288
	} else if (st0_tag == TAG_Zero) {
1289
		/* st(1) must be TAG_Valid here */
1290
		u_char sign = getsign(st1_ptr);
1291

1292
		if ((st1_tag == TW_Denormal) && (denormal_operand() < 0))
1293
			return;
1294

1295
		FPU_copy_to_reg1(&CONST_PI2, TAG_Valid);
1296
		setsign(st1_ptr, sign);
1297
	}
1298
#ifdef PARANOID
1299
	else
1300
		EXCEPTION(EX_INTERNAL | 0x125);
1301
#endif /* PARANOID */
1302

1303
	FPU_pop();
1304
	set_precision_flag_up();	/* We do not really know if up or down */
1305
}
1306

1307
static void fprem(FPU_REG *st0_ptr, u_char st0_tag)
1308
{
1309
	do_fprem(st0_ptr, st0_tag, RC_CHOP);
1310
}
1311

1312
static void fprem1(FPU_REG *st0_ptr, u_char st0_tag)
1313
{
1314
	do_fprem(st0_ptr, st0_tag, RC_RND);
1315
}
1316

1317
static void fyl2xp1(FPU_REG *st0_ptr, u_char st0_tag)
1318
{
1319
	u_char sign, sign1;
1320
	FPU_REG *st1_ptr = &st(1), a, b;
1321
	u_char st1_tag = FPU_gettagi(1);
1322

1323
	clear_C1();
1324
	if (!((st0_tag ^ TAG_Valid) | (st1_tag ^ TAG_Valid))) {
1325
	      valid_yl2xp1:
1326

1327
		sign = getsign(st0_ptr);
1328
		sign1 = getsign(st1_ptr);
1329

1330
		FPU_to_exp16(st0_ptr, &a);
1331
		FPU_to_exp16(st1_ptr, &b);
1332

1333
		if (poly_l2p1(sign, sign1, &a, &b, st1_ptr))
1334
			return;
1335

1336
		FPU_pop();
1337
		return;
1338
	}
1339

1340
	if (st0_tag == TAG_Special)
1341
		st0_tag = FPU_Special(st0_ptr);
1342
	if (st1_tag == TAG_Special)
1343
		st1_tag = FPU_Special(st1_ptr);
1344

1345
	if (((st0_tag == TAG_Valid) && (st1_tag == TW_Denormal))
1346
	    || ((st0_tag == TW_Denormal) && (st1_tag == TAG_Valid))
1347
	    || ((st0_tag == TW_Denormal) && (st1_tag == TW_Denormal))) {
1348
		if (denormal_operand() < 0)
1349
			return;
1350

1351
		goto valid_yl2xp1;
1352
	} else if ((st0_tag == TAG_Empty) | (st1_tag == TAG_Empty)) {
1353
		FPU_stack_underflow_pop(1);
1354
		return;
1355
	} else if (st0_tag == TAG_Zero) {
1356
		switch (st1_tag) {
1357
		case TW_Denormal:
1358
			if (denormal_operand() < 0)
1359
				return;
1360
			fallthrough;
1361
		case TAG_Zero:
1362
		case TAG_Valid:
1363
			setsign(st0_ptr, getsign(st0_ptr) ^ getsign(st1_ptr));
1364
			FPU_copy_to_reg1(st0_ptr, st0_tag);
1365
			break;
1366

1367
		case TW_Infinity:
1368
			/* Infinity*log(1) */
1369
			if (arith_invalid(1) < 0)
1370
				return;
1371
			break;
1372

1373
		case TW_NaN:
1374
			if (real_2op_NaN(st0_ptr, st0_tag, 1, st0_ptr) < 0)
1375
				return;
1376
			break;
1377

1378
		default:
1379
#ifdef PARANOID
1380
			EXCEPTION(EX_INTERNAL | 0x116);
1381
			return;
1382
#endif /* PARANOID */
1383
			break;
1384
		}
1385
	} else if ((st0_tag == TAG_Valid) || (st0_tag == TW_Denormal)) {
1386
		switch (st1_tag) {
1387
		case TAG_Zero:
1388
			if (signnegative(st0_ptr)) {
1389
				if (exponent(st0_ptr) >= 0) {
1390
					/* st(0) holds <= -1.0 */
1391
#ifdef PECULIAR_486		/* Stupid 80486 doesn't worry about log(negative). */
1392
					changesign(st1_ptr);
1393
#else
1394
					if (arith_invalid(1) < 0)
1395
						return;
1396
#endif /* PECULIAR_486 */
1397
				} else if ((st0_tag == TW_Denormal)
1398
					   && (denormal_operand() < 0))
1399
					return;
1400
				else
1401
					changesign(st1_ptr);
1402
			} else if ((st0_tag == TW_Denormal)
1403
				   && (denormal_operand() < 0))
1404
				return;
1405
			break;
1406

1407
		case TW_Infinity:
1408
			if (signnegative(st0_ptr)) {
1409
				if ((exponent(st0_ptr) >= 0) &&
1410
				    !((st0_ptr->sigh == 0x80000000) &&
1411
				      (st0_ptr->sigl == 0))) {
1412
					/* st(0) holds < -1.0 */
1413
#ifdef PECULIAR_486		/* Stupid 80486 doesn't worry about log(negative). */
1414
					changesign(st1_ptr);
1415
#else
1416
					if (arith_invalid(1) < 0)
1417
						return;
1418
#endif /* PECULIAR_486 */
1419
				} else if ((st0_tag == TW_Denormal)
1420
					   && (denormal_operand() < 0))
1421
					return;
1422
				else
1423
					changesign(st1_ptr);
1424
			} else if ((st0_tag == TW_Denormal)
1425
				   && (denormal_operand() < 0))
1426
				return;
1427
			break;
1428

1429
		case TW_NaN:
1430
			if (real_2op_NaN(st0_ptr, st0_tag, 1, st0_ptr) < 0)
1431
				return;
1432
		}
1433

1434
	} else if (st0_tag == TW_NaN) {
1435
		if (real_2op_NaN(st0_ptr, st0_tag, 1, st0_ptr) < 0)
1436
			return;
1437
	} else if (st0_tag == TW_Infinity) {
1438
		if (st1_tag == TW_NaN) {
1439
			if (real_2op_NaN(st0_ptr, st0_tag, 1, st0_ptr) < 0)
1440
				return;
1441
		} else if (signnegative(st0_ptr)) {
1442
#ifndef PECULIAR_486
1443
			/* This should have higher priority than denormals, but... */
1444
			if (arith_invalid(1) < 0)	/* log(-infinity) */
1445
				return;
1446
#endif /* PECULIAR_486 */
1447
			if ((st1_tag == TW_Denormal)
1448
			    && (denormal_operand() < 0))
1449
				return;
1450
#ifdef PECULIAR_486
1451
			/* Denormal operands actually get higher priority */
1452
			if (arith_invalid(1) < 0)	/* log(-infinity) */
1453
				return;
1454
#endif /* PECULIAR_486 */
1455
		} else if (st1_tag == TAG_Zero) {
1456
			/* log(infinity) */
1457
			if (arith_invalid(1) < 0)
1458
				return;
1459
		}
1460

1461
		/* st(1) must be valid here. */
1462

1463
		else if ((st1_tag == TW_Denormal) && (denormal_operand() < 0))
1464
			return;
1465

1466
		/* The Manual says that log(Infinity) is invalid, but a real
1467
		   80486 sensibly says that it is o.k. */
1468
		else {
1469
			u_char sign = getsign(st1_ptr);
1470
			FPU_copy_to_reg1(&CONST_INF, TAG_Special);
1471
			setsign(st1_ptr, sign);
1472
		}
1473
	}
1474
#ifdef PARANOID
1475
	else {
1476
		EXCEPTION(EX_INTERNAL | 0x117);
1477
		return;
1478
	}
1479
#endif /* PARANOID */
1480

1481
	FPU_pop();
1482
	return;
1483

1484
}
1485

1486
static void fscale(FPU_REG *st0_ptr, u_char st0_tag)
1487
{
1488
	FPU_REG *st1_ptr = &st(1);
1489
	u_char st1_tag = FPU_gettagi(1);
1490
	int old_cw = control_word;
1491
	u_char sign = getsign(st0_ptr);
1492

1493
	clear_C1();
1494
	if (!((st0_tag ^ TAG_Valid) | (st1_tag ^ TAG_Valid))) {
1495
		long scale;
1496
		FPU_REG tmp;
1497

1498
		/* Convert register for internal use. */
1499
		setexponent16(st0_ptr, exponent(st0_ptr));
1500

1501
	      valid_scale:
1502

1503
		if (exponent(st1_ptr) > 30) {
1504
			/* 2^31 is far too large, would require 2^(2^30) or 2^(-2^30) */
1505

1506
			if (signpositive(st1_ptr)) {
1507
				EXCEPTION(EX_Overflow);
1508
				FPU_copy_to_reg0(&CONST_INF, TAG_Special);
1509
			} else {
1510
				EXCEPTION(EX_Underflow);
1511
				FPU_copy_to_reg0(&CONST_Z, TAG_Zero);
1512
			}
1513
			setsign(st0_ptr, sign);
1514
			return;
1515
		}
1516

1517
		control_word &= ~CW_RC;
1518
		control_word |= RC_CHOP;
1519
		reg_copy(st1_ptr, &tmp);
1520
		FPU_round_to_int(&tmp, st1_tag);	/* This can never overflow here */
1521
		control_word = old_cw;
1522
		scale = signnegative(st1_ptr) ? -tmp.sigl : tmp.sigl;
1523
		scale += exponent16(st0_ptr);
1524

1525
		setexponent16(st0_ptr, scale);
1526

1527
		/* Use FPU_round() to properly detect under/overflow etc */
1528
		FPU_round(st0_ptr, 0, 0, control_word, sign);
1529

1530
		return;
1531
	}
1532

1533
	if (st0_tag == TAG_Special)
1534
		st0_tag = FPU_Special(st0_ptr);
1535
	if (st1_tag == TAG_Special)
1536
		st1_tag = FPU_Special(st1_ptr);
1537

1538
	if ((st0_tag == TAG_Valid) || (st0_tag == TW_Denormal)) {
1539
		switch (st1_tag) {
1540
		case TAG_Valid:
1541
			/* st(0) must be a denormal */
1542
			if ((st0_tag == TW_Denormal)
1543
			    && (denormal_operand() < 0))
1544
				return;
1545

1546
			FPU_to_exp16(st0_ptr, st0_ptr);	/* Will not be left on stack */
1547
			goto valid_scale;
1548

1549
		case TAG_Zero:
1550
			if (st0_tag == TW_Denormal)
1551
				denormal_operand();
1552
			return;
1553

1554
		case TW_Denormal:
1555
			denormal_operand();
1556
			return;
1557

1558
		case TW_Infinity:
1559
			if ((st0_tag == TW_Denormal)
1560
			    && (denormal_operand() < 0))
1561
				return;
1562

1563
			if (signpositive(st1_ptr))
1564
				FPU_copy_to_reg0(&CONST_INF, TAG_Special);
1565
			else
1566
				FPU_copy_to_reg0(&CONST_Z, TAG_Zero);
1567
			setsign(st0_ptr, sign);
1568
			return;
1569

1570
		case TW_NaN:
1571
			real_2op_NaN(st1_ptr, st1_tag, 0, st0_ptr);
1572
			return;
1573
		}
1574
	} else if (st0_tag == TAG_Zero) {
1575
		switch (st1_tag) {
1576
		case TAG_Valid:
1577
		case TAG_Zero:
1578
			return;
1579

1580
		case TW_Denormal:
1581
			denormal_operand();
1582
			return;
1583

1584
		case TW_Infinity:
1585
			if (signpositive(st1_ptr))
1586
				arith_invalid(0);	/* Zero scaled by +Infinity */
1587
			return;
1588

1589
		case TW_NaN:
1590
			real_2op_NaN(st1_ptr, st1_tag, 0, st0_ptr);
1591
			return;
1592
		}
1593
	} else if (st0_tag == TW_Infinity) {
1594
		switch (st1_tag) {
1595
		case TAG_Valid:
1596
		case TAG_Zero:
1597
			return;
1598

1599
		case TW_Denormal:
1600
			denormal_operand();
1601
			return;
1602

1603
		case TW_Infinity:
1604
			if (signnegative(st1_ptr))
1605
				arith_invalid(0);	/* Infinity scaled by -Infinity */
1606
			return;
1607

1608
		case TW_NaN:
1609
			real_2op_NaN(st1_ptr, st1_tag, 0, st0_ptr);
1610
			return;
1611
		}
1612
	} else if (st0_tag == TW_NaN) {
1613
		if (st1_tag != TAG_Empty) {
1614
			real_2op_NaN(st1_ptr, st1_tag, 0, st0_ptr);
1615
			return;
1616
		}
1617
	}
1618
#ifdef PARANOID
1619
	if (!((st0_tag == TAG_Empty) || (st1_tag == TAG_Empty))) {
1620
		EXCEPTION(EX_INTERNAL | 0x115);
1621
		return;
1622
	}
1623
#endif
1624

1625
	/* At least one of st(0), st(1) must be empty */
1626
	FPU_stack_underflow();
1627

1628
}
1629

1630
/*---------------------------------------------------------------------------*/
1631

1632
static FUNC_ST0 const trig_table_a[] = {
1633
	f2xm1, fyl2x, fptan, fpatan,
1634
	fxtract, fprem1, fdecstp, fincstp,
1635
};
1636

1637
void FPU_triga(void)
1638
{
1639
	(trig_table_a[FPU_rm]) (&st(0), FPU_gettag0());
1640
}
1641

1642
static FUNC_ST0 const trig_table_b[] = {
1643
	fprem, fyl2xp1, fsqrt_, fsincos, frndint_, fscale, fsin, fcos
1644
};
1645

1646
void FPU_trigb(void)
1647
{
1648
	(trig_table_b[FPU_rm]) (&st(0), FPU_gettag0());
1649
}
1650

1651
Product

Resources

Company