CoCalc -- res

GitHub Repository: awilliam/linux-vfio
Path: blob/master/arch/m68k/fpsp040/res_func.S
¹⁰⁸¹⁷ views
1
|
2
|	res_func.sa 3.9 7/29/91
3
|
4
| Normalizes denormalized numbers if necessary and updates the
5
| stack frame.  The function is then restored back into the
6
| machine and the 040 completes the operation.  This routine
7
| is only used by the unsupported data type/format handler.
8
| (Exception vector 55).
9
|
10
| For packed move out (fmove.p fpm,<ea>) the operation is
11
| completed here; data is packed and moved to user memory.
12
| The stack is restored to the 040 only in the case of a
13
| reportable exception in the conversion.
14
|
15
|
16
|		Copyright (C) Motorola, Inc. 1990
17
|			All Rights Reserved
18
|
19
|       For details on the license for this file, please see the
20
|       file, README, in this same directory.
21

22
RES_FUNC:    |idnt    2,1 | Motorola 040 Floating Point Software Package
23

24
	|section	8
25

26
#include "fpsp.h"
27

28
| Exponent bound tables for single (sp_bnds) and double (dp_bnds)
| precision.  Neither table is referenced in this part of the file.
| The first word of each table equals the underflow threshold tested
| in cu_nmrs ($3f81) / cu_nmrd ($3c01); the second word is one less
| than the overflow threshold tested there ($407f / $43ff).
| NOTE(review): the meaning of the second row ($3f6a / $3bcd) is not
| visible here -- confirm against the code that reads these tables.
sp_bnds:	.short	0x3f81,0x407e
29
		.short	0x3f6a,0x0000
30
dp_bnds:	.short	0x3c01,0x43fe
31
		.short	0x3bcd,0x0000
32

33
	|xref	mem_write
34
	|xref	bindec
35
	|xref	get_fline
36
	|xref	round
37
	|xref	denorm
38
	|xref	dest_ext
39
	|xref	dest_dbl
40
	|xref	dest_sgl
41
	|xref	unf_sub
42
	|xref	nrm_set
43
	|xref	dnrm_lp
44
	|xref	ovf_res
45
	|xref	reg_dest
46
	|xref	t_ovfl
47
	|xref	t_unfl
48

49
	.global	res_func
50
	.global	p_move
51

52
|
| res_func: entry point.  Clears DNRM_FLG, RES_FLG and CU_ONLY.  For a
| dyadic instruction (DY_MO_FLG nonzero) whose destination tag marks a
| denorm (DTAG bit 7 set), the destination operand in FPTEMP is
| normalized with nrm_set, DTAG is rewritten and $0f is or-ed into
| DNRM_FLG.  Execution then falls into monadic, which examines the
| source operand.  All fields are addressed off a6.
|
res_func:
53
	clrb	DNRM_FLG(%a6)
54
	clrb	RES_FLG(%a6)
55
	clrb	CU_ONLY(%a6)
56
	tstb	DY_MO_FLG(%a6)
57
	beqs	monadic
58
dyadic:
59
	btstb	#7,DTAG(%a6)	|if dop = norm=000, zero=001,
60
|				;inf=010 or nan=011
61
	beqs	monadic		|then branch
62
|				;else denorm
63
| HANDLE DESTINATION DENORM HERE
64
|				;set dtag to norm
65
|				;write the tag & fpte15 to the fstack
66
	leal	FPTEMP(%a6),%a0
67

68
| Split the sign out of the exponent word before calling nrm_set:
| bclr sets Z from the old sign bit and sne stores $ff in LOCAL_SGN
| when that bit was set.
	bclrb	#sign_bit,LOCAL_EX(%a0)
69
	sne	LOCAL_SGN(%a0)
70

71
	bsr	nrm_set		|normalize number (exp will go negative)
72
	bclrb	#sign_bit,LOCAL_EX(%a0) |get rid of false sign
73
| bfclr sets Z from the old LOCAL_SGN byte, so beqs is taken for a
| positive operand; otherwise the sign bit is put back.
	bfclr	LOCAL_SGN(%a0){#0:#8}	|change back to IEEE ext format
74
	beqs	dpos
75
	bsetb	#sign_bit,LOCAL_EX(%a0)
76
dpos:
77
	bfclr	DTAG(%a6){#0:#4}	|set tag to normalized, FPTE15 = 0
78
	bsetb	#4,DTAG(%a6)	|set FPTE15
79
	orb	#0x0f,DNRM_FLG(%a6)	|record: destination was a denorm
80
|
| monadic: examine the source operand.  a0 is pointed at ETEMP and
| stays there for the cu_* code that follows.
|   - move out (direction bit set)         -> opclass3
|   - source tagged denorm (STAG bit 7)    -> mon_dnrm
|   - dyadic instruction                   -> normal
|   - command has bit 0 set (the fsqrt forms) -> normal
|   - anything else falls through into cu_norm
|
monadic:
81
	leal	ETEMP(%a6),%a0
82
	btstb	#direction_bit,CMDREG1B(%a6)	|check direction
83
	bne	opclass3			|it is a mv out
84
|
85
| At this point, only opclass 0 and 2 possible
86
|
87
	btstb	#7,STAG(%a6)	|if sop = norm=000, zero=001,
88
|				;inf=010 or nan=011
89
	bne	mon_dnrm	|else denorm
90
	tstb	DY_MO_FLG(%a6)	|all cases of dyadic instructions would
91
	bne	normal		|require normalization of denorm
92

93
| At this point:
94
|	monadic instructions:	fabs  = $18  fneg   = $1a  ftst   = $3a
95
|				fmove = $00  fsmove = $40  fdmove = $44
96
|				fsqrt = $05* fssqrt = $41  fdsqrt = $45
97
|				(*fsqrt reencoded to $05)
98
|
99
	movew	CMDREG1B(%a6),%d0	|get command register
100
	andil	#0x7f,%d0			|strip to only command word
101
|
102
| At this point, fabs, fneg, fmove, fsmove, fdmove, ftst, fsqrt,
103
| fssqrt, and fdsqrt are possible.
104
| For cases fabs, fneg, fmove, fsmove, fdmove and ftst fall into cu_norm
105
| For cases fsqrt, fssqrt, and fdsqrt (bit 0 set) goto normal
106
|
107
	btstl	#0,%d0
108
	bne	normal			|weed out fsqrt instructions
109
|
110
| cu_norm handles fmove in instructions with normalized inputs.
111
| The routine round is used to correctly round the input for the
112
| destination precision and mode.
113
|
114
| Dispatch for cu-only instructions whose source is not a denorm.
| Masking the command with $3b drops bits 2 and 6 (the forced
| double/single precision bits), so fmove, fsmove and fdmove all
| become 0.  Whatever is not fmove, fabs or fneg falls through into
| cu_ntst.
cu_norm:
115
	st	CU_ONLY(%a6)		|set cu-only inst flag
116
	movew	CMDREG1B(%a6),%d0
117
	andib	#0x3b,%d0		|isolate bits to select inst
118
	tstb	%d0
119
	beql	cu_nmove	|if zero, it is an fmove
120
	cmpib	#0x18,%d0
121
	beql	cu_nabs		|if $18, it is fabs
122
	cmpib	#0x1a,%d0
123
	beql	cu_nneg		|if $1a, it is fneg
124
|
125
| Inst is ftst.  Check the source operand and set the cc's accordingly.
126
| No write is done, so simply rts.
127
|
128
| ftst on the operand at a0: or-s the N, I, NAN or Z condition bits
| into USER_FPSR and returns.  The operand value itself is left alone
| except that LOCAL_SGN is written with the sign ($ff = negative).
cu_ntst:
129
	movew	LOCAL_EX(%a0),%d0
130
	bclrl	#15,%d0		|d0 = exponent only; Z = old sign bit clear
131
	sne	LOCAL_SGN(%a0)	|sne leaves the condition codes alone,
132
	beqs	cu_ntpo		|so this still tests the bclr result
133
	orl	#neg_mask,USER_FPSR(%a6) |set N
134
cu_ntpo:
135
	cmpiw	#0x7fff,%d0	|test for inf/nan
136
	bnes	cu_ntcz
137
	tstl	LOCAL_HI(%a0)	|max exponent: any mantissa bit means nan
138
	bnes	cu_ntn
139
	tstl	LOCAL_LO(%a0)
140
	bnes	cu_ntn
141
	orl	#inf_mask,USER_FPSR(%a6)
142
	rts
143
cu_ntn:
144
	orl	#nan_mask,USER_FPSR(%a6)
145
	movel	ETEMP_EX(%a6),FPTEMP_EX(%a6)	|set up fptemp sign for
146
|						;snan handler
147

148
	rts
149
cu_ntcz:
150
	tstl	LOCAL_HI(%a0)	|Z is set only when both mantissa longs
151
	bnel	cu_ntsx		|are zero; the exponent is not examined
152
	tstl	LOCAL_LO(%a0)
153
	bnel	cu_ntsx
154
	orl	#z_mask,USER_FPSR(%a6)
155
cu_ntsx:
156
	rts
157
|
158
| Inst is fabs.  Execute the absolute value function on the input.
159
| Branch to the fmove code.  If the operand is NaN, do nothing.
160
|
161
| fabs: clear the sign bit of the operand at a0, then let cu_nmove
| round and write it.  STAG bit 5 is set for the zero (001) and nan
| (011) tags; those operands are written unchanged via wr_etemp.
| NOTE(review): a zero operand therefore keeps its sign -- confirm
| this is intended.
cu_nabs:
162
	moveb	STAG(%a6),%d0
163
	btstl	#5,%d0			|test for NaN or zero
164
	bne	wr_etemp		|if either, simply write it
165
	bclrb	#7,LOCAL_EX(%a0)		|do abs
166
	bras	cu_nmove		|fmove code will finish
167
|
168
| Inst is fneg.  Execute the negate value function on the input.
169
| Fall through to the fmove code.  If the operand is NaN or zero, it is
| written unchanged.
170
|
171
| fneg: flip the sign bit of the operand at a0 and fall through into
| cu_nmove.  STAG bit 5 is set for the zero (001) and nan (011) tags;
| those operands are written unchanged via wr_etemp.
| NOTE(review): a zero operand therefore keeps its sign -- confirm
| this is intended.
cu_nneg:
172
	moveb	STAG(%a6),%d0
173
	btstl	#5,%d0			|test for NaN or zero
174
	bne	wr_etemp		|if either, simply write it
175
	bchgb	#7,LOCAL_EX(%a0)		|do neg
176
|
177
| Inst is fmove.  This code also handles all result writes.
178
| If bit 2 is set, round is forced to double.  If it is clear,
179
| and bit 6 is set, round is forced to single.  If both are clear,
180
| the round precision is found in the fpcr.  If the rounding precision
181
| is double or single, round the result before the write.
182
|
183
| fmove and common result path.  Operands whose tag is not norm are
| written as they are.  Bit 2 of the command byte selects forced
| double, bit 6 forced single; with neither set execution falls into
| cu_nmnr, which takes the precision from the fpcr.
cu_nmove:
184
	moveb	STAG(%a6),%d0
185
	andib	#0xe0,%d0			|isolate stag bits
186
	bne	wr_etemp		|if not norm, simply write it
187
	btstb	#2,CMDREG1B+1(%a6)	|check for rd
188
	bne	cu_nmrd
189
	btstb	#6,CMDREG1B+1(%a6)	|check for rs
190
	bne	cu_nmrs
191
|
192
| The move or operation is not with forced precision.  Test for
193
| nan or inf as the input; if so, simply write it to FPn.  Use the
194
| FPCR_MODE byte to get rounding on norms and zeros.
195
|
196
| No forced precision: use the top two bits of FPCR_MODE.
| 0 = extended (write as is), 1 = single, anything else falls
| through into the double path at cu_nmrd.
cu_nmnr:
197
	bfextu	FPCR_MODE(%a6){#0:#2},%d0
198
	tstb	%d0			|check for extended
199
	beq	cu_wrexn		|if so, just write result
200
	cmpib	#1,%d0			|check for single
201
	beq	cu_nmrs			|fall through to double
202
|
203
| The move is fdmove or round precision is double.
204
|
205
| Round the operand at a0 to double precision.
| Exponents at or below $3c01 go to cu_nunfl with d0 = 2.  Otherwise
| round is called with d0 = 0 (no guard/round/sticky) and
| d1 = precision 2 in the upper word, rounding mode in the lower.
| A rounded exponent of $43ff or more is an overflow.
cu_nmrd:
206
	movel	#2,%d0			|set up the size for denorm
207
	movew	LOCAL_EX(%a0),%d1		|compare exponent to double threshold
208
	andw	#0x7fff,%d1
209
	cmpw	#0x3c01,%d1
210
	bls	cu_nunfl
211
	bfextu	FPCR_MODE(%a6){#2:#2},%d1	|get rmode
212
	orl	#0x00020000,%d1		|or in rprec (double)
213
	clrl	%d0			|clear g,r,s for round
214
	bclrb	#sign_bit,LOCAL_EX(%a0)	|convert to internal format
215
	sne	LOCAL_SGN(%a0)
216
	bsrl	round
217
	bfclr	LOCAL_SGN(%a0){#0:#8}	|back to IEEE ext format; Z = was positive
218
	beqs	cu_nmrdc
219
	bsetb	#sign_bit,LOCAL_EX(%a0)
220
cu_nmrdc:
221
	movew	LOCAL_EX(%a0),%d1		|check for overflow
222
	andw	#0x7fff,%d1
223
	cmpw	#0x43ff,%d1
224
	bge	cu_novfl		|take care of overflow case
225
	bra	cu_wrexn
226
|
227
| The move is fsmove or round precision is single.
228
|
229
| Round the operand at a0 to single precision.
| Exponents at or below $3f81 go to cu_nunfl with d0 = 1.  Otherwise
| round is called with d0 = 0 (no guard/round/sticky) and
| d1 = precision 1 in the upper word, rounding mode in the lower.
| A rounded exponent of $407f or more falls through into cu_novfl.
cu_nmrs:
230
	movel	#1,%d0			|size for denorm (single)
231
	movew	LOCAL_EX(%a0),%d1	|compare exponent to single threshold
232
	andw	#0x7fff,%d1
233
	cmpw	#0x3f81,%d1
234
	bls	cu_nunfl
235
	bfextu	FPCR_MODE(%a6){#2:#2},%d1	|get rmode
236
	orl	#0x00010000,%d1		|or in rprec (single)
237
	clrl	%d0			|clear g,r,s for round
238
	bclrb	#sign_bit,LOCAL_EX(%a0)	|convert to internal format
239
	sne	LOCAL_SGN(%a0)
240
	bsrl	round
241
	bfclr	LOCAL_SGN(%a0){#0:#8}	|back to IEEE ext format; Z = was positive
242
	beqs	cu_nmrsc
243
	bsetb	#sign_bit,LOCAL_EX(%a0)
244
cu_nmrsc:
245
	movew	LOCAL_EX(%a0),%d1	|check for overflow
246
	andw	#0x7FFF,%d1
247
	cmpw	#0x407f,%d1
248
	blt	cu_wrexn
249
|
250
| The operand is above precision boundaries.  Use t_ovfl to
251
| generate the correct value.
252
|
253
| Overflow after rounding: call t_ovfl, then take the normal
| result-write path.
| NOTE(review): t_ovfl is external; what it leaves at a0 is not
| visible here.
cu_novfl:
254
	bsr	t_ovfl
255
	bra	cu_wrexn
256
|
257
| The operand is below precision boundaries.  Use denorm to
258
| generate the correct value.
259
|
260
| Underflow path: the exponent is at or below the destination
| threshold.  On entry d0 holds the size code set by the caller
| (1 = single, 2 = double).  denorm is called on the operand in
| internal format, then round is called with the rounding mode in the
| low word of d1 and the precision in the high word.
| NOTE(review): d0 is passed from denorm to round untouched;
| presumably denorm returns the guard/round/sticky bits there --
| confirm against denorm.
cu_nunfl:
261
	bclrb	#sign_bit,LOCAL_EX(%a0)	|convert to internal format
262
	sne	LOCAL_SGN(%a0)
263
	bsr	denorm
264
	bfclr	LOCAL_SGN(%a0){#0:#8}	|change back to IEEE ext format
265
	beqs	cu_nucont
266
	bsetb	#sign_bit,LOCAL_EX(%a0)
267
cu_nucont:
268
	bfextu	FPCR_MODE(%a6){#2:#2},%d1	|d1 low word = rmode
269
	btstb	#2,CMDREG1B+1(%a6)	|check for rd
270
	bne	inst_d
271
	btstb	#6,CMDREG1B+1(%a6)	|check for rs
272
	bne	inst_s
273
| Not forced: copy the fpcr precision (top two bits of FPCR_MODE)
| into the upper word of d1.
	swap	%d1
274
	moveb	FPCR_MODE(%a6),%d1
275
	lsrb	#6,%d1
276
	swap	%d1
277
	bra	inst_sd
278
inst_d:
279
	orl	#0x00020000,%d1		|forced double
280
	bra	inst_sd
281
inst_s:
282
	orl	#0x00010000,%d1		|forced single
283
inst_sd:
284
	bclrb	#sign_bit,LOCAL_EX(%a0)	|internal format again for round
285
	sne	LOCAL_SGN(%a0)
286
	bsrl	round
287
	bfclr	LOCAL_SGN(%a0){#0:#8}
288
	beqs	cu_nuflp
289
	bsetb	#sign_bit,LOCAL_EX(%a0)
290
| Post-processing of an underflowed result at a0: set AUNFL when the
| round was inexact, patch an all-zero mantissa according to the
| rounding mode, set Z and/or UNFL, then copy the three longs at a0
| into ETEMP and fall through into cu_wrexn.
cu_nuflp:
291
	btstb	#inex2_bit,FPSR_EXCEPT(%a6)
292
	beqs	cu_nuninx
293
	orl	#aunfl_mask,USER_FPSR(%a6) |if the round was inex, set AUNFL
294
cu_nuninx:
295
	tstl	LOCAL_HI(%a0)		|test for zero
296
	bnes	cu_nunzro
297
	tstl	LOCAL_LO(%a0)
298
	bnes	cu_nunzro
299
|
300
| The mantissa is zero from the denorm loop.  Check sign and rmode
301
| to see if rounding should have occurred which would leave the lsb.
302
|
303
	movel	USER_FPCR(%a6),%d0
304
	andil	#0x30,%d0		|isolate rmode
305
	cmpil	#0x20,%d0
306
	blts	cu_nzro		|rmode below $20: result stays zero
307
	bnes	cu_nrp		|rmode above $20: rp; equal falls into rm
308
cu_nrm:
309
	tstw	LOCAL_EX(%a0)	|rm: if positive, stays zero; if negative, set lsb
310
	bges	cu_nzro
311
	btstb	#7,FPCR_MODE(%a6) |check for double
312
	beqs	cu_nincs
313
	bras	cu_nincd
314
cu_nrp:
315
	tstw	LOCAL_EX(%a0)	|rp: if positive, set lsb; if negative, stays zero
316
	blts	cu_nzro
317
	btstb	#7,FPCR_MODE(%a6) |check for double
318
	beqs	cu_nincs
319
cu_nincd:
320
	orl	#0x800,LOCAL_LO(%a0) |inc for double
321
	bra	cu_nunzro
322
cu_nincs:
323
	orl	#0x100,LOCAL_HI(%a0) |inc for single
324
	bra	cu_nunzro
325
cu_nzro:
326
	orl	#z_mask,USER_FPSR(%a6)
327
| NOTE(review): by the tag table used elsewhere in this file
| (zero=001, inf=010 in the top three bits) the value $40 is the inf
| tag and zero would be $20.  The only visible route here is through
| cu_nmove, which has already required these bits to be 0, so the
| branch below looks unreachable either way -- confirm before changing.
	moveb	STAG(%a6),%d0
328
	andib	#0xe0,%d0
329
	cmpib	#0x40,%d0		|check if input was tagged zero
330
	beqs	cu_numv
331
cu_nunzro:
332
	orl	#unfl_mask,USER_FPSR(%a6) |set unfl
333
cu_numv:
334
	movel	(%a0),ETEMP(%a6)
335
	movel	4(%a0),ETEMP_HI(%a6)
336
	movel	8(%a0),ETEMP_LO(%a6)
337
|
338
| Write the result to memory, setting the fpsr cc bits.  NaN and Inf
339
| bypass cu_wrexn.
340
|
341
| Set the Z and N condition bits in USER_FPSR from the exponent word
| of the result at a0, then go to wr_etemp.  Only the exponent word is
| examined: $0000 and $8000 count as zero, and bit 15 gives the sign.
cu_wrexn:
342
	tstw	LOCAL_EX(%a0)		|test for zero
343
	beqs	cu_wrzero
344
	cmpw	#0x8000,LOCAL_EX(%a0)	|test for negative zero
345
	bnes	cu_wreon
346
cu_wrzero:
347
	orl	#z_mask,USER_FPSR(%a6)	|set Z bit
348
cu_wreon:
349
	tstw	LOCAL_EX(%a0)
350
	bpl	wr_etemp
351
	orl	#neg_mask,USER_FPSR(%a6)
352
	bra	wr_etemp
353

354
|
355
| HANDLE SOURCE DENORM HERE
356
|
357
|				;clear denorm stag to norm
358
|				;write the new tag & ete15 to the fstack
359
| Source operand is a denorm (a0 = ETEMP, set in monadic).
| Dyadic instructions and the fsqrt forms (command bit 0 set) go to
| nrm_src to be normalized; fmove, fabs, fneg and ftst are completed
| in software by cu_dnrm.
mon_dnrm:
360
|
361
| At this point, check for the cases in which normalizing the
362
| denorm produces incorrect results.
363
|
364
	tstb	DY_MO_FLG(%a6)	|all cases of dyadic instructions would
365
	bnes	nrm_src		|require normalization of denorm
366

367
| At this point:
368
|	monadic instructions:	fabs  = $18  fneg   = $1a  ftst   = $3a
369
|				fmove = $00  fsmove = $40  fdmove = $44
370
|				fsqrt = $05* fssqrt = $41  fdsqrt = $45
371
|				(*fsqrt reencoded to $05)
372
|
373
	movew	CMDREG1B(%a6),%d0	|get command register
374
	andil	#0x7f,%d0			|strip to only command word
375
|
376
| At this point, fabs, fneg, fmove, fsmove, fdmove, ftst, fsqrt,
377
| fssqrt, and fdsqrt are possible.
378
| For cases fabs, fneg, fmove, fsmove, fdmove and ftst goto cu_dnrm
379
| For cases fsqrt, fssqrt, and fdsqrt goto nrm_src (do normalize)
380
|
381
	btstl	#0,%d0
382
	bnes	nrm_src		|weed out fsqrt instructions
383
	st	CU_ONLY(%a6)	|set cu-only inst flag
384
	bra	cu_dnrm		|fmove, fabs, fneg, ftst
385
|				;cases go to cu_dnrm
386
| Normalize the denormalized source operand at a0 with nrm_set (the
| sign is held in LOCAL_SGN around the call), rewrite STAG and or
| $f0 into DNRM_FLG.  Falls through into normal.
nrm_src:
387
	bclrb	#sign_bit,LOCAL_EX(%a0)	|Z = old sign bit clear
388
	sne	LOCAL_SGN(%a0)		|$ff if the operand was negative
389
	bsr	nrm_set		|normalize number (exponent will go
390
|				; negative)
391
	bclrb	#sign_bit,LOCAL_EX(%a0) |get rid of false sign
392

393
	bfclr	LOCAL_SGN(%a0){#0:#8}	|change back to IEEE ext format
394
	beqs	spos
395
	bsetb	#sign_bit,LOCAL_EX(%a0)
396
spos:
397
	bfclr	STAG(%a6){#0:#4}	|set tag to normalized, ETE15 = 0
398
	bsetb	#4,STAG(%a6)	|set ETE15
399
	orb	#0xf0,DNRM_FLG(%a6)	|record: source was a denorm
400
| Common exit for instructions that are handed back to the 040.
| If either operand was a denorm (DNRM_FLG nonzero) the wrap-around
| check in ck_wrap runs first.  fix_stk patches the frame fields
| shown below, sets RES_FLG and returns to the caller of res_func.
normal:
401
	tstb	DNRM_FLG(%a6)	|check if any of the ops were denorms
402
	bne	ck_wrap		|if so, check if it is a potential
403
|				;wrap-around case
404
fix_stk:
405
	moveb	#0xfe,CU_SAVEPC(%a6)
406
	bclrb	#E1,E_BYTE(%a6)
407

408
	clrw	NMNEXC(%a6)
409

410
	st	RES_FLG(%a6)	|indicate that a restore is needed
411
	rts
412

413
|
414
| cu_dnrm handles all cu-only instructions (fmove, fabs, fneg, and
415
| ftst) completely in software without an frestore to the 040.
416
|
417
| Dispatch for cu-only instructions whose source is a denorm.
| Masking the command with $3b drops the forced-precision bits 2 and
| 6, so fmove, fsmove and fdmove all become 0.  Whatever is not fmove,
| fabs or fneg falls through into cu_dtst.
cu_dnrm:
418
	st	CU_ONLY(%a6)
419
	movew	CMDREG1B(%a6),%d0
420
	andib	#0x3b,%d0		|isolate bits to select inst
421
	tstb	%d0
422
	beql	cu_dmove	|if zero, it is an fmove
423
	cmpib	#0x18,%d0
424
	beql	cu_dabs		|if $18, it is fabs
425
	cmpib	#0x1a,%d0
426
	beql	cu_dneg		|if $1a, it is fneg
427
|
428
| Inst is ftst.  Check the source operand and set the cc's accordingly.
429
| No write is done, so simply rts.
430
|
431
| ftst on the operand at a0 (denorm-source variant of cu_ntst):
| or-s the N, I, NAN or Z condition bits into USER_FPSR and returns.
| LOCAL_SGN is written with the sign ($ff = negative).
cu_dtst:
432
	movew	LOCAL_EX(%a0),%d0
433
	bclrl	#15,%d0		|d0 = exponent only; Z = old sign bit clear
434
	sne	LOCAL_SGN(%a0)	|sne leaves the condition codes alone,
435
	beqs	cu_dtpo		|so this still tests the bclr result
436
	orl	#neg_mask,USER_FPSR(%a6) |set N
437
cu_dtpo:
438
	cmpiw	#0x7fff,%d0	|test for inf/nan
439
	bnes	cu_dtcz
440
	tstl	LOCAL_HI(%a0)	|max exponent: any mantissa bit means nan
441
	bnes	cu_dtn
442
	tstl	LOCAL_LO(%a0)
443
	bnes	cu_dtn
444
	orl	#inf_mask,USER_FPSR(%a6)
445
	rts
446
cu_dtn:
447
	orl	#nan_mask,USER_FPSR(%a6)
448
	movel	ETEMP_EX(%a6),FPTEMP_EX(%a6)	|set up fptemp sign for
449
|						;snan handler
450
	rts
451
cu_dtcz:
452
	tstl	LOCAL_HI(%a0)	|Z is set only when both mantissa longs
453
	bnel	cu_dtsx		|are zero
454
	tstl	LOCAL_LO(%a0)
455
	bnel	cu_dtsx
456
	orl	#z_mask,USER_FPSR(%a6)
457
cu_dtsx:
458
	rts
459
|
460
| Inst is fabs.  Execute the absolute value function on the input.
461
| Branch to the fmove code.
462
|
463
| fabs of a denorm source: clear the sign bit at a0 and continue in
| cu_dmove.
cu_dabs:
464
	bclrb	#7,LOCAL_EX(%a0)		|do abs
465
	bras	cu_dmove		|fmove code will finish
466
|
467
| Inst is fneg.  Execute the negate value function on the input.
468
| Fall through to the fmove code.
469
|
470
| fneg of a denorm source: flip the sign bit at a0 and fall through
| into cu_dmove.
cu_dneg:
471
	bchgb	#7,LOCAL_EX(%a0)		|do neg
472
|
473
| Inst is fmove.  This code also handles all result writes.
474
| If bit 2 is set, round is forced to double.  If it is clear,
475
| and bit 6 is set, round is forced to single.  If both are clear,
476
| the round precision is found in the fpcr.  If the rounding precision
477
| is double or single, the result is zero, and the mode is checked
478
| to determine if the lsb of the result should be set.
479
|
480
| fmove of a denorm source.  Bit 2 of the command byte selects forced
| double, bit 6 forced single; with neither set execution falls into
| cu_dmnr, which takes the precision from the fpcr.
cu_dmove:
481
	btstb	#2,CMDREG1B+1(%a6)	|check for rd
482
	bne	cu_dmrd
483
	btstb	#6,CMDREG1B+1(%a6)	|check for rs
484
	bne	cu_dmrs
485
|
486
| The move or operation is not with forced precision.  Use the
487
| FPCR_MODE byte to get rounding.
488
|
489
| No forced precision: use the top two bits of FPCR_MODE.
| 0 = extended (cu_wrexd), 1 = single, anything else falls through
| into the double path at cu_dmrd.
cu_dmnr:
490
	bfextu	FPCR_MODE(%a6){#0:#2},%d0
491
	tstb	%d0			|check for extended
492
	beq	cu_wrexd		|if so, just write result
493
	cmpib	#1,%d0			|check for single
494
	beq	cu_dmrs			|fall through to double
495
|
496
| The move is fdmove or round precision is double.  Result is zero.
497
| Check rmode for rp or rm and set lsb accordingly.
498
|
499
| Double precision, denorm source: pick one of the four canned
| results.  The lsb variant is used only when the rounding mode
| rounds away from zero for this sign (rmode 3 for a positive
| operand, rmode 2 for a negative one).
cu_dmrd:
500
	bfextu	FPCR_MODE(%a6){#2:#2},%d1	|get rmode
501
	tstw	LOCAL_EX(%a0)		|check sign
502
	blts	cu_dmdn
503
	cmpib	#3,%d1			|check for rp
504
	bne	cu_dpd			|load double pos zero
505
	bra	cu_dpdr			|load double pos zero w/lsb
506
cu_dmdn:
507
	cmpib	#2,%d1			|check for rm
508
	bne	cu_dnd			|load double neg zero
509
	bra	cu_dndr			|load double neg zero w/lsb
510
|
511
| The move is fsmove or round precision is single.  Result is zero.
512
| Check for rp or rm and set lsb accordingly.
513
|
514
| Single precision, denorm source: pick one of the four canned
| results.  The lsb variant is used only when the rounding mode
| rounds away from zero for this sign (rmode 3 for a positive
| operand, rmode 2 for a negative one).
cu_dmrs:
515
	bfextu	FPCR_MODE(%a6){#2:#2},%d1	|get rmode
516
	tstw	LOCAL_EX(%a0)		|check sign
517
	blts	cu_dmsn
518
	cmpib	#3,%d1			|check for rp
519
	bne	cu_spd			|load single pos zero
520
	bra	cu_spdr			|load single pos zero w/lsb
521
cu_dmsn:
522
	cmpib	#2,%d1			|check for rm
523
	bne	cu_snd			|load single neg zero
524
	bra	cu_sndr			|load single neg zero w/lsb
525
|
526
| The precision is extended, so the result in etemp is correct.
527
| Simply set unfl (not inex2 or aunfl) and write the result to
528
| the correct fp register.
529
| Extended precision, denorm source: set UNFL, set N when the
| exponent word at a0 is nonzero, and write the operand unchanged.
| NOTE(review): presumably the exponent field of a denorm is zero, so
| a nonzero word means only the sign bit is set -- confirm.
cu_wrexd:
530
	orl	#unfl_mask,USER_FPSR(%a6)
531
	tstw	LOCAL_EX(%a0)
532
	beq	wr_etemp
533
	orl	#neg_mask,USER_FPSR(%a6)
534
	bra	wr_etemp
535
|
536
| These routines write +/- zero in double format.  The routines
537
| cu_dpdr and cu_dndr set the double lsb.
538
|
539
| Canned double-precision underflow results, stored at a0.  Each
| routine stores exponent $3c01 (sign in bit 31 of the first long),
| a zero high mantissa, and either a zero low mantissa or only the
| double lsb ($800).  All of them or unfinx_mask into USER_FPSR,
| together with Z for the exact-zero forms and N for the negative
| forms, and leave through wr_etemp.
cu_dpd:					|+zero
	movel	#0x3c010000,LOCAL_EX(%a0)
	clrl	LOCAL_HI(%a0)
	clrl	LOCAL_LO(%a0)
	orl	#z_mask+unfinx_mask,USER_FPSR(%a6)
	bra	wr_etemp
cu_dpdr:				|+zero with lsb set
	movel	#0x3c010000,LOCAL_EX(%a0)
	clrl	LOCAL_HI(%a0)
	movel	#0x800,LOCAL_LO(%a0)
	orl	#unfinx_mask,USER_FPSR(%a6)
	bra	wr_etemp
cu_dnd:					|-zero
	movel	#0xbc010000,LOCAL_EX(%a0)
	clrl	LOCAL_HI(%a0)
	clrl	LOCAL_LO(%a0)
	orl	#z_mask+neg_mask+unfinx_mask,USER_FPSR(%a6)
	bra	wr_etemp
cu_dndr:				|-zero with lsb set
	movel	#0xbc010000,LOCAL_EX(%a0)
	clrl	LOCAL_HI(%a0)
	movel	#0x800,LOCAL_LO(%a0)
	orl	#neg_mask+unfinx_mask,USER_FPSR(%a6)
	bra	wr_etemp
567
|
568
| These routines write +/- zero in single format.  The routines
569
| cu_spdr and cu_sndr set the single lsb.
570
|
571
| Canned single-precision underflow results, stored at a0.  Each
| routine stores exponent $3f81 (sign in bit 31 of the first long),
| a zero low mantissa, and either a zero high mantissa or only the
| single lsb ($100).  All of them or unfinx_mask into USER_FPSR,
| together with Z for the exact-zero forms and N for the negative
| forms, and leave through wr_etemp.
cu_spd:					|+zero
	movel	#0x3f810000,LOCAL_EX(%a0)
	clrl	LOCAL_HI(%a0)
	clrl	LOCAL_LO(%a0)
	orl	#z_mask+unfinx_mask,USER_FPSR(%a6)
	bra	wr_etemp
cu_spdr:				|+zero with lsb set
	movel	#0x3f810000,LOCAL_EX(%a0)
	movel	#0x100,LOCAL_HI(%a0)
	clrl	LOCAL_LO(%a0)
	orl	#unfinx_mask,USER_FPSR(%a6)
	bra	wr_etemp
cu_snd:					|-zero
	movel	#0xbf810000,LOCAL_EX(%a0)
	clrl	LOCAL_HI(%a0)
	clrl	LOCAL_LO(%a0)
	orl	#z_mask+neg_mask+unfinx_mask,USER_FPSR(%a6)
	bra	wr_etemp
cu_sndr:				|-zero with lsb set
	movel	#0xbf810000,LOCAL_EX(%a0)
	movel	#0x100,LOCAL_HI(%a0)
	clrl	LOCAL_LO(%a0)
	orl	#neg_mask+unfinx_mask,USER_FPSR(%a6)
	bra	wr_etemp
599

600
|
601
| This code checks for 16-bit overflow conditions on dyadic
602
| operations which are not restorable into the floating-point
603
| unit and must be completed in software.  Basically, this
604
| condition exists with a very large norm and a denorm.  One
605
| of the operands must be denormalized to enter this code.
606
|
607
| Flags used:
608
|	DY_MO_FLG contains 0 for monadic op, $ff for dyadic
609
|	DNRM_FLG contains $00 for neither op denormalized
610
|	                  $0f for the destination op denormalized
611
|	                  $f0 for the source op denormalized
612
|	                  $ff for both ops denormalized
613
|
614
| The wrap-around condition occurs for add, sub, div, and cmp
615
| when
616
|
617
|	abs(dest_exp - src_exp) >= $8000
618
|
619
| and for mul when
620
|
621
|	(dest_exp + src_exp) < $0
622
|
623
| we must process the operation here if this case is true.
624
|
625
| The rts following the frcfpn routine is the exit from res_func
626
| for this condition.  The restore flag (RES_FLG) is left clear.
627
| No frestore is done unless an exception is to be reported.
628
|
629
| For fadd:
630
|	if(sign_of(dest) != sign_of(src))
631
|		replace exponent of src with $3fff (keep sign)
632
|		use fpu to perform dest+new_src (user's rmode and X)
633
|		clr sticky
634
|	else
635
|		set sticky
636
|	call round with user's precision and mode
637
|	move result to fpn and wbtemp
638
|
639
| For fsub:
640
|	if(sign_of(dest) == sign_of(src))
641
|		replace exponent of src with $3fff (keep sign)
642
|		use fpu to perform dest+new_src (user's rmode and X)
643
|		clr sticky
644
|	else
645
|		set sticky
646
|	call round with user's precision and mode
647
|	move result to fpn and wbtemp
648
|
649
| For fdiv/fsgldiv:
650
|	if(both operands are denorm)
651
|		restore_to_fpu;
652
|	if(dest is norm)
653
|		force_ovf;
654
|	else(dest is denorm)
655
|		force_unf:
656
|
657
| For fcmp:
658
|	if(dest is norm)
659
|		N = sign_of(dest);
660
|	else(dest is denorm)
661
|		N = sign_of(src);
662
|
663
| For fmul:
664
|	if(both operands are denorm)
665
|		force_unf;
666
|	if((dest_exp + src_exp) < 0)
667
|		force_unf:
668
|	else
669
|		restore_to_fpu;
670
|
671
| local equates:
672
	| Command codes as they appear after ck_wrap masks CMDREG1B
	| with $3b.  divcode is not compared anywhere in this part of
	| the file: ck_wrap reaches wrap_div by fall-through.
	.set	addcode,0x22
673
	.set	subcode,0x28
674
	.set	mulcode,0x23
675
	.set	divcode,0x20
676
	.set	cmpcode,0x38
677
|
| ck_wrap: entered from normal when DNRM_FLG is nonzero.
|
| A monadic instruction (DY_MO_FLG = 0; only the fsqrt forms get this
| far) has no wrap-around case and is handed back to the 040 through
| fix_stk.  Dyadic instructions are dispatched on the command bits to
| the check for their operation; anything that is not fadd, fsub,
| fmul or fcmp falls through into wrap_div.
|
| DY_MO_FLG must be tested here explicitly.  The only condition codes
| live on entry come from the tstb of DNRM_FLG in normal, and that
| result is always nonzero on this path, so a bare beq would never be
| taken and fsqrt would fall through into the fdiv code.
|
ck_wrap:
	tstb	DY_MO_FLG(%a6)	|0 = monadic, $ff = dyadic
	beq	fix_stk		|if zero, it is fsqrt
	movew	CMDREG1B(%a6),%d0
	andiw	#0x3b,%d0		|strip to command bits
	cmpiw	#addcode,%d0
	beq	wrap_add
	cmpiw	#subcode,%d0
	beq	wrap_sub
	cmpiw	#mulcode,%d0
	beq	wrap_mul
	cmpiw	#cmpcode,%d0
	beq	wrap_cmp
690
|
691
| Inst is fdiv.
692
|
693
| fdiv wrap check.  Both operands denorm: restore to the fpu.
| Destination denorm (DNRM_FLG = $0f): if the source is tagged zero,
| inf or nan, or the exponent difference is below $7fff, restore to
| the fpu; otherwise record the result sign in WBTEMP_SGN
| ($ff = negative) and go to force_unf.  Any other DNRM_FLG value is
| handled at div_srcd.
wrap_div:
694
	cmpb	#0xff,DNRM_FLG(%a6) |if both ops denorm,
695
	beq	fix_stk		 |restore to fpu
696
|
697
| One of the ops is denormalized.  Test for wrap condition
698
| and force the result.
699
|
700
	cmpb	#0x0f,DNRM_FLG(%a6) |check for dest denorm
701
	bnes	div_srcd
702
div_destd:
703
	bsrl	ckinf_ns
704
	bne	fix_stk
705
	bfextu	ETEMP_EX(%a6){#1:#15},%d0	|get src exp (always pos)
706
	bfexts	FPTEMP_EX(%a6){#1:#15},%d1	|get dest exp (always neg)
707
	subl	%d1,%d0			|subtract dest from src
708
| NOTE(review): the other wrap checks in this file compare against
| $8000; only this one uses $7fff -- confirm it is intentional.
	cmpl	#0x7fff,%d0
709
	blt	fix_stk			|if less, not wrap case
710
	clrb	WBTEMP_SGN(%a6)
711
	movew	ETEMP_EX(%a6),%d0		|find the sign of the result
712
	movew	FPTEMP_EX(%a6),%d1
713
	eorw	%d1,%d0			|bit 15 = signs differ
714
	andiw	#0x8000,%d0
715
	beq	force_unf
716
	st	WBTEMP_SGN(%a6)
717
	bra	force_unf
718

719
|
| ckinf_ns / ckinf_nd: classify the source (STAG) or destination
| (DTAG) operand tag for the wrap-around checks.
|
| Returns:  d0 = 0,  Z set     tag bits 6-5 are both clear
|           d0 = -1, Z clear   operand is tagged zero, inf or nan
|
| Callers test the result with bne directly after the bsr.
|
ckinf_ns:
	moveb	STAG(%a6),%d0		|source tag
	bras	ck_in_com
ckinf_nd:
	moveb	DTAG(%a6),%d0		|destination tag
ck_in_com:
	andib	#0x60,%d0		|keep tag bits 6-5
	bnes	nan_or_inf		|$20 = zero, $40 = inf, $60 = nan
	clrl	%d0			|none of those: check wrap case
	rts
nan_or_inf:
	moveql	#-1,%d0
	rts
738

739

740

741
| fdiv with a denormalized source.  If the destination is tagged
| zero, inf or nan, or the exponent difference is below $8000,
| restore to the fpu.  Otherwise record the result sign in WBTEMP_SGN
| ($ff = negative) and continue in force_ovf, which follows directly.
div_srcd:
742
	bsrl	ckinf_nd
743
	bne	fix_stk
744
	bfextu	FPTEMP_EX(%a6){#1:#15},%d0	|get dest exp (always pos)
745
	bfexts	ETEMP_EX(%a6){#1:#15},%d1	|get src exp (always neg)
746
	subl	%d1,%d0			|subtract src from dest
747
	cmpl	#0x8000,%d0
748
	blt	fix_stk			|if less, not wrap case
749
	clrb	WBTEMP_SGN(%a6)
750
	movew	ETEMP_EX(%a6),%d0		|find the sign of the result
751
	movew	FPTEMP_EX(%a6),%d1
752
	eorw	%d1,%d0			|bit 15 = signs differ
753
	andiw	#0x8000,%d0
754
	beqs	force_ovf
755
	st	WBTEMP_SGN(%a6)
756
|
757
| This code handles the case of the instruction resulting in
758
| an overflow condition.
759
|
760
| Forced overflow result.  Sets ovfl_inx_mask in USER_FPSR, points a0
| at WBTEMP and calls ovf_res with the rounding precision in d0:
| 1 or 2 when the instruction forces single or double (command bit 6
| set, bit 2 selecting double), otherwise the fpcr precision.  The
| sign saved in WBTEMP_SGN is then merged back into WBTEMP_EX and the
| routine leaves through frcfpn.
force_ovf:
761
	bclrb	#E1,E_BYTE(%a6)
762
	orl	#ovfl_inx_mask,USER_FPSR(%a6)
763
	clrw	NMNEXC(%a6)
764
	leal	WBTEMP(%a6),%a0		|point a0 to memory location
765
	movew	CMDREG1B(%a6),%d0
766
	btstl	#6,%d0			|test for forced precision
767
	beqs	frcovf_fpcr
768
	btstl	#2,%d0			|check for double
769
	bnes	frcovf_dbl
770
	movel	#0x1,%d0			|inst is forced single
771
	bras	frcovf_rnd
772
frcovf_dbl:
773
	movel	#0x2,%d0			|inst is forced double
774
	bras	frcovf_rnd
775
frcovf_fpcr:
776
	bfextu	FPCR_MODE(%a6){#0:#2},%d0	|inst not forced - use fpcr prec
777
frcovf_rnd:
778

779
| The 881/882 does not set inex2 for the following case, so the
780
| line is commented out to be compatible with 881/882
781
|	tst.b	%d0
782
|	beq.b	frcovf_x
783
|	or.l	#inex2_mask,USER_FPSR(%a6) ;if prec is s or d, set inex2
784

785
|frcovf_x:
786
	bsrl	ovf_res			|get correct result based on
787
|					;round precision/mode.  This
788
|					;sets FPSR_CC correctly
789
|					;returns in external format
790
	bfclr	WBTEMP_SGN(%a6){#0:#8}	|Z = saved sign was positive
791
	beq	frcfpn
792
	bsetb	#sign_bit,WBTEMP_EX(%a6)
793
	bra	frcfpn
794
|
795
| Inst is fadd.
796
|
797
| fadd wrap check.  Both operands denorm: restore to the fpu.
| Otherwise, if the other operand is tagged zero, inf or nan, or the
| exponent difference is below $8000, restore to the fpu as well.
| A true wrap case continues in add_wrap (add_srcd falls into it).
wrap_add:
798
	cmpb	#0xff,DNRM_FLG(%a6) |if both ops denorm,
799
	beq	fix_stk		 |restore to fpu
800
|
801
| One of the ops is denormalized.  Test for wrap condition
802
| and complete the instruction.
803
|
804
	cmpb	#0x0f,DNRM_FLG(%a6) |check for dest denorm
805
	bnes	add_srcd
806
add_destd:
807
	bsrl	ckinf_ns
808
	bne	fix_stk
809
	bfextu	ETEMP_EX(%a6){#1:#15},%d0	|get src exp (always pos)
810
	bfexts	FPTEMP_EX(%a6){#1:#15},%d1	|get dest exp (always neg)
811
	subl	%d1,%d0			|subtract dest from src
812
	cmpl	#0x8000,%d0
813
	blt	fix_stk			|if less, not wrap case
814
	bra	add_wrap
815
add_srcd:
816
	bsrl	ckinf_nd
817
	bne	fix_stk
818
	bfextu	FPTEMP_EX(%a6){#1:#15},%d0	|get dest exp (always pos)
819
	bfexts	ETEMP_EX(%a6){#1:#15},%d1	|get src exp (always neg)
820
	subl	%d1,%d0			|subtract src from dest
821
	cmpl	#0x8000,%d0
822
	blt	fix_stk			|if less, not wrap case
823
|
824
| Check the signs of the operands.  If they are unlike, the fpu
825
| can be used to add the norm and 1.0 with the sign of the
826
| denorm and it will correctly generate the result in extended
827
| precision.  We can then call round with no sticky and the result
828
| will be correct for the user's rounding mode and precision.  If
829
| the signs are the same, we call round with the sticky bit set
830
| and the result will be correct for the user's rounding mode and
831
| precision.
832
|
833
| fadd wrap case.  Like signs go to add_same.  For unlike signs the
| exponent of the denorm operand is replaced by $3fff (sign kept),
| the fpu adds the two operands under the rounding mode taken from
| USER_FPCR, and the extended result in WBTEMP is rounded by round to
| the precision and mode in USER_FPCR with no sticky bits.
| Both variants leave through frcfpnr.
add_wrap:
834
	movew	ETEMP_EX(%a6),%d0
835
	movew	FPTEMP_EX(%a6),%d1
836
	eorw	%d1,%d0			|bit 15 = signs differ
837
	andiw	#0x8000,%d0
838
	beq	add_same
839
|
840
| The signs are unlike.
841
|
842
	cmpb	#0x0f,DNRM_FLG(%a6) |is dest the denorm?
843
	bnes	add_u_srcd
844
	movew	FPTEMP_EX(%a6),%d0
845
	andiw	#0x8000,%d0
846
	orw	#0x3fff,%d0	|force the exponent to +/- 1
847
	movew	%d0,FPTEMP_EX(%a6) |in the denorm
848
	movel	USER_FPCR(%a6),%d0
849
	andil	#0x30,%d0	|d0 keeps rmode<<4 until the lsrl below
850
	fmovel	%d0,%fpcr		|set up users rmode and X
851
	fmovex	ETEMP(%a6),%fp0
852
	faddx	FPTEMP(%a6),%fp0
853
	leal	WBTEMP(%a6),%a0	|point a0 to wbtemp in frame
854
	fmovel	%fpsr,%d1
855
	orl	%d1,USER_FPSR(%a6) |capture cc's and inex from fadd
856
	fmovex	%fp0,WBTEMP(%a6)	|write result to memory
857
	lsrl	#4,%d0		|put rmode in lower 2 bits
858
	movel	USER_FPCR(%a6),%d1
859
	andil	#0xc0,%d1
860
	lsrl	#6,%d1		|put precision in upper word
861
	swap	%d1
862
	orl	%d0,%d1		|set up for round call
863
	clrl	%d0		|force sticky to zero
864
	bclrb	#sign_bit,WBTEMP_EX(%a6)
865
	sne	WBTEMP_SGN(%a6)	|use internal format for round
866
	bsrl	round		|round result to users rmode & prec
867
	bfclr	WBTEMP_SGN(%a6){#0:#8}	|convert back to IEEE ext format
868
	beq	frcfpnr
869
	bsetb	#sign_bit,WBTEMP_EX(%a6)
870
	bra	frcfpnr
871
add_u_srcd:
872
	movew	ETEMP_EX(%a6),%d0
873
	andiw	#0x8000,%d0
874
	orw	#0x3fff,%d0	|force the exponent to +/- 1
875
	movew	%d0,ETEMP_EX(%a6) |in the denorm
876
	movel	USER_FPCR(%a6),%d0
877
	andil	#0x30,%d0	|d0 keeps rmode<<4 until the lsrl below
878
	fmovel	%d0,%fpcr		|set up users rmode and X
879
	fmovex	ETEMP(%a6),%fp0
880
	faddx	FPTEMP(%a6),%fp0
881
	fmovel	%fpsr,%d1
882
	orl	%d1,USER_FPSR(%a6) |capture cc's and inex from fadd
883
	leal	WBTEMP(%a6),%a0	|point a0 to wbtemp in frame
884
	fmovex	%fp0,WBTEMP(%a6)	|write result to memory
885
	lsrl	#4,%d0		|put rmode in lower 2 bits
886
	movel	USER_FPCR(%a6),%d1
887
	andil	#0xc0,%d1
888
	lsrl	#6,%d1		|put precision in upper word
889
	swap	%d1
890
	orl	%d0,%d1		|set up for round call
891
	clrl	%d0		|force sticky to zero
892
	bclrb	#sign_bit,WBTEMP_EX(%a6)
893
	sne	WBTEMP_SGN(%a6)	|use internal format for round
894
	bsrl	round		|round result to users rmode & prec
895
	bfclr	WBTEMP_SGN(%a6){#0:#8}	|convert back to IEEE ext format
896
	beq	frcfpnr
897
	bsetb	#sign_bit,WBTEMP_EX(%a6)
898
	bra	frcfpnr
899
|
900
| Signs are alike:
901
|
902
| fadd wrap case with like signs.  The operand that is not the denorm
| (ETEMP when the destination is the denorm, FPTEMP otherwise) is
| rounded in place by round with the sticky bit set, using the
| precision and mode from USER_FPCR, then copied to WBTEMP.  N is set
| unless the exponent word tests greater than zero.  add_ckovf then
| checks whether rounding pushed the exponent to $7fff.
add_same:
903
	cmpb	#0x0f,DNRM_FLG(%a6) |is dest the denorm?
904
	bnes	add_s_srcd
905
add_s_destd:
906
	leal	ETEMP(%a6),%a0
907
	movel	USER_FPCR(%a6),%d0
908
	andil	#0x30,%d0
909
	lsrl	#4,%d0		|put rmode in lower 2 bits
910
	movel	USER_FPCR(%a6),%d1
911
	andil	#0xc0,%d1
912
	lsrl	#6,%d1		|put precision in upper word
913
	swap	%d1
914
	orl	%d0,%d1		|set up for round call
915
	movel	#0x20000000,%d0	|set sticky for round
916
	bclrb	#sign_bit,ETEMP_EX(%a6)
917
	sne	ETEMP_SGN(%a6)	|use internal format for round
918
	bsrl	round		|round result to users rmode & prec
919
	bfclr	ETEMP_SGN(%a6){#0:#8}	|convert back to IEEE ext format
920
	beqs	add_s_dclr
921
	bsetb	#sign_bit,ETEMP_EX(%a6)
922
add_s_dclr:
923
	leal	WBTEMP(%a6),%a0
924
	movel	ETEMP(%a6),(%a0)	|write result to wbtemp
925
	movel	ETEMP_HI(%a6),4(%a0)
926
	movel	ETEMP_LO(%a6),8(%a0)
927
	tstw	ETEMP_EX(%a6)
928
	bgt	add_ckovf
929
	orl	#neg_mask,USER_FPSR(%a6)
930
	bra	add_ckovf
931
add_s_srcd:
932
	leal	FPTEMP(%a6),%a0
933
	movel	USER_FPCR(%a6),%d0
934
	andil	#0x30,%d0
935
	lsrl	#4,%d0		|put rmode in lower 2 bits
936
	movel	USER_FPCR(%a6),%d1
937
	andil	#0xc0,%d1
938
	lsrl	#6,%d1		|put precision in upper word
939
	swap	%d1
940
	orl	%d0,%d1		|set up for round call
941
	movel	#0x20000000,%d0	|set sticky for round
942
	bclrb	#sign_bit,FPTEMP_EX(%a6)
943
	sne	FPTEMP_SGN(%a6)	|use internal format for round
944
	bsrl	round		|round result to users rmode & prec
945
	bfclr	FPTEMP_SGN(%a6){#0:#8}	|convert back to IEEE ext format
946
	beqs	add_s_sclr
947
	bsetb	#sign_bit,FPTEMP_EX(%a6)
948
add_s_sclr:
949
	leal	WBTEMP(%a6),%a0
950
	movel	FPTEMP(%a6),(%a0)	|write result to wbtemp
951
	movel	FPTEMP_HI(%a6),4(%a0)
952
	movel	FPTEMP_LO(%a6),8(%a0)
953
	tstw	FPTEMP_EX(%a6)
954
	bgt	add_ckovf
955
	orl	#neg_mask,USER_FPSR(%a6)
956
add_ckovf:
957
	movew	WBTEMP_EX(%a6),%d0
958
	andiw	#0x7fff,%d0
959
	cmpiw	#0x7fff,%d0
960
	bne	frcfpnr
961
|
962
| The result has overflowed to $7fff exponent.  Set I, ovfl,
963
| and aovfl, and clr the mantissa (incorrectly set by the
964
| round routine.)
965
|
966
	orl	#inf_mask+ovfl_inx_mask,USER_FPSR(%a6)
967
| Only the long at offset 4 (high mantissa) is cleared here.
| NOTE(review): the low mantissa long at offset 8 is left as round
| wrote it -- presumably already zero in this case; confirm.
	clrl	4(%a0)
968
	bra	frcfpnr
969
|
970
| Inst is fsub.
971
|
972
| fsub wrap check.  Both operands denorm: restore to the fpu.
| Otherwise, if the other operand is tagged zero, inf or nan, or the
| exponent difference is below $8000, restore to the fpu as well.
| A true wrap case continues in sub_wrap (sub_srcd falls into it).
wrap_sub:
973
	cmpb	#0xff,DNRM_FLG(%a6) |if both ops denorm,
974
	beq	fix_stk		 |restore to fpu
975
|
976
| One of the ops is denormalized.  Test for wrap condition
977
| and complete the instruction.
978
|
979
	cmpb	#0x0f,DNRM_FLG(%a6) |check for dest denorm
980
	bnes	sub_srcd
981
sub_destd:
982
	bsrl	ckinf_ns
983
	bne	fix_stk
984
	bfextu	ETEMP_EX(%a6){#1:#15},%d0	|get src exp (always pos)
985
	bfexts	FPTEMP_EX(%a6){#1:#15},%d1	|get dest exp (always neg)
986
	subl	%d1,%d0			|subtract dest from src
987
	cmpl	#0x8000,%d0
988
	blt	fix_stk			|if less, not wrap case
989
	bra	sub_wrap
990
sub_srcd:
991
	bsrl	ckinf_nd
992
	bne	fix_stk
993
	bfextu	FPTEMP_EX(%a6){#1:#15},%d0	|get dest exp (always pos)
994
	bfexts	ETEMP_EX(%a6){#1:#15},%d1	|get src exp (always neg)
995
	subl	%d1,%d0			|subtract src from dest
996
	cmpl	#0x8000,%d0
997
	blt	fix_stk			|if less, not wrap case
998
|
999
| Check the signs of the operands.  If they are alike, the fpu
1000
| can be used to subtract from the norm 1.0 with the sign of the
1001
| denorm and it will correctly generate the result in extended
1002
| precision.  We can then call round with no sticky and the result
1003
| will be correct for the user's rounding mode and precision.  If
1004
| the signs are unlike, we call round with the sticky bit set
1005
| and the result will be correct for the user's rounding mode and
1006
| precision.
1007
|
1008
| fsub wrap case.  Unlike signs go to sub_diff.  For like signs the
| exponent of the denorm operand is replaced by $3fff (sign kept),
| the fpu computes FPTEMP - ETEMP under the rounding mode taken from
| USER_FPCR, and the extended result in WBTEMP is rounded by round to
| the precision and mode in USER_FPCR with no sticky bits.
| Both variants leave through frcfpnr.
sub_wrap:
1009
	movew	ETEMP_EX(%a6),%d0
1010
	movew	FPTEMP_EX(%a6),%d1
1011
	eorw	%d1,%d0			|bit 15 = signs differ
1012
	andiw	#0x8000,%d0
1013
	bne	sub_diff
1014
|
1015
| The signs are alike.
1016
|
1017
	cmpb	#0x0f,DNRM_FLG(%a6) |is dest the denorm?
1018
	bnes	sub_u_srcd
1019
	movew	FPTEMP_EX(%a6),%d0
1020
	andiw	#0x8000,%d0
1021
	orw	#0x3fff,%d0	|force the exponent to +/- 1
1022
	movew	%d0,FPTEMP_EX(%a6) |in the denorm
1023
	movel	USER_FPCR(%a6),%d0
1024
	andil	#0x30,%d0	|d0 keeps rmode<<4 until the lsrl below
1025
	fmovel	%d0,%fpcr		|set up users rmode and X
1026
	fmovex	FPTEMP(%a6),%fp0
1027
	fsubx	ETEMP(%a6),%fp0
1028
	fmovel	%fpsr,%d1
1029
	orl	%d1,USER_FPSR(%a6) |capture cc's and inex from fsub
1030
	leal	WBTEMP(%a6),%a0	|point a0 to wbtemp in frame
1031
	fmovex	%fp0,WBTEMP(%a6)	|write result to memory
1032
	lsrl	#4,%d0		|put rmode in lower 2 bits
1033
	movel	USER_FPCR(%a6),%d1
1034
	andil	#0xc0,%d1
1035
	lsrl	#6,%d1		|put precision in upper word
1036
	swap	%d1
1037
	orl	%d0,%d1		|set up for round call
1038
	clrl	%d0		|force sticky to zero
1039
	bclrb	#sign_bit,WBTEMP_EX(%a6)
1040
	sne	WBTEMP_SGN(%a6)	|use internal format for round
1041
	bsrl	round		|round result to users rmode & prec
1042
	bfclr	WBTEMP_SGN(%a6){#0:#8}	|convert back to IEEE ext format
1043
	beq	frcfpnr
1044
	bsetb	#sign_bit,WBTEMP_EX(%a6)
1045
	bra	frcfpnr
1046
sub_u_srcd:
1047
	movew	ETEMP_EX(%a6),%d0
1048
	andiw	#0x8000,%d0
1049
	orw	#0x3fff,%d0	|force the exponent to +/- 1
1050
	movew	%d0,ETEMP_EX(%a6) |in the denorm
1051
	movel	USER_FPCR(%a6),%d0
1052
	andil	#0x30,%d0	|d0 keeps rmode<<4 until the lsrl below
1053
	fmovel	%d0,%fpcr		|set up users rmode and X
1054
	fmovex	FPTEMP(%a6),%fp0
1055
	fsubx	ETEMP(%a6),%fp0
1056
	fmovel	%fpsr,%d1
1057
	orl	%d1,USER_FPSR(%a6) |capture cc's and inex from fsub
1058
	leal	WBTEMP(%a6),%a0	|point a0 to wbtemp in frame
1059
	fmovex	%fp0,WBTEMP(%a6)	|write result to memory
1060
	lsrl	#4,%d0		|put rmode in lower 2 bits
1061
	movel	USER_FPCR(%a6),%d1
1062
	andil	#0xc0,%d1
1063
	lsrl	#6,%d1		|put precision in upper word
1064
	swap	%d1
1065
	orl	%d0,%d1		|set up for round call
1066
	clrl	%d0		|force sticky to zero
1067
	bclrb	#sign_bit,WBTEMP_EX(%a6)
1068
	sne	WBTEMP_SGN(%a6)	|use internal format for round
1069
	bsrl	round		|round result to users rmode & prec
1070
	bfclr	WBTEMP_SGN(%a6){#0:#8}	|convert back to IEEE ext format
1071
	beq	frcfpnr
1072
	bsetb	#sign_bit,WBTEMP_EX(%a6)
1073
	bra	frcfpnr
1074
|
| Signs are unlike:
|
| The norm operand is rounded in place with the sticky bit set, copied
| to WBTEMP, and checked for overflow at sub_ckovf.
|
sub_diff:
	cmpb	#0x0f,DNRM_FLG(%a6) |is dest the denorm?
	bnes	sub_s_srcd
sub_s_destd:
	leal	ETEMP(%a6),%a0
	movel	USER_FPCR(%a6),%d0
	andil	#0x30,%d0
	lsrl	#4,%d0		|put rmode in lower 2 bits
	movel	USER_FPCR(%a6),%d1
	andil	#0xc0,%d1
	lsrl	#6,%d1		|put precision in upper word
	swap	%d1
	orl	%d0,%d1		|set up for round call
	movel	#0x20000000,%d0	|set sticky for round
|
| Since the dest is the denorm, the sign is the opposite of the
| norm sign.
|
	eoriw	#0x8000,ETEMP_EX(%a6)	|flip sign on result
	tstw	ETEMP_EX(%a6)
	bgts	sub_s_dwr
	orl	#neg_mask,USER_FPSR(%a6)
sub_s_dwr:
	bclrb	#sign_bit,ETEMP_EX(%a6)
	sne	ETEMP_SGN(%a6)
	bsrl	round		|round result to users rmode & prec
	bfclr	ETEMP_SGN(%a6){#0:#8}	|convert back to IEEE ext format
	beqs	sub_s_dclr
	bsetb	#sign_bit,ETEMP_EX(%a6)
sub_s_dclr:
	leal	WBTEMP(%a6),%a0
	movel	ETEMP(%a6),(%a0)	|write result to wbtemp
	movel	ETEMP_HI(%a6),4(%a0)
	movel	ETEMP_LO(%a6),8(%a0)
	bra	sub_ckovf
sub_s_srcd:
	leal	FPTEMP(%a6),%a0
	movel	USER_FPCR(%a6),%d0
	andil	#0x30,%d0
	lsrl	#4,%d0		|put rmode in lower 2 bits
	movel	USER_FPCR(%a6),%d1
	andil	#0xc0,%d1
	lsrl	#6,%d1		|put precision in upper word
	swap	%d1
	orl	%d0,%d1		|set up for round call
	movel	#0x20000000,%d0	|set sticky for round
	bclrb	#sign_bit,FPTEMP_EX(%a6)
	sne	FPTEMP_SGN(%a6)
	bsrl	round		|round result to users rmode & prec
	bfclr	FPTEMP_SGN(%a6){#0:#8}	|convert back to IEEE ext format
	beqs	sub_s_sclr
	bsetb	#sign_bit,FPTEMP_EX(%a6)
sub_s_sclr:
	leal	WBTEMP(%a6),%a0
	movel	FPTEMP(%a6),(%a0)	|write result to wbtemp
	movel	FPTEMP_HI(%a6),4(%a0)
	movel	FPTEMP_LO(%a6),8(%a0)
	tstw	FPTEMP_EX(%a6)
	bgt	sub_ckovf
	orl	#neg_mask,USER_FPSR(%a6)
sub_ckovf:
	movew	WBTEMP_EX(%a6),%d0
	andiw	#0x7fff,%d0
	cmpiw	#0x7fff,%d0
	bne	frcfpnr
|
| The result has overflowed to $7fff exponent.  Set I, ovfl,
| and aovfl, and clr the mantissa (incorrectly set by the
| round routine.)  a0 points at WBTEMP on both paths into here;
| only the high mantissa longword at 4(a0) is cleared.
|
	orl	#inf_mask+ovfl_inx_mask,USER_FPSR(%a6)
	clrl	4(%a0)
	bra	frcfpnr
|
| Inst is fcmp.
|
| If both operands are denorms the frame goes to fix_stk.  With one
| denorm, a not-equal return from ckinf_ns/ckinf_nd or an exponent
| distance below 0x8000 also goes to fix_stk.  Otherwise the compare is
| completed here: the only visible effect is that N may be set in
| USER_FPSR before returning.
|
wrap_cmp:
	cmpb	#0xff,DNRM_FLG(%a6) |if both ops denorm,
	beq	fix_stk		 |restore to fpu
|
| One of the ops is denormalized.  Test for wrap condition
| and complete the instruction.
|
	cmpb	#0x0f,DNRM_FLG(%a6) |check for dest denorm
	bnes	cmp_srcd
cmp_destd:
	bsrl	ckinf_ns
	bne	fix_stk
	bfextu	ETEMP_EX(%a6){#1:#15},%d0	|get src exp (always pos)
	bfexts	FPTEMP_EX(%a6){#1:#15},%d1	|get dest exp (always neg)
	subl	%d1,%d0			|subtract dest from src
	cmpl	#0x8000,%d0
	blt	fix_stk			|if less, not wrap case
	tstw	ETEMP_EX(%a6)		|set N to ~sign_of(src)
	bge	cmp_setn
	rts
cmp_srcd:
	bsrl	ckinf_nd
	bne	fix_stk
	bfextu	FPTEMP_EX(%a6){#1:#15},%d0	|get dest exp (always pos)
	bfexts	ETEMP_EX(%a6){#1:#15},%d1	|get src exp (always neg)
	subl	%d1,%d0			|subtract src from dest
	cmpl	#0x8000,%d0
	blt	fix_stk			|if less, not wrap case
	tstw	FPTEMP_EX(%a6)		|set N to sign_of(dest)
	blt	cmp_setn
	rts
cmp_setn:
	orl	#neg_mask,USER_FPSR(%a6)
	rts

1188
|
| Inst is fmul.
|
| The two exponent fields are summed (the denorm's is sign-extended
| and negative).  A positive sum goes to fix_stk; otherwise an
| underflow is forced.  mul_srcd reaches force_unf by falling through,
| so force_unf must directly follow this block.
|
wrap_mul:
	cmpb	#0xff,DNRM_FLG(%a6) |if both ops denorm,
	beq	force_unf	|force an underflow (really!)
|
| One of the ops is denormalized.  Test for wrap condition
| and complete the instruction.
|
	cmpb	#0x0f,DNRM_FLG(%a6) |check for dest denorm
	bnes	mul_srcd
mul_destd:
	bsrl	ckinf_ns
	bne	fix_stk
	bfextu	ETEMP_EX(%a6){#1:#15},%d0	|get src exp (always pos)
	bfexts	FPTEMP_EX(%a6){#1:#15},%d1	|get dest exp (always neg)
	addl	%d1,%d0			|d0 = src exp + dest exp
	bgt	fix_stk
	bra	force_unf
mul_srcd:
	bsrl	ckinf_nd
	bne	fix_stk
	bfextu	FPTEMP_EX(%a6){#1:#15},%d0	|get dest exp (always pos)
	bfexts	ETEMP_EX(%a6){#1:#15},%d1	|get src exp (always neg)
	addl	%d1,%d0			|d0 = dest exp + src exp
	bgt	fix_stk
|				;sum <= 0: fall through to force_unf

1216
|
| This code handles the case of the instruction resulting in
| an underflow condition.
|
| The result sign is the exclusive-or of the two operand signs and is
| kept in WBTEMP_SGN for unf_sub.  d0 carries the rounding precision
| into unf_sub: 1 = forced single, 2 = forced double, otherwise the
| two precision bits taken from FPCR_MODE.  Exits to frcfpn.
|
force_unf:
	bclrb	#E1,E_BYTE(%a6)
	orl	#unfinx_mask,USER_FPSR(%a6)
	clrw	NMNEXC(%a6)
	clrb	WBTEMP_SGN(%a6)
	movew	ETEMP_EX(%a6),%d0		|find the sign of the result
	movew	FPTEMP_EX(%a6),%d1
	eorw	%d1,%d0
	andiw	#0x8000,%d0
	beqs	frcunfcont
	st	WBTEMP_SGN(%a6)
frcunfcont:
	lea	WBTEMP(%a6),%a0		|point a0 to memory location
	movew	CMDREG1B(%a6),%d0
	btstl	#6,%d0			|test for forced precision
	beqs	frcunf_fpcr
	btstl	#2,%d0			|check for double
	bnes	frcunf_dbl
	movel	#0x1,%d0			|inst is forced single
	bras	frcunf_rnd
frcunf_dbl:
	movel	#0x2,%d0			|inst is forced double
	bras	frcunf_rnd
frcunf_fpcr:
	bfextu	FPCR_MODE(%a6){#0:#2},%d0	|inst not forced - use fpcr prec
frcunf_rnd:
	bsrl	unf_sub			|get correct result based on
|					;round precision/mode.  This
|					;sets FPSR_CC correctly
	bfclr	WBTEMP_SGN(%a6){#0:#8}	|convert back to IEEE ext format
	beqs	frcfpn
	bsetb	#sign_bit,WBTEMP_EX(%a6)
	bra	frcfpn

1254
|
| Write the result to the user's fpn.  All results must be HUGE to be
| written; otherwise the results would have overflowed or underflowed.
| If the rounding precision is single or double, the ovf_res routine
| is needed to correctly supply the max value.
|
| With extended precision taken from the FPCR, the value already in
| WBTEMP is written unchanged (branch to frcfpn).  Otherwise ovf_res is
| called with the precision in d0, ovfinx_mask is ORed into USER_FPSR,
| and execution falls through into frcfpn.
|
frcfpnr:
	movew	CMDREG1B(%a6),%d0
	btstl	#6,%d0			|test for forced precision
	beqs	frcfpn_fpcr
	btstl	#2,%d0			|check for double
	bnes	frcfpn_dbl
	movel	#0x1,%d0			|inst is forced single
	bras	frcfpn_rnd
frcfpn_dbl:
	movel	#0x2,%d0			|inst is forced double
	bras	frcfpn_rnd
frcfpn_fpcr:
	bfextu	FPCR_MODE(%a6){#0:#2},%d0	|inst not forced - use fpcr prec
	tstb	%d0
	beqs	frcfpn			|if extended, write what you got
frcfpn_rnd:
	bclrb	#sign_bit,WBTEMP_EX(%a6)
	sne	WBTEMP_SGN(%a6)
	bsrl	ovf_res			|get correct result based on
|					;round precision/mode.  This
|					;sets FPSR_CC correctly
	bfclr	WBTEMP_SGN(%a6){#0:#8}	|convert back to IEEE ext format
	beqs	frcfpn_clr
	bsetb	#sign_bit,WBTEMP_EX(%a6)
frcfpn_clr:
	orl	#ovfinx_mask,USER_FPSR(%a6)
|
| Perform the write.
|
| The destination register number is the 3-bit field at bit offset 6
| of CMDREG1B.  For fp0-fp3 the three longwords of WBTEMP are copied
| into the matching USER_FPn slot in the frame.  For fp4-fp7 the value
| is loaded with fmovemx using a dynamic register list in d0, built by
| setting bit (7 - register number).
|
frcfpn:
	bfextu	CMDREG1B(%a6){#6:#3},%d0	|extract fp destination register
	cmpib	#3,%d0
	bles	frc0123			|check if dest is fp0-fp3
	movel	#7,%d1
	subl	%d0,%d1
	clrl	%d0
	bsetl	%d1,%d0
	fmovemx WBTEMP(%a6),%d0
	rts
frc0123:
	cmpib	#0,%d0
	beqs	frc0_dst
	cmpib	#1,%d0
	beqs	frc1_dst
	cmpib	#2,%d0
	beqs	frc2_dst
frc3_dst:
	movel	WBTEMP_EX(%a6),USER_FP3(%a6)
	movel	WBTEMP_HI(%a6),USER_FP3+4(%a6)
	movel	WBTEMP_LO(%a6),USER_FP3+8(%a6)
	rts
frc2_dst:
	movel	WBTEMP_EX(%a6),USER_FP2(%a6)
	movel	WBTEMP_HI(%a6),USER_FP2+4(%a6)
	movel	WBTEMP_LO(%a6),USER_FP2+8(%a6)
	rts
frc1_dst:
	movel	WBTEMP_EX(%a6),USER_FP1(%a6)
	movel	WBTEMP_HI(%a6),USER_FP1+4(%a6)
	movel	WBTEMP_LO(%a6),USER_FP1+8(%a6)
	rts
frc0_dst:
	movel	WBTEMP_EX(%a6),USER_FP0(%a6)
	movel	WBTEMP_HI(%a6),USER_FP0+4(%a6)
	movel	WBTEMP_LO(%a6),USER_FP0+8(%a6)
	rts

1327
|
| Write etemp to fpn.
| A check is made on enabled and signalled snan exceptions,
| and the destination is not overwritten if this condition exists.
| This code is designed to make fmoveins of unsupported data types
| faster.
|
| When snan is both signalled and enabled, the first longword of ETEMP
| is copied to FPTEMP and N is set in USER_FPSR for a negative operand;
| the routine then returns without writing the destination.  In every
| other case control passes to fmoveinc.
|
wr_etemp:
	btstb	#snan_bit,FPSR_EXCEPT(%a6)	|if snan is set, and
	beqs	fmoveinc		|enabled, force restore
	btstb	#snan_bit,FPCR_ENABLE(%a6) |and don't overwrite
	beqs	fmoveinc		|the dest
	movel	ETEMP_EX(%a6),FPTEMP_EX(%a6)	|set up fptemp sign for
|						;snan handler
	tstb	ETEMP(%a6)		|check for negative
	blts	snan_neg
	rts
snan_neg:
| The longword OR needs the N mask, as at every other place in this
| file that sets N in USER_FPSR; neg_bit is a bit number and would OR
| the wrong bits into the longword.
	orl	#neg_mask,USER_FPSR(%a6)	|snan is negative; set N
	rts
|
| fmoveinc: complete the move of ETEMP into the destination fp register.
| NMNEXC and the E1 bit are cleared, then the top three bits of STAG
| select which condition code is ORed into USER_FPSR:
|	0x40 = inf -> I,  0x60 = nan -> NaN,  0x20 = zero -> Z
| plus N when the word at LOCAL_EX(a0) is negative.
| NOTE(review): a0 is not loaded here; it is presumably left pointing
| at the source operand by the code that branches to wr_etemp - confirm.
| Destinations fp0-fp3 are handled at fp0123; fp4-fp7 are loaded with
| fmovemx using a dynamic register list (bit 7 - register number).
|
fmoveinc:
	clrw	NMNEXC(%a6)
	bclrb	#E1,E_BYTE(%a6)
	moveb	STAG(%a6),%d0		|check if stag is inf
	andib	#0xe0,%d0
	cmpib	#0x40,%d0
	bnes	fminc_cnan
	orl	#inf_mask,USER_FPSR(%a6) |if inf, nothing yet has set I
	tstw	LOCAL_EX(%a0)		|check sign
	bges	fminc_con
	orl	#neg_mask,USER_FPSR(%a6)
	bra	fminc_con
fminc_cnan:
	cmpib	#0x60,%d0			|check if stag is NaN
	bnes	fminc_czero
	orl	#nan_mask,USER_FPSR(%a6) |if nan, nothing yet has set NaN
	movel	ETEMP_EX(%a6),FPTEMP_EX(%a6)	|set up fptemp sign for
|						;snan handler
	tstw	LOCAL_EX(%a0)		|check sign
	bges	fminc_con
	orl	#neg_mask,USER_FPSR(%a6)
	bra	fminc_con
fminc_czero:
	cmpib	#0x20,%d0			|check if zero
	bnes	fminc_con
	orl	#z_mask,USER_FPSR(%a6)	|if zero, set Z
	tstw	LOCAL_EX(%a0)		|check sign
	bges	fminc_con
	orl	#neg_mask,USER_FPSR(%a6)
fminc_con:
	bfextu	CMDREG1B(%a6){#6:#3},%d0	|extract fp destination register
	cmpib	#3,%d0
	bles	fp0123			|check if dest is fp0-fp3
	movel	#7,%d1
	subl	%d0,%d1
	clrl	%d0
	bsetl	%d1,%d0
	fmovemx ETEMP(%a6),%d0
	rts

1387
|
| fp0123: d0 holds a destination register number 0-3.  The three
| longwords of ETEMP are copied into the matching USER_FPn slot in
| the frame.
|
fp0123:
	cmpib	#0,%d0
	beqs	fp0_dst
	cmpib	#1,%d0
	beqs	fp1_dst
	cmpib	#2,%d0
	beqs	fp2_dst
fp3_dst:
	movel	ETEMP_EX(%a6),USER_FP3(%a6)
	movel	ETEMP_HI(%a6),USER_FP3+4(%a6)
	movel	ETEMP_LO(%a6),USER_FP3+8(%a6)
	rts
fp2_dst:
	movel	ETEMP_EX(%a6),USER_FP2(%a6)
	movel	ETEMP_HI(%a6),USER_FP2+4(%a6)
	movel	ETEMP_LO(%a6),USER_FP2+8(%a6)
	rts
fp1_dst:
	movel	ETEMP_EX(%a6),USER_FP1(%a6)
	movel	ETEMP_HI(%a6),USER_FP1+4(%a6)
	movel	ETEMP_LO(%a6),USER_FP1+8(%a6)
	rts
fp0_dst:
	movel	ETEMP_EX(%a6),USER_FP0(%a6)
	movel	ETEMP_HI(%a6),USER_FP0+4(%a6)
	movel	ETEMP_LO(%a6),USER_FP0+8(%a6)
	rts

1415
|
| opclass3: sets CU_ONLY, then dispatches on bits 11-10 of CMDREG1B:
| both set means a packed move-out (pack_out); anything else goes to
| mv_out.
|
opclass3:
	st	CU_ONLY(%a6)
	movew	CMDREG1B(%a6),%d0	|check if packed moveout
	andiw	#0x0c00,%d0	|isolate last 2 bits of size field
	cmpiw	#0x0c00,%d0	|if size is 011 or 111, it is packed
	beq	pack_out	|else it is norm or denorm
	bra	mv_out

1423

1424
|
|	MOVE OUT
|
| mv_tbl is indexed by the 3-bit field at bit offset 3 of CMDREG1B.
| Entries 3 and 7 point at mvout_end; opclass3 sends those two
| encodings to pack_out before mv_out is reached.
|

mv_tbl:
	.long	li
	.long	sgp
	.long	xp
	.long	mvout_end	|should never be taken
	.long	wi
	.long	dp
	.long	bi
	.long	mvout_end	|should never be taken
mv_out:
	bfextu	CMDREG1B(%a6){#3:#3},%d1	|put source specifier in d1
	leal	mv_tbl,%a0
	movel	%a0@(%d1:l:4),%a0	|fetch handler address, 4 bytes/entry
	jmp	(%a0)

1443
|
| This exit is for move-out to memory.  The aunfl bit is
| set if the result is inex and unfl is signalled.
|
mvout_end:
	btstb	#inex2_bit,FPSR_EXCEPT(%a6)
	beqs	no_aufl
	btstb	#unfl_bit,FPSR_EXCEPT(%a6)
	beqs	no_aufl
	bsetb	#aunfl_bit,FPSR_AEXCEPT(%a6)
no_aufl:
	clrw	NMNEXC(%a6)
	bclrb	#E1,E_BYTE(%a6)
	fmovel	#0,%FPSR			|clear any cc bits from res_func
|
| Return ETEMP to extended format from internal extended format so
| that gen_except will have a correctly signed value for ovfl/unfl
| handlers.
|
	bfclr	ETEMP_SGN(%a6){#0:#8}
	beqs	mvout_con
	bsetb	#sign_bit,ETEMP_EX(%a6)
mvout_con:
	rts
|
| This exit is for move-out to int register.  The aunfl bit is
| not set in any case for this move.
|
mvouti_end:
	clrw	NMNEXC(%a6)
	bclrb	#E1,E_BYTE(%a6)
	fmovel	#0,%FPSR			|clear any cc bits from res_func
|
| Return ETEMP to extended format from internal extended format so
| that gen_except will have a correctly signed value for ovfl/unfl
| handlers.
|
	bfclr	ETEMP_SGN(%a6){#0:#8}
	beqs	mvouti_con
	bsetb	#sign_bit,ETEMP_EX(%a6)
mvouti_con:
	rts
|
| li is used to handle a long integer source specifier
|
| d0 is set to the byte count (4) used by int_wrt.  The converted
| value is built in L_SCR1.  Operands inside the comparison bounds are
| converted by the 040 under the user's rounding mode; operands at or
| beyond a bound store the largest positive/negative long and exit
| through int_wrt (exact), int_inx (inexact) or int_operr.
|

li:
	moveql	#4,%d0		|set byte count

	btstb	#7,STAG(%a6)	|check for extended denorm
	bne	int_dnrm	|if so, branch

	fmovemx ETEMP(%a6),%fp0-%fp0
	fcmpd	#0x41dfffffffc00000,%fp0
| 41dfffffffc00000 in dbl prec = 401d0000fffffffe00000000 in ext prec
	fbge	lo_plrg
	fcmpd	#0xc1e0000000000000,%fp0
| c1e0000000000000 in dbl prec = c01e00008000000000000000 in ext prec
	fble	lo_nlrg
|
| at this point, the answer is between the largest pos and neg values
|
	movel	USER_FPCR(%a6),%d1	|use user's rounding mode
	andil	#0x30,%d1
	fmovel	%d1,%fpcr
	fmovel	%fp0,L_SCR1(%a6)	|let the 040 perform conversion
	fmovel %fpsr,%d1
	orl	%d1,USER_FPSR(%a6)	|capture inex2/ainex if set
	bra	int_wrt


lo_plrg:
	movel	#0x7fffffff,L_SCR1(%a6)	|answer is largest positive int
	fbeq	int_wrt			|exact answer
	fcmpd	#0x41dfffffffe00000,%fp0
| 41dfffffffe00000 in dbl prec = 401d0000ffffffff00000000 in ext prec
	fbge	int_operr		|set operr
	bra	int_inx			|set inexact

lo_nlrg:
	movel	#0x80000000,L_SCR1(%a6)
	fbeq	int_wrt			|exact answer
	fcmpd	#0xc1e0000000100000,%fp0
| c1e0000000100000 in dbl prec = c01e00008000000080000000 in ext prec
	fblt	int_operr		|set operr
	bra	int_inx			|set inexact

1530
|
| wi is used to handle a word integer source specifier
|
| Same scheme as li with a byte count of 2 in d0 and word-sized
| results stored at L_SCR1.
|

wi:
	moveql	#2,%d0		|set byte count

	btstb	#7,STAG(%a6)	|check for extended denorm
	bne	int_dnrm	|branch if so

	fmovemx ETEMP(%a6),%fp0-%fp0
	fcmps	#0x46fffe00,%fp0
| 46fffe00 in sgl prec = 400d0000fffe000000000000 in ext prec
	fbge	wo_plrg
	fcmps	#0xc7000000,%fp0
| c7000000 in sgl prec = c00e00008000000000000000 in ext prec
	fble	wo_nlrg

|
| at this point, the answer is between the largest pos and neg values
|
	movel	USER_FPCR(%a6),%d1	|use user's rounding mode
	andil	#0x30,%d1
	fmovel	%d1,%fpcr
	fmovew	%fp0,L_SCR1(%a6)	|let the 040 perform conversion
	fmovel %fpsr,%d1
	orl	%d1,USER_FPSR(%a6)	|capture inex2/ainex if set
	bra	int_wrt

wo_plrg:
	movew	#0x7fff,L_SCR1(%a6)	|answer is largest positive int
	fbeq	int_wrt			|exact answer
	fcmps	#0x46ffff00,%fp0
| 46ffff00 in sgl prec = 400d0000ffff000000000000 in ext prec
	fbge	int_operr		|set operr
	bra	int_inx			|set inexact

wo_nlrg:
	movew	#0x8000,L_SCR1(%a6)
	fbeq	int_wrt			|exact answer
	fcmps	#0xc7000080,%fp0
| c7000080 in sgl prec = c00e00008000800000000000 in ext prec
	fblt	int_operr		|set operr
	bra	int_inx			|set inexact

1575
|
| bi is used to handle a byte integer source specifier
|
| Same scheme as li with a byte count of 1 in d0 and byte-sized
| results stored at L_SCR1.
|

bi:
	moveql	#1,%d0		|set byte count

	btstb	#7,STAG(%a6)	|check for extended denorm
	bne	int_dnrm	|branch if so

	fmovemx ETEMP(%a6),%fp0-%fp0
	fcmps	#0x42fe0000,%fp0
| 42fe0000 in sgl prec = 40050000fe00000000000000 in ext prec
	fbge	by_plrg
	fcmps	#0xc3000000,%fp0
| c3000000 in sgl prec = c00600008000000000000000 in ext prec
	fble	by_nlrg

|
| at this point, the answer is between the largest pos and neg values
|
	movel	USER_FPCR(%a6),%d1	|use user's rounding mode
	andil	#0x30,%d1
	fmovel	%d1,%fpcr
	fmoveb	%fp0,L_SCR1(%a6)	|let the 040 perform conversion
	fmovel %fpsr,%d1
	orl	%d1,USER_FPSR(%a6)	|capture inex2/ainex if set
	bra	int_wrt

by_plrg:
	moveb	#0x7f,L_SCR1(%a6)		|answer is largest positive int
	fbeq	int_wrt			|exact answer
	fcmps	#0x42ff0000,%fp0
| 42ff0000 in sgl prec = 40050000ff00000000000000 in ext prec
	fbge	int_operr		|set operr
	bra	int_inx			|set inexact

by_nlrg:
	moveb	#0x80,L_SCR1(%a6)
	fbeq	int_wrt			|exact answer
	fcmps	#0xc3008000,%fp0
| c3008000 in sgl prec = c00600008080000000000000 in ext prec
	fblt	int_operr		|set operr
	bra	int_inx			|set inexact

1620
|
| Common integer routines
|
| int_dnrm---account for possible nonzero result for round up with positive
| operand and round down for negative answer.  In the first case (result = 1)
| byte-width (stored in d0) of result must be honored.  In the second case,
| -1 in L_SCR1(a6) will cover all contingencies (FMOVE.B/W/L out).
|
| On entry to all of these routines d0 holds the destination size in
| bytes (set by li/wi/bi) and must survive until int_wrt.

int_dnrm:
	movel	#0,L_SCR1(%a6)	| initialize result to 0
	bfextu	FPCR_MODE(%a6){#2:#2},%d1	| d1 is the rounding mode
	cmpb	#2,%d1
	bmis	int_inx		| if RN or RZ, done
	bnes	int_rp		| if RP, go to int_rp; RM falls through
	tstw	ETEMP(%a6)	| RM: store -1 in L_SCR1 if src is negative
	bpls	int_inx		| otherwise result is 0
	movel	#-1,L_SCR1(%a6)
	bras	int_inx
int_rp:
	tstw	ETEMP(%a6)	| RP: store +1 of proper width in L_SCR1 if
|				; source is greater than 0
	bmis	int_inx		| otherwise, result is 0
	lea	L_SCR1(%a6),%a1	| a1 is address of L_SCR1
	addal	%d0,%a1		| offset by destination width -1
	subal	#1,%a1
	bsetb	#0,(%a1)		| set low bit at a1 address
int_inx:
	oril	#inx2a_mask,USER_FPSR(%a6)
	bras	int_wrt
int_operr:
	fmovemx %fp0-%fp0,FPTEMP(%a6)	|FPTEMP must contain the extended
|				;precision source that needs to be
|				;converted to integer this is required
|				;if the operr exception is enabled.
|				;set operr/aiop (no inex2 on int ovfl)

	oril	#opaop_mask,USER_FPSR(%a6)
|				;fall through to perform int_wrt
int_wrt:
	movel	EXC_EA(%a6),%a1	|load destination address
	tstl	%a1		|check to see if it is a dest register
	beqs	wrt_dn		|write data register
	lea	L_SCR1(%a6),%a0	|point to supervisor source address
	bsrl	mem_write
	bra	mvouti_end

1666
|
| wrt_dn: the destination is a data register.  The size in d0 is saved
| on the stack across get_fline, then combined with the register number
| into the size:reg code passed to reg_dest in d1:
|	byte = reg,  word = reg + 8,  long = reg + 0x10
|
wrt_dn:
	movel	%d0,-(%sp)	|d0 currently contains the size to write
	bsrl	get_fline	|get_fline returns Dn in d0
	andiw	#0x7,%d0		|isolate register
	movel	(%sp)+,%d1	|get size
	cmpil	#4,%d1		|most frequent case
	beqs	sz_long
	cmpil	#2,%d1
	bnes	sz_con
	orl	#8,%d0		|add 'word' size to register#
	bras	sz_con
sz_long:
	orl	#0x10,%d0		|add 'long' size to register#
sz_con:
	movel	%d0,%d1		|reg_dest expects size:reg in d1
	bsrl	reg_dest	|load proper data register
	bra	mvouti_end
|
| xp: extended precision move-out.  ETEMP is put into internal format
| (sign moved from the exponent word into LOCAL_SGN).  A denorm goes
| to xdnrm; otherwise do_fp is entered with d0 = 0.
|
xp:
	lea	ETEMP(%a6),%a0
	bclrb	#sign_bit,LOCAL_EX(%a0)
	sne	LOCAL_SGN(%a0)
	btstb	#7,STAG(%a6)	|check for extended denorm
	bne	xdnrm
	clrl	%d0
	bras	do_fp		|do normal case
|
| sgp: single precision move-out.  ETEMP is put into internal format,
| then the exponent is compared against the first two words of
| sp_bnds: below the first goes to sp_under, above the second to
| sp_over.  An extended denorm goes straight to sp_catas.  In range,
| do_fp is entered with d0 = 1.  a1 is left pointing at sp_bnds.
|
sgp:
	lea	ETEMP(%a6),%a0
	bclrb	#sign_bit,LOCAL_EX(%a0)
	sne	LOCAL_SGN(%a0)
	btstb	#7,STAG(%a6)	|check for extended denorm
	bne	sp_catas	|branch if so
	movew	LOCAL_EX(%a0),%d0
	lea	sp_bnds,%a1
	cmpw	(%a1),%d0
	blt	sp_under
	cmpw	2(%a1),%d0
	bgt	sp_over
	movel	#1,%d0		|set destination format to single
	bras	do_fp		|do normal case
|
| dp: double precision move-out.  Mirrors sgp using dp_bnds and
| d0 = 2, then falls through into do_fp.
|
| do_fp: a0 points at the operand in internal format and d0 holds the
| destination precision (0 = ext, 1 = sgl, 2 = dbl).  The operand is
| rounded with cleared guard/round/sticky and stored through dest_ext,
| dest_sgl or dest_dbl, chosen from the format field of CMDREG1B.
| All three paths exit through mvout_end.
|
dp:
	lea	ETEMP(%a6),%a0
	bclrb	#sign_bit,LOCAL_EX(%a0)
	sne	LOCAL_SGN(%a0)

	btstb	#7,STAG(%a6)	|check for extended denorm
	bne	dp_catas	|branch if so

	movew	LOCAL_EX(%a0),%d0
	lea	dp_bnds,%a1

	cmpw	(%a1),%d0
	blt	dp_under
	cmpw	2(%a1),%d0
	bgt	dp_over

	movel	#2,%d0		|set destination format to double
|				;fall through to do_fp
|
do_fp:
	bfextu	FPCR_MODE(%a6){#2:#2},%d1	|rnd mode in d1
	swap	%d0			|rnd prec in upper word
	addl	%d0,%d1			|d1 has PREC/MODE info

	clrl	%d0			|clear g,r,s

	bsrl	round			|round

	movel	%a0,%a1
	movel	EXC_EA(%a6),%a0

	bfextu	CMDREG1B(%a6){#3:#3},%d1	|extract destination format
|					;at this point only the dest
|					;formats sgl, dbl, ext are
|					;possible
	cmpb	#2,%d1
	bgts	ddbl			|double=5, extended=2, single=1
	bnes	dsgl
|					;fall through to dext
dext:
	bsrl	dest_ext
	bra	mvout_end
dsgl:
	bsrl	dest_sgl
	bra	mvout_end
ddbl:
	bsrl	dest_dbl
	bra	mvout_end

1754
|
| Handle possible denorm or catastrophic underflow cases here
|
| xdnrm: extended move-out of a denorm.  WBTEMP is initialized from
| the operand at a0, the value is stored with dest_ext, and the unfl
| bit is set before leaving through mvout_end.
|
xdnrm:
	bsr	set_xop		|initialize WBTEMP
	bsetb	#wbtemp15_bit,WB_BYTE(%a6) |set wbtemp15

	movel	%a0,%a1
	movel	EXC_EA(%a6),%a0	|a0 has the destination pointer
	bsrl	dest_ext	|store to memory
	bsetb	#unfl_bit,FPSR_EXCEPT(%a6)
	bra	mvout_end

1767
|
| sp_under: single precision underflow.  Reached from sgp with the
| operand exponent in d0 and a1 pointing at sp_bnds; 4(a1) is the
| third bounds word, below which the case is catastrophic (sp_catas).
| Otherwise the operand is denormalized and rounded by dpspdnrm, which
| returns a0/a1 set up for dest_sgl.
|
sp_under:
	bsetb	#etemp15_bit,STAG(%a6)

	cmpw	4(%a1),%d0
	blts	sp_catas	|catastrophic underflow case

	movel	#1,%d0		|load in round precision
	movel	#sgl_thresh,%d1	|load in single denorm threshold
	bsrl	dpspdnrm	|expects d1 to have the proper
|				;denorm threshold
	bsrl	dest_sgl	|stores value to destination
	bsetb	#unfl_bit,FPSR_EXCEPT(%a6)
	bra	mvout_end	|exit

1781
|
| dp_under: double precision underflow.  Reached from dp with the
| operand exponent in d0 and a1 pointing at dp_bnds; 4(a1) is the
| third bounds word, below which the case is catastrophic (dp_catas).
| Otherwise the operand is denormalized and rounded by dpspdnrm, which
| returns a0/a1 set up for dest_dbl.
|
dp_under:
	bsetb	#etemp15_bit,STAG(%a6)

	cmpw	4(%a1),%d0
	blts	dp_catas	|catastrophic underflow case

	movel	#dbl_thresh,%d1	|load in double precision threshold
	movel	#2,%d0
	bsrl	dpspdnrm	|expects d1 to have proper
|				;denorm threshold
|				;expects d0 to have round precision
	bsrl	dest_dbl	|store value to destination
	bsetb	#unfl_bit,FPSR_EXCEPT(%a6)
	bra	mvout_end	|exit

1796
|
| Handle catastrophic underflow cases here
|
| sp_catas: unf_sub builds the single precision underflow result.
| USER_FPSR is saved on the stack and restored around the call, so
| whatever unf_sub writes to it is discarded.  The exponent is then
| decremented by 1 and the value stored with dest_sgl.
|
sp_catas:
| Temp fix for z bit set in unf_sub
	movel	USER_FPSR(%a6),-(%a7)

	movel	#1,%d0		|set round precision to sgl

	bsrl	unf_sub		|a0 points to result

	movel	(%a7)+,USER_FPSR(%a6)

	movel	#1,%d0
	subw	%d0,LOCAL_EX(%a0) |account for difference between
|				;denorm/norm bias

	movel	%a0,%a1		|a1 has the operand input
	movel	EXC_EA(%a6),%a0	|a0 has the destination pointer

	bsrl	dest_sgl	|store the result
	oril	#unfinx_mask,USER_FPSR(%a6)
	bra	mvout_end

1820
|
| dp_catas: double precision counterpart of sp_catas.  unf_sub is
| called with d0 = 2, USER_FPSR is preserved across the call, the
| exponent is decremented by 1 and the value stored with dest_dbl.
|
dp_catas:
| Temp fix for z bit set in unf_sub
	movel	USER_FPSR(%a6),-(%a7)

	movel	#2,%d0		|set round precision to dbl
	bsrl	unf_sub		|a0 points to result

	movel	(%a7)+,USER_FPSR(%a6)

	movel	#1,%d0
	subw	%d0,LOCAL_EX(%a0) |account for difference between
|				;denorm/norm bias

	movel	%a0,%a1		|a1 has the operand input
	movel	EXC_EA(%a6),%a0	|a0 has the destination pointer

	bsrl	dest_dbl	|store the result
	oril	#unfinx_mask,USER_FPSR(%a6)
	bra	mvout_end

1840
|
| Handle catastrophic overflow cases here
|
| sp_over: ETEMP is copied to FP_SCR1 and ovf_res is called with
| d0 = 1 (single).  USER_FPSR is saved on the stack and restored
| around the call.  The result is stored with dest_sgl and
| ovfinx_mask is ORed into USER_FPSR.
|
sp_over:
| Temp fix for z bit set in ovf_res
	movel	USER_FPSR(%a6),-(%a7)

	movel	#1,%d0
	leal	FP_SCR1(%a6),%a0	|use FP_SCR1 for creating result
	movel	ETEMP_EX(%a6),(%a0)
	movel	ETEMP_HI(%a6),4(%a0)
	movel	ETEMP_LO(%a6),8(%a0)
	bsrl	ovf_res

	movel	(%a7)+,USER_FPSR(%a6)

	movel	%a0,%a1
	movel	EXC_EA(%a6),%a0
	bsrl	dest_sgl
	orl	#ovfinx_mask,USER_FPSR(%a6)
	bra	mvout_end

1862
|
| dp_over: double precision counterpart of sp_over.  ovf_res is called
| with d0 = 2 on a copy of ETEMP in FP_SCR1, USER_FPSR is preserved
| across the call, and the result is stored with dest_dbl.
|
dp_over:
| Temp fix for z bit set in ovf_res
	movel	USER_FPSR(%a6),-(%a7)

	movel	#2,%d0
	leal	FP_SCR1(%a6),%a0	|use FP_SCR1 for creating result
	movel	ETEMP_EX(%a6),(%a0)
	movel	ETEMP_HI(%a6),4(%a0)
	movel	ETEMP_LO(%a6),8(%a0)
	bsrl	ovf_res

	movel	(%a7)+,USER_FPSR(%a6)

	movel	%a0,%a1
	movel	EXC_EA(%a6),%a0
	bsrl	dest_dbl
	orl	#ovfinx_mask,USER_FPSR(%a6)
	bra	mvout_end

1881
|
|	DPSPDNRM
|
| This subroutine takes an extended normalized number and denormalizes
| it to the given round precision. This subroutine also decrements
| the input operand's exponent by 1 to account for the fact that
| dest_sgl or dest_dbl expects a normalized number's bias.
|
| Input: a0  points to a normalized number in internal extended format
|	 d0  is the round precision (=1 for sgl; =2 for dbl)
|	 d1  is the single precision or double precision
|	     denorm threshold
|
| Output: (In the format for dest_sgl or dest_dbl)
|	 a0   points to the destination
|	 a1   points to the operand
|
| Exceptions: Reports inexact 2 exception by setting USER_FPSR bits
|
| Stack: the round precision is pushed as one longword on entry; its
| low word is read back at 2(a7) after dnrm_lp returns, and the
| longword is popped just before the rts.
|
dpspdnrm:
	movel	%d0,-(%a7)	|save round precision
	clrl	%d0		|clear initial g,r,s
	bsrl	dnrm_lp		|careful with d0, it's needed by round

	bfextu	FPCR_MODE(%a6){#2:#2},%d1 |get rounding mode
	swap	%d1
	movew	2(%a7),%d1	|set rounding precision
	swap	%d1		|at this point d1 has PREC/MODE info
	bsrl	round		|round result, sets the inex bit in
|				;USER_FPSR if needed

	movew	#1,%d0
	subw	%d0,LOCAL_EX(%a0) |account for difference in denorm
|				;vs norm bias

	movel	%a0,%a1		|a1 has the operand input
	movel	EXC_EA(%a6),%a0	|a0 has the destination pointer
	addw	#4,%a7		|pop stack
	rts
|
| SET_XOP initializes WBTEMP with the value pointed to by a0
| input: a0 points to input operand in the internal extended format
|
| The operand's three longwords are copied to WBTEMP, then the sign
| byte is folded back into the sign bit of the exponent word.  A
| 4-bit field of STAG (bit offset 5) is cleared before returning.
|
set_xop:
	movel	LOCAL_EX(%a0),WBTEMP_EX(%a6)
	movel	LOCAL_HI(%a0),WBTEMP_HI(%a6)
	movel	LOCAL_LO(%a0),WBTEMP_LO(%a6)
	bfclr	WBTEMP_SGN(%a6){#0:#8}
	beqs	sxop
	bsetb	#sign_bit,WBTEMP_EX(%a6)
sxop:
	bfclr	STAG(%a6){#5:#4}	|clear wbtm66,wbtm1,wbtm0,sbit
	rts
|
|	P_MOVE
|
| p_movet: handlers for the packed move-out, indexed by the top three
|	   bits of the source tag (entries 0 and 4 use p_move).
| p_regd:  handlers that fetch a dynamic k-factor from d0-d7.
| pack_out: dispatches through p_movet.  The table has five entries,
|	   so the tag value is expected to be 0-4.
|
p_movet:
	.long	p_move
	.long	p_movez
	.long	p_movei
	.long	p_moven
	.long	p_move
p_regd:
	.long	p_dyd0
	.long	p_dyd1
	.long	p_dyd2
	.long	p_dyd3
	.long	p_dyd4
	.long	p_dyd5
	.long	p_dyd6
	.long	p_dyd7

pack_out:
	leal	p_movet,%a0	|load jmp table address
	movew	STAG(%a6),%d0	|get source tag
	bfextu	%d0{#16:#3},%d0	|isolate source bits
	movel	(%a0,%d0.w*4),%a0	|load a0 with routine label for tag
	jmp	(%a0)		|go to the routine

1960
|
| p_write: writes the 12-byte packed result at a0 to the user's
| destination (EXC_EA) with mem_write, then clears CU_SAVEPC and the
| top three bits of DTAG before returning.
|
p_write:
	movel	#0x0c,%d0	|get byte count
	movel	EXC_EA(%a6),%a1	|get the destination address
	bsr	mem_write	|write the user's destination
	moveb	#0,CU_SAVEPC(%a6) |set the cu save pc to all 0's

|
| Also note that the dtag must be set to norm here - this is because
| the 040 uses the dtag to execute the correct microcode.
|
        bfclr    DTAG(%a6){#0:#3}  |set dtag to norm

	rts

1974
| Notes on handling of special case (zero, inf, and nan) inputs:
|	1. Operr is not signalled if the k-factor is greater than 18.
|	2. Per the manual, status bits are not set.
|
| p_move: packed move-out of a norm or denorm.  A static k-factor is
| the low 7 bits of CMDREG1B; a dynamic one is fetched from the data
| register selected by bits 6-4 through the p_regd table, whose
| handlers re-enter at statick.  The 7-bit k-factor is sign-extended
| into d0, bindec converts ETEMP, and the result in FP_SCR1 is written
| by p_write.
|

p_move:
	movew	CMDREG1B(%a6),%d0
	btstl	#kfact_bit,%d0	|test for dynamic k-factor
	beqs	statick		|if clear, k-factor is static
dynamick:
	bfextu	%d0{#25:#3},%d0	|isolate register for dynamic k-factor
	lea	p_regd,%a0
	movel	%a0@(%d0:l:4),%a0
	jmp	(%a0)
statick:
	andiw	#0x007f,%d0	|get k-factor
	bfexts	%d0{#25:#7},%d0	|sign extend d0 for bindec
	leal	ETEMP(%a6),%a0	|a0 will point to the packed decimal
	bsrl	bindec		|perform the convert; data at a6
	leal	FP_SCR1(%a6),%a0	|load a0 with result address
	bral	p_write
|
| Packed move-out of the special operands.  Each handler points a0 at
| ETEMP, clears the word at offset 2, and exits through p_write.
| p_movez (zero) also clears both mantissa longwords; p_movei (inf)
| first clears the FPSR.
|
p_movez:
	leal	ETEMP(%a6),%a0	|a0 will point to the packed decimal
	clrw	2(%a0)		|clear lower word of exp
	clrl	4(%a0)		|load second lword of ZERO
	clrl	8(%a0)		|load third lword of ZERO
	bra	p_write		|go write results
p_movei:
	fmovel	#0,%FPSR		|clear aiop
	leal	ETEMP(%a6),%a0	|a0 will point to the packed decimal
	clrw	2(%a0)		|clear lower word of exp
	bra	p_write		|go write the result
p_moven:
	leal	ETEMP(%a6),%a0	|a0 will point to the packed decimal
	clrw	2(%a0)		|clear lower word of exp
	bra	p_write		|go write the result

2011
|
| Routines to read the dynamic k-factor from Dn.
|
| d0 and d1 are read from their saved copies in the frame (USER_D0,
| USER_D1); d2-d7 are read directly from the registers.  Each handler
| continues at statick with the k-factor in d0.
|
p_dyd0:
	movel	USER_D0(%a6),%d0
	bras	statick
p_dyd1:
	movel	USER_D1(%a6),%d0
	bras	statick
p_dyd2:
	movel	%d2,%d0
	bras	statick
p_dyd3:
	movel	%d3,%d0
	bras	statick
p_dyd4:
	movel	%d4,%d0
	bras	statick
p_dyd5:
	movel	%d5,%d0
	bras	statick
p_dyd6:
	movel	%d6,%d0
	bra	statick
p_dyd7:
	movel	%d7,%d0
	bra	statick

2039
	|end
2040

2041
Product

Resources

Company