CoCalc -- kernel

GitHub Repository: awilliam/linux-vfio
Path: blob/master/arch/m68k/fpsp040/kernel_ex.S
¹⁷⁴⁸¹ views
1
|
2
|	kernel_ex.sa 3.3 12/19/90
3
|
4
| This file contains routines to force exception status in the
5
| fpu for exceptional cases detected or reported within the
6
| transcendental functions.  Typically, the t_xx routine will
7
| set the appropriate bits in the USER_FPSR word on the stack.
8
| The bits are tested in gen_except.sa to determine if an exceptional
9
| situation needs to be created on return from the FPSP.
10
|
11

12
|		Copyright (C) Motorola, Inc. 1990
13
|			All Rights Reserved
14
|
15
|       For details on the license for this file, please see the
16
|       file, README, in this same directory.
17

18
KERNEL_EX:    |idnt    2,1 | Motorola 040 Floating Point Software Package
19

20
	|section    8
21

22
#include "fpsp.h"
23

24
mns_inf:  .long 0xffff0000,0x00000000,0x00000000
25
pls_inf:  .long 0x7fff0000,0x00000000,0x00000000
26
nan:      .long 0x7fff0000,0xffffffff,0xffffffff
27
huge:     .long 0x7ffe0000,0xffffffff,0xffffffff
28

29
	|xref	  ovf_r_k
30
	|xref	  unf_sub
31
	|xref	  nrm_set
32

33
	.global	  t_dz
34
	.global      t_dz2
35
	.global      t_operr
36
	.global      t_unfl
37
	.global      t_ovfl
38
	.global      t_ovfl2
39
	.global      t_inx2
40
	.global	  t_frcinx
41
	.global	  t_extdnrm
42
	.global	  t_resdnrm
43
	.global	  dst_nan
44
	.global	  src_nan
45
|
46
|	DZ exception
47
|
48
|
49
|	if dz trap disabled
50
|		store properly signed inf (use sign of etemp) into fp0
51
|		set FPSR exception status dz bit, condition code
52
|		inf bit, and accrued dz bit
53
|		return
54
|		frestore the frame into the machine (done by unimp_hd)
55
|
56
|	else dz trap enabled
57
|		set exception status bit & accrued bits in FPSR
58
|		set flag to disable sto_res from corrupting fp register
59
|		return
60
|		frestore the frame into the machine (done by unimp_hd)
61
|
62
| t_dz2 is used by monadic functions such as flogn (from do_func).
63
| t_dz is used by monadic functions such as satanh (from the
64
| transcendental function).
65
|
66
t_dz2:
67
	bsetb	#neg_bit,FPSR_CC(%a6)	|set neg bit in FPSR
68
	fmovel	#0,%FPSR			|clr status bits (Z set)
69
	btstb	#dz_bit,FPCR_ENABLE(%a6)	|test FPCR for dz exc enabled
70
	bnes	dz_ena_end
71
	bras	m_inf			|flogx always returns -inf
72
t_dz:
73
	fmovel	#0,%FPSR			|clr status bits (Z set)
74
	btstb	#dz_bit,FPCR_ENABLE(%a6)	|test FPCR for dz exc enabled
75
	bnes	dz_ena
76
|
77
|	dz disabled
78
|
79
	btstb	#sign_bit,ETEMP_EX(%a6)	|check sign for neg or pos
80
	beqs	p_inf			|branch if pos sign
81

82
m_inf:
83
	fmovemx mns_inf,%fp0-%fp0		|load -inf
84
	bsetb	#neg_bit,FPSR_CC(%a6)	|set neg bit in FPSR
85
	bras	set_fpsr
86
p_inf:
87
	fmovemx pls_inf,%fp0-%fp0		|load +inf
88
set_fpsr:
89
	orl	#dzinf_mask,USER_FPSR(%a6) |set I,DZ,ADZ
90
	rts
91
|
92
|	dz enabled
93
|
94
dz_ena:
95
	btstb	#sign_bit,ETEMP_EX(%a6)	|check sign for neg or pos
96
	beqs	dz_ena_end
97
	bsetb	#neg_bit,FPSR_CC(%a6)	|set neg bit in FPSR
98
dz_ena_end:
99
	orl	#dzinf_mask,USER_FPSR(%a6) |set I,DZ,ADZ
100
	st	STORE_FLG(%a6)
101
	rts
102
|
103
|	OPERR exception
104
|
105
|	if (operr trap disabled)
106
|		set FPSR exception status operr bit, condition code
107
|		nan bit; Store default NAN into fp0
108
|		frestore the frame into the machine (done by unimp_hd)
109
|
110
|	else (operr trap enabled)
111
|		set FPSR exception status operr bit, accrued operr bit
112
|		set flag to disable sto_res from corrupting fp register
113
|		frestore the frame into the machine (done by unimp_hd)
114
|
115
t_operr:
116
	orl	#opnan_mask,USER_FPSR(%a6) |set NaN, OPERR, AIOP
117

118
	btstb	#operr_bit,FPCR_ENABLE(%a6) |test FPCR for operr enabled
119
	bnes	op_ena
120

121
	fmovemx nan,%fp0-%fp0		|load default nan
122
	rts
123
op_ena:
124
	st	STORE_FLG(%a6)		|do not corrupt destination
125
	rts
126

127
|
128
|	t_unfl --- UNFL exception
129
|
130
| This entry point is used by all routines requiring unfl, inex2,
131
| aunfl, and ainex to be set on exit.
132
|
133
| On entry, a0 points to the exceptional operand.  The final exceptional
134
| operand is built in FP_SCR1 and only the sign from the original operand
135
| is used.
136
|
137
t_unfl:
138
	clrl	FP_SCR1(%a6)		|set exceptional operand to zero
139
	clrl	FP_SCR1+4(%a6)
140
	clrl	FP_SCR1+8(%a6)
141
	tstb	(%a0)			|extract sign from caller's exop
142
	bpls	unfl_signok
143
	bset	#sign_bit,FP_SCR1(%a6)
144
unfl_signok:
145
	leal	FP_SCR1(%a6),%a0
146
	orl	#unfinx_mask,USER_FPSR(%a6)
147
|					;set UNFL, INEX2, AUNFL, AINEX
148
unfl_con:
149
	btstb	#unfl_bit,FPCR_ENABLE(%a6)
150
	beqs	unfl_dis
151

152
unfl_ena:
153
	bfclr	STAG(%a6){#5:#3}		|clear wbtm66,wbtm1,wbtm0
154
	bsetb	#wbtemp15_bit,WB_BYTE(%a6) |set wbtemp15
155
	bsetb	#sticky_bit,STICKY(%a6)	|set sticky bit
156

157
	bclrb	#E1,E_BYTE(%a6)
158

159
unfl_dis:
160
	bfextu	FPCR_MODE(%a6){#0:#2},%d0	|get round precision
161

162
	bclrb	#sign_bit,LOCAL_EX(%a0)
163
	sne	LOCAL_SGN(%a0)		|convert to internal ext format
164

165
	bsr	unf_sub			|returns IEEE result at a0
166
|					;and sets FPSR_CC accordingly
167

168
	bfclr	LOCAL_SGN(%a0){#0:#8}	|convert back to IEEE ext format
169
	beqs	unfl_fin
170

171
	bsetb	#sign_bit,LOCAL_EX(%a0)
172
	bsetb	#sign_bit,FP_SCR1(%a6)	|set sign bit of exc operand
173

174
unfl_fin:
175
	fmovemx (%a0),%fp0-%fp0		|store result in fp0
176
	rts
177

178

179
|
180
|	t_ovfl2 --- OVFL exception (without inex2 returned)
181
|
182
| This entry is used by scale to force catastrophic overflow.  The
183
| ovfl, aovfl, and ainex bits are set, but not the inex2 bit.
184
|
185
t_ovfl2:
186
	orl	#ovfl_inx_mask,USER_FPSR(%a6)
187
	movel	ETEMP(%a6),FP_SCR1(%a6)
188
	movel	ETEMP_HI(%a6),FP_SCR1+4(%a6)
189
	movel	ETEMP_LO(%a6),FP_SCR1+8(%a6)
190
|
191
| Check for single or double round precision.  If single, check if
192
| the lower 40 bits of ETEMP are zero; if not, set inex2.  If double,
193
| check if the lower 21 bits are zero; if not, set inex2.
194
|
195
	moveb	FPCR_MODE(%a6),%d0
196
	andib	#0xc0,%d0
197
	beq	t_work		|if extended, finish ovfl processing
198
	cmpib	#0x40,%d0		|test for single
199
	bnes	t_dbl
200
t_sgl:
201
	tstb	ETEMP_LO(%a6)
202
	bnes	t_setinx2
203
	movel	ETEMP_HI(%a6),%d0
204
	andil	#0xff,%d0		|look at only lower 8 bits
205
	bnes	t_setinx2
206
	bra	t_work
207
t_dbl:
208
	movel	ETEMP_LO(%a6),%d0
209
	andil	#0x7ff,%d0	|look at only lower 11 bits
210
	beq	t_work
211
t_setinx2:
212
	orl	#inex2_mask,USER_FPSR(%a6)
213
	bras	t_work
214
|
215
|	t_ovfl --- OVFL exception
216
|
217
|** Note: the exc operand is returned in ETEMP.
218
|
219
t_ovfl:
220
	orl	#ovfinx_mask,USER_FPSR(%a6)
221
t_work:
222
	btstb	#ovfl_bit,FPCR_ENABLE(%a6) |test FPCR for ovfl enabled
223
	beqs	ovf_dis
224

225
ovf_ena:
226
	clrl	FP_SCR1(%a6)		|set exceptional operand
227
	clrl	FP_SCR1+4(%a6)
228
	clrl	FP_SCR1+8(%a6)
229

230
	bfclr	STAG(%a6){#5:#3}		|clear wbtm66,wbtm1,wbtm0
231
	bclrb	#wbtemp15_bit,WB_BYTE(%a6) |clear wbtemp15
232
	bsetb	#sticky_bit,STICKY(%a6)	|set sticky bit
233

234
	bclrb	#E1,E_BYTE(%a6)
235
|					;fall through to disabled case
236

237
| For disabled overflow call 'ovf_r_k'.  This routine loads the
238
| correct result based on the rounding precision, destination
239
| format, rounding mode and sign.
240
|
241
ovf_dis:
242
	bsr	ovf_r_k			|returns unsigned ETEMP_EX
243
|					;and sets FPSR_CC accordingly.
244
	bfclr	ETEMP_SGN(%a6){#0:#8}	|fix sign
245
	beqs	ovf_pos
246
	bsetb	#sign_bit,ETEMP_EX(%a6)
247
	bsetb	#sign_bit,FP_SCR1(%a6)	|set exceptional operand sign
248
ovf_pos:
249
	fmovemx ETEMP(%a6),%fp0-%fp0		|move the result to fp0
250
	rts
251

252

253
|
254
|	INEX2 exception
255
|
256
| The inex2 and ainex bits are set.
257
|
258
t_inx2:
259
	orl	#inx2a_mask,USER_FPSR(%a6) |set INEX2, AINEX
260
	rts
261

262
|
263
|	Force Inex2
264
|
265
| This routine is called by the transcendental routines to force
266
| the inex2 exception bits set in the FPSR.  If the underflow bit
267
| is set, but the underflow trap was not taken, the aunfl bit in
268
| the FPSR must be set.
269
|
270
t_frcinx:
271
	orl	#inx2a_mask,USER_FPSR(%a6) |set INEX2, AINEX
272
	btstb	#unfl_bit,FPSR_EXCEPT(%a6) |test for unfl bit set
273
	beqs	no_uacc1		|if clear, do not set aunfl
274
	bsetb	#aunfl_bit,FPSR_AEXCEPT(%a6)
275
no_uacc1:
276
	rts
277

278
|
279
|	DST_NAN
280
|
281
| Determine if the destination nan is signalling or non-signalling,
282
| and set the FPSR bits accordingly.  See the MC68040 User's Manual
283
| section 3.2.2.5 NOT-A-NUMBERS.
284
|
285
dst_nan:
286
	btstb	#sign_bit,FPTEMP_EX(%a6) |test sign of nan
287
	beqs	dst_pos			|if clr, it was positive
288
	bsetb	#neg_bit,FPSR_CC(%a6)	|set N bit
289
dst_pos:
290
	btstb	#signan_bit,FPTEMP_HI(%a6) |check if signalling
291
	beqs	dst_snan		|branch if signalling
292

293
	fmovel	%d1,%fpcr			|restore user's rmode/prec
294
	fmovex FPTEMP(%a6),%fp0		|return the non-signalling nan
295
|
296
| Check the source nan.  If it is signalling, snan will be reported.
297
|
298
	moveb	STAG(%a6),%d0
299
	andib	#0xe0,%d0
300
	cmpib	#0x60,%d0
301
	bnes	no_snan
302
	btstb	#signan_bit,ETEMP_HI(%a6) |check if signalling
303
	bnes	no_snan
304
	orl	#snaniop_mask,USER_FPSR(%a6) |set NAN, SNAN, AIOP
305
no_snan:
306
	rts
307

308
dst_snan:
309
	btstb	#snan_bit,FPCR_ENABLE(%a6) |check if trap enabled
310
	beqs	dst_dis			|branch if disabled
311

312
	orb	#nan_tag,DTAG(%a6)	|set up dtag for nan
313
	st	STORE_FLG(%a6)		|do not store a result
314
	orl	#snaniop_mask,USER_FPSR(%a6) |set NAN, SNAN, AIOP
315
	rts
316

317
dst_dis:
318
	bsetb	#signan_bit,FPTEMP_HI(%a6) |set SNAN bit in sop
319
	fmovel	%d1,%fpcr			|restore user's rmode/prec
320
	fmovex FPTEMP(%a6),%fp0		|load non-sign. nan
321
	orl	#snaniop_mask,USER_FPSR(%a6) |set NAN, SNAN, AIOP
322
	rts
323

324
|
325
|	SRC_NAN
326
|
327
| Determine if the source nan is signalling or non-signalling,
328
| and set the FPSR bits accordingly.  See the MC68040 User's Manual
329
| section 3.2.2.5 NOT-A-NUMBERS.
330
|
331
src_nan:
332
	btstb	#sign_bit,ETEMP_EX(%a6) |test sign of nan
333
	beqs	src_pos			|if clr, it was positive
334
	bsetb	#neg_bit,FPSR_CC(%a6)	|set N bit
335
src_pos:
336
	btstb	#signan_bit,ETEMP_HI(%a6) |check if signalling
337
	beqs	src_snan		|branch if signalling
338
	fmovel	%d1,%fpcr			|restore user's rmode/prec
339
	fmovex ETEMP(%a6),%fp0		|return the non-signalling nan
340
	rts
341

342
src_snan:
343
	btstb	#snan_bit,FPCR_ENABLE(%a6) |check if trap enabled
344
	beqs	src_dis			|branch if disabled
345
	bsetb	#signan_bit,ETEMP_HI(%a6) |set SNAN bit in sop
346
	orb	#norm_tag,DTAG(%a6)	|set up dtag for norm
347
	orb	#nan_tag,STAG(%a6)	|set up stag for nan
348
	st	STORE_FLG(%a6)		|do not store a result
349
	orl	#snaniop_mask,USER_FPSR(%a6) |set NAN, SNAN, AIOP
350
	rts
351

352
src_dis:
353
	bsetb	#signan_bit,ETEMP_HI(%a6) |set SNAN bit in sop
354
	fmovel	%d1,%fpcr			|restore user's rmode/prec
355
	fmovex ETEMP(%a6),%fp0		|load non-sign. nan
356
	orl	#snaniop_mask,USER_FPSR(%a6) |set NAN, SNAN, AIOP
357
	rts
358

359
|
360
| For all functions that have a denormalized input and that f(x)=x,
361
| this is the entry point
362
|
363
t_extdnrm:
364
	orl	#unfinx_mask,USER_FPSR(%a6)
365
|					;set UNFL, INEX2, AUNFL, AINEX
366
	bras	xdnrm_con
367
|
368
| Entry point for scale with extended denorm.  The function does
369
| not set inex2, aunfl, or ainex.
370
|
371
t_resdnrm:
372
	orl	#unfl_mask,USER_FPSR(%a6)
373

374
xdnrm_con:
375
	btstb	#unfl_bit,FPCR_ENABLE(%a6)
376
	beqs	xdnrm_dis
377

378
|
379
| If exceptions are enabled, the additional task of setting up WBTEMP
380
| is needed so that when the underflow exception handler is entered,
381
| the user perceives no difference between what the 040 provides vs.
382
| what the FPSP provides.
383
|
384
xdnrm_ena:
385
	movel	%a0,-(%a7)
386

387
	movel	LOCAL_EX(%a0),FP_SCR1(%a6)
388
	movel	LOCAL_HI(%a0),FP_SCR1+4(%a6)
389
	movel	LOCAL_LO(%a0),FP_SCR1+8(%a6)
390

391
	lea	FP_SCR1(%a6),%a0
392

393
	bclrb	#sign_bit,LOCAL_EX(%a0)
394
	sne	LOCAL_SGN(%a0)		|convert to internal ext format
395
	tstw	LOCAL_EX(%a0)		|check if input is denorm
396
	beqs	xdnrm_dn		|if so, skip nrm_set
397
	bsr	nrm_set			|normalize the result (exponent
398
|					;will be negative
399
xdnrm_dn:
400
	bclrb	#sign_bit,LOCAL_EX(%a0)	|take off false sign
401
	bfclr	LOCAL_SGN(%a0){#0:#8}	|change back to IEEE ext format
402
	beqs	xdep
403
	bsetb	#sign_bit,LOCAL_EX(%a0)
404
xdep:
405
	bfclr	STAG(%a6){#5:#3}		|clear wbtm66,wbtm1,wbtm0
406
	bsetb	#wbtemp15_bit,WB_BYTE(%a6) |set wbtemp15
407
	bclrb	#sticky_bit,STICKY(%a6)	|clear sticky bit
408
	bclrb	#E1,E_BYTE(%a6)
409
	movel	(%a7)+,%a0
410
xdnrm_dis:
411
	bfextu	FPCR_MODE(%a6){#0:#2},%d0	|get round precision
412
	bnes	not_ext			|if not round extended, store
413
|					;IEEE defaults
414
is_ext:
415
	btstb	#sign_bit,LOCAL_EX(%a0)
416
	beqs	xdnrm_store
417

418
	bsetb	#neg_bit,FPSR_CC(%a6)	|set N bit in FPSR_CC
419

420
	bras	xdnrm_store
421

422
not_ext:
423
	bclrb	#sign_bit,LOCAL_EX(%a0)
424
	sne	LOCAL_SGN(%a0)		|convert to internal ext format
425
	bsr	unf_sub			|returns IEEE result pointed by
426
|					;a0; sets FPSR_CC accordingly
427
	bfclr	LOCAL_SGN(%a0){#0:#8}	|convert back to IEEE ext format
428
	beqs	xdnrm_store
429
	bsetb	#sign_bit,LOCAL_EX(%a0)
430
xdnrm_store:
431
	fmovemx (%a0),%fp0-%fp0		|store result in fp0
432
	rts
433

434
|
435
| This subroutine is used for dyadic operations that use an extended
436
| denorm within the kernel. The approach used is to capture the frame,
437
| fix/restore.
438
|
439
	.global	t_avoid_unsupp
440
t_avoid_unsupp:
441
	link	%a2,#-LOCAL_SIZE		|so that a2 fpsp.h negative
442
|					;offsets may be used
443
	fsave	-(%a7)
444
	tstb	1(%a7)			|check if idle, exit if so
445
	beq	idle_end
446
	btstb	#E1,E_BYTE(%a2)		|check for an E1 exception if
447
|					;enabled, there is an unsupp
448
	beq	end_avun		|else, exit
449
	btstb	#7,DTAG(%a2)		|check for denorm destination
450
	beqs	src_den			|else, must be a source denorm
451
|
452
| handle destination denorm
453
|
454
	lea	FPTEMP(%a2),%a0
455
	btstb	#sign_bit,LOCAL_EX(%a0)
456
	sne	LOCAL_SGN(%a0)		|convert to internal ext format
457
	bclrb	#7,DTAG(%a2)		|set DTAG to norm
458
	bsr	nrm_set			|normalize result, exponent
459
|					;will become negative
460
	bclrb	#sign_bit,LOCAL_EX(%a0)	|get rid of fake sign
461
	bfclr	LOCAL_SGN(%a0){#0:#8}	|convert back to IEEE ext format
462
	beqs	ck_src_den		|check if source is also denorm
463
	bsetb	#sign_bit,LOCAL_EX(%a0)
464
ck_src_den:
465
	btstb	#7,STAG(%a2)
466
	beqs	end_avun
467
src_den:
468
	lea	ETEMP(%a2),%a0
469
	btstb	#sign_bit,LOCAL_EX(%a0)
470
	sne	LOCAL_SGN(%a0)		|convert to internal ext format
471
	bclrb	#7,STAG(%a2)		|set STAG to norm
472
	bsr	nrm_set			|normalize result, exponent
473
|					;will become negative
474
	bclrb	#sign_bit,LOCAL_EX(%a0)	|get rid of fake sign
475
	bfclr	LOCAL_SGN(%a0){#0:#8}	|convert back to IEEE ext format
476
	beqs	den_com
477
	bsetb	#sign_bit,LOCAL_EX(%a0)
478
den_com:
479
	moveb	#0xfe,CU_SAVEPC(%a2)	|set continue frame
480
	clrw	NMNEXC(%a2)		|clear NMNEXC
481
	bclrb	#E1,E_BYTE(%a2)
482
|	fmove.l	%FPSR,FPSR_SHADOW(%a2)
483
|	bset.b	#SFLAG,E_BYTE(%a2)
484
|	bset.b	#XFLAG,T_BYTE(%a2)
485
end_avun:
486
	frestore (%a7)+
487
	unlk	%a2
488
	rts
489
idle_end:
490
	addl	#4,%a7
491
	unlk	%a2
492
	rts
493
	|end
494

495
Product

Resources

Company