Context Navigation

res_func.s @ f9b93da

4.104.114.84.95

Last change on this file since f9b93da was f9b93da, checked in by Joel Sherrill <joel.sherrill@…>, on 04/16/97 at 17:33:04
Added the MC68040 Floating Point Support Package. This was ported to RTEMS by Eric Norum. It is freely distributable and was acquired from the Motorola WWW site. More info is in the FPSP README.
Property mode set to `100644`
File size: 53.0 KB

Line
1	//
2	// res_func.sa 3.9 7/29/91
3	//
4	// Normalizes denormalized numbers if necessary and updates the
5	// stack frame. The function is then restored back into the
6	// machine and the 040 completes the operation. This routine
7	// is only used by the unsupported data type/format handler.
8	// (Exception vector 55).
9	//
10	// For packed move out (fmove.p fpm,<ea>) the operation is
11	// completed here; data is packed and moved to user memory.
12	// The stack is restored to the 040 only in the case of a
13	// reportable exception in the conversion.
14	//
15	//
16	// Copyright (C) Motorola, Inc. 1990
17	// All Rights Reserved
18	//
19	// THIS IS UNPUBLISHED PROPRIETARY SOURCE CODE OF MOTOROLA
20	// The copyright notice above does not evidence any
21	// actual or intended publication of such source code.
22
23	RES_FUNC: //idnt 2,1 \| Motorola 040 Floating Point Software Package
24
25	\|section 8
26
27	.include "fpsp.defs"
28
29	sp_bnds: .short 0x3f81,0x407e
30	.short 0x3f6a,0x0000
31	dp_bnds: .short 0x3c01,0x43fe
32	.short 0x3bcd,0x0000
33
34	\|xref mem_write
35	\|xref bindec
36	\|xref get_fline
37	\|xref round
38	\|xref denorm
39	\|xref dest_ext
40	\|xref dest_dbl
41	\|xref dest_sgl
42	\|xref unf_sub
43	\|xref nrm_set
44	\|xref dnrm_lp
45	\|xref ovf_res
46	\|xref reg_dest
47	\|xref t_ovfl
48	\|xref t_unfl
49
50	.global res_func
51	.global p_move
52
53	res_func:
54	clrb DNRM_FLG(%a6)
55	clrb RES_FLG(%a6)
56	clrb CU_ONLY(%a6)
57	tstb DY_MO_FLG(%a6)
58	beqs monadic
59	dyadic:
60	btstb #7,DTAG(%a6) //if dop = norm=000, zero=001,
61	// ;inf=010 or nan=011
62	beqs monadic //then branch
63	// ;else denorm
64	// HANDLE DESTINATION DENORM HERE
65	// ;set dtag to norm
66	// ;write the tag & fpte15 to the fstack
67	leal FPTEMP(%a6),%a0
68
69	bclrb #sign_bit,LOCAL_EX(%a0)
70	sne LOCAL_SGN(%a0)
71
72	bsr nrm_set //normalize number (exp will go negative)
73	bclrb #sign_bit,LOCAL_EX(%a0) //get rid of false sign
74	bfclr LOCAL_SGN(%a0){#0:#8} //change back to IEEE ext format
75	beqs dpos
76	bsetb #sign_bit,LOCAL_EX(%a0)
77	dpos:
78	bfclr DTAG(%a6){#0:#4} //set tag to normalized, FPTE15 = 0
79	bsetb #4,DTAG(%a6) //set FPTE15
80	orb #0x0f,DNRM_FLG(%a6)
81	monadic:
82	leal ETEMP(%a6),%a0
83	btstb #direction_bit,CMDREG1B(%a6) //check direction
84	bne opclass3 //it is a mv out
85	//
86	// At this point, only opclass 0 and 2 possible
87	//
88	btstb #7,STAG(%a6) //if sop = norm=000, zero=001,
89	// ;inf=010 or nan=011
90	bne mon_dnrm //else denorm
91	tstb DY_MO_FLG(%a6) //all cases of dyadic instructions would
92	bne normal //require normalization of denorm
93
94	// At this point:
95	// monadic instructions: fabs = $18 fneg = $1a ftst = $3a
96	// fmove = $00 fsmove = $40 fdmove = $44
97	// fsqrt = $05* fssqrt = $41 fdsqrt = $45
98	// (*fsqrt reencoded to $05)
99	//
100	movew CMDREG1B(%a6),%d0 //get command register
101	andil #0x7f,%d0 //strip to only command word
102	//
103	// At this point, fabs, fneg, fsmove, fdmove, ftst, fsqrt, fssqrt, and
104	// fdsqrt are possible.
105	// For cases fabs, fneg, fsmove, and fdmove goto spos (do not normalize)
106	// For cases fsqrt, fssqrt, and fdsqrt goto nrm_src (do normalize)
107	//
108	btstl #0,%d0
109	bne normal //weed out fsqrt instructions
110	//
111	// cu_norm handles fmove in instructions with normalized inputs.
112	// The routine round is used to correctly round the input for the
113	// destination precision and mode.
114	//
115	cu_norm:
116	st CU_ONLY(%a6) //set cu-only inst flag
117	movew CMDREG1B(%a6),%d0
118	andib #0x3b,%d0 //isolate bits to select inst
119	tstb %d0
120	beql cu_nmove //if zero, it is an fmove
121	cmpib #0x18,%d0
122	beql cu_nabs //if $18, it is fabs
123	cmpib #0x1a,%d0
124	beql cu_nneg //if $1a, it is fneg
125	//
126	// Inst is ftst. Check the source operand and set the cc's accordingly.
127	// No write is done, so simply rts.
128	//
129	cu_ntst:
130	movew LOCAL_EX(%a0),%d0
131	bclrl #15,%d0
132	sne LOCAL_SGN(%a0)
133	beqs cu_ntpo
134	orl #neg_mask,USER_FPSR(%a6) //set N
135	cu_ntpo:
136	cmpiw #0x7fff,%d0 //test for inf/nan
137	bnes cu_ntcz
138	tstl LOCAL_HI(%a0)
139	bnes cu_ntn
140	tstl LOCAL_LO(%a0)
141	bnes cu_ntn
142	orl #inf_mask,USER_FPSR(%a6)
143	rts
144	cu_ntn:
145	orl #nan_mask,USER_FPSR(%a6)
146	movel ETEMP_EX(%a6),FPTEMP_EX(%a6) //set up fptemp sign for
147	// ;snan handler
148
149	rts
150	cu_ntcz:
151	tstl LOCAL_HI(%a0)
152	bnel cu_ntsx
153	tstl LOCAL_LO(%a0)
154	bnel cu_ntsx
155	orl #z_mask,USER_FPSR(%a6)
156	cu_ntsx:
157	rts
158	//
159	// Inst is fabs. Execute the absolute value function on the input.
160	// Branch to the fmove code. If the operand is NaN, do nothing.
161	//
162	cu_nabs:
163	moveb STAG(%a6),%d0
164	btstl #5,%d0 //test for NaN or zero
165	bne wr_etemp //if either, simply write it
166	bclrb #7,LOCAL_EX(%a0) //do abs
167	bras cu_nmove //fmove code will finish
168	//
169	// Inst is fneg. Execute the negate value function on the input.
170	// Fall though to the fmove code. If the operand is NaN, do nothing.
171	//
172	cu_nneg:
173	moveb STAG(%a6),%d0
174	btstl #5,%d0 //test for NaN or zero
175	bne wr_etemp //if either, simply write it
176	bchgb #7,LOCAL_EX(%a0) //do neg
177	//
178	// Inst is fmove. This code also handles all result writes.
179	// If bit 2 is set, round is forced to double. If it is clear,
180	// and bit 6 is set, round is forced to single. If both are clear,
181	// the round precision is found in the fpcr. If the rounding precision
182	// is double or single, round the result before the write.
183	//
184	cu_nmove:
185	moveb STAG(%a6),%d0
186	andib #0xe0,%d0 //isolate stag bits
187	bne wr_etemp //if not norm, simply write it
188	btstb #2,CMDREG1B+1(%a6) //check for rd
189	bne cu_nmrd
190	btstb #6,CMDREG1B+1(%a6) //check for rs
191	bne cu_nmrs
192	//
193	// The move or operation is not with forced precision. Test for
194	// nan or inf as the input; if so, simply write it to FPn. Use the
195	// FPCR_MODE byte to get rounding on norms and zeros.
196	//
197	cu_nmnr:
198	bfextu FPCR_MODE(%a6){#0:#2},%d0
199	tstb %d0 //check for extended
200	beq cu_wrexn //if so, just write result
201	cmpib #1,%d0 //check for single
202	beq cu_nmrs //fall through to double
203	//
204	// The move is fdmove or round precision is double.
205	//
206	cu_nmrd:
207	movel #2,%d0 //set up the size for denorm
208	movew LOCAL_EX(%a0),%d1 //compare exponent to double threshold
209	andw #0x7fff,%d1
210	cmpw #0x3c01,%d1
211	bls cu_nunfl
212	bfextu FPCR_MODE(%a6){#2:#2},%d1 //get rmode
213	orl #0x00020000,%d1 //or in rprec (double)
214	clrl %d0 //clear g,r,s for round
215	bclrb #sign_bit,LOCAL_EX(%a0) //convert to internal format
216	sne LOCAL_SGN(%a0)
217	bsrl round
218	bfclr LOCAL_SGN(%a0){#0:#8}
219	beqs cu_nmrdc
220	bsetb #sign_bit,LOCAL_EX(%a0)
221	cu_nmrdc:
222	movew LOCAL_EX(%a0),%d1 //check for overflow
223	andw #0x7fff,%d1
224	cmpw #0x43ff,%d1
225	bge cu_novfl //take care of overflow case
226	bra cu_wrexn
227	//
228	// The move is fsmove or round precision is single.
229	//
230	cu_nmrs:
231	movel #1,%d0
232	movew LOCAL_EX(%a0),%d1
233	andw #0x7fff,%d1
234	cmpw #0x3f81,%d1
235	bls cu_nunfl
236	bfextu FPCR_MODE(%a6){#2:#2},%d1
237	orl #0x00010000,%d1
238	clrl %d0
239	bclrb #sign_bit,LOCAL_EX(%a0)
240	sne LOCAL_SGN(%a0)
241	bsrl round
242	bfclr LOCAL_SGN(%a0){#0:#8}
243	beqs cu_nmrsc
244	bsetb #sign_bit,LOCAL_EX(%a0)
245	cu_nmrsc:
246	movew LOCAL_EX(%a0),%d1
247	andw #0x7FFF,%d1
248	cmpw #0x407f,%d1
249	blt cu_wrexn
250	//
251	// The operand is above precision boundaries. Use t_ovfl to
252	// generate the correct value.
253	//
254	cu_novfl:
255	bsr t_ovfl
256	bra cu_wrexn
257	//
258	// The operand is below precision boundaries. Use denorm to
259	// generate the correct value.
260	//
261	cu_nunfl:
262	bclrb #sign_bit,LOCAL_EX(%a0)
263	sne LOCAL_SGN(%a0)
264	bsr denorm
265	bfclr LOCAL_SGN(%a0){#0:#8} //change back to IEEE ext format
266	beqs cu_nucont
267	bsetb #sign_bit,LOCAL_EX(%a0)
268	cu_nucont:
269	bfextu FPCR_MODE(%a6){#2:#2},%d1
270	btstb #2,CMDREG1B+1(%a6) //check for rd
271	bne inst_d
272	btstb #6,CMDREG1B+1(%a6) //check for rs
273	bne inst_s
274	swap %d1
275	moveb FPCR_MODE(%a6),%d1
276	lsrb #6,%d1
277	swap %d1
278	bra inst_sd
279	inst_d:
280	orl #0x00020000,%d1
281	bra inst_sd
282	inst_s:
283	orl #0x00010000,%d1
284	inst_sd:
285	bclrb #sign_bit,LOCAL_EX(%a0)
286	sne LOCAL_SGN(%a0)
287	bsrl round
288	bfclr LOCAL_SGN(%a0){#0:#8}
289	beqs cu_nuflp
290	bsetb #sign_bit,LOCAL_EX(%a0)
291	cu_nuflp:
292	btstb #inex2_bit,FPSR_EXCEPT(%a6)
293	beqs cu_nuninx
294	orl #aunfl_mask,USER_FPSR(%a6) //if the round was inex, set AUNFL
295	cu_nuninx:
296	tstl LOCAL_HI(%a0) //test for zero
297	bnes cu_nunzro
298	tstl LOCAL_LO(%a0)
299	bnes cu_nunzro
300	//
301	// The mantissa is zero from the denorm loop. Check sign and rmode
302	// to see if rounding should have occurred which would leave the lsb.
303	//
304	movel USER_FPCR(%a6),%d0
305	andil #0x30,%d0 //isolate rmode
306	cmpil #0x20,%d0
307	blts cu_nzro
308	bnes cu_nrp
309	cu_nrm:
310	tstw LOCAL_EX(%a0) //if positive, set lsb
311	bges cu_nzro
312	btstb #7,FPCR_MODE(%a6) //check for double
313	beqs cu_nincs
314	bras cu_nincd
315	cu_nrp:
316	tstw LOCAL_EX(%a0) //if positive, set lsb
317	blts cu_nzro
318	btstb #7,FPCR_MODE(%a6) //check for double
319	beqs cu_nincs
320	cu_nincd:
321	orl #0x800,LOCAL_LO(%a0) //inc for double
322	bra cu_nunzro
323	cu_nincs:
324	orl #0x100,LOCAL_HI(%a0) //inc for single
325	bra cu_nunzro
326	cu_nzro:
327	orl #z_mask,USER_FPSR(%a6)
328	moveb STAG(%a6),%d0
329	andib #0xe0,%d0
330	cmpib #0x40,%d0 //check if input was tagged zero
331	beqs cu_numv
332	cu_nunzro:
333	orl #unfl_mask,USER_FPSR(%a6) //set unfl
334	cu_numv:
335	movel (%a0),ETEMP(%a6)
336	movel 4(%a0),ETEMP_HI(%a6)
337	movel 8(%a0),ETEMP_LO(%a6)
338	//
339	// Write the result to memory, setting the fpsr cc bits. NaN and Inf
340	// bypass cu_wrexn.
341	//
342	cu_wrexn:
343	tstw LOCAL_EX(%a0) //test for zero
344	beqs cu_wrzero
345	cmpw #0x8000,LOCAL_EX(%a0) //test for zero
346	bnes cu_wreon
347	cu_wrzero:
348	orl #z_mask,USER_FPSR(%a6) //set Z bit
349	cu_wreon:
350	tstw LOCAL_EX(%a0)
351	bpl wr_etemp
352	orl #neg_mask,USER_FPSR(%a6)
353	bra wr_etemp
354
355	//
356	// HANDLE SOURCE DENORM HERE
357	//
358	// ;clear denorm stag to norm
359	// ;write the new tag & ete15 to the fstack
360	mon_dnrm:
361	//
362	// At this point, check for the cases in which normalizing the
363	// denorm produces incorrect results.
364	//
365	tstb DY_MO_FLG(%a6) //all cases of dyadic instructions would
366	bnes nrm_src //require normalization of denorm
367
368	// At this point:
369	// monadic instructions: fabs = $18 fneg = $1a ftst = $3a
370	// fmove = $00 fsmove = $40 fdmove = $44
371	// fsqrt = $05* fssqrt = $41 fdsqrt = $45
372	// (*fsqrt reencoded to $05)
373	//
374	movew CMDREG1B(%a6),%d0 //get command register
375	andil #0x7f,%d0 //strip to only command word
376	//
377	// At this point, fabs, fneg, fsmove, fdmove, ftst, fsqrt, fssqrt, and
378	// fdsqrt are possible.
379	// For cases fabs, fneg, fsmove, and fdmove goto spos (do not normalize)
380	// For cases fsqrt, fssqrt, and fdsqrt goto nrm_src (do normalize)
381	//
382	btstl #0,%d0
383	bnes nrm_src //weed out fsqrt instructions
384	st CU_ONLY(%a6) //set cu-only inst flag
385	bra cu_dnrm //fmove, fabs, fneg, ftst
386	// ;cases go to cu_dnrm
387	nrm_src:
388	bclrb #sign_bit,LOCAL_EX(%a0)
389	sne LOCAL_SGN(%a0)
390	bsr nrm_set //normalize number (exponent will go
391	// ; negative)
392	bclrb #sign_bit,LOCAL_EX(%a0) //get rid of false sign
393
394	bfclr LOCAL_SGN(%a0){#0:#8} //change back to IEEE ext format
395	beqs spos
396	bsetb #sign_bit,LOCAL_EX(%a0)
397	spos:
398	bfclr STAG(%a6){#0:#4} //set tag to normalized, FPTE15 = 0
399	bsetb #4,STAG(%a6) //set ETE15
400	orb #0xf0,DNRM_FLG(%a6)
401	normal:
402	tstb DNRM_FLG(%a6) //check if any of the ops were denorms
403	bne ck_wrap //if so, check if it is a potential
404	// ;wrap-around case
405	fix_stk:
406	moveb #0xfe,CU_SAVEPC(%a6)
407	bclrb #E1,E_BYTE(%a6)
408
409	clrw NMNEXC(%a6)
410
411	st RES_FLG(%a6) //indicate that a restore is needed
412	rts
413
414	//
415	// cu_dnrm handles all cu-only instructions (fmove, fabs, fneg, and
416	// ftst) completely in software without an frestore to the 040.
417	//
418	cu_dnrm:
419	st CU_ONLY(%a6)
420	movew CMDREG1B(%a6),%d0
421	andib #0x3b,%d0 //isolate bits to select inst
422	tstb %d0
423	beql cu_dmove //if zero, it is an fmove
424	cmpib #0x18,%d0
425	beql cu_dabs //if $18, it is fabs
426	cmpib #0x1a,%d0
427	beql cu_dneg //if $1a, it is fneg
428	//
429	// Inst is ftst. Check the source operand and set the cc's accordingly.
430	// No write is done, so simply rts.
431	//
432	cu_dtst:
433	movew LOCAL_EX(%a0),%d0
434	bclrl #15,%d0
435	sne LOCAL_SGN(%a0)
436	beqs cu_dtpo
437	orl #neg_mask,USER_FPSR(%a6) //set N
438	cu_dtpo:
439	cmpiw #0x7fff,%d0 //test for inf/nan
440	bnes cu_dtcz
441	tstl LOCAL_HI(%a0)
442	bnes cu_dtn
443	tstl LOCAL_LO(%a0)
444	bnes cu_dtn
445	orl #inf_mask,USER_FPSR(%a6)
446	rts
447	cu_dtn:
448	orl #nan_mask,USER_FPSR(%a6)
449	movel ETEMP_EX(%a6),FPTEMP_EX(%a6) //set up fptemp sign for
450	// ;snan handler
451	rts
452	cu_dtcz:
453	tstl LOCAL_HI(%a0)
454	bnel cu_dtsx
455	tstl LOCAL_LO(%a0)
456	bnel cu_dtsx
457	orl #z_mask,USER_FPSR(%a6)
458	cu_dtsx:
459	rts
460	//
461	// Inst is fabs. Execute the absolute value function on the input.
462	// Branch to the fmove code.
463	//
464	cu_dabs:
465	bclrb #7,LOCAL_EX(%a0) //do abs
466	bras cu_dmove //fmove code will finish
467	//
468	// Inst is fneg. Execute the negate value function on the input.
469	// Fall though to the fmove code.
470	//
471	cu_dneg:
472	bchgb #7,LOCAL_EX(%a0) //do neg
473	//
474	// Inst is fmove. This code also handles all result writes.
475	// If bit 2 is set, round is forced to double. If it is clear,
476	// and bit 6 is set, round is forced to single. If both are clear,
477	// the round precision is found in the fpcr. If the rounding precision
478	// is double or single, the result is zero, and the mode is checked
479	// to determine if the lsb of the result should be set.
480	//
481	cu_dmove:
482	btstb #2,CMDREG1B+1(%a6) //check for rd
483	bne cu_dmrd
484	btstb #6,CMDREG1B+1(%a6) //check for rs
485	bne cu_dmrs
486	//
487	// The move or operation is not with forced precision. Use the
488	// FPCR_MODE byte to get rounding.
489	//
490	cu_dmnr:
491	bfextu FPCR_MODE(%a6){#0:#2},%d0
492	tstb %d0 //check for extended
493	beq cu_wrexd //if so, just write result
494	cmpib #1,%d0 //check for single
495	beq cu_dmrs //fall through to double
496	//
497	// The move is fdmove or round precision is double. Result is zero.
498	// Check rmode for rp or rm and set lsb accordingly.
499	//
500	cu_dmrd:
501	bfextu FPCR_MODE(%a6){#2:#2},%d1 //get rmode
502	tstw LOCAL_EX(%a0) //check sign
503	blts cu_dmdn
504	cmpib #3,%d1 //check for rp
505	bne cu_dpd //load double pos zero
506	bra cu_dpdr //load double pos zero w/lsb
507	cu_dmdn:
508	cmpib #2,%d1 //check for rm
509	bne cu_dnd //load double neg zero
510	bra cu_dndr //load double neg zero w/lsb
511	//
512	// The move is fsmove or round precision is single. Result is zero.
513	// Check for rp or rm and set lsb accordingly.
514	//
515	cu_dmrs:
516	bfextu FPCR_MODE(%a6){#2:#2},%d1 //get rmode
517	tstw LOCAL_EX(%a0) //check sign
518	blts cu_dmsn
519	cmpib #3,%d1 //check for rp
520	bne cu_spd //load single pos zero
521	bra cu_spdr //load single pos zero w/lsb
522	cu_dmsn:
523	cmpib #2,%d1 //check for rm
524	bne cu_snd //load single neg zero
525	bra cu_sndr //load single neg zero w/lsb
526	//
527	// The precision is extended, so the result in etemp is correct.
528	// Simply set unfl (not inex2 or aunfl) and write the result to
529	// the correct fp register.
530	cu_wrexd:
531	orl #unfl_mask,USER_FPSR(%a6)
532	tstw LOCAL_EX(%a0)
533	beq wr_etemp
534	orl #neg_mask,USER_FPSR(%a6)
535	bra wr_etemp
536	//
537	// These routines write +/- zero in double format. The routines
538	// cu_dpdr and cu_dndr set the double lsb.
539	//
540	cu_dpd:
541	movel #0x3c010000,LOCAL_EX(%a0) //force pos double zero
542	clrl LOCAL_HI(%a0)
543	clrl LOCAL_LO(%a0)
544	orl #z_mask,USER_FPSR(%a6)
545	orl #unfinx_mask,USER_FPSR(%a6)
546	bra wr_etemp
547	cu_dpdr:
548	movel #0x3c010000,LOCAL_EX(%a0) //force pos double zero
549	clrl LOCAL_HI(%a0)
550	movel #0x800,LOCAL_LO(%a0) //with lsb set
551	orl #unfinx_mask,USER_FPSR(%a6)
552	bra wr_etemp
553	cu_dnd:
554	movel #0xbc010000,LOCAL_EX(%a0) //force pos double zero
555	clrl LOCAL_HI(%a0)
556	clrl LOCAL_LO(%a0)
557	orl #z_mask,USER_FPSR(%a6)
558	orl #neg_mask,USER_FPSR(%a6)
559	orl #unfinx_mask,USER_FPSR(%a6)
560	bra wr_etemp
561	cu_dndr:
562	movel #0xbc010000,LOCAL_EX(%a0) //force pos double zero
563	clrl LOCAL_HI(%a0)
564	movel #0x800,LOCAL_LO(%a0) //with lsb set
565	orl #neg_mask,USER_FPSR(%a6)
566	orl #unfinx_mask,USER_FPSR(%a6)
567	bra wr_etemp
568	//
569	// These routines write +/- zero in single format. The routines
570	// cu_dpdr and cu_dndr set the single lsb.
571	//
572	cu_spd:
573	movel #0x3f810000,LOCAL_EX(%a0) //force pos single zero
574	clrl LOCAL_HI(%a0)
575	clrl LOCAL_LO(%a0)
576	orl #z_mask,USER_FPSR(%a6)
577	orl #unfinx_mask,USER_FPSR(%a6)
578	bra wr_etemp
579	cu_spdr:
580	movel #0x3f810000,LOCAL_EX(%a0) //force pos single zero
581	movel #0x100,LOCAL_HI(%a0) //with lsb set
582	clrl LOCAL_LO(%a0)
583	orl #unfinx_mask,USER_FPSR(%a6)
584	bra wr_etemp
585	cu_snd:
586	movel #0xbf810000,LOCAL_EX(%a0) //force pos single zero
587	clrl LOCAL_HI(%a0)
588	clrl LOCAL_LO(%a0)
589	orl #z_mask,USER_FPSR(%a6)
590	orl #neg_mask,USER_FPSR(%a6)
591	orl #unfinx_mask,USER_FPSR(%a6)
592	bra wr_etemp
593	cu_sndr:
594	movel #0xbf810000,LOCAL_EX(%a0) //force pos single zero
595	movel #0x100,LOCAL_HI(%a0) //with lsb set
596	clrl LOCAL_LO(%a0)
597	orl #neg_mask,USER_FPSR(%a6)
598	orl #unfinx_mask,USER_FPSR(%a6)
599	bra wr_etemp
600
601	//
602	// This code checks for 16-bit overflow conditions on dyadic
603	// operations which are not restorable into the floating-point
604	// unit and must be completed in software. Basically, this
605	// condition exists with a very large norm and a denorm. One
606	// of the operands must be denormalized to enter this code.
607	//
608	// Flags used:
609	// DY_MO_FLG contains 0 for monadic op, $ff for dyadic
610	// DNRM_FLG contains $00 for neither op denormalized
611	// $0f for the destination op denormalized
612	// $f0 for the source op denormalized
613	// $ff for both ops denormalized
614	//
615	// The wrap-around condition occurs for add, sub, div, and cmp
616	// when
617	//
618	// abs(dest_exp - src_exp) >= $8000
619	//
620	// and for mul when
621	//
622	// (dest_exp + src_exp) < $0
623	//
624	// we must process the operation here if this case is true.
625	//
626	// The rts following the frcfpn routine is the exit from res_func
627	// for this condition. The restore flag (RES_FLG) is left clear.
628	// No frestore is done unless an exception is to be reported.
629	//
630	// For fadd:
631	// if(sign_of(dest) != sign_of(src))
632	// replace exponent of src with $3fff (keep sign)
633	// use fpu to perform dest+new_src (user's rmode and X)
634	// clr sticky
635	// else
636	// set sticky
637	// call round with user's precision and mode
638	// move result to fpn and wbtemp
639	//
640	// For fsub:
641	// if(sign_of(dest) == sign_of(src))
642	// replace exponent of src with $3fff (keep sign)
643	// use fpu to perform dest+new_src (user's rmode and X)
644	// clr sticky
645	// else
646	// set sticky
647	// call round with user's precision and mode
648	// move result to fpn and wbtemp
649	//
650	// For fdiv/fsgldiv:
651	// if(both operands are denorm)
652	// restore_to_fpu;
653	// if(dest is norm)
654	// force_ovf;
655	// else(dest is denorm)
656	// force_unf:
657	//
658	// For fcmp:
659	// if(dest is norm)
660	// N = sign_of(dest);
661	// else(dest is denorm)
662	// N = sign_of(src);
663	//
664	// For fmul:
665	// if(both operands are denorm)
666	// force_unf;
667	// if((dest_exp + src_exp) < 0)
668	// force_unf:
669	// else
670	// restore_to_fpu;
671	//
672	// local equates:
673	.set addcode,0x22
674	.set subcode,0x28
675	.set mulcode,0x23
676	.set divcode,0x20
677	.set cmpcode,0x38
678	ck_wrap:
679	\| tstb DY_MO_FLG(%a6) ;check for fsqrt
680	beq fix_stk //if zero, it is fsqrt
681	movew CMDREG1B(%a6),%d0
682	andiw #0x3b,%d0 //strip to command bits
683	cmpiw #addcode,%d0
684	beq wrap_add
685	cmpiw #subcode,%d0
686	beq wrap_sub
687	cmpiw #mulcode,%d0
688	beq wrap_mul
689	cmpiw #cmpcode,%d0
690	beq wrap_cmp
691	//
692	// Inst is fdiv.
693	//
694	wrap_div:
695	cmpb #0xff,DNRM_FLG(%a6) //if both ops denorm,
696	beq fix_stk //restore to fpu
697	//
698	// One of the ops is denormalized. Test for wrap condition
699	// and force the result.
700	//
701	cmpb #0x0f,DNRM_FLG(%a6) //check for dest denorm
702	bnes div_srcd
703	div_destd:
704	bsrl ckinf_ns
705	bne fix_stk
706	bfextu ETEMP_EX(%a6){#1:#15},%d0 //get src exp (always pos)
707	bfexts FPTEMP_EX(%a6){#1:#15},%d1 //get dest exp (always neg)
708	subl %d1,%d0 //subtract dest from src
709	cmpl #0x7fff,%d0
710	blt fix_stk //if less, not wrap case
711	clrb WBTEMP_SGN(%a6)
712	movew ETEMP_EX(%a6),%d0 //find the sign of the result
713	movew FPTEMP_EX(%a6),%d1
714	eorw %d1,%d0
715	andiw #0x8000,%d0
716	beq force_unf
717	st WBTEMP_SGN(%a6)
718	bra force_unf
719
720	ckinf_ns:
721	moveb STAG(%a6),%d0 //check source tag for inf or nan
722	bra ck_in_com
723	ckinf_nd:
724	moveb DTAG(%a6),%d0 //check destination tag for inf or nan
725	ck_in_com:
726	andib #0x60,%d0 //isolate tag bits
727	cmpb #0x40,%d0 //is it inf?
728	beq nan_or_inf //not wrap case
729	cmpb #0x60,%d0 //is it nan?
730	beq nan_or_inf //yes, not wrap case?
731	cmpb #0x20,%d0 //is it a zero?
732	beq nan_or_inf //yes
733	clrl %d0
734	rts //then ; it is either a zero of norm,
735	// ;check wrap case
736	nan_or_inf:
737	moveql #-1,%d0
738	rts
739
740
741
742	div_srcd:
743	bsrl ckinf_nd
744	bne fix_stk
745	bfextu FPTEMP_EX(%a6){#1:#15},%d0 //get dest exp (always pos)
746	bfexts ETEMP_EX(%a6){#1:#15},%d1 //get src exp (always neg)
747	subl %d1,%d0 //subtract src from dest
748	cmpl #0x8000,%d0
749	blt fix_stk //if less, not wrap case
750	clrb WBTEMP_SGN(%a6)
751	movew ETEMP_EX(%a6),%d0 //find the sign of the result
752	movew FPTEMP_EX(%a6),%d1
753	eorw %d1,%d0
754	andiw #0x8000,%d0
755	beqs force_ovf
756	st WBTEMP_SGN(%a6)
757	//
758	// This code handles the case of the instruction resulting in
759	// an overflow condition.
760	//
761	force_ovf:
762	bclrb #E1,E_BYTE(%a6)
763	orl #ovfl_inx_mask,USER_FPSR(%a6)
764	clrw NMNEXC(%a6)
765	leal WBTEMP(%a6),%a0 //point a0 to memory location
766	movew CMDREG1B(%a6),%d0
767	btstl #6,%d0 //test for forced precision
768	beqs frcovf_fpcr
769	btstl #2,%d0 //check for double
770	bnes frcovf_dbl
771	movel #0x1,%d0 //inst is forced single
772	bras frcovf_rnd
773	frcovf_dbl:
774	movel #0x2,%d0 //inst is forced double
775	bras frcovf_rnd
776	frcovf_fpcr:
777	bfextu FPCR_MODE(%a6){#0:#2},%d0 //inst not forced - use fpcr prec
778	frcovf_rnd:
779
780	// The 881/882 does not set inex2 for the following case, so the
781	// line is commented out to be compatible with 881/882
782	// tst.b %d0
783	// beq.b frcovf_x
784	// or.l #inex2_mask,USER_FPSR(%a6) ;if prec is s or d, set inex2
785
786	//frcovf_x:
787	bsrl ovf_res //get correct result based on
788	// ;round precision/mode. This
789	// ;sets FPSR_CC correctly
790	// ;returns in external format
791	bfclr WBTEMP_SGN(%a6){#0:#8}
792	beq frcfpn
793	bsetb #sign_bit,WBTEMP_EX(%a6)
794	bra frcfpn
795	//
796	// Inst is fadd.
797	//
798	wrap_add:
799	cmpb #0xff,DNRM_FLG(%a6) //if both ops denorm,
800	beq fix_stk //restore to fpu
801	//
802	// One of the ops is denormalized. Test for wrap condition
803	// and complete the instruction.
804	//
805	cmpb #0x0f,DNRM_FLG(%a6) //check for dest denorm
806	bnes add_srcd
807	add_destd:
808	bsrl ckinf_ns
809	bne fix_stk
810	bfextu ETEMP_EX(%a6){#1:#15},%d0 //get src exp (always pos)
811	bfexts FPTEMP_EX(%a6){#1:#15},%d1 //get dest exp (always neg)
812	subl %d1,%d0 //subtract dest from src
813	cmpl #0x8000,%d0
814	blt fix_stk //if less, not wrap case
815	bra add_wrap
816	add_srcd:
817	bsrl ckinf_nd
818	bne fix_stk
819	bfextu FPTEMP_EX(%a6){#1:#15},%d0 //get dest exp (always pos)
820	bfexts ETEMP_EX(%a6){#1:#15},%d1 //get src exp (always neg)
821	subl %d1,%d0 //subtract src from dest
822	cmpl #0x8000,%d0
823	blt fix_stk //if less, not wrap case
824	//
825	// Check the signs of the operands. If they are unlike, the fpu
826	// can be used to add the norm and 1.0 with the sign of the
827	// denorm and it will correctly generate the result in extended
828	// precision. We can then call round with no sticky and the result
829	// will be correct for the user's rounding mode and precision. If
830	// the signs are the same, we call round with the sticky bit set
831	// and the result will be correct for the user's rounding mode and
832	// precision.
833	//
834	add_wrap:
835	movew ETEMP_EX(%a6),%d0
836	movew FPTEMP_EX(%a6),%d1
837	eorw %d1,%d0
838	andiw #0x8000,%d0
839	beq add_same
840	//
841	// The signs are unlike.
842	//
843	cmpb #0x0f,DNRM_FLG(%a6) //is dest the denorm?
844	bnes add_u_srcd
845	movew FPTEMP_EX(%a6),%d0
846	andiw #0x8000,%d0
847	orw #0x3fff,%d0 //force the exponent to +/- 1
848	movew %d0,FPTEMP_EX(%a6) //in the denorm
849	movel USER_FPCR(%a6),%d0
850	andil #0x30,%d0
851	fmovel %d0,%fpcr //set up users rmode and X
852	fmovex ETEMP(%a6),%fp0
853	faddx FPTEMP(%a6),%fp0
854	leal WBTEMP(%a6),%a0 //point a0 to wbtemp in frame
855	fmovel %fpsr,%d1
856	orl %d1,USER_FPSR(%a6) //capture cc's and inex from fadd
857	fmovex %fp0,WBTEMP(%a6) //write result to memory
858	lsrl #4,%d0 //put rmode in lower 2 bits
859	movel USER_FPCR(%a6),%d1
860	andil #0xc0,%d1
861	lsrl #6,%d1 //put precision in upper word
862	swap %d1
863	orl %d0,%d1 //set up for round call
864	clrl %d0 //force sticky to zero
865	bclrb #sign_bit,WBTEMP_EX(%a6)
866	sne WBTEMP_SGN(%a6)
867	bsrl round //round result to users rmode & prec
868	bfclr WBTEMP_SGN(%a6){#0:#8} //convert back to IEEE ext format
869	beq frcfpnr
870	bsetb #sign_bit,WBTEMP_EX(%a6)
871	bra frcfpnr
872	add_u_srcd:
873	movew ETEMP_EX(%a6),%d0
874	andiw #0x8000,%d0
875	orw #0x3fff,%d0 //force the exponent to +/- 1
876	movew %d0,ETEMP_EX(%a6) //in the denorm
877	movel USER_FPCR(%a6),%d0
878	andil #0x30,%d0
879	fmovel %d0,%fpcr //set up users rmode and X
880	fmovex ETEMP(%a6),%fp0
881	faddx FPTEMP(%a6),%fp0
882	fmovel %fpsr,%d1
883	orl %d1,USER_FPSR(%a6) //capture cc's and inex from fadd
884	leal WBTEMP(%a6),%a0 //point a0 to wbtemp in frame
885	fmovex %fp0,WBTEMP(%a6) //write result to memory
886	lsrl #4,%d0 //put rmode in lower 2 bits
887	movel USER_FPCR(%a6),%d1
888	andil #0xc0,%d1
889	lsrl #6,%d1 //put precision in upper word
890	swap %d1
891	orl %d0,%d1 //set up for round call
892	clrl %d0 //force sticky to zero
893	bclrb #sign_bit,WBTEMP_EX(%a6)
894	sne WBTEMP_SGN(%a6) //use internal format for round
895	bsrl round //round result to users rmode & prec
896	bfclr WBTEMP_SGN(%a6){#0:#8} //convert back to IEEE ext format
897	beq frcfpnr
898	bsetb #sign_bit,WBTEMP_EX(%a6)
899	bra frcfpnr
900	//
901	// Signs are alike:
902	//
903	add_same:
904	cmpb #0x0f,DNRM_FLG(%a6) //is dest the denorm?
905	bnes add_s_srcd
906	add_s_destd:
907	leal ETEMP(%a6),%a0
908	movel USER_FPCR(%a6),%d0
909	andil #0x30,%d0
910	lsrl #4,%d0 //put rmode in lower 2 bits
911	movel USER_FPCR(%a6),%d1
912	andil #0xc0,%d1
913	lsrl #6,%d1 //put precision in upper word
914	swap %d1
915	orl %d0,%d1 //set up for round call
916	movel #0x20000000,%d0 //set sticky for round
917	bclrb #sign_bit,ETEMP_EX(%a6)
918	sne ETEMP_SGN(%a6)
919	bsrl round //round result to users rmode & prec
920	bfclr ETEMP_SGN(%a6){#0:#8} //convert back to IEEE ext format
921	beqs add_s_dclr
922	bsetb #sign_bit,ETEMP_EX(%a6)
923	add_s_dclr:
924	leal WBTEMP(%a6),%a0
925	movel ETEMP(%a6),(%a0) //write result to wbtemp
926	movel ETEMP_HI(%a6),4(%a0)
927	movel ETEMP_LO(%a6),8(%a0)
928	tstw ETEMP_EX(%a6)
929	bgt add_ckovf
930	orl #neg_mask,USER_FPSR(%a6)
931	bra add_ckovf
932	add_s_srcd:
933	leal FPTEMP(%a6),%a0
934	movel USER_FPCR(%a6),%d0
935	andil #0x30,%d0
936	lsrl #4,%d0 //put rmode in lower 2 bits
937	movel USER_FPCR(%a6),%d1
938	andil #0xc0,%d1
939	lsrl #6,%d1 //put precision in upper word
940	swap %d1
941	orl %d0,%d1 //set up for round call
942	movel #0x20000000,%d0 //set sticky for round
943	bclrb #sign_bit,FPTEMP_EX(%a6)
944	sne FPTEMP_SGN(%a6)
945	bsrl round //round result to users rmode & prec
946	bfclr FPTEMP_SGN(%a6){#0:#8} //convert back to IEEE ext format
947	beqs add_s_sclr
948	bsetb #sign_bit,FPTEMP_EX(%a6)
949	add_s_sclr:
950	leal WBTEMP(%a6),%a0
951	movel FPTEMP(%a6),(%a0) //write result to wbtemp
952	movel FPTEMP_HI(%a6),4(%a0)
953	movel FPTEMP_LO(%a6),8(%a0)
954	tstw FPTEMP_EX(%a6)
955	bgt add_ckovf
956	orl #neg_mask,USER_FPSR(%a6)
957	add_ckovf:
958	movew WBTEMP_EX(%a6),%d0
959	andiw #0x7fff,%d0
960	cmpiw #0x7fff,%d0
961	bne frcfpnr
962	//
963	// The result has overflowed to $7fff exponent. Set I, ovfl,
964	// and aovfl, and clr the mantissa (incorrectly set by the
965	// round routine.)
966	//
967	orl #inf_mask+ovfl_inx_mask,USER_FPSR(%a6)
968	clrl 4(%a0)
969	bra frcfpnr
970	//
971	// Inst is fsub.
972	//
973	wrap_sub:
974	cmpb #0xff,DNRM_FLG(%a6) //if both ops denorm,
975	beq fix_stk //restore to fpu
976	//
977	// One of the ops is denormalized. Test for wrap condition
978	// and complete the instruction.
979	//
980	cmpb #0x0f,DNRM_FLG(%a6) //check for dest denorm
981	bnes sub_srcd
982	sub_destd:
983	bsrl ckinf_ns
984	bne fix_stk
985	bfextu ETEMP_EX(%a6){#1:#15},%d0 //get src exp (always pos)
986	bfexts FPTEMP_EX(%a6){#1:#15},%d1 //get dest exp (always neg)
987	subl %d1,%d0 //subtract src from dest
988	cmpl #0x8000,%d0
989	blt fix_stk //if less, not wrap case
990	bra sub_wrap
991	sub_srcd:
992	bsrl ckinf_nd
993	bne fix_stk
994	bfextu FPTEMP_EX(%a6){#1:#15},%d0 //get dest exp (always pos)
995	bfexts ETEMP_EX(%a6){#1:#15},%d1 //get src exp (always neg)
996	subl %d1,%d0 //subtract dest from src
997	cmpl #0x8000,%d0
998	blt fix_stk //if less, not wrap case
999	//
1000	// Check the signs of the operands. If they are alike, the fpu
1001	// can be used to subtract from the norm 1.0 with the sign of the
1002	// denorm and it will correctly generate the result in extended
1003	// precision. We can then call round with no sticky and the result
1004	// will be correct for the user's rounding mode and precision. If
1005	// the signs are unlike, we call round with the sticky bit set
1006	// and the result will be correct for the user's rounding mode and
1007	// precision.
1008	//
1009	sub_wrap:
1010	movew ETEMP_EX(%a6),%d0
1011	movew FPTEMP_EX(%a6),%d1
1012	eorw %d1,%d0
1013	andiw #0x8000,%d0
1014	bne sub_diff
1015	//
1016	// The signs are alike.
1017	//
1018	cmpb #0x0f,DNRM_FLG(%a6) //is dest the denorm?
1019	bnes sub_u_srcd
1020	movew FPTEMP_EX(%a6),%d0
1021	andiw #0x8000,%d0
1022	orw #0x3fff,%d0 //force the exponent to +/- 1
1023	movew %d0,FPTEMP_EX(%a6) //in the denorm
1024	movel USER_FPCR(%a6),%d0
1025	andil #0x30,%d0
1026	fmovel %d0,%fpcr //set up users rmode and X
1027	fmovex FPTEMP(%a6),%fp0
1028	fsubx ETEMP(%a6),%fp0
1029	fmovel %fpsr,%d1
1030	orl %d1,USER_FPSR(%a6) //capture cc's and inex from fadd
1031	leal WBTEMP(%a6),%a0 //point a0 to wbtemp in frame
1032	fmovex %fp0,WBTEMP(%a6) //write result to memory
1033	lsrl #4,%d0 //put rmode in lower 2 bits
1034	movel USER_FPCR(%a6),%d1
1035	andil #0xc0,%d1
1036	lsrl #6,%d1 //put precision in upper word
1037	swap %d1
1038	orl %d0,%d1 //set up for round call
1039	clrl %d0 //force sticky to zero
1040	bclrb #sign_bit,WBTEMP_EX(%a6)
1041	sne WBTEMP_SGN(%a6)
1042	bsrl round //round result to users rmode & prec
1043	bfclr WBTEMP_SGN(%a6){#0:#8} //convert back to IEEE ext format
1044	beq frcfpnr
1045	bsetb #sign_bit,WBTEMP_EX(%a6)
1046	bra frcfpnr
1047	sub_u_srcd:
1048	movew ETEMP_EX(%a6),%d0
1049	andiw #0x8000,%d0
1050	orw #0x3fff,%d0 //force the exponent to +/- 1
1051	movew %d0,ETEMP_EX(%a6) //in the denorm
1052	movel USER_FPCR(%a6),%d0
1053	andil #0x30,%d0
1054	fmovel %d0,%fpcr //set up users rmode and X
1055	fmovex FPTEMP(%a6),%fp0
1056	fsubx ETEMP(%a6),%fp0
1057	fmovel %fpsr,%d1
1058	orl %d1,USER_FPSR(%a6) //capture cc's and inex from fadd
1059	leal WBTEMP(%a6),%a0 //point a0 to wbtemp in frame
1060	fmovex %fp0,WBTEMP(%a6) //write result to memory
1061	lsrl #4,%d0 //put rmode in lower 2 bits
1062	movel USER_FPCR(%a6),%d1
1063	andil #0xc0,%d1
1064	lsrl #6,%d1 //put precision in upper word
1065	swap %d1
1066	orl %d0,%d1 //set up for round call
1067	clrl %d0 //force sticky to zero
1068	bclrb #sign_bit,WBTEMP_EX(%a6)
1069	sne WBTEMP_SGN(%a6)
1070	bsrl round //round result to users rmode & prec
1071	bfclr WBTEMP_SGN(%a6){#0:#8} //convert back to IEEE ext format
1072	beq frcfpnr
1073	bsetb #sign_bit,WBTEMP_EX(%a6)
1074	bra frcfpnr
1075	//
1076	// Signs are unlike:
1077	//
1078	sub_diff:
1079	cmpb #0x0f,DNRM_FLG(%a6) //is dest the denorm?
1080	bnes sub_s_srcd
1081	sub_s_destd:
1082	leal ETEMP(%a6),%a0
1083	movel USER_FPCR(%a6),%d0
1084	andil #0x30,%d0
1085	lsrl #4,%d0 //put rmode in lower 2 bits
1086	movel USER_FPCR(%a6),%d1
1087	andil #0xc0,%d1
1088	lsrl #6,%d1 //put precision in upper word
1089	swap %d1
1090	orl %d0,%d1 //set up for round call
1091	movel #0x20000000,%d0 //set sticky for round
1092	//
1093	// Since the dest is the denorm, the sign is the opposite of the
1094	// norm sign.
1095	//
1096	eoriw #0x8000,ETEMP_EX(%a6) //flip sign on result
1097	tstw ETEMP_EX(%a6)
1098	bgts sub_s_dwr
1099	orl #neg_mask,USER_FPSR(%a6)
1100	sub_s_dwr:
1101	bclrb #sign_bit,ETEMP_EX(%a6)
1102	sne ETEMP_SGN(%a6)
1103	bsrl round //round result to users rmode & prec
1104	bfclr ETEMP_SGN(%a6){#0:#8} //convert back to IEEE ext format
1105	beqs sub_s_dclr
1106	bsetb #sign_bit,ETEMP_EX(%a6)
1107	sub_s_dclr:
1108	leal WBTEMP(%a6),%a0
1109	movel ETEMP(%a6),(%a0) //write result to wbtemp
1110	movel ETEMP_HI(%a6),4(%a0)
1111	movel ETEMP_LO(%a6),8(%a0)
1112	bra sub_ckovf
1113	sub_s_srcd:
1114	leal FPTEMP(%a6),%a0
1115	movel USER_FPCR(%a6),%d0
1116	andil #0x30,%d0
1117	lsrl #4,%d0 //put rmode in lower 2 bits
1118	movel USER_FPCR(%a6),%d1
1119	andil #0xc0,%d1
1120	lsrl #6,%d1 //put precision in upper word
1121	swap %d1
1122	orl %d0,%d1 //set up for round call
1123	movel #0x20000000,%d0 //set sticky for round
1124	bclrb #sign_bit,FPTEMP_EX(%a6)
1125	sne FPTEMP_SGN(%a6)
1126	bsrl round //round result to users rmode & prec
1127	bfclr FPTEMP_SGN(%a6){#0:#8} //convert back to IEEE ext format
1128	beqs sub_s_sclr
1129	bsetb #sign_bit,FPTEMP_EX(%a6)
1130	sub_s_sclr:
1131	leal WBTEMP(%a6),%a0
1132	movel FPTEMP(%a6),(%a0) //write result to wbtemp
1133	movel FPTEMP_HI(%a6),4(%a0)
1134	movel FPTEMP_LO(%a6),8(%a0)
1135	tstw FPTEMP_EX(%a6)
1136	bgt sub_ckovf
1137	orl #neg_mask,USER_FPSR(%a6)
1138	sub_ckovf:
1139	movew WBTEMP_EX(%a6),%d0
1140	andiw #0x7fff,%d0
1141	cmpiw #0x7fff,%d0
1142	bne frcfpnr
1143	//
1144	// The result has overflowed to $7fff exponent. Set I, ovfl,
1145	// and aovfl, and clr the mantissa (incorrectly set by the
1146	// round routine.)
1147	//
1148	orl #inf_mask+ovfl_inx_mask,USER_FPSR(%a6)
1149	clrl 4(%a0)
1150	bra frcfpnr
1151	//
1152	// Inst is fcmp.
1153	//
1154	wrap_cmp:
1155	cmpb #0xff,DNRM_FLG(%a6) //if both ops denorm,
1156	beq fix_stk //restore to fpu
1157	//
1158	// One of the ops is denormalized. Test for wrap condition
1159	// and complete the instruction.
1160	//
1161	cmpb #0x0f,DNRM_FLG(%a6) //check for dest denorm
1162	bnes cmp_srcd
1163	cmp_destd:
1164	bsrl ckinf_ns
1165	bne fix_stk
1166	bfextu ETEMP_EX(%a6){#1:#15},%d0 //get src exp (always pos)
1167	bfexts FPTEMP_EX(%a6){#1:#15},%d1 //get dest exp (always neg)
1168	subl %d1,%d0 //subtract dest from src
1169	cmpl #0x8000,%d0
1170	blt fix_stk //if less, not wrap case
1171	tstw ETEMP_EX(%a6) //set N to ~sign_of(src)
1172	bge cmp_setn
1173	rts
1174	cmp_srcd:
1175	bsrl ckinf_nd
1176	bne fix_stk
1177	bfextu FPTEMP_EX(%a6){#1:#15},%d0 //get dest exp (always pos)
1178	bfexts ETEMP_EX(%a6){#1:#15},%d1 //get src exp (always neg)
1179	subl %d1,%d0 //subtract src from dest
1180	cmpl #0x8000,%d0
1181	blt fix_stk //if less, not wrap case
1182	tstw FPTEMP_EX(%a6) //set N to sign_of(dest)
1183	blt cmp_setn
1184	rts
1185	cmp_setn:
1186	orl #neg_mask,USER_FPSR(%a6)
1187	rts
1188
1189	//
1190	// Inst is fmul.
1191	//
1192	wrap_mul:
1193	cmpb #0xff,DNRM_FLG(%a6) //if both ops denorm,
1194	beq force_unf //force an underflow (really!)
1195	//
1196	// One of the ops is denormalized. Test for wrap condition
1197	// and complete the instruction.
1198	//
1199	cmpb #0x0f,DNRM_FLG(%a6) //check for dest denorm
1200	bnes mul_srcd
1201	mul_destd:
1202	bsrl ckinf_ns
1203	bne fix_stk
1204	bfextu ETEMP_EX(%a6){#1:#15},%d0 //get src exp (always pos)
1205	bfexts FPTEMP_EX(%a6){#1:#15},%d1 //get dest exp (always neg)
1206	addl %d1,%d0 //subtract dest from src
1207	bgt fix_stk
1208	bra force_unf
1209	mul_srcd:
1210	bsrl ckinf_nd
1211	bne fix_stk
1212	bfextu FPTEMP_EX(%a6){#1:#15},%d0 //get dest exp (always pos)
1213	bfexts ETEMP_EX(%a6){#1:#15},%d1 //get src exp (always neg)
1214	addl %d1,%d0 //subtract src from dest
1215	bgt fix_stk
1216
1217	//
1218	// This code handles the case of the instruction resulting in
1219	// an underflow condition.
1220	//
1221	force_unf:
1222	bclrb #E1,E_BYTE(%a6)
1223	orl #unfinx_mask,USER_FPSR(%a6)
1224	clrw NMNEXC(%a6)
1225	clrb WBTEMP_SGN(%a6)
1226	movew ETEMP_EX(%a6),%d0 //find the sign of the result
1227	movew FPTEMP_EX(%a6),%d1
1228	eorw %d1,%d0
1229	andiw #0x8000,%d0
1230	beqs frcunfcont
1231	st WBTEMP_SGN(%a6)
1232	frcunfcont:
1233	lea WBTEMP(%a6),%a0 //point a0 to memory location
1234	movew CMDREG1B(%a6),%d0
1235	btstl #6,%d0 //test for forced precision
1236	beqs frcunf_fpcr
1237	btstl #2,%d0 //check for double
1238	bnes frcunf_dbl
1239	movel #0x1,%d0 //inst is forced single
1240	bras frcunf_rnd
1241	frcunf_dbl:
1242	movel #0x2,%d0 //inst is forced double
1243	bras frcunf_rnd
1244	frcunf_fpcr:
1245	bfextu FPCR_MODE(%a6){#0:#2},%d0 //inst not forced - use fpcr prec
1246	frcunf_rnd:
1247	bsrl unf_sub //get correct result based on
1248	// ;round precision/mode. This
1249	// ;sets FPSR_CC correctly
1250	bfclr WBTEMP_SGN(%a6){#0:#8} //convert back to IEEE ext format
1251	beqs frcfpn
1252	bsetb #sign_bit,WBTEMP_EX(%a6)
1253	bra frcfpn
1254
1255	//
1256	// Write the result to the user's fpn. All results must be HUGE to be
1257	// written; otherwise the results would have overflowed or underflowed.
1258	// If the rounding precision is single or double, the ovf_res routine
1259	// is needed to correctly supply the max value.
1260	//
1261	frcfpnr:
1262	movew CMDREG1B(%a6),%d0
1263	btstl #6,%d0 //test for forced precision
1264	beqs frcfpn_fpcr
1265	btstl #2,%d0 //check for double
1266	bnes frcfpn_dbl
1267	movel #0x1,%d0 //inst is forced single
1268	bras frcfpn_rnd
1269	frcfpn_dbl:
1270	movel #0x2,%d0 //inst is forced double
1271	bras frcfpn_rnd
1272	frcfpn_fpcr:
1273	bfextu FPCR_MODE(%a6){#0:#2},%d0 //inst not forced - use fpcr prec
1274	tstb %d0
1275	beqs frcfpn //if extended, write what you got
1276	frcfpn_rnd:
1277	bclrb #sign_bit,WBTEMP_EX(%a6)
1278	sne WBTEMP_SGN(%a6)
1279	bsrl ovf_res //get correct result based on
1280	// ;round precision/mode. This
1281	// ;sets FPSR_CC correctly
1282	bfclr WBTEMP_SGN(%a6){#0:#8} //convert back to IEEE ext format
1283	beqs frcfpn_clr
1284	bsetb #sign_bit,WBTEMP_EX(%a6)
1285	frcfpn_clr:
1286	orl #ovfinx_mask,USER_FPSR(%a6)
1287	//
1288	// Perform the write.
1289	//
1290	frcfpn:
1291	bfextu CMDREG1B(%a6){#6:#3},%d0 //extract fp destination register
1292	cmpib #3,%d0
1293	bles frc0123 //check if dest is fp0-fp3
1294	movel #7,%d1
1295	subl %d0,%d1
1296	clrl %d0
1297	bsetl %d1,%d0
1298	fmovemx WBTEMP(%a6),%d0
1299	rts
1300	frc0123:
1301	cmpib #0,%d0
1302	beqs frc0_dst
1303	cmpib #1,%d0
1304	beqs frc1_dst
1305	cmpib #2,%d0
1306	beqs frc2_dst
1307	frc3_dst:
1308	movel WBTEMP_EX(%a6),USER_FP3(%a6)
1309	movel WBTEMP_HI(%a6),USER_FP3+4(%a6)
1310	movel WBTEMP_LO(%a6),USER_FP3+8(%a6)
1311	rts
1312	frc2_dst:
1313	movel WBTEMP_EX(%a6),USER_FP2(%a6)
1314	movel WBTEMP_HI(%a6),USER_FP2+4(%a6)
1315	movel WBTEMP_LO(%a6),USER_FP2+8(%a6)
1316	rts
1317	frc1_dst:
1318	movel WBTEMP_EX(%a6),USER_FP1(%a6)
1319	movel WBTEMP_HI(%a6),USER_FP1+4(%a6)
1320	movel WBTEMP_LO(%a6),USER_FP1+8(%a6)
1321	rts
1322	frc0_dst:
1323	movel WBTEMP_EX(%a6),USER_FP0(%a6)
1324	movel WBTEMP_HI(%a6),USER_FP0+4(%a6)
1325	movel WBTEMP_LO(%a6),USER_FP0+8(%a6)
1326	rts
1327
1328	//
1329	// Write etemp to fpn.
1330	// A check is made on enabled and signalled snan exceptions,
1331	// and the destination is not overwritten if this condition exists.
1332	// This code is designed to make fmoveins of unsupported data types
1333	// faster.
1334	//
1335	wr_etemp:
1336	btstb #snan_bit,FPSR_EXCEPT(%a6) //if snan is set, and
1337	beqs fmoveinc //enabled, force restore
1338	btstb #snan_bit,FPCR_ENABLE(%a6) //and don't overwrite
1339	beqs fmoveinc //the dest
1340	movel ETEMP_EX(%a6),FPTEMP_EX(%a6) //set up fptemp sign for
1341	// ;snan handler
1342	tstb ETEMP(%a6) //check for negative
1343	blts snan_neg
1344	rts
1345	snan_neg:
1346	orl #neg_bit,USER_FPSR(%a6) //snan is negative; set N
1347	rts
1348	fmoveinc:
1349	clrw NMNEXC(%a6)
1350	bclrb #E1,E_BYTE(%a6)
1351	moveb STAG(%a6),%d0 //check if stag is inf
1352	andib #0xe0,%d0
1353	cmpib #0x40,%d0
1354	bnes fminc_cnan
1355	orl #inf_mask,USER_FPSR(%a6) //if inf, nothing yet has set I
1356	tstw LOCAL_EX(%a0) //check sign
1357	bges fminc_con
1358	orl #neg_mask,USER_FPSR(%a6)
1359	bra fminc_con
1360	fminc_cnan:
1361	cmpib #0x60,%d0 //check if stag is NaN
1362	bnes fminc_czero
1363	orl #nan_mask,USER_FPSR(%a6) //if nan, nothing yet has set NaN
1364	movel ETEMP_EX(%a6),FPTEMP_EX(%a6) //set up fptemp sign for
1365	// ;snan handler
1366	tstw LOCAL_EX(%a0) //check sign
1367	bges fminc_con
1368	orl #neg_mask,USER_FPSR(%a6)
1369	bra fminc_con
1370	fminc_czero:
1371	cmpib #0x20,%d0 //check if zero
1372	bnes fminc_con
1373	orl #z_mask,USER_FPSR(%a6) //if zero, set Z
1374	tstw LOCAL_EX(%a0) //check sign
1375	bges fminc_con
1376	orl #neg_mask,USER_FPSR(%a6)
1377	fminc_con:
1378	bfextu CMDREG1B(%a6){#6:#3},%d0 //extract fp destination register
1379	cmpib #3,%d0
1380	bles fp0123 //check if dest is fp0-fp3
1381	movel #7,%d1
1382	subl %d0,%d1
1383	clrl %d0
1384	bsetl %d1,%d0
1385	fmovemx ETEMP(%a6),%d0
1386	rts
1387
1388	fp0123:
1389	cmpib #0,%d0
1390	beqs fp0_dst
1391	cmpib #1,%d0
1392	beqs fp1_dst
1393	cmpib #2,%d0
1394	beqs fp2_dst
1395	fp3_dst:
1396	movel ETEMP_EX(%a6),USER_FP3(%a6)
1397	movel ETEMP_HI(%a6),USER_FP3+4(%a6)
1398	movel ETEMP_LO(%a6),USER_FP3+8(%a6)
1399	rts
1400	fp2_dst:
1401	movel ETEMP_EX(%a6),USER_FP2(%a6)
1402	movel ETEMP_HI(%a6),USER_FP2+4(%a6)
1403	movel ETEMP_LO(%a6),USER_FP2+8(%a6)
1404	rts
1405	fp1_dst:
1406	movel ETEMP_EX(%a6),USER_FP1(%a6)
1407	movel ETEMP_HI(%a6),USER_FP1+4(%a6)
1408	movel ETEMP_LO(%a6),USER_FP1+8(%a6)
1409	rts
1410	fp0_dst:
1411	movel ETEMP_EX(%a6),USER_FP0(%a6)
1412	movel ETEMP_HI(%a6),USER_FP0+4(%a6)
1413	movel ETEMP_LO(%a6),USER_FP0+8(%a6)
1414	rts
1415
1416	opclass3:
1417	st CU_ONLY(%a6)
1418	movew CMDREG1B(%a6),%d0 //check if packed moveout
1419	andiw #0x0c00,%d0 //isolate last 2 bits of size field
1420	cmpiw #0x0c00,%d0 //if size is 011 or 111, it is packed
1421	beq pack_out //else it is norm or denorm
1422	bra mv_out
1423
1424
1425	//
1426	// MOVE OUT
1427	//
1428
1429	mv_tbl:
1430	.long li
1431	.long sgp
1432	.long xp
1433	.long mvout_end //should never be taken
1434	.long wi
1435	.long dp
1436	.long bi
1437	.long mvout_end //should never be taken
1438	mv_out:
1439	bfextu CMDREG1B(%a6){#3:#3},%d1 //put source specifier in d1
1440	leal mv_tbl,%a0
1441	movel %a0@(%d1:l:4),%a0
1442	jmp (%a0)
1443
1444	//
1445	// This exit is for move-out to memory. The aunfl bit is
1446	// set if the result is inex and unfl is signalled.
1447	//
1448	mvout_end:
1449	btstb #inex2_bit,FPSR_EXCEPT(%a6)
1450	beqs no_aufl
1451	btstb #unfl_bit,FPSR_EXCEPT(%a6)
1452	beqs no_aufl
1453	bsetb #aunfl_bit,FPSR_AEXCEPT(%a6)
1454	no_aufl:
1455	clrw NMNEXC(%a6)
1456	bclrb #E1,E_BYTE(%a6)
1457	fmovel #0,%FPSR //clear any cc bits from res_func
1458	//
1459	// Return ETEMP to extended format from internal extended format so
1460	// that gen_except will have a correctly signed value for ovfl/unfl
1461	// handlers.
1462	//
1463	bfclr ETEMP_SGN(%a6){#0:#8}
1464	beqs mvout_con
1465	bsetb #sign_bit,ETEMP_EX(%a6)
1466	mvout_con:
1467	rts
1468	//
1469	// This exit is for move-out to int register. The aunfl bit is
1470	// not set in any case for this move.
1471	//
1472	mvouti_end:
1473	clrw NMNEXC(%a6)
1474	bclrb #E1,E_BYTE(%a6)
1475	fmovel #0,%FPSR //clear any cc bits from res_func
1476	//
1477	// Return ETEMP to extended format from internal extended format so
1478	// that gen_except will have a correctly signed value for ovfl/unfl
1479	// handlers.
1480	//
1481	bfclr ETEMP_SGN(%a6){#0:#8}
1482	beqs mvouti_con
1483	bsetb #sign_bit,ETEMP_EX(%a6)
1484	mvouti_con:
1485	rts
1486	//
1487	// li is used to handle a long integer source specifier
1488	//
1489
1490	li:
1491	moveql #4,%d0 //set byte count
1492
1493	btstb #7,STAG(%a6) //check for extended denorm
1494	bne int_dnrm //if so, branch
1495
1496	fmovemx ETEMP(%a6),%fp0-%fp0
1497	fcmpd #0x41dfffffffc00000,%fp0
1498	// 41dfffffffc00000 in dbl prec = 401d0000fffffffe00000000 in ext prec
1499	fbge lo_plrg
1500	fcmpd #0xc1e0000000000000,%fp0
1501	// c1e0000000000000 in dbl prec = c01e00008000000000000000 in ext prec
1502	fble lo_nlrg
1503	//
1504	// at this point, the answer is between the largest pos and neg values
1505	//
1506	movel USER_FPCR(%a6),%d1 //use user's rounding mode
1507	andil #0x30,%d1
1508	fmovel %d1,%fpcr
1509	fmovel %fp0,L_SCR1(%a6) //let the 040 perform conversion
1510	fmovel %fpsr,%d1
1511	orl %d1,USER_FPSR(%a6) //capture inex2/ainex if set
1512	bra int_wrt
1513
1514
1515	lo_plrg:
1516	movel #0x7fffffff,L_SCR1(%a6) //answer is largest positive int
1517	fbeq int_wrt //exact answer
1518	fcmpd #0x41dfffffffe00000,%fp0
1519	// 41dfffffffe00000 in dbl prec = 401d0000ffffffff00000000 in ext prec
1520	fbge int_operr //set operr
1521	bra int_inx //set inexact
1522
1523	lo_nlrg:
1524	movel #0x80000000,L_SCR1(%a6)
1525	fbeq int_wrt //exact answer
1526	fcmpd #0xc1e0000000100000,%fp0
1527	// c1e0000000100000 in dbl prec = c01e00008000000080000000 in ext prec
1528	fblt int_operr //set operr
1529	bra int_inx //set inexact
1530
1531	//
1532	// wi is used to handle a word integer source specifier
1533	//
1534
1535	wi:
1536	moveql #2,%d0 //set byte count
1537
1538	btstb #7,STAG(%a6) //check for extended denorm
1539	bne int_dnrm //branch if so
1540
1541	fmovemx ETEMP(%a6),%fp0-%fp0
1542	fcmps #0x46fffe00,%fp0
1543	// 46fffe00 in sgl prec = 400d0000fffe000000000000 in ext prec
1544	fbge wo_plrg
1545	fcmps #0xc7000000,%fp0
1546	// c7000000 in sgl prec = c00e00008000000000000000 in ext prec
1547	fble wo_nlrg
1548
1549	//
1550	// at this point, the answer is between the largest pos and neg values
1551	//
1552	movel USER_FPCR(%a6),%d1 //use user's rounding mode
1553	andil #0x30,%d1
1554	fmovel %d1,%fpcr
1555	fmovew %fp0,L_SCR1(%a6) //let the 040 perform conversion
1556	fmovel %fpsr,%d1
1557	orl %d1,USER_FPSR(%a6) //capture inex2/ainex if set
1558	bra int_wrt
1559
1560	wo_plrg:
1561	movew #0x7fff,L_SCR1(%a6) //answer is largest positive int
1562	fbeq int_wrt //exact answer
1563	fcmps #0x46ffff00,%fp0
1564	// 46ffff00 in sgl prec = 400d0000ffff000000000000 in ext prec
1565	fbge int_operr //set operr
1566	bra int_inx //set inexact
1567
1568	wo_nlrg:
1569	movew #0x8000,L_SCR1(%a6)
1570	fbeq int_wrt //exact answer
1571	fcmps #0xc7000080,%fp0
1572	// c7000080 in sgl prec = c00e00008000800000000000 in ext prec
1573	fblt int_operr //set operr
1574	bra int_inx //set inexact
1575
1576	//
1577	// bi is used to handle a byte integer source specifier
1578	//
1579
1580	bi:
1581	moveql #1,%d0 //set byte count
1582
1583	btstb #7,STAG(%a6) //check for extended denorm
1584	bne int_dnrm //branch if so
1585
1586	fmovemx ETEMP(%a6),%fp0-%fp0
1587	fcmps #0x42fe0000,%fp0
1588	// 42fe0000 in sgl prec = 40050000fe00000000000000 in ext prec
1589	fbge by_plrg
1590	fcmps #0xc3000000,%fp0
1591	// c3000000 in sgl prec = c00600008000000000000000 in ext prec
1592	fble by_nlrg
1593
1594	//
1595	// at this point, the answer is between the largest pos and neg values
1596	//
1597	movel USER_FPCR(%a6),%d1 //use user's rounding mode
1598	andil #0x30,%d1
1599	fmovel %d1,%fpcr
1600	fmoveb %fp0,L_SCR1(%a6) //let the 040 perform conversion
1601	fmovel %fpsr,%d1
1602	orl %d1,USER_FPSR(%a6) //capture inex2/ainex if set
1603	bra int_wrt
1604
1605	by_plrg:
1606	moveb #0x7f,L_SCR1(%a6) //answer is largest positive int
1607	fbeq int_wrt //exact answer
1608	fcmps #0x42ff0000,%fp0
1609	// 42ff0000 in sgl prec = 40050000ff00000000000000 in ext prec
1610	fbge int_operr //set operr
1611	bra int_inx //set inexact
1612
1613	by_nlrg:
1614	moveb #0x80,L_SCR1(%a6)
1615	fbeq int_wrt //exact answer
1616	fcmps #0xc3008000,%fp0
1617	// c3008000 in sgl prec = c00600008080000000000000 in ext prec
1618	fblt int_operr //set operr
1619	bra int_inx //set inexact
1620
1621	//
1622	// Common integer routines
1623	//
1624	// int_drnrm---account for possible nonzero result for round up with positive
1625	// operand and round down for negative answer. In the first case (result = 1)
1626	// byte-width (store in d0) of result must be honored. In the second case,
1627	// -1 in L_SCR1(a6) will cover all contingencies (FMOVE.B/W/L out).
1628
1629	int_dnrm:
1630	movel #0,L_SCR1(%a6) // initialize result to 0
1631	bfextu FPCR_MODE(%a6){#2:#2},%d1 // d1 is the rounding mode
1632	cmpb #2,%d1
1633	bmis int_inx // if RN or RZ, done
1634	bnes int_rp // if RP, continue below
1635	tstw ETEMP(%a6) // RM: store -1 in L_SCR1 if src is negative
1636	bpls int_inx // otherwise result is 0
1637	movel #-1,L_SCR1(%a6)
1638	bras int_inx
1639	int_rp:
1640	tstw ETEMP(%a6) // RP: store +1 of proper width in L_SCR1 if
1641	// ; source is greater than 0
1642	bmis int_inx // otherwise, result is 0
1643	lea L_SCR1(%a6),%a1 // a1 is address of L_SCR1
1644	addal %d0,%a1 // offset by destination width -1
1645	subal #1,%a1
1646	bsetb #0,(%a1) // set low bit at a1 address
1647	int_inx:
1648	oril #inx2a_mask,USER_FPSR(%a6)
1649	bras int_wrt
1650	int_operr:
1651	fmovemx %fp0-%fp0,FPTEMP(%a6) //FPTEMP must contain the extended
1652	// ;precision source that needs to be
1653	// ;converted to integer this is required
1654	// ;if the operr exception is enabled.
1655	// ;set operr/aiop (no inex2 on int ovfl)
1656
1657	oril #opaop_mask,USER_FPSR(%a6)
1658	// ;fall through to perform int_wrt
1659	int_wrt:
1660	movel EXC_EA(%a6),%a1 //load destination address
1661	tstl %a1 //check to see if it is a dest register
1662	beqs wrt_dn //write data register
1663	lea L_SCR1(%a6),%a0 //point to supervisor source address
1664	bsrl mem_write
1665	bra mvouti_end
1666
1667	wrt_dn:
1668	movel %d0,-(%sp) //d0 currently contains the size to write
1669	bsrl get_fline //get_fline returns Dn in d0
1670	andiw #0x7,%d0 //isolate register
1671	movel (%sp)+,%d1 //get size
1672	cmpil #4,%d1 //most frequent case
1673	beqs sz_long
1674	cmpil #2,%d1
1675	bnes sz_con
1676	orl #8,%d0 //add 'word' size to register#
1677	bras sz_con
1678	sz_long:
1679	orl #0x10,%d0 //add 'long' size to register#
1680	sz_con:
1681	movel %d0,%d1 //reg_dest expects size:reg in d1
1682	bsrl reg_dest //load proper data register
1683	bra mvouti_end
1684	xp:
1685	lea ETEMP(%a6),%a0
1686	bclrb #sign_bit,LOCAL_EX(%a0)
1687	sne LOCAL_SGN(%a0)
1688	btstb #7,STAG(%a6) //check for extended denorm
1689	bne xdnrm
1690	clrl %d0
1691	bras do_fp //do normal case
1692	sgp:
1693	lea ETEMP(%a6),%a0
1694	bclrb #sign_bit,LOCAL_EX(%a0)
1695	sne LOCAL_SGN(%a0)
1696	btstb #7,STAG(%a6) //check for extended denorm
1697	bne sp_catas //branch if so
1698	movew LOCAL_EX(%a0),%d0
1699	lea sp_bnds,%a1
1700	cmpw (%a1),%d0
1701	blt sp_under
1702	cmpw 2(%a1),%d0
1703	bgt sp_over
1704	movel #1,%d0 //set destination format to single
1705	bras do_fp //do normal case
1706	dp:
1707	lea ETEMP(%a6),%a0
1708	bclrb #sign_bit,LOCAL_EX(%a0)
1709	sne LOCAL_SGN(%a0)
1710
1711	btstb #7,STAG(%a6) //check for extended denorm
1712	bne dp_catas //branch if so
1713
1714	movew LOCAL_EX(%a0),%d0
1715	lea dp_bnds,%a1
1716
1717	cmpw (%a1),%d0
1718	blt dp_under
1719	cmpw 2(%a1),%d0
1720	bgt dp_over
1721
1722	movel #2,%d0 //set destination format to double
1723	// ;fall through to do_fp
1724	//
1725	do_fp:
1726	bfextu FPCR_MODE(%a6){#2:#2},%d1 //rnd mode in d1
1727	swap %d0 //rnd prec in upper word
1728	addl %d0,%d1 //d1 has PREC/MODE info
1729
1730	clrl %d0 //clear g,r,s
1731
1732	bsrl round //round
1733
1734	movel %a0,%a1
1735	movel EXC_EA(%a6),%a0
1736
1737	bfextu CMDREG1B(%a6){#3:#3},%d1 //extract destination format
1738	// ;at this point only the dest
1739	// ;formats sgl, dbl, ext are
1740	// ;possible
1741	cmpb #2,%d1
1742	bgts ddbl //double=5, extended=2, single=1
1743	bnes dsgl
1744	// ;fall through to dext
1745	dext:
1746	bsrl dest_ext
1747	bra mvout_end
1748	dsgl:
1749	bsrl dest_sgl
1750	bra mvout_end
1751	ddbl:
1752	bsrl dest_dbl
1753	bra mvout_end
1754
1755	//
1756	// Handle possible denorm or catastrophic underflow cases here
1757	//
1758	xdnrm:
1759	bsr set_xop //initialize WBTEMP
1760	bsetb #wbtemp15_bit,WB_BYTE(%a6) //set wbtemp15
1761
1762	movel %a0,%a1
1763	movel EXC_EA(%a6),%a0 //a0 has the destination pointer
1764	bsrl dest_ext //store to memory
1765	bsetb #unfl_bit,FPSR_EXCEPT(%a6)
1766	bra mvout_end
1767
1768	sp_under:
1769	bsetb #etemp15_bit,STAG(%a6)
1770
1771	cmpw 4(%a1),%d0
1772	blts sp_catas //catastrophic underflow case
1773
1774	movel #1,%d0 //load in round precision
1775	movel #sgl_thresh,%d1 //load in single denorm threshold
1776	bsrl dpspdnrm //expects d1 to have the proper
1777	// ;denorm threshold
1778	bsrl dest_sgl //stores value to destination
1779	bsetb #unfl_bit,FPSR_EXCEPT(%a6)
1780	bra mvout_end //exit
1781
1782	dp_under:
1783	bsetb #etemp15_bit,STAG(%a6)
1784
1785	cmpw 4(%a1),%d0
1786	blts dp_catas //catastrophic underflow case
1787
1788	movel #dbl_thresh,%d1 //load in double precision threshold
1789	movel #2,%d0
1790	bsrl dpspdnrm //expects d1 to have proper
1791	// ;denorm threshold
1792	// ;expects d0 to have round precision
1793	bsrl dest_dbl //store value to destination
1794	bsetb #unfl_bit,FPSR_EXCEPT(%a6)
1795	bra mvout_end //exit
1796
1797	//
1798	// Handle catastrophic underflow cases here
1799	//
1800	sp_catas:
1801	// Temp fix for z bit set in unf_sub
1802	movel USER_FPSR(%a6),-(%a7)
1803
1804	movel #1,%d0 //set round precision to sgl
1805
1806	bsrl unf_sub //a0 points to result
1807
1808	movel (%a7)+,USER_FPSR(%a6)
1809
1810	movel #1,%d0
1811	subw %d0,LOCAL_EX(%a0) //account for difference between
1812	// ;denorm/norm bias
1813
1814	movel %a0,%a1 //a1 has the operand input
1815	movel EXC_EA(%a6),%a0 //a0 has the destination pointer
1816
1817	bsrl dest_sgl //store the result
1818	oril #unfinx_mask,USER_FPSR(%a6)
1819	bra mvout_end
1820
1821	dp_catas:
1822	// Temp fix for z bit set in unf_sub
1823	movel USER_FPSR(%a6),-(%a7)
1824
1825	movel #2,%d0 //set round precision to dbl
1826	bsrl unf_sub //a0 points to result
1827
1828	movel (%a7)+,USER_FPSR(%a6)
1829
1830	movel #1,%d0
1831	subw %d0,LOCAL_EX(%a0) //account for difference between
1832	// ;denorm/norm bias
1833
1834	movel %a0,%a1 //a1 has the operand input
1835	movel EXC_EA(%a6),%a0 //a0 has the destination pointer
1836
1837	bsrl dest_dbl //store the result
1838	oril #unfinx_mask,USER_FPSR(%a6)
1839	bra mvout_end
1840
1841	//
1842	// Handle catastrophic overflow cases here
1843	//
1844	sp_over:
1845	// Temp fix for z bit set in unf_sub
1846	movel USER_FPSR(%a6),-(%a7)
1847
1848	movel #1,%d0
1849	leal FP_SCR1(%a6),%a0 //use FP_SCR1 for creating result
1850	movel ETEMP_EX(%a6),(%a0)
1851	movel ETEMP_HI(%a6),4(%a0)
1852	movel ETEMP_LO(%a6),8(%a0)
1853	bsrl ovf_res
1854
1855	movel (%a7)+,USER_FPSR(%a6)
1856
1857	movel %a0,%a1
1858	movel EXC_EA(%a6),%a0
1859	bsrl dest_sgl
1860	orl #ovfinx_mask,USER_FPSR(%a6)
1861	bra mvout_end
1862
1863	dp_over:
1864	// Temp fix for z bit set in ovf_res
1865	movel USER_FPSR(%a6),-(%a7)
1866
1867	movel #2,%d0
1868	leal FP_SCR1(%a6),%a0 //use FP_SCR1 for creating result
1869	movel ETEMP_EX(%a6),(%a0)
1870	movel ETEMP_HI(%a6),4(%a0)
1871	movel ETEMP_LO(%a6),8(%a0)
1872	bsrl ovf_res
1873
1874	movel (%a7)+,USER_FPSR(%a6)
1875
1876	movel %a0,%a1
1877	movel EXC_EA(%a6),%a0
1878	bsrl dest_dbl
1879	orl #ovfinx_mask,USER_FPSR(%a6)
1880	bra mvout_end
1881
1882	//
1883	// DPSPDNRM
1884	//
1885	// This subroutine takes an extended normalized number and denormalizes
1886	// it to the given round precision. This subroutine also decrements
1887	// the input operand's exponent by 1 to account for the fact that
1888	// dest_sgl or dest_dbl expects a normalized number's bias.
1889	//
1890	// Input: a0 points to a normalized number in internal extended format
1891	// d0 is the round precision (=1 for sgl; =2 for dbl)
1892	// d1 is the the single precision or double precision
1893	// denorm threshold
1894	//
1895	// Output: (In the format for dest_sgl or dest_dbl)
1896	// a0 points to the destination
1897	// a1 points to the operand
1898	//
1899	// Exceptions: Reports inexact 2 exception by setting USER_FPSR bits
1900	//
1901	dpspdnrm:
1902	movel %d0,-(%a7) //save round precision
1903	clrl %d0 //clear initial g,r,s
1904	bsrl dnrm_lp //careful with d0, it's needed by round
1905
1906	bfextu FPCR_MODE(%a6){#2:#2},%d1 //get rounding mode
1907	swap %d1
1908	movew 2(%a7),%d1 //set rounding precision
1909	swap %d1 //at this point d1 has PREC/MODE info
1910	bsrl round //round result, sets the inex bit in
1911	// ;USER_FPSR if needed
1912
1913	movew #1,%d0
1914	subw %d0,LOCAL_EX(%a0) //account for difference in denorm
1915	// ;vs norm bias
1916
1917	movel %a0,%a1 //a1 has the operand input
1918	movel EXC_EA(%a6),%a0 //a0 has the destination pointer
1919	addw #4,%a7 //pop stack
1920	rts
1921	//
1922	// SET_XOP initialized WBTEMP with the value pointed to by a0
1923	// input: a0 points to input operand in the internal extended format
1924	//
1925	set_xop:
1926	movel LOCAL_EX(%a0),WBTEMP_EX(%a6)
1927	movel LOCAL_HI(%a0),WBTEMP_HI(%a6)
1928	movel LOCAL_LO(%a0),WBTEMP_LO(%a6)
1929	bfclr WBTEMP_SGN(%a6){#0:#8}
1930	beqs sxop
1931	bsetb #sign_bit,WBTEMP_EX(%a6)
1932	sxop:
1933	bfclr STAG(%a6){#5:#4} //clear wbtm66,wbtm1,wbtm0,sbit
1934	rts
1935	//
1936	// P_MOVE
1937	//
1938	p_movet:
1939	.long p_move
1940	.long p_movez
1941	.long p_movei
1942	.long p_moven
1943	.long p_move
1944	p_regd:
1945	.long p_dyd0
1946	.long p_dyd1
1947	.long p_dyd2
1948	.long p_dyd3
1949	.long p_dyd4
1950	.long p_dyd5
1951	.long p_dyd6
1952	.long p_dyd7
1953
1954	pack_out:
1955	leal p_movet,%a0 //load jmp table address
1956	movew STAG(%a6),%d0 //get source tag
1957	bfextu %d0{#16:#3},%d0 //isolate source bits
1958	movel (%a0,%d0.w*4),%a0 //load a0 with routine label for tag
1959	jmp (%a0) //go to the routine
1960
1961	p_write:
1962	movel #0x0c,%d0 //get byte count
1963	movel EXC_EA(%a6),%a1 //get the destination address
1964	bsr mem_write //write the user's destination
1965	moveb #0,CU_SAVEPC(%a6) //set the cu save pc to all 0's
1966
1967	//
1968	// Also note that the dtag must be set to norm here - this is because
1969	// the 040 uses the dtag to execute the correct microcode.
1970	//
1971	bfclr DTAG(%a6){#0:#3} //set dtag to norm
1972
1973	rts
1974
1975	// Notes on handling of special case (zero, inf, and nan) inputs:
1976	// 1. Operr is not signalled if the k-factor is greater than 18.
1977	// 2. Per the manual, status bits are not set.
1978	//
1979
1980	p_move:
1981	movew CMDREG1B(%a6),%d0
1982	btstl #kfact_bit,%d0 //test for dynamic k-factor
1983	beqs statick //if clear, k-factor is static
1984	dynamick:
1985	bfextu %d0{#25:#3},%d0 //isolate register for dynamic k-factor
1986	lea p_regd,%a0
1987	movel %a0@(%d0:l:4),%a0
1988	jmp (%a0)
1989	statick:
1990	andiw #0x007f,%d0 //get k-factor
1991	bfexts %d0{#25:#7},%d0 //sign extend d0 for bindec
1992	leal ETEMP(%a6),%a0 //a0 will point to the packed decimal
1993	bsrl bindec //perform the convert; data at a6
1994	leal FP_SCR1(%a6),%a0 //load a0 with result address
1995	bral p_write
1996	p_movez:
1997	leal ETEMP(%a6),%a0 //a0 will point to the packed decimal
1998	clrw 2(%a0) //clear lower word of exp
1999	clrl 4(%a0) //load second lword of ZERO
2000	clrl 8(%a0) //load third lword of ZERO
2001	bra p_write //go write results
2002	p_movei:
2003	fmovel #0,%FPSR //clear aiop
2004	leal ETEMP(%a6),%a0 //a0 will point to the packed decimal
2005	clrw 2(%a0) //clear lower word of exp
2006	bra p_write //go write the result
2007	p_moven:
2008	leal ETEMP(%a6),%a0 //a0 will point to the packed decimal
2009	clrw 2(%a0) //clear lower word of exp
2010	bra p_write //go write the result
2011
2012	//
2013	// Routines to read the dynamic k-factor from Dn.
2014	//
2015	p_dyd0:
2016	movel USER_D0(%a6),%d0
2017	bras statick
2018	p_dyd1:
2019	movel USER_D1(%a6),%d0
2020	bras statick
2021	p_dyd2:
2022	movel %d2,%d0
2023	bras statick
2024	p_dyd3:
2025	movel %d3,%d0
2026	bras statick
2027	p_dyd4:
2028	movel %d4,%d0
2029	bras statick
2030	p_dyd5:
2031	movel %d5,%d0
2032	bras statick
2033	p_dyd6:
2034	movel %d6,%d0
2035	bra statick
2036	p_dyd7:
2037	movel %d7,%d0
2038	bra statick
2039
2040	\|end

Note: See TracBrowser for help on using the repository browser.

Download in other formats:

Original Format