Context Navigation

← Previous Revision
Latest Revision
Next Revision →
Blame
Revision Log

div_ext.fc@ 10

Last change on this file since 10 was 9, checked in by Mattia Monga, 14 years ago
Minix 3.1.2a
File size: 6.1 KB

Line
1	/*
2	(c) copyright 1988 by the Vrije Universiteit, Amsterdam, The Netherlands.
3	See the copyright notice in the ACK home directory, in the file "Copyright".
4	*/
5
6	/* $Header: /cvsup/minix/src/lib/ack/fphook/div_ext.fc,v 1.1 2005/10/10 15:27:43 beng Exp $ */
7
8	/*
9	DIVIDE EXTENDED FORMAT
10	*/
11
12	#include "FP_bias.h"
13	#include "FP_trap.h"
14	#include "FP_types.h"
15
16	/*
17	November 15, 1984
18
19	This is a routine to do the work.
20	There are two versions:
21	One is based on the partial products method
22	and makes no use of possible machine instructions
23	to divide (hardware dividers).
24	The other is used when USE_DIVIDE is defined. It is much faster on
25	machines with fast 4 byte operations.
26	*/
27	/********************************************************/
28
29	void
30	div_ext(e1,e2)
31	EXTEND e1,e2;
32	{
33	short error = 0;
34	B64 result;
35	register unsigned long *lp;
36	#ifndef USE_DIVIDE
37	short count;
38	#else
39	unsigned short u[9], v[5];
40	register int j;
41	register unsigned short *u_p = u;
42	int maxv = 4;
43	#endif
44
45	if ((e2->m1 \| e2->m2) == 0) {
46	/*
47	* Exception 8.2 - Divide by zero
48	*/
49	trap(EFDIVZ);
50	e1->m1 = e1->m2 = 0L;
51	e1->exp = EXT_MAX;
52	return;
53	}
54	if ((e1->m1 \| e1->m2) == 0) { /* 0 / anything == 0 */
55	e1->exp = 0; /* make sure */
56	return;
57	}
58	#ifndef USE_DIVIDE
59	/*
60	* numbers are right shifted one bit to make sure
61	* that m1 is quaranteed to be larger if its
62	* maximum bit is set
63	*/
64	b64_rsft(&e1->mantissa); /* 64 bit shift right */
65	b64_rsft(&e2->mantissa); /* 64 bit shift right */
66	e1->exp++;
67	e2->exp++;
68	#endif
69	/* check for underflow, divide by zero, etc */
70	e1->sign ^= e2->sign;
71	e1->exp -= e2->exp;
72
73	#ifndef USE_DIVIDE
74	/* do division of mantissas */
75	/* uses partial product method */
76	/* init control variables */
77
78	count = 64;
79	result.h_32 = 0L;
80	result.l_32 = 0L;
81
82	/* partial product division loop */
83
84	while (count--) {
85	/* first left shift result 1 bit */
86	/* this is ALWAYS done */
87
88	b64_lsft(&result);
89
90	/* compare dividend and divisor */
91	/* if dividend >= divisor add a bit */
92	/* and subtract divisior from dividend */
93
94	if ( (e1->m1 < e2->m1) \|\|
95	((e1->m1 == e2->m1) && (e1->m2 < e2->m2) ))
96	; /* null statement */
97	/* i.e., don't add or subtract */
98	else {
99	result.l_32++; /* ADD */
100	if (e2->m2 > e1->m2)
101	e1->m1 -= 1; /* carry in */
102	e1->m1 -= e2->m1; /* do SUBTRACTION */
103	e1->m2 -= e2->m2; /* SUBTRACTION */
104	}
105
106	/* shift dividend left one bit OR */
107	/* IF it equals ZERO we can break out */
108	/* of the loop, but still must shift */
109	/* the quotient the remaining count bits */
110	/* NB save the results of this test in error */
111	/* if not zero, then the result is inexact. */
112	/* this would be reported in IEEE standard */
113
114	/* lp points to dividend */
115	lp = &e1->m1;
116
117	error = ((lp \| (lp+1)) != 0L) ? 1 : 0;
118	if (error) { /* more work */
119	/* assume max bit == 0 (see above) */
120	b64_lsft(&e1->mantissa);
121	continue;
122	}
123	else
124	break; /* leave loop */
125	} /* end of divide by subtraction loop */
126
127	if (count > 0) {
128	lp = &result.h_32;
129	if (count > 31) { /* move to higher word */
130	lp = (lp+1);
131	count -= 32;
132	(lp+1) = 0L; / clear low word */
133	}
134	if (*lp)
135	lp <<= count; / shift rest of way */
136	lp++; /* == &result.l_32 */
137	if (*lp) {
138	result.h_32 \|= (*lp >> 32-count);
139	*lp <<= count;
140	}
141	}
142	#else /* USE_DIVIDE */
143
144	u[4] = (e1->m2 & 1) << 15;
145	b64_rsft(&(e1->mantissa));
146	u[0] = e1->m1 >> 16;
147	u[1] = e1->m1;
148	u[2] = e1->m2 >> 16;
149	u[3] = e1->m2;
150	u[5] = 0; u[6] = 0; u[7] = 0;
151	v[1] = e2->m1 >> 16;
152	v[2] = e2->m1;
153	v[3] = e2->m2 >> 16;
154	v[4] = e2->m2;
155	while (! v[maxv]) maxv--;
156	result.h_32 = 0;
157	result.l_32 = 0;
158	lp = &result.h_32;
159
160	/*
161	* Use an algorithm of Knuth (The art of programming, Seminumerical
162	* algorithms), to divide u by v. u and v are both seen as numbers
163	* with base 65536.
164	*/
165	for (j = 0; j <= 3; j++, u_p++) {
166	unsigned long q_est, temp;
167
168	if (j == 2) lp++;
169	if (u_p[0] == 0 && u_p[1] < v[1]) continue;
170	temp = ((unsigned long)u_p[0] << 16) + u_p[1];
171	if (u_p[0] >= v[1]) {
172	q_est = 0x0000FFFFL;
173	}
174	else {
175	q_est = temp / v[1];
176	}
177	temp -= q_est * v[1];
178	while (temp < 0x10000 && v[2]*q_est > ((temp<<16)+u_p[2])) {
179	q_est--;
180	temp += v[1];
181	}
182	/* Now, according to Knuth, we have an estimate of the
183	quotient, that is either correct or one too big, but
184	almost always correct.
185	*/
186	if (q_est != 0) {
187	int i;
188	unsigned long k = 0;
189	int borrow = 0;
190
191	for (i = maxv; i > 0; i--) {
192	unsigned long tmp = q_est * v[i] + k + borrow;
193	unsigned short md = tmp;
194
195	borrow = (md > u_p[i]);
196	u_p[i] -= md;
197	k = tmp >> 16;
198	}
199	k += borrow;
200	borrow = u_p[0] < k;
201	u_p[0] -= k;
202
203	if (borrow) {
204	/* So, this does not happen often; the estimate
205	was one too big; correct this
206	*/
207	*lp \|= (j & 1) ? (q_est - 1) : ((q_est-1)<<16);
208	borrow = 0;
209	for (i = maxv; i > 0; i--) {
210	unsigned long tmp
211	= v[i]+(unsigned long)u_p[i]+borrow;
212
213	u_p[i] = tmp;
214	borrow = tmp >> 16;
215	}
216	u_p[0] += borrow;
217	}
218	else *lp \|= (j & 1) ? q_est : (q_est<<16);
219	}
220	}
221	#ifdef EXCEPTION_INEXACT
222	u_p = &u[0];
223	for (j = 7; j >= 0; j--) {
224	if (*u_p++) {
225	error = 1;
226	break;
227	}
228	}
229	#endif
230	#endif
231
232	#ifdef EXCEPTION_INEXACT
233	if (error) {
234	/*
235	* report here exception 8.5 - Inexact
236	* from Draft 8.0 of IEEE P754:
237	* In the absence of an invalid operation exception,
238	* if the rounded result of an operation is not exact or if
239	* it overflows without a trap, then the inexact exception
240	* shall be assigned. The rounded or overflowed result
241	* shall be delivered to the destination.
242	*/
243	INEXACT();
244	#endif
245	e1->mantissa = result;
246
247	nrm_ext(e1);
248	if (e1->exp < EXT_MIN) {
249	/*
250	* Exception 8.4 - Underflow
251	*/
252	trap(EFUNFL); /* underflow */
253	e1->exp = EXT_MIN;
254	e1->m1 = e1->m2 = 0L;
255	return;
256	}
257	if (e1->exp >= EXT_MAX) {
258	/*
259	* Exception 8.3 - Overflow
260	*/
261	trap(EFOVFL); /* overflow */
262	e1->exp = EXT_MAX;
263	e1->m1 = e1->m2 = 0L;
264	return;
265	}
266	}

Note: See TracBrowser for help on using the repository browser.

Download in other formats:

Original Format