diff options
author | Linus Torvalds <torvalds@ppc970.osdl.org> | 2005-04-16 18:20:36 -0400 |
---|---|---|
committer | Linus Torvalds <torvalds@ppc970.osdl.org> | 2005-04-16 18:20:36 -0400 |
commit | 1da177e4c3f41524e886b7f1b8a0c1fc7321cac2 (patch) | |
tree | 0bba044c4ce775e45a88a51686b5d9f90697ea9d /arch/m68k/fpsp040/scale.S |
Linux-2.6.12-rc2v2.6.12-rc2
Initial git repository build. I'm not bothering with the full history,
even though we have it. We can create a separate "historical" git
archive of that later if we want to, and in the meantime it's about
3.2GB when imported into git - space that would just make the early
git days unnecessarily complicated, when we don't have a lot of good
infrastructure for it.
Let it rip!
Diffstat (limited to 'arch/m68k/fpsp040/scale.S')
-rw-r--r-- | arch/m68k/fpsp040/scale.S | 371 |
1 files changed, 371 insertions, 0 deletions
diff --git a/arch/m68k/fpsp040/scale.S b/arch/m68k/fpsp040/scale.S new file mode 100644 index 000000000000..5c9b805265f2 --- /dev/null +++ b/arch/m68k/fpsp040/scale.S | |||
@@ -0,0 +1,371 @@ | |||
1 | | | ||
2 | | scale.sa 3.3 7/30/91 | ||
3 | | | ||
4 | | The entry point sSCALE computes the destination operand | ||
5 | | scaled by the source operand. If the absolute value of | ||
6 | | the source operand is (>= 2^14) an overflow or underflow | ||
7 | | is returned. | ||
8 | | | ||
9 | | The entry point sscale is called from do_func to emulate | ||
10 | | the fscale unimplemented instruction. | ||
11 | | | ||
12 | | Input: Double-extended destination operand in FPTEMP, | ||
13 | | double-extended source operand in ETEMP. | ||
14 | | | ||
15 | | Output: The function returns scale(X,Y) to fp0. | ||
16 | | | ||
17 | | Modifies: fp0. | ||
18 | | | ||
19 | | Algorithm: | ||
20 | | | ||
21 | | Copyright (C) Motorola, Inc. 1990 | ||
22 | | All Rights Reserved | ||
23 | | | ||
24 | | THIS IS UNPUBLISHED PROPRIETARY SOURCE CODE OF MOTOROLA | ||
25 | | The copyright notice above does not evidence any | ||
26 | | actual or intended publication of such source code. | ||
27 | |||
28 | |SCALE idnt 2,1 | Motorola 040 Floating Point Software Package | ||
29 | |||
30 | |section 8 | ||
31 | |||
32 | #include "fpsp.h" | ||
33 | |||
34 | |xref t_ovfl2 | ||
35 | |xref t_unfl | ||
36 | |xref round | ||
37 | |xref t_resdnrm | ||
38 | |||
39 | SRC_BNDS: .short 0x3fff,0x400c | ||
40 | |||
41 | | | ||
42 | | This entry point is used by the unimplemented instruction exception | ||
43 | | handler. | ||
44 | | | ||
45 | | | ||
46 | | | ||
47 | | FSCALE | ||
48 | | | ||
49 | .global sscale | ||
50 | sscale: | ||
51 | fmovel #0,%fpcr |clr user enabled exc | ||
52 | clrl %d1 | ||
53 | movew FPTEMP(%a6),%d1 |get dest exponent | ||
54 | smi L_SCR1(%a6) |use L_SCR1 to hold sign | ||
55 | andil #0x7fff,%d1 |strip sign | ||
56 | movew ETEMP(%a6),%d0 |check src bounds | ||
57 | andiw #0x7fff,%d0 |clr sign bit | ||
58 | cmp2w SRC_BNDS,%d0 | ||
59 | bccs src_in | ||
60 | cmpiw #0x400c,%d0 |test for too large | ||
61 | bge src_out | ||
62 | | | ||
63 | | The source input is below 1, so we check for denormalized numbers | ||
64 | | and set unfl. | ||
65 | | | ||
66 | src_small: | ||
67 | moveb DTAG(%a6),%d0 | ||
68 | andib #0xe0,%d0 | ||
69 | tstb %d0 | ||
70 | beqs no_denorm | ||
71 | st STORE_FLG(%a6) |dest already contains result | ||
72 | orl #unfl_mask,USER_FPSR(%a6) |set UNFL | ||
73 | den_done: | ||
74 | leal FPTEMP(%a6),%a0 | ||
75 | bra t_resdnrm | ||
76 | no_denorm: | ||
77 | fmovel USER_FPCR(%a6),%FPCR | ||
78 | fmovex FPTEMP(%a6),%fp0 |simply return dest | ||
79 | rts | ||
80 | |||
81 | |||
82 | | | ||
83 | | Source is within 2^14 range. To perform the int operation, | ||
84 | | move it to d0. | ||
85 | | | ||
86 | src_in: | ||
87 | fmovex ETEMP(%a6),%fp0 |move in src for int | ||
88 | fmovel #rz_mode,%fpcr |force rz for src conversion | ||
89 | fmovel %fp0,%d0 |int src to d0 | ||
90 | fmovel #0,%FPSR |clr status from above | ||
91 | tstw ETEMP(%a6) |check src sign | ||
92 | blt src_neg | ||
93 | | | ||
94 | | Source is positive. Add the src to the dest exponent. | ||
95 | | The result can be denormalized, if src = 0, or overflow, | ||
96 | | if the result of the add sets a bit in the upper word. | ||
97 | | | ||
98 | src_pos: | ||
99 | tstw %d1 |check for denorm | ||
100 | beq dst_dnrm | ||
101 | addl %d0,%d1 |add src to dest exp | ||
102 | beqs denorm |if zero, result is denorm | ||
103 | cmpil #0x7fff,%d1 |test for overflow | ||
104 | bges ovfl | ||
105 | tstb L_SCR1(%a6) | ||
106 | beqs spos_pos | ||
107 | orw #0x8000,%d1 | ||
108 | spos_pos: | ||
109 | movew %d1,FPTEMP(%a6) |result in FPTEMP | ||
110 | fmovel USER_FPCR(%a6),%FPCR | ||
111 | fmovex FPTEMP(%a6),%fp0 |write result to fp0 | ||
112 | rts | ||
113 | ovfl: | ||
114 | tstb L_SCR1(%a6) | ||
115 | beqs sovl_pos | ||
116 | orw #0x8000,%d1 | ||
117 | sovl_pos: | ||
118 | movew FPTEMP(%a6),ETEMP(%a6) |result in ETEMP | ||
119 | movel FPTEMP_HI(%a6),ETEMP_HI(%a6) | ||
120 | movel FPTEMP_LO(%a6),ETEMP_LO(%a6) | ||
121 | bra t_ovfl2 | ||
122 | |||
123 | denorm: | ||
124 | tstb L_SCR1(%a6) | ||
125 | beqs den_pos | ||
126 | orw #0x8000,%d1 | ||
127 | den_pos: | ||
128 | tstl FPTEMP_HI(%a6) |check j bit | ||
129 | blts nden_exit |if set, not denorm | ||
130 | movew %d1,ETEMP(%a6) |input expected in ETEMP | ||
131 | movel FPTEMP_HI(%a6),ETEMP_HI(%a6) | ||
132 | movel FPTEMP_LO(%a6),ETEMP_LO(%a6) | ||
133 | orl #unfl_bit,USER_FPSR(%a6) |set unfl | ||
134 | leal ETEMP(%a6),%a0 | ||
135 | bra t_resdnrm | ||
136 | nden_exit: | ||
137 | movew %d1,FPTEMP(%a6) |result in FPTEMP | ||
138 | fmovel USER_FPCR(%a6),%FPCR | ||
139 | fmovex FPTEMP(%a6),%fp0 |write result to fp0 | ||
140 | rts | ||
141 | |||
142 | | | ||
143 | | Source is negative. Add the src to the dest exponent. | ||
144 | | (The result exponent will be reduced). The result can be | ||
145 | | denormalized. | ||
146 | | | ||
147 | src_neg: | ||
148 | addl %d0,%d1 |add src to dest | ||
149 | beqs denorm |if zero, result is denorm | ||
150 | blts fix_dnrm |if negative, result is | ||
151 | | ;needing denormalization | ||
152 | tstb L_SCR1(%a6) | ||
153 | beqs sneg_pos | ||
154 | orw #0x8000,%d1 | ||
155 | sneg_pos: | ||
156 | movew %d1,FPTEMP(%a6) |result in FPTEMP | ||
157 | fmovel USER_FPCR(%a6),%FPCR | ||
158 | fmovex FPTEMP(%a6),%fp0 |write result to fp0 | ||
159 | rts | ||
160 | |||
161 | |||
162 | | | ||
163 | | The result exponent is below denorm value. Test for catastrophic | ||
164 | | underflow and force zero if true. If not, try to shift the | ||
165 | | mantissa right until a zero exponent exists. | ||
166 | | | ||
167 | fix_dnrm: | ||
168 | cmpiw #0xffc0,%d1 |lower bound for normalization | ||
169 | blt fix_unfl |if lower, catastrophic unfl | ||
170 | movew %d1,%d0 |use d0 for exp | ||
171 | movel %d2,-(%a7) |free d2 for norm | ||
172 | movel FPTEMP_HI(%a6),%d1 | ||
173 | movel FPTEMP_LO(%a6),%d2 | ||
174 | clrl L_SCR2(%a6) | ||
175 | fix_loop: | ||
176 | addw #1,%d0 |drive d0 to 0 | ||
177 | lsrl #1,%d1 |while shifting the | ||
178 | roxrl #1,%d2 |mantissa to the right | ||
179 | bccs no_carry | ||
180 | st L_SCR2(%a6) |use L_SCR2 to capture inex | ||
181 | no_carry: | ||
182 | tstw %d0 |it is finished when | ||
183 | blts fix_loop |d0 is zero or the mantissa | ||
184 | tstb L_SCR2(%a6) | ||
185 | beqs tst_zero | ||
186 | orl #unfl_inx_mask,USER_FPSR(%a6) | ||
187 | | ;set unfl, aunfl, ainex | ||
188 | | | ||
189 | | Test for zero. If zero, simply use fmove to return +/- zero | ||
190 | | to the fpu. | ||
191 | | | ||
192 | tst_zero: | ||
193 | clrw FPTEMP_EX(%a6) | ||
194 | tstb L_SCR1(%a6) |test for sign | ||
195 | beqs tst_con | ||
196 | orw #0x8000,FPTEMP_EX(%a6) |set sign bit | ||
197 | tst_con: | ||
198 | movel %d1,FPTEMP_HI(%a6) | ||
199 | movel %d2,FPTEMP_LO(%a6) | ||
200 | movel (%a7)+,%d2 | ||
201 | tstl %d1 | ||
202 | bnes not_zero | ||
203 | tstl FPTEMP_LO(%a6) | ||
204 | bnes not_zero | ||
205 | | | ||
206 | | Result is zero. Check for rounding mode to set lsb. If the | ||
207 | | mode is rp, and the zero is positive, return smallest denorm. | ||
208 | | If the mode is rm, and the zero is negative, return smallest | ||
209 | | negative denorm. | ||
210 | | | ||
211 | btstb #5,FPCR_MODE(%a6) |test if rm or rp | ||
212 | beqs no_dir | ||
213 | btstb #4,FPCR_MODE(%a6) |check which one | ||
214 | beqs zer_rm | ||
215 | zer_rp: | ||
216 | tstb L_SCR1(%a6) |check sign | ||
217 | bnes no_dir |if set, neg op, no inc | ||
218 | movel #1,FPTEMP_LO(%a6) |set lsb | ||
219 | bras sm_dnrm | ||
220 | zer_rm: | ||
221 | tstb L_SCR1(%a6) |check sign | ||
222 | beqs no_dir |if clr, neg op, no inc | ||
223 | movel #1,FPTEMP_LO(%a6) |set lsb | ||
224 | orl #neg_mask,USER_FPSR(%a6) |set N | ||
225 | bras sm_dnrm | ||
226 | no_dir: | ||
227 | fmovel USER_FPCR(%a6),%FPCR | ||
228 | fmovex FPTEMP(%a6),%fp0 |use fmove to set cc's | ||
229 | rts | ||
230 | |||
231 | | | ||
232 | | The rounding mode changed the zero to a smallest denorm. Call | ||
233 | | t_resdnrm with exceptional operand in ETEMP. | ||
234 | | | ||
235 | sm_dnrm: | ||
236 | movel FPTEMP_EX(%a6),ETEMP_EX(%a6) | ||
237 | movel FPTEMP_HI(%a6),ETEMP_HI(%a6) | ||
238 | movel FPTEMP_LO(%a6),ETEMP_LO(%a6) | ||
239 | leal ETEMP(%a6),%a0 | ||
240 | bra t_resdnrm | ||
241 | |||
242 | | | ||
243 | | Result is still denormalized. | ||
244 | | | ||
245 | not_zero: | ||
246 | orl #unfl_mask,USER_FPSR(%a6) |set unfl | ||
247 | tstb L_SCR1(%a6) |check for sign | ||
248 | beqs fix_exit | ||
249 | orl #neg_mask,USER_FPSR(%a6) |set N | ||
250 | fix_exit: | ||
251 | bras sm_dnrm | ||
252 | |||
253 | |||
254 | | | ||
255 | | The result has underflowed to zero. Return zero and set | ||
256 | | unfl, aunfl, and ainex. | ||
257 | | | ||
258 | fix_unfl: | ||
259 | orl #unfl_inx_mask,USER_FPSR(%a6) | ||
260 | btstb #5,FPCR_MODE(%a6) |test if rm or rp | ||
261 | beqs no_dir2 | ||
262 | btstb #4,FPCR_MODE(%a6) |check which one | ||
263 | beqs zer_rm2 | ||
264 | zer_rp2: | ||
265 | tstb L_SCR1(%a6) |check sign | ||
266 | bnes no_dir2 |if set, neg op, no inc | ||
267 | clrl FPTEMP_EX(%a6) | ||
268 | clrl FPTEMP_HI(%a6) | ||
269 | movel #1,FPTEMP_LO(%a6) |set lsb | ||
270 | bras sm_dnrm |return smallest denorm | ||
271 | zer_rm2: | ||
272 | tstb L_SCR1(%a6) |check sign | ||
273 | beqs no_dir2 |if clr, neg op, no inc | ||
274 | movew #0x8000,FPTEMP_EX(%a6) | ||
275 | clrl FPTEMP_HI(%a6) | ||
276 | movel #1,FPTEMP_LO(%a6) |set lsb | ||
277 | orl #neg_mask,USER_FPSR(%a6) |set N | ||
278 | bra sm_dnrm |return smallest denorm | ||
279 | |||
280 | no_dir2: | ||
281 | tstb L_SCR1(%a6) | ||
282 | bges pos_zero | ||
283 | neg_zero: | ||
284 | clrl FP_SCR1(%a6) |clear the exceptional operand | ||
285 | clrl FP_SCR1+4(%a6) |for gen_except. | ||
286 | clrl FP_SCR1+8(%a6) | ||
287 | fmoves #0x80000000,%fp0 | ||
288 | rts | ||
289 | pos_zero: | ||
290 | clrl FP_SCR1(%a6) |clear the exceptional operand | ||
291 | clrl FP_SCR1+4(%a6) |for gen_except. | ||
292 | clrl FP_SCR1+8(%a6) | ||
293 | fmoves #0x00000000,%fp0 | ||
294 | rts | ||
295 | |||
296 | | | ||
297 | | The destination is a denormalized number. It must be handled | ||
298 | | by first shifting the bits in the mantissa until it is normalized, | ||
299 | | then adding the remainder of the source to the exponent. | ||
300 | | | ||
301 | dst_dnrm: | ||
302 | moveml %d2/%d3,-(%a7) | ||
303 | movew FPTEMP_EX(%a6),%d1 | ||
304 | movel FPTEMP_HI(%a6),%d2 | ||
305 | movel FPTEMP_LO(%a6),%d3 | ||
306 | dst_loop: | ||
307 | tstl %d2 |test for normalized result | ||
308 | blts dst_norm |exit loop if so | ||
309 | tstl %d0 |otherwise, test shift count | ||
310 | beqs dst_fin |if zero, shifting is done | ||
311 | subil #1,%d0 |dec src | ||
312 | lsll #1,%d3 | ||
313 | roxll #1,%d2 | ||
314 | bras dst_loop | ||
315 | | | ||
316 | | Destination became normalized. Simply add the remaining | ||
317 | | portion of the src to the exponent. | ||
318 | | | ||
319 | dst_norm: | ||
320 | addw %d0,%d1 |dst is normalized; add src | ||
321 | tstb L_SCR1(%a6) | ||
322 | beqs dnrm_pos | ||
323 | orl #0x8000,%d1 | ||
324 | dnrm_pos: | ||
325 | movemw %d1,FPTEMP_EX(%a6) | ||
326 | moveml %d2,FPTEMP_HI(%a6) | ||
327 | moveml %d3,FPTEMP_LO(%a6) | ||
328 | fmovel USER_FPCR(%a6),%FPCR | ||
329 | fmovex FPTEMP(%a6),%fp0 | ||
330 | moveml (%a7)+,%d2/%d3 | ||
331 | rts | ||
332 | |||
333 | | | ||
334 | | Destination remained denormalized. Call t_excdnrm with | ||
335 | | exceptional operand in ETEMP. | ||
336 | | | ||
337 | dst_fin: | ||
338 | tstb L_SCR1(%a6) |check for sign | ||
339 | beqs dst_exit | ||
340 | orl #neg_mask,USER_FPSR(%a6) |set N | ||
341 | orl #0x8000,%d1 | ||
342 | dst_exit: | ||
343 | movemw %d1,ETEMP_EX(%a6) | ||
344 | moveml %d2,ETEMP_HI(%a6) | ||
345 | moveml %d3,ETEMP_LO(%a6) | ||
346 | orl #unfl_mask,USER_FPSR(%a6) |set unfl | ||
347 | moveml (%a7)+,%d2/%d3 | ||
348 | leal ETEMP(%a6),%a0 | ||
349 | bra t_resdnrm | ||
350 | |||
351 | | | ||
352 | | Source is outside of 2^14 range. Test the sign and branch | ||
353 | | to the appropriate exception handler. | ||
354 | | | ||
355 | src_out: | ||
356 | tstb L_SCR1(%a6) | ||
357 | beqs scro_pos | ||
358 | orl #0x8000,%d1 | ||
359 | scro_pos: | ||
360 | movel FPTEMP_HI(%a6),ETEMP_HI(%a6) | ||
361 | movel FPTEMP_LO(%a6),ETEMP_LO(%a6) | ||
362 | tstw ETEMP(%a6) | ||
363 | blts res_neg | ||
364 | res_pos: | ||
365 | movew %d1,ETEMP(%a6) |result in ETEMP | ||
366 | bra t_ovfl2 | ||
367 | res_neg: | ||
368 | movew %d1,ETEMP(%a6) |result in ETEMP | ||
369 | leal ETEMP(%a6),%a0 | ||
370 | bra t_unfl | ||
371 | |end | ||