[PATCH] powerpc: Move arch/ppc*/kernel/vecemu.c to arch/powerpc

This file is the same in both architectures, so create arch/powerpc/kernel
and move it there.

Signed-off-by: Stephen Rothwell <sfr@canb.auug.org.au>
Signed-off-by: Paul Mackerras <paulus@samba.org>
author: Stephen Rothwell <sfr@canb.auug.org.au> 2005-09-19 03:33:25 -0400
committer: Paul Mackerras <paulus@samba.org> 2005-09-21 05:21:07 -0400
commit: 564ee7a5668e8b6d3b369fd807c75c77285c88d4 (patch)
tree: 15eb17f5bcef733122460d57abc99234c15a6542 /arch/ppc
parent: 17b1dc07aebdef9ee43c06525bee702d5f0e9db1 (diff)
2 files changed, 2 insertions, 345 deletions
diff --git a/arch/ppc/kernel/Makefile b/arch/ppc/kernel/Makefile
index 1fb92f16acd6..abf10dcb787b 100644
--- a/arch/ppc/kernel/Makefile
+++ b/arch/ppc/kernel/Makefile
@@ -36,3 +36,5 @@ ifndef CONFIG_MATH_EMULATION
 obj-$(CONFIG_8xx)               += softemu8xx.o
 endif
+# These are here while we do the architecture merge
+vecemu-y                        += ../../powerpc/kernel/vecemu.o
diff --git a/arch/ppc/kernel/vecemu.c b/arch/ppc/kernel/vecemu.c
deleted file mode 100644
index 604d0947cb20..000000000000
--- a/arch/ppc/kernel/vecemu.c
+++ /dev/null
@@ -1,345 +0,0 @@
-/*
- * Routines to emulate some Altivec/VMX instructions, specifically
- * those that can trap when given denormalized operands in Java mode.
- */
-#include <linux/kernel.h>
-#include <linux/errno.h>
-#include <linux/sched.h>
-#include <asm/ptrace.h>
-#include <asm/processor.h>
-#include <asm/uaccess.h>
-/* Functions in vector.S */
-extern void vaddfp(vector128 *dst, vector128 *a, vector128 *b);
-extern void vsubfp(vector128 *dst, vector128 *a, vector128 *b);
-extern void vmaddfp(vector128 *dst, vector128 *a, vector128 *b, vector128 *c);
-extern void vnmsubfp(vector128 *dst, vector128 *a, vector128 *b, vector128 *c);
-extern void vrefp(vector128 *dst, vector128 *src);
-extern void vrsqrtefp(vector128 *dst, vector128 *src);
-extern void vexptep(vector128 *dst, vector128 *src);
-static unsigned int exp2s[8] = {
-        0x800000,
-        0x8b95c2,
-        0x9837f0,
-        0xa5fed7,
-        0xb504f3,
-        0xc5672a,
-        0xd744fd,
-        0xeac0c7
-};
-/*
- * Computes an estimate of 2^x.  The `s' argument is the 32-bit
- * single-precision floating-point representation of x.
- */
-static unsigned int eexp2(unsigned int s)
-{
-        int exp, pwr;
-        unsigned int mant, frac;
-        /* extract exponent field from input */
-        exp = ((s >> 23) & 0xff) - 127;
-        if (exp > 7) {
-                /* check for NaN input */
-                if (exp == 128 && (s & 0x7fffff) != 0)
-                        return s | 0x400000;    /* return QNaN */
-                /* 2^-big = 0, 2^+big = +Inf */
-                return (s & 0x80000000)? 0: 0x7f800000; /* 0 or +Inf */
-        }
-        if (exp < -23)
-                return 0x3f800000;      /* 1.0 */
-        /* convert to fixed point integer in 9.23 representation */
-        pwr = (s & 0x7fffff) | 0x800000;
-        if (exp > 0)
-                pwr <<= exp;
-        else
-                pwr >>= -exp;
-        if (s & 0x80000000)
-                pwr = -pwr;
-        /* extract integer part, which becomes exponent part of result */
-        exp = (pwr >> 23) + 126;
-        if (exp >= 254)
-                return 0x7f800000;
-        if (exp < -23)
-                return 0;
-        /* table lookup on top 3 bits of fraction to get mantissa */
-        mant = exp2s[(pwr >> 20) & 7];
-        /* linear interpolation using remaining 20 bits of fraction */
-        asm("mulhwu %0,%1,%2" : "=r" (frac)
-            : "r" (pwr << 12), "r" (0x172b83ff));
-        asm("mulhwu %0,%1,%2" : "=r" (frac) : "r" (frac), "r" (mant));
-        mant += frac;
-        if (exp >= 0)
-                return mant + (exp << 23);
-        /* denormalized result */
-        exp = -exp;
-        mant += 1 << (exp - 1);
-        return mant >> exp;
-}
-/*
- * Computes an estimate of log_2(x).  The `s' argument is the 32-bit
- * single-precision floating-point representation of x.
- */
-static unsigned int elog2(unsigned int s)
-{
-        int exp, mant, lz, frac;
-        exp = s & 0x7f800000;
-        mant = s & 0x7fffff;
-        if (exp == 0x7f800000) {        /* Inf or NaN */
-                if (mant != 0)
-                        s |= 0x400000;  /* turn NaN into QNaN */
-                return s;
-        }
-        if ((exp | mant) == 0)          /* +0 or -0 */
-                return 0xff800000;      /* return -Inf */
-        if (exp == 0) {
-                /* denormalized */
-                asm("cntlzw %0,%1" : "=r" (lz) : "r" (mant));
-                mant <<= lz - 8;
-                exp = (-118 - lz) << 23;
-        } else {
-                mant |= 0x800000;
-                exp -= 127 << 23;
-        }
-        if (mant >= 0xb504f3) {                         /* 2^0.5 * 2^23 */
-                exp |= 0x400000;                        /* 0.5 * 2^23 */
-                asm("mulhwu %0,%1,%2" : "=r" (mant)
-                    : "r" (mant), "r" (0xb504f334));    /* 2^-0.5 * 2^32 */
-        }
-        if (mant >= 0x9837f0) {                         /* 2^0.25 * 2^23 */
-                exp |= 0x200000;                        /* 0.25 * 2^23 */
-                asm("mulhwu %0,%1,%2" : "=r" (mant)
-                    : "r" (mant), "r" (0xd744fccb));    /* 2^-0.25 * 2^32 */
-        }
-        if (mant >= 0x8b95c2) {                         /* 2^0.125 * 2^23 */
-                exp |= 0x100000;                        /* 0.125 * 2^23 */
-                asm("mulhwu %0,%1,%2" : "=r" (mant)
-                    : "r" (mant), "r" (0xeac0c6e8));    /* 2^-0.125 * 2^32 */
-        }
-        if (mant > 0x800000) {                          /* 1.0 * 2^23 */
-                /* calculate (mant - 1) * 1.381097463 */
-                /* 1.381097463 == 0.125 / (2^0.125 - 1) */
-                asm("mulhwu %0,%1,%2" : "=r" (frac)
-                    : "r" ((mant - 0x800000) << 1), "r" (0xb0c7cd3a));
-                exp += frac;
-        }
-        s = exp & 0x80000000;
-        if (exp != 0) {
-                if (s)
-                        exp = -exp;
-                asm("cntlzw %0,%1" : "=r" (lz) : "r" (exp));
-                lz = 8 - lz;
-                if (lz > 0)
-                        exp >>= lz;
-                else if (lz < 0)
-                        exp <<= -lz;
-                s += ((lz + 126) << 23) + exp;
-        }
-        return s;
-}
-#define VSCR_SAT        1
-static int ctsxs(unsigned int x, int scale, unsigned int *vscrp)
-{
-        int exp, mant;
-        exp = (x >> 23) & 0xff;
-        mant = x & 0x7fffff;
-        if (exp == 255 && mant != 0)
-                return 0;               /* NaN -> 0 */
-        exp = exp - 127 + scale;
-        if (exp < 0)
-                return 0;               /* round towards zero */
-        if (exp >= 31) {
-                /* saturate, unless the result would be -2^31 */
-                if (x + (scale << 23) != 0xcf000000)
-                        *vscrp |= VSCR_SAT;
-                return (x & 0x80000000)? 0x80000000: 0x7fffffff;
-        }
-        mant |= 0x800000;
-        mant = (mant << 7) >> (30 - exp);
-        return (x & 0x80000000)? -mant: mant;
-}
-static unsigned int ctuxs(unsigned int x, int scale, unsigned int *vscrp)
-{
-        int exp;
-        unsigned int mant;
-        exp = (x >> 23) & 0xff;
-        mant = x & 0x7fffff;
-        if (exp == 255 && mant != 0)
-                return 0;               /* NaN -> 0 */
-        exp = exp - 127 + scale;
-        if (exp < 0)
-                return 0;               /* round towards zero */
-        if (x & 0x80000000) {
-                /* negative => saturate to 0 */
-                *vscrp |= VSCR_SAT;
-                return 0;
-        }
-        if (exp >= 32) {
-                /* saturate */
-                *vscrp |= VSCR_SAT;
-                return 0xffffffff;
-        }
-        mant |= 0x800000;
-        mant = (mant << 8) >> (31 - exp);
-        return mant;
-}
-/* Round to floating integer, towards 0 */
-static unsigned int rfiz(unsigned int x)
-{
-        int exp;
-        exp = ((x >> 23) & 0xff) - 127;
-        if (exp == 128 && (x & 0x7fffff) != 0)
-                return x | 0x400000;    /* NaN -> make it a QNaN */
-        if (exp >= 23)
-                return x;               /* it's an integer already (or Inf) */
-        if (exp < 0)
-                return x & 0x80000000;  /* |x| < 1.0 rounds to 0 */
-        return x & ~(0x7fffff >> exp);
-}
-/* Round to floating integer, towards +/- Inf */
-static unsigned int rfii(unsigned int x)
-{
-        int exp, mask;
-        exp = ((x >> 23) & 0xff) - 127;
-        if (exp == 128 && (x & 0x7fffff) != 0)
-                return x | 0x400000;    /* NaN -> make it a QNaN */
-        if (exp >= 23)
-                return x;               /* it's an integer already (or Inf) */
-        if ((x & 0x7fffffff) == 0)
-                return x;               /* +/-0 -> +/-0 */
-        if (exp < 0)
-                /* 0 < |x| < 1.0 rounds to +/- 1.0 */
-                return (x & 0x80000000) | 0x3f800000;
-        mask = 0x7fffff >> exp;
-        /* mantissa overflows into exponent - that's OK,
-           it can't overflow into the sign bit */
-        return (x + mask) & ~mask;
-}
-/* Round to floating integer, to nearest */
-static unsigned int rfin(unsigned int x)
-{
-        int exp, half;
-        exp = ((x >> 23) & 0xff) - 127;
-        if (exp == 128 && (x & 0x7fffff) != 0)
-                return x | 0x400000;    /* NaN -> make it a QNaN */
-        if (exp >= 23)
-                return x;               /* it's an integer already (or Inf) */
-        if (exp < -1)
-                return x & 0x80000000;  /* |x| < 0.5 -> +/-0 */
-        if (exp == -1)
-                /* 0.5 <= |x| < 1.0 rounds to +/- 1.0 */
-                return (x & 0x80000000) | 0x3f800000;
-        half = 0x400000 >> exp;
-        /* add 0.5 to the magnitude and chop off the fraction bits */
-        return (x + half) & ~(0x7fffff >> exp);
-}
-int emulate_altivec(struct pt_regs *regs)
-{
-        unsigned int instr, i;
-        unsigned int va, vb, vc, vd;
-        vector128 *vrs;
-        if (get_user(instr, (unsigned int __user *) regs->nip))
-                return -EFAULT;
-        if ((instr >> 26) != 4)
-                return -EINVAL;         /* not an altivec instruction */
-        vd = (instr >> 21) & 0x1f;
-        va = (instr >> 16) & 0x1f;
-        vb = (instr >> 11) & 0x1f;
-        vc = (instr >> 6) & 0x1f;
-        vrs = current->thread.vr;
-        switch (instr & 0x3f) {
-        case 10:
-                switch (vc) {
-                case 0: /* vaddfp */
-                        vaddfp(&vrs[vd], &vrs[va], &vrs[vb]);
-                        break;
-                case 1: /* vsubfp */
-                        vsubfp(&vrs[vd], &vrs[va], &vrs[vb]);
-                        break;
-                case 4: /* vrefp */
-                        vrefp(&vrs[vd], &vrs[vb]);
-                        break;
-                case 5: /* vrsqrtefp */
-                        vrsqrtefp(&vrs[vd], &vrs[vb]);
-                        break;
-                case 6: /* vexptefp */
-                        for (i = 0; i < 4; ++i)
-                                vrs[vd].u[i] = eexp2(vrs[vb].u[i]);
-                        break;
-                case 7: /* vlogefp */
-                        for (i = 0; i < 4; ++i)
-                                vrs[vd].u[i] = elog2(vrs[vb].u[i]);
-                        break;
-                case 8:         /* vrfin */
-                        for (i = 0; i < 4; ++i)
-                                vrs[vd].u[i] = rfin(vrs[vb].u[i]);
-                        break;
-                case 9:         /* vrfiz */
-                        for (i = 0; i < 4; ++i)
-                                vrs[vd].u[i] = rfiz(vrs[vb].u[i]);
-                        break;
-                case 10:        /* vrfip */
-                        for (i = 0; i < 4; ++i) {
-                                u32 x = vrs[vb].u[i];
-                                x = (x & 0x80000000)? rfiz(x): rfii(x);
-                                vrs[vd].u[i] = x;
-                        }
-                        break;
-                case 11:        /* vrfim */
-                        for (i = 0; i < 4; ++i) {
-                                u32 x = vrs[vb].u[i];
-                                x = (x & 0x80000000)? rfii(x): rfiz(x);
-                                vrs[vd].u[i] = x;
-                        }
-                        break;
-                case 14:        /* vctuxs */
-                        for (i = 0; i < 4; ++i)
-                                vrs[vd].u[i] = ctuxs(vrs[vb].u[i], va,
-                                                &current->thread.vscr.u[3]);
-                        break;
-                case 15:        /* vctsxs */
-                        for (i = 0; i < 4; ++i)
-                                vrs[vd].u[i] = ctsxs(vrs[vb].u[i], va,
-                                                &current->thread.vscr.u[3]);
-                        break;
-                default:
-                        return -EINVAL;
-                }
-                break;
-        case 46:        /* vmaddfp */
-                vmaddfp(&vrs[vd], &vrs[va], &vrs[vb], &vrs[vc]);
-                break;
-        case 47:        /* vnmsubfp */
-                vnmsubfp(&vrs[vd], &vrs[va], &vrs[vb], &vrs[vc]);
-                break;
-        default:
-                return -EINVAL;
-        }
-        return 0;
-}
author	Stephen Rothwell <sfr@canb.auug.org.au>	2005-09-19 03:33:25 -0400
committer	Paul Mackerras <paulus@samba.org>	2005-09-21 05:21:07 -0400
commit	564ee7a5668e8b6d3b369fd807c75c77285c88d4 (patch)
tree	15eb17f5bcef733122460d57abc99234c15a6542 /arch/ppc
parent	17b1dc07aebdef9ee43c06525bee702d5f0e9db1 (diff)

diff --git a/arch/ppc/kernel/Makefile b/arch/ppc/kernel/Makefile
index 1fb92f16acd6..abf10dcb787b 100644
--- a/arch/ppc/kernel/Makefile
+++ b/arch/ppc/kernel/Makefile
@@ -36,3 +36,5 @@ ifndef CONFIG_MATH_EMULATION
36	obj-$(CONFIG_8xx) += softemu8xx.o	36	obj-$(CONFIG_8xx) += softemu8xx.o
37	endif	37	endif
38		38
		39	# These are here while we do the architecture merge
		40	vecemu-y += ../../powerpc/kernel/vecemu.o


diff --git a/arch/ppc/kernel/vecemu.c b/arch/ppc/kernel/vecemu.c
deleted file mode 100644
index 604d0947cb20..000000000000
--- a/arch/ppc/kernel/vecemu.c
+++ /dev/null
@@ -1,345 +0,0 @@
1	/*
2	* Routines to emulate some Altivec/VMX instructions, specifically
3	* those that can trap when given denormalized operands in Java mode.
4	*/
5	#include <linux/kernel.h>
6	#include <linux/errno.h>
7	#include <linux/sched.h>
8	#include <asm/ptrace.h>
9	#include <asm/processor.h>
10	#include <asm/uaccess.h>
11
12	/* Functions in vector.S */
13	extern void vaddfp(vector128 *dst, vector128 *a, vector128 *b);
14	extern void vsubfp(vector128 *dst, vector128 *a, vector128 *b);
15	extern void vmaddfp(vector128 *dst, vector128 *a, vector128 *b, vector128 *c);
16	extern void vnmsubfp(vector128 *dst, vector128 *a, vector128 *b, vector128 *c);
17	extern void vrefp(vector128 *dst, vector128 *src);
18	extern void vrsqrtefp(vector128 *dst, vector128 *src);
19	extern void vexptep(vector128 *dst, vector128 *src);
20
21	static unsigned int exp2s[8] = {
22	0x800000,
23	0x8b95c2,
24	0x9837f0,
25	0xa5fed7,
26	0xb504f3,
27	0xc5672a,
28	0xd744fd,
29	0xeac0c7
30	};
31
32	/*
33	* Computes an estimate of 2^x. The `s' argument is the 32-bit
34	* single-precision floating-point representation of x.
35	*/
36	static unsigned int eexp2(unsigned int s)
37	{
38	int exp, pwr;
39	unsigned int mant, frac;
40
41	/* extract exponent field from input */
42	exp = ((s >> 23) & 0xff) - 127;
43	if (exp > 7) {
44	/* check for NaN input */
45	if (exp == 128 && (s & 0x7fffff) != 0)
46	return s | 0x400000; /* return QNaN */
47	/* 2^-big = 0, 2^+big = +Inf */
48	return (s & 0x80000000)? 0: 0x7f800000; /* 0 or +Inf */
49	}
50	if (exp < -23)
51	return 0x3f800000; /* 1.0 */
52
53	/* convert to fixed point integer in 9.23 representation */
54	pwr = (s & 0x7fffff) | 0x800000;
55	if (exp > 0)
56	pwr <<= exp;
57	else
58	pwr >>= -exp;
59	if (s & 0x80000000)
60	pwr = -pwr;
61
62	/* extract integer part, which becomes exponent part of result */
63	exp = (pwr >> 23) + 126;
64	if (exp >= 254)
65	return 0x7f800000;
66	if (exp < -23)
67	return 0;
68
69	/* table lookup on top 3 bits of fraction to get mantissa */
70	mant = exp2s[(pwr >> 20) & 7];
71
72	/* linear interpolation using remaining 20 bits of fraction */
73	asm("mulhwu %0,%1,%2" : "=r" (frac)
74	: "r" (pwr << 12), "r" (0x172b83ff));
75	asm("mulhwu %0,%1,%2" : "=r" (frac) : "r" (frac), "r" (mant));
76	mant += frac;
77
78	if (exp >= 0)
79	return mant + (exp << 23);
80
81	/* denormalized result */
82	exp = -exp;
83	mant += 1 << (exp - 1);
84	return mant >> exp;
85	}
86
87	/*
88	* Computes an estimate of log_2(x). The `s' argument is the 32-bit
89	* single-precision floating-point representation of x.
90	*/
91	static unsigned int elog2(unsigned int s)
92	{
93	int exp, mant, lz, frac;
94
95	exp = s & 0x7f800000;
96	mant = s & 0x7fffff;
97	if (exp == 0x7f800000) { /* Inf or NaN */
98	if (mant != 0)
99	s |= 0x400000; /* turn NaN into QNaN */
100	return s;
101	}
102	if ((exp | mant) == 0) /* +0 or -0 */
103	return 0xff800000; /* return -Inf */
104
105	if (exp == 0) {
106	/* denormalized */
107	asm("cntlzw %0,%1" : "=r" (lz) : "r" (mant));
108	mant <<= lz - 8;
109	exp = (-118 - lz) << 23;
110	} else {
111	mant |= 0x800000;
112	exp -= 127 << 23;
113	}
114
115	if (mant >= 0xb504f3) { /* 2^0.5 * 2^23 */
116	exp |= 0x400000; /* 0.5 * 2^23 */
117	asm("mulhwu %0,%1,%2" : "=r" (mant)
118	: "r" (mant), "r" (0xb504f334)); /* 2^-0.5 * 2^32 */
119	}
120	if (mant >= 0x9837f0) { /* 2^0.25 * 2^23 */
121	exp |= 0x200000; /* 0.25 * 2^23 */
122	asm("mulhwu %0,%1,%2" : "=r" (mant)
123	: "r" (mant), "r" (0xd744fccb)); /* 2^-0.25 * 2^32 */
124	}
125	if (mant >= 0x8b95c2) { /* 2^0.125 * 2^23 */
126	exp |= 0x100000; /* 0.125 * 2^23 */
127	asm("mulhwu %0,%1,%2" : "=r" (mant)
128	: "r" (mant), "r" (0xeac0c6e8)); /* 2^-0.125 * 2^32 */
129	}
130	if (mant > 0x800000) { /* 1.0 * 2^23 */
131	/* calculate (mant - 1) * 1.381097463 */
132	/* 1.381097463 == 0.125 / (2^0.125 - 1) */
133	asm("mulhwu %0,%1,%2" : "=r" (frac)
134	: "r" ((mant - 0x800000) << 1), "r" (0xb0c7cd3a));
135	exp += frac;
136	}
137	s = exp & 0x80000000;
138	if (exp != 0) {
139	if (s)
140	exp = -exp;
141	asm("cntlzw %0,%1" : "=r" (lz) : "r" (exp));
142	lz = 8 - lz;
143	if (lz > 0)
144	exp >>= lz;
145	else if (lz < 0)
146	exp <<= -lz;
147	s += ((lz + 126) << 23) + exp;
148	}
149	return s;
150	}
151
152	#define VSCR_SAT 1
153
154	static int ctsxs(unsigned int x, int scale, unsigned int *vscrp)
155	{
156	int exp, mant;
157
158	exp = (x >> 23) & 0xff;
159	mant = x & 0x7fffff;
160	if (exp == 255 && mant != 0)
161	return 0; /* NaN -> 0 */
162	exp = exp - 127 + scale;
163	if (exp < 0)
164	return 0; /* round towards zero */
165	if (exp >= 31) {
166	/* saturate, unless the result would be -2^31 */
167	if (x + (scale << 23) != 0xcf000000)
168	*vscrp |= VSCR_SAT;
169	return (x & 0x80000000)? 0x80000000: 0x7fffffff;
170	}
171	mant |= 0x800000;
172	mant = (mant << 7) >> (30 - exp);
173	return (x & 0x80000000)? -mant: mant;
174	}
175
176	static unsigned int ctuxs(unsigned int x, int scale, unsigned int *vscrp)
177	{
178	int exp;
179	unsigned int mant;
180
181	exp = (x >> 23) & 0xff;
182	mant = x & 0x7fffff;
183	if (exp == 255 && mant != 0)
184	return 0; /* NaN -> 0 */
185	exp = exp - 127 + scale;
186	if (exp < 0)
187	return 0; /* round towards zero */
188	if (x & 0x80000000) {
189	/* negative => saturate to 0 */
190	*vscrp |= VSCR_SAT;
191	return 0;
192	}
193	if (exp >= 32) {
194	/* saturate */
195	*vscrp |= VSCR_SAT;
196	return 0xffffffff;
197	}
198	mant |= 0x800000;
199	mant = (mant << 8) >> (31 - exp);
200	return mant;
201	}
202
203	/* Round to floating integer, towards 0 */
204	static unsigned int rfiz(unsigned int x)
205	{
206	int exp;
207
208	exp = ((x >> 23) & 0xff) - 127;
209	if (exp == 128 && (x & 0x7fffff) != 0)
210	return x | 0x400000; /* NaN -> make it a QNaN */
211	if (exp >= 23)
212	return x; /* it's an integer already (or Inf) */
213	if (exp < 0)
214	return x & 0x80000000; /* |x| < 1.0 rounds to 0 */
215	return x & ~(0x7fffff >> exp);
216	}
217
218	/* Round to floating integer, towards +/- Inf */
219	static unsigned int rfii(unsigned int x)
220	{
221	int exp, mask;
222
223	exp = ((x >> 23) & 0xff) - 127;
224	if (exp == 128 && (x & 0x7fffff) != 0)
225	return x | 0x400000; /* NaN -> make it a QNaN */
226	if (exp >= 23)
227	return x; /* it's an integer already (or Inf) */
228	if ((x & 0x7fffffff) == 0)
229	return x; /* +/-0 -> +/-0 */
230	if (exp < 0)
231	/* 0 < |x| < 1.0 rounds to +/- 1.0 */
232	return (x & 0x80000000) | 0x3f800000;
233	mask = 0x7fffff >> exp;
234	/* mantissa overflows into exponent - that's OK,
235	it can't overflow into the sign bit */
236	return (x + mask) & ~mask;
237	}
238
239	/* Round to floating integer, to nearest */
240	static unsigned int rfin(unsigned int x)
241	{
242	int exp, half;
243
244	exp = ((x >> 23) & 0xff) - 127;
245	if (exp == 128 && (x & 0x7fffff) != 0)
246	return x | 0x400000; /* NaN -> make it a QNaN */
247	if (exp >= 23)
248	return x; /* it's an integer already (or Inf) */
249	if (exp < -1)
250	return x & 0x80000000; /* |x| < 0.5 -> +/-0 */
251	if (exp == -1)
252	/* 0.5 <= |x| < 1.0 rounds to +/- 1.0 */
253	return (x & 0x80000000) | 0x3f800000;
254	half = 0x400000 >> exp;
255	/* add 0.5 to the magnitude and chop off the fraction bits */
256	return (x + half) & ~(0x7fffff >> exp);
257	}
258
259	int emulate_altivec(struct pt_regs *regs)
260	{
261	unsigned int instr, i;
262	unsigned int va, vb, vc, vd;
263	vector128 *vrs;
264
265	if (get_user(instr, (unsigned int __user *) regs->nip))
266	return -EFAULT;
267	if ((instr >> 26) != 4)
268	return -EINVAL; /* not an altivec instruction */
269	vd = (instr >> 21) & 0x1f;
270	va = (instr >> 16) & 0x1f;
271	vb = (instr >> 11) & 0x1f;
272	vc = (instr >> 6) & 0x1f;
273
274	vrs = current->thread.vr;
275	switch (instr & 0x3f) {
276	case 10:
277	switch (vc) {
278	case 0: /* vaddfp */
279	vaddfp(&vrs[vd], &vrs[va], &vrs[vb]);
280	break;
281	case 1: /* vsubfp */
282	vsubfp(&vrs[vd], &vrs[va], &vrs[vb]);
283	break;
284	case 4: /* vrefp */
285	vrefp(&vrs[vd], &vrs[vb]);
286	break;
287	case 5: /* vrsqrtefp */
288	vrsqrtefp(&vrs[vd], &vrs[vb]);
289	break;
290	case 6: /* vexptefp */
291	for (i = 0; i < 4; ++i)
292	vrs[vd].u[i] = eexp2(vrs[vb].u[i]);
293	break;
294	case 7: /* vlogefp */
295	for (i = 0; i < 4; ++i)
296	vrs[vd].u[i] = elog2(vrs[vb].u[i]);
297	break;
298	case 8: /* vrfin */
299	for (i = 0; i < 4; ++i)
300	vrs[vd].u[i] = rfin(vrs[vb].u[i]);
301	break;
302	case 9: /* vrfiz */
303	for (i = 0; i < 4; ++i)
304	vrs[vd].u[i] = rfiz(vrs[vb].u[i]);
305	break;
306	case 10: /* vrfip */
307	for (i = 0; i < 4; ++i) {
308	u32 x = vrs[vb].u[i];
309	x = (x & 0x80000000)? rfiz(x): rfii(x);
310	vrs[vd].u[i] = x;
311	}
312	break;
313	case 11: /* vrfim */
314	for (i = 0; i < 4; ++i) {
315	u32 x = vrs[vb].u[i];
316	x = (x & 0x80000000)? rfii(x): rfiz(x);
317	vrs[vd].u[i] = x;
318	}
319	break;
320	case 14: /* vctuxs */
321	for (i = 0; i < 4; ++i)
322	vrs[vd].u[i] = ctuxs(vrs[vb].u[i], va,
323	&current->thread.vscr.u[3]);
324	break;
325	case 15: /* vctsxs */
326	for (i = 0; i < 4; ++i)
327	vrs[vd].u[i] = ctsxs(vrs[vb].u[i], va,
328	&current->thread.vscr.u[3]);
329	break;
330	default:
331	return -EINVAL;
332	}
333	break;
334	case 46: /* vmaddfp */
335	vmaddfp(&vrs[vd], &vrs[va], &vrs[vb], &vrs[vc]);
336	break;
337	case 47: /* vnmsubfp */
338	vnmsubfp(&vrs[vd], &vrs[va], &vrs[vb], &vrs[vc]);
339	break;
340	default:
341	return -EINVAL;
342	}
343
344	return 0;
345	}