diff options
author | Atsushi Nemoto <anemo@mba.ocn.ne.jp> | 2006-12-17 10:07:40 -0500 |
---|---|---|
committer | Ralf Baechle <ralf@linux-mips.org> | 2007-02-06 11:53:12 -0500 |
commit | a583158c9ce822c96a718fbf877cec1e5f9ad75d (patch) | |
tree | d253705a57eab4ed485d1eebc55b6e5ad7b81969 | |
parent | c44e8d5e47b8ba672440b92eab0735628469116c (diff) |
[MIPS] Unify memset.S
The 32-bit and 64-bit versions are almost identical, so unify them.
This makes further improvements (for example, supporting CDEX)
easier.
Signed-off-by: Atsushi Nemoto <anemo@mba.ocn.ne.jp>
Signed-off-by: Ralf Baechle <ralf@linux-mips.org>
-rw-r--r-- | arch/mips/lib-32/Makefile | 2 | ||||
-rw-r--r-- | arch/mips/lib-64/Makefile | 2 | ||||
-rw-r--r-- | arch/mips/lib-64/memset.S | 142 | ||||
-rw-r--r-- | arch/mips/lib/Makefile | 2 | ||||
-rw-r--r-- | arch/mips/lib/memset.S (renamed from arch/mips/lib-32/memset.S) | 35 |
5 files changed, 31 insertions, 152 deletions
diff --git a/arch/mips/lib-32/Makefile b/arch/mips/lib-32/Makefile index dcd4d2ed2ac4..2036cf5e6857 100644 --- a/arch/mips/lib-32/Makefile +++ b/arch/mips/lib-32/Makefile | |||
@@ -2,7 +2,7 @@ | |||
2 | # Makefile for MIPS-specific library files.. | 2 | # Makefile for MIPS-specific library files.. |
3 | # | 3 | # |
4 | 4 | ||
5 | lib-y += memset.o watch.o | 5 | lib-y += watch.o |
6 | 6 | ||
7 | obj-$(CONFIG_CPU_MIPS32) += dump_tlb.o | 7 | obj-$(CONFIG_CPU_MIPS32) += dump_tlb.o |
8 | obj-$(CONFIG_CPU_MIPS64) += dump_tlb.o | 8 | obj-$(CONFIG_CPU_MIPS64) += dump_tlb.o |
diff --git a/arch/mips/lib-64/Makefile b/arch/mips/lib-64/Makefile index dcd4d2ed2ac4..2036cf5e6857 100644 --- a/arch/mips/lib-64/Makefile +++ b/arch/mips/lib-64/Makefile | |||
@@ -2,7 +2,7 @@ | |||
2 | # Makefile for MIPS-specific library files.. | 2 | # Makefile for MIPS-specific library files.. |
3 | # | 3 | # |
4 | 4 | ||
5 | lib-y += memset.o watch.o | 5 | lib-y += watch.o |
6 | 6 | ||
7 | obj-$(CONFIG_CPU_MIPS32) += dump_tlb.o | 7 | obj-$(CONFIG_CPU_MIPS32) += dump_tlb.o |
8 | obj-$(CONFIG_CPU_MIPS64) += dump_tlb.o | 8 | obj-$(CONFIG_CPU_MIPS64) += dump_tlb.o |
diff --git a/arch/mips/lib-64/memset.S b/arch/mips/lib-64/memset.S deleted file mode 100644 index e2c42c85113b..000000000000 --- a/arch/mips/lib-64/memset.S +++ /dev/null | |||
@@ -1,142 +0,0 @@ | |||
1 | /* | ||
2 | * This file is subject to the terms and conditions of the GNU General Public | ||
3 | * License. See the file "COPYING" in the main directory of this archive | ||
4 | * for more details. | ||
5 | * | ||
6 | * Copyright (C) 1998, 1999, 2000 by Ralf Baechle | ||
7 | * Copyright (C) 1999, 2000 Silicon Graphics, Inc. | ||
8 | */ | ||
9 | #include <asm/asm.h> | ||
10 | #include <asm/asm-offsets.h> | ||
11 | #include <asm/regdef.h> | ||
12 | |||
13 | #define EX(insn,reg,addr,handler) /* emit insn plus an __ex_table entry for it */ \ | ||
14 | 9: insn reg, addr; /* label 9 marks the instruction that may fault */ \ | ||
15 | .section __ex_table,"a"; \ | ||
16 | PTR 9b, handler; /* record the pair (address of insn, handler) */ \ | ||
17 | .previous | ||
18 | |||
19 | .macro f_fill64 dst, offset, val, fixup /* eight consecutive LONG_S stores of val, each with fixup as its fault handler */ | ||
20 | EX(LONG_S, \val, (\offset + 0 * LONGSIZE)(\dst), \fixup) | ||
21 | EX(LONG_S, \val, (\offset + 1 * LONGSIZE)(\dst), \fixup) | ||
22 | EX(LONG_S, \val, (\offset + 2 * LONGSIZE)(\dst), \fixup) | ||
23 | EX(LONG_S, \val, (\offset + 3 * LONGSIZE)(\dst), \fixup) | ||
24 | EX(LONG_S, \val, (\offset + 4 * LONGSIZE)(\dst), \fixup) | ||
25 | EX(LONG_S, \val, (\offset + 5 * LONGSIZE)(\dst), \fixup) | ||
26 | EX(LONG_S, \val, (\offset + 6 * LONGSIZE)(\dst), \fixup) | ||
27 | EX(LONG_S, \val, (\offset + 7 * LONGSIZE)(\dst), \fixup) | ||
28 | .endm | ||
29 | |||
30 | /* | ||
31 | * memset(void *s, int c, size_t n) | ||
32 | * Returns s in v0; a2 is zeroed on normal return. | ||
33 | * a0: start of area to clear | ||
34 | * a1: char to fill with | ||
35 | * a2: size of area to clear | ||
36 | */ | ||
37 | .set noreorder | ||
38 | .align 5 | ||
39 | LEAF(memset) | ||
40 | beqz a1, 1f /* zero fill needs no spreading */ | ||
41 | move v0, a0 /* result (delay slot, always executed) */ | ||
42 | |||
43 | andi a1, 0xff /* spread fillword */ | ||
44 | dsll t1, a1, 8 | ||
45 | or a1, t1 /* fill byte now in the low 16 bits */ | ||
46 | dsll t1, a1, 16 | ||
47 | or a1, t1 /* ... in the low 32 bits */ | ||
48 | dsll t1, a1, 32 | ||
49 | or a1, t1 /* ... in all 64 bits */ | ||
50 | 1: | ||
51 | |||
52 | FEXPORT(__bzero) | ||
53 | sltiu t0, a2, LONGSIZE /* very small region? */ | ||
54 | bnez t0, small_memset | ||
55 | andi t0, a0, LONGMASK /* aligned? */ | ||
56 | |||
57 | beqz t0, 1f /* already long aligned */ | ||
58 | PTR_SUBU t0, LONGSIZE /* t0 = minus the bytes up to the next long boundary */ | ||
59 | |||
60 | #ifdef __MIPSEB__ | ||
61 | EX(sdl, a1, (a0), first_fixup) /* make dword aligned */ | ||
62 | #endif | ||
63 | #ifdef __MIPSEL__ | ||
64 | EX(sdr, a1, (a0), first_fixup) /* make dword aligned */ | ||
65 | #endif | ||
66 | PTR_SUBU a0, t0 /* long align ptr */ | ||
67 | PTR_ADDU a2, t0 /* correct size */ | ||
68 | |||
69 | 1: ori t1, a2, 0x3f /* t1 = a2 with the low 6 bits cleared: bytes in full 64-byte blocks */ | ||
70 | xori t1, 0x3f | ||
71 | beqz t1, memset_partial /* no block to fill */ | ||
72 | andi t0, a2, 0x38 /* bytes of whole longs in the partial block */ | ||
73 | |||
74 | PTR_ADDU t1, a0 /* end address */ | ||
75 | .set reorder | ||
76 | 1: PTR_ADDIU a0, 64 /* one 64-byte block per iteration */ | ||
77 | f_fill64 a0, -64, a1, fwd_fixup | ||
78 | bne t1, a0, 1b | ||
79 | .set noreorder | ||
80 | |||
81 | memset_partial: | ||
82 | PTR_LA t1, 2f /* where to start */ | ||
83 | .set noat | ||
84 | dsrl AT, t0, 1 /* each 8-byte store is one 4-byte instruction */ | ||
85 | PTR_SUBU t1, AT /* jump into the tail of the unrolled stores */ | ||
86 | .set at /* hand AT back to the assembler */ | ||
87 | jr t1 | ||
88 | PTR_ADDU a0, t0 /* dest ptr */ | ||
89 | |||
90 | .set push | ||
91 | .set noreorder | ||
92 | .set nomacro | ||
93 | f_fill64 a0, -64, a1, partial_fixup /* ... but first do longs ... */ | ||
94 | 2: .set pop | ||
95 | andi a2, LONGMASK /* At most one long to go */ | ||
96 | |||
97 | beqz a2, 1f /* nothing left */ | ||
98 | PTR_ADDU a0, a2 /* What's left */ | ||
99 | #ifdef __MIPSEB__ | ||
100 | EX(sdr, a1, -1(a0), last_fixup) | ||
101 | #endif | ||
102 | #ifdef __MIPSEL__ | ||
103 | EX(sdl, a1, -1(a0), last_fixup) | ||
104 | #endif | ||
105 | 1: jr ra | ||
106 | move a2, zero /* a2 = 0 on normal return */ | ||
107 | |||
108 | small_memset: | ||
109 | beqz a2, 2f /* empty region */ | ||
110 | PTR_ADDU t1, a0, a2 /* t1 = end address */ | ||
111 | |||
112 | 1: PTR_ADDIU a0, 1 /* fill bytewise */ | ||
113 | bne t1, a0, 1b | ||
114 | sb a1, -1(a0) /* store in the delay slot, after a0 was advanced */ | ||
115 | |||
116 | 2: jr ra /* done */ | ||
117 | move a2, zero /* a2 = 0 on normal return */ | ||
118 | END(memset) | ||
119 | |||
120 | first_fixup: /* handler for the initial unaligned sdl/sdr store */ | ||
121 | jr ra | ||
122 | nop /* a2 has not been adjusted yet at that store, so it is returned as passed in */ | ||
123 | |||
124 | fwd_fixup: /* handler for the stores in the 64-byte block loop */ | ||
125 | PTR_L t0, TI_TASK($28) | ||
126 | LONG_L t0, THREAD_BUADDR(t0) /* presumably the faulting address - TODO confirm */ | ||
127 | andi a2, 0x3f /* bytes that follow the full blocks */ | ||
128 | LONG_ADDU a2, t1 /* t1 is the end address of the full blocks */ | ||
129 | jr ra | ||
130 | LONG_SUBU a2, t0 /* delay slot: a2 = (a2 & 0x3f) + t1 - t0 */ | ||
131 | |||
132 | partial_fixup: /* handler for the stores in the memset_partial block */ | ||
133 | PTR_L t0, TI_TASK($28) | ||
134 | LONG_L t0, THREAD_BUADDR(t0) /* presumably the faulting address - TODO confirm */ | ||
135 | andi a2, LONGMASK /* bytes that follow the partial block */ | ||
136 | LONG_ADDU a2, a0 /* a0 is the end of the partial block; t1 holds the code jump target here */ | ||
137 | jr ra | ||
138 | LONG_SUBU a2, t0 /* delay slot: a2 = (a2 & LONGMASK) + a0 - t0 */ | ||
139 | |||
140 | last_fixup: /* handler for the final partial-long sdr/sdl store */ | ||
141 | jr ra | ||
142 | nop /* a2 was already masked with LONGMASK before the store; do not clobber v1 */ | ||
diff --git a/arch/mips/lib/Makefile b/arch/mips/lib/Makefile index 989c900b8b14..5ad501b30b43 100644 --- a/arch/mips/lib/Makefile +++ b/arch/mips/lib/Makefile | |||
@@ -2,7 +2,7 @@ | |||
2 | # Makefile for MIPS-specific library files.. | 2 | # Makefile for MIPS-specific library files.. |
3 | # | 3 | # |
4 | 4 | ||
5 | lib-y += csum_partial.o memcpy.o promlib.o \ | 5 | lib-y += csum_partial.o memcpy.o memset.o promlib.o \ |
6 | strlen_user.o strncpy_user.o strnlen_user.o uncached.o | 6 | strlen_user.o strncpy_user.o strnlen_user.o uncached.o |
7 | 7 | ||
8 | obj-y += iomap.o | 8 | obj-y += iomap.o |
diff --git a/arch/mips/lib-32/memset.S b/arch/mips/lib/memset.S index 1981485bd48b..3f8b8b3d0b23 100644 --- a/arch/mips/lib-32/memset.S +++ b/arch/mips/lib/memset.S | |||
@@ -10,6 +10,14 @@ | |||
10 | #include <asm/asm-offsets.h> | 10 | #include <asm/asm-offsets.h> |
11 | #include <asm/regdef.h> | 11 | #include <asm/regdef.h> |
12 | 12 | ||
13 | #if LONGSIZE == 4 | ||
14 | #define LONG_S_L swl | ||
15 | #define LONG_S_R swr | ||
16 | #else | ||
17 | #define LONG_S_L sdl | ||
18 | #define LONG_S_R sdr | ||
19 | #endif | ||
20 | |||
13 | #define EX(insn,reg,addr,handler) \ | 21 | #define EX(insn,reg,addr,handler) \ |
14 | 9: insn reg, addr; \ | 22 | 9: insn reg, addr; \ |
15 | .section __ex_table,"a"; \ | 23 | .section __ex_table,"a"; \ |
@@ -25,6 +33,7 @@ | |||
25 | EX(LONG_S, \val, (\offset + 5 * LONGSIZE)(\dst), \fixup) | 33 | EX(LONG_S, \val, (\offset + 5 * LONGSIZE)(\dst), \fixup) |
26 | EX(LONG_S, \val, (\offset + 6 * LONGSIZE)(\dst), \fixup) | 34 | EX(LONG_S, \val, (\offset + 6 * LONGSIZE)(\dst), \fixup) |
27 | EX(LONG_S, \val, (\offset + 7 * LONGSIZE)(\dst), \fixup) | 35 | EX(LONG_S, \val, (\offset + 7 * LONGSIZE)(\dst), \fixup) |
36 | #if LONGSIZE == 4 | ||
28 | EX(LONG_S, \val, (\offset + 8 * LONGSIZE)(\dst), \fixup) | 37 | EX(LONG_S, \val, (\offset + 8 * LONGSIZE)(\dst), \fixup) |
29 | EX(LONG_S, \val, (\offset + 9 * LONGSIZE)(\dst), \fixup) | 38 | EX(LONG_S, \val, (\offset + 9 * LONGSIZE)(\dst), \fixup) |
30 | EX(LONG_S, \val, (\offset + 10 * LONGSIZE)(\dst), \fixup) | 39 | EX(LONG_S, \val, (\offset + 10 * LONGSIZE)(\dst), \fixup) |
@@ -33,6 +42,7 @@ | |||
33 | EX(LONG_S, \val, (\offset + 13 * LONGSIZE)(\dst), \fixup) | 42 | EX(LONG_S, \val, (\offset + 13 * LONGSIZE)(\dst), \fixup) |
34 | EX(LONG_S, \val, (\offset + 14 * LONGSIZE)(\dst), \fixup) | 43 | EX(LONG_S, \val, (\offset + 14 * LONGSIZE)(\dst), \fixup) |
35 | EX(LONG_S, \val, (\offset + 15 * LONGSIZE)(\dst), \fixup) | 44 | EX(LONG_S, \val, (\offset + 15 * LONGSIZE)(\dst), \fixup) |
45 | #endif | ||
36 | .endm | 46 | .endm |
37 | 47 | ||
38 | /* | 48 | /* |
@@ -49,9 +59,13 @@ LEAF(memset) | |||
49 | move v0, a0 /* result */ | 59 | move v0, a0 /* result */ |
50 | 60 | ||
51 | andi a1, 0xff /* spread fillword */ | 61 | andi a1, 0xff /* spread fillword */ |
52 | sll t1, a1, 8 | 62 | LONG_SLL t1, a1, 8 |
53 | or a1, t1 | 63 | or a1, t1 |
54 | sll t1, a1, 16 | 64 | LONG_SLL t1, a1, 16 |
65 | #if LONGSIZE == 8 | ||
66 | or a1, t1 | ||
67 | LONG_SLL t1, a1, 32 | ||
68 | #endif | ||
55 | or a1, t1 | 69 | or a1, t1 |
56 | 1: | 70 | 1: |
57 | 71 | ||
@@ -64,10 +78,10 @@ FEXPORT(__bzero) | |||
64 | PTR_SUBU t0, LONGSIZE /* alignment in bytes */ | 78 | PTR_SUBU t0, LONGSIZE /* alignment in bytes */ |
65 | 79 | ||
66 | #ifdef __MIPSEB__ | 80 | #ifdef __MIPSEB__ |
67 | EX(swl, a1, (a0), first_fixup) /* make word aligned */ | 81 | EX(LONG_S_L, a1, (a0), first_fixup) /* make word/dword aligned */ |
68 | #endif | 82 | #endif |
69 | #ifdef __MIPSEL__ | 83 | #ifdef __MIPSEL__ |
70 | EX(swr, a1, (a0), first_fixup) /* make word aligned */ | 84 | EX(LONG_S_R, a1, (a0), first_fixup) /* make word/dword aligned */ |
71 | #endif | 85 | #endif |
72 | PTR_SUBU a0, t0 /* long align ptr */ | 86 | PTR_SUBU a0, t0 /* long align ptr */ |
73 | PTR_ADDU a2, t0 /* correct size */ | 87 | PTR_ADDU a2, t0 /* correct size */ |
@@ -75,7 +89,7 @@ FEXPORT(__bzero) | |||
75 | 1: ori t1, a2, 0x3f /* # of full blocks */ | 89 | 1: ori t1, a2, 0x3f /* # of full blocks */ |
76 | xori t1, 0x3f | 90 | xori t1, 0x3f |
77 | beqz t1, memset_partial /* no block to fill */ | 91 | beqz t1, memset_partial /* no block to fill */ |
78 | andi t0, a2, 0x3c | 92 | andi t0, a2, 0x40-LONGSIZE |
79 | 93 | ||
80 | PTR_ADDU t1, a0 /* end address */ | 94 | PTR_ADDU t1, a0 /* end address */ |
81 | .set reorder | 95 | .set reorder |
@@ -86,7 +100,14 @@ FEXPORT(__bzero) | |||
86 | 100 | ||
87 | memset_partial: | 101 | memset_partial: |
88 | PTR_LA t1, 2f /* where to start */ | 102 | PTR_LA t1, 2f /* where to start */ |
103 | #if LONGSIZE == 4 | ||
89 | PTR_SUBU t1, t0 | 104 | PTR_SUBU t1, t0 |
105 | #else | ||
106 | .set noat | ||
107 | LONG_SRL AT, t0, 1 /* halve t0 before subtracting it from the jump target */ | ||
108 | PTR_SUBU t1, AT | ||
109 | .set at /* hand AT back to the assembler */ | ||
110 | #endif | ||
90 | jr t1 | 111 | jr t1 |
91 | PTR_ADDU a0, t0 /* dest ptr */ | 112 | PTR_ADDU a0, t0 /* dest ptr */ |
92 | 113 | ||
@@ -100,10 +121,10 @@ memset_partial: | |||
100 | beqz a2, 1f | 121 | beqz a2, 1f |
101 | PTR_ADDU a0, a2 /* What's left */ | 122 | PTR_ADDU a0, a2 /* What's left */ |
102 | #ifdef __MIPSEB__ | 123 | #ifdef __MIPSEB__ |
103 | EX(swr, a1, -1(a0), last_fixup) | 124 | EX(LONG_S_R, a1, -1(a0), last_fixup) |
104 | #endif | 125 | #endif |
105 | #ifdef __MIPSEL__ | 126 | #ifdef __MIPSEL__ |
106 | EX(swl, a1, -1(a0), last_fixup) | 127 | EX(LONG_S_L, a1, -1(a0), last_fixup) |
107 | #endif | 128 | #endif |
108 | 1: jr ra | 129 | 1: jr ra |
109 | move a2, zero | 130 | move a2, zero |