diff options
author | Andy Lutomirski <luto@kernel.org> | 2018-04-17 10:36:36 -0400 |
---|---|---|
committer | Thomas Gleixner <tglx@linutronix.de> | 2018-04-27 11:07:58 -0400 |
commit | 8bb2610bc4967f19672444a7b0407367f1540028 (patch) | |
tree | c0d0fec57aa9866fad60d843fa32f6b84d5c9ed8 /tools | |
parent | 316d097c4cd4e7f2ef50c40cff2db266593c4ec4 (diff) |
x86/entry/64/compat: Preserve r8-r11 in int $0x80
32-bit user code that uses int $80 doesn't care about r8-r11. There is,
however, some 64-bit user code that intentionally uses int $0x80 to invoke
32-bit system calls. From what I've seen, basically all such code assumes
that r8-r15 are all preserved, but the kernel clobbers r8-r11. Since I
doubt that there's any code that depends on int $0x80 zeroing r8-r11,
change the kernel to preserve them.
I suspect that very little user code is broken by the old clobber, since
r8-r11 are only rarely allocated by gcc, and they're clobbered by function
calls, so they only way we'd see a problem is if the same function that
invokes int $0x80 also spills something important to one of these
registers.
The current behavior seems to date back to the historical commit
"[PATCH] x86-64 merge for 2.6.4". Before that, all regs were
preserved. I can't find any explanation of why this change was made.
Update the test_syscall_vdso_32 testcase as well to verify the new
behavior, and it strengthens the test to make sure that the kernel doesn't
accidentally permute r8..r15.
Suggested-by: Denys Vlasenko <dvlasenk@redhat.com>
Signed-off-by: Andy Lutomirski <luto@kernel.org>
Signed-off-by: Thomas Gleixner <tglx@linutronix.de>
Cc: Borislav Petkov <bp@alien8.de>
Cc: Dominik Brodowski <linux@dominikbrodowski.net>
Link: https://lkml.kernel.org/r/d4c4d9985fbe64f8c9e19291886453914b48caee.1523975710.git.luto@kernel.org
Diffstat (limited to 'tools')
-rw-r--r-- | tools/testing/selftests/x86/test_syscall_vdso.c | 35 |
1 files changed, 21 insertions, 14 deletions
diff --git a/tools/testing/selftests/x86/test_syscall_vdso.c b/tools/testing/selftests/x86/test_syscall_vdso.c index 40370354d4c1..c9c3281077bc 100644 --- a/tools/testing/selftests/x86/test_syscall_vdso.c +++ b/tools/testing/selftests/x86/test_syscall_vdso.c | |||
@@ -100,12 +100,19 @@ asm ( | |||
100 | " shl $32, %r8\n" | 100 | " shl $32, %r8\n" |
101 | " orq $0x7f7f7f7f, %r8\n" | 101 | " orq $0x7f7f7f7f, %r8\n" |
102 | " movq %r8, %r9\n" | 102 | " movq %r8, %r9\n" |
103 | " movq %r8, %r10\n" | 103 | " incq %r9\n" |
104 | " movq %r8, %r11\n" | 104 | " movq %r9, %r10\n" |
105 | " movq %r8, %r12\n" | 105 | " incq %r10\n" |
106 | " movq %r8, %r13\n" | 106 | " movq %r10, %r11\n" |
107 | " movq %r8, %r14\n" | 107 | " incq %r11\n" |
108 | " movq %r8, %r15\n" | 108 | " movq %r11, %r12\n" |
109 | " incq %r12\n" | ||
110 | " movq %r12, %r13\n" | ||
111 | " incq %r13\n" | ||
112 | " movq %r13, %r14\n" | ||
113 | " incq %r14\n" | ||
114 | " movq %r14, %r15\n" | ||
115 | " incq %r15\n" | ||
109 | " ret\n" | 116 | " ret\n" |
110 | " .code32\n" | 117 | " .code32\n" |
111 | " .popsection\n" | 118 | " .popsection\n" |
@@ -128,12 +135,13 @@ int check_regs64(void) | |||
128 | int err = 0; | 135 | int err = 0; |
129 | int num = 8; | 136 | int num = 8; |
130 | uint64_t *r64 = ®s64.r8; | 137 | uint64_t *r64 = ®s64.r8; |
138 | uint64_t expected = 0x7f7f7f7f7f7f7f7fULL; | ||
131 | 139 | ||
132 | if (!kernel_is_64bit) | 140 | if (!kernel_is_64bit) |
133 | return 0; | 141 | return 0; |
134 | 142 | ||
135 | do { | 143 | do { |
136 | if (*r64 == 0x7f7f7f7f7f7f7f7fULL) | 144 | if (*r64 == expected++) |
137 | continue; /* register did not change */ | 145 | continue; /* register did not change */ |
138 | if (syscall_addr != (long)&int80) { | 146 | if (syscall_addr != (long)&int80) { |
139 | /* | 147 | /* |
@@ -147,18 +155,17 @@ int check_regs64(void) | |||
147 | continue; | 155 | continue; |
148 | } | 156 | } |
149 | } else { | 157 | } else { |
150 | /* INT80 syscall entrypoint can be used by | 158 | /* |
159 | * INT80 syscall entrypoint can be used by | ||
151 | * 64-bit programs too, unlike SYSCALL/SYSENTER. | 160 | * 64-bit programs too, unlike SYSCALL/SYSENTER. |
152 | * Therefore it must preserve R12+ | 161 | * Therefore it must preserve R12+ |
153 | * (they are callee-saved registers in 64-bit C ABI). | 162 | * (they are callee-saved registers in 64-bit C ABI). |
154 | * | 163 | * |
155 | * This was probably historically not intended, | 164 | * Starting in Linux 4.17 (and any kernel that |
156 | * but R8..11 are clobbered (cleared to 0). | 165 | * backports the change), R8..11 are preserved. |
157 | * IOW: they are the only registers which aren't | 166 | * Historically (and probably unintentionally), they |
158 | * preserved across INT80 syscall. | 167 | * were clobbered or zeroed. |
159 | */ | 168 | */ |
160 | if (*r64 == 0 && num <= 11) | ||
161 | continue; | ||
162 | } | 169 | } |
163 | printf("[FAIL]\tR%d has changed:%016llx\n", num, *r64); | 170 | printf("[FAIL]\tR%d has changed:%016llx\n", num, *r64); |
164 | err++; | 171 | err++; |