Skip to content

Commit 8bb2610

Browse files
amlutoKAGA-KOKO
authored andcommitted
x86/entry/64/compat: Preserve r8-r11 in int $0x80
32-bit user code that uses int $80 doesn't care about r8-r11. There is, however, some 64-bit user code that intentionally uses int $0x80 to invoke 32-bit system calls. From what I've seen, basically all such code assumes that r8-r15 are all preserved, but the kernel clobbers r8-r11. Since I doubt that there's any code that depends on int $0x80 zeroing r8-r11, change the kernel to preserve them. I suspect that very little user code is broken by the old clobber, since r8-r11 are only rarely allocated by gcc, and they're clobbered by function calls, so they only way we'd see a problem is if the same function that invokes int $0x80 also spills something important to one of these registers. The current behavior seems to date back to the historical commit "[PATCH] x86-64 merge for 2.6.4". Before that, all regs were preserved. I can't find any explanation of why this change was made. Update the test_syscall_vdso_32 testcase as well to verify the new behavior, and it strengthens the test to make sure that the kernel doesn't accidentally permute r8..r15. Suggested-by: Denys Vlasenko <[email protected]> Signed-off-by: Andy Lutomirski <[email protected]> Signed-off-by: Thomas Gleixner <[email protected]> Cc: Borislav Petkov <[email protected]> Cc: Dominik Brodowski <[email protected]> Link: https://lkml.kernel.org/r/d4c4d9985fbe64f8c9e19291886453914b48caee.1523975710.git.luto@kernel.org
1 parent 316d097 commit 8bb2610

File tree

2 files changed

+25
-18
lines changed

2 files changed

+25
-18
lines changed

arch/x86/entry/entry_64_compat.S

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -84,13 +84,13 @@ ENTRY(entry_SYSENTER_compat)
8484
pushq %rdx /* pt_regs->dx */
8585
pushq %rcx /* pt_regs->cx */
8686
pushq $-ENOSYS /* pt_regs->ax */
87-
pushq $0 /* pt_regs->r8 = 0 */
87+
pushq %r8 /* pt_regs->r8 */
8888
xorl %r8d, %r8d /* nospec r8 */
89-
pushq $0 /* pt_regs->r9 = 0 */
89+
pushq %r9 /* pt_regs->r9 */
9090
xorl %r9d, %r9d /* nospec r9 */
91-
pushq $0 /* pt_regs->r10 = 0 */
91+
pushq %r10 /* pt_regs->r10 */
9292
xorl %r10d, %r10d /* nospec r10 */
93-
pushq $0 /* pt_regs->r11 = 0 */
93+
pushq %r11 /* pt_regs->r11 */
9494
xorl %r11d, %r11d /* nospec r11 */
9595
pushq %rbx /* pt_regs->rbx */
9696
xorl %ebx, %ebx /* nospec rbx */

tools/testing/selftests/x86/test_syscall_vdso.c

Lines changed: 21 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -100,12 +100,19 @@ asm (
100100
" shl $32, %r8\n"
101101
" orq $0x7f7f7f7f, %r8\n"
102102
" movq %r8, %r9\n"
103-
" movq %r8, %r10\n"
104-
" movq %r8, %r11\n"
105-
" movq %r8, %r12\n"
106-
" movq %r8, %r13\n"
107-
" movq %r8, %r14\n"
108-
" movq %r8, %r15\n"
103+
" incq %r9\n"
104+
" movq %r9, %r10\n"
105+
" incq %r10\n"
106+
" movq %r10, %r11\n"
107+
" incq %r11\n"
108+
" movq %r11, %r12\n"
109+
" incq %r12\n"
110+
" movq %r12, %r13\n"
111+
" incq %r13\n"
112+
" movq %r13, %r14\n"
113+
" incq %r14\n"
114+
" movq %r14, %r15\n"
115+
" incq %r15\n"
109116
" ret\n"
110117
" .code32\n"
111118
" .popsection\n"
@@ -128,12 +135,13 @@ int check_regs64(void)
128135
int err = 0;
129136
int num = 8;
130137
uint64_t *r64 = &regs64.r8;
138+
uint64_t expected = 0x7f7f7f7f7f7f7f7fULL;
131139

132140
if (!kernel_is_64bit)
133141
return 0;
134142

135143
do {
136-
if (*r64 == 0x7f7f7f7f7f7f7f7fULL)
144+
if (*r64 == expected++)
137145
continue; /* register did not change */
138146
if (syscall_addr != (long)&int80) {
139147
/*
@@ -147,18 +155,17 @@ int check_regs64(void)
147155
continue;
148156
}
149157
} else {
150-
/* INT80 syscall entrypoint can be used by
158+
/*
159+
* INT80 syscall entrypoint can be used by
151160
* 64-bit programs too, unlike SYSCALL/SYSENTER.
152161
* Therefore it must preserve R12+
153162
* (they are callee-saved registers in 64-bit C ABI).
154163
*
155-
* This was probably historically not intended,
156-
* but R8..11 are clobbered (cleared to 0).
157-
* IOW: they are the only registers which aren't
158-
* preserved across INT80 syscall.
164+
* Starting in Linux 4.17 (and any kernel that
165+
* backports the change), R8..11 are preserved.
166+
* Historically (and probably unintentionally), they
167+
* were clobbered or zeroed.
159168
*/
160-
if (*r64 == 0 && num <= 11)
161-
continue;
162169
}
163170
printf("[FAIL]\tR%d has changed:%016llx\n", num, *r64);
164171
err++;

0 commit comments

Comments
 (0)