2 * 32-bit syscall ABI conformance test.
4 * Copyright (c) 2015 Denys Vlasenko
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms and conditions of the GNU General Public License,
8 * version 2, as published by the Free Software Foundation.
10 * This program is distributed in the hope it will be useful, but
11 * WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 * General Public License for more details.
16 * Can be built statically:
17 * gcc -Os -Wall -static -m32 test_syscall_vdso.c thunks_32.S
28 #include <sys/types.h>
29 #include <sys/select.h>
32 #include <sys/ptrace.h>
35 #if !defined(__i386__)
36 int main(int argc, char **argv, char **envp)
38 printf("[SKIP]\tNot a 32-bit x86 userspace\n");
44 long get_syscall(char **envp)
47 while (*envp++ != NULL)
49 for (auxv = (void *)envp; auxv->a_type != AT_NULL; auxv++)
50 if (auxv->a_type == AT_SYSINFO)
51 return auxv->a_un.a_val;
52 printf("[WARN]\tAT_SYSINFO not supplied\n");
57 " .pushsection .text\n"
67 uint64_t rax, rbx, rcx, rdx;
68 uint64_t rsi, rdi, rbp, rsp;
69 uint64_t r8, r9, r10, r11;
70 uint64_t r12, r13, r14, r15;
76 " .pushsection .text\n"
80 " mov $regs64, %eax\n"
82 " movq %rbx, 1*8(%rax)\n"
83 " movq %rcx, 2*8(%rax)\n"
84 " movq %rdx, 3*8(%rax)\n"
85 " movq %rsi, 4*8(%rax)\n"
86 " movq %rdi, 5*8(%rax)\n"
87 " movq %rbp, 6*8(%rax)\n"
88 " movq %rsp, 7*8(%rax)\n"
89 " movq %r8, 8*8(%rax)\n"
90 " movq %r9, 9*8(%rax)\n"
91 " movq %r10, 10*8(%rax)\n"
92 " movq %r11, 11*8(%rax)\n"
93 " movq %r12, 12*8(%rax)\n"
94 " movq %r13, 13*8(%rax)\n"
95 " movq %r14, 14*8(%rax)\n"
96 " movq %r15, 15*8(%rax)\n"
99 " movq $0x7f7f7f7f, %r8\n"
101 " orq $0x7f7f7f7f, %r8\n"
120 extern void get_regs64(void);
121 extern void poison_regs64(void);
122 extern unsigned long call64_from_32(void (*function)(void));
123 void print_regs64(void)
125 if (!kernel_is_64bit)
127 printf("ax:%016llx bx:%016llx cx:%016llx dx:%016llx\n", regs64.rax, regs64.rbx, regs64.rcx, regs64.rdx);
128 printf("si:%016llx di:%016llx bp:%016llx sp:%016llx\n", regs64.rsi, regs64.rdi, regs64.rbp, regs64.rsp);
129 printf(" 8:%016llx 9:%016llx 10:%016llx 11:%016llx\n", regs64.r8 , regs64.r9 , regs64.r10, regs64.r11);
130 printf("12:%016llx 13:%016llx 14:%016llx 15:%016llx\n", regs64.r12, regs64.r13, regs64.r14, regs64.r15);
133 int check_regs64(void)
137 uint64_t *r64 = &regs64.r8;
138 uint64_t expected = 0x7f7f7f7f7f7f7f7fULL;
140 if (!kernel_is_64bit)
144 if (*r64 == expected++)
145 continue; /* register did not change */
146 if (syscall_addr != (long)&int80) {
148 * Non-INT80 syscall entrypoints are allowed to clobber R8+ regs:
149 * either clear them to 0, or for R11, load EFLAGS.
154 printf("[NOTE]\tR11 has changed:%016llx - assuming clobbered by SYSRET insn\n", *r64);
159 * INT80 syscall entrypoint can be used by
160 * 64-bit programs too, unlike SYSCALL/SYSENTER.
161 * Therefore it must preserve R12+
162 * (they are callee-saved registers in 64-bit C ABI).
164 * Starting in Linux 4.17 (and any kernel that
165 * backports the change), R8..11 are preserved.
166 * Historically (and probably unintentionally), they
167 * were clobbered or zeroed.
170 printf("[FAIL]\tR%d has changed:%016llx\n", num, *r64);
172 } while (r64++, ++num < 16);
175 printf("[OK]\tR8..R15 did not leak kernel data\n");
183 struct timespec timeout;
200 timeout.tv_nsec = 123;
201 sigemptyset(&sigmask);
202 sigaddset(&sigmask, SIGINT);
203 sigaddset(&sigmask, SIGUSR2);
204 sigaddset(&sigmask, SIGRTMAX);
205 sigmask_desc.sp = &sigmask;
206 sigmask_desc.sz = 8; /* bytes */
209 static void print_flags(const char *name, unsigned long r)
211 static const char *bitarray[] = {
212 "\n" ,"c\n" ,/* Carry Flag */
213 "0 " ,"1 " ,/* Bit 1 - always on */
214 "" ,"p " ,/* Parity Flag */
216 "" ,"a " ,/* Auxiliary carry Flag */
218 "" ,"z " ,/* Zero Flag */
219 "" ,"s " ,/* Sign Flag */
220 "" ,"t " ,/* Trap Flag */
221 "" ,"i " ,/* Interrupt Flag */
222 "" ,"d " ,/* Direction Flag */
223 "" ,"o " ,/* Overflow Flag */
224 "0 " ,"1 " ,/* I/O Privilege Level (2 bits) */
225 "0" ,"1" ,/* I/O Privilege Level (2 bits) */
226 "" ,"n " ,/* Nested Task */
228 "" ,"r " ,/* Resume Flag */
229 "" ,"v " ,/* Virtual Mode */
230 "" ,"ac " ,/* Alignment Check/Access Control */
231 "" ,"vif ",/* Virtual Interrupt Flag */
232 "" ,"vip ",/* Virtual Interrupt Pending */
233 "" ,"id " ,/* CPUID detection */
239 printf("%s=%016lx ", name, r);
240 bitstr = bitarray + 42;
243 printf("(extra bits are set) ");
245 if (bitstr[(r >> bit) & 1][0])
246 fputs(bitstr[(r >> bit) & 1], stdout);
252 int run_syscall(void)
259 call64_from_32(poison_regs64);
263 /* Try 6-arg syscall: pselect. It should return quickly */
265 " mov $308, %%eax\n" /* PSELECT */
266 " mov nfds, %%ebx\n" /* ebx arg1 */
267 " mov $rfds, %%ecx\n" /* ecx arg2 */
268 " mov $wfds, %%edx\n" /* edx arg3 */
269 " mov $efds, %%esi\n" /* esi arg4 */
270 " mov $timeout, %%edi\n" /* edi arg5 */
271 " mov $sigmask_desc, %%ebp\n" /* %ebp arg6 */
272 " push $0x200ed7\n" /* set almost all flags */
273 " popf\n" /* except TF, IOPL, NT, RF, VM, AC, VIF, VIP */
274 " call *syscall_addr\n"
275 /* Check that registers are not clobbered */
279 " cmp nfds, %%ebx\n" /* ebx arg1 */
282 " cmp $rfds, %%ecx\n" /* ecx arg2 */
285 " cmp $wfds, %%edx\n" /* edx arg3 */
288 " cmp $efds, %%esi\n" /* esi arg4 */
291 " cmp $timeout, %%edi\n" /* edi arg5 */
294 " cmpl $sigmask_desc, %%ebp\n" /* %ebp arg6 */
300 : "=a" (flags), "=b" (bad_arg)
302 : "cx", "dx", "si", "di"
305 if (kernel_is_64bit) {
306 memset(&regs64, 0x77, sizeof(regs64));
307 call64_from_32(get_regs64);
312 * On paravirt kernels, flags are not preserved across syscalls.
313 * Thus, we do not consider it a bug if some are changed.
314 * We just show ones which do.
316 if ((0x200ed7 ^ flags) != 0) {
317 print_flags("[WARN]\tFlags before", 0x200ed7);
318 print_flags("[WARN]\tFlags after", flags);
319 print_flags("[WARN]\tFlags change", (0x200ed7 ^ flags));
323 printf("[FAIL]\targ#%ld clobbered\n", bad_arg);
326 printf("[OK]\tArguments are preserved across syscall\n");
328 return check_regs64();
331 int run_syscall_twice()
337 printf("[RUN]\tExecuting 6-argument 32-bit syscall via VDSO\n");
338 exitcode = run_syscall();
341 syscall_addr = (long)&int80;
342 printf("[RUN]\tExecuting 6-argument 32-bit syscall via INT 80\n");
343 exitcode += run_syscall();
358 if (ptrace(PTRACE_TRACEME, 0L, 0L, 0L) != 0)
364 printf("[RUN]\tRunning tests under ptrace\n");
367 pid = waitpid(-1, &status, __WALL);
368 if (WIFEXITED(status))
369 exit(WEXITSTATUS(status));
370 if (WIFSIGNALED(status))
371 exit(WTERMSIG(status));
372 if (pid <= 0 || !WIFSTOPPED(status)) /* paranoia */
375 * Note: we do not inject sig = WSTOPSIG(status).
376 * We probably should, but careful: do not inject SIGTRAP
377 * generated by syscall entry/exit stops.
378 * That kills the child.
380 ptrace(PTRACE_SYSCALL, pid, 0L, 0L /*sig*/);
384 int main(int argc, char **argv, char **envp)
390 " movl %%cs, %%eax\n"
393 kernel_is_64bit = (cs == 0x23);
394 if (!kernel_is_64bit)
395 printf("[NOTE]\tNot a 64-bit kernel, won't test R8..R15 leaks\n");
397 /* This only works for non-static builds:
398 * syscall_addr = dlsym(dlopen("linux-gate.so.1", RTLD_NOW), "__kernel_vsyscall");
400 syscall_addr = get_syscall(envp);
402 exitcode += run_syscall_twice();
404 exitcode += run_syscall_twice();