Make the machdep.svs_enabled sysctl writable, and add the kernel code

needed to disable SVS at runtime.

We set 'svs_enabled' to false, and hotpatch the kernel entry/exit points
to eliminate the context switch code.

We need to make sure there is no remote CPU that is executing the code we
are hotpatching. So we use two barriers:

 * After the first one each CPU is guaranteed to be executing in
   svs_disable_cpu with interrupts disabled (this way it can't leave this
   place).

 * After the second one it is guaranteed that SVS is disabled, so we flush
   the cache, enable interrupts and continue execution normally.

Between the two barriers, cpu0 will disable SVS (svs_enabled=false and
hotpatch), and each CPU will restore the generic syscall entry point.

Three notes:

 * We should call svs_pgg_update(true) afterwards, to put back PG_G on
   the kernel pages (for better performance). This will be done in another
   commit.

 * The fact that we disable interrupts does not prevent us from receiving
   an NMI, and it would be problematic. So we need to add some code to
   verify that PMCs are disabled before hotpatching. This will be done
   in another commit.

 * In svs_disable() we expect each CPU to be online. We need to add a
   check to make sure they indeed are.

The sysctl allows only a 1->0 transition. There is no point in doing 0->1
transitions anyway, and it would be complicated to implement because we
need to re-synchronize the CPU user page tables with the current ones (we
lost track of them in the last 1->0 transition).
This commit is contained in:
maxv 2018-02-22 10:42:10 +00:00
parent f929364d1e
commit 5ab8a4e764
4 changed files with 176 additions and 24 deletions

View File

@ -1,4 +1,4 @@
/* $NetBSD: locore.S,v 1.152 2018/02/22 08:56:51 maxv Exp $ */
/* $NetBSD: locore.S,v 1.153 2018/02/22 10:42:10 maxv Exp $ */
/*
* Copyright-o-rama!
@ -1591,14 +1591,14 @@ END(intrfastexit)
TEXT_USER_END
#ifdef SVS
.globl svs_enter
.globl svs_enter_end
.globl svs_enter_altstack
.globl svs_enter_altstack_end
.globl svs_leave
.globl svs_leave_end
.globl svs_leave_altstack
.globl svs_leave_altstack_end
.globl svs_enter, svs_enter_end
.globl svs_enter_altstack, svs_enter_altstack_end
.globl svs_leave, svs_leave_end
.globl svs_leave_altstack, svs_leave_altstack_end
.globl nosvs_enter, nosvs_enter_end
.globl nosvs_enter_altstack, nosvs_enter_altstack_end
.globl nosvs_leave, nosvs_leave_end
.globl nosvs_leave_altstack, nosvs_leave_altstack_end
LABEL(svs_enter)
movq SVS_UTLS+UTLS_KPDIRPA,%rax
@ -1630,4 +1630,20 @@ LABEL(svs_leave_altstack)
movq %rax,%cr3
1234:
LABEL(svs_leave_altstack_end)
LABEL(nosvs_enter)
NOSVS_ENTER
LABEL(nosvs_enter_end)
LABEL(nosvs_enter_altstack)
NOSVS_ENTER_ALTSTACK
LABEL(nosvs_enter_altstack_end)
LABEL(nosvs_leave)
NOSVS_LEAVE
LABEL(nosvs_leave_end)
LABEL(nosvs_leave_altstack)
NOSVS_LEAVE_ALTSTACK
LABEL(nosvs_leave_altstack_end)
#endif

View File

@ -1,4 +1,4 @@
/* $NetBSD: frameasm.h,v 1.35 2018/02/22 08:56:51 maxv Exp $ */
/* $NetBSD: frameasm.h,v 1.36 2018/02/22 10:42:11 maxv Exp $ */
#ifndef _AMD64_MACHINE_FRAMEASM_H
#define _AMD64_MACHINE_FRAMEASM_H
@ -112,28 +112,36 @@
#define UTLS_RSP0 16
#define SVS_ENTER_BYTES 22
#define SVS_ENTER \
HOTPATCH(HP_NAME_SVS_ENTER, SVS_ENTER_BYTES) ; \
#define NOSVS_ENTER \
.byte 0xEB, (SVS_ENTER_BYTES-2) /* jmp */ ; \
.fill (SVS_ENTER_BYTES-2),1,0xCC
#define SVS_ENTER \
HOTPATCH(HP_NAME_SVS_ENTER, SVS_ENTER_BYTES) ; \
NOSVS_ENTER
#define SVS_LEAVE_BYTES 31
#define SVS_LEAVE \
HOTPATCH(HP_NAME_SVS_LEAVE, SVS_LEAVE_BYTES) ; \
#define NOSVS_LEAVE \
.byte 0xEB, (SVS_LEAVE_BYTES-2) /* jmp */ ; \
.fill (SVS_LEAVE_BYTES-2),1,0xCC
#define SVS_LEAVE \
HOTPATCH(HP_NAME_SVS_LEAVE, SVS_LEAVE_BYTES) ; \
NOSVS_LEAVE
#define SVS_ENTER_ALT_BYTES 23
#define SVS_ENTER_ALTSTACK \
HOTPATCH(HP_NAME_SVS_ENTER_ALT, SVS_ENTER_ALT_BYTES) ; \
#define NOSVS_ENTER_ALTSTACK \
.byte 0xEB, (SVS_ENTER_ALT_BYTES-2) /* jmp */ ; \
.fill (SVS_ENTER_ALT_BYTES-2),1,0xCC
#define SVS_ENTER_ALTSTACK \
HOTPATCH(HP_NAME_SVS_ENTER_ALT, SVS_ENTER_ALT_BYTES) ; \
NOSVS_ENTER_ALTSTACK
#define SVS_LEAVE_ALT_BYTES 22
#define SVS_LEAVE_ALTSTACK \
HOTPATCH(HP_NAME_SVS_LEAVE_ALT, SVS_LEAVE_ALT_BYTES) ; \
#define NOSVS_LEAVE_ALTSTACK \
.byte 0xEB, (SVS_LEAVE_ALT_BYTES-2) /* jmp */ ; \
.fill (SVS_LEAVE_ALT_BYTES-2),1,0xCC
#define SVS_LEAVE_ALTSTACK \
HOTPATCH(HP_NAME_SVS_LEAVE_ALT, SVS_LEAVE_ALT_BYTES) ; \
NOSVS_LEAVE_ALTSTACK
#else
#define SVS_ENTER /* nothing */

View File

@ -1,4 +1,4 @@
/* $NetBSD: svs.c,v 1.5 2018/02/22 09:41:06 maxv Exp $ */
/* $NetBSD: svs.c,v 1.6 2018/02/22 10:42:11 maxv Exp $ */
/*
* Copyright (c) 2018 The NetBSD Foundation, Inc.
@ -30,7 +30,7 @@
*/
#include <sys/cdefs.h>
__KERNEL_RCSID(0, "$NetBSD: svs.c,v 1.5 2018/02/22 09:41:06 maxv Exp $");
__KERNEL_RCSID(0, "$NetBSD: svs.c,v 1.6 2018/02/22 10:42:11 maxv Exp $");
#include "opt_svs.h"
@ -38,6 +38,8 @@ __KERNEL_RCSID(0, "$NetBSD: svs.c,v 1.5 2018/02/22 09:41:06 maxv Exp $");
#include <sys/systm.h>
#include <sys/proc.h>
#include <sys/cpu.h>
#include <sys/sysctl.h>
#include <sys/xcall.h>
#include <x86/cputypes.h>
#include <machine/cpuvar.h>
@ -541,6 +543,131 @@ svs_enable(void)
x86_patch_window_close(psl, cr0);
}
static void
svs_disable_hotpatch(void)
{
extern uint8_t nosvs_enter, nosvs_enter_end;
extern uint8_t nosvs_enter_altstack, nosvs_enter_altstack_end;
extern uint8_t nosvs_leave, nosvs_leave_end;
extern uint8_t nosvs_leave_altstack, nosvs_leave_altstack_end;
u_long psl, cr0;
uint8_t *bytes;
size_t size;
x86_patch_window_open(&psl, &cr0);
bytes = &nosvs_enter;
size = (size_t)&nosvs_enter_end - (size_t)&nosvs_enter;
x86_hotpatch(HP_NAME_SVS_ENTER, bytes, size);
bytes = &nosvs_enter_altstack;
size = (size_t)&nosvs_enter_altstack_end -
(size_t)&nosvs_enter_altstack;
x86_hotpatch(HP_NAME_SVS_ENTER_ALT, bytes, size);
bytes = &nosvs_leave;
size = (size_t)&nosvs_leave_end - (size_t)&nosvs_leave;
x86_hotpatch(HP_NAME_SVS_LEAVE, bytes, size);
bytes = &nosvs_leave_altstack;
size = (size_t)&nosvs_leave_altstack_end -
(size_t)&nosvs_leave_altstack;
x86_hotpatch(HP_NAME_SVS_LEAVE_ALT, bytes, size);
x86_patch_window_close(psl, cr0);
}
static volatile unsigned long svs_cpu_barrier1 __cacheline_aligned;
static volatile unsigned long svs_cpu_barrier2 __cacheline_aligned;
typedef void (vector)(void);
static void
svs_disable_cpu(void *arg1, void *arg2)
{
struct cpu_info *ci = curcpu();
extern vector Xsyscall;
u_long psl;
psl = x86_read_psl();
atomic_dec_ulong(&svs_cpu_barrier1);
while (atomic_cas_ulong(&svs_cpu_barrier1, 0, 0) != 0) {
x86_pause();
}
/* cpu0 is the one that does the hotpatch job */
if (ci == &cpu_info_primary) {
svs_enabled = false;
svs_disable_hotpatch();
}
/* put back the non-SVS syscall entry point */
wrmsr(MSR_LSTAR, (uint64_t)Xsyscall);
atomic_dec_ulong(&svs_cpu_barrier2);
while (atomic_cas_ulong(&svs_cpu_barrier2, 0, 0) != 0) {
x86_pause();
}
/* Write back and invalidate cache, flush pipelines. */
wbinvd();
x86_flush();
x86_write_psl(psl);
}
static void
svs_disable(void)
{
uint64_t xc;
/*
* We expect all the CPUs to be online. XXX ensure they are.
*/
svs_cpu_barrier1 = ncpu;
svs_cpu_barrier2 = ncpu;
printf("[+] Disabling SVS\n");
xc = xc_broadcast(0, svs_disable_cpu, NULL, NULL);
xc_wait(xc);
/*
* XXX printf("[+] Installing PG_G\n");
* XXX svs_pgg_update(true);
*/
printf("[+] Done\n");
}
int sysctl_machdep_svs_enabled(SYSCTLFN_ARGS);
int
sysctl_machdep_svs_enabled(SYSCTLFN_ARGS)
{
struct sysctlnode node;
int error, val;
val = *(int *)rnode->sysctl_data;
node = *rnode;
node.sysctl_data = &val;
error = sysctl_lookup(SYSCTLFN_CALL(&node));
if (error != 0 || newp == NULL)
return error;
if (val == 1) {
error = EINVAL;
} else {
if (svs_enabled) {
svs_disable();
}
error = 0;
}
return error;
}
void
svs_init(bool early)
{

View File

@ -1,4 +1,4 @@
/* $NetBSD: x86_machdep.c,v 1.105 2018/02/22 09:41:06 maxv Exp $ */
/* $NetBSD: x86_machdep.c,v 1.106 2018/02/22 10:42:11 maxv Exp $ */
/*-
* Copyright (c) 2002, 2006, 2007 YAMAMOTO Takashi,
@ -31,7 +31,7 @@
*/
#include <sys/cdefs.h>
__KERNEL_RCSID(0, "$NetBSD: x86_machdep.c,v 1.105 2018/02/22 09:41:06 maxv Exp $");
__KERNEL_RCSID(0, "$NetBSD: x86_machdep.c,v 1.106 2018/02/22 10:42:11 maxv Exp $");
#include "opt_modular.h"
#include "opt_physmem.h"
@ -1259,11 +1259,12 @@ SYSCTL_SETUP(sysctl_machdep_setup, "sysctl machdep subtree setup")
CTL_MACHDEP, CTL_CREATE, CTL_EOL);
#endif
#ifdef SVS
int sysctl_machdep_svs_enabled(SYSCTLFN_ARGS);
sysctl_createv(clog, 0, NULL, NULL,
CTLFLAG_PERMANENT,
CTLFLAG_READWRITE,
CTLTYPE_BOOL, "svs_enabled",
SYSCTL_DESCR("Whether the kernel uses SVS"),
NULL, 0, &svs_enabled, 0,
sysctl_machdep_svs_enabled, 0, &svs_enabled, 0,
CTL_MACHDEP, CTL_CREATE, CTL_EOL);
#endif