mirror of
https://github.com/opnsense/src.git
synced 2026-04-21 14:17:06 -04:00
Save and restore (also known as suspend and resume) permits a snapshot to be taken of a guest's state that can later be resumed. In the current implementation, bhyve(8) creates a UNIX domain socket that is used by bhyvectl(8) to send a request to save a snapshot (and optionally exit after the snapshot has been taken). A snapshot currently consists of two files: the first holds a copy of guest RAM, and the second file holds other guest state such as vCPU register values and device model state. To resume a guest, bhyve(8) must be started with a matching pair of command line arguments to instantiate the same set of device models as well as a pointer to the saved snapshot. While the current implementation is useful for several uses cases, it has a few limitations. The file format for saving the guest state is tied to the ABI of internal bhyve structures and is not self-describing (in that it does not communicate the set of device models present in the system). In addition, the state saved for some device models closely matches the internal data structures which might prove a challenge for compatibility of snapshot files across a range of bhyve versions. The file format also does not currently support versioning of individual chunks of state. As a result, the current file format is not a fixed binary format and future revisions to save and restore will break binary compatiblity of snapshot files. The goal is to move to a more flexible format that adds versioning, etc. and at that point to commit to providing a reasonable level of compatibility. As a result, the current implementation is not enabled by default. It can be enabled via the WITH_BHYVE_SNAPSHOT=yes option for userland builds, and the kernel option BHYVE_SHAPSHOT. Submitted by: Mihai Tiganus, Flavius Anton, Darius Mihai Submitted by: Elena Mihailescu, Mihai Carabas, Sergiu Weisz Relnotes: yes Sponsored by: University Politehnica of Bucharest Sponsored by: Matthew Grooms (student scholarships) Sponsored by: iXsystems Differential Revision: https://reviews.freebsd.org/D19495
180 lines
4.4 KiB
C
180 lines
4.4 KiB
C
/*-
|
|
* SPDX-License-Identifier: BSD-2-Clause-FreeBSD
|
|
*
|
|
* Copyright (c) 2014, Neel Natu (neel@freebsd.org)
|
|
* All rights reserved.
|
|
*
|
|
* Redistribution and use in source and binary forms, with or without
|
|
* modification, are permitted provided that the following conditions
|
|
* are met:
|
|
* 1. Redistributions of source code must retain the above copyright
|
|
* notice unmodified, this list of conditions, and the following
|
|
* disclaimer.
|
|
* 2. Redistributions in binary form must reproduce the above copyright
|
|
* notice, this list of conditions and the following disclaimer in the
|
|
* documentation and/or other materials provided with the distribution.
|
|
*
|
|
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
|
|
* IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
|
|
* OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
|
|
* IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
|
|
* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
|
|
* NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
|
|
* DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
|
|
* THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
|
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
|
|
* THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
*/
|
|
|
|
#include <sys/cdefs.h>
|
|
__FBSDID("$FreeBSD$");
|
|
|
|
#include "opt_bhyve_snapshot.h"
|
|
|
|
#include <sys/param.h>
|
|
#include <sys/errno.h>
|
|
#include <sys/systm.h>
|
|
|
|
#include <machine/cpufunc.h>
|
|
#include <machine/specialreg.h>
|
|
#include <machine/vmm.h>
|
|
|
|
#include "svm.h"
|
|
#include "vmcb.h"
|
|
#include "svm_softc.h"
|
|
#include "svm_msr.h"
|
|
|
|
#ifndef MSR_AMDK8_IPM
|
|
#define MSR_AMDK8_IPM 0xc0010055
|
|
#endif
|
|
|
|
enum {
|
|
IDX_MSR_LSTAR,
|
|
IDX_MSR_CSTAR,
|
|
IDX_MSR_STAR,
|
|
IDX_MSR_SF_MASK,
|
|
HOST_MSR_NUM /* must be the last enumeration */
|
|
};
|
|
|
|
static uint64_t host_msrs[HOST_MSR_NUM];
|
|
|
|
void
|
|
svm_msr_init(void)
|
|
{
|
|
/*
|
|
* It is safe to cache the values of the following MSRs because they
|
|
* don't change based on curcpu, curproc or curthread.
|
|
*/
|
|
host_msrs[IDX_MSR_LSTAR] = rdmsr(MSR_LSTAR);
|
|
host_msrs[IDX_MSR_CSTAR] = rdmsr(MSR_CSTAR);
|
|
host_msrs[IDX_MSR_STAR] = rdmsr(MSR_STAR);
|
|
host_msrs[IDX_MSR_SF_MASK] = rdmsr(MSR_SF_MASK);
|
|
}
|
|
|
|
void
|
|
svm_msr_guest_init(struct svm_softc *sc, int vcpu)
|
|
{
|
|
/*
|
|
* All the MSRs accessible to the guest are either saved/restored by
|
|
* hardware on every #VMEXIT/VMRUN (e.g., G_PAT) or are saved/restored
|
|
* by VMSAVE/VMLOAD (e.g., MSR_GSBASE).
|
|
*
|
|
* There are no guest MSRs that are saved/restored "by hand" so nothing
|
|
* more to do here.
|
|
*/
|
|
return;
|
|
}
|
|
|
|
void
|
|
svm_msr_guest_enter(struct svm_softc *sc, int vcpu)
|
|
{
|
|
/*
|
|
* Save host MSRs (if any) and restore guest MSRs (if any).
|
|
*/
|
|
}
|
|
|
|
void
|
|
svm_msr_guest_exit(struct svm_softc *sc, int vcpu)
|
|
{
|
|
/*
|
|
* Save guest MSRs (if any) and restore host MSRs.
|
|
*/
|
|
wrmsr(MSR_LSTAR, host_msrs[IDX_MSR_LSTAR]);
|
|
wrmsr(MSR_CSTAR, host_msrs[IDX_MSR_CSTAR]);
|
|
wrmsr(MSR_STAR, host_msrs[IDX_MSR_STAR]);
|
|
wrmsr(MSR_SF_MASK, host_msrs[IDX_MSR_SF_MASK]);
|
|
|
|
/* MSR_KGSBASE will be restored on the way back to userspace */
|
|
}
|
|
|
|
int
|
|
svm_rdmsr(struct svm_softc *sc, int vcpu, u_int num, uint64_t *result,
|
|
bool *retu)
|
|
{
|
|
int error = 0;
|
|
|
|
switch (num) {
|
|
case MSR_MCG_CAP:
|
|
case MSR_MCG_STATUS:
|
|
*result = 0;
|
|
break;
|
|
case MSR_MTRRcap:
|
|
case MSR_MTRRdefType:
|
|
case MSR_MTRR4kBase ... MSR_MTRR4kBase + 8:
|
|
case MSR_MTRR16kBase ... MSR_MTRR16kBase + 1:
|
|
case MSR_MTRR64kBase:
|
|
case MSR_SYSCFG:
|
|
case MSR_AMDK8_IPM:
|
|
case MSR_EXTFEATURES:
|
|
*result = 0;
|
|
break;
|
|
default:
|
|
error = EINVAL;
|
|
break;
|
|
}
|
|
|
|
return (error);
|
|
}
|
|
|
|
int
|
|
svm_wrmsr(struct svm_softc *sc, int vcpu, u_int num, uint64_t val, bool *retu)
|
|
{
|
|
int error = 0;
|
|
|
|
switch (num) {
|
|
case MSR_MCG_CAP:
|
|
case MSR_MCG_STATUS:
|
|
break; /* ignore writes */
|
|
case MSR_MTRRcap:
|
|
vm_inject_gp(sc->vm, vcpu);
|
|
break;
|
|
case MSR_MTRRdefType:
|
|
case MSR_MTRR4kBase ... MSR_MTRR4kBase + 8:
|
|
case MSR_MTRR16kBase ... MSR_MTRR16kBase + 1:
|
|
case MSR_MTRR64kBase:
|
|
case MSR_SYSCFG:
|
|
break; /* Ignore writes */
|
|
case MSR_AMDK8_IPM:
|
|
/*
|
|
* Ignore writes to the "Interrupt Pending Message" MSR.
|
|
*/
|
|
break;
|
|
case MSR_K8_UCODE_UPDATE:
|
|
/*
|
|
* Ignore writes to microcode update register.
|
|
*/
|
|
break;
|
|
#ifdef BHYVE_SNAPSHOT
|
|
case MSR_TSC:
|
|
error = svm_set_tsc_offset(sc, vcpu, val - rdtsc());
|
|
break;
|
|
#endif
|
|
case MSR_EXTFEATURES:
|
|
break;
|
|
default:
|
|
error = EINVAL;
|
|
break;
|
|
}
|
|
|
|
return (error);
|
|
}
|