cloud-hypervisor/vmm/src/cpu.rs

// Copyright © 2020, Oracle and/or its affiliates.
//
// Copyright 2018 Amazon.com, Inc. or its affiliates. All Rights Reserved.
//
// Portions Copyright 2017 The Chromium OS Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE-BSD-3-Clause file.
//
// Copyright © 2019 Intel Corporation
//
// SPDX-License-Identifier: Apache-2.0 AND BSD-3-Clause
//

#[cfg(target_arch = "x86_64")]
use crate::config::CpuTopology;
use crate::config::CpusConfig;
use crate::device_manager::DeviceManager;
use crate::memory_manager::MemoryManager;
use crate::seccomp_filters::{get_seccomp_filter, Thread};
use crate::vm::physical_bits;
use crate::CPU_MANAGER_SNAPSHOT_ID;
#[cfg(feature = "acpi")]
use acpi_tables::{aml, aml::Aml, sdt::SDT};
use anyhow::anyhow;
#[cfg(feature = "acpi")]
use arch::layout;
#[cfg(target_arch = "x86_64")]
use arch::x86_64::SgxEpcSection;
#[cfg(target_arch = "x86_64")]
use arch::CpuidPatch;
use arch::EntryPoint;
use devices::interrupt_controller::InterruptController;
#[cfg(target_arch = "aarch64")]
use hypervisor::kvm::kvm_bindings;
#[cfg(target_arch = "x86_64")]
use hypervisor::CpuId;
use hypervisor::{vm::VmmOps, CpuState, HypervisorCpuError, VmExit};
use libc::{c_void, siginfo_t};
use seccomp::{SeccompAction, SeccompFilter};
use std::os::unix::thread::JoinHandleExt;
use std::sync::atomic::{AtomicBool, Ordering};
use std::sync::{Arc, Barrier, Mutex};
use std::{cmp, io, result, thread};
use vm_device::BusDevice;
#[cfg(target_arch = "x86_64")]
use vm_memory::GuestAddress;
use vm_memory::{GuestMemoryAtomic, GuestMemoryMmap};
use vm_migration::{
    Migratable, MigratableError, Pausable, Snapshot, SnapshotDataSection, Snapshottable,
    Transportable,
};
use vmm_sys_util::eventfd::EventFd;
use vmm_sys_util::signal::{register_signal_handler, SIGRTMIN};

// CPUID feature bits (bit positions within the named register of CPUID function 1).
#[cfg(target_arch = "x86_64")]
const TSC_DEADLINE_TIMER_ECX_BIT: u8 = 24; // tsc deadline timer ecx bit.
#[cfg(target_arch = "x86_64")]
const HYPERVISOR_ECX_BIT: u8 = 31; // Hypervisor ecx bit.
#[cfg(target_arch = "x86_64")]
const MTRR_EDX_BIT: u8 = 12; // MTRR edx bit.

/// Errors reported by the vCPU and CPU manager code in this module.
#[derive(Debug)]
pub enum Error {
    /// Cannot create the vCPU.
    VcpuCreate(anyhow::Error),

    /// Cannot run the vCPUs.
    VcpuRun(anyhow::Error),

    /// Cannot spawn a new vCPU thread.
    VcpuSpawn(io::Error),

    /// Cannot patch the CPUID.
    PatchCpuId(anyhow::Error),

    /// The call to KVM_SET_CPUID2 failed.
    SetSupportedCpusFailed(anyhow::Error),

    #[cfg(target_arch = "x86_64")]
    /// Cannot set the local interruption due to bad configuration.
    LocalIntConfiguration(anyhow::Error),

    /// Error configuring the vCPU.
    VcpuConfiguration(arch::Error),

    #[cfg(target_arch = "aarch64")]
    /// Error fetching the preferred target.
    VcpuArmPreferredTarget(hypervisor::HypervisorVmError),

    #[cfg(target_arch = "aarch64")]
    /// Error doing vCPU init on Arm.
    VcpuArmInit(hypervisor::HypervisorCpuError),

    /// Failed to join on vCPU threads; carries the panic payload of the thread.
    ThreadCleanup(std::boxed::Box<dyn std::any::Any + std::marker::Send>),

    /// Cannot add legacy device to Bus.
    BusError(vm_device::BusError),

    /// Failed to allocate IO port.
    AllocateIOPort,

    /// Asking for more vCPUs than we can have.
    DesiredVCPUCountExceedsMax,

    /// Failed to get KVM vcpu lapic.
    VcpuGetLapic(anyhow::Error),

    /// Failed to set KVM vcpu lapic.
    VcpuSetLapic(anyhow::Error),

    /// Failed to get KVM vcpu MP state.
    VcpuGetMpState(anyhow::Error),

    /// Failed to set KVM vcpu MP state.
    VcpuSetMpState(anyhow::Error),

    /// Failed to get KVM vcpu msrs.
    VcpuGetMsrs(anyhow::Error),

    /// Failed to set KVM vcpu msrs.
    VcpuSetMsrs(anyhow::Error),

    /// Failed to get KVM vcpu regs.
    VcpuGetRegs(anyhow::Error),

    /// Failed to set KVM vcpu regs.
    VcpuSetRegs(anyhow::Error),

    /// Failed to get KVM vcpu sregs.
    VcpuGetSregs(anyhow::Error),

    /// Failed to set KVM vcpu sregs.
    VcpuSetSregs(anyhow::Error),

    /// Failed to get KVM vcpu events.
    VcpuGetVcpuEvents(anyhow::Error),

    /// Failed to set KVM vcpu events.
    VcpuSetVcpuEvents(anyhow::Error),

    /// Failed to get KVM vcpu FPU.
    VcpuGetFpu(anyhow::Error),

    /// Failed to set KVM vcpu FPU.
    VcpuSetFpu(anyhow::Error),

    /// Failed to get KVM vcpu XSAVE.
    VcpuGetXsave(anyhow::Error),

    /// Failed to set KVM vcpu XSAVE.
    VcpuSetXsave(anyhow::Error),

    /// Failed to get KVM vcpu XCRS.
    VcpuGetXcrs(anyhow::Error),

    /// Failed to set KVM vcpu XCRS.
    VcpuSetXcrs(anyhow::Error),

    /// Error resuming vCPU on shutdown.
    ResumeOnShutdown(MigratableError),

    /// Cannot create seccomp filter.
    CreateSeccompFilter(seccomp::SeccompError),

    /// Cannot apply seccomp filter.
    ApplySeccompFilter(seccomp::Error),

    /// Error starting vCPU after restore.
    StartRestoreVcpu(anyhow::Error),

    /// Error because an unexpected VmExit type was received.
    UnexpectedVmExit,
}
/// Result type used throughout this module, with [`Error`] as the error type.
pub type Result<T> = result::Result<T, Error>;

/// Packed 8-byte record describing one processor's local APIC.
///
/// It is appended to the MADT by `create_madt` (one entry per possible vCPU,
/// with `type` 0 and `length` 8).
#[cfg(feature = "acpi")]
#[repr(packed)]
struct LocalAPIC {
    // Entry type; filled with 0 by the code in this file.
    pub r#type: u8,
    // Size of the entry in bytes; filled with 8 by the code in this file.
    pub length: u8,
    // Both ids are set to the vCPU index by the code in this file.
    pub processor_id: u8,
    pub apic_id: u8,
    // Bit `MADT_CPU_ENABLE_FLAG` marks the processor as enabled.
    pub flags: u32,
}

/// Packed 12-byte record describing the I/O APIC, appended to the MADT by
/// `create_madt` (with `type` 1 and `length` 12).
///
/// NOTE(review): unlike `LocalAPIC` this struct is not gated on the `acpi`
/// feature although its only visible user (`create_madt`) is — confirm
/// whether the gate is missing.
#[repr(packed)]
#[derive(Default)]
struct IOAPIC {
    pub r#type: u8,
    pub length: u8,
    pub ioapic_id: u8,
    // Padding byte; left at its default of 0.
    _reserved: u8,
    // Set from `layout::IOAPIC_START` by `create_madt`.
    pub apic_address: u32,
    pub gsi_base: u32,
}

/// Packed 10-byte interrupt source override record, appended to the MADT by
/// `create_madt` (with `type` 2 and `length` 10).
///
/// NOTE(review): not gated on the `acpi` feature although its only visible
/// user (`create_madt`) is — confirm whether the gate is missing.
#[repr(packed)]
#[derive(Default)]
struct InterruptSourceOverride {
    pub r#type: u8,
    pub length: u8,
    pub bus: u8,
    // Bus-relative interrupt source being overridden.
    pub source: u8,
    // Global system interrupt the source is mapped to.
    pub gsi: u32,
    pub flags: u16,
}

/// A wrapper around creating and using a hypervisor-backed VCPU.
pub struct Vcpu {
    // The hypervisor abstracted CPU.
    vcpu: Arc<dyn hypervisor::Vcpu>,
    // CPU number handed to the hypervisor when the vCPU was created.
    id: u8,
    // MPIDR value returned by `arch::configure_vcpu`; 0 until `configure` runs.
    #[cfg(target_arch = "aarch64")]
    mpidr: u64,
    // State captured by `pause()` or loaded by `restore()`; applied by `resume()`.
    saved_state: Option<CpuState>,
}

impl Vcpu {
    /// Constructs a new VCPU for `vm`.
    ///
    /// # Arguments
    ///
    /// * `id` - Represents the CPU number between [0, max vcpus).
    /// * `vm` - The virtual machine this vcpu will get attached to.
    /// * `vmmops` - Optional object for exit handling.
    pub fn new(
        id: u8,
        vm: &Arc<dyn hypervisor::Vm>,
        vmmops: Option<Arc<Box<dyn VmmOps>>>,
    ) -> Result<Arc<Mutex<Self>>> {
        let vcpu = vm
            .create_vcpu(id, vmmops)
            .map_err(|e| Error::VcpuCreate(e.into()))?;
        // Initially the cpuid per vCPU is the one supported by this VM.
        Ok(Arc::new(Mutex::new(Vcpu {
            vcpu,
            id,
            #[cfg(target_arch = "aarch64")]
            mpidr: 0,
            saved_state: None,
        })))
    }

    /// Configures a vcpu and should be called once per vcpu when created.
    ///
    /// On aarch64 the vCPU is first initialized through `init()` and the MPIDR
    /// returned by `arch::configure_vcpu` is recorded. On x86_64 the call is
    /// forwarded to `arch::configure_vcpu` directly.
    ///
    /// # Arguments
    ///
    /// * `vm` - (aarch64) The virtual machine, used to initialize the vCPU.
    /// * `kernel_entry_point` - Kernel entry point address in guest memory and boot protocol used.
    /// * `vm_memory` - Guest memory.
    /// * `cpuid` - (x86_64) CpuId, wrapper over the `kvm_cpuid2` structure.
    /// * `kvm_hyperv` - (x86_64) Forwarded to `arch::configure_vcpu`; presumably
    ///   enables Hyper-V emulation — confirm against the `arch` crate.
    /// * `phys_bits` - Forwarded to `arch::configure_vcpu`; presumably the number
    ///   of guest physical address bits — confirm against the `arch` crate.
    ///
    /// # Errors
    ///
    /// Returns `Error::VcpuConfiguration` when `arch::configure_vcpu` fails and,
    /// on aarch64, any error reported by `init()`.
    pub fn configure(
        &mut self,
        #[cfg(target_arch = "aarch64")] vm: &Arc<dyn hypervisor::Vm>,
        kernel_entry_point: Option<EntryPoint>,
        vm_memory: &GuestMemoryAtomic<GuestMemoryMmap>,
        #[cfg(target_arch = "x86_64")] cpuid: CpuId,
        #[cfg(target_arch = "x86_64")] kvm_hyperv: bool,
        phys_bits: u8,
    ) -> Result<()> {
        #[cfg(target_arch = "aarch64")]
        {
            // The vCPU must be initialized before it can be configured.
            self.init(vm)?;
            self.mpidr = arch::configure_vcpu(
                &self.vcpu,
                self.id,
                kernel_entry_point,
                vm_memory,
                phys_bits,
            )
            .map_err(Error::VcpuConfiguration)?;
        }

        #[cfg(target_arch = "x86_64")]
        arch::configure_vcpu(
            &self.vcpu,
            self.id,
            kernel_entry_point,
            vm_memory,
            cpuid,
            kvm_hyperv,
            phys_bits,
        )
        .map_err(Error::VcpuConfiguration)?;

        Ok(())
    }

    /// Gets the MPIDR register value recorded by `configure()` (0 if the vCPU
    /// has not been configured yet).
    #[cfg(target_arch = "aarch64")]
    pub fn get_mpidr(&self) -> u64 {
        self.mpidr
    }

    /// Gets a copy of the saved vCPU state, or `None` if the vCPU has been
    /// neither paused nor restored from a snapshot.
    #[cfg(target_arch = "aarch64")]
    pub fn get_saved_state(&self) -> Option<CpuState> {
        self.saved_state.clone()
    }

    /// Initializes an aarch64 specific vcpu for booting Linux.
    ///
    /// The kernel's preferred target is queried through `vm`, PSCI 0.2 is
    /// requested, and every vCPU other than vCPU 0 is started powered off.
    ///
    /// # Errors
    ///
    /// Returns `Error::VcpuArmPreferredTarget` or `Error::VcpuArmInit` when the
    /// corresponding hypervisor call fails.
    #[cfg(target_arch = "aarch64")]
    pub fn init(&self, vm: &Arc<dyn hypervisor::Vm>) -> Result<()> {
        let mut init_params = kvm_bindings::kvm_vcpu_init::default();

        // Let the kernel fill in its preferred target type.
        vm.get_preferred_target(&mut init_params)
            .map_err(Error::VcpuArmPreferredTarget)?;

        // We already checked that the capability is supported.
        init_params.features[0] |= 1 << kvm_bindings::KVM_ARM_VCPU_PSCI_0_2;

        // Only the boot CPU (id 0) starts powered on.
        let is_boot_cpu = self.id == 0;
        if !is_boot_cpu {
            init_params.features[0] |= 1 << kvm_bindings::KVM_ARM_VCPU_POWER_OFF;
        }

        self.vcpu
            .vcpu_init(&init_params)
            .map_err(Error::VcpuArmInit)
    }

    /// Runs the VCPU until it exits, returning the reason.
    ///
    /// Note that the state of the VCPU and associated VM must be setup first for this to do
    /// anything useful.
    ///
    /// # Errors
    ///
    /// Propagates the `HypervisorCpuError` reported by the underlying vCPU.
    pub fn run(&self) -> std::result::Result<VmExit, HypervisorCpuError> {
        self.vcpu.run()
    }
}

// Identifier reported by `Vcpu::id()` and prefix of the vCPU snapshot data section id.
const VCPU_SNAPSHOT_ID: &str = "vcpu";
impl Pausable for Vcpu {
    /// Captures the current hypervisor vCPU state into `saved_state`.
    ///
    /// # Errors
    ///
    /// Returns `MigratableError::Pause` when the state cannot be read.
    fn pause(&mut self) -> std::result::Result<(), MigratableError> {
        let state = self
            .vcpu
            .state()
            .map_err(|e| MigratableError::Pause(anyhow!("Could not get vCPU state {:?}", e)))?;
        self.saved_state = Some(state);

        Ok(())
    }

    /// Writes the saved state, if any, back into the hypervisor vCPU.
    ///
    /// A vCPU without saved state is left untouched.
    ///
    /// # Errors
    ///
    /// Returns `MigratableError::Resume` when the state cannot be applied.
    fn resume(&mut self) -> std::result::Result<(), MigratableError> {
        if let Some(vcpu_state) = &self.saved_state {
            // Report the failure as a resume error: this is the resume path,
            // not the pause path.
            self.vcpu.set_state(vcpu_state).map_err(|e| {
                MigratableError::Resume(anyhow!("Could not set the vCPU state {:?}", e))
            })?;
        }

        Ok(())
    }
}
impl Snapshottable for Vcpu {
    fn id(&self) -> String {
        VCPU_SNAPSHOT_ID.to_string()
    }

    fn snapshot(&mut self) -> std::result::Result<Snapshot, MigratableError> {
        let snapshot = serde_json::to_vec(&self.saved_state)
            .map_err(|e| MigratableError::Snapshot(e.into()))?;

        let mut vcpu_snapshot = Snapshot::new(&format!("{}", self.id));
        vcpu_snapshot.add_data_section(SnapshotDataSection {
            id: format!("{}-section", VCPU_SNAPSHOT_ID),
            snapshot,
        });

        Ok(vcpu_snapshot)
    }

    fn restore(&mut self, snapshot: Snapshot) -> std::result::Result<(), MigratableError> {
        if let Some(vcpu_section) = snapshot
            .snapshot_data
            .get(&format!("{}-section", VCPU_SNAPSHOT_ID))
        {
            let vcpu_state = match serde_json::from_slice(&vcpu_section.snapshot) {
                Ok(state) => state,
                Err(error) => {
                    return Err(MigratableError::Restore(anyhow!(
                        "Could not deserialize the vCPU snapshot {}",
                        error
                    )))
                }
            };

            self.saved_state = Some(vcpu_state);

            Ok(())
        } else {
            Err(MigratableError::Restore(anyhow!(
                "Could not find the vCPU snapshot section"
            )))
        }
    }
}

/// Owns the vCPUs of a VM together with the threads running them, and backs
/// the CPU hotplug register block exposed through `BusDevice`.
pub struct CpuManager {
    // CPU configuration (boot/max vCPU counts, topology, ...).
    config: CpusConfig,
    // Interrupt controller notified on `VmExit::IoapicEoi` (x86_64).
    #[cfg_attr(target_arch = "aarch64", allow(dead_code))]
    interrupt_controller: Option<Arc<Mutex<dyn InterruptController>>>,
    // Guest memory handed to each vCPU when it is configured.
    #[cfg_attr(target_arch = "aarch64", allow(dead_code))]
    vm_memory: GuestMemoryAtomic<GuestMemoryMmap>,
    // Patched CPUID cloned into every vCPU at configuration time.
    #[cfg(target_arch = "x86_64")]
    cpuid: CpuId,
    #[cfg_attr(target_arch = "aarch64", allow(dead_code))]
    vm: Arc<dyn hypervisor::Vm>,
    // Set by `shutdown()`; makes every vCPU thread leave its run loop.
    vcpus_kill_signalled: Arc<AtomicBool>,
    // While true, vCPU threads park themselves instead of running.
    vcpus_pause_signalled: Arc<AtomicBool>,
    // Written by a vCPU thread on `VmExit::Shutdown`.
    exit_evt: EventFd,
    // Written by a vCPU thread on `VmExit::Reset`.
    #[cfg_attr(target_arch = "aarch64", allow(dead_code))]
    reset_evt: EventFd,
    // Per-vCPU thread state, indexed by vCPU id; sized to `max_vcpus` in `new()`.
    vcpu_states: Vec<VcpuState>,
    // vCPU id last written to the selection register by the guest.
    selected_cpu: u8,
    // Every vCPU created so far, in creation order.
    vcpus: Vec<Arc<Mutex<Vcpu>>>,
    // Action used when building the seccomp filter of vCPU threads.
    seccomp_action: SeccompAction,
    // Exit handling object passed to every newly created vCPU.
    vmmops: Arc<Box<dyn VmmOps>>,
}

// Bit positions within the byte exchanged at `CPU_STATUS_OFFSET`.
const CPU_ENABLE_FLAG: usize = 0;
const CPU_INSERTING_FLAG: usize = 1;
const CPU_REMOVING_FLAG: usize = 2;
const CPU_EJECT_FLAG: usize = 3;

// Offsets of the status and selection registers within the CPU manager device.
const CPU_STATUS_OFFSET: u64 = 4;
const CPU_SELECTION_OFFSET: u64 = 0;

impl BusDevice for CpuManager {
    /// Handles a guest read from the CPU manager device.
    ///
    /// Only `CPU_STATUS_OFFSET` is readable: the enable/inserting/removing
    /// flags of the currently selected vCPU are OR-ed into `data[0]`. Nothing
    /// is reported when the selected id is not below the number of present
    /// vCPUs.
    ///
    /// NOTE(review): flags are OR-ed in, so this relies on the caller handing
    /// over a zeroed buffer — confirm against the bus implementation.
    fn read(&mut self, _base: u64, offset: u64, data: &mut [u8]) {
        match offset {
            CPU_STATUS_OFFSET => {
                if self.selected_cpu < self.present_vcpus() {
                    let state = &self.vcpu_states[usize::from(self.selected_cpu)];
                    if state.active() {
                        data[0] |= 1 << CPU_ENABLE_FLAG;
                    }
                    if state.inserting {
                        data[0] |= 1 << CPU_INSERTING_FLAG;
                    }
                    if state.removing {
                        data[0] |= 1 << CPU_REMOVING_FLAG;
                    }
                }
            }
            _ => {
                warn!(
                    "Unexpected offset for accessing CPU manager device: {:#}",
                    offset
                );
            }
        }
    }

    /// Handles a guest write to the CPU manager device.
    ///
    /// * `CPU_SELECTION_OFFSET` selects the vCPU subsequent accesses refer to.
    /// * `CPU_STATUS_OFFSET` acknowledges a pending insertion/removal and/or
    ///   requests ejection of the selected vCPU.
    ///
    /// The selected id is guest controlled, so a status write for an id that
    /// has no entry in `vcpu_states` is logged and ignored instead of
    /// indexing out of bounds.
    fn write(&mut self, _base: u64, offset: u64, data: &[u8]) {
        match offset {
            CPU_SELECTION_OFFSET => {
                self.selected_cpu = data[0];
            }
            CPU_STATUS_OFFSET => {
                let value = data[0];
                let cpu_index = usize::from(self.selected_cpu);

                let state = match self.vcpu_states.get_mut(cpu_index) {
                    Some(state) => state,
                    None => {
                        warn!("Out of range vCPU id: {}", self.selected_cpu);
                        return;
                    }
                };

                // The ACPI code writes back a 1 to acknowledge the insertion
                if value & (1 << CPU_INSERTING_FLAG) != 0 && state.inserting {
                    state.inserting = false;
                }
                // Ditto for removal
                if value & (1 << CPU_REMOVING_FLAG) != 0 && state.removing {
                    state.removing = false;
                }
                // Trigger removal of vCPU
                if value & (1 << CPU_EJECT_FLAG) != 0 {
                    if let Err(e) = self.remove_vcpu(self.selected_cpu) {
                        error!("Error removing vCPU: {:?}", e);
                    }
                }
            }
            _ => {
                warn!(
                    "Unexpected offset for accessing CPU manager device: {:#}",
                    offset
                );
            }
        }
    }
}

/// Bookkeeping for the thread running one vCPU.
#[derive(Default)]
struct VcpuState {
    // Hotplug insertion not yet acknowledged by the guest.
    inserting: bool,
    // Removal requested but not yet acknowledged by the guest.
    removing: bool,
    // Handle of the vCPU thread; `Some` means the vCPU counts as active.
    handle: Option<thread::JoinHandle<()>>,
    // Asks this specific vCPU thread to leave its run loop.
    kill: Arc<AtomicBool>,
    // Set by the vCPU thread once it is parked or has left its run loop.
    vcpu_run_interrupted: Arc<AtomicBool>,
}

impl VcpuState {
    fn active(&self) -> bool {
        self.handle.is_some()
    }

    fn signal_thread(&self) {
        if let Some(handle) = self.handle.as_ref() {
            loop {
                unsafe {
                    libc::pthread_kill(handle.as_pthread_t() as _, SIGRTMIN());
                }
                if self.vcpu_run_interrupted.load(Ordering::SeqCst) {
                    break;
                } else {
                    // This is more effective than thread::yield_now() at
                    // avoiding a priority inversion with the vCPU thread
                    thread::sleep(std::time::Duration::from_millis(1));
                }
            }
        }
    }

    fn join_thread(&mut self) -> Result<()> {
        if let Some(handle) = self.handle.take() {
            handle.join().map_err(Error::ThreadCleanup)?
        }

        Ok(())
    }

    fn unpark_thread(&self) {
        if let Some(handle) = self.handle.as_ref() {
            handle.thread().unpark()
        }
    }
}

impl CpuManager {
    #[allow(unused_variables)]
    #[allow(clippy::too_many_arguments)]
    pub fn new(
        config: &CpusConfig,
        device_manager: &Arc<Mutex<DeviceManager>>,
        memory_manager: &Arc<Mutex<MemoryManager>>,
        vm: Arc<dyn hypervisor::Vm>,
        exit_evt: EventFd,
        reset_evt: EventFd,
        hypervisor: Arc<dyn hypervisor::Hypervisor>,
        seccomp_action: SeccompAction,
        vmmops: Arc<Box<dyn VmmOps>>,
    ) -> Result<Arc<Mutex<CpuManager>>> {
        let guest_memory = memory_manager.lock().unwrap().guest_memory();
        let mut vcpu_states = Vec::with_capacity(usize::from(config.max_vcpus));
        vcpu_states.resize_with(usize::from(config.max_vcpus), VcpuState::default);

        #[cfg(target_arch = "x86_64")]
        let sgx_epc_sections =
            if let Some(sgx_epc_region) = memory_manager.lock().unwrap().sgx_epc_region() {
                Some(sgx_epc_region.epc_sections().clone())
            } else {
                None
            };
        #[cfg(target_arch = "x86_64")]
        let cpuid = CpuManager::patch_cpuid(hypervisor, &config.topology, sgx_epc_sections)?;

        let device_manager = device_manager.lock().unwrap();
        let cpu_manager = Arc::new(Mutex::new(CpuManager {
            config: config.clone(),
            interrupt_controller: device_manager.interrupt_controller().clone(),
            vm_memory: guest_memory,
            #[cfg(target_arch = "x86_64")]
            cpuid,
            vm,
            vcpus_kill_signalled: Arc::new(AtomicBool::new(false)),
            vcpus_pause_signalled: Arc::new(AtomicBool::new(false)),
            vcpu_states,
            exit_evt,
            reset_evt,
            selected_cpu: 0,
            vcpus: Vec::with_capacity(usize::from(config.max_vcpus)),
            seccomp_action,
            vmmops,
        }));

        #[cfg(target_arch = "x86_64")]
        device_manager
            .allocator()
            .lock()
            .unwrap()
            .allocate_io_addresses(Some(GuestAddress(0x0cd8)), 0x8, None)
            .ok_or(Error::AllocateIOPort)?;

        #[cfg(target_arch = "x86_64")]
        device_manager
            .io_bus()
            .insert(cpu_manager.clone(), 0x0cd8, 0xc)
            .map_err(Error::BusError)?;

        Ok(cpu_manager)
    }

    #[cfg(target_arch = "x86_64")]
    fn patch_cpuid(
        hypervisor: Arc<dyn hypervisor::Hypervisor>,
        topology: &Option<CpuTopology>,
        sgx_epc_sections: Option<Vec<SgxEpcSection>>,
    ) -> Result<CpuId> {
        let mut cpuid_patches = Vec::new();

        // Patch tsc deadline timer bit
        cpuid_patches.push(CpuidPatch {
            function: 1,
            index: 0,
            flags_bit: None,
            eax_bit: None,
            ebx_bit: None,
            ecx_bit: Some(TSC_DEADLINE_TIMER_ECX_BIT),
            edx_bit: None,
        });

        // Patch hypervisor bit
        cpuid_patches.push(CpuidPatch {
            function: 1,
            index: 0,
            flags_bit: None,
            eax_bit: None,
            ebx_bit: None,
            ecx_bit: Some(HYPERVISOR_ECX_BIT),
            edx_bit: None,
        });

        // Enable MTRR feature
        cpuid_patches.push(CpuidPatch {
            function: 1,
            index: 0,
            flags_bit: None,
            eax_bit: None,
            ebx_bit: None,
            ecx_bit: None,
            edx_bit: Some(MTRR_EDX_BIT),
        });

        // Supported CPUID
        let mut cpuid = hypervisor
            .get_cpuid()
            .map_err(|e| Error::PatchCpuId(e.into()))?;

        CpuidPatch::patch_cpuid(&mut cpuid, cpuid_patches);

        if let Some(t) = topology {
            arch::x86_64::update_cpuid_topology(
                &mut cpuid,
                t.threads_per_core,
                t.cores_per_die,
                t.dies_per_package,
            );
        }

        if let Some(sgx_epc_sections) = sgx_epc_sections {
            arch::x86_64::update_cpuid_sgx(&mut cpuid, sgx_epc_sections).unwrap();
        }

        Ok(cpuid)
    }

    fn create_vcpu(
        &mut self,
        cpu_id: u8,
        entry_point: Option<EntryPoint>,
        snapshot: Option<Snapshot>,
    ) -> Result<Arc<Mutex<Vcpu>>> {
        info!("Creating vCPU: cpu_id = {}", cpu_id);

        let vcpu = Vcpu::new(cpu_id, &self.vm, Some(self.vmmops.clone()))?;

        if let Some(snapshot) = snapshot {
            // AArch64 vCPUs should be initialized after created.
            #[cfg(target_arch = "aarch64")]
            vcpu.lock().unwrap().init(&self.vm)?;

            vcpu.lock()
                .unwrap()
                .restore(snapshot)
                .expect("Failed to restore vCPU");
        } else {
            let vm_memory = self.vm_memory.clone();

            let phys_bits = physical_bits(self.config.max_phys_bits);

            #[cfg(target_arch = "x86_64")]
            vcpu.lock()
                .unwrap()
                .configure(
                    entry_point,
                    &vm_memory,
                    self.cpuid.clone(),
                    self.config.kvm_hyperv,
                    phys_bits,
                )
                .expect("Failed to configure vCPU");

            #[cfg(target_arch = "aarch64")]
            vcpu.lock()
                .unwrap()
                .configure(&self.vm, entry_point, &vm_memory, phys_bits)
                .expect("Failed to configure vCPU");
        }

        // Adding vCPU to the CpuManager's vCPU list.
        self.vcpus.push(Arc::clone(&vcpu));

        Ok(vcpu)
    }

    /// Creates the vCPUs missing to reach `desired_vcpus`.
    ///
    /// vCPUs that were already allocated are reused, so only ids from the
    /// current number of allocated vCPUs up to `desired_vcpus` are created.
    ///
    /// # Errors
    ///
    /// Returns `Error::DesiredVCPUCountExceedsMax` when `desired_vcpus` is
    /// above the configured maximum, or the first vCPU creation error.
    fn create_vcpus(&mut self, desired_vcpus: u8, entry_point: Option<EntryPoint>) -> Result<()> {
        info!(
            "Request to create new vCPUs: desired = {}, max = {}, allocated = {}, present = {}",
            desired_vcpus,
            self.config.max_vcpus,
            self.vcpus.len(),
            self.present_vcpus()
        );

        let max_vcpus = self.config.max_vcpus;
        if desired_vcpus > max_vcpus {
            return Err(Error::DesiredVCPUCountExceedsMax);
        }

        // Ids below this one already have an allocated vCPU.
        let first_new_id = self.vcpus.len() as u8;
        (first_new_id..desired_vcpus)
            .try_for_each(|cpu_id| self.create_vcpu(cpu_id, entry_point, None).map(|_| ()))
    }

    /// Spawns the thread running `vcpu` and records its handle.
    ///
    /// The thread applies the vCPU seccomp filter, installs an empty
    /// `SIGRTMIN` handler, waits on `vcpu_thread_barrier` and then runs the
    /// vCPU until it is told to stop, the guest resets or shuts down, or an
    /// error occurs.
    ///
    /// Every path on which the thread leaves the run loop sets
    /// `vcpu_run_interrupted`, because `VcpuState::signal_thread()` waits for
    /// that flag and would otherwise spin forever on a dead thread.
    ///
    /// # Arguments
    ///
    /// * `vcpu` - The vCPU to run.
    /// * `vcpu_thread_barrier` - Barrier shared with the caller and sibling threads.
    /// * `inserting` - Value stored in the state's `inserting` flag.
    ///
    /// # Errors
    ///
    /// Returns `Error::CreateSeccompFilter` or `Error::VcpuSpawn`.
    fn start_vcpu(
        &mut self,
        vcpu: Arc<Mutex<Vcpu>>,
        vcpu_thread_barrier: Arc<Barrier>,
        inserting: bool,
    ) -> Result<()> {
        let cpu_id = vcpu.lock().unwrap().id;
        let reset_evt = self.reset_evt.try_clone().unwrap();
        let exit_evt = self.exit_evt.try_clone().unwrap();
        let vcpu_kill_signalled = self.vcpus_kill_signalled.clone();
        let vcpu_pause_signalled = self.vcpus_pause_signalled.clone();

        let vcpu_kill = self.vcpu_states[usize::from(cpu_id)].kill.clone();
        let vcpu_run_interrupted = self.vcpu_states[usize::from(cpu_id)]
            .vcpu_run_interrupted
            .clone();

        info!("Starting vCPU: cpu_id = {}", cpu_id);

        // Retrieve seccomp filter for vcpu thread
        let vcpu_seccomp_filter = get_seccomp_filter(&self.seccomp_action, Thread::Vcpu)
            .map_err(Error::CreateSeccompFilter)?;

        #[cfg(target_arch = "x86_64")]
        let interrupt_controller_clone = self.interrupt_controller.clone();

        let handle = Some(
            thread::Builder::new()
                .name(format!("vcpu{}", cpu_id))
                .spawn(move || {
                    // Apply seccomp filter for vcpu thread.
                    if let Err(e) =
                        SeccompFilter::apply(vcpu_seccomp_filter).map_err(Error::ApplySeccompFilter)
                    {
                        error!("Error applying seccomp filter: {:?}", e);
                        // This thread will never run the vCPU: report it as
                        // interrupted and still take part in the barrier so
                        // that the thread starting the vCPUs is not blocked
                        // forever.
                        vcpu_run_interrupted.store(true, Ordering::SeqCst);
                        vcpu_thread_barrier.wait();
                        return;
                    }

                    extern "C" fn handle_signal(_: i32, _: *mut siginfo_t, _: *mut c_void) {}
                    // This uses an async signal safe handler to kill the vcpu handles.
                    register_signal_handler(SIGRTMIN(), handle_signal)
                        .expect("Failed to register vcpu signal handler");

                    // Block until all CPUs are ready.
                    vcpu_thread_barrier.wait();

                    loop {
                        // If we are being told to pause, we park the thread
                        // until the pause boolean is toggled.
                        // The resume operation is responsible for toggling
                        // the boolean and unpark the thread.
                        // We enter a loop because park() could spuriously
                        // return. We will then park() again unless the
                        // pause boolean has been toggled.

                        // Need to use Ordering::SeqCst as we have multiple
                        // loads and stores to different atomics and we need
                        // to see them in a consistent order in all threads

                        if vcpu_pause_signalled.load(Ordering::SeqCst) {
                            vcpu_run_interrupted.store(true, Ordering::SeqCst);
                            while vcpu_pause_signalled.load(Ordering::SeqCst) {
                                thread::park();
                            }
                            vcpu_run_interrupted.store(false, Ordering::SeqCst);
                        }

                        // We've been told to terminate
                        if vcpu_kill_signalled.load(Ordering::SeqCst)
                            || vcpu_kill.load(Ordering::SeqCst)
                        {
                            vcpu_run_interrupted.store(true, Ordering::SeqCst);
                            break;
                        }

                        // Run the vCPU until the next exit and act on the exit reason.
                        match vcpu.lock().unwrap().run() {
                            Ok(run) => match run {
                                #[cfg(target_arch = "x86_64")]
                                VmExit::IoapicEoi(vector) => {
                                    if let Some(interrupt_controller) = &interrupt_controller_clone
                                    {
                                        interrupt_controller
                                            .lock()
                                            .unwrap()
                                            .end_of_interrupt(vector);
                                    }
                                }
                                VmExit::Ignore => {}
                                VmExit::Hyperv => {}
                                VmExit::Reset => {
                                    debug!("VmExit::Reset");
                                    vcpu_run_interrupted.store(true, Ordering::SeqCst);
                                    reset_evt.write(1).unwrap();
                                    break;
                                }
                                VmExit::Shutdown => {
                                    debug!("VmExit::Shutdown");
                                    vcpu_run_interrupted.store(true, Ordering::SeqCst);
                                    exit_evt.write(1).unwrap();
                                    break;
                                }
                                _ => {
                                    error!("VCPU generated error: {:?}", Error::UnexpectedVmExit);
                                    // The thread is about to exit: let
                                    // signal_thread() observe it.
                                    vcpu_run_interrupted.store(true, Ordering::SeqCst);
                                    break;
                                }
                            },

                            Err(e) => {
                                error!("VCPU generated error: {:?}", Error::VcpuRun(e.into()));
                                // The thread is about to exit: let
                                // signal_thread() observe it.
                                vcpu_run_interrupted.store(true, Ordering::SeqCst);
                                break;
                            }
                        }

                        // We've been told to terminate
                        if vcpu_kill_signalled.load(Ordering::SeqCst)
                            || vcpu_kill.load(Ordering::SeqCst)
                        {
                            vcpu_run_interrupted.store(true, Ordering::SeqCst);
                            break;
                        }
                    }
                })
                .map_err(Error::VcpuSpawn)?,
        );

        // Record the thread and whether this vCPU is being hot-plugged: the
        // inserting flag stays set until the guest acknowledges the insertion.
        self.vcpu_states[usize::from(cpu_id)].handle = handle;
        self.vcpu_states[usize::from(cpu_id)].inserting = inserting;

        Ok(())
    }

    /// Start up as many vCPUs threads as needed to reach `desired_vcpus`
    ///
    /// The call blocks until every thread it started has reached the shared
    /// barrier. `inserting` is forwarded to `start_vcpu` for each of them.
    ///
    /// # Errors
    ///
    /// Returns `Error::DesiredVCPUCountExceedsMax` when `desired_vcpus` is
    /// above the configured maximum, or the first `start_vcpu` error.
    ///
    /// NOTE(review): when `start_vcpu` fails part-way, threads that were
    /// already spawned stay blocked on the barrier.
    fn activate_vcpus(&mut self, desired_vcpus: u8, inserting: bool) -> Result<()> {
        if desired_vcpus > self.config.max_vcpus {
            return Err(Error::DesiredVCPUCountExceedsMax);
        }

        let present_vcpus = self.present_vcpus();

        // Size the barrier in `usize`: in `u8` the "+ 1" overflows when 255
        // vCPUs are started at once, and the subtraction underflows when
        // fewer vCPUs are desired than present.
        let vcpus_to_start = usize::from(desired_vcpus.saturating_sub(present_vcpus));
        let vcpu_thread_barrier = Arc::new(Barrier::new(vcpus_to_start + 1));

        info!(
            "Starting vCPUs: desired = {}, allocated = {}, present = {}",
            desired_vcpus,
            self.vcpus.len(),
            present_vcpus
        );

        // This reuses any inactive vCPUs as well as any that were newly created
        for cpu_id in present_vcpus..desired_vcpus {
            let vcpu = Arc::clone(&self.vcpus[usize::from(cpu_id)]);
            self.start_vcpu(vcpu, vcpu_thread_barrier.clone(), inserting)?;
        }

        // Unblock all CPU threads.
        vcpu_thread_barrier.wait();
        Ok(())
    }

    /// Flags every present vCPU with an id of `desired_vcpus` or above as
    /// being removed. The vCPUs keep running: actual removal happens when the
    /// guest ejects them.
    fn mark_vcpus_for_removal(&mut self, desired_vcpus: u8) -> Result<()> {
        let present = usize::from(self.present_vcpus());
        let kept = usize::from(desired_vcpus);

        // Visits the state slots with index in [kept, present).
        self.vcpu_states
            .iter_mut()
            .take(present)
            .skip(kept)
            .for_each(|state| state.removing = true);

        Ok(())
    }

    /// Stops the thread of vCPU `cpu_id` and marks the vCPU as inactive.
    ///
    /// The per-vCPU kill flag is raised, the thread is signalled until it
    /// leaves the run call, and then joined.
    ///
    /// # Errors
    ///
    /// Returns `Error::ThreadCleanup` when the thread panicked; the kill flag
    /// is left set in that case.
    fn remove_vcpu(&mut self, cpu_id: u8) -> Result<()> {
        info!("Removing vCPU: cpu_id = {}", cpu_id);

        let slot = usize::from(cpu_id);
        let state = &mut self.vcpu_states[slot];

        state.kill.store(true, Ordering::SeqCst);
        state.signal_thread();
        // Joining takes the handle out of the state, which makes the vCPU
        // inactive.
        state.join_thread()?;

        // Once the thread has exited, clear the "kill" so that it can reused
        state.kill.store(false, Ordering::SeqCst);

        Ok(())
    }

    /// Creates the vCPUs the VM boots with, configured to start at `entry_point`.
    pub fn create_boot_vcpus(&mut self, entry_point: EntryPoint) -> Result<()> {
        self.create_vcpus(self.boot_vcpus(), Some(entry_point))
    }

    /// Starts all the vCPUs that the VM is booting with. Blocks until all
    /// vCPU threads have reached the start barrier.
    pub fn start_boot_vcpus(&mut self) -> Result<()> {
        // Boot vCPUs are not hot-plugged, hence `inserting` is false.
        self.activate_vcpus(self.boot_vcpus(), false)
    }

    pub fn start_restored_vcpus(&mut self) -> Result<()> {
        let vcpu_numbers = self.vcpus.len();
        let vcpu_thread_barrier = Arc::new(Barrier::new((vcpu_numbers + 1) as usize));
        // Restore the vCPUs in "paused" state.
        self.vcpus_pause_signalled.store(true, Ordering::SeqCst);

        for vcpu_index in 0..vcpu_numbers {
            let vcpu = Arc::clone(&self.vcpus[vcpu_index as usize]);

            self.start_vcpu(vcpu, vcpu_thread_barrier.clone(), false)
                .map_err(|e| {
                    Error::StartRestoreVcpu(anyhow!("Failed to start restored vCPUs: {:#?}", e))
                })?;
        }
        // Unblock all restored CPU threads.
        vcpu_thread_barrier.wait();
        Ok(())
    }

    /// Changes the number of vCPUs to `desired_vcpus`.
    ///
    /// Growing creates and starts the missing vCPUs as hot-plugged ones;
    /// shrinking only marks the surplus vCPUs for removal.
    ///
    /// Returns `Ok(true)` when something changed and `Ok(false)` when the
    /// desired count equals the number of present vCPUs.
    pub fn resize(&mut self, desired_vcpus: u8) -> Result<bool> {
        let present_vcpus = self.present_vcpus();

        match desired_vcpus.cmp(&present_vcpus) {
            cmp::Ordering::Equal => Ok(false),
            cmp::Ordering::Less => {
                self.mark_vcpus_for_removal(desired_vcpus)?;
                Ok(true)
            }
            cmp::Ordering::Greater => {
                self.create_vcpus(desired_vcpus, None)?;
                self.activate_vcpus(desired_vcpus, true)?;
                Ok(true)
            }
        }
    }

    pub fn shutdown(&mut self) -> Result<()> {
        // Tell the vCPUs to stop themselves next time they go through the loop
        self.vcpus_kill_signalled.store(true, Ordering::SeqCst);

        // Toggle the vCPUs pause boolean
        self.vcpus_pause_signalled.store(false, Ordering::SeqCst);

        // Unpark all the VCPU threads.
        for state in self.vcpu_states.iter() {
            state.unpark_thread();
        }

        // Signal to the spawned threads (vCPUs and console signal handler). For the vCPU threads
        // this will interrupt the KVM_RUN ioctl() allowing the loop to check the boolean set
        // above.
        for state in self.vcpu_states.iter() {
            state.signal_thread();
        }

        // Wait for all the threads to finish. This removes the state from the vector.
        for mut state in self.vcpu_states.drain(..) {
            state.join_thread()?;
        }

        Ok(())
    }

    /// Returns the configured number of vCPUs the VM boots with.
    pub fn boot_vcpus(&self) -> u8 {
        self.config.boot_vcpus
    }

    /// Returns the configured maximum number of vCPUs.
    pub fn max_vcpus(&self) -> u8 {
        self.config.max_vcpus
    }

    /// Counts the vCPUs that currently have a thread handle.
    fn present_vcpus(&self) -> u8 {
        // `vcpu_states` is sized from a `u8` in `new()`, so the count fits.
        self.vcpu_states
            .iter()
            .filter(|state| state.active())
            .count() as u8
    }

    /// Returns the MPIDR of every allocated vCPU, in creation order.
    #[cfg(target_arch = "aarch64")]
    pub fn get_mpidrs(&self) -> Vec<u64> {
        self.vcpus
            .iter()
            .map(|cpu| cpu.lock().unwrap().get_mpidr())
            .collect()
    }

    /// Returns the saved state of every allocated vCPU, in creation order.
    ///
    /// # Panics
    ///
    /// Panics when a vCPU has no saved state, i.e. it has been neither paused
    /// nor restored from a snapshot.
    #[cfg(target_arch = "aarch64")]
    pub fn get_saved_states(&self) -> Vec<CpuState> {
        self.vcpus
            .iter()
            .map(|cpu| cpu.lock().unwrap().get_saved_state().unwrap())
            .collect()
    }

    /// Builds the MADT ("APIC") ACPI table.
    ///
    /// The table holds one local APIC entry per possible vCPU (only the boot
    /// vCPUs are flagged as enabled), one I/O APIC entry and one interrupt
    /// source override mapping source 4 to GSI 4.
    ///
    /// # Panics
    ///
    /// Panics when the configured boot vCPU count exceeds the maximum.
    #[cfg(feature = "acpi")]
    pub fn create_madt(&self) -> SDT {
        let boot_vcpus = self.config.boot_vcpus;
        let max_vcpus = self.config.max_vcpus;

        // This is also checked in the commandline parsing.
        assert!(boot_vcpus <= max_vcpus);

        let mut madt = SDT::new(*b"APIC", 44, 5, *b"CLOUDH", *b"CHMADT  ", 1);
        madt.write(36, layout::APIC_START);

        for cpu in 0..max_vcpus {
            // Only vCPUs present at boot are advertised as enabled.
            let flags: u32 = if cpu < boot_vcpus {
                1 << MADT_CPU_ENABLE_FLAG
            } else {
                0
            };

            madt.append(LocalAPIC {
                r#type: 0,
                length: 8,
                processor_id: cpu,
                apic_id: cpu,
                flags,
            });
        }

        let ioapic = IOAPIC {
            r#type: 1,
            length: 12,
            ioapic_id: 0,
            _reserved: 0,
            apic_address: layout::IOAPIC_START.0 as u32,
            gsi_base: 0,
        };
        madt.append(ioapic);

        let source_override = InterruptSourceOverride {
            r#type: 2,
            length: 10,
            bus: 0,
            source: 4,
            gsi: 4,
            flags: 0,
        };
        madt.append(source_override);

        madt
    }
}

/// One processor device, identified by its vCPU id, that can be rendered to
/// AML through its `Aml` implementation.
#[cfg(feature = "acpi")]
struct CPU {
    cpu_id: u8,
}

// Bit position, within the `flags` field of a `LocalAPIC` entry, of the bit
// marking the processor as enabled.
#[cfg(feature = "acpi")]
const MADT_CPU_ENABLE_FLAG: usize = 0;

#[cfg(feature = "acpi")]
impl Aml for CPU {
    /// Serializes this vCPU as an AML device named `Cxxx` (zero-padded
    /// `cpu_id`) containing:
    ///
    /// * `_HID` set to "ACPI0007" and `_UID` set to `cpu_id`;
    /// * `_STA`, which returns the result of `CSTA(cpu_id)`;
    /// * `_MAT`, a buffer holding the raw bytes of this vCPU's `LocalAPIC`
    ///   entry with the enabled flag set;
    /// * `_EJ0`, which returns the result of `CEJ0(cpu_id)`.
    fn to_aml_bytes(&self) -> Vec<u8> {
        let lapic = LocalAPIC {
            r#type: 0,
            length: 8,
            processor_id: self.cpu_id,
            apic_id: self.cpu_id,
            flags: 1 << MADT_CPU_ENABLE_FLAG,
        };

        // Copy the raw bytes of the LAPIC entry into a byte buffer for _MAT.
        let mut mat_data = vec![0u8; std::mem::size_of::<LocalAPIC>()];
        // SAFETY: `mat_data` owns exactly `size_of::<LocalAPIC>()` initialized
        // bytes, so the destination is valid for writing one `LocalAPIC`.
        // `write_unaligned` does not require the byte buffer to satisfy the
        // alignment of `LocalAPIC` and neither reads nor drops the bytes it
        // overwrites.
        unsafe { std::ptr::write_unaligned(mat_data.as_mut_ptr() as *mut LocalAPIC, lapic) };

        aml::Device::new(
            format!("C{:03}", self.cpu_id).as_str().into(),
            vec![
                &aml::Name::new("_HID".into(), &"ACPI0007"),
                &aml::Name::new("_UID".into(), &self.cpu_id),
                /*
                _STA return value:
                Bit [0] – Set if the device is present.
                Bit [1] – Set if the device is enabled and decoding its resources.
                Bit [2] – Set if the device should be shown in the UI.
                Bit [3] – Set if the device is functioning properly (cleared if device failed its diagnostics).
                Bit [4] – Set if the battery is present.
                Bits [31:5] – Reserved (must be cleared).
                */
                &aml::Method::new(
                    "_STA".into(),
                    0,
                    false,
                    // Call into CSTA method which will interrogate device
                    vec![&aml::Return::new(&aml::MethodCall::new(
                        "CSTA".into(),
                        vec![&self.cpu_id],
                    ))],
                ),
                // The Linux kernel expects every CPU device to have a _MAT entry
                // containing the LAPIC for this processor with the enabled bit set
                // even if it is disabled in the MADT (non-boot CPU)
                &aml::Name::new("_MAT".into(), &aml::Buffer::new(mat_data)),
                // Trigger CPU ejection
                &aml::Method::new(
                    "_EJ0".into(),
                    1,
                    false,
                    // Call into CEJ0 method which will actually eject device
                    vec![&aml::Return::new(&aml::MethodCall::new(
                        "CEJ0".into(),
                        vec![&self.cpu_id],
                    ))],
                ),
            ],
        )
        .to_aml_bytes()
    }
}

// AML generator for the per-vCPU branch of a notification dispatcher; see its
// `Aml` implementation.
#[cfg(feature = "acpi")]
struct CPUNotify {
    // Index of the vCPU whose `Cxxx` device object gets notified.
    cpu_id: u8,
}

#[cfg(feature = "acpi")]
impl Aml for CPUNotify {
    /// Emits `If (Arg0 == cpu_id) { Notify (Cxxx, Arg1) }`, where `Cxxx` is the
    /// device object named after the zero-padded `cpu_id`.
    fn to_aml_bytes(&self) -> Vec<u8> {
        let device_name = format!("C{:03}", self.cpu_id);
        let device = aml::Path::new(&device_name);
        let notify = aml::Notify::new(&device, &aml::Arg(1));
        let selects_this_cpu = aml::Equal::new(&aml::Arg(0), &self.cpu_id);

        aml::If::new(&selects_this_cpu, vec![&notify]).to_aml_bytes()
    }
}

// AML generator for the helper methods (CSTA, CTFY, CEJ0, CSCN) shared by all
// vCPU devices; see its `Aml` implementation.
#[cfg(feature = "acpi")]
struct CPUMethods {
    // Number of possible vCPUs: one CTFY branch is generated per vCPU and the
    // CSCN scan loop iterates up to this value.
    max_vcpus: u8,
}

#[cfg(feature = "acpi")]
impl Aml for CPUMethods {
    /// Serializes the four helper methods, in this order:
    ///
    /// * `CSTA(cpu)`: selects `cpu` through `CSEL` and returns 0xf if `CPEN`
    ///   reads as one, 0 otherwise;
    /// * `CTFY(cpu, event)`: notifies the device object of `cpu` with `event`;
    /// * `CEJ0(cpu)`: selects `cpu` through `CSEL` and writes one to `CEJ0`;
    /// * `CSCN()`: walks every vCPU below `max_vcpus`, calling `CTFY` with 1
    ///   when `CINS` is set and with 3 when `CRMV` is set, and writing one
    ///   back to the bit that was found set.
    ///
    /// CSTA, CEJ0 and CSCN run while holding the `\_SB_.PRES.CPLK` mutex.
    fn to_aml_bytes(&self) -> Vec<u8> {
        // CPU status method
        let csta = aml::Method::new(
            "CSTA".into(),
            1,
            true,
            vec![
                // Serialize the select-then-read sequence
                &aml::Acquire::new("\\_SB_.PRES.CPLK".into(), 0xfff),
                // Select the CPU given as first argument
                &aml::Store::new(&aml::Path::new("\\_SB_.PRES.CSEL"), &aml::Arg(0)),
                // Default result: 0
                &aml::Store::new(&aml::Local(0), &aml::ZERO),
                // Result becomes 0xf when the CPEN bit is set (see _STA for the bit meanings)
                &aml::If::new(
                    &aml::Equal::new(&aml::Path::new("\\_SB_.PRES.CPEN"), &aml::ONE),
                    vec![&aml::Store::new(&aml::Local(0), &0xfu8)],
                ),
                &aml::Release::new("\\_SB_.PRES.CPLK".into()),
                // Return 0 or 0xf
                &aml::Return::new(&aml::Local(0)),
            ],
        )
        .to_aml_bytes();

        // Notification dispatcher: one `If` branch per possible vCPU
        let notifiers: Vec<CPUNotify> = (0..self.max_vcpus)
            .map(|cpu_id| CPUNotify { cpu_id })
            .collect();
        let notifier_refs: Vec<&dyn aml::Aml> = notifiers
            .iter()
            .map(|notifier| notifier as &dyn aml::Aml)
            .collect();
        let ctfy = aml::Method::new("CTFY".into(), 2, true, notifier_refs).to_aml_bytes();

        // CPU ejection method
        let cej0 = aml::Method::new(
            "CEJ0".into(),
            1,
            true,
            vec![
                &aml::Acquire::new("\\_SB_.PRES.CPLK".into(), 0xfff),
                // Select the CPU given as first argument
                &aml::Store::new(&aml::Path::new("\\_SB_.PRES.CSEL"), &aml::Arg(0)),
                // Set CEJ0 bit
                &aml::Store::new(&aml::Path::new("\\_SB_.PRES.CEJ0"), &aml::ONE),
                &aml::Release::new("\\_SB_.PRES.CPLK".into()),
            ],
        )
        .to_aml_bytes();

        // CPU scan method
        let cscn = aml::Method::new(
            "CSCN".into(),
            0,
            true,
            vec![
                &aml::Acquire::new("\\_SB_.PRES.CPLK".into(), 0xfff),
                // Local0 is the index of the CPU being inspected
                &aml::Store::new(&aml::Local(0), &aml::ZERO),
                &aml::While::new(
                    &aml::LessThan::new(&aml::Local(0), &self.max_vcpus),
                    vec![
                        // Select the CPU currently being inspected
                        &aml::Store::new(&aml::Path::new("\\_SB_.PRES.CSEL"), &aml::Local(0)),
                        // Insertion pending: notify the device with event 1
                        &aml::If::new(
                            &aml::Equal::new(&aml::Path::new("\\_SB_.PRES.CINS"), &aml::ONE),
                            vec![
                                &aml::MethodCall::new(
                                    "CTFY".into(),
                                    vec![&aml::Local(0), &aml::ONE],
                                ),
                                // Reset CINS bit
                                &aml::Store::new(
                                    &aml::Path::new("\\_SB_.PRES.CINS"),
                                    &aml::ONE,
                                ),
                            ],
                        ),
                        // Removal pending: notify the device with the eject constant 0x3
                        &aml::If::new(
                            &aml::Equal::new(&aml::Path::new("\\_SB_.PRES.CRMV"), &aml::ONE),
                            vec![
                                &aml::MethodCall::new(
                                    "CTFY".into(),
                                    vec![&aml::Local(0), &3u8],
                                ),
                                // Reset CRMV bit
                                &aml::Store::new(
                                    &aml::Path::new("\\_SB_.PRES.CRMV"),
                                    &aml::ONE,
                                ),
                            ],
                        ),
                        // Move on to the next CPU
                        &aml::Add::new(&aml::Local(0), &aml::Local(0), &aml::ONE),
                    ],
                ),
                &aml::Release::new("\\_SB_.PRES.CPLK".into()),
            ],
        )
        .to_aml_bytes();

        [csta, ctfy, cej0, cscn].concat()
    }
}

#[cfg(feature = "acpi")]
impl Aml for CpuManager {
    /// Serializes the CPU related AML objects as two devices:
    ///
    /// * `_SB_.PRES`, the CPU hotplug controller: the `CPLK` mutex, the I/O
    ///   resource at 0x0cd8 and the `PRST` operation region with its fields;
    /// * `_SB_.CPUS`, a container holding the shared helper methods and one
    ///   device per possible vCPU (`0..max_vcpus`).
    fn to_aml_bytes(&self) -> Vec<u8> {
        let max_vcpus = self.config.max_vcpus;

        // CPU hotplug controller
        let hotplug_controller = aml::Device::new(
            "_SB_.PRES".into(),
            vec![
                &aml::Name::new("_HID".into(), &aml::EISAName::new("PNP0A06")),
                &aml::Name::new("_UID".into(), &"CPU Hotplug Controller"),
                // Guards the "select a CPU, then access its status" sequences
                &aml::Mutex::new("CPLK".into(), 0),
                // I/O port range of the CPU controller
                &aml::Name::new(
                    "_CRS".into(),
                    &aml::ResourceTemplate::new(vec![&aml::IO::new(
                        0x0cd8, 0x0cd8, 0x01, 0x0c,
                    )]),
                ),
                // The operation region and its fields expose the I/O range as named values
                &aml::OpRegion::new("PRST".into(), aml::OpRegionSpace::SystemIO, 0x0cd8, 0x0c),
                // Byte-wide view: status/command bits located after the first 32 bits
                &aml::Field::new(
                    "PRST".into(),
                    aml::FieldAccessType::Byte,
                    aml::FieldUpdateRule::WriteAsZeroes,
                    vec![
                        aml::FieldEntry::Reserved(32),
                        aml::FieldEntry::Named(*b"CPEN", 1),
                        aml::FieldEntry::Named(*b"CINS", 1),
                        aml::FieldEntry::Named(*b"CRMV", 1),
                        aml::FieldEntry::Named(*b"CEJ0", 1),
                        aml::FieldEntry::Reserved(4),
                        aml::FieldEntry::Named(*b"CCMD", 8),
                    ],
                ),
                // DWord-wide view: CPU selector and data registers
                &aml::Field::new(
                    "PRST".into(),
                    aml::FieldAccessType::DWord,
                    aml::FieldUpdateRule::Preserve,
                    vec![
                        aml::FieldEntry::Named(*b"CSEL", 32),
                        aml::FieldEntry::Reserved(32),
                        aml::FieldEntry::Named(*b"CDAT", 32),
                    ],
                ),
            ],
        )
        .to_aml_bytes();

        // CPU devices, grouped with the shared methods under a common object
        let hid = aml::Name::new("_HID".into(), &"ACPI0010");
        let cid = aml::Name::new("_CID".into(), &aml::EISAName::new("PNP0A05"));
        let methods = CPUMethods { max_vcpus };
        let cpu_devices: Vec<CPU> = (0..max_vcpus).map(|cpu_id| CPU { cpu_id }).collect();

        let mut container_children: Vec<&dyn aml::Aml> = vec![&hid, &cid, &methods];
        container_children.extend(cpu_devices.iter().map(|cpu| cpu as &dyn aml::Aml));

        let cpu_container =
            aml::Device::new("_SB_.CPUS".into(), container_children).to_aml_bytes();

        [hotplug_controller, cpu_container].concat()
    }
}

impl Pausable for CpuManager {
    /// Pauses every vCPU.
    ///
    /// The pause flag is raised first, then every vCPU thread is signalled,
    /// and finally each vCPU is paused. On KVM/x86_64, unless `kvm_hyperv` is
    /// set in the configuration, the guest is also notified that its clock has
    /// been paused.
    ///
    /// # Errors
    ///
    /// Returns the error of the first vCPU that fails to pause, or
    /// `MigratableError::Pause` if the guest clock notification fails.
    fn pause(&mut self) -> std::result::Result<(), MigratableError> {
        // Ask the vCPUs to pause themselves the next time they exit.
        self.vcpus_pause_signalled.store(true, Ordering::SeqCst);

        // Signal the spawned threads (vCPUs and console signal handler). For the
        // vCPU threads this interrupts the KVM_RUN ioctl() so that the run loop
        // gets a chance to look at the flag raised above.
        self.vcpu_states.iter().for_each(|state| {
            state.signal_thread();
        });

        for vcpu_lock in &self.vcpus {
            let mut guard = vcpu_lock.lock().unwrap();
            guard.pause()?;
            #[cfg(all(feature = "kvm", target_arch = "x86_64"))]
            if !self.config.kvm_hyperv {
                guard.vcpu.notify_guest_clock_paused().map_err(|e| {
                    MigratableError::Pause(anyhow!(
                        "Could not notify guest it has been paused {:?}",
                        e
                    ))
                })?;
            }
        }

        Ok(())
    }

    /// Resumes every vCPU.
    ///
    /// Each vCPU is resumed, the pause flag is cleared and the vCPU threads
    /// are then unparked.
    ///
    /// # Errors
    ///
    /// Returns the error of the first vCPU that fails to resume.
    fn resume(&mut self) -> std::result::Result<(), MigratableError> {
        self.vcpus
            .iter()
            .try_for_each(|vcpu| vcpu.lock().unwrap().resume())?;

        // Clear the pause flag before waking the threads up.
        self.vcpus_pause_signalled.store(false, Ordering::SeqCst);

        // Once unparked, the vCPU threads check the pause flag again; since it
        // is now cleared they leave their pause loop and resume running.
        self.vcpu_states.iter().for_each(|state| {
            state.unpark_thread();
        });

        Ok(())
    }
}

impl Snapshottable for CpuManager {
    /// Returns the snapshot identifier of the CPU manager.
    fn id(&self) -> String {
        CPU_MANAGER_SNAPSHOT_ID.to_string()
    }

    /// Builds the CPU manager snapshot by aggregating the snapshot of every vCPU.
    ///
    /// # Errors
    ///
    /// Returns the error of the first vCPU that fails to snapshot itself.
    fn snapshot(&mut self) -> std::result::Result<Snapshot, MigratableError> {
        let mut cpu_manager_snapshot = Snapshot::new(CPU_MANAGER_SNAPSHOT_ID);

        // The CpuManager snapshot is a collection of all vCPUs snapshots.
        for vcpu in &self.vcpus {
            let cpu_snapshot = vcpu.lock().unwrap().snapshot()?;
            cpu_manager_snapshot.add_snapshot(cpu_snapshot);
        }

        Ok(cpu_manager_snapshot)
    }

    /// Re-creates one vCPU for every nested snapshot found in `snapshot`.
    ///
    /// The key of each nested snapshot is parsed as the vCPU id.
    ///
    /// # Errors
    ///
    /// Returns `MigratableError::Restore` if a snapshot key is not a valid
    /// `u8` vCPU id or if the vCPU cannot be created.
    fn restore(&mut self, snapshot: Snapshot) -> std::result::Result<(), MigratableError> {
        for (cpu_id, snapshot) in snapshot.snapshots.iter() {
            debug!("Restoring VCPU {}", cpu_id);
            // The id comes from the snapshot content: report a malformed value
            // as a restore error rather than panicking.
            let vcpu_id = cpu_id.parse::<u8>().map_err(|e| {
                MigratableError::Restore(anyhow!(
                    "Invalid vCPU id {:?} in snapshot: {}",
                    cpu_id,
                    e
                ))
            })?;
            self.create_vcpu(vcpu_id, None, Some(*snapshot.clone()))
                .map_err(|e| MigratableError::Restore(anyhow!("Could not create vCPU {:?}", e)))?;
        }

        Ok(())
    }
}

// Empty implementations: CpuManager overrides nothing in these two traits.
impl Transportable for CpuManager {}
impl Migratable for CpuManager {}

#[cfg(all(feature = "kvm", target_arch = "x86_64"))]
#[cfg(test)]
mod tests {

    use super::*;
    use arch::x86_64::interrupts::*;
    use arch::x86_64::regs::*;
    use arch::x86_64::BootProtocol;
    use hypervisor::x86_64::{FpuState, LapicState, SpecialRegisters, StandardRegisters};

    /// Checks that `set_lint` programs LVT0 with the ExtINT delivery mode and
    /// LVT1 with the NMI delivery mode.
    #[test]
    fn test_setlint() {
        let hyp = hypervisor::new().unwrap();
        let vm = hyp.create_vm().expect("new VM fd creation failed");
        assert!(hyp.check_capability(hypervisor::kvm::Cap::Irqchip));
        // Reading the LAPIC fails unless an irqchip has been created first.
        assert!(vm.create_irq_chip().is_ok());
        let vcpu = vm.create_vcpu(0, None).unwrap();

        // Derive the expected LVT0/LVT1 values from the LAPIC state as it is
        // before calling set_lint.
        let lapic_before: LapicState = vcpu.get_lapic().unwrap();
        let expected_lvt0 = set_apic_delivery_mode(
            get_klapic_reg(&lapic_before, APIC_LVT0),
            APIC_MODE_EXTINT,
        );
        let expected_lvt1 =
            set_apic_delivery_mode(get_klapic_reg(&lapic_before, APIC_LVT1), APIC_MODE_NMI);

        set_lint(&vcpu).unwrap();

        // Read LVT0/LVT1 back and compare them with the expected values.
        let lapic_after: LapicState = vcpu.get_lapic().unwrap();
        assert_eq!(expected_lvt0, get_klapic_reg(&lapic_after, APIC_LVT0));
        assert_eq!(expected_lvt1, get_klapic_reg(&lapic_after, APIC_LVT1));
    }

    /// Checks that `setup_fpu` programs the expected FPU control word.
    #[test]
    fn test_setup_fpu() {
        let hyp = hypervisor::new().unwrap();
        let vm = hyp.create_vm().expect("new VM fd creation failed");
        let vcpu = vm.create_vcpu(0, None).unwrap();
        setup_fpu(&vcpu).unwrap();

        let fpu_after: FpuState = vcpu.get_fpu().unwrap();
        let fpu_wanted = FpuState {
            fcw: 0x37f,
            mxcsr: 0x1f80,
            ..Default::default()
        };

        // TODO: auto-generate kvm related structures with PartialEq on.
        assert_eq!(fpu_wanted.fcw, fpu_after.fcw);
        // mxcsr is deliberately not compared: setting it from FpuState inside
        // setup_fpu does not influence anything (see 'kvm_arch_vcpu_ioctl_set_fpu'
        // from arch/x86/kvm/x86.c), so it stays 0 and such an assertion would
        // fail. Decide whether or not the mxcsr setup should be removed.
    }

    /// Checks that `setup_msrs` programs MSR_IA32_MISC_ENABLE with the value
    /// listed in the boot MSR entries.
    #[test]
    fn test_setup_msrs() {
        use hypervisor::arch::x86::msr_index;
        use hypervisor::x86_64::{MsrEntries, MsrEntry};

        let hyp = hypervisor::new().unwrap();
        let vm = hyp.create_vm().expect("new VM fd creation failed");
        let vcpu = vm.create_vcpu(0, None).unwrap();
        setup_msrs(&vcpu).unwrap();

        // Only the last configured MSR entry (the tenth one) is read back.
        // See create_msr_entries for details.
        let misc_enable_query = MsrEntry {
            index: msr_index::MSR_IA32_MISC_ENABLE,
            ..Default::default()
        };
        let mut queried_msrs = MsrEntries::from_entries(&[misc_enable_query]);

        // get_msrs returns how many MSRs it managed to read; exactly one was
        // requested here.
        let read_count = vcpu.get_msrs(&mut queried_msrs).unwrap();
        assert_eq!(read_count, 1);

        // The tenth boot entry (the one with index msr_index::MSR_IA32_MISC_ENABLE)
        // must carry the data that was just read back.
        let boot_entries = hypervisor::x86_64::boot_msr_entries();
        assert_eq!(boot_entries.as_slice()[9], queried_msrs.as_slice()[0]);
    }

    /// Checks the standard registers programmed by `setup_regs` for the Linux
    /// boot protocol.
    #[test]
    fn test_setup_regs() {
        let hyp = hypervisor::new().unwrap();
        let vm = hyp.create_vm().expect("new VM fd creation failed");
        let vcpu = vm.create_vcpu(0, None).unwrap();

        // rbp is expected to end up with the same value as rsp.
        let wanted = StandardRegisters {
            rflags: 0x0000000000000002u64,
            rip: 1,
            rsp: 2,
            rbp: 2,
            rsi: 3,
            ..Default::default()
        };

        let outcome = setup_regs(
            &vcpu,
            wanted.rip,
            wanted.rsp,
            wanted.rsi,
            BootProtocol::LinuxBoot,
        );
        outcome.unwrap();

        let programmed: StandardRegisters = vcpu.get_regs().unwrap();
        assert_eq!(programmed, wanted);
    }

    /// Checks that `setup_sregs` yields the special registers obtained by
    /// applying the segment and page table setup helpers by hand.
    #[test]
    fn test_setup_sregs() {
        let hyp = hypervisor::new().unwrap();
        let vm = hyp.create_vm().expect("new VM fd creation failed");
        let vcpu = vm.create_vcpu(0, None).unwrap();

        // Build the expectation from the vCPU's initial special registers.
        let mut wanted: SpecialRegisters = vcpu.get_sregs().unwrap();
        let guest_mem = GuestMemoryMmap::from_ranges(&[(GuestAddress(0), 0x10000)]).unwrap();
        configure_segments_and_sregs(&guest_mem, &mut wanted, BootProtocol::LinuxBoot).unwrap();
        setup_page_tables(&guest_mem, &mut wanted).unwrap();

        setup_sregs(&guest_mem, &vcpu, BootProtocol::LinuxBoot).unwrap();

        let programmed: SpecialRegisters = vcpu.get_sregs().unwrap();
        assert_eq!(wanted, programmed);
    }
}

#[cfg(target_arch = "aarch64")]
#[cfg(test)]
mod tests {
    use arch::aarch64::layout;
    use arch::aarch64::regs::*;
    use hypervisor::kvm::aarch64::{is_system_register, MPIDR_EL1};
    use hypervisor::kvm::kvm_bindings::{
        kvm_one_reg, kvm_regs, kvm_vcpu_init, user_pt_regs, KVM_REG_ARM64, KVM_REG_ARM64_SYSREG,
        KVM_REG_ARM_CORE, KVM_REG_SIZE_U64,
    };
    use hypervisor::{arm64_core_reg_id, offset__of};
    use std::mem;
    use vm_memory::{GuestAddress, GuestMemoryMmap};

    /// Checks that `setup_regs` fails before the vCPU is initialized and
    /// succeeds afterwards.
    #[test]
    fn test_setup_regs() {
        let hyp = hypervisor::new().unwrap();
        let vm = hyp.create_vm().unwrap();
        let vcpu = vm.create_vcpu(0, None).unwrap();
        let regions = vec![(
            GuestAddress(layout::RAM_64BIT_START),
            (layout::FDT_MAX_SIZE + 0x1000) as usize,
        )];
        let mem = GuestMemoryMmap::from_ranges(&regions).expect("Cannot initialize memory");

        // Must fail when vcpu is not initialized yet.
        let early_attempt = setup_regs(&vcpu, 0, 0x0, &mem);
        assert!(early_attempt.is_err());

        let mut kvi: kvm_vcpu_init = kvm_vcpu_init::default();
        vm.get_preferred_target(&mut kvi).unwrap();
        vcpu.vcpu_init(&kvi).unwrap();

        let late_attempt = setup_regs(&vcpu, 0, 0x0, &mem);
        assert!(late_attempt.is_ok());
    }

    /// Checks that the MPIDR can only be read once the vCPU is initialized,
    /// and that vCPU 0 then reports 0x80000000.
    #[test]
    fn test_read_mpidr() {
        let hyp = hypervisor::new().unwrap();
        let vm = hyp.create_vm().unwrap();
        let vcpu = vm.create_vcpu(0, None).unwrap();
        let mut kvi: kvm_vcpu_init = kvm_vcpu_init::default();
        vm.get_preferred_target(&mut kvi).unwrap();

        // Must fail when vcpu is not initialized yet.
        let early_read = vcpu.read_mpidr();
        assert!(early_read.is_err());

        vcpu.vcpu_init(&kvi).unwrap();
        let mpidr = vcpu.read_mpidr().unwrap();
        assert_eq!(mpidr, 0x80000000);
    }

    /// Checks that `is_system_register` rejects a core register id and accepts
    /// an id carrying the system register flag.
    #[test]
    fn test_is_system_register() {
        // A core register id (the program counter) is not a system register.
        let pc_offset = offset__of!(user_pt_regs, pc);
        let core_reg_id = arm64_core_reg_id!(KVM_REG_SIZE_U64, pc_offset);
        assert!(!is_system_register(core_reg_id));

        // An id built with KVM_REG_ARM64_SYSREG is a system register.
        let sys_reg_id =
            KVM_REG_ARM64 as u64 | KVM_REG_SIZE_U64 as u64 | KVM_REG_ARM64_SYSREG as u64;
        assert!(is_system_register(sys_reg_id));
    }

    /// Checks that the core registers can only be read and written once the
    /// vCPU is initialized, and that a written state can be read back.
    #[test]
    fn test_save_restore_core_regs() {
        let hyp = hypervisor::new().unwrap();
        let vm = hyp.create_vm().unwrap();
        let vcpu = vm.create_vcpu(0, None).unwrap();
        let mut kvi: kvm_vcpu_init = kvm_vcpu_init::default();
        vm.get_preferred_target(&mut kvi).unwrap();

        // Must fail when vcpu is not initialized yet.
        let mut state = kvm_regs::default();
        let early_get = vcpu.core_registers(&mut state);
        assert!(early_get.is_err());
        assert_eq!(
            early_get.unwrap_err().to_string(),
            "Failed to get core register: Exec format error (os error 8)"
        );

        let early_set = vcpu.set_core_registers(&mut state);
        assert!(early_set.is_err());
        assert_eq!(
            early_set.unwrap_err().to_string(),
            "Failed to set core register: Exec format error (os error 8)"
        );

        // Reading works after initialization.
        vcpu.vcpu_init(&kvi).unwrap();
        assert!(vcpu.core_registers(&mut state).is_ok());
        assert_eq!(state.regs.pstate, 0x3C5);

        // Write the state back and read pstate through the single register
        // interface to make sure it was preserved.
        assert!(vcpu.set_core_registers(&state).is_ok());
        let pstate_offset = offset__of!(user_pt_regs, pstate);
        let pstate_after = vcpu
            .get_reg(arm64_core_reg_id!(KVM_REG_SIZE_U64, pstate_offset))
            .expect("Failed to call kvm get one reg");
        assert_eq!(state.regs.pstate, pstate_after);
    }

    /// Checks that the system registers can only be read and written once the
    /// vCPU is initialized, and that writing them back preserves MPIDR_EL1.
    #[test]
    fn test_save_restore_system_regs() {
        let hyp = hypervisor::new().unwrap();
        let vm = hyp.create_vm().unwrap();
        let vcpu = vm.create_vcpu(0, None).unwrap();
        let mut kvi: kvm_vcpu_init = kvm_vcpu_init::default();
        vm.get_preferred_target(&mut kvi).unwrap();

        // Must fail when vcpu is not initialized yet.
        let mut state: Vec<kvm_one_reg> = Vec::new();
        let early_get = vcpu.system_registers(&mut state);
        assert!(early_get.is_err());
        assert_eq!(
            early_get.unwrap_err().to_string(),
            "Failed to retrieve list of registers: Exec format error (os error 8)"
        );

        let placeholder_mpidr = kvm_one_reg {
            id: MPIDR_EL1,
            addr: 0x00,
        };
        state.push(placeholder_mpidr);
        let early_set = vcpu.set_system_registers(&mut state);
        assert!(early_set.is_err());
        assert_eq!(
            early_set.unwrap_err().to_string(),
            "Failed to set system register: Exec format error (os error 8)"
        );

        // After initialization the saved list must contain the current MPIDR.
        vcpu.vcpu_init(&kvi).unwrap();
        assert!(vcpu.system_registers(&mut state).is_ok());
        let mpidr_before: u64 = vcpu.read_mpidr().expect("Fail to read mpidr");
        let saved_mpidr = kvm_one_reg {
            id: MPIDR_EL1,
            addr: mpidr_before,
        };
        assert!(state.contains(&saved_mpidr));

        // Writing the saved list back must leave the MPIDR untouched.
        assert!(vcpu.set_system_registers(&state).is_ok());
        let mpidr_after: u64 = vcpu.read_mpidr().expect("Fail to read mpidr");
        assert_eq!(mpidr_before, mpidr_after);
    }

    /// Checks that the MP state can be read and written back unchanged.
    #[test]
    fn test_get_set_mpstate() {
        let hyp = hypervisor::new().unwrap();
        let vm = hyp.create_vm().unwrap();
        let vcpu = vm.create_vcpu(0, None).unwrap();
        let mut kvi: kvm_vcpu_init = kvm_vcpu_init::default();
        vm.get_preferred_target(&mut kvi).unwrap();

        let mp_state = vcpu.get_mp_state();
        assert!(mp_state.is_ok());

        let write_back = vcpu.set_mp_state(mp_state.unwrap());
        assert!(write_back.is_ok());
    }
}
-												pvh: Introduce EntryPoint struct

In order to properly initialize the kvm regs/sregs structs for
the guest, the load_kernel() return type must specify which
boot protocol to use with the entry point address it returns.

Make load_kernel() return an EntryPoint struct containing the
required information. This structure will later be used
in the vCPU configuration methods to setup the appropriate
initial conditions for the guest.

Signed-off-by: Alejandro Jimenez <alejandro.j.jimenez@oracle.com>

											
										
										
											2020-02-12 03:37:33 +00:00
+								// Copyright © 2020, Oracle and/or its affiliates.
 								//
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								// Copyright 2018 Amazon.com, Inc. or its affiliates. All Rights Reserved.
 								//
 								// Portions Copyright 2017 The Chromium OS Authors. All rights reserved.
 								// Use of this source code is governed by a BSD-style license that can be
 								// found in the LICENSE-BSD-3-Clause file.
 								//
 								// Copyright © 2019 Intel Corporation
 								//
 								// SPDX-License-Identifier: Apache-2.0 AND BSD-3-Clause
 								//
-												vmm: cpu: Pass CpusConfig to simplify the new() prototype

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-03-16 17:14:15 +00:00
-												vmm: cpu: Import CpuTopology conditionally on x86_64 only

The aarch64 build has no use for this structure at the moment.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-06-22 13:05:42 +00:00
+								#[cfg(target_arch = "x86_64")]
 								use crate::config::CpuTopology;
 								use crate::config::CpusConfig;
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								use crate::device_manager::DeviceManager;
-												vmm: Pass MemoryManager through CpuManager creation

Instead of passing the GuestMemoryMmap directly to the CpuManager upon
its creation, it's better to pass a reference to the MemoryManager. This
way we will be able to know if SGX EPC region along with one or multiple
sections are present.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-07-08 13:12:27 +00:00
+								use crate::memory_manager::MemoryManager;
-												vmm: seccomp: Add seccomp filters for the vcpu worker thread

Partially fixes: #925

Signed-off-by: Bo Chen <chen.bo@intel.com>

											
										
										
											2020-09-09 22:15:26 +00:00
+								use crate::seccomp_filters::{get_seccomp_filter, Thread};
-												vmm: cpu: Set CPU physical bits based on user input

If the user specified a maximum physical bits value through the
`max_phys_bits` option from `--cpus` parameter, the guest CPUID
will be patched accordingly to ensure the guest will find the
right amount of physical bits.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-10-13 08:22:44 +00:00
+								use crate::vm::physical_bits;
-												vmm: vm: Implement the Snapshottable trait

By aggregating snapshots from the CpuManager, the MemoryManager and the
DeviceManager, Vm implements the snapshot() function from the
Snapshottable trait.
And by restoring snapshots from the CpuManager, the MemoryManager and
the DeviceManager, Vm implements the restore() function from the
Snapshottable trait.

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>
Signed-off-by: Yi Sun <yi.y.sun@linux.intel.com>

											
										
										
											2019-05-12 11:53:47 +00:00
+								use crate::CPU_MANAGER_SNAPSHOT_ID;
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								#[cfg(feature = "acpi")]
 								use acpi_tables::{aml, aml::Aml, sdt::SDT};
-												vmm: cpu: Implement the Snapshottable trait

Implement the Snapshottable trait for Vcpu, and then implements it for
CpuManager. Note that CpuManager goes through the Snapshottable
implementation of Vcpu for every vCPU in order to implement the
Snapshottable trait for itself.

Signed-off-by: Yi Sun <yi.y.sun@linux.intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-18 15:44:41 +00:00
+								use anyhow::anyhow;
-												ci: Run clippy for each specific feature

The build is run against "--all-features", "pci,acpi", "pci" and "mmio"
separately. The clippy validation must be run against the same set of
features in order to validate the code is correct.

Because of these new checks, this commit includes multiple fixes
related to the errors generated when manually running the checks.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-01-21 08:32:50 +00:00
+								#[cfg(feature = "acpi")]
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								use arch::layout;
-												arch, hypervisor, vmm: Patch CPUID subleaves to expose EPC sections

The support for SGX is exposed to the guest through CPUID 0x12. KVM
passes static subleaves 0 and 1 from the host to the guest, without
needing any modification from the VMM itself.

But SGX also relies on dynamic subleaves 2 through N, used for
describing each EPC section. This is not handled by KVM, which means
the VMM is in charge of setting each subleaf starting from index 2
up to index N, depending on the number of EPC sections.

These subleaves 2 through N are not listed as part of the supported
CPUID entries from KVM. But it's important to set them as long as index
0 and 1 are present and indicate that SGX is supported.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-07-08 14:58:10 +00:00
+								#[cfg(target_arch = "x86_64")]
 								use arch::x86_64::SgxEpcSection;
-												vmm: Move Vcpu::configure() to arch crate

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-28 07:27:22 +00:00
+								#[cfg(target_arch = "x86_64")]
-												vmm, hypervisor: Fix snapshot/restore for Windows guest

The snapshot/restore feature is not working because some CPU states are
not properly saved, which means they can't be restored later on.

First thing, we ensure the CPUID is stored so that it can be properly
restored later. The code is simplified and pushed down to the hypervisor
crate.

Second thing, we identify for each vCPU if the Hyper-V SynIC device is
emulated or not. In case it is, that means some specific MSRs will be
set by the guest. These MSRs must be saved in order to properly restore
the VM.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-10-16 16:12:46 +00:00
+								use arch::CpuidPatch;
 								use arch::EntryPoint;
-												devices, vm-device: Move BusDevice and Bus into vm-device

This removes the dependency of the pci crate on the devices crate which
now only contains the device implementations themselves.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-09-09 14:30:31 +00:00
+								use devices::interrupt_controller::InterruptController;
-												vmm: decouple vCPU init from `configure_vcpus`

Since calling `KVM_GET_ONE_REG` before `KVM_VCPU_INIT` will
result in an error: Exec format error (os error 8). This commit
decouples the vCPU init process from `configure_vcpus`. Therefore
in the process of restoring the vCPUs, these vCPUs can be
initialized separately before started.

Signed-off-by: Henry Wang <Henry.Wang@arm.com>

											
										
										
											2020-09-06 02:23:39 +00:00
+								#[cfg(target_arch = "aarch64")]
 								use hypervisor::kvm::kvm_bindings;
-												build: Fixed build errors and warnings on AArch64

This is a preparing commit to build and test CH on AArch64. All building
issues were fixed, but no functionality was introduced.
For X86, the logic of code was not changed at all.
For ARM, the architecture specific part is still empty. And we applied
some tricks to workaround lint warnings. But such code will be replaced
later by other commits with real functionality.

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-12 09:49:12 +00:00
+								#[cfg(target_arch = "x86_64")]
-												arch, pci, vmm: Initial switch to the hypervisor crate

Start moving the vmm, arch and pci crates to being hypervisor agnostic
by using the hypervisor trait and abstractions. This is not a complete
switch and there are still some remaining KVM dependencies.

Signed-off-by: Muminul Islam <muislam@microsoft.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-06-02 02:29:54 +00:00
+								use hypervisor::CpuId;
-												hypervisor, vmm: Remove shared ownership of VmmOps

This interface is used by the vCPU thread to delegate responsibility for
handling MMIO/PIO operations and to support different approaches than a
VM exit.

During profiling I found that we were spending 13.75% of the boot CPU
usage acquiring access to the object holding the VmmOps via
ArcSwap::load_full()

    13.75%     6.02%  vcpu0            cloud-hypervisor    [.] arc_swap::ArcSwapAny<T,S>::load_full
            |
            ---arc_swap::ArcSwapAny<T,S>::load_full
               |
                --13.43%--<hypervisor::kvm::KvmVcpu as hypervisor::cpu::Vcpu>::run
                          std::sys_common::backtrace::__rust_begin_short_backtrace
                          core::ops::function::FnOnce::call_once{{vtable-shim}}
                          std::sys::unix::thread::Thread::new::thread_start

However since the object implementing VmmOps does not need to be mutable
and it is only used from the vCPU side we can change the ownership to
being a simple Arc<> that is passed in when calling create_vcpu().

This completely removes the above CPU usage from subsequent profiles.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-11-18 16:37:52 +00:00
+								use hypervisor::{vm::VmmOps, CpuState, HypervisorCpuError, VmExit};
-												vm-virtio, vmm, vfio: Store GuestMemoryMmap in an Arc<ArcSwap<T>>

This allows us to change the memory map that is being used by the
devices via an atomic swap (by replacing the map with another one). The
ArcSwap provides the mechanism for atomically swapping from one to another
whilst still giving good read performance. It is inside an Arc so that we
can use a single ArcSwap for all users.

Not covered by this change is replacing the GuestMemoryMmap itself.

This change also removes some vertical whitespace from use blocks in the
files that this commit also changed. Vertical whitespace was being used
inconsistently and broke rustfmt's behaviour of ordering the imports as
it would only do it within the block.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-31 10:49:11 +00:00
+								use libc::{c_void, siginfo_t};
-												hypervisor, vmm: Remove shared ownership of VmmOps

This interface is used by the vCPU thread to delegate responsibility for
handling MMIO/PIO operations and to support different approaches than a
VM exit.

During profiling I found that we were spending 13.75% of the boot CPU
usage acquiring access to the object holding the VmmOps via
ArcSwap::load_full()

    13.75%     6.02%  vcpu0            cloud-hypervisor    [.] arc_swap::ArcSwapAny<T,S>::load_full
            |
            ---arc_swap::ArcSwapAny<T,S>::load_full
               |
                --13.43%--<hypervisor::kvm::KvmVcpu as hypervisor::cpu::Vcpu>::run
                          std::sys_common::backtrace::__rust_begin_short_backtrace
                          core::ops::function::FnOnce::call_once{{vtable-shim}}
                          std::sys::unix::thread::Thread::new::thread_start

However since the object implementing VmmOps does not need to be mutable
and it is only used from the vCPU side we can change the ownership to
being a simple Arc<> that is passed in when calling create_vcpu().

This completely removes the above CPU usage from subsequent profiles.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-11-18 16:37:52 +00:00
+								use seccomp::{SeccompAction, SeccompFilter};
-												vm-virtio, vmm, vfio: Store GuestMemoryMmap in an Arc<ArcSwap<T>>

This allows us to change the memory map that is being used by the
devices via an atomic swap (by replacing the map with another one). The
ArcSwap provides the mechanism for atomically swapping from one to another
whilst still giving good read performance. It is inside an Arc so that we
can use a single ArcSwap for all users.

Not covered by this change is replacing the GuestMemoryMmap itself.

This change also removes some vertical whitespace from use blocks in the
files that this commit also changed. Vertical whitespace was being used
inconsistently and broke rustfmt's behaviour of ordering the imports as
it would only do it within the block.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-31 10:49:11 +00:00
+								use std::os::unix::thread::JoinHandleExt;
 								use std::sync::atomic::{AtomicBool, Ordering};
-												vmm: Remove all Weak references from CpuManager

Now that the BusDevice devices are stored as Weak references by the
IO and MMIO buses, there's no need to use Weak references from the
CpuManager anymore.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-03-04 15:19:37 +00:00
+								use std::sync::{Arc, Barrier, Mutex};
-												build: Fixed build errors and warnings on AArch64

This is a preparing commit to build and test CH on AArch64. All building
issues were fixed, but no functionality was introduced.
For X86, the logic of code was not changed at all.
For ARM, the architecture specific part is still empty. And we applied
some tricks to workaround lint warnings. But such code will be replaced
later by other commits with real functionality.

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-12 09:49:12 +00:00
+								use std::{cmp, io, result, thread};
-												hypervisor, vmm: Introduce VmmOps trait

Run loop in hypervisor needs a callback mechanism to access resources
like guest memory, mmio, pio etc.

VmmOps trait is introduced here, which is implemented by vmm module.
While handling vcpuexits in run loop, this trait allows hypervisor
module access to the above mentioned resources via callbacks.

Signed-off-by: Praveen Paladugu <prapal@microsoft.com>
Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-09-03 20:50:56 +00:00
+								use vm_device::BusDevice;
-												vmm: Enable memory manager for AArch64

Screened IO space as it is not available on AArch64.

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-06-09 06:54:15 +00:00
+								#[cfg(target_arch = "x86_64")]
 								use vm_memory::GuestAddress;
 								use vm_memory::{GuestMemoryAtomic, GuestMemoryMmap};
-												vmm: cpu: Implement the Snapshottable trait

Implement the Snapshottable trait for Vcpu, and then implements it for
CpuManager. Note that CpuManager goes through the Snapshottable
implementation of Vcpu for every vCPU in order to implement the
Snapshottable trait for itself.

Signed-off-by: Yi Sun <yi.y.sun@linux.intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-18 15:44:41 +00:00
+								use vm_migration::{
 								    Migratable, MigratableError, Pausable, Snapshot, SnapshotDataSection, Snapshottable,
 								    Transportable,
 								};
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								use vmm_sys_util::eventfd::EventFd;
-												vmm: Change booting process to cover AArch64 requirements

Between X86 and AArch64, there is some difference in booting a VM:
- X86_64 can setup IOAPIC before creating any VCPU.
- AArch64 have to create VCPU's before creating GIC.

The old process is:
1. load_kernel()
    load kernel binary
    configure system
2. activate_vcpus()
    create & start VCPU's

So we need to separate "activate_vcpus" into "create_vcpus" and
"activate_vcpus" (to start vcpus only). Setup GIC and create FDT
between the 2 steps.

The new procedure is:
1. load_kernel()
    load kernel binary
    (X86_64) configure system
2. create VCPU's
3. (AArch64) setup GIC
4. (AArch64) configure system
5. start VCPU's

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-26 07:20:22 +00:00
+								use vmm_sys_util::signal::{register_signal_handler, SIGRTMIN};
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
-												vmm: cpu: Move CPUID patching to CpuManager

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-03-16 15:15:38 +00:00
+								// CPUID feature bits
-												build: Fixed build errors and warnings on AArch64

This is a preparing commit to build and test CH on AArch64. All building
issues were fixed, but no functionality was introduced.
For X86, the logic of code was not changed at all.
For ARM, the architecture specific part is still empty. And we applied
some tricks to workaround lint warnings. But such code will be replaced
later by other commits with real functionality.

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-12 09:49:12 +00:00
+								#[cfg(target_arch = "x86_64")]
-												vmm: cpu: Move CPUID patching to CpuManager

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-03-16 15:15:38 +00:00
+								const TSC_DEADLINE_TIMER_ECX_BIT: u8 = 24; // tsc deadline timer ecx bit.
-												build: Fixed build errors and warnings on AArch64

This is a preparing commit to build and test CH on AArch64. All building
issues were fixed, but no functionality was introduced.
For X86, the logic of code was not changed at all.
For ARM, the architecture specific part is still empty. And we applied
some tricks to workaround lint warnings. But such code will be replaced
later by other commits with real functionality.

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-12 09:49:12 +00:00
+								#[cfg(target_arch = "x86_64")]
-												vmm: cpu: Move CPUID patching to CpuManager

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-03-16 15:15:38 +00:00
+								const HYPERVISOR_ECX_BIT: u8 = 31; // Hypervisor ecx bit.
-												vmm: cpu: x86: Enable MTRR feature in CPUID

The MTRR feature was missing from the CPUID, which is causing the guest
to ignore the MTRR settings exposed through dedicated MSRs.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-09-25 12:19:03 +00:00
+								#[cfg(target_arch = "x86_64")]
 								const MTRR_EDX_BIT: u8 = 12; // MTRR edx bit.
-												vmm: cpu: Move CPUID patching to CpuManager

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-03-16 15:15:38 +00:00
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								#[derive(Debug)]
 								pub enum Error {
-												vmm: cpu: Rename fd variable into something more meaningful

The fd naming is quite KVM specific. Since we're now using the
hypervisor crate abstractions, we can rename those into something more
readable and meaningful. Like e.g. vcpu or vm.

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-07-03 08:57:35 +00:00
+								    /// Cannot create the vCPU.
 								    VcpuCreate(anyhow::Error),
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
 								    /// Cannot run the VCPUs.
-												arch, pci, vmm: Initial switch to the hypervisor crate

Start moving the vmm, arch and pci crates to being hypervisor agnostic
by using the hypervisor trait and abstractions. This is not a complete
switch and there are still some remaining KVM dependencies.

Signed-off-by: Muminul Islam <muislam@microsoft.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-06-02 02:29:54 +00:00
+								    VcpuRun(anyhow::Error),
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
 								    /// Cannot spawn a new vCPU thread.
 								    VcpuSpawn(io::Error),
-												vmm: cpu: Move CPUID patching to CpuManager

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-03-16 15:15:38 +00:00
+								    /// Cannot patch the CPU ID
-												arch, pci, vmm: Initial switch to the hypervisor crate

Start moving the vmm, arch and pci crates to being hypervisor agnostic
by using the hypervisor trait and abstractions. This is not a complete
switch and there are still some remaining KVM dependencies.

Signed-off-by: Muminul Islam <muislam@microsoft.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-06-02 02:29:54 +00:00
+								    PatchCpuId(anyhow::Error),
-												vmm: cpu: Move CPUID patching to CpuManager

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-03-16 15:15:38 +00:00
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								    /// The call to KVM_SET_CPUID2 failed.
-												arch, pci, vmm: Initial switch to the hypervisor crate

Start moving the vmm, arch and pci crates to being hypervisor agnostic
by using the hypervisor trait and abstractions. This is not a complete
switch and there are still some remaining KVM dependencies.

Signed-off-by: Muminul Islam <muislam@microsoft.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-06-02 02:29:54 +00:00
+								    SetSupportedCpusFailed(anyhow::Error),
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
 								    #[cfg(target_arch = "x86_64")]
 								    /// Cannot set the local interruption due to bad configuration.
-												arch, pci, vmm: Initial switch to the hypervisor crate

Start moving the vmm, arch and pci crates to being hypervisor agnostic
by using the hypervisor trait and abstractions. This is not a complete
switch and there are still some remaining KVM dependencies.

Signed-off-by: Muminul Islam <muislam@microsoft.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-06-02 02:29:54 +00:00
+								    LocalIntConfiguration(anyhow::Error),
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
-												vmm: Move Vcpu::configure() to arch crate

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-28 07:27:22 +00:00
+								    /// Error configuring VCPU
 								    VcpuConfiguration(arch::Error),
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
-												vmm: decouple vCPU init from `configure_vcpus`

Since calling `KVM_GET_ONE_REG` before `KVM_VCPU_INIT` will
result in an error: Exec format error (os error 8). This commit
decouples the vCPU init process from `configure_vcpus`. Therefore
in the process of restoring the vCPUs, these vCPUs can be
initialized separately before started.

Signed-off-by: Henry Wang <Henry.Wang@arm.com>

											
										
										
											2020-09-06 02:23:39 +00:00
+								    #[cfg(target_arch = "aarch64")]
 								    /// Error fetching prefered target
 								    VcpuArmPreferredTarget(hypervisor::HypervisorVmError),
 								    #[cfg(target_arch = "aarch64")]
 								    /// Error doing vCPU init on Arm.
 								    VcpuArmInit(hypervisor::HypervisorCpuError),
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								    /// Failed to join on vCPU threads
-												vmm: Fix map_err losing the inner error

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-01-24 08:34:51 +00:00
+								    ThreadCleanup(std::boxed::Box<dyn std::any::Any + std::marker::Send>),
-												vmm: cpu: Add the CpuManager onto the IO bus

This allows the kernel (via ACPI based controls) to query and control
the CPU state.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 14:56:10 +00:00
 								    /// Cannot add legacy device to Bus.
-												devices, vm-device: Move BusDevice and Bus into vm-device

This removes the dependency of the pci crate on the devices crate which
now only contains the device implementations themselves.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-09-09 14:30:31 +00:00
+								    BusError(vm_device::BusError),
-												vmm: cpu: Allocate I/O port for the CPU manager

The CPU manager uses an I/O port and to prevent potential clashes with
assignment for PCI devices ensure that it is allocated by the allocator.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-20 14:16:14 +00:00
-												Revert "vmm: Move CpuManager device to MMIO region"

This reverts commit 980e03fa0ab3d217fe91fd60d8459507c903d88b.

											
										
										
											2020-01-24 10:36:39 +00:00
+								    /// Failed to allocate IO port
 								    AllocateIOPort,
-												vmm: cpu: Refactor vCPU thread starting

Refactor the vCPU thread starting so that there is the possibility to
bring on extra vCPU threads.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 13:06:24 +00:00
 								    /// Asking for more vCPUs that we can have
 								    DesiredVCPUCountExceedsMax,
-												vmm: cpu: Get and set KVM vCPU state

These two new helpers will be useful to capture a vCPU state and being
able to restore it at a later time.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-16 20:42:42 +00:00
 								    /// Failed to get KVM vcpu lapic.
-												arch, pci, vmm: Initial switch to the hypervisor crate

Start moving the vmm, arch and pci crates to being hypervisor agnostic
by using the hypervisor trait and abstractions. This is not a complete
switch and there are still some remaining KVM dependencies.

Signed-off-by: Muminul Islam <muislam@microsoft.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-06-02 02:29:54 +00:00
+								    VcpuGetLapic(anyhow::Error),
-												vmm: cpu: Get and set KVM vCPU state

These two new helpers will be useful to capture a vCPU state and being
able to restore it at a later time.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-16 20:42:42 +00:00
 								    /// Failed to set KVM vcpu lapic.
-												arch, pci, vmm: Initial switch to the hypervisor crate

Start moving the vmm, arch and pci crates to being hypervisor agnostic
by using the hypervisor trait and abstractions. This is not a complete
switch and there are still some remaining KVM dependencies.

Signed-off-by: Muminul Islam <muislam@microsoft.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-06-02 02:29:54 +00:00
+								    VcpuSetLapic(anyhow::Error),
-												vmm: cpu: Get and set KVM vCPU state

These two new helpers will be useful to capture a vCPU state and being
able to restore it at a later time.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-16 20:42:42 +00:00
 								    /// Failed to get KVM vcpu MP state.
-												arch, pci, vmm: Initial switch to the hypervisor crate

Start moving the vmm, arch and pci crates to being hypervisor agnostic
by using the hypervisor trait and abstractions. This is not a complete
switch and there are still some remaining KVM dependencies.

Signed-off-by: Muminul Islam <muislam@microsoft.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-06-02 02:29:54 +00:00
+								    VcpuGetMpState(anyhow::Error),
-												vmm: cpu: Get and set KVM vCPU state

These two new helpers will be useful to capture a vCPU state and being
able to restore it at a later time.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-16 20:42:42 +00:00
 								    /// Failed to set KVM vcpu MP state.
-												arch, pci, vmm: Initial switch to the hypervisor crate

Start moving the vmm, arch and pci crates to being hypervisor agnostic
by using the hypervisor trait and abstractions. This is not a complete
switch and there are still some remaining KVM dependencies.

Signed-off-by: Muminul Islam <muislam@microsoft.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-06-02 02:29:54 +00:00
+								    VcpuSetMpState(anyhow::Error),
-												vmm: cpu: Get and set KVM vCPU state

These two new helpers will be useful to capture a vCPU state and being
able to restore it at a later time.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-16 20:42:42 +00:00
 								    /// Failed to get KVM vcpu msrs.
-												arch, pci, vmm: Initial switch to the hypervisor crate

Start moving the vmm, arch and pci crates to being hypervisor agnostic
by using the hypervisor trait and abstractions. This is not a complete
switch and there are still some remaining KVM dependencies.

Signed-off-by: Muminul Islam <muislam@microsoft.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-06-02 02:29:54 +00:00
+								    VcpuGetMsrs(anyhow::Error),
-												vmm: cpu: Get and set KVM vCPU state

These two new helpers will be useful to capture a vCPU state and being
able to restore it at a later time.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-16 20:42:42 +00:00
 								    /// Failed to set KVM vcpu msrs.
-												arch, pci, vmm: Initial switch to the hypervisor crate

Start moving the vmm, arch and pci crates to being hypervisor agnostic
by using the hypervisor trait and abstractions. This is not a complete
switch and there are still some remaining KVM dependencies.

Signed-off-by: Muminul Islam <muislam@microsoft.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-06-02 02:29:54 +00:00
+								    VcpuSetMsrs(anyhow::Error),
-												vmm: cpu: Get and set KVM vCPU state

These two new helpers will be useful to capture a vCPU state and being
able to restore it at a later time.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-16 20:42:42 +00:00
 								    /// Failed to get KVM vcpu regs.
-												arch, pci, vmm: Initial switch to the hypervisor crate

Start moving the vmm, arch and pci crates to being hypervisor agnostic
by using the hypervisor trait and abstractions. This is not a complete
switch and there are still some remaining KVM dependencies.

Signed-off-by: Muminul Islam <muislam@microsoft.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-06-02 02:29:54 +00:00
+								    VcpuGetRegs(anyhow::Error),
-												vmm: cpu: Get and set KVM vCPU state

These two new helpers will be useful to capture a vCPU state and being
able to restore it at a later time.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-16 20:42:42 +00:00
 								    /// Failed to set KVM vcpu regs.
-												arch, pci, vmm: Initial switch to the hypervisor crate

Start moving the vmm, arch and pci crates to being hypervisor agnostic
by using the hypervisor trait and abstractions. This is not a complete
switch and there are still some remaining KVM dependencies.

Signed-off-by: Muminul Islam <muislam@microsoft.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-06-02 02:29:54 +00:00
+								    VcpuSetRegs(anyhow::Error),
-												vmm: cpu: Get and set KVM vCPU state

These two new helpers will be useful to capture a vCPU state and being
able to restore it at a later time.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-16 20:42:42 +00:00
 								    /// Failed to get KVM vcpu sregs.
-												arch, pci, vmm: Initial switch to the hypervisor crate

Start moving the vmm, arch and pci crates to being hypervisor agnostic
by using the hypervisor trait and abstractions. This is not a complete
switch and there are still some remaining KVM dependencies.

Signed-off-by: Muminul Islam <muislam@microsoft.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-06-02 02:29:54 +00:00
+								    VcpuGetSregs(anyhow::Error),
-												vmm: cpu: Get and set KVM vCPU state

These two new helpers will be useful to capture a vCPU state and being
able to restore it at a later time.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-16 20:42:42 +00:00
 								    /// Failed to set KVM vcpu sregs.
-												arch, pci, vmm: Initial switch to the hypervisor crate

Start moving the vmm, arch and pci crates to being hypervisor agnostic
by using the hypervisor trait and abstractions. This is not a complete
switch and there are still some remaining KVM dependencies.

Signed-off-by: Muminul Islam <muislam@microsoft.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-06-02 02:29:54 +00:00
+								    VcpuSetSregs(anyhow::Error),
-												vmm: cpu: Get and set KVM vCPU state

These two new helpers will be useful to capture a vCPU state and being
able to restore it at a later time.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-16 20:42:42 +00:00
 								    /// Failed to get KVM vcpu events.
-												arch, pci, vmm: Initial switch to the hypervisor crate

Start moving the vmm, arch and pci crates to being hypervisor agnostic
by using the hypervisor trait and abstractions. This is not a complete
switch and there are still some remaining KVM dependencies.

Signed-off-by: Muminul Islam <muislam@microsoft.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-06-02 02:29:54 +00:00
+								    VcpuGetVcpuEvents(anyhow::Error),
-												vmm: cpu: Get and set KVM vCPU state

These two new helpers will be useful to capture a vCPU state and to be
able to restore it at a later time.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-16 20:42:42 +00:00
 								    /// Failed to set KVM vcpu events.
-												arch, pci, vmm: Initial switch to the hypervisor crate

Start moving the vmm, arch and pci crates to being hypervisor agnostic
by using the hypervisor trait and abstractions. This is not a complete
switch and there are still some remaining KVM dependencies.

Signed-off-by: Muminul Islam <muislam@microsoft.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-06-02 02:29:54 +00:00
+								    VcpuSetVcpuEvents(anyhow::Error),
-												vmm: cpu: Get and set KVM vCPU state

These two new helpers will be useful to capture a vCPU state and to be
able to restore it at a later time.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-16 20:42:42 +00:00
 								    /// Failed to get KVM vcpu FPU.
-												arch, pci, vmm: Initial switch to the hypervisor crate

Start moving the vmm, arch and pci crates to being hypervisor agnostic
by using the hypervisor trait and abstractions. This is not a complete
switch and there are still some remaining KVM dependencies.

Signed-off-by: Muminul Islam <muislam@microsoft.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-06-02 02:29:54 +00:00
+								    VcpuGetFpu(anyhow::Error),
-												vmm: cpu: Get and set KVM vCPU state

These two new helpers will be useful to capture a vCPU state and to be
able to restore it at a later time.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-16 20:42:42 +00:00
 								    /// Failed to set KVM vcpu FPU.
-												arch, pci, vmm: Initial switch to the hypervisor crate

Start moving the vmm, arch and pci crates to being hypervisor agnostic
by using the hypervisor trait and abstractions. This is not a complete
switch and there are still some remaining KVM dependencies.

Signed-off-by: Muminul Islam <muislam@microsoft.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-06-02 02:29:54 +00:00
+								    VcpuSetFpu(anyhow::Error),
-												vmm: cpu: Get and set KVM vCPU state

These two new helpers will be useful to capture a vCPU state and to be
able to restore it at a later time.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-16 20:42:42 +00:00
 								    /// Failed to get KVM vcpu XSAVE.
-												arch, pci, vmm: Initial switch to the hypervisor crate

Start moving the vmm, arch and pci crates to being hypervisor agnostic
by using the hypervisor trait and abstractions. This is not a complete
switch and there are still some remaining KVM dependencies.

Signed-off-by: Muminul Islam <muislam@microsoft.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-06-02 02:29:54 +00:00
+								    VcpuGetXsave(anyhow::Error),
-												vmm: cpu: Get and set KVM vCPU state

These two new helpers will be useful to capture a vCPU state and to be
able to restore it at a later time.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-16 20:42:42 +00:00
 								    /// Failed to set KVM vcpu XSAVE.
-												arch, pci, vmm: Initial switch to the hypervisor crate

Start moving the vmm, arch and pci crates to being hypervisor agnostic
by using the hypervisor trait and abstractions. This is not a complete
switch and there are still some remaining KVM dependencies.

Signed-off-by: Muminul Islam <muislam@microsoft.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-06-02 02:29:54 +00:00
+								    VcpuSetXsave(anyhow::Error),
-												vmm: cpu: Get and set KVM vCPU state

These two new helpers will be useful to capture a vCPU state and to be
able to restore it at a later time.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-16 20:42:42 +00:00
 								    /// Failed to get KVM vcpu XCRS.
-												arch, pci, vmm: Initial switch to the hypervisor crate

Start moving the vmm, arch and pci crates to being hypervisor agnostic
by using the hypervisor trait and abstractions. This is not a complete
switch and there are still some remaining KVM dependencies.

Signed-off-by: Muminul Islam <muislam@microsoft.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-06-02 02:29:54 +00:00
+								    VcpuGetXcrs(anyhow::Error),
-												vmm: cpu: Get and set KVM vCPU state

These two new helpers will be useful to capture a vCPU state and to be
able to restore it at a later time.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-16 20:42:42 +00:00
 								    /// Failed to set KVM vcpu XCRS.
-												arch, pci, vmm: Initial switch to the hypervisor crate

Start moving the vmm, arch and pci crates to being hypervisor agnostic
by using the hypervisor trait and abstractions. This is not a complete
switch and there are still some remaining KVM dependencies.

Signed-off-by: Muminul Islam <muislam@microsoft.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-06-02 02:29:54 +00:00
+								    VcpuSetXcrs(anyhow::Error),
-												vmm: cpu: Unpause vCPU threads

After setting the kill signal flag for the vCPU thread release the pause
flag and unpark the threads. This ensures that the vCPU thread will
wake up and check the kill signal flag if the VM is paused.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-05-06 09:24:19 +00:00
 								    /// Error resuming vCPU on shutdown
 								    ResumeOnShutdown(MigratableError),
-												vmm: seccomp: Add seccomp filters for the vcpu worker thread

Partially fixes: #925

Signed-off-by: Bo Chen <chen.bo@intel.com>

											
										
										
											2020-09-09 22:15:26 +00:00
 								    /// Cannot create seccomp filter
 								    CreateSeccompFilter(seccomp::SeccompError),
 								    /// Cannot apply seccomp filter
 								    ApplySeccompFilter(seccomp::Error),
-												vmm: refactor vCPU save/restore code in restoring VM

Similarly to the VM booting process, on AArch64 systems,
the vCPUs should be created before the creation of GIC. This
commit refactors the vCPU save/restore code to achieve the
above-mentioned restoring order.

Signed-off-by: Henry Wang <Henry.Wang@arm.com>

											
										
										
											2020-09-04 10:56:30 +00:00
 								    /// Error starting vCPU after restore
 								    StartRestoreVcpu(anyhow::Error),
-												hypervisor, vmm: Introduce VmmOps trait

Run loop in hypervisor needs a callback mechanism to access resources
like guest memory, mmio, pio etc.

VmmOps trait is introduced here, which is implemented by vmm module.
While handling vcpuexits in run loop, this trait allows hypervisor
module access to the above mentioned resources via callbacks.

Signed-off-by: Praveen Paladugu <prapal@microsoft.com>
Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-09-03 20:50:56 +00:00
 								    /// Error because an unexpected VmExit type was received.
 								    UnexpectedVmExit,
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								}
 								pub type Result<T> = result::Result<T, Error>;
-												ci: Run clippy for each specific feature

The build is run against "--all-features", "pci,acpi", "pci" and "mmio"
separately. The clippy validation must be run against the same set of
features in order to validate the code is correct.

Because of these new checks, this commit includes multiple fixes
related to the errors generated when manually running the checks.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-01-21 08:32:50 +00:00
+								#[cfg(feature = "acpi")]
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								#[repr(packed)]
 								// Packed record made only of fixed-width integers (1+1+1+1+4 = 8 bytes with
 								// the `#[repr(packed)]` attribute above, i.e. no padding between fields).
 								// NOTE(review): presumably the ACPI MADT "Processor Local APIC" entry — confirm
 								// against the code that serialises it into the table.
 								struct LocalAPIC {
 								    // `type` is a Rust keyword, hence the raw identifier.
 								    pub r#type: u8,
 								    pub length: u8,
 								    pub processor_id: u8,
 								    pub apic_id: u8,
 								    pub flags: u32,
 								}
 								// Packed record made only of fixed-width integers (1+1+1+1+4+4 = 12 bytes,
 								// no padding between fields). `Default` yields an all-zero value.
 								// NOTE(review): presumably the ACPI MADT "I/O APIC" entry — confirm against the
 								// code that serialises it into the table.
 								#[repr(packed)]
 								#[derive(Default)]
 								struct IOAPIC {
 								    // `type` is a Rust keyword, hence the raw identifier.
 								    pub r#type: u8,
 								    pub length: u8,
 								    pub ioapic_id: u8,
 								    // Private filler byte; it is never exposed outside this struct.
 								    _reserved: u8,
 								    pub apic_address: u32,
 								    pub gsi_base: u32,
 								}
 								// Packed record made only of fixed-width integers (1+1+1+1+4+2 = 10 bytes,
 								// no padding between fields). `Default` yields an all-zero value.
 								// NOTE(review): presumably the ACPI MADT "Interrupt Source Override" entry —
 								// confirm against the code that serialises it into the table.
 								#[repr(packed)]
 								#[derive(Default)]
 								struct InterruptSourceOverride {
 								    // `type` is a Rust keyword, hence the raw identifier.
 								    pub r#type: u8,
 								    pub length: u8,
 								    pub bus: u8,
 								    pub source: u8,
 								    pub gsi: u32,
 								    pub flags: u16,
 								}
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								/// A wrapper around creating and using a kvm-based VCPU.
 								pub struct Vcpu {
-												vmm: cpu: Rename fd variable into something more meaningful

The fd naming is quite KVM specific. Since we're now using the
hypervisor crate abstractions, we can rename those into something more
readable and meaningful. Like e.g. vcpu or vm.

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-07-03 08:57:35 +00:00
+								    // The hypervisor abstracted CPU.
 								    vcpu: Arc<dyn hypervisor::Vcpu>,
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								    id: u8,
-												vmm: Enable VCPU for AArch64

Added MPIDR which is needed in system configuration.

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-06-09 07:24:23 +00:00
+								    #[cfg(target_arch = "aarch64")]
 								    mpidr: u64,
-												vmm: Save and restore vCPU states during pause/resume operations

We need consistency between pause/resume and snapshot/restore
operations. The symmetrical behavior of pausing/snapshotting
and restoring/resuming has been introduced recently, and we must
now ensure that no matter if we're using pause/resume or
snapshot/restore features, the resulting VM should be running in
the exact same way.

That's why the vCPU state is now stored upon VM pausing. The snapshot
operation being a simple serialization of the previously saved state.
The same way, the vCPU state is now restored upon VM resuming. The
restore operation being a simple deserialization of the previously
restored state.

It's interesting to note that this patch ensures time consistency from a
guest perspective, no matter which clocksource is being used. From a
previous patch, the KVM clock was saved/restored upon VM pause/resume.
We now have the same behavior for TSC, as the TSC from the vCPUs are
saved/restored upon VM pause/resume too.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-06-24 11:55:18 +00:00
+								    saved_state: Option<CpuState>,
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								}
 								impl Vcpu {
 								    /// Constructs a new VCPU for `vm`.
 								    ///
 								    /// # Arguments
 								    ///
 								    /// * `id` - Represents the CPU number between [0, max vcpus).
 								    /// * `vm` - The virtual machine this vcpu will get attached to.
-												hypervisor, vmm: Remove shared ownership of VmmOps

This interface is used by the vCPU thread to delegate responsibility for
handling MMIO/PIO operations and to support different approaches than a
VM exit.

During profiling I found that we were spending 13.75% of the boot CPU
usage acquiring access to the object holding the VmmOps via
ArcSwap::load_full()

    13.75%     6.02%  vcpu0            cloud-hypervisor    [.] arc_swap::ArcSwapAny<T,S>::load_full
            |
            ---arc_swap::ArcSwapAny<T,S>::load_full
               |
                --13.43%--<hypervisor::kvm::KvmVcpu as hypervisor::cpu::Vcpu>::run
                          std::sys_common::backtrace::__rust_begin_short_backtrace
                          core::ops::function::FnOnce::call_once{{vtable-shim}}
                          std::sys::unix::thread::Thread::new::thread_start

However since the object implementing VmmOps does not need to be mutable
and it is only used from the vCPU side we can change the ownership to
being a simple Arc<> that is passed in when calling create_vcpu().

This completely removes the above CPU usage from subsequent profiles.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-11-18 16:37:52 +00:00
+								    /// * `vmmops` - Optional object for exit handling.
 								    pub fn new(
 								        id: u8,
 								        vm: &Arc<dyn hypervisor::Vm>,
 								        vmmops: Option<Arc<Box<dyn VmmOps>>>,
 								    ) -> Result<Arc<Mutex<Self>>> {
-												vmm: cpu: Rename fd variable into something more meaningful

The fd naming is quite KVM specific. Since we're now using the
hypervisor crate abstractions, we can rename those into something more
readable and meaningful. Like e.g. vcpu or vm.

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-07-03 08:57:35 +00:00
+								        let vcpu = vm
-												hypervisor, vmm: Remove shared ownership of VmmOps

This interface is used by the vCPU thread to delegate responsibility for
handling MMIO/PIO operations and to support different approaches than a
VM exit.

During profiling I found that we were spending 13.75% of the boot CPU
usage acquiring access to the object holding the VmmOps via
ArcSwap::load_full()

    13.75%     6.02%  vcpu0            cloud-hypervisor    [.] arc_swap::ArcSwapAny<T,S>::load_full
            |
            ---arc_swap::ArcSwapAny<T,S>::load_full
               |
                --13.43%--<hypervisor::kvm::KvmVcpu as hypervisor::cpu::Vcpu>::run
                          std::sys_common::backtrace::__rust_begin_short_backtrace
                          core::ops::function::FnOnce::call_once{{vtable-shim}}
                          std::sys::unix::thread::Thread::new::thread_start

However since the object implementing VmmOps does not need to be mutable
and it is only used from the vCPU side we can change the ownership to
being a simple Arc<> that is passed in when calling create_vcpu().

This completely removes the above CPU usage from subsequent profiles.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-11-18 16:37:52 +00:00
+								            .create_vcpu(id, vmmops)
-												vmm: cpu: Rename fd variable into something more meaningful

The fd naming is quite KVM specific. Since we're now using the
hypervisor crate abstractions, we can rename those into something more
readable and meaningful. Like e.g. vcpu or vm.

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-07-03 08:57:35 +00:00
+								            .map_err(|e| Error::VcpuCreate(e.into()))?;
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								        // Initially the cpuid per vCPU is the one supported by this VM.
-												vmm: cpu: Track all Vcpus through CpuManager

In anticipation for the CpuManager to aggregate all Vcpu snapshots
together, this change makes sure the CpuManager has a handle onto
every vCPU.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-18 15:58:51 +00:00
+								        Ok(Arc::new(Mutex::new(Vcpu {
-												vmm: cpu: Rename fd variable into something more meaningful

The fd naming is quite KVM specific. Since we're now using the
hypervisor crate abstractions, we can rename those into something more
readable and meaningful. Like e.g. vcpu or vm.

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-07-03 08:57:35 +00:00
+								            vcpu,
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								            id,
-												vmm: Enable VCPU for AArch64

Added MPIDR which is needed in system configuration.

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-06-09 07:24:23 +00:00
+								            #[cfg(target_arch = "aarch64")]
 								            mpidr: 0,
-												vmm: Save and restore vCPU states during pause/resume operations

We need consistency between pause/resume and snapshot/restore
operations. The symmetrical behavior of pausing/snapshotting
and restoring/resuming has been introduced recently, and we must
now ensure that no matter if we're using pause/resume or
snapshot/restore features, the resulting VM should be running in
the exact same way.

That's why the vCPU state is now stored upon VM pausing. The snapshot
operation being a simple serialization of the previously saved state.
The same way, the vCPU state is now restored upon VM resuming. The
restore operation being a simple deserialization of the previously
restored state.

It's interesting to note that this patch ensures time consistency from a
guest perspective, no matter which clocksource is being used. From a
previous patch, the KVM clock was saved/restored upon VM pause/resume.
We now have the same behavior for TSC, as the TSC from the vCPUs are
saved/restored upon VM pause/resume too.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-06-24 11:55:18 +00:00
+								            saved_state: None,
-												vmm: cpu: Track all Vcpus through CpuManager

In anticipation for the CpuManager to aggregate all Vcpu snapshots
together, this change makes sure the CpuManager has a handle onto
every vCPU.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-18 15:58:51 +00:00
+								        })))
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								    }
-												vmm: Move Vcpu::configure() to arch crate

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-28 07:27:22 +00:00
+								    /// Configures a vcpu and should be called once per vcpu when created.
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								    ///
 								    /// # Arguments
 								    ///
-												pvh: Introduce EntryPoint struct

In order to properly initialize the kvm regs/sregs structs for
the guest, the load_kernel() return type must specify which
boot protocol to use with the entry point address it returns.

Make load_kernel() return an EntryPoint struct containing the
required information. This structure will later be used
in the vCPU configuration methods to setup the appropriate
initial conditions for the guest.

Signed-off-by: Alejandro Jimenez <alejandro.j.jimenez@oracle.com>

											
										
										
											2020-02-12 03:37:33 +00:00
+								    /// * `kernel_entry_point` - Kernel entry point address in guest memory and boot protocol used.
-												vmm: Change booting process to cover AArch64 requirements

Between X86 and AArch64, there is some difference in booting a VM:
- X86_64 can setup IOAPIC before creating any VCPU.
- AArch64 have to create VCPU's before creating GIC.

The old process is:
1. load_kernel()
    load kernel binary
    configure system
2. activate_vcpus()
    create & start VCPU's

So we need to separate "activate_vcpus" into "create_vcpus" and
"activate_vcpus" (to start vcpus only). Setup GIC and create FDT
between the 2 steps.

The new procedure is:
1. load_kernel()
    load kernel binary
    (X86_64) configure system
2. create VCPU's
3. (AArch64) setup GIC
4. (AArch64) configure system
5. start VCPU's

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-26 07:20:22 +00:00
+								    /// * `vm_memory` - Guest memory.
-												vmm: Move Vcpu::configure() to arch crate

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-28 07:27:22 +00:00
+								    /// * `cpuid` - (x86_64) CpuId, wrapper over the `kvm_cpuid2` structure.
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								    pub fn configure(
-												vmm: Enable VCPU for AArch64

Added MPIDR which is needed in system configuration.

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-06-09 07:24:23 +00:00
+								        &mut self,
-												vmm: cpu: Rename fd variable into something more meaningful

The fd naming is quite KVM specific. Since we're now using the
hypervisor crate abstractions, we can rename those into something more
readable and meaningful. Like e.g. vcpu or vm.

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-07-03 08:57:35 +00:00
+								        #[cfg(target_arch = "aarch64")] vm: &Arc<dyn hypervisor::Vm>,
-												pvh: Introduce EntryPoint struct

In order to properly initialize the kvm regs/sregs structs for
the guest, the load_kernel() return type must specify which
boot protocol to use with the entry point address it returns.

Make load_kernel() return an EntryPoint struct containing the
required information. This structure will later be used
in the vCPU configuration methods to setup the appropriate
initial conditions for the guest.

Signed-off-by: Alejandro Jimenez <alejandro.j.jimenez@oracle.com>

											
										
										
											2020-02-12 03:37:33 +00:00
+								        kernel_entry_point: Option<EntryPoint>,
-												vmm: Move codebase to GuestMemoryAtomic from vm-memory

Relying on the latest vm-memory version, including the freshly
introduced structure GuestMemoryAtomic, this patch replaces every
occurrence of Arc<ArcSwap<GuestMemoryMmap> with
GuestMemoryAtomic<GuestMemoryMmap>.

The point is to rely on the common RCU-like implementation from
vm-memory so that we don't have to do it from Cloud-Hypervisor.

Fixes #735

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-02-11 16:22:40 +00:00
+								        vm_memory: &GuestMemoryAtomic<GuestMemoryMmap>,
-												vmm: Move Vcpu::configure() to arch crate

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-28 07:27:22 +00:00
+								        #[cfg(target_arch = "x86_64")] cpuid: CpuId,
-												vmm, arch: Enable KVM HyperV support

Inject CPUID leaves for advertising KVM HyperV support when the
"kvm_hyperv" toggle is enabled. Currently we only enable a selection of
features required to boot.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-09-15 15:26:34 +00:00
+								        #[cfg(target_arch = "x86_64")] kvm_hyperv: bool,
-												vmm: cpu: Set CPU physical bits based on user input

If the user specified a maximum physical bits value through the
`max_phys_bits` option from `--cpus` parameter, the guest CPUID
will be patched accordingly to ensure the guest will find the
right amount of physical bits.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-10-13 08:22:44 +00:00
+								        phys_bits: u8,
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								    ) -> Result<()> {
-												vmm: Move Vcpu::configure() to arch crate

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-28 07:27:22 +00:00
+								        #[cfg(target_arch = "aarch64")]
-												vmm: Enable VCPU for AArch64

Added MPIDR which is needed in system configuration.

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-06-09 07:24:23 +00:00
+								        {
-												vmm: decouple vCPU init from `configure_vcpus`

Calling `KVM_GET_ONE_REG` before `KVM_VCPU_INIT` results in an error:
Exec format error (os error 8). This commit therefore decouples the
vCPU init process from `configure_vcpus`, so that when restoring the
vCPUs they can be initialized separately before being started.

Signed-off-by: Henry Wang <Henry.Wang@arm.com>

											
										
										
											2020-09-06 02:23:39 +00:00
+								            self.init(vm)?;
-												vmm: cpu: Set CPU physical bits based on user input

If the user specified a maximum physical bits value through the
`max_phys_bits` option from `--cpus` parameter, the guest CPUID
will be patched accordingly to ensure the guest will find the
right amount of physical bits.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-10-13 08:22:44 +00:00
+								            self.mpidr = arch::configure_vcpu(
 								                &self.vcpu,
 								                self.id,
 								                kernel_entry_point,
 								                vm_memory,
 								                phys_bits,
 								            )
 								            .map_err(Error::VcpuConfiguration)?;
-												vmm: Enable VCPU for AArch64

Added MPIDR which is needed in system configuration.

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-06-09 07:24:23 +00:00
+								        }
-												vmm: Move Vcpu::configure() to arch crate

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-28 07:27:22 +00:00
 								        #[cfg(target_arch = "x86_64")]
-												vmm, arch: Enable KVM HyperV support

Inject CPUID leaves for advertising KVM HyperV support when the
"kvm_hyperv" toggle is enabled. Currently we only enable a selection of
features required to boot.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-09-15 15:26:34 +00:00
+								        arch::configure_vcpu(
 								            &self.vcpu,
 								            self.id,
 								            kernel_entry_point,
 								            vm_memory,
 								            cpuid,
 								            kvm_hyperv,
-												vmm: cpu: Set CPU physical bits based on user input

If the user specified a maximum physical bits value through the
`max_phys_bits` option from `--cpus` parameter, the guest CPUID
will be patched accordingly to ensure the guest will find the
right amount of physical bits.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-10-13 08:22:44 +00:00
+								            phys_bits,
-												vmm, arch: Enable KVM HyperV support

Inject CPUID leaves for advertising KVM HyperV support when the
"kvm_hyperv" toggle is enabled. Currently we only enable a selection of
features required to boot.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-09-15 15:26:34 +00:00
+								        )
 								        .map_err(Error::VcpuConfiguration)?;
-												vmm: Move Vcpu::configure() to arch crate

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-28 07:27:22 +00:00
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								        Ok(())
 								    }
-												vmm: Enable VCPU for AArch64

Added MPIDR which is needed in system configuration.

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-06-09 07:24:23 +00:00
+								    /// Gets the MPIDR register value.
 								    #[cfg(target_arch = "aarch64")]
 								    pub fn get_mpidr(&self) -> u64 {
 								        // `mpidr` starts at 0 in `new()` and is overwritten with the value
 								        // returned by `arch::configure_vcpu` when `configure()` runs, so this
 								        // returns 0 for a vCPU that has not been configured yet.
 								        self.mpidr
 								    }
-												vmm: AArch64: add methods to get saved vCPU states

The construction of `GICR_TYPER` register will need vCPU states.
Therefore this commit adds methods to extract saved vCPU states
from the cpu manager.

Signed-off-by: Henry Wang <Henry.Wang@arm.com>

											
										
										
											2020-09-04 15:37:52 +00:00
+								    /// Gets the saved vCPU state.
 								    #[cfg(target_arch = "aarch64")]
 								    pub fn get_saved_state(&self) -> Option<CpuState> {
 								        // Returns an owned copy of the stored state, or `None` when no
 								        // state has been recorded on this vCPU.
 								        self.saved_state.as_ref().cloned()
 								    }
-												vmm: decouple vCPU init from `configure_vcpus`

Calling `KVM_GET_ONE_REG` before `KVM_VCPU_INIT` results in an
error: Exec format error (os error 8). This commit therefore
decouples the vCPU init process from `configure_vcpus`, so that
when restoring the vCPUs they can be initialized separately
before being started.

Signed-off-by: Henry Wang <Henry.Wang@arm.com>

											
										
										
											2020-09-06 02:23:39 +00:00
+								    /// Initializes an aarch64 specific vcpu for booting Linux.
 								    #[cfg(target_arch = "aarch64")]
 								    pub fn init(&self, vm: &Arc<dyn hypervisor::Vm>) -> Result<()> {
 								        // Begin with a default init structure and let the VM fill in the
 								        // target type the kernel prefers.
 								        let mut kvi = kvm_bindings::kvm_vcpu_init::default();
 								        vm.get_preferred_target(&mut kvi)
 								            .map_err(Error::VcpuArmPreferredTarget)?;

 								        // PSCI 0.2 is requested for every vCPU; support for the capability
 								        // has already been verified.
 								        kvi.features[0] |= 1 << kvm_bindings::KVM_ARM_VCPU_PSCI_0_2;

 								        // Every vCPU other than the boot one (id 0) starts powered off.
 								        let is_secondary = self.id > 0;
 								        if is_secondary {
 								            kvi.features[0] |= 1 << kvm_bindings::KVM_ARM_VCPU_POWER_OFF;
 								        }

 								        self.vcpu.vcpu_init(&kvi).map_err(Error::VcpuArmInit)
 								    }
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								    /// Runs the VCPU until it exits, returning the reason.
 								    ///
 								    /// Note that the state of the VCPU and associated VM must be setup first for this to do
 								    /// anything useful.
-												vmm: Handle hypervisor VCPU run result from Vcpu to VcpuManager

Now Vcpu::run() returns a boolean value to VcpuManager, indicating
whether the VM is going to reboot (false) or just continue (true).
Moving the handling of hypervisor VCPU run result from Vcpu to
VcpuManager gives us the flexibility to handle more scenarios like
shutting down on AArch64.

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-10-30 13:01:53 +00:00
+								    pub fn run(&self) -> std::result::Result<VmExit, HypervisorCpuError> {
 								        self.vcpu.run()
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								    }
 								}
-												vmm: cpu: Implement the Snapshottable trait

Implement the Snapshottable trait for Vcpu, and then implement it for
CpuManager. Note that CpuManager goes through the Snapshottable
implementation of Vcpu for every vCPU in order to implement the
Snapshottable trait for itself.

Signed-off-by: Yi Sun <yi.y.sun@linux.intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-18 15:44:41 +00:00
+								const VCPU_SNAPSHOT_ID: &str = "vcpu";
-												vmm: Implement Pausable trait for Vcpu

We want each Vcpu to store the vCPU state upon VM pausing. This is the
reason why we need to explicitly implement the Pausable trait for the
Vcpu structure.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-06-24 09:59:17 +00:00
+								impl Pausable for Vcpu {
 								    fn pause(&mut self) -> std::result::Result<(), MigratableError> {
-												vmm: Save and restore vCPU states during pause/resume operations

We need consistency between pause/resume and snapshot/restore
operations. The symmetrical behavior of pausing/snapshotting
and restoring/resuming has been introduced recently, and we must
now ensure that no matter if we're using pause/resume or
snapshot/restore features, the resulting VM should be running in
the exact same way.

That's why the vCPU state is now stored upon VM pausing. The snapshot
operation being a simple serialization of the previously saved state.
The same way, the vCPU state is now restored upon VM resuming. The
restore operation being a simple deserialization of the previously
restored state.

It's interesting to note that this patch ensures time consistency from a
guest perspective, no matter which clocksource is being used. From a
previous patch, the KVM clock was saved/restored upon VM pause/resume.
We now have the same behavior for TSC, as the TSC from the vCPUs are
saved/restored upon VM pause/resume too.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-06-24 11:55:18 +00:00
+								        self.saved_state =
-												vmm: cpu: Rename fd variable into something more meaningful

The fd naming is quite KVM specific. Since we're now using the
hypervisor crate abstractions, we can rename those into something more
readable and meaningful. Like e.g. vcpu or vm.

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-07-03 08:57:35 +00:00
+								            Some(self.vcpu.state().map_err(|e| {
-												vmm: Save and restore vCPU states during pause/resume operations

We need consistency between pause/resume and snapshot/restore
operations. The symmetrical behavior of pausing/snapshotting
and restoring/resuming has been introduced recently, and we must
now ensure that no matter if we're using pause/resume or
snapshot/restore features, the resulting VM should be running in
the exact same way.

That's why the vCPU state is now stored upon VM pausing. The snapshot
operation being a simple serialization of the previously saved state.
The same way, the vCPU state is now restored upon VM resuming. The
restore operation being a simple deserialization of the previously
restored state.

It's interesting to note that this patch ensures time consistency from a
guest perspective, no matter which clocksource is being used. From a
previous patch, the KVM clock was saved/restored upon VM pause/resume.
We now have the same behavior for TSC, as the TSC from the vCPUs are
saved/restored upon VM pause/resume too.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-06-24 11:55:18 +00:00
+								                MigratableError::Pause(anyhow!("Could not get vCPU state {:?}", e))
 								            })?);
-												vmm: Implement Pausable trait for Vcpu

We want each Vcpu to store the vCPU state upon VM pausing. This is the
reason why we need to explicitly implement the Pausable trait for the
Vcpu structure.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-06-24 09:59:17 +00:00
+								        Ok(())
 								    }
 								    fn resume(&mut self) -> std::result::Result<(), MigratableError> {
-												vmm: Save and restore vCPU states during pause/resume operations

We need consistency between pause/resume and snapshot/restore
operations. The symmetrical behavior of pausing/snapshotting
and restoring/resuming has been introduced recently, and we must
now ensure that no matter if we're using pause/resume or
snapshot/restore features, the resulting VM should be running in
the exact same way.

That's why the vCPU state is now stored upon VM pausing. The snapshot
operation being a simple serialization of the previously saved state.
The same way, the vCPU state is now restored upon VM resuming. The
restore operation being a simple deserialization of the previously
restored state.

It's interesting to note that this patch ensures time consistency from a
guest perspective, no matter which clocksource is being used. From a
previous patch, the KVM clock was saved/restored upon VM pause/resume.
We now have the same behavior for TSC, as the TSC from the vCPUs are
saved/restored upon VM pause/resume too.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-06-24 11:55:18 +00:00
+								        if let Some(vcpu_state) = &self.saved_state {
-												vmm: cpu: Rename fd variable into something more meaningful

The fd naming is quite KVM specific. Since we're now using the
hypervisor crate abstractions, we can rename those into something more
readable and meaningful. Like e.g. vcpu or vm.

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-07-03 08:57:35 +00:00
+								            self.vcpu.set_state(vcpu_state).map_err(|e| {
-												vmm: Save and restore vCPU states during pause/resume operations

We need consistency between pause/resume and snapshot/restore
operations. The symmetrical behavior of pausing/snapshotting
and restoring/resuming has been introduced recently, and we must
now ensure that no matter if we're using pause/resume or
snapshot/restore features, the resulting VM should be running in
the exact same way.

That's why the vCPU state is now stored upon VM pausing. The snapshot
operation being a simple serialization of the previously saved state.
The same way, the vCPU state is now restored upon VM resuming. The
restore operation being a simple deserialization of the previously
restored state.

It's interesting to note that this patch ensures time consistency from a
guest perspective, no matter which clocksource is being used. From a
previous patch, the KVM clock was saved/restored upon VM pause/resume.
We now have the same behavior for TSC, as the TSC from the vCPUs are
saved/restored upon VM pause/resume too.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-06-24 11:55:18 +00:00
+								                MigratableError::Pause(anyhow!("Could not set the vCPU state {:?}", e))
 								            })?;
 								        }
-												vmm: Implement Pausable trait for Vcpu

We want each Vcpu to store the vCPU state upon VM pausing. This is the
reason why we need to explicitly implement the Pausable trait for the
Vcpu structure.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-06-24 09:59:17 +00:00
+								        Ok(())
 								    }
 								}
-												vmm: cpu: Implement the Snapshottable trait

Implement the Snapshottable trait for Vcpu, and then implement it for
CpuManager. Note that CpuManager goes through the Snapshottable
implementation of Vcpu for every vCPU in order to implement the
Snapshottable trait for itself.

Signed-off-by: Yi Sun <yi.y.sun@linux.intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-18 15:44:41 +00:00
+								impl Snapshottable for Vcpu {
 								    fn id(&self) -> String {
 								        // The identifier is the shared vCPU snapshot constant, so it is
 								        // the same for every vCPU instance.
 								        String::from(VCPU_SNAPSHOT_ID)
 								    }
-												vm-migration: Make snapshot() mutable

There will be some cases where the implementation of the snapshot()
function from the Snapshottable trait will require to modify some
internal data, therefore we make this possible by updating the trait
definition with snapshot(&mut self).

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-08-21 12:31:58 +00:00
+								    fn snapshot(&mut self) -> std::result::Result<Snapshot, MigratableError> {
-												vmm: Save and restore vCPU states during pause/resume operations

We need consistency between pause/resume and snapshot/restore
operations. The symmetrical behavior of pausing/snapshotting
and restoring/resuming has been introduced recently, and we must
now ensure that no matter if we're using pause/resume or
snapshot/restore features, the resulting VM should be running in
the exact same way.

That's why the vCPU state is now stored upon VM pausing. The snapshot
operation being a simple serialization of the previously saved state.
The same way, the vCPU state is now restored upon VM resuming. The
restore operation being a simple deserialization of the previously
restored state.

It's interesting to note that this patch ensures time consistency from a
guest perspective, no matter which clocksource is being used. From a
previous patch, the KVM clock was saved/restored upon VM pause/resume.
We now have the same behavior for TSC, as the TSC from the vCPUs are
saved/restored upon VM pause/resume too.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-06-24 11:55:18 +00:00
+								        let snapshot = serde_json::to_vec(&self.saved_state)
 								            .map_err(|e| MigratableError::Snapshot(e.into()))?;
-												vmm: cpu: Implement the Snapshottable trait

Implement the Snapshottable trait for Vcpu, and then implement it for
CpuManager. Note that CpuManager goes through the Snapshottable
implementation of Vcpu for every vCPU in order to implement the
Snapshottable trait for itself.

Signed-off-by: Yi Sun <yi.y.sun@linux.intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-18 15:44:41 +00:00
 								        let mut vcpu_snapshot = Snapshot::new(&format!("{}", self.id));
 								        vcpu_snapshot.add_data_section(SnapshotDataSection {
 								            id: format!("{}-section", VCPU_SNAPSHOT_ID),
 								            snapshot,
 								        });
 								        Ok(vcpu_snapshot)
 								    }
 								    fn restore(&mut self, snapshot: Snapshot) -> std::result::Result<(), MigratableError> {
 								        if let Some(vcpu_section) = snapshot
 								            .snapshot_data
 								            .get(&format!("{}-section", VCPU_SNAPSHOT_ID))
 								        {
 								            let vcpu_state = match serde_json::from_slice(&vcpu_section.snapshot) {
 								                Ok(state) => state,
 								                Err(error) => {
 								                    return Err(MigratableError::Restore(anyhow!(
 								                        "Could not deserialize the vCPU snapshot {}",
 								                        error
 								                    )))
 								                }
 								            };
-												vmm: Save and restore vCPU states during pause/resume operations

We need consistency between pause/resume and snapshot/restore
operations. The symmetrical behavior of pausing/snapshotting
and restoring/resuming has been introduced recently, and we must
now ensure that no matter if we're using pause/resume or
snapshot/restore features, the resulting VM should be running in
the exact same way.

That's why the vCPU state is now stored upon VM pausing. The snapshot
operation being a simple serialization of the previously saved state.
The same way, the vCPU state is now restored upon VM resuming. The
restore operation being a simple deserialization of the previously
restored state.

It's interesting to note that this patch ensures time consistency from a
guest perspective, no matter which clocksource is being used. From a
previous patch, the KVM clock was saved/restored upon VM pause/resume.
We now have the same behavior for TSC, as the TSC from the vCPUs are
saved/restored upon VM pause/resume too.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-06-24 11:55:18 +00:00
+								            self.saved_state = Some(vcpu_state);
-												vmm: cpu: Implement the Snapshottable trait

Implement the Snapshottable trait for Vcpu, and then implement it for
CpuManager. Note that CpuManager goes through the Snapshottable
implementation of Vcpu for every vCPU in order to implement the
Snapshottable trait for itself.

Signed-off-by: Yi Sun <yi.y.sun@linux.intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-18 15:44:41 +00:00
 								            Ok(())
 								        } else {
 								            Err(MigratableError::Restore(anyhow!(
 								                "Could not find the vCPU snapshot section"
 								            )))
 								        }
 								    }
 								}
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								pub struct CpuManager {
-												vmm: cpu: Save CpusConfig into CpuManager

Rather than saving the individual parts into the CpuManager save the
full struct as it now also contains the topology data.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-06-16 10:52:07 +00:00
+								    config: CpusConfig,
-												build: Fixed build errors and warnings on AArch64

This is a preparing commit to build and test CH on AArch64. All building
issues were fixed, but no functionality was introduced.
For X86, the logic of code was not changed at all.
For ARM, the architecture specific part is still empty. And we applied
some tricks to workaround lint warnings. But such code will be replaced
later by other commits with real functionality.

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-12 09:49:12 +00:00
+								    #[cfg_attr(target_arch = "aarch64", allow(dead_code))]
-												devices: Refactor IOAPIC to cover other architectures

IOAPIC, a X86 specific interrupt controller, is referenced by device
manager and CPU manager. To work with more architectures, a common
type for all architectures is needed.
This commit introduces trait InterruptController to provide architecture
agnostic functions. Device manager and CPU manager can use it without
caring what the underlying device is.

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-25 08:27:08 +00:00
+								    interrupt_controller: Option<Arc<Mutex<dyn InterruptController>>>,
-												build: Fixed build errors and warnings on AArch64

This is a preparing commit to build and test CH on AArch64. All building
issues were fixed, but no functionality was introduced.
For X86, the logic of code was not changed at all.
For ARM, the architecture specific part is still empty. And we applied
some tricks to workaround lint warnings. But such code will be replaced
later by other commits with real functionality.

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-12 09:49:12 +00:00
+								    #[cfg_attr(target_arch = "aarch64", allow(dead_code))]
-												vmm: Move codebase to GuestMemoryAtomic from vm-memory

Relying on the latest vm-memory version, including the freshly
introduced structure GuestMemoryAtomic, this patch replaces every
occurrence of Arc<ArcSwap<GuestMemoryMmap>> with
GuestMemoryAtomic<GuestMemoryMmap>.

The point is to rely on the common RCU-like implementation from
vm-memory so that we don't have to do it from Cloud-Hypervisor.

Fixes #735

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-02-11 16:22:40 +00:00
+								    vm_memory: GuestMemoryAtomic<GuestMemoryMmap>,
-												build: Fixed build errors and warnings on AArch64

This is a preparing commit to build and test CH on AArch64. All building
issues were fixed, but no functionality was introduced.
For X86, the logic of code was not changed at all.
For ARM, the architecture specific part is still empty. And we applied
some tricks to workaround lint warnings. But such code will be replaced
later by other commits with real functionality.

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-12 09:49:12 +00:00
+								    #[cfg(target_arch = "x86_64")]
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								    cpuid: CpuId,
-												build: Fixed build errors and warnings on AArch64

This is a preparing commit to build and test CH on AArch64. All building
issues were fixed, but no functionality was introduced.
For X86, the logic of code was not changed at all.
For ARM, the architecture specific part is still empty. And we applied
some tricks to workaround lint warnings. But such code will be replaced
later by other commits with real functionality.

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-12 09:49:12 +00:00
+								    #[cfg_attr(target_arch = "aarch64", allow(dead_code))]
-												vmm: cpu: Rename fd variable into something more meaningful

The fd naming is quite KVM specific. Since we're now using the
hypervisor crate abstractions, we can rename those into something more
readable and meaningful. Like e.g. vcpu or vm.

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-07-03 08:57:35 +00:00
+								    vm: Arc<dyn hypervisor::Vm>,
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								    vcpus_kill_signalled: Arc<AtomicBool>,
 								    vcpus_pause_signalled: Arc<AtomicBool>,
-												vmm: Implement VM rebooting on AArch64

The logic to handle AArch64 system event was: SHUTDOWN and RESET were
all treated as RESET.

Now we handle them differently:
- RESET event will trigger Vmm::vm_reboot(),
- SHUTDOWN event will trigger Vmm::vm_shutdown().

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-10-30 13:34:16 +00:00
+								    exit_evt: EventFd,
-												build: Fixed build errors and warnings on AArch64

This is a preparing commit to build and test CH on AArch64. All building
issues were fixed, but no functionality was introduced.
For X86, the logic of code was not changed at all.
For ARM, the architecture specific part is still empty. And we applied
some tricks to workaround lint warnings. But such code will be replaced
later by other commits with real functionality.

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-12 09:49:12 +00:00
+								    #[cfg_attr(target_arch = "aarch64", allow(dead_code))]
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								    reset_evt: EventFd,
-												vmm: cpu: Encapsulate vCPU state into its own struct

Currently this just holds the thread handle but will be enlarged to
encompass details such as whether the vCPU is currently being inserted
or ejected.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 11:32:36 +00:00
+								    vcpu_states: Vec<VcpuState>,
-												vmm: cpu & acpi: Query CPU manager for CPU status

Rather than hardcode the CPU status for all the CPUs, instead query it from
the CPU manager via the I/O port that it is on, via the ACPI tables.

Each CPU device has a _STA method that calls into the CSTA method, which
reads and writes the I/O ports via the PRST field, which exposes the I/O
port through an OpRegion.

As we only support boot CPUs, report that all the CPUs are enabled for
now.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-20 14:06:37 +00:00
+								    selected_cpu: u8,
-												vmm: cpu: Track all Vcpus through CpuManager

In anticipation for the CpuManager to aggregate all Vcpu snapshots
together, this change makes sure the CpuManager has a handle onto
every vCPU.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-18 15:58:51 +00:00
+								    vcpus: Vec<Arc<Mutex<Vcpu>>>,
-												vmm: seccomp: Add seccomp filters for the vcpu worker thread

Partially fixes: #925

Signed-off-by: Bo Chen <chen.bo@intel.com>

											
										
										
											2020-09-09 22:15:26 +00:00
+								    seccomp_action: SeccompAction,
-												hypervisor, vmm: Remove shared ownership of VmmOps

This interface is used by the vCPU thread to delegate responsibility for
handling MMIO/PIO operations and to support different approaches than a
VM exit.

During profiling I found that we were spending 13.75% of the boot CPU
usage acquiring access to the object holding the VmmOps via
ArcSwap::load_full()

    13.75%     6.02%  vcpu0            cloud-hypervisor    [.] arc_swap::ArcSwapAny<T,S>::load_full
            |
            ---arc_swap::ArcSwapAny<T,S>::load_full
               |
                --13.43%--<hypervisor::kvm::KvmVcpu as hypervisor::cpu::Vcpu>::run
                          std::sys_common::backtrace::__rust_begin_short_backtrace
                          core::ops::function::FnOnce::call_once{{vtable-shim}}
                          std::sys::unix::thread::Thread::new::thread_start

However since the object implementing VmmOps does not need to be mutable
and it is only used from the vCPU side we can change the ownership to
being a simple Arc<> that is passed in when calling create_vcpu().

This completely removes the above CPU usage from subsequent profiles.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-11-18 16:37:52 +00:00
+								    vmmops: Arc<Box<dyn VmmOps>>,
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								}
-												vmm: cpu & acpi: Query CPU manager for CPU status

Rather than hardcode the CPU status for all the CPUs, instead query it from
the CPU manager via the I/O port that it is on, via the ACPI tables.

Each CPU device has a _STA method that calls into the CSTA method, which
reads and writes the I/O ports via the PRST field, which exposes the I/O
port through an OpRegion.

As we only support boot CPUs, report that all the CPUs are enabled for
now.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-20 14:06:37 +00:00
+								const CPU_ENABLE_FLAG: usize = 0;
-												vmm: cpu: Only do ACPI notify on newly added vCPUs

When we add a vCPU set an "inserting" boolean that is exposed as an ACPI
field that will be checked for and reset when the ACPI GED notification
for CPU devices happens.

This change is a precursor for CPU unplug.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:42:29 +00:00
+								const CPU_INSERTING_FLAG: usize = 1;
-												vmm: cpu: Notify guest OS that it should offline vCPUs

Allow the resizing of the number of vCPUs to less than the current
active vCPUs. This does not currently remove them from the system but
the kernel will take them offline.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-17 10:49:05 +00:00
+								const CPU_REMOVING_FLAG: usize = 2;
-												vmm: cpu: Implement CPU removal

When the running OS has been told that a CPU should be removed, it will
shut down the CPU and then signal to the hypervisor via the "_EJ0" method
on the device, which ultimately writes into an I/O port, that the vCPU
should be shut down. Upon notification the hypervisor signals to the
individual thread that it should shut down and waits for that thread to
end.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-17 11:22:33 +00:00
+								const CPU_EJECT_FLAG: usize = 3;
-												vmm: cpu & acpi: Query CPU manager for CPU status

Rather than hardcode the CPU status for all the CPUs, instead query it from
the CPU manager via the I/O port that it is on, via the ACPI tables.

Each CPU device has a _STA method that calls into the CSTA method, which
reads and writes the I/O ports via the PRST field, which exposes the I/O
port through an OpRegion.

As we only support boot CPUs, report that all the CPUs are enabled for
now.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-20 14:06:37 +00:00
 								const CPU_STATUS_OFFSET: u64 = 4;
 								const CPU_SELECTION_OFFSET: u64 = 0;
-												vmm: cpu: Add the CpuManager onto the IO bus

This allows the kernel (via ACPI based controls) to query and control
the CPU state.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 14:56:10 +00:00
+								impl BusDevice for CpuManager {
-												vmm: cpu & acpi: Query CPU manager for CPU status

Rather than hardcode the CPU status for all the CPUs, instead query it from
the CPU manager via the I/O port that it is on, via the ACPI tables.

Each CPU device has a _STA method that calls into the CSTA method, which
reads and writes the I/O ports via the PRST field, which exposes the I/O
port through an OpRegion.

As we only support boot CPUs, report that all the CPUs are enabled for
now.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-20 14:06:37 +00:00
+								    fn read(&mut self, _base: u64, offset: u64, data: &mut [u8]) {
 								        match offset {
 								            CPU_STATUS_OFFSET => {
-												vmm: cpu: Encapsulate vCPU state into its own struct

Currently this just holds the thread handle but will be enlarged to
encompass details such as whether the vCPU is currently being inserted
or ejected.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 11:32:36 +00:00
+								                if self.selected_cpu < self.present_vcpus() {
 								                    let state = &self.vcpu_states[usize::from(self.selected_cpu)];
 								                    if state.active() {
 								                        data[0] |= 1 << CPU_ENABLE_FLAG;
 								                    }
-												vmm: cpu: Only do ACPI notify on newly added vCPUs

When we add a vCPU set an "inserting" boolean that is exposed as an ACPI
field that will be checked for and reset when the ACPI GED notification
for CPU devices happens.

This change is a precursor for CPU unplug.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:42:29 +00:00
+								                    if state.inserting {
 								                        data[0] |= 1 << CPU_INSERTING_FLAG;
 								                    }
-												vmm: cpu: Notify guest OS that it should offline vCPUs

Allow the resizing of the number of vCPUs to less than the current
active vCPUs. This does not currently remove them from the system but
the kernel will take them offline.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-17 10:49:05 +00:00
+								                    if state.removing {
 								                        data[0] |= 1 << CPU_REMOVING_FLAG;
 								                    }
-												vmm: cpu: Encapsulate vCPU state into its own struct

Currently this just holds the thread handle but will be enlarged to
encompass details such as whether the vCPU is currently being inserted
or ejected.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 11:32:36 +00:00
+								                }
-												vmm: cpu & acpi: Query CPU manager for CPU status

Rather than hardcode the CPU status for all the CPUs instead query from
the CPU manager via the I/O port that is is on via the ACPI tables.

Each CPU device has a _STA method that calls into the CSTA method which
reads and writes the I/O ports via the PRST field which exposes the I/O
port through and OpRegion.

As we only support boot CPUS report that all the CPUs are enabled for
now.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-20 14:06:37 +00:00
+								            }
 								            _ => {
 								                warn!(
 								                    "Unexpected offset for accessing CPU manager device: {:#}",
 								                    offset
 								                );
 								            }
 								        }
 								    }
-												vmm: cpu: Add the CpuManager onto the IO bus

This allows the kernel (via ACPI based controls) to query and control
the CPU state.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 14:56:10 +00:00
-												vmm: cpu & acpi: Query CPU manager for CPU status

Rather than hardcode the CPU status for all the CPUs instead query from
the CPU manager via the I/O port that it is on via the ACPI tables.

Each CPU device has a _STA method that calls into the CSTA method which
reads and writes the I/O ports via the PRST field which exposes the I/O
port through an OpRegion.

As we only support boot CPUs, report that all the CPUs are enabled for
now.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-20 14:06:37 +00:00
+								    fn write(&mut self, _base: u64, offset: u64, data: &[u8]) {
 								        match offset {
 								            CPU_SELECTION_OFFSET => {
 								                self.selected_cpu = data[0];
 								            }
-												vmm: cpu: Only do ACPI notify on newly added vCPUs

When we add a vCPU set an "inserting" boolean that is exposed as an ACPI
field that will be checked for and reset when the ACPI GED notification
for CPU devices happens.

This change is a precursor for CPU unplug.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:42:29 +00:00
+								            CPU_STATUS_OFFSET => {
 								                let state = &mut self.vcpu_states[usize::from(self.selected_cpu)];
 								                // The ACPI code writes back a 1 to acknowledge the insertion
 								                if (data[0] & (1 << CPU_INSERTING_FLAG) == 1 << CPU_INSERTING_FLAG)
 								                    && state.inserting
 								                {
 								                    state.inserting = false;
 								                }
-												vmm: cpu: Notify guest OS that it should offline vCPUs

Allow the resizing of the number of vCPUs to less than the current
active vCPUs. This does not currently remove them from the system but
the kernel will take them offline.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-17 10:49:05 +00:00
+								                // Ditto for removal
 								                if (data[0] & (1 << CPU_REMOVING_FLAG) == 1 << CPU_REMOVING_FLAG) && state.removing
 								                {
 								                    state.removing = false;
 								                }
-												vmm: cpu: Implement CPU removal

When the running OS has been told that a CPU should be removed it will
shutdown the CPU and then signal to the hypervisor via the "_EJ0" method
on the device that ultimately writes into an I/O port than the vCPU
should be shutdown. Upon notification the hypervisor signals to the
individual thread that it should shutdown and waits for that thread to
end.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-17 11:22:33 +00:00
+								                // Trigger removal of vCPU
 								                if data[0] & (1 << CPU_EJECT_FLAG) == 1 << CPU_EJECT_FLAG {
 								                    if let Err(e) = self.remove_vcpu(self.selected_cpu) {
 								                        error!("Error removing vCPU: {:?}", e);
 								                    }
 								                }
-												vmm: cpu: Only do ACPI notify on newly added vCPUs

When we add a vCPU set an "inserting" boolean that is exposed as an ACPI
field that will be checked for and reset when the ACPI GED notification
for CPU devices happens.

This change is a precursor for CPU unplug.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:42:29 +00:00
+								            }
-												vmm: cpu & acpi: Query CPU manager for CPU status

Rather than hardcode the CPU status for all the CPUs instead query from
the CPU manager via the I/O port that is is on via the ACPI tables.

Each CPU device has a _STA method that calls into the CSTA method which
reads and writes the I/O ports via the PRST field which exposes the I/O
port through and OpRegion.

As we only support boot CPUS report that all the CPUs are enabled for
now.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-20 14:06:37 +00:00
+								            _ => {
 								                warn!(
 								                    "Unexpected offset for accessing CPU manager device: {:#}",
 								                    offset
 								                );
 								            }
 								        }
 								    }
-												vmm: cpu: Add the CpuManager onto the IO bus

This allows the kernel (via ACPI based controls) to query and control
the CPU state.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 14:56:10 +00:00
+								}
-												vmm: cpu: Create vCPU state for all possible vCPUs

This will make it more straightforward when we attempt to remove vCPUs.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 17:15:25 +00:00
/// Bookkeeping the CPU manager keeps for one vCPU slot.
///
/// A slot exists for every possible vCPU, not just the running ones; the
/// default value describes a slot with no thread attached.
#[derive(Default)]
struct VcpuState {
    /// Set when the vCPU is added; exposed to the guest as an ACPI field
    /// and cleared once the guest acknowledges the insertion.
    inserting: bool,
    /// Set when the guest has been asked to take the vCPU offline; cleared
    /// once the guest acknowledges the removal.
    removing: bool,
    /// Join handle of the vCPU thread; `None` while the slot is inactive.
    handle: Option<thread::JoinHandle<()>>,
    /// Per-vCPU shutdown request flag, added with vCPU removal.
    /// NOTE(review): presumably polled by the vCPU thread - confirm against
    /// the run loop.
    kill: Arc<AtomicBool>,
    /// Set once the vCPU run has been interrupted by a signal; used to
    /// decide whether the signal needs to be sent again.
    vcpu_run_interrupted: Arc<AtomicBool>,
}
 								impl VcpuState {
 								    fn active(&self) -> bool {
 								        self.handle.is_some()
 								    }
 								    fn signal_thread(&self) {
 								        if let Some(handle) = self.handle.as_ref() {
-												vmm: cpu: Retry sending signals if necessary

To avoid a race condition where the signal might "miss" the KVM_RUN
ioctl() instead reapeatedly try sending a signal until the vCPU run is
interrupted (as indicated by setting a new per vCPU atomic.)

It important to also clear this atomic when coming out of a paused
state.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-05-06 10:34:19 +00:00
+								            loop {
 								                unsafe {
 								                    libc::pthread_kill(handle.as_pthread_t() as _, SIGRTMIN());
 								                }
 								                if self.vcpu_run_interrupted.load(Ordering::SeqCst) {
 								                    break;
 								                } else {
 								                    // This is more effective than thread::yield_now() at
 								                    // avoiding a priority inversion with the vCPU thread
 								                    thread::sleep(std::time::Duration::from_millis(1));
 								                }
-												vmm: cpu: Encapsulate vCPU state into its own struct

Currently this just holds the thread handle but will be enlarged to
encompass details such as whether the vCPU is currently being inserted
or ejected.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 11:32:36 +00:00
+								            }
 								        }
 								    }
 								    fn join_thread(&mut self) -> Result<()> {
 								        if let Some(handle) = self.handle.take() {
-												vmm: Fix map_err losing the inner error

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-01-24 08:34:51 +00:00
+								            handle.join().map_err(Error::ThreadCleanup)?
-												vmm: cpu: Encapsulate vCPU state into its own struct

Currently this just holds the thread handle but will be enlarged to
encompass details such as whether the vCPU is currently being inserted
or ejected.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 11:32:36 +00:00
+								        }
 								        Ok(())
 								    }
 								    fn unpark_thread(&self) {
 								        if let Some(handle) = self.handle.as_ref() {
 								            handle.thread().unpark()
 								        }
 								    }
 								}
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								impl CpuManager {
-												hypervisor, arch: Fix warnings introduced in hypervisor crate

This commit fixes some warnings introduced in the previous
hypervisor crate PR. It also removes some unused variables from the
arch/aarch64 module.

Signed-off-by: Muminul Islam <muislam@microsoft.com>

											
										
										
											2020-06-22 19:38:23 +00:00
+								    #[allow(unused_variables)]
-												vmm: Implement VM rebooting on AArch64

The logic to handle AArch64 system event was: SHUTDOWN and RESET were
all treated as RESET.

Now we handle them differently:
- RESET event will trigger Vmm::vm_reboot(),
- SHUTDOWN event will trigger Vmm::vm_shutdown().

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-10-30 13:34:16 +00:00
+								    #[allow(clippy::too_many_arguments)]
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								    pub fn new(
-												vmm: cpu: Pass CpusConfig to simplify the new() prototype

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-03-16 17:14:15 +00:00
+								        config: &CpusConfig,
-												vmm: Move DeviceManager into an Arc<Mutex<>>

In anticipation of the support for device hotplug, this commit moves the
DeviceManager object into an Arc<Mutex<>> when the DeviceManager is
being created. The reason is, we need the DeviceManager to implement the
BusDevice trait and then provide it to the IO bus, so that IO accesses
related to device hotplug can be handled correctly.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-02-27 09:29:03 +00:00
+								        device_manager: &Arc<Mutex<DeviceManager>>,
-												vmm: Pass MemoryManager through CpuManager creation

Instead of passing the GuestMemoryMmap directly to the CpuManager upon
its creation, it's better to pass a reference to the MemoryManager. This
way we will be able to know if SGX EPC region along with one or multiple
sections are present.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-07-08 13:12:27 +00:00
+								        memory_manager: &Arc<Mutex<MemoryManager>>,
-												vmm: cpu: Rename fd variable into something more meaningful

The fd naming is quite KVM specific. Since we're now using the
hypervisor crate abstractions, we can rename those into something more
readable and meaningful. Like e.g. vcpu or vm.

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-07-03 08:57:35 +00:00
+								        vm: Arc<dyn hypervisor::Vm>,
-												vmm: Implement VM rebooting on AArch64

The logic to handle AArch64 system event was: SHUTDOWN and RESET were
all treated as RESET.

Now we handle them differently:
- RESET event will trigger Vmm::vm_reboot(),
- SHUTDOWN event will trigger Vmm::vm_shutdown().

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-10-30 13:34:16 +00:00
+								        exit_evt: EventFd,
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								        reset_evt: EventFd,
-												arch, pci, vmm: Initial switch to the hypervisor crate

Start moving the vmm, arch and pci crates to being hypervisor agnostic
by using the hypervisor trait and abstractions. This is not a complete
switch and there are still some remaining KVM dependencies.

Signed-off-by: Muminul Islam <muislam@microsoft.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-06-02 02:29:54 +00:00
+								        hypervisor: Arc<dyn hypervisor::Hypervisor>,
-												vmm: seccomp: Add seccomp filters for the vcpu worker thread

Partially fixes: #925

Signed-off-by: Bo Chen <chen.bo@intel.com>

											
										
										
											2020-09-09 22:15:26 +00:00
+								        seccomp_action: SeccompAction,
-												hypervisor, vmm: Remove shared ownership of VmmOps

This interface is used by the vCPU thread to delegate responsibility for
handling MMIO/PIO operations and to support different approaches than a
VM exit.

During profiling I found that we were spending 13.75% of the boot CPU
uage acquiring access to the object holding the VmmOps via
ArcSwap::load_full()

    13.75%     6.02%  vcpu0            cloud-hypervisor    [.] arc_swap::ArcSwapAny<T,S>::load_full
            |
            ---arc_swap::ArcSwapAny<T,S>::load_full
               |
                --13.43%--<hypervisor::kvm::KvmVcpu as hypervisor::cpu::Vcpu>::run
                          std::sys_common::backtrace::__rust_begin_short_backtrace
                          core::ops::function::FnOnce::call_once{{vtable-shim}}
                          std::sys::unix::thread::Thread::new::thread_start

However since the object implementing VmmOps does not need to be mutable
and it is only used from the vCPU side we can change the ownership to
being a simple Arc<> that is passed in when calling create_vcpu().

This completely removes the above CPU usage from subsequent profiles.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-11-18 16:37:52 +00:00
+								        vmmops: Arc<Box<dyn VmmOps>>,
-												vmm: cpu: Add the CpuManager onto the IO bus

This allows the kernel (via ACPI based controls) to query and control
the CPU state.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 14:56:10 +00:00
+								    ) -> Result<Arc<Mutex<CpuManager>>> {
-												vmm: Pass MemoryManager through CpuManager creation

Instead of passing the GuestMemoryMmap directly to the CpuManager upon
its creation, it's better to pass a reference to the MemoryManager. This
way we will be able to know if SGX EPC region along with one or multiple
sections are present.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-07-08 13:12:27 +00:00
+								        let guest_memory = memory_manager.lock().unwrap().guest_memory();
-												vmm: cpu: Pass CpusConfig to simplify the new() prototype

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-03-16 17:14:15 +00:00
+								        let mut vcpu_states = Vec::with_capacity(usize::from(config.max_vcpus));
 								        vcpu_states.resize_with(usize::from(config.max_vcpus), VcpuState::default);
-												vmm: cpu: Create vCPU state for all possible vCPUs

This will make it more straightforward when we attempt to remove vCPUs.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 17:15:25 +00:00
-												build: Fixed build errors and warnings on AArch64

This is a preparing commit to build and test CH on AArch64. All building
issues were fixed, but no functionality was introduced.
For X86, the logic of code was not changed at all.
For ARM, the architecture specific part is still empty. And we applied
some tricks to workaround lint warnings. But such code will be replaced
later by other commits with real functionality.

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-12 09:49:12 +00:00
+								        #[cfg(target_arch = "x86_64")]
-												arch, hypervisor, vmm: Patch CPUID subleaves to expose EPC sections

The support for SGX is exposed to the guest through CPUID 0x12. KVM
passes static subleaves 0 and 1 from the host to the guest, without
needing any modification from the VMM itself.

But SGX also relies on dynamic subleaves 2 through N, used for
describing each EPC section. This is not handled by KVM, which means
the VMM is in charge of setting each subleaf starting from index 2
up to index N, depending on the number of EPC sections.

These subleaves 2 through N are not listed as part of the supported
CPUID entries from KVM. But it's important to set them as long as index
0 and 1 are present and indicate that SGX is supported.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-07-08 14:58:10 +00:00
+								        let sgx_epc_sections =
 								            if let Some(sgx_epc_region) = memory_manager.lock().unwrap().sgx_epc_region() {
 								                Some(sgx_epc_region.epc_sections().clone())
 								            } else {
 								                None
 								            };
 								        #[cfg(target_arch = "x86_64")]
 								        let cpuid = CpuManager::patch_cpuid(hypervisor, &config.topology, sgx_epc_sections)?;
 								        let device_manager = device_manager.lock().unwrap();
-												vmm: Encase CpuManager within an Arc<Mutex<>>

This is necessary to be able to add the CpuManager onto the IO bus.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 14:31:11 +00:00
+								        let cpu_manager = Arc::new(Mutex::new(CpuManager {
-												vmm: cpu: Save CpusConfig into CpuManager

Rather than saving the individual parts into the CpuManager save the
full struct as it now also contains the topology data.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-06-16 10:52:07 +00:00
+								            config: config.clone(),
-												devices: Refactor IOAPIC to cover other architectures

IOAPIC, a X86 specific interrupt controller, is referenced by device
manager and CPU manager. To work with more architectures, a common
type for all architectures is needed.
This commit introduces trait InterruptController to provide architecture
agnostic functions. Device manager and CPU manager can use it without
caring what the underlying device is.

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-25 08:27:08 +00:00
+								            interrupt_controller: device_manager.interrupt_controller().clone(),
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								            vm_memory: guest_memory,
-												build: Fixed build errors and warnings on AArch64

This is a preparing commit to build and test CH on AArch64. All building
issues were fixed, but no functionality was introduced.
For X86, the logic of code was not changed at all.
For ARM, the architecture specific part is still empty. And we applied
some tricks to workaround lint warnings. But such code will be replaced
later by other commits with real functionality.

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-12 09:49:12 +00:00
+								            #[cfg(target_arch = "x86_64")]
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								            cpuid,
-												vmm: cpu: Rename fd variable into something more meaningful

The fd naming is quite KVM specific. Since we're now using the
hypervisor crate abstractions, we can rename those into something more
readable and meaningful. Like e.g. vcpu or vm.

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-07-03 08:57:35 +00:00
+								            vm,
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								            vcpus_kill_signalled: Arc::new(AtomicBool::new(false)),
 								            vcpus_pause_signalled: Arc::new(AtomicBool::new(false)),
-												vmm: cpu: Create vCPU state for all possible vCPUs

This will make it more straightforward when we attempt to remove vCPUs.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 17:15:25 +00:00
+								            vcpu_states,
-												vmm: Implement VM rebooting on AArch64

The logic to handle AArch64 system event was: SHUTDOWN and RESET were
all treated as RESET.

Now we handle them differently:
- RESET event will trigger Vmm::vm_reboot(),
- SHUTDOWN event will trigger Vmm::vm_shutdown().

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-10-30 13:34:16 +00:00
+								            exit_evt,
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								            reset_evt,
-												vmm: cpu & acpi: Query CPU manager for CPU status

Rather than hardcode the CPU status for all the CPUs instead query from
the CPU manager via the I/O port that is is on via the ACPI tables.

Each CPU device has a _STA method that calls into the CSTA method which
reads and writes the I/O ports via the PRST field which exposes the I/O
port through and OpRegion.

As we only support boot CPUS report that all the CPUs are enabled for
now.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-20 14:06:37 +00:00
+								            selected_cpu: 0,
-												vmm: cpu: Track all Vcpus through CpuManager

In anticipation for the CpuManager to aggregate all Vcpu snapshots
together, this change makes sure the CpuManager has a handle onto
every vCPU.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-18 15:58:51 +00:00
+								            vcpus: Vec::with_capacity(usize::from(config.max_vcpus)),
-												vmm: seccomp: Add seccomp filters for the vcpu worker thread

Partially fixes: #925

Signed-off-by: Bo Chen <chen.bo@intel.com>

											
										
										
											2020-09-09 22:15:26 +00:00
+								            seccomp_action,
-												hypervisor, vmm: Remove shared ownership of VmmOps

This interface is used by the vCPU thread to delegate responsibility for
handling MMIO/PIO operations and to support different approaches than a
VM exit.

During profiling I found that we were spending 13.75% of the boot CPU
uage acquiring access to the object holding the VmmOps via
ArcSwap::load_full()

    13.75%     6.02%  vcpu0            cloud-hypervisor    [.] arc_swap::ArcSwapAny<T,S>::load_full
            |
            ---arc_swap::ArcSwapAny<T,S>::load_full
               |
                --13.43%--<hypervisor::kvm::KvmVcpu as hypervisor::cpu::Vcpu>::run
                          std::sys_common::backtrace::__rust_begin_short_backtrace
                          core::ops::function::FnOnce::call_once{{vtable-shim}}
                          std::sys::unix::thread::Thread::new::thread_start

However since the object implementing VmmOps does not need to be mutable
and it is only used from the vCPU side we can change the ownership to
being a simple Arc<> that is passed in when calling create_vcpu().

This completely removes the above CPU usage from subsequent profiles.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-11-18 16:37:52 +00:00
+								            vmmops,
-												vmm: Encase CpuManager within an Arc<Mutex<>>

This is necessary to be able to add the CpuManager onto the IO bus.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 14:31:11 +00:00
+								        }));
-												vmm: Enable memory manager for AArch64

Screened IO space as it is not available on AArch64.

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-06-09 06:54:15 +00:00
+								        #[cfg(target_arch = "x86_64")]
-												Revert "vmm: Move CpuManager device to MMIO region"

This reverts commit 980e03fa0ab3d217fe91fd60d8459507c903d88b.

											
										
										
											2020-01-24 10:36:39 +00:00
+								        device_manager
 								            .allocator()
 								            .lock()
 								            .unwrap()
 								            .allocate_io_addresses(Some(GuestAddress(0x0cd8)), 0x8, None)
 								            .ok_or(Error::AllocateIOPort)?;
-												vmm: Enable device manager for AArch64

Screened IO bus because it is not for AArch64.
Enabled Serial, RTC and Virtio devices with MMIO transport option.

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-06-09 06:17:42 +00:00
+								        #[cfg(target_arch = "x86_64")]
-												hypervisor, vmm: Introduce VmmOps trait

Run loop in hypervisor needs a callback mechanism to access resources
like guest memory, mmio, pio etc.

VmmOps trait is introduced here, which is implemented by vmm module.
While handling vcpuexits in run loop, this trait allows hypervisor
module access to the above mentioned resources via callbacks.

Signed-off-by: Praveen Paladugu <prapal@microsoft.com>
Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-09-03 20:50:56 +00:00
+								        device_manager
 								            .io_bus()
-												Revert "vmm: Move CpuManager device to MMIO region"

This reverts commit 980e03fa0ab3d217fe91fd60d8459507c903d88b.

											
										
										
											2020-01-24 10:36:39 +00:00
+								            .insert(cpu_manager.clone(), 0x0cd8, 0xc)
-												vmm: cpu: Add the CpuManager onto the IO bus

This allows the kernel (via ACPI based controls) to query and control
the CPU state.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 14:56:10 +00:00
+								            .map_err(Error::BusError)?;
 								        Ok(cpu_manager)
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								    }
-												build: Fixed build errors and warnings on AArch64

This is a preparatory commit for building and testing CH on AArch64. All
build issues were fixed, but no functionality was introduced.
For X86, the code logic was not changed at all.
For ARM, the architecture-specific part is still empty, and we applied
some tricks to work around lint warnings. Such code will be replaced
later by other commits with real functionality.

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-12 09:49:12 +00:00
+								    #[cfg(target_arch = "x86_64")]
-												arch, pci, vmm: Initial switch to the hypervisor crate

Start moving the vmm, arch and pci crates to being hypervisor agnostic
by using the hypervisor trait and abstractions. This is not a complete
switch and there are still some remaining KVM dependencies.

Signed-off-by: Muminul Islam <muislam@microsoft.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-06-02 02:29:54 +00:00
+								    fn patch_cpuid(
 								        hypervisor: Arc<dyn hypervisor::Hypervisor>,
 								        topology: &Option<CpuTopology>,
-												arch, hypervisor, vmm: Patch CPUID subleaves to expose EPC sections

The support for SGX is exposed to the guest through CPUID 0x12. KVM
passes static subleaves 0 and 1 from the host to the guest, without
needing any modification from the VMM itself.

But SGX also relies on dynamic subleaves 2 through N, used for
describing each EPC section. This is not handled by KVM, which means
the VMM is in charge of setting each subleaf starting from index 2
up to index N, depending on the number of EPC sections.

These subleaves 2 through N are not listed as part of the supported
CPUID entries from KVM. But it's important to set them as long as index
0 and 1 are present and indicate that SGX is supported.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-07-08 14:58:10 +00:00
+								        sgx_epc_sections: Option<Vec<SgxEpcSection>>,
-												arch, pci, vmm: Initial switch to the hypervisor crate

Start moving the vmm, arch and pci crates to being hypervisor agnostic
by using the hypervisor trait and abstractions. This is not a complete
switch and there are still some remaining KVM dependencies.

Signed-off-by: Muminul Islam <muislam@microsoft.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-06-02 02:29:54 +00:00
+								    ) -> Result<CpuId> {
-												vmm: cpu: Move CPUID patching to CpuManager

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-03-16 15:15:38 +00:00
+								        let mut cpuid_patches = Vec::new();
 								        // Patch tsc deadline timer bit
 								        cpuid_patches.push(CpuidPatch {
 								            function: 1,
 								            index: 0,
 								            flags_bit: None,
 								            eax_bit: None,
 								            ebx_bit: None,
 								            ecx_bit: Some(TSC_DEADLINE_TIMER_ECX_BIT),
 								            edx_bit: None,
 								        });
 								        // Patch hypervisor bit
 								        cpuid_patches.push(CpuidPatch {
 								            function: 1,
 								            index: 0,
 								            flags_bit: None,
 								            eax_bit: None,
 								            ebx_bit: None,
 								            ecx_bit: Some(HYPERVISOR_ECX_BIT),
 								            edx_bit: None,
 								        });
-												vmm: cpu: x86: Enable MTRR feature in CPUID

The MTRR feature was missing from the CPUID, which is causing the guest
to ignore the MTRR settings exposed through dedicated MSRs.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-09-25 12:19:03 +00:00
+								        // Enable MTRR feature
 								        cpuid_patches.push(CpuidPatch {
 								            function: 1,
 								            index: 0,
 								            flags_bit: None,
 								            eax_bit: None,
 								            ebx_bit: None,
 								            ecx_bit: None,
 								            edx_bit: Some(MTRR_EDX_BIT),
 								        });
-												vmm: cpu: Move CPUID patching to CpuManager

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-03-16 15:15:38 +00:00
+								        // Supported CPUID
-												arch, pci, vmm: Initial switch to the hypervisor crate

Start moving the vmm, arch and pci crates to being hypervisor agnostic
by using the hypervisor trait and abstractions. This is not a complete
switch and there are still some remaining KVM dependencies.

Signed-off-by: Muminul Islam <muislam@microsoft.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-06-02 02:29:54 +00:00
+								        let mut cpuid = hypervisor
 								            .get_cpuid()
 								            .map_err(|e| Error::PatchCpuId(e.into()))?;
-												vmm: cpu: Move CPUID patching to CpuManager

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-03-16 15:15:38 +00:00
 								        CpuidPatch::patch_cpuid(&mut cpuid, cpuid_patches);
-												vmm, arch: x86_64: Fill the CPUID leaves with the topology

There are two CPUID leaves for handling CPU topology, 0xb and 0x1f. The
difference between the two is that the 0x1f leaf (Extended Topology
Leaf) supports exposing multiple die packages.

Fixes: #1284

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-06-16 13:48:37 +00:00
+								        if let Some(t) = topology {
 								            arch::x86_64::update_cpuid_topology(
 								                &mut cpuid,
 								                t.threads_per_core,
 								                t.cores_per_die,
 								                t.dies_per_package,
 								            );
 								        }
-												arch, hypervisor, vmm: Patch CPUID subleaves to expose EPC sections

The support for SGX is exposed to the guest through CPUID 0x12. KVM
passes static subleaves 0 and 1 from the host to the guest, without
needing any modification from the VMM itself.

But SGX also relies on dynamic subleaves 2 through N, used for
describing each EPC section. This is not handled by KVM, which means
the VMM is in charge of setting each subleaf starting from index 2
up to index N, depending on the number of EPC sections.

These subleaves 2 through N are not listed as part of the supported
CPUID entries from KVM. But it's important to set them as long as index
0 and 1 are present and indicate that SGX is supported.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-07-08 14:58:10 +00:00
+								        if let Some(sgx_epc_sections) = sgx_epc_sections {
 								            arch::x86_64::update_cpuid_sgx(&mut cpuid, sgx_epc_sections).unwrap();
 								        }
-												vmm: cpu: Move CPUID patching to CpuManager

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-03-16 15:15:38 +00:00
+								        Ok(cpuid)
 								    }
-												vmm: Change booting process to cover AArch64 requirements

Between X86 and AArch64, there is some difference in booting a VM:
- X86_64 can setup IOAPIC before creating any VCPU.
- AArch64 has to create VCPUs before creating the GIC.

The old process is:
1. load_kernel()
    load kernel binary
    configure system
2. activate_vcpus()
    create & start VCPU's

So we need to separate "activate_vcpus" into "create_vcpus" and
"activate_vcpus" (to start vcpus only). Setup GIC and create FDT
between the 2 steps.

The new procedure is:
1. load_kernel()
    load kernel binary
    (X86_64) configure system
2. create VCPU's
3. (AArch64) setup GIC
4. (AArch64) configure system
5. start VCPU's

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-26 07:20:22 +00:00
+								    fn create_vcpu(
-												vmm: cpu: Factorize vcpu starting code

Anticipating the need for a slightly different function for restoring
vCPUs, this patch factorizes most of the vCPU creation, so that it can
be reused for migration purposes.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-04-03 12:27:41 +00:00
+								        &mut self,
 								        cpu_id: u8,
 								        entry_point: Option<EntryPoint>,
-												vmm: cpu: Implement the Snapshottable trait

Implement the Snapshottable trait for Vcpu, and then implement it for
CpuManager. Note that CpuManager goes through the Snapshottable
implementation of Vcpu for every vCPU in order to implement the
Snapshottable trait for itself.

Signed-off-by: Yi Sun <yi.y.sun@linux.intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-18 15:44:41 +00:00
+								        snapshot: Option<Snapshot>,
-												vmm: Change booting process to cover AArch64 requirements

Between X86 and AArch64, there is some difference in booting a VM:
- X86_64 can setup IOAPIC before creating any VCPU.
- AArch64 has to create VCPUs before creating the GIC.

The old process is:
1. load_kernel()
    load kernel binary
    configure system
2. activate_vcpus()
    create & start VCPU's

So we need to separate "activate_vcpus" into "create_vcpus" and
"activate_vcpus" (to start vcpus only). Setup GIC and create FDT
between the 2 steps.

The new procedure is:
1. load_kernel()
    load kernel binary
    (X86_64) configure system
2. create VCPU's
3. (AArch64) setup GIC
4. (AArch64) configure system
5. start VCPU's

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-26 07:20:22 +00:00
+								    ) -> Result<Arc<Mutex<Vcpu>>> {
-												vmm: cpu: Add info!() level debugging to vCPU handling

These messages are intended to be useful to support debugging related to
vCPU hotplug/unplug issues.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-06-23 12:11:00 +00:00
+								        info!("Creating vCPU: cpu_id = {}", cpu_id);
-												hypervisor, vmm: Remove shared ownership of VmmOps

This interface is used by the vCPU thread to delegate responsibility for
handling MMIO/PIO operations and to support different approaches than a
VM exit.

During profiling I found that we were spending 13.75% of the boot CPU
usage acquiring access to the object holding the VmmOps via
ArcSwap::load_full()

    13.75%     6.02%  vcpu0            cloud-hypervisor    [.] arc_swap::ArcSwapAny<T,S>::load_full
            |
            ---arc_swap::ArcSwapAny<T,S>::load_full
               |
                --13.43%--<hypervisor::kvm::KvmVcpu as hypervisor::cpu::Vcpu>::run
                          std::sys_common::backtrace::__rust_begin_short_backtrace
                          core::ops::function::FnOnce::call_once{{vtable-shim}}
                          std::sys::unix::thread::Thread::new::thread_start

However since the object implementing VmmOps does not need to be mutable
and it is only used from the vCPU side we can change the ownership to
being a simple Arc<> that is passed in when calling create_vcpu().

This completely removes the above CPU usage from subsequent profiles.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-11-18 16:37:52 +00:00
+								        let vcpu = Vcpu::new(cpu_id, &self.vm, Some(self.vmmops.clone()))?;
-												vmm: cpu: Factorize vcpu starting code

Anticipating the need for a slightly different function for restoring
vCPUs, this patch factorizes most of the vCPU creation, so that it can
be reused for migration purposes.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-04-03 12:27:41 +00:00
-												vmm: cpu: Implement the Snapshottable trait

Implement the Snapshottable trait for Vcpu, and then implement it for
CpuManager. Note that CpuManager goes through the Snapshottable
implementation of Vcpu for every vCPU in order to implement the
Snapshottable trait for itself.

Signed-off-by: Yi Sun <yi.y.sun@linux.intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-18 15:44:41 +00:00
+								        if let Some(snapshot) = snapshot {
-												vmm: refactor vCPU save/restore code in restoring VM

As in the VM boot process, on AArch64 systems the vCPUs should be
created before the GIC is created. This commit refactors the vCPU
save/restore code to achieve the above-mentioned restore order.

Signed-off-by: Henry Wang <Henry.Wang@arm.com>

											
										
										
											2020-09-04 10:56:30 +00:00
+								            // AArch64 vCPUs should be initialized after created.
 								            #[cfg(target_arch = "aarch64")]
 								            vcpu.lock().unwrap().init(&self.vm)?;
-												vmm: cpu: Implement the Snapshottable trait

Implement the Snapshottable trait for Vcpu, and then implement it for
CpuManager. Note that CpuManager goes through the Snapshottable
implementation of Vcpu for every vCPU in order to implement the
Snapshottable trait for itself.

Signed-off-by: Yi Sun <yi.y.sun@linux.intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-18 15:44:41 +00:00
+								            vcpu.lock()
 								                .unwrap()
 								                .restore(snapshot)
 								                .expect("Failed to restore vCPU");
 								        } else {
 								            let vm_memory = self.vm_memory.clone();
-												vmm: cpu: Set CPU physical bits based on user input

If the user specified a maximum physical bits value through the
`max_phys_bits` option from `--cpus` parameter, the guest CPUID
will be patched accordingly to ensure the guest will find the
right amount of physical bits.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-10-13 08:22:44 +00:00
+								            let phys_bits = physical_bits(self.config.max_phys_bits);
-												vmm: Change booting process to cover AArch64 requirements

Between X86 and AArch64, there is some difference in booting a VM:
- X86_64 can setup IOAPIC before creating any VCPU.
- AArch64 has to create VCPUs before creating the GIC.

The old process is:
1. load_kernel()
    load kernel binary
    configure system
2. activate_vcpus()
    create & start VCPU's

So we need to separate "activate_vcpus" into "create_vcpus" and
"activate_vcpus" (to start vcpus only). Setup GIC and create FDT
between the 2 steps.

The new procedure is:
1. load_kernel()
    load kernel binary
    (X86_64) configure system
2. create VCPU's
3. (AArch64) setup GIC
4. (AArch64) configure system
5. start VCPU's

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-26 07:20:22 +00:00
+								            #[cfg(target_arch = "x86_64")]
-												vmm: cpu: Implement the Snapshottable trait

Implement the Snapshottable trait for Vcpu, and then implement it for
CpuManager. Note that CpuManager goes through the Snapshottable
implementation of Vcpu for every vCPU in order to implement the
Snapshottable trait for itself.

Signed-off-by: Yi Sun <yi.y.sun@linux.intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-18 15:44:41 +00:00
+								            vcpu.lock()
 								                .unwrap()
-												vmm, arch: Enable KVM HyperV support

Inject CPUID leaves for advertising KVM HyperV support when the
"kvm_hyperv" toggle is enabled. Currently we only enable a selection of
features required to boot.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-09-15 15:26:34 +00:00
+								                .configure(
 								                    entry_point,
 								                    &vm_memory,
 								                    self.cpuid.clone(),
 								                    self.config.kvm_hyperv,
-												vmm: cpu: Set CPU physical bits based on user input

If the user specified a maximum physical bits value through the
`max_phys_bits` option from `--cpus` parameter, the guest CPUID
will be patched accordingly to ensure the guest will find the
right amount of physical bits.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-10-13 08:22:44 +00:00
+								                    phys_bits,
-												vmm, arch: Enable KVM HyperV support

Inject CPUID leaves for advertising KVM HyperV support when the
"kvm_hyperv" toggle is enabled. Currently we only enable a selection of
features required to boot.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-09-15 15:26:34 +00:00
+								                )
-												vmm: cpu: Implement the Snapshottable trait

Implement the Snapshottable trait for Vcpu, and then implement it for
CpuManager. Note that CpuManager goes through the Snapshottable
implementation of Vcpu for every vCPU in order to implement the
Snapshottable trait for itself.

Signed-off-by: Yi Sun <yi.y.sun@linux.intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-18 15:44:41 +00:00
+								                .expect("Failed to configure vCPU");
-												vmm: Change booting process to cover AArch64 requirements

Between X86 and AArch64, there is some difference in booting a VM:
- X86_64 can setup IOAPIC before creating any VCPU.
- AArch64 has to create VCPUs before creating the GIC.

The old process is:
1. load_kernel()
    load kernel binary
    configure system
2. activate_vcpus()
    create & start VCPU's

So we need to separate "activate_vcpus" into "create_vcpus" and
"activate_vcpus" (to start vcpus only). Setup GIC and create FDT
between the 2 steps.

The new procedure is:
1. load_kernel()
    load kernel binary
    (X86_64) configure system
2. create VCPU's
3. (AArch64) setup GIC
4. (AArch64) configure system
5. start VCPU's

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-26 07:20:22 +00:00
 								            #[cfg(target_arch = "aarch64")]
 								            vcpu.lock()
 								                .unwrap()
-												vmm: cpu: Set CPU physical bits based on user input

If the user specified a maximum physical bits value through the
`max_phys_bits` option from `--cpus` parameter, the guest CPUID
will be patched accordingly to ensure the guest will find the
right amount of physical bits.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-10-13 08:22:44 +00:00
+								                .configure(&self.vm, entry_point, &vm_memory, phys_bits)
-												vmm: Change booting process to cover AArch64 requirements

Between X86 and AArch64, there is some difference in booting a VM:
- X86_64 can setup IOAPIC before creating any VCPU.
- AArch64 has to create VCPUs before creating the GIC.

The old process is:
1. load_kernel()
    load kernel binary
    configure system
2. activate_vcpus()
    create & start VCPU's

So we need to separate "activate_vcpus" into "create_vcpus" and
"activate_vcpus" (to start vcpus only). Setup GIC and create FDT
between the 2 steps.

The new procedure is:
1. load_kernel()
    load kernel binary
    (X86_64) configure system
2. create VCPU's
3. (AArch64) setup GIC
4. (AArch64) configure system
5. start VCPU's

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-26 07:20:22 +00:00
+								                .expect("Failed to configure vCPU");
-												vmm: cpu: Implement the Snapshottable trait

Implement the Snapshottable trait for Vcpu, and then implement it for
CpuManager. Note that CpuManager goes through the Snapshottable
implementation of Vcpu for every vCPU in order to implement the
Snapshottable trait for itself.

Signed-off-by: Yi Sun <yi.y.sun@linux.intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-18 15:44:41 +00:00
+								        }
-												vmm: cpu: Factorize vcpu starting code

Anticipating the need for a slightly different function for restoring
vCPUs, this patch factorizes most of the vCPU creation, so that it can
be reused for migration purposes.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-04-03 12:27:41 +00:00
-												vmm: Fill CpuManager's vCPU list on restore path

It's important that, on the restore path, the CpuManager's vCPU list gets
filled with each new vCPU that is being created. In order to cover both boot
and restore paths, the list is being filled from the common function
create_vcpu().

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-06-24 08:18:46 +00:00
+								        // Adding vCPU to the CpuManager's vCPU list.
 								        self.vcpus.push(Arc::clone(&vcpu));
-												vmm: Change booting process to cover AArch64 requirements

Between X86 and AArch64, there is some difference in booting a VM:
- X86_64 can setup IOAPIC before creating any VCPU.
- AArch64 has to create VCPUs before creating the GIC.

The old process is:
1. load_kernel()
    load kernel binary
    configure system
2. activate_vcpus()
    create & start VCPU's

So we need to separate "activate_vcpus" into "create_vcpus" and
"activate_vcpus" (to start vcpus only). Setup GIC and create FDT
between the 2 steps.

The new procedure is:
1. load_kernel()
    load kernel binary
    (X86_64) configure system
2. create VCPU's
3. (AArch64) setup GIC
4. (AArch64) configure system
5. start VCPU's

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-26 07:20:22 +00:00
-												vmm: Fill CpuManager's vCPU list on restore path

It's important that, on the restore path, the CpuManager's vCPU list gets
filled with each new vCPU that is being created. In order to cover both boot
and restore paths, the list is being filled from the common function
create_vcpu().

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-06-24 08:18:46 +00:00
+								        Ok(vcpu)
-												vmm: Change booting process to cover AArch64 requirements

Between X86 and AArch64, there is some difference in booting a VM:
- X86_64 can setup IOAPIC before creating any VCPU.
- AArch64 has to create VCPUs before creating the GIC.

The old process is:
1. load_kernel()
    load kernel binary
    configure system
2. activate_vcpus()
    create & start VCPU's

So we need to separate "activate_vcpus" into "create_vcpus" and
"activate_vcpus" (to start vcpus only). Setup GIC and create FDT
between the 2 steps.

The new procedure is:
1. load_kernel()
    load kernel binary
    (X86_64) configure system
2. create VCPU's
3. (AArch64) setup GIC
4. (AArch64) configure system
5. start VCPU's

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-26 07:20:22 +00:00
+								    }
-												vmm: cpu: Reuse already allocated vCPUs if available

When a request is made to increase the number of vCPUs in the VM attempt
to reuse any previously removed (and hence inactive) vCPUs before
creating new ones.

This ensures that the APIC ID is not reused for a different KVM vCPU
(which is not allowed) and that the APIC IDs are also sequential.

The two key changes to support this are:

* Clearing the "kill" bit on the old vCPU state so that it does not
  immediately exit upon thread recreation.
* Using the length of the vcpus vector (the number of allocated vcpus)
  rather than the number of active vCPUs (.present_vcpus()) to determine
  how many should be created.

This change also introduced some new info!() debugging on the vCPU
creation/removal path to aid further development in the future.

TEST=Expanded test_cpu_hotplug test.

Fixes: #1338

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-06-23 11:52:17 +00:00
+								    /// Only create new vCPUs if there aren't any inactive ones to reuse
-												vmm: Change booting process to cover AArch64 requirements

Between X86 and AArch64, there is some difference in booting a VM:
- X86_64 can setup IOAPIC before creating any VCPU.
- AArch64 has to create VCPUs before creating the GIC.

The old process is:
1. load_kernel()
    load kernel binary
    configure system
2. activate_vcpus()
    create & start VCPU's

So we need to separate "activate_vcpus" into "create_vcpus" and
"activate_vcpus" (to start vcpus only). Setup GIC and create FDT
between the 2 steps.

The new procedure is:
1. load_kernel()
    load kernel binary
    (X86_64) configure system
2. create VCPU's
3. (AArch64) setup GIC
4. (AArch64) configure system
5. start VCPU's

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-26 07:20:22 +00:00
+								    fn create_vcpus(&mut self, desired_vcpus: u8, entry_point: Option<EntryPoint>) -> Result<()> {
-												vmm: cpu: Add info!() level debugging to vCPU handling

These messages are intended to be useful to support debugging related to
vCPU hotplug/unplug issues.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-06-23 12:11:00 +00:00
+								        info!(
 								            "Request to create new vCPUs: desired = {}, max = {}, allocated = {}, present = {}",
 								            desired_vcpus,
 								            self.config.max_vcpus,
 								            self.vcpus.len(),
 								            self.present_vcpus()
 								        );
-												vmm: cpu: Save CpusConfig into CpuManager

Rather than saving the individual parts into the CpuManager save the
full struct as it now also contains the topology data.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-06-16 10:52:07 +00:00
+								        if desired_vcpus > self.config.max_vcpus {
-												vmm: Change booting process to cover AArch64 requirements

Between X86 and AArch64, there is some difference in booting a VM:
- X86_64 can setup IOAPIC before creating any VCPU.
- AArch64 has to create VCPUs before creating the GIC.

The old process is:
1. load_kernel()
    load kernel binary
    configure system
2. activate_vcpus()
    create & start VCPU's

So we need to separate "activate_vcpus" into "create_vcpus" and
"activate_vcpus" (to start vcpus only). Setup GIC and create FDT
between the 2 steps.

The new procedure is:
1. load_kernel()
    load kernel binary
    (X86_64) configure system
2. create VCPU's
3. (AArch64) setup GIC
4. (AArch64) configure system
5. start VCPU's

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-26 07:20:22 +00:00
+								            return Err(Error::DesiredVCPUCountExceedsMax);
 								        }
-												vmm: cpu: Reuse already allocated vCPUs if available

When a request is made to increase the number of vCPUs in the VM attempt
to reuse any previously removed (and hence inactive) vCPUs before
creating new ones.

This ensures that the APIC ID is not reused for a different KVM vCPU
(which is not allowed) and that the APIC IDs are also sequential.

The two key changes to support this are:

* Clearing the "kill" bit on the old vCPU state so that it does not
  immediately exit upon thread recreation.
* Using the length of the vcpus vector (the number of allocated vcpus)
  rather than the number of active vCPUs (.present_vcpus()) to determine
  how many should be created.

This change also introduced some new info!() debugging on the vCPU
creation/removal path to aid further development in the future.

TEST=Expanded test_cpu_hotplug test.

Fixes: #1338

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-06-23 11:52:17 +00:00
+								        // Only create vCPUs in excess of all the allocated vCPUs.
 								        for cpu_id in self.vcpus.len() as u8..desired_vcpus {
-												vmm: Fill CpuManager's vCPU list on restore path

It's important that, on the restore path, the CpuManager's vCPU list gets
filled with each new vCPU that is being created. In order to cover both boot
and restore paths, the list is being filled from the common function
create_vcpu().

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-06-24 08:18:46 +00:00
+								            self.create_vcpu(cpu_id, entry_point, None)?;
-												vmm: Change booting process to cover AArch64 requirements

Between X86 and AArch64, there is some difference in booting a VM:
- X86_64 can setup IOAPIC before creating any VCPU.
- AArch64 has to create VCPUs before creating the GIC.

The old process is:
1. load_kernel()
    load kernel binary
    configure system
2. activate_vcpus()
    create & start VCPU's

So we need to separate "activate_vcpus" into "create_vcpus" and
"activate_vcpus" (to start vcpus only). Setup GIC and create FDT
between the 2 steps.

The new procedure is:
1. load_kernel()
    load kernel binary
    (X86_64) configure system
2. create VCPU's
3. (AArch64) setup GIC
4. (AArch64) configure system
5. start VCPU's

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-26 07:20:22 +00:00
+								        }
 								        Ok(())
 								    }
 								    fn start_vcpu(
 								        &mut self,
 								        vcpu: Arc<Mutex<Vcpu>>,
 								        vcpu_thread_barrier: Arc<Barrier>,
 								        inserting: bool,
 								    ) -> Result<()> {
 								        let cpu_id = vcpu.lock().unwrap().id;
 								        let reset_evt = self.reset_evt.try_clone().unwrap();
-												vmm: Implement VM rebooting on AArch64

The logic to handle AArch64 system event was: SHUTDOWN and RESET were
all treated as RESET.

Now we handle them differently:
- RESET event will trigger Vmm::vm_reboot(),
- SHUTDOWN event will trigger Vmm::vm_shutdown().

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-10-30 13:34:16 +00:00
+								        let exit_evt = self.exit_evt.try_clone().unwrap();
-												vmm: Change booting process to cover AArch64 requirements

Between X86 and AArch64, there is some difference in booting a VM:
- X86_64 can setup IOAPIC before creating any VCPU.
- AArch64 have to create VCPU's before creating GIC.

The old process is:
1. load_kernel()
    load kernel binary
    configure system
2. activate_vcpus()
    create & start VCPU's

So we need to separate "activate_vcpus" into "create_vcpus" and
"activate_vcpus" (to start vcpus only). Setup GIC and create FDT
between the 2 steps.

The new procedure is:
1. load_kernel()
    load kernel binary
    (X86_64) configure system
2. create VCPU's
3. (AArch64) setup GIC
4. (AArch64) configure system
5. start VCPU's

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-26 07:20:22 +00:00
+								        let vcpu_kill_signalled = self.vcpus_kill_signalled.clone();
 								        let vcpu_pause_signalled = self.vcpus_pause_signalled.clone();
 								        let vcpu_kill = self.vcpu_states[usize::from(cpu_id)].kill.clone();
 								        let vcpu_run_interrupted = self.vcpu_states[usize::from(cpu_id)]
 								            .vcpu_run_interrupted
 								            .clone();
-												vmm: cpu: Factorize vcpu starting code

Anticipating the need for a slightly different function for restoring
vCPUs, this patch factorizes most of the vCPU creation, so that it can
be reused for migration purposes.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-04-03 12:27:41 +00:00
-												vmm: cpu: Add info!() level debugging to vCPU handling

These messages are intended to be useful to support debugging related to
vCPU hotplug/unplug issues.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-06-23 12:11:00 +00:00
+								        info!("Starting vCPU: cpu_id = {}", cpu_id);
-												vmm: seccomp: Add seccomp filters for the vcpu worker thread

Partially fixes: #925

Signed-off-by: Bo Chen <chen.bo@intel.com>

											
										
										
											2020-09-09 22:15:26 +00:00
+								        // Retrieve seccomp filter for vcpu thread
 								        let vcpu_seccomp_filter = get_seccomp_filter(&self.seccomp_action, Thread::Vcpu)
 								            .map_err(Error::CreateSeccompFilter)?;
-												vmm: Handle hypervisor VCPU run result from Vcpu to VcpuManager

Now Vcpu::run() returns a boolean value to VcpuManager, indicating
whether the VM is going to reboot (false) or just continue (true).
Moving the handling of hypervisor VCPU run result from Vcpu to
VcpuManager gives us the flexibility to handle more scenarios like
shutting down on AArch64.

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-10-30 13:01:53 +00:00
+								        #[cfg(target_arch = "x86_64")]
 								        let interrupt_controller_clone =
 								            if let Some(interrupt_controller) = &self.interrupt_controller {
 								                Some(interrupt_controller.clone())
 								            } else {
 								                None
 								            };
-												vmm: cpu: Factorize vcpu starting code

Anticipating the need for a slightly different function for restoring
vCPUs, this patch factorizes most of the vCPU creation, so that it can
be reused for migration purposes.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-04-03 12:27:41 +00:00
+								        let handle = Some(
 								            thread::Builder::new()
 								                .name(format!("vcpu{}", cpu_id))
 								                .spawn(move || {
-												vmm: seccomp: Add seccomp filters for the vcpu worker thread

Partially fixes: #925

Signed-off-by: Bo Chen <chen.bo@intel.com>

											
										
										
											2020-09-09 22:15:26 +00:00
+								                    // Apply seccomp filter for vcpu thread.
 								                    if let Err(e) =
 								                        SeccompFilter::apply(vcpu_seccomp_filter).map_err(Error::ApplySeccompFilter)
 								                    {
 								                        error!("Error applying seccomp filter: {:?}", e);
 								                        return;
 								                    }
-												vmm: cpu: Factorize vcpu starting code

Anticipating the need for a slightly different function for restoring
vCPUs, this patch factorizes most of the vCPU creation, so that it can
be reused for migration purposes.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-04-03 12:27:41 +00:00
+								                    extern "C" fn handle_signal(_: i32, _: *mut siginfo_t, _: *mut c_void) {}
 								                    // This uses an async signal safe handler to kill the vcpu handles.
 								                    register_signal_handler(SIGRTMIN(), handle_signal)
 								                        .expect("Failed to register vcpu signal handler");
 								                    // Block until all CPUs are ready.
 								                    vcpu_thread_barrier.wait();
 								                    loop {
 								                        // If we are being told to pause, we park the thread
 								                        // until the pause boolean is toggled.
 								                        // The resume operation is responsible for toggling
 								                        // the boolean and unpark the thread.
 								                        // We enter a loop because park() could spuriously
 								                        // return. We will then park() again unless the
 								                        // pause boolean has been toggled.
-												misc: Use a more relaxed memory model when possible

When a total ordering between multiple atomic variables is not required
then use Ordering::Acquire with atomic loads and Ordering::Release with
atomic stores.

This will improve performance as this does not require a memory fence
on x86_64 which Ordering::SeqCst will use.

Add a comment to the code in the vCPU handling code where it operates on
multiple atomics to explain why Ordering::SeqCst is required.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-12-01 16:15:26 +00:00
 								                        // Need to use Ordering::SeqCst as we have multiple
 								                        // loads and stores to different atomics and we need
 								                        // to see them in a consistent order in all threads
-												vmm: cpu: Retry sending signals if necessary

To avoid a race condition where the signal might "miss" the KVM_RUN
ioctl() instead repeatedly try sending a signal until the vCPU run is
interrupted (as indicated by setting a new per vCPU atomic.)

It is important to also clear this atomic when coming out of a paused
state.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-05-06 10:34:19 +00:00
+								                        if vcpu_pause_signalled.load(Ordering::SeqCst) {
 								                            vcpu_run_interrupted.store(true, Ordering::SeqCst);
 								                            while vcpu_pause_signalled.load(Ordering::SeqCst) {
 								                                thread::park();
 								                            }
 								                            vcpu_run_interrupted.store(false, Ordering::SeqCst);
-												vmm: cpu: Factorize vcpu starting code

Anticipating the need for a slightly different function for restoring
vCPUs, this patch factorizes most of the vCPU creation, so that it can
be reused for migration purposes.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-04-03 12:27:41 +00:00
+								                        }
-												vmm: cpu: When coming out of the pause event check for a kill signal

Rather than immediately entering the vCPU run() code check if the kill
signal is set. This allows paused VMs to be shutdown.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-05-06 08:59:46 +00:00
 								                        // We've been told to terminate
 								                        if vcpu_kill_signalled.load(Ordering::SeqCst)
 								                            || vcpu_kill.load(Ordering::SeqCst)
 								                        {
-												vmm: cpu: Retry sending signals if necessary

To avoid a race condition where the signal might "miss" the KVM_RUN
ioctl() instead repeatedly try sending a signal until the vCPU run is
interrupted (as indicated by setting a new per vCPU atomic.)

It is important to also clear this atomic when coming out of a paused
state.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-05-06 10:34:19 +00:00
+								                            vcpu_run_interrupted.store(true, Ordering::SeqCst);
-												vmm: cpu: When coming out of the pause event check for a kill signal

Rather than immediately entering the vCPU run() code check if the kill
signal is set. This allows paused VMs to be shutdown.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-05-06 08:59:46 +00:00
+								                            break;
 								                        }
-												vmm: Restore vCPUs in "paused" state

To follow a symmetrical model, and avoid potential race conditions, it's
important to restore a previously snapshot VM in a "paused" state.

The snapshot operation being valid only if the VM has been previously
paused.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-06-22 13:13:45 +00:00
-												hypervisor: Define a VM-Exit abstraction

In order to move the hypervisor specific parts of the VM exit handling
path, we're defining a generic, hypervisor agnostic VM exit enum.

This is what the hypervisor's Vcpu run() call should return when the VM
exit can not be completely handled through the hypervisor specific bits.
For KVM based hypervisors, this means directly forwarding the IO related
exits back to the VMM itself. For other hypervisors that e.g. rely on the
VMM to decode and emulate instructions, this means the decoding itself
would happen in the hypervisor crate exclusively, and the rest of the VM
exit handling would be handled through the VMM device model implementation.

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

Fix test_vm unit test by using the new abstraction and dropping some
dead code.

Signed-off-by: Wei Liu <liuwe@microsoft.com>

											
										
										
											2020-07-03 14:27:53 +00:00
+								                        // vcpu.run() returns false on a triple-fault so trigger a reset
-												vmm: Restore vCPUs in "paused" state

To follow a symmetrical model, and avoid potential race conditions, it's
important to restore a previously snapshot VM in a "paused" state.

The snapshot operation being valid only if the VM has been previously
paused.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-06-22 13:13:45 +00:00
+								                        match vcpu.lock().unwrap().run() {
-												vmm: Handle hypervisor VCPU run result from Vcpu to VcpuManager

Now Vcpu::run() returns a boolean value to VcpuManager, indicating
whether the VM is going to reboot (false) or just continue (true).
Moving the handling of hypervisor VCPU run result from Vcpu to
VcpuManager gives us the flexibility to handle more scenarios like
shutting down on AArch64.

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-10-30 13:01:53 +00:00
+								                            Ok(run) => match run {
 								                                #[cfg(target_arch = "x86_64")]
 								                                VmExit::IoapicEoi(vector) => {
 								                                    if let Some(interrupt_controller) = &interrupt_controller_clone
 								                                    {
 								                                        interrupt_controller
 								                                            .lock()
 								                                            .unwrap()
 								                                            .end_of_interrupt(vector);
 								                                    }
 								                                }
 								                                VmExit::Ignore => {}
 								                                VmExit::Hyperv => {}
 								                                VmExit::Reset => {
 								                                    debug!("VmExit::Reset");
 								                                    vcpu_run_interrupted.store(true, Ordering::SeqCst);
 								                                    reset_evt.write(1).unwrap();
 								                                    break;
 								                                }
-												vmm: Implement VM rebooting on AArch64

The logic to handle AArch64 system event was: SHUTDOWN and RESET were
all treated as RESET.

Now we handle them differently:
- RESET event will trigger Vmm::vm_reboot(),
- SHUTDOWN event will trigger Vmm::vm_shutdown().

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-10-30 13:34:16 +00:00
+								                                VmExit::Shutdown => {
 								                                    debug!("VmExit::Shutdown");
 								                                    vcpu_run_interrupted.store(true, Ordering::SeqCst);
 								                                    exit_evt.write(1).unwrap();
 								                                    break;
 								                                }
-												vmm: Handle hypervisor VCPU run result from Vcpu to VcpuManager

Now Vcpu::run() returns a boolean value to VcpuManager, indicating
whether the VM is going to reboot (false) or just continue (true).
Moving the handling of hypervisor VCPU run result from Vcpu to
VcpuManager gives us the flexibility to handle more scenarios like
shutting down on AArch64.

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-10-30 13:01:53 +00:00
+								                                _ => {
 								                                    error!("VCPU generated error: {:?}", Error::UnexpectedVmExit);
 								                                    break;
 								                                }
 								                            },
-												vmm: Restore vCPUs in "paused" state

To follow a symmetrical model, and avoid potential race conditions, it's
important to restore a previously snapshot VM in a "paused" state.

The snapshot operation being valid only if the VM has been previously
paused.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-06-22 13:13:45 +00:00
+								                            Err(e) => {
-												vmm: Handle hypervisor VCPU run result from Vcpu to VcpuManager

Now Vcpu::run() returns a boolean value to VcpuManager, indicating
whether the VM is going to reboot (false) or just continue (true).
Moving the handling of hypervisor VCPU run result from Vcpu to
VcpuManager gives us the flexibility to handle more scenarios like
shutting down on AArch64.

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-10-30 13:01:53 +00:00
+								                                error!("VCPU generated error: {:?}", Error::VcpuRun(e.into()));
-												vmm: Restore vCPUs in "paused" state

To follow a symmetrical model, and avoid potential race conditions, it's
important to restore a previously snapshot VM in a "paused" state.

The snapshot operation being valid only if the VM has been previously
paused.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-06-22 13:13:45 +00:00
+								                                break;
 								                            }
 								                        }
 								                        // We've been told to terminate
 								                        if vcpu_kill_signalled.load(Ordering::SeqCst)
 								                            || vcpu_kill.load(Ordering::SeqCst)
 								                        {
 								                            vcpu_run_interrupted.store(true, Ordering::SeqCst);
 								                            break;
 								                        }
-												vmm: cpu: Factorize vcpu starting code

Anticipating the need for a slightly different function for restoring
vCPUs, this patch factorizes most of the vCPU creation, so that it can
be reused for migration purposes.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-04-03 12:27:41 +00:00
+								                    }
 								                })
 								                .map_err(Error::VcpuSpawn)?,
 								        );
 								        // On hot plug calls into this function entry_point is None. It is for
 								        // those hotplug CPU additions that we need to set the inserting flag.
 								        self.vcpu_states[usize::from(cpu_id)].handle = handle;
 								        self.vcpu_states[usize::from(cpu_id)].inserting = inserting;
 								        Ok(())
 								    }
-												vmm: cpu: Reuse already allocated vCPUs if available

When a request is made to increase the number of vCPUs in the VM attempt
to reuse any previously removed (and hence inactive) vCPUs before
creating new ones.

This ensures that the APIC ID is not reused for a different KVM vCPU
(which is not allowed) and that the APIC IDs are also sequential.

The two key changes to support this are:

* Clearing the "kill" bit on the old vCPU state so that it does not
  immediately exit upon thread recreation.
* Using the length of the vcpus vector (the number of allocated vcpus)
  rather than the number of active vCPUs (.present_vcpus()) to determine
  how many should be created.

This change also introduced some new info!() debugging on the vCPU
creation/removal path to aid further development in the future.

TEST=Expanded test_cpu_hotplug test.

Fixes: #1338

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-06-23 11:52:17 +00:00
+								    /// Start up as many vCPUs threads as needed to reach `desired_vcpus`
-												vmm: Change booting process to cover AArch64 requirements

Between X86 and AArch64, there is some difference in booting a VM:
- X86_64 can setup IOAPIC before creating any VCPU.
- AArch64 have to create VCPU's before creating GIC.

The old process is:
1. load_kernel()
    load kernel binary
    configure system
2. activate_vcpus()
    create & start VCPU's

So we need to separate "activate_vcpus" into "create_vcpus" and
"activate_vcpus" (to start vcpus only). Setup GIC and create FDT
between the 2 steps.

The new procedure is:
1. load_kernel()
    load kernel binary
    (X86_64) configure system
2. create VCPU's
3. (AArch64) setup GIC
4. (AArch64) configure system
5. start VCPU's

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-26 07:20:22 +00:00
+								    fn activate_vcpus(&mut self, desired_vcpus: u8, inserting: bool) -> Result<()> {
-												vmm: cpu: Save CpusConfig into CpuManager

Rather than saving the individual parts into the CpuManager save the
full struct as it now also contains the topology data.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-06-16 10:52:07 +00:00
+								        if desired_vcpus > self.config.max_vcpus {
-												vmm: cpu: Refactor vCPU thread starting

Refactor the vCPU thread starting so that there is the possibility to
bring on extra vCPU threads.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 13:06:24 +00:00
+								            return Err(Error::DesiredVCPUCountExceedsMax);
 								        }
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
-												vmm: cpu: Refactor vCPU thread starting

Refactor the vCPU thread starting so that there is the possibility to
bring on extra vCPU threads.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 13:06:24 +00:00
+								        let vcpu_thread_barrier = Arc::new(Barrier::new(
 								            (desired_vcpus - self.present_vcpus() + 1) as usize,
 								        ));
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
-												vmm: cpu: Add info!() level debugging to vCPU handling

These messages are intended to be useful to support debugging related to
vCPU hotplug/unplug issues.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-06-23 12:11:00 +00:00
+								        info!(
 								            "Starting vCPUs: desired = {}, allocated = {}, present = {}",
 								            desired_vcpus,
 								            self.vcpus.len(),
 								            self.present_vcpus()
 								        );
-												vmm: cpu: Reuse already allocated vCPUs if available

When a request is made to increase the number of vCPUs in the VM attempt
to reuse any previously removed (and hence inactive) vCPUs before
creating new ones.

This ensures that the APIC ID is not reused for a different KVM vCPU
(which is not allowed) and that the APIC IDs are also sequential.

The two key changes to support this are:

* Clearing the "kill" bit on the old vCPU state so that it does not
  immediately exit upon thread recreation.
* Using the length of the vcpus vector (the number of allocated vcpus)
  rather than the number of active vCPUs (.present_vcpus()) to determine
  how many should be created.

This change also introduced some new info!() debugging on the vCPU
creation/removal path to aid further development in the future.

TEST=Expanded test_cpu_hotplug test.

Fixes: #1338

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-06-23 11:52:17 +00:00
+								        // This reuses any inactive vCPUs as well as any that were newly created
-												vmm: cpu: Refactor vCPU thread starting

Refactor the vCPU thread starting so that there is the possibility to
bring on extra vCPU threads.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 13:06:24 +00:00
+								        for cpu_id in self.present_vcpus()..desired_vcpus {
-												vmm: Change booting process to cover AArch64 requirements

Between X86 and AArch64, there is some difference in booting a VM:
- X86_64 can setup IOAPIC before creating any VCPU.
- AArch64 have to create VCPU's before creating GIC.

The old process is:
1. load_kernel()
    load kernel binary
    configure system
2. activate_vcpus()
    create & start VCPU's

So we need to separate "activate_vcpus" into "create_vcpus" and
"activate_vcpus" (to start vcpus only). Setup GIC and create FDT
between the 2 steps.

The new procedure is:
1. load_kernel()
    load kernel binary
    (X86_64) configure system
2. create VCPU's
3. (AArch64) setup GIC
4. (AArch64) configure system
5. start VCPU's

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-26 07:20:22 +00:00
+								            let vcpu = Arc::clone(&self.vcpus[cpu_id as usize]);
 								            self.start_vcpu(vcpu, vcpu_thread_barrier.clone(), inserting)?;
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								        }
 								        // Unblock all CPU threads.
 								        vcpu_thread_barrier.wait();
 								        Ok(())
 								    }
-												vmm: cpu: Notify guest OS that it should offline vCPUs

Allow the resizing of the number of vCPUs to less than the current
active vCPUs. This does not currently remove them from the system but
the kernel will take them offline.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-17 10:49:05 +00:00
+								    fn mark_vcpus_for_removal(&mut self, desired_vcpus: u8) -> Result<()> {
 								        // Flags every vCPU whose id lies in `desired_vcpus..present_vcpus()`
 								        // by setting `removing` on its entry in `vcpu_states`. No thread is
 								        // stopped here, and when `desired_vcpus` is not below the present
 								        // count the range is empty, so nothing is flagged. Always returns
 								        // `Ok(())`.
 								        // Mark vCPUs for removal, actual removal happens on ejection
 								        for cpu_id in desired_vcpus..self.present_vcpus() {
 								            self.vcpu_states[usize::from(cpu_id)].removing = true;
 								        }
 								        Ok(())
 								    }
-												vmm: cpu: Implement CPU removal

When the running OS has been told that a CPU should be removed it will
shutdown the CPU and then signal to the hypervisor via the "_EJ0" method
on the device that ultimately writes into an I/O port that the vCPU
should be shutdown. Upon notification the hypervisor signals to the
individual thread that it should shutdown and waits for that thread to
end.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-17 11:22:33 +00:00
+								    fn remove_vcpu(&mut self, cpu_id: u8) -> Result<()> {
-												vmm: cpu: Add info!() level debugging to vCPU handling

These messages are intended to be useful to support debugging related to
vCPU hotplug/unplug issues.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-06-23 12:11:00 +00:00
+								        info!("Removing vCPU: cpu_id = {}", cpu_id);
-												vmm: cpu: Implement CPU removal

When the running OS has been told that a CPU should be removed it will
shutdown the CPU and then signal to the hypervisor via the "_EJ0" method
on the device that ultimately writes into an I/O port that the vCPU
should be shutdown. Upon notification the hypervisor signals to the
individual thread that it should shutdown and waits for that thread to
end.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-17 11:22:33 +00:00
+								        let mut state = &mut self.vcpu_states[usize::from(cpu_id)];
 								        state.kill.store(true, Ordering::SeqCst);
 								        state.signal_thread();
 								        state.join_thread()?;
 								        state.handle = None;
-												vmm: cpu: Clear the "kill" flag on vCPU to support reuse

After the vCPU has been ejected and the thread shutdown it is useful to
clear the "kill" flag so that if the vCPU is reused it does not
immediately exit upon thread recreation.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-06-23 12:12:44 +00:00
 								        // Once the thread has exited, clear the "kill" so that it can reused
 								        state.kill.store(false, Ordering::SeqCst);
-												vmm: cpu: Implement CPU removal

When the running OS has been told that a CPU should be removed it will
shutdown the CPU and then signal to the hypervisor via the "_EJ0" method
on the device that ultimately writes into an I/O port that the vCPU
should be shutdown. Upon notification the hypervisor signals to the
individual thread that it should shutdown and waits for that thread to
end.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-17 11:22:33 +00:00
+								        Ok(())
 								    }
-												vmm: Change booting process to cover AArch64 requirements

Between X86 and AArch64, there is some difference in booting a VM:
- X86_64 can setup IOAPIC before creating any VCPU.
- AArch64 have to create VCPU's before creating GIC.

The old process is:
1. load_kernel()
    load kernel binary
    configure system
2. activate_vcpus()
    create & start VCPU's

So we need to separate "activate_vcpus" into "create_vcpus" and
"activate_vcpus" (to start vcpus only). Setup GIC and create FDT
between the 2 steps.

The new procedure is:
1. load_kernel()
    load kernel binary
    (X86_64) configure system
2. create VCPU's
3. (AArch64) setup GIC
4. (AArch64) configure system
5. start VCPU's

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-26 07:20:22 +00:00
+								    pub fn create_boot_vcpus(&mut self, entry_point: EntryPoint) -> Result<()> {
 								        // Delegates to `create_vcpus`, asking for `boot_vcpus()` vCPUs and
 								        // passing the entry point wrapped in `Some`. The result of
 								        // `create_vcpus` is returned unchanged.
 								        self.create_vcpus(self.boot_vcpus(), Some(entry_point))
 								    }
-												vmm: cpu: Refactor vCPU thread starting

Refactor the vCPU thread starting so that there is the possibility to
bring on extra vCPU threads.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 13:06:24 +00:00
+								    // Starts all the vCPUs that the VM is booting with. Blocks until all vCPUs are running.
-												vmm: Change booting process to cover AArch64 requirements

Between X86 and AArch64, there is some difference in booting a VM:
- X86_64 can setup IOAPIC before creating any VCPU.
- AArch64 have to create VCPU's before creating GIC.

The old process is:
1. load_kernel()
    load kernel binary
    configure system
2. activate_vcpus()
    create & start VCPU's

So we need to separate "activate_vcpus" into "create_vcpus" and
"activate_vcpus" (to start vcpus only). Setup GIC and create FDT
between the 2 steps.

The new procedure is:
1. load_kernel()
    load kernel binary
    (X86_64) configure system
2. create VCPU's
3. (AArch64) setup GIC
4. (AArch64) configure system
5. start VCPU's

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-26 07:20:22 +00:00
+								    pub fn start_boot_vcpus(&mut self) -> Result<()> {
 								        self.activate_vcpus(self.boot_vcpus(), false)
-												vmm: cpu: Add support for starting more vCPU threads

Add support for starting vCPU threads after the initial boot ones.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 15:56:16 +00:00
+								    }
-												vmm: refactor vCPU save/restore code in restoring VM

Similarly as the VM booting process, on AArch64 systems,
the vCPUs should be created before the creation of GIC. This
commit refactors the vCPU save/restore code to achieve the
above-mentioned restoring order.

Signed-off-by: Henry Wang <Henry.Wang@arm.com>

											
										
										
											2020-09-04 10:56:30 +00:00
+								    pub fn start_restored_vcpus(&mut self) -> Result<()> {
 								        // Spawns one thread per entry in `self.vcpus` through `start_vcpu`
 								        // (with `inserting` set to false). Any `start_vcpu` failure is
 								        // wrapped in `Error::StartRestoreVcpu` and returned immediately.
 								        let vcpu_numbers = self.vcpus.len();
 								        // The barrier counts every vCPU thread plus this calling thread,
 								        // which joins it in the final `wait()` below.
 								        let vcpu_thread_barrier = Arc::new(Barrier::new((vcpu_numbers + 1) as usize));
 								        // Restore the vCPUs in "paused" state.
 								        // The flag is set before any thread is spawned; the loop in
 								        // `start_vcpu` checks it and parks while it stays true.
 								        self.vcpus_pause_signalled.store(true, Ordering::SeqCst);
 								        for vcpu_index in 0..vcpu_numbers {
 								            let vcpu = Arc::clone(&self.vcpus[vcpu_index as usize]);
 								            self.start_vcpu(vcpu, vcpu_thread_barrier.clone(), false)
 								                .map_err(|e| {
 								                    Error::StartRestoreVcpu(anyhow!("Failed to start restored vCPUs: {:#?}", e))
 								                })?;
 								        }
 								        // Unblock all restored CPU threads.
 								        vcpu_thread_barrier.wait();
 								        Ok(())
 								    }
-												vmm: Only generate GED interrupt when the number of vCPUs has changed

Avoid activity in the guest OS if the number of vCPUs has not
changed.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-01-17 16:48:46 +00:00
+								    pub fn resize(&mut self, desired_vcpus: u8) -> Result<bool> {
-												vmm: cpu: Rewrite if chain using match

Address updated clippy error:

error: `if` chain can be rewritten with `match`
   --> vmm/src/cpu.rs:668:9
    |
668 | /         if desired_vcpus > self.present_vcpus() {
669 | |             self.activate_vcpus(desired_vcpus, None)?;
670 | |         } else if desired_vcpus < self.present_vcpus() {
671 | |             self.mark_vcpus_for_removal(desired_vcpus)?;
672 | |         }
    | |_________^
    |
    = note: `-D clippy::comparison-chain` implied by `-D warnings`
    = help: Consider rewriting the `if` chain to use `cmp` and `match`.
    = help: for further information visit https://rust-lang.github.io/rust-clippy/master/index.html#comparison_chain

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-19 17:08:38 +00:00
+								        match desired_vcpus.cmp(&self.present_vcpus()) {
-												vmm: Change booting process to cover AArch64 requirements

Between X86 and AArch64, there are some differences in booting a VM:
- X86_64 can set up the IOAPIC before creating any vCPU.
- AArch64 has to create the vCPUs before creating the GIC.

The old process is:
1. load_kernel()
    load kernel binary
    configure system
2. activate_vcpus()
    create & start VCPU's

So we need to separate "activate_vcpus" into "create_vcpus" and
"activate_vcpus" (to start vcpus only). Setup GIC and create FDT
between the 2 steps.

The new procedure is:
1. load_kernel()
    load kernel binary
    (X86_64) configure system
2. create VCPU's
3. (AArch64) setup GIC
4. (AArch64) configure system
5. start VCPU's

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-26 07:20:22 +00:00
+								            cmp::Ordering::Greater => {
 								                self.create_vcpus(desired_vcpus, None)?;
 								                self.activate_vcpus(desired_vcpus, true)?;
 								                Ok(true)
 								            }
-												vmm: Only generate GED interrupt when the number of vCPUs has changed

Avoid activity in the guest OS if the number of vCPUs has not
changed.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-01-17 16:48:46 +00:00
+								            cmp::Ordering::Less => self.mark_vcpus_for_removal(desired_vcpus).and(Ok(true)),
 								            _ => Ok(false),
-												vmm: cpu: Notify guest OS that it should offline vCPUs

Allow the resizing of the number of vCPUs to less than the current
active vCPUs. This does not currently remove them from the system but
the kernel will take them offline.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-17 10:49:05 +00:00
+								        }
-												vmm: cpu: Refactor vCPU thread starting

Refactor the vCPU thread starting so that there is the possibility to
bring on extra vCPU threads.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 13:06:24 +00:00
+								    }
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								    pub fn shutdown(&mut self) -> Result<()> {
 								        // Tell the vCPUs to stop themselves next time they go through the loop
 								        self.vcpus_kill_signalled.store(true, Ordering::SeqCst);
-												vmm: cpu: Resume before shutdown in a specific way

Instead of calling the resume() function from the CpuManager, which
involves more than what is needed from the shutdown codepath, and
potentially ends up with a deadlock, we replace it with a subset.

The full resume operation is reserved for a VM that has been paused.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-06-24 10:25:06 +00:00
+								        // Toggle the vCPUs pause boolean
 								        self.vcpus_pause_signalled.store(false, Ordering::SeqCst);
 								        // Unpark all the VCPU threads.
 								        for state in self.vcpu_states.iter() {
 								            state.unpark_thread();
 								        }
-												vmm: cpu: Unpause vCPU threads

After setting the kill signal flag for the vCPU thread release the pause
flag and unpark the threads. This ensures that the vCPU thread will
wake up and check the kill signal flag if the VM is paused.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-05-06 09:24:19 +00:00
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								        // Signal to the spawned threads (vCPUs and console signal handler). For the vCPU threads
 								        // this will interrupt the KVM_RUN ioctl() allowing the loop to check the boolean set
 								        // above.
-												vmm: cpu: Encapsulate vCPU state into its own struct

Currently this just holds the thread handle but will be enlarged to
encompass details such as whether the vCPU is currently being inserted
or ejected.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 11:32:36 +00:00
+								        for state in self.vcpu_states.iter() {
 								            state.signal_thread();
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								        }
-												vmm: cpu: Encapsulate vCPU state into its own struct

Currently this just holds the thread handle but will be enlarged to
encompass details such as whether the vCPU is currently being inserted
or ejected.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 11:32:36 +00:00
+								        // Wait for all the threads to finish. This removes the state from the vector.
 								        for mut state in self.vcpu_states.drain(..) {
 								            state.join_thread()?;
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								        }
 								        Ok(())
 								    }
-												vmm: cpu: Introduce concept of maximum vs boot vCPUs in CpuManager

For now the max vCPUs is the same as the boot vCPUs.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-25 13:55:10 +00:00
+								    pub fn boot_vcpus(&self) -> u8 {
-												vmm: cpu: Save CpusConfig into CpuManager

Rather than saving the individual parts into the CpuManager save the
full struct as it now also contains the topology data.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-06-16 10:52:07 +00:00
+								        self.config.boot_vcpus
-												vmm: cpu: Introduce concept of maximum vs boot vCPUs in CpuManager

For now the max vCPUs is the same as the boot vCPUs.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-25 13:55:10 +00:00
+								    }
 								    pub fn max_vcpus(&self) -> u8 {
-												vmm: cpu: Save CpusConfig into CpuManager

Rather than saving the individual parts into the CpuManager save the
full struct as it now also contains the topology data.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-06-16 10:52:07 +00:00
+								        self.config.max_vcpus
-												vmm: cpu: Introduce concept of maximum vs boot vCPUs in CpuManager

For now the max vCPUs is the same as the boot vCPUs.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-25 13:55:10 +00:00
+								    }
-												vmm: cpu: Encapsulate vCPU state into its own struct

Currently this just holds the thread handle but will be enlarged to
encompass details such as whether the vCPU is currently being inserted
or ejected.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 11:32:36 +00:00
 								    fn present_vcpus(&self) -> u8 {
-												vmm: cpu: Create vCPU state for all possible vCPUs

This will make it more straightforward when we attempt to remove vCPUs.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 17:15:25 +00:00
+								        self.vcpu_states
 								            .iter()
 								            .fold(0, |acc, state| acc + state.active() as u8)
-												vmm: cpu: Encapsulate vCPU state into its own struct

Currently this just holds the thread handle but will be enlarged to
encompass details such as whether the vCPU is currently being inserted
or ejected.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 11:32:36 +00:00
+								    }
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
-												vmm: Enable VCPU for AArch64

Added MPIDR which is needed in system configuration.

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-06-09 07:24:23 +00:00
+								    #[cfg(target_arch = "aarch64")]
-												vmm: Configure VM on AArch64

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-06-09 10:28:02 +00:00
+								    pub fn get_mpidrs(&self) -> Vec<u64> {
-												vmm: Fix AArch64 clippy warnings of vmm and other crates

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-08-23 07:45:44 +00:00
+								        self.vcpus
-												vmm: Enable VCPU for AArch64

Added MPIDR which is needed in system configuration.

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-06-09 07:24:23 +00:00
+								            .iter()
 								            .map(|cpu| cpu.lock().unwrap().get_mpidr())
-												vmm: Fix AArch64 clippy warnings of vmm and other crates

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-08-23 07:45:44 +00:00
+								            .collect()
-												vmm: Enable VCPU for AArch64

Added MPIDR which is needed in system configuration.

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-06-09 07:24:23 +00:00
+								    }
-												vmm: AArch64: add methods to get saved vCPU states

The construction of `GICR_TYPER` register will need vCPU states.
Therefore this commit adds methods to extract saved vCPU states
from the cpu manager.

Signed-off-by: Henry Wang <Henry.Wang@arm.com>

											
										
										
											2020-09-04 15:37:52 +00:00
+								    #[cfg(target_arch = "aarch64")]
 								    /// Collects the saved state of every vCPU, in the order they appear in
 								    /// `self.vcpus`.
 								    ///
 								    /// # Panics
 								    ///
 								    /// Panics if a vCPU mutex is poisoned, or if `get_saved_state()` yields a
 								    /// value that `unwrap()` rejects for any vCPU.
 								    pub fn get_saved_states(&self) -> Vec<CpuState> {
 								        self.vcpus
 								            .iter()
 								            // Each vCPU is locked only for the duration of its own lookup.
 								            .map(|cpu| cpu.lock().unwrap().get_saved_state().unwrap())
 								            .collect()
 								    }
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								    #[cfg(feature = "acpi")]
 								    pub fn create_madt(&self) -> SDT {
 								        // This is also checked in the commandline parsing.
-												vmm: cpu: Save CpusConfig into CpuManager

Rather than saving the individual parts into the CpuManager save the
full struct as it now also contains the topology data.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-06-16 10:52:07 +00:00
+								        assert!(self.config.boot_vcpus <= self.config.max_vcpus);
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
 								        let mut madt = SDT::new(*b"APIC", 44, 5, *b"CLOUDH", *b"CHMADT  ", 1);
 								        madt.write(36, layout::APIC_START);
-												vmm: cpu: Save CpusConfig into CpuManager

Rather than saving the individual parts into the CpuManager save the
full struct as it now also contains the topology data.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-06-16 10:52:07 +00:00
+								        for cpu in 0..self.config.max_vcpus {
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								            let lapic = LocalAPIC {
 								                r#type: 0,
 								                length: 8,
 								                processor_id: cpu,
 								                apic_id: cpu,
-												vmm: cpu: Save CpusConfig into CpuManager

Rather than saving the individual parts into the CpuManager save the
full struct as it now also contains the topology data.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-06-16 10:52:07 +00:00
+								                flags: if cpu < self.config.boot_vcpus {
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+<< MADT_CPU_ENABLE_FLAG
 								                } else {
 
 								                },
 								            };
 								            madt.append(lapic);
 								        }
 								        madt.append(IOAPIC {
 								            r#type: 1,
 								            length: 12,
 								            ioapic_id: 0,
 								            apic_address: layout::IOAPIC_START.0 as u32,
 								            gsi_base: 0,
 								            ..Default::default()
 								        });
 								        madt.append(InterruptSourceOverride {
 								            r#type: 2,
 								            length: 10,
 								            bus: 0,
 								            source: 4,
 								            gsi: 4,
 								            flags: 0,
 								        });
 								        madt
 								    }
 								}
-												ci: Run clippy for each specific feature

The build is run against "--all-features", "pci,acpi", "pci" and "mmio"
separately. The clippy validation must be run against the same set of
features in order to validate the code is correct.

Because of these new checks, this commit includes multiple fixes
related to the errors generated when manually running the checks.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-01-21 08:32:50 +00:00
+								#[cfg(feature = "acpi")]
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
 								/// A single processor described to the guest through ACPI; the `Aml`
 								/// implementation for this type emits the matching AML device object.
+								struct CPU {
 								    // Used as the processor id, the APIC id, the `_UID`, and the numeric
 								    // part of the `Cnnn` device name when the AML is generated.
 								    cpu_id: u8,
 								}
-												ci: Run clippy for each specific feature

The build is run against "--all-features", "pci,acpi", "pci" and "mmio"
separately. The clippy validation must be run against the same set of
features in order to validate the code is correct.

Because of these new checks, this commit includes multiple fixes
related to the errors generated when manually running the checks.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-01-21 08:32:50 +00:00
+								#[cfg(feature = "acpi")]
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								const MADT_CPU_ENABLE_FLAG: usize = 0;
 								#[cfg(feature = "acpi")]
 								impl Aml for CPU {
 								    fn to_aml_bytes(&self) -> Vec<u8> {
 								        let lapic = LocalAPIC {
 								            r#type: 0,
 								            length: 8,
 								            processor_id: self.cpu_id,
 								            apic_id: self.cpu_id,
 								            flags: 1 << MADT_CPU_ENABLE_FLAG,
 								        };
 								        let mut mat_data: Vec<u8> = Vec::new();
 								        mat_data.resize(std::mem::size_of_val(&lapic), 0);
 								        unsafe { *(mat_data.as_mut_ptr() as *mut LocalAPIC) = lapic };
 								        aml::Device::new(
 								            format!("C{:03}", self.cpu_id).as_str().into(),
 								            vec![
 								                &aml::Name::new("_HID".into(), &"ACPI0007"),
 								                &aml::Name::new("_UID".into(), &self.cpu_id),
 								                /*
 								                _STA return value:
 								                Bit [0] – Set if the device is present.
 								                Bit [1] – Set if the device is enabled and decoding its resources.
 								                Bit [2] – Set if the device should be shown in the UI.
 								                Bit [3] – Set if the device is functioning properly (cleared if device failed its diagnostics).
 								                Bit [4] – Set if the battery is present.
 								                Bits [31:5] – Reserved (must be cleared).
 								                */
 								                &aml::Method::new(
 								                    "_STA".into(),
 ,
 								                    false,
 								                    // Call into CSTA method which will interrogate device
 								                    vec![&aml::Return::new(&aml::MethodCall::new(
 								                        "CSTA".into(),
 								                        vec![&self.cpu_id],
 								                    ))],
 								                ),
 								                // The Linux kernel expects every CPU device to have a _MAT entry
 								                // containing the LAPIC for this processor with the enabled bit set
 								                // even if it is disabled in the MADT (non-boot CPU)
 								                &aml::Name::new("_MAT".into(), &aml::Buffer::new(mat_data)),
-												vmm: cpu: Implement CPU removal

When the running OS has been told that a CPU should be removed it will
shut down the CPU and then signal to the hypervisor, via the "_EJ0" method
on the device that ultimately writes into an I/O port, that the vCPU
should be shut down. Upon notification the hypervisor signals to the
individual thread that it should shut down and waits for that thread to
end.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-17 11:22:33 +00:00
+								                // Trigger CPU ejection
 								                &aml::Method::new(
 								                    "_EJ0".into(),
 ,
 								                    false,
 								                    // Call into CEJ0 method which will actually eject device
 								                    vec![&aml::Return::new(&aml::MethodCall::new(
 								                        "CEJ0".into(),
 								                        vec![&self.cpu_id],
 								                    ))],
 								                ),
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								            ],
 								        )
 								        .to_aml_bytes()
 								    }
 								}
-												ci: Run clippy for each specific feature

The build is run against "--all-features", "pci,acpi", "pci" and "mmio"
separately. The clippy validation must be run against the same set of
features in order to validate the code is correct.

Because of these new checks, this commit includes multiple fixes
related to the errors generated when manually running the checks.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-01-21 08:32:50 +00:00
+								#[cfg(feature = "acpi")]
-												vmm: acpi: Refactor ACPI CPU notification

Continue to notify on all vCPUs but instead separate the notification
functionality into two methods, CSCN that walks through all the CPUs
and CTFY which notifies based on the numerical CPU id. This is an
interim step towards only notifying on changed CPUs and ultimately CPU
removal.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:09:24 +00:00
 								/// AML fragment that notifies one specific CPU device object.
+								struct CPUNotify {
 								    // Id compared against the first method argument and used to build the
 								    // `Cnnn` object path.
 								    cpu_id: u8,
 								}
 								#[cfg(feature = "acpi")]
 								impl Aml for CPUNotify {
 								    /// Emits `If (Arg0 == cpu_id) { Notify (Cnnn, Arg1) }`, where `Cnnn` is
 								    /// `cpu_id` formatted as a zero-padded three-digit name.
 								    fn to_aml_bytes(&self) -> Vec<u8> {
 								        // Same "C{:03}" naming scheme the CPU device object uses.
 								        let object = aml::Path::new(&format!("C{:03}", self.cpu_id));
 								        aml::If::new(
 								            &aml::Equal::new(&aml::Arg(0), &self.cpu_id),
 								            vec![&aml::Notify::new(&object, &aml::Arg(1))],
 								        )
 								        .to_aml_bytes()
 								    }
 								}
-												ci: Run clippy for each specific feature

The build is run against "--all-features", "pci,acpi", "pci" and "mmio"
separately. The clippy validation must be run against the same set of
features in order to validate the code is correct.

Because of these new checks, this commit includes multiple fixes
related to the errors generated when manually running the checks.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-01-21 08:32:50 +00:00
+								#[cfg(feature = "acpi")]
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								struct CPUMethods {
 								    max_vcpus: u8,
 								}
 								#[cfg(feature = "acpi")]
 								impl Aml for CPUMethods {
 								    fn to_aml_bytes(&self) -> Vec<u8> {
 								        let mut bytes = Vec::new();
 								        bytes.extend_from_slice(
 								            // CPU status method
 								            &aml::Method::new(
 								                "CSTA".into(),
 ,
 								                true,
 								                vec![
 								                    // Take lock defined above
 								                    &aml::Acquire::new("\\_SB_.PRES.CPLK".into(), 0xfff),
-												Revert "vmm: Move CpuManager device to MMIO region"

This reverts commit 980e03fa0ab3d217fe91fd60d8459507c903d88b.

											
										
										
											2020-01-24 10:36:39 +00:00
+								                    // Write CPU number (in first argument) to I/O port via field
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								                    &aml::Store::new(&aml::Path::new("\\_SB_.PRES.CSEL"), &aml::Arg(0)),
 								                    &aml::Store::new(&aml::Local(0), &aml::ZERO),
 								                    // Check if CPEN bit is set, if so make the local variable 0xf (see _STA for details of meaning)
 								                    &aml::If::new(
 								                        &aml::Equal::new(&aml::Path::new("\\_SB_.PRES.CPEN"), &aml::ONE),
 								                        vec![&aml::Store::new(&aml::Local(0), &0xfu8)],
 								                    ),
 								                    // Release lock
 								                    &aml::Release::new("\\_SB_.PRES.CPLK".into()),
 								                    // Return 0 or 0xf
 								                    &aml::Return::new(&aml::Local(0)),
 								                ],
 								            )
 								            .to_aml_bytes(),
 								        );
-												vmm: acpi: Refactor ACPI CPU notification

Continue to notify on all vCPUs but instead separate the notification
functionality into two methods, CSCN that walks through all the CPUs
and CTFY which notifies based on the numerical CPU id. This is an
interim step towards only notifying on changed CPUs and ultimately CPU
removal.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:09:24 +00:00
+								        let mut cpu_notifies = Vec::new();
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								        for cpu_id in 0..self.max_vcpus {
-												vmm: acpi: Refactor ACPI CPU notification

Continue to notify on all vCPUs but instead separate the notification
functionality into two methods, CSCN that walks through all the CPUs
and CTFY which notifies based on the numerical CPU id. This is an
interim step towards only notifying on changed CPUs and ultimately CPU
removal.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:09:24 +00:00
+								            cpu_notifies.push(CPUNotify { cpu_id });
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								        }
-												vmm: acpi: Refactor ACPI CPU notification

Continue to notify on all vCPUs but instead separate the notification
functionality into two methods, CSCN that walks through all the CPUs
and CTFY which notifies based on the numerical CPU id. This is an
interim step towards only notifying on changed CPUs and ultimately CPU
removal.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:09:24 +00:00
+								        let mut cpu_notifies_refs: Vec<&dyn aml::Aml> = Vec::new();
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								        for cpu_id in 0..self.max_vcpus {
-												vmm: acpi: Refactor ACPI CPU notification

Continue to notify on all vCPUs but instead separate the notification
functionality into two methods, CSCN that walks through all the CPUs
and CTFY which notifies based on the numerical CPU id. This is an
interim step towards only notifying on changed CPUs and ultimately CPU
removal.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:09:24 +00:00
+								            cpu_notifies_refs.push(&cpu_notifies[usize::from(cpu_id)]);
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								        }
-												vmm: acpi: Refactor ACPI CPU notification

Continue to notify on all vCPUs but instead separate the notification
functionality into two methods, CSCN that walks through all the CPUs
and CTFY which notifies based on the numerical CPU id. This is an
interim step towards only notifying on changed CPUs and ultimately CPU
removal.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:09:24 +00:00
+								        bytes.extend_from_slice(
 								            &aml::Method::new("CTFY".into(), 2, true, cpu_notifies_refs).to_aml_bytes(),
 								        );
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
-												vmm: cpu: Implement CPU removal

When the running OS has been told that a CPU should be removed it will
shut down the CPU and then signal to the hypervisor, via the "_EJ0" method
on the device that ultimately writes into an I/O port, that the vCPU
should be shut down. Upon notification the hypervisor signals to the
individual thread that it should shut down and waits for that thread to
end.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-17 11:22:33 +00:00
+								        bytes.extend_from_slice(
 								            &aml::Method::new(
 								                "CEJ0".into(),
 ,
 								                true,
 								                vec![
 								                    &aml::Acquire::new("\\_SB_.PRES.CPLK".into(), 0xfff),
-												Revert "vmm: Move CpuManager device to MMIO region"

This reverts commit 980e03fa0ab3d217fe91fd60d8459507c903d88b.

											
										
										
											2020-01-24 10:36:39 +00:00
+								                    // Write CPU number (in first argument) to I/O port via field
-												vmm: cpu: Implement CPU removal

When the running OS has been told that a CPU should be removed, it will
shut down the CPU and then signal to the hypervisor, via the "_EJ0" method
on the device that ultimately writes into an I/O port, that the vCPU
should be shut down. Upon notification the hypervisor signals to the
individual thread that it should shut down and waits for that thread to
end.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-17 11:22:33 +00:00
+								                    &aml::Store::new(&aml::Path::new("\\_SB_.PRES.CSEL"), &aml::Arg(0)),
 								                    // Set CEJ0 bit
 								                    &aml::Store::new(&aml::Path::new("\\_SB_.PRES.CEJ0"), &aml::ONE),
 								                    &aml::Release::new("\\_SB_.PRES.CPLK".into()),
 								                ],
 								            )
 								            .to_aml_bytes(),
 								        );
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								        bytes.extend_from_slice(
-												vmm: acpi: Refactor ACPI CPU notification

Continue to notify on all vCPUs but instead separate the notification
functionality into two methods, CSCN that walks through all the CPUs
and CTFY which notifies based on the numerical CPU id. This is an
interim step towards only notifying on changed CPUs and ultimately CPU
removal.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:09:24 +00:00
+								            &aml::Method::new(
 								                "CSCN".into(),
 ,
 								                true,
 								                vec![
-												vmm: cpu: Only do ACPI notify on newly added vCPUs

When we add a vCPU set an "inserting" boolean that is exposed as an ACPI
field that will be checked for and reset when the ACPI GED notification
for CPU devices happens.

This change is a precursor for CPU unplug.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:42:29 +00:00
+								                    // Take lock defined above
 								                    &aml::Acquire::new("\\_SB_.PRES.CPLK".into(), 0xfff),
-												vmm: acpi: Refactor ACPI CPU notification

Continue to notify on all vCPUs but instead separate the notification
functionality into two methods, CSCN that walks through all the CPUs
and CTFY which notifies based on the numerical CPU id. This is an
interim step towards only notifying on changed CPUs and ultimately CPU
removal.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:09:24 +00:00
+								                    &aml::Store::new(&aml::Local(0), &aml::ZERO),
 								                    &aml::While::new(
 								                        &aml::LessThan::new(&aml::Local(0), &self.max_vcpus),
 								                        vec![
-												Revert "vmm: Move CpuManager device to MMIO region"

This reverts commit 980e03fa0ab3d217fe91fd60d8459507c903d88b.

											
										
										
											2020-01-24 10:36:39 +00:00
+								                            // Write CPU number (in first argument) to I/O port via field
-												vmm: cpu: Only do ACPI notify on newly added vCPUs

When we add a vCPU set an "inserting" boolean that is exposed as an ACPI
field that will be checked for and reset when the ACPI GED notification
for CPU devices happens.

This change is a precursor for CPU unplug.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:42:29 +00:00
+								                            &aml::Store::new(&aml::Path::new("\\_SB_.PRES.CSEL"), &aml::Local(0)),
 								                            // Check if CINS bit is set
 								                            &aml::If::new(
 								                                &aml::Equal::new(&aml::Path::new("\\_SB_.PRES.CINS"), &aml::ONE),
 								                                // Notify device if it is
 								                                vec![
 								                                    &aml::MethodCall::new(
 								                                        "CTFY".into(),
 								                                        vec![&aml::Local(0), &aml::ONE],
 								                                    ),
 								                                    // Reset CINS bit
 								                                    &aml::Store::new(
 								                                        &aml::Path::new("\\_SB_.PRES.CINS"),
 								                                        &aml::ONE,
 								                                    ),
 								                                ],
 								                            ),
-												vmm: cpu: Notify guest OS that it should offline vCPUs

Allow the resizing of the number of vCPUs to less than the current
active vCPUs. This does not currently remove them from the system but
the kernel will take them offline.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-17 10:49:05 +00:00
+								                            // Check if CRMV bit is set
 								                            &aml::If::new(
 								                                &aml::Equal::new(&aml::Path::new("\\_SB_.PRES.CRMV"), &aml::ONE),
 								                                // Notify device if it is (with the eject constant 0x3)
 								                                vec![
 								                                    &aml::MethodCall::new(
 								                                        "CTFY".into(),
 								                                        vec![&aml::Local(0), &3u8],
 								                                    ),
 								                                    // Reset CRMV bit
 								                                    &aml::Store::new(
 								                                        &aml::Path::new("\\_SB_.PRES.CRMV"),
 								                                        &aml::ONE,
 								                                    ),
 								                                ],
 								                            ),
-												vmm: acpi: Refactor ACPI CPU notification

Continue to notify on all vCPUs but instead separate the notification
functionality into two methods, CSCN that walks through all the CPUs
and CTFY which notifies based on the numerical CPU id. This is an
interim step towards only notifying on changed CPUs and ultimately CPU
removal.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:09:24 +00:00
+								                            &aml::Add::new(&aml::Local(0), &aml::Local(0), &aml::ONE),
 								                        ],
 								                    ),
-												vmm: cpu: Only do ACPI notify on newly added vCPUs

When we add a vCPU set an "inserting" boolean that is exposed as an ACPI
field that will be checked for and reset when the ACPI GED notification
for CPU devices happens.

This change is a precursor for CPU unplug.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:42:29 +00:00
+								                    // Release lock
 								                    &aml::Release::new("\\_SB_.PRES.CPLK".into()),
-												vmm: acpi: Refactor ACPI CPU notification

Continue to notify on all vCPUs but instead separate the notification
functionality into two methods, CSCN that walks through all the CPUs
and CTFY which notifies based on the numerical CPU id. This is an
interim step towards only notifying on changed CPUs and ultimately CPU
removal.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:09:24 +00:00
+								                ],
 								            )
 								            .to_aml_bytes(),
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								        );
 								        bytes
 								    }
 								}
 								#[cfg(feature = "acpi")]
 								impl Aml for CpuManager {
 								    fn to_aml_bytes(&self) -> Vec<u8> {
 								        let mut bytes = Vec::new();
 								        // CPU hotplug controller
 								        bytes.extend_from_slice(
 								            &aml::Device::new(
 								                "_SB_.PRES".into(),
 								                vec![
 								                    &aml::Name::new("_HID".into(), &aml::EISAName::new("PNP0A06")),
-												devices: acpi: Add UID to devices with common HID

Some OS might check for duplicates and bail out, if it can't create a
distinct mapping. According to ACPI 5.0 section 6.1.12, while _UID is
optional, it becomes required when there are multiple devices with the
same _HID.

Signed-off-by: Anatol Belski <ab@php.net>

											
										
										
											2020-08-13 21:18:17 +00:00
+								                    &aml::Name::new("_UID".into(), &"CPU Hotplug Controller"),
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								                    // Mutex to protect concurrent access as we write to choose CPU and then read back status
 								                    &aml::Mutex::new("CPLK".into(), 0),
-												Revert "vmm: Move CpuManager device to MMIO region"

This reverts commit 980e03fa0ab3d217fe91fd60d8459507c903d88b.

											
										
										
											2020-01-24 10:36:39 +00:00
+								                    // I/O port for CPU controller
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								                    &aml::Name::new(
 								                        "_CRS".into(),
-												Revert "vmm: Move CpuManager device to MMIO region"

This reverts commit 980e03fa0ab3d217fe91fd60d8459507c903d88b.

											
										
										
											2020-01-24 10:36:39 +00:00
+								                        &aml::ResourceTemplate::new(vec![&aml::IO::new(
 x0cd8, 0x0cd8, 0x01, 0x0c,
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								                        )]),
 								                    ),
-												Revert "vmm: Move CpuManager device to MMIO region"

This reverts commit 980e03fa0ab3d217fe91fd60d8459507c903d88b.

											
										
										
											2020-01-24 10:36:39 +00:00
+								                    // OpRegion and Fields map I/O port into individual field values
 								                    &aml::OpRegion::new("PRST".into(), aml::OpRegionSpace::SystemIO, 0x0cd8, 0x0c),
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								                    &aml::Field::new(
 								                        "PRST".into(),
 								                        aml::FieldAccessType::Byte,
 								                        aml::FieldUpdateRule::WriteAsZeroes,
 								                        vec![
 								                            aml::FieldEntry::Reserved(32),
 								                            aml::FieldEntry::Named(*b"CPEN", 1),
 								                            aml::FieldEntry::Named(*b"CINS", 1),
 								                            aml::FieldEntry::Named(*b"CRMV", 1),
 								                            aml::FieldEntry::Named(*b"CEJ0", 1),
 								                            aml::FieldEntry::Reserved(4),
 								                            aml::FieldEntry::Named(*b"CCMD", 8),
 								                        ],
 								                    ),
 								                    &aml::Field::new(
 								                        "PRST".into(),
 								                        aml::FieldAccessType::DWord,
 								                        aml::FieldUpdateRule::Preserve,
 								                        vec![
 								                            aml::FieldEntry::Named(*b"CSEL", 32),
 								                            aml::FieldEntry::Reserved(32),
 								                            aml::FieldEntry::Named(*b"CDAT", 32),
 								                        ],
 								                    ),
 								                ],
 								            )
 								            .to_aml_bytes(),
 								        );
 								        // CPU devices
 								        let hid = aml::Name::new("_HID".into(), &"ACPI0010");
 								        let uid = aml::Name::new("_CID".into(), &aml::EISAName::new("PNP0A05"));
 								        // Bundle methods together under a common object
 								        let methods = CPUMethods {
-												vmm: cpu: Save CpusConfig into CpuManager

Rather than saving the individual parts into the CpuManager save the
full struct as it now also contains the topology data.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-06-16 10:52:07 +00:00
+								            max_vcpus: self.config.max_vcpus,
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								        };
 								        let mut cpu_data_inner: Vec<&dyn aml::Aml> = vec![&hid, &uid, &methods];
 								        let mut cpu_devices = Vec::new();
-												vmm: cpu: Save CpusConfig into CpuManager

Rather than saving the individual parts into the CpuManager save the
full struct as it now also contains the topology data.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-06-16 10:52:07 +00:00
+								        for cpu_id in 0..self.config.max_vcpus {
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								            let cpu_device = CPU { cpu_id };
 								            cpu_devices.push(cpu_device);
 								        }
 								        for cpu_device in cpu_devices.iter() {
 								            cpu_data_inner.push(cpu_device);
 								        }
 								        bytes.extend_from_slice(
 								            &aml::Device::new("_SB_.CPUS".into(), cpu_data_inner).to_aml_bytes(),
 								        );
 								        bytes
 								    }
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								}
-												vmm: cpu_manager: Implement the Pausable trait

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2019-11-21 18:04:08 +00:00
 								impl Pausable for CpuManager {
 								    fn pause(&mut self) -> std::result::Result<(), MigratableError> {
 								        // Tell the vCPUs to pause themselves next time they exit
 								        self.vcpus_pause_signalled.store(true, Ordering::SeqCst);
 								        // Signal to the spawned threads (vCPUs and console signal handler). For the vCPU threads
 								        // this will interrupt the KVM_RUN ioctl() allowing the loop to check the boolean set
 								        // above.
 								        for state in self.vcpu_states.iter() {
 								            state.signal_thread();
 								        }
-												vmm: Notify the guest about vCPUs being paused

Through the newly added API notify_guest_clock_paused(), this patch
improves the vCPU pause operation by letting the guest know that each
vCPU is being paused. This is important to avoid soft lockups detection
from the guest that could happen because the VM has been paused for more
than 20 seconds.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-06-17 11:11:26 +00:00
+								        for vcpu in self.vcpus.iter() {
-												vmm: Implement Pausable trait for Vcpu

We want each Vcpu to store the vCPU state upon VM pausing. This is the
reason why we need to explicitly implement the Pausable trait for the
Vcpu structure.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-06-24 09:59:17 +00:00
+								            let mut vcpu = vcpu.lock().unwrap();
 								            vcpu.pause()?;
-												hypervisor, vmm: Feature guard KVM specific code

Some code and functions are purely KVM specific for now: mshv does not
support them at the moment, although we plan to add that support in the
future. We therefore guard them behind the KVM feature. For example, KVM
has mp_state and CPU clock support, which mshv lacks. To keep the build
working, that code is now compiled only when KVM is enabled.

Signed-off-by: Muminul Islam <muislam@microsoft.com>

											
										
										
											2020-12-04 23:35:29 +00:00
+								            #[cfg(all(feature = "kvm", target_arch = "x86_64"))]
-												vmm: don't call notify_guest_clock_paused when Hyper-V emulation is on

We turn on that emulation for Windows. Windows does not have KVM's PV
clock, so calling notify_guest_clock_paused results in an error.

Signed-off-by: Wei Liu <liuwe@microsoft.com>

											
										
										
											2020-10-15 14:55:50 +00:00
+								            if !self.config.kvm_hyperv {
 								                vcpu.vcpu.notify_guest_clock_paused().map_err(|e| {
 								                    MigratableError::Pause(anyhow!(
 								                        "Could not notify guest it has been paused {:?}",
 								                        e
 								                    ))
 								                })?;
 								            }
-												vmm: Notify the guest about vCPUs being paused

Through the newly added API notify_guest_clock_paused(), this patch
improves the vCPU pause operation by letting the guest know that each
vCPU is being paused. This is important to avoid soft lockups detection
from the guest that could happen because the VM has been paused for more
than 20 seconds.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-06-17 11:11:26 +00:00
+								        }
-												vmm: cpu_manager: Implement the Pausable trait

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2019-11-21 18:04:08 +00:00
+								        Ok(())
 								    }
 								    fn resume(&mut self) -> std::result::Result<(), MigratableError> {
-												vmm: Implement Pausable trait for Vcpu

We want each Vcpu to store the vCPU state upon VM pausing. This is the
reason why we need to explicitly implement the Pausable trait for the
Vcpu structure.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-06-24 09:59:17 +00:00
+								        for vcpu in self.vcpus.iter() {
 								            vcpu.lock().unwrap().resume()?;
 								        }
-												vmm: cpu_manager: Implement the Pausable trait

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2019-11-21 18:04:08 +00:00
+								        // Toggle the vCPUs pause boolean
 								        self.vcpus_pause_signalled.store(false, Ordering::SeqCst);
 								        // Unpark all the VCPU threads.
 								        // Once unparked, the next thing they will do is checking for the pause
 								        // boolean. Since it'll be set to false, they will exit their pause loop
 								        // and go back to vmx root.
 								        for state in self.vcpu_states.iter() {
 								            state.unpark_thread();
 								        }
 								        Ok(())
 								    }
 								}
-												vmm: cpu: Implement the Snapshottable trait

Implement the Snapshottable trait for Vcpu, and then implement it for
CpuManager. Note that CpuManager goes through the Snapshottable
implementation of Vcpu for every vCPU in order to implement the
Snapshottable trait for itself.

Signed-off-by: Yi Sun <yi.y.sun@linux.intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-18 15:44:41 +00:00
+								impl Snapshottable for CpuManager {
 								    /// Returns the snapshot identifier of the `CpuManager`: the value of
 								    /// `CPU_MANAGER_SNAPSHOT_ID` converted into an owned `String`.
 								    fn id(&self) -> String {
 								        CPU_MANAGER_SNAPSHOT_ID.to_string()
 								    }
-												vm-migration: Make snapshot() mutable

There will be some cases where the implementation of the snapshot()
function from the Snapshottable trait will require to modify some
internal data, therefore we make this possible by updating the trait
definition with snapshot(&mut self).

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-08-21 12:31:58 +00:00
+								    fn snapshot(&mut self) -> std::result::Result<Snapshot, MigratableError> {
-												vmm: cpu: Implement the Snapshottable trait

Implement the Snapshottable trait for Vcpu, and then implement it for
CpuManager. Note that CpuManager goes through the Snapshottable
implementation of Vcpu for every vCPU in order to implement the
Snapshottable trait for itself.

Signed-off-by: Yi Sun <yi.y.sun@linux.intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-18 15:44:41 +00:00
+								        let mut cpu_manager_snapshot = Snapshot::new(CPU_MANAGER_SNAPSHOT_ID);
 								        // The CpuManager snapshot is a collection of all vCPUs snapshots.
 								        for vcpu in &self.vcpus {
 								            let cpu_snapshot = vcpu.lock().unwrap().snapshot()?;
 								            cpu_manager_snapshot.add_snapshot(cpu_snapshot);
 								        }
 								        Ok(cpu_manager_snapshot)
 								    }
 								    fn restore(&mut self, snapshot: Snapshot) -> std::result::Result<(), MigratableError> {
 								        for (cpu_id, snapshot) in snapshot.snapshots.iter() {
 								            debug!("Restoring VCPU {}", cpu_id);
-												vmm: refactor vCPU save/restore code in restoring VM

As in the VM booting process, on AArch64 systems the vCPUs should be
created before the creation of the GIC. This commit refactors the vCPU
save/restore code to achieve the above-mentioned restoring order.

Signed-off-by: Henry Wang <Henry.Wang@arm.com>

											
										
										
											2020-09-04 10:56:30 +00:00
+								            self.create_vcpu(cpu_id.parse::<u8>().unwrap(), None, Some(*snapshot.clone()))
-												vmm: Change booting process to cover AArch64 requirements

Between X86 and AArch64, there is some difference in booting a VM:
- X86_64 can setup IOAPIC before creating any VCPU.
- AArch64 have to create VCPU's before creating GIC.

The old process is:
1. load_kernel()
    load kernel binary
    configure system
2. activate_vcpus()
    create & start VCPU's

So we need to separate "activate_vcpus" into "create_vcpus" and
"activate_vcpus" (to start vcpus only). Setup GIC and create FDT
between the 2 steps.

The new procedure is:
1. load_kernel()
    load kernel binary
    (X86_64) configure system
2. create VCPU's
3. (AArch64) setup GIC
4. (AArch64) configure system
5. start VCPU's

Signed-off-by: Michael Zhao <michael.zhao@arm.com>

											
										
										
											2020-05-26 07:20:22 +00:00
+								                .map_err(|e| MigratableError::Restore(anyhow!("Could not create vCPU {:?}", e)))?;
-												vmm: cpu: Implement the Snapshottable trait

Implement the Snapshottable trait for Vcpu, and then implement it for
CpuManager. Note that CpuManager goes through the Snapshottable
implementation of Vcpu for every vCPU in order to implement the
Snapshottable trait for itself.

Signed-off-by: Yi Sun <yi.y.sun@linux.intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-18 15:44:41 +00:00
+								        }
 								        Ok(())
 								    }
 								}
-												vm-migration: Define the Snapshottable and Transportable traits

A Snapshottable component can snapshot itself and
provide a MigrationSnapshot payload as a result.

A MigrationSnapshot payload is a map of component IDs to a list of
migration sections (MigrationSection). As a component can be made of
several Migratable sub-components (e.g. the DeviceManager and its
device objects), a migration snapshot can itself be made of multiple
snapshots.
A snapshot is a list of migration sections, each section being a
component state snapshot. Having multiple sections allows for easier and
backward compatible migration payload extensions.

Once created, a migratable component snapshot may be transported and this
is what the Transportable trait defines, through 2 methods: send and recv.

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>
Signed-off-by: Yi Sun <yi.y.sun@linux.intel.com>

											
										
										
											2019-05-01 16:59:51 +00:00
+								impl Transportable for CpuManager {}
-												vmm: cpu_manager: Implement the Pausable trait

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2019-11-21 18:04:08 +00:00
+								impl Migratable for CpuManager {}
-												arch: move test cases to vmm crate

This saves us from adding a "kvm" feature to arch crate merely for the
purpose of running tests.

Signed-off-by: Wei Liu <liuwe@microsoft.com>

											
										
										
											2020-07-08 12:48:46 +00:00
-												hypervisor, vmm: Feature guard KVM specific code

Some code and functions are purely KVM specific for now: mshv does not
support them at the moment, although we plan to add that support in the
future. We therefore guard them behind the KVM feature. For example, KVM
has mp_state and CPU clock support, which mshv lacks. To keep the build
working, that code is now compiled only when KVM is enabled.

Signed-off-by: Muminul Islam <muislam@microsoft.com>

											
										
										
											2020-12-04 23:35:29 +00:00
+								#[cfg(all(feature = "kvm", target_arch = "x86_64"))]
-												arch: move test cases to vmm crate

This saves us from adding a "kvm" feature to arch crate merely for the
purpose of running tests.

Signed-off-by: Wei Liu <liuwe@microsoft.com>

											
										
										
											2020-07-08 12:48:46 +00:00
+								#[cfg(test)]
 								mod tests {
 								    use super::*;
 								    use arch::x86_64::interrupts::*;
 								    use arch::x86_64::regs::*;
 								    use arch::x86_64::BootProtocol;
 								    use hypervisor::x86_64::{FpuState, LapicState, SpecialRegisters, StandardRegisters};
 								    #[test]
 								    fn test_setlint() {
 								        let hv = hypervisor::new().unwrap();
 								        let vm = hv.create_vm().expect("new VM fd creation failed");
 								        assert!(hv.check_capability(hypervisor::kvm::Cap::Irqchip));
 								        // Calling get_lapic will fail if there is no irqchip before hand.
 								        assert!(vm.create_irq_chip().is_ok());
-												hypervisor, vmm: Remove shared ownership of VmmOps

This interface is used by the vCPU thread to delegate responsibility for
handling MMIO/PIO operations and to support different approaches than a
VM exit.

During profiling I found that we were spending 13.75% of the boot CPU
usage acquiring access to the object holding the VmmOps via
ArcSwap::load_full()

    13.75%     6.02%  vcpu0            cloud-hypervisor    [.] arc_swap::ArcSwapAny<T,S>::load_full
            |
            ---arc_swap::ArcSwapAny<T,S>::load_full
               |
                --13.43%--<hypervisor::kvm::KvmVcpu as hypervisor::cpu::Vcpu>::run
                          std::sys_common::backtrace::__rust_begin_short_backtrace
                          core::ops::function::FnOnce::call_once{{vtable-shim}}
                          std::sys::unix::thread::Thread::new::thread_start

However since the object implementing VmmOps does not need to be mutable
and it is only used from the vCPU side we can change the ownership to
being a simple Arc<> that is passed in when calling create_vcpu().

This completely removes the above CPU usage from subsequent profiles.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-11-18 16:37:52 +00:00
+								        let vcpu = vm.create_vcpu(0, None).unwrap();
-												arch: move test cases to vmm crate

This saves us from adding a "kvm" feature to arch crate merely for the
purpose of running tests.

Signed-off-by: Wei Liu <liuwe@microsoft.com>

											
										
										
											2020-07-08 12:48:46 +00:00
+								        let klapic_before: LapicState = vcpu.get_lapic().unwrap();
 								        // Compute the value that is expected to represent LVT0 and LVT1.
 								        let lint0 = get_klapic_reg(&klapic_before, APIC_LVT0);
 								        let lint1 = get_klapic_reg(&klapic_before, APIC_LVT1);
 								        let lint0_mode_expected = set_apic_delivery_mode(lint0, APIC_MODE_EXTINT);
 								        let lint1_mode_expected = set_apic_delivery_mode(lint1, APIC_MODE_NMI);
 								        set_lint(&vcpu).unwrap();
 								        // Compute the value that represents LVT0 and LVT1 after set_lint.
 								        let klapic_actual: LapicState = vcpu.get_lapic().unwrap();
 								        let lint0_mode_actual = get_klapic_reg(&klapic_actual, APIC_LVT0);
 								        let lint1_mode_actual = get_klapic_reg(&klapic_actual, APIC_LVT1);
 								        assert_eq!(lint0_mode_expected, lint0_mode_actual);
 								        assert_eq!(lint1_mode_expected, lint1_mode_actual);
 								    }
 								    #[test]
 								    fn test_setup_fpu() {
 								        let hv = hypervisor::new().unwrap();
 								        let vm = hv.create_vm().expect("new VM fd creation failed");
-												hypervisor, vmm: Remove shared ownership of VmmOps

This interface is used by the vCPU thread to delegate responsibility for
handling MMIO/PIO operations and to support different approaches than a
VM exit.

During profiling I found that we were spending 13.75% of the boot CPU
usage acquiring access to the object holding the VmmOps via
ArcSwap::load_full():

    13.75%     6.02%  vcpu0            cloud-hypervisor    [.] arc_swap::ArcSwapAny<T,S>::load_full
            |
            ---arc_swap::ArcSwapAny<T,S>::load_full
               |
                --13.43%--<hypervisor::kvm::KvmVcpu as hypervisor::cpu::Vcpu>::run
                          std::sys_common::backtrace::__rust_begin_short_backtrace
                          core::ops::function::FnOnce::call_once{{vtable-shim}}
                          std::sys::unix::thread::Thread::new::thread_start

However since the object implementing VmmOps does not need to be mutable
and it is only used from the vCPU side we can change the ownership to
being a simple Arc<> that is passed in when calling create_vcpu().

This completely removes the above CPU usage from subsequent profiles.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-11-18 16:37:52 +00:00
+								        let vcpu = vm.create_vcpu(0, None).unwrap();
-												arch: move test cases to vmm crate

This saves us from adding a "kvm" feature to arch crate merely for the
purpose of running tests.

Signed-off-by: Wei Liu <liuwe@microsoft.com>

											
										
										
											2020-07-08 12:48:46 +00:00
+								        setup_fpu(&vcpu).unwrap();
 								        let expected_fpu: FpuState = FpuState {
 								            fcw: 0x37f,
 								            mxcsr: 0x1f80,
 								            ..Default::default()
 								        };
 								        let actual_fpu: FpuState = vcpu.get_fpu().unwrap();
 								        // TODO: auto-generate kvm related structures with PartialEq on.
 								        assert_eq!(expected_fpu.fcw, actual_fpu.fcw);
 								        // Setting the mxcsr register from FpuState inside setup_fpu does not influence anything.
 								        // See 'kvm_arch_vcpu_ioctl_set_fpu' from arch/x86/kvm/x86.c.
 								        // The mxcsr will stay 0 and the assert below fails. Decide whether or not we should
 								        // remove it at all.
 								        // assert!(expected_fpu.mxcsr == actual_fpu.mxcsr);
 								    }
 								    #[test]
 								    fn test_setup_msrs() {
 								        use hypervisor::arch::x86::msr_index;
 								        use hypervisor::x86_64::{MsrEntries, MsrEntry};
 								        let hv = hypervisor::new().unwrap();
 								        let vm = hv.create_vm().expect("new VM fd creation failed");
-												hypervisor, vmm: Remove shared ownership of VmmOps

This interface is used by the vCPU thread to delegate responsibility for
handling MMIO/PIO operations and to support different approaches than a
VM exit.

During profiling I found that we were spending 13.75% of the boot CPU
usage acquiring access to the object holding the VmmOps via
ArcSwap::load_full():

    13.75%     6.02%  vcpu0            cloud-hypervisor    [.] arc_swap::ArcSwapAny<T,S>::load_full
            |
            ---arc_swap::ArcSwapAny<T,S>::load_full
               |
                --13.43%--<hypervisor::kvm::KvmVcpu as hypervisor::cpu::Vcpu>::run
                          std::sys_common::backtrace::__rust_begin_short_backtrace
                          core::ops::function::FnOnce::call_once{{vtable-shim}}
                          std::sys::unix::thread::Thread::new::thread_start

However since the object implementing VmmOps does not need to be mutable
and it is only used from the vCPU side we can change the ownership to
being a simple Arc<> that is passed in when calling create_vcpu().

This completely removes the above CPU usage from subsequent profiles.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-11-18 16:37:52 +00:00
+								        let vcpu = vm.create_vcpu(0, None).unwrap();
-												arch: move test cases to vmm crate

This saves us from adding a "kvm" feature to arch crate merely for the
purpose of running tests.

Signed-off-by: Wei Liu <liuwe@microsoft.com>

											
										
										
											2020-07-08 12:48:46 +00:00
+								        setup_msrs(&vcpu).unwrap();
 								        // This test will check against the last MSR entry configured (the tenth one).
 								        // See create_msr_entries for details.
 								        let mut msrs = MsrEntries::from_entries(&[MsrEntry {
 								            index: msr_index::MSR_IA32_MISC_ENABLE,
 								            ..Default::default()
 								        }]);
 								        // get_msrs returns the number of MSRs that it succeeded in reading. We only want to read 1
 								        // in this test case scenario.
 								        let read_msrs = vcpu.get_msrs(&mut msrs).unwrap();
 								        assert_eq!(read_msrs, 1);
 								        // Official entries that were set up when we did setup_msrs. We need to assert that the
 								        // tenth one (i.e. the one with index msr_index::MSR_IA32_MISC_ENABLE) has the data we
 								        // expect.
 								        let entry_vec = hypervisor::x86_64::boot_msr_entries();
 								        assert_eq!(entry_vec.as_slice()[9], msrs.as_slice()[0]);
 								    }
 								    #[test]
 								    fn test_setup_regs() {
 								        let hv = hypervisor::new().unwrap();
 								        let vm = hv.create_vm().expect("new VM fd creation failed");
-												hypervisor, vmm: Remove shared ownership of VmmOps

This interface is used by the vCPU thread to delegate responsibility for
handling MMIO/PIO operations and to support different approaches than a
VM exit.

During profiling I found that we were spending 13.75% of the boot CPU
usage acquiring access to the object holding the VmmOps via
ArcSwap::load_full():

    13.75%     6.02%  vcpu0            cloud-hypervisor    [.] arc_swap::ArcSwapAny<T,S>::load_full
            |
            ---arc_swap::ArcSwapAny<T,S>::load_full
               |
                --13.43%--<hypervisor::kvm::KvmVcpu as hypervisor::cpu::Vcpu>::run
                          std::sys_common::backtrace::__rust_begin_short_backtrace
                          core::ops::function::FnOnce::call_once{{vtable-shim}}
                          std::sys::unix::thread::Thread::new::thread_start

However since the object implementing VmmOps does not need to be mutable
and it is only used from the vCPU side we can change the ownership to
being a simple Arc<> that is passed in when calling create_vcpu().

This completely removes the above CPU usage from subsequent profiles.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-11-18 16:37:52 +00:00
+								        let vcpu = vm.create_vcpu(0, None).unwrap();
-												arch: move test cases to vmm crate

This saves us from adding a "kvm" feature to arch crate merely for the
purpose of running tests.

Signed-off-by: Wei Liu <liuwe@microsoft.com>

											
										
										
											2020-07-08 12:48:46 +00:00
 								        let expected_regs: StandardRegisters = StandardRegisters {
 								            rflags: 0x0000000000000002u64,
 								            rip: 1,
 								            rsp: 2,
 								            rbp: 2,
 								            rsi: 3,
 								            ..Default::default()
 								        };
 								        setup_regs(
 								            &vcpu,
 								            expected_regs.rip,
 								            expected_regs.rsp,
 								            expected_regs.rsi,
 								            BootProtocol::LinuxBoot,
 								        )
 								        .unwrap();
 								        let actual_regs: StandardRegisters = vcpu.get_regs().unwrap();
 								        assert_eq!(actual_regs, expected_regs);
 								    }
 								    #[test]
 								    fn test_setup_sregs() {
 								        let hv = hypervisor::new().unwrap();
 								        let vm = hv.create_vm().expect("new VM fd creation failed");
-												hypervisor, vmm: Remove shared ownership of VmmOps

This interface is used by the vCPU thread to delegate responsibility for
handling MMIO/PIO operations and to support different approaches than a
VM exit.

During profiling I found that we were spending 13.75% of the boot CPU
usage acquiring access to the object holding the VmmOps via
ArcSwap::load_full():

    13.75%     6.02%  vcpu0            cloud-hypervisor    [.] arc_swap::ArcSwapAny<T,S>::load_full
            |
            ---arc_swap::ArcSwapAny<T,S>::load_full
               |
                --13.43%--<hypervisor::kvm::KvmVcpu as hypervisor::cpu::Vcpu>::run
                          std::sys_common::backtrace::__rust_begin_short_backtrace
                          core::ops::function::FnOnce::call_once{{vtable-shim}}
                          std::sys::unix::thread::Thread::new::thread_start

However since the object implementing VmmOps does not need to be mutable
and it is only used from the vCPU side we can change the ownership to
being a simple Arc<> that is passed in when calling create_vcpu().

This completely removes the above CPU usage from subsequent profiles.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-11-18 16:37:52 +00:00
+								        let vcpu = vm.create_vcpu(0, None).unwrap();
-												arch: move test cases to vmm crate

This saves us from adding a "kvm" feature to arch crate merely for the
purpose of running tests.

Signed-off-by: Wei Liu <liuwe@microsoft.com>

											
										
										
											2020-07-08 12:48:46 +00:00
 								        let mut expected_sregs: SpecialRegisters = vcpu.get_sregs().unwrap();
-												vmm: cpu: Fix clippy issues inside test

Found by:  cargo clippy --all-features --all --tests

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-11-25 16:22:41 +00:00
+								        let gm = GuestMemoryMmap::from_ranges(&[(GuestAddress(0), 0x10000)]).unwrap();
-												arch: move test cases to vmm crate

This saves us from adding a "kvm" feature to arch crate merely for the
purpose of running tests.

Signed-off-by: Wei Liu <liuwe@microsoft.com>

											
										
										
											2020-07-08 12:48:46 +00:00
+								        configure_segments_and_sregs(&gm, &mut expected_sregs, BootProtocol::LinuxBoot).unwrap();
 								        setup_page_tables(&gm, &mut expected_sregs).unwrap();
 								        setup_sregs(&gm, &vcpu, BootProtocol::LinuxBoot).unwrap();
 								        let actual_sregs: SpecialRegisters = vcpu.get_sregs().unwrap();
 								        assert_eq!(expected_sregs, actual_sregs);
 								    }
 								}
 								#[cfg(target_arch = "aarch64")]
 								#[cfg(test)]
 								mod tests {
 								    use arch::aarch64::layout;
 								    use arch::aarch64::regs::*;
-												tests: AArch64: Add unit test cases for vCPU save/restore

Adds 3 more unit test cases for AArch64:

*save_restore_core_regs
*save_restore_system_regs
*get_set_mpstate

Signed-off-by: Henry Wang <Henry.Wang@arm.com>

											
										
										
											2020-08-30 12:50:19 +00:00
+								    use hypervisor::kvm::aarch64::{is_system_register, MPIDR_EL1};
-												AArch64: Preparation for vCPU save/restore

This commit ports code from firecracker and refactors the existing
AArch64 code as the preparation for implementing save/restore
AArch64 vCPU, including:

1. Modification of the `arm64_core_reg` macro to retrieve the index of
an arm64 core register and implementation of a helper to determine if
a register is a system register.

2. Move some macros and helpers in `arch` crate to the `hypervisor`
crate.

3. Added related unit tests for above functions and macros.

Signed-off-by: Henry Wang <Henry.Wang@arm.com>

											
										
										
											2020-08-28 09:06:54 +00:00
+								    use hypervisor::kvm::kvm_bindings::{
-												tests: AArch64: Add unit test cases for vCPU save/restore

Adds 3 more unit test cases for AArch64:

*save_restore_core_regs
*save_restore_system_regs
*get_set_mpstate

Signed-off-by: Henry Wang <Henry.Wang@arm.com>

											
										
										
											2020-08-30 12:50:19 +00:00
+								        kvm_one_reg, kvm_regs, kvm_vcpu_init, user_pt_regs, KVM_REG_ARM64, KVM_REG_ARM64_SYSREG,
 								        KVM_REG_ARM_CORE, KVM_REG_SIZE_U64,
-												AArch64: Preparation for vCPU save/restore

This commit ports code from firecracker and refactors the existing
AArch64 code as the preparation for implementing save/restore
AArch64 vCPU, including:

1. Modification of the `arm64_core_reg` macro to retrieve the index of
an arm64 core register and implementation of a helper to determine if
a register is a system register.

2. Move some macros and helpers in `arch` crate to the `hypervisor`
crate.

3. Added related unit tests for above functions and macros.

Signed-off-by: Henry Wang <Henry.Wang@arm.com>

											
										
										
											2020-08-28 09:06:54 +00:00
+								    };
 								    use hypervisor::{arm64_core_reg_id, offset__of};
 								    use std::mem;
-												arch: move test cases to vmm crate

This saves us from adding a "kvm" feature to arch crate merely for the
purpose of running tests.

Signed-off-by: Wei Liu <liuwe@microsoft.com>

											
										
										
											2020-07-08 12:48:46 +00:00
+								    use vm_memory::{GuestAddress, GuestMemoryMmap};
 								    #[test]
 								    fn test_setup_regs() {
 								        let hv = hypervisor::new().unwrap();
 								        let vm = hv.create_vm().unwrap();
-												hypervisor, vmm: Remove shared ownership of VmmOps

This interface is used by the vCPU thread to delegate responsibility for
handling MMIO/PIO operations and to support different approaches than a
VM exit.

During profiling I found that we were spending 13.75% of the boot CPU
usage acquiring access to the object holding the VmmOps via
ArcSwap::load_full():

    13.75%     6.02%  vcpu0            cloud-hypervisor    [.] arc_swap::ArcSwapAny<T,S>::load_full
            |
            ---arc_swap::ArcSwapAny<T,S>::load_full
               |
                --13.43%--<hypervisor::kvm::KvmVcpu as hypervisor::cpu::Vcpu>::run
                          std::sys_common::backtrace::__rust_begin_short_backtrace
                          core::ops::function::FnOnce::call_once{{vtable-shim}}
                          std::sys::unix::thread::Thread::new::thread_start

However since the object implementing VmmOps does not need to be mutable
and it is only used from the vCPU side we can change the ownership to
being a simple Arc<> that is passed in when calling create_vcpu().

This completely removes the above CPU usage from subsequent profiles.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-11-18 16:37:52 +00:00
+								        let vcpu = vm.create_vcpu(0, None).unwrap();
-												arch: move test cases to vmm crate

This saves us from adding a "kvm" feature to arch crate merely for the
purpose of running tests.

Signed-off-by: Wei Liu <liuwe@microsoft.com>

											
										
										
											2020-07-08 12:48:46 +00:00
+								        let mut regions = Vec::new();
 								        regions.push((
 								            GuestAddress(layout::RAM_64BIT_START),
 								            (layout::FDT_MAX_SIZE + 0x1000) as usize,
 								        ));
 								        let mem = GuestMemoryMmap::from_ranges(&regions).expect("Cannot initialize memory");
-												AArch64: Preparation for vCPU save/restore

This commit ports code from firecracker and refactors the existing
AArch64 code as the preparation for implementing save/restore
AArch64 vCPU, including:

1. Modification of the `arm64_core_reg` macro to retrieve the index of
an arm64 core register and implementation of a helper to determine if
a register is a system register.

2. Move some macros and helpers in `arch` crate to the `hypervisor`
crate.

3. Added related unit tests for above functions and macros.

Signed-off-by: Henry Wang <Henry.Wang@arm.com>

											
										
										
											2020-08-28 09:06:54 +00:00
+								        let res = setup_regs(&vcpu, 0, 0x0, &mem);
 								        // Must fail when vcpu is not initialized yet.
 								        assert!(res.is_err());
 								        let mut kvi: kvm_vcpu_init = kvm_vcpu_init::default();
-												arch: move test cases to vmm crate

This saves us from adding a "kvm" feature to arch crate merely for the
purpose of running tests.

Signed-off-by: Wei Liu <liuwe@microsoft.com>

											
										
										
											2020-07-08 12:48:46 +00:00
+								        vm.get_preferred_target(&mut kvi).unwrap();
 								        vcpu.vcpu_init(&kvi).unwrap();
 								        assert!(setup_regs(&vcpu, 0, 0x0, &mem).is_ok());
 								    }
 								    #[test]
 								    fn test_read_mpidr() {
 								        let hv = hypervisor::new().unwrap();
 								        let vm = hv.create_vm().unwrap();
-												hypervisor, vmm: Remove shared ownership of VmmOps

This interface is used by the vCPU thread to delegate responsibility for
handling MMIO/PIO operations and to support different approaches than a
VM exit.

During profiling I found that we were spending 13.75% of the boot CPU
usage acquiring access to the object holding the VmmOps via
ArcSwap::load_full():

    13.75%     6.02%  vcpu0            cloud-hypervisor    [.] arc_swap::ArcSwapAny<T,S>::load_full
            |
            ---arc_swap::ArcSwapAny<T,S>::load_full
               |
                --13.43%--<hypervisor::kvm::KvmVcpu as hypervisor::cpu::Vcpu>::run
                          std::sys_common::backtrace::__rust_begin_short_backtrace
                          core::ops::function::FnOnce::call_once{{vtable-shim}}
                          std::sys::unix::thread::Thread::new::thread_start

However since the object implementing VmmOps does not need to be mutable
and it is only used from the vCPU side we can change the ownership to
being a simple Arc<> that is passed in when calling create_vcpu().

This completely removes the above CPU usage from subsequent profiles.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-11-18 16:37:52 +00:00
+								        let vcpu = vm.create_vcpu(0, None).unwrap();
-												AArch64: Preparation for vCPU save/restore

This commit ports code from firecracker and refactors the existing
AArch64 code as the preparation for implementing save/restore
AArch64 vCPU, including:

1. Modification of the `arm64_core_reg` macro to retrieve the index of
an arm64 core register and implementation of a helper to determine if
a register is a system register.

2. Move some macros and helpers in `arch` crate to the `hypervisor`
crate.

3. Added related unit tests for above functions and macros.

Signed-off-by: Henry Wang <Henry.Wang@arm.com>

											
										
										
											2020-08-28 09:06:54 +00:00
+								        let mut kvi: kvm_vcpu_init = kvm_vcpu_init::default();
-												arch: move test cases to vmm crate

This saves us from adding a "kvm" feature to arch crate merely for the
purpose of running tests.

Signed-off-by: Wei Liu <liuwe@microsoft.com>

											
										
										
											2020-07-08 12:48:46 +00:00
+								        vm.get_preferred_target(&mut kvi).unwrap();
 								        // Must fail when vcpu is not initialized yet.
-												tests: AArch64: Add unit test cases for vCPU save/restore

Adds 3 more unit test cases for AArch64:

*save_restore_core_regs
*save_restore_system_regs
*get_set_mpstate

Signed-off-by: Henry Wang <Henry.Wang@arm.com>

											
										
										
											2020-08-30 12:50:19 +00:00
+								        assert!(vcpu.read_mpidr().is_err());
-												arch: move test cases to vmm crate

This saves us from adding a "kvm" feature to arch crate merely for the
purpose of running tests.

Signed-off-by: Wei Liu <liuwe@microsoft.com>

											
										
										
											2020-07-08 12:48:46 +00:00
 								        vcpu.vcpu_init(&kvi).unwrap();
-												tests: AArch64: Add unit test cases for vCPU save/restore

Adds 3 more unit test cases for AArch64:

*save_restore_core_regs
*save_restore_system_regs
*get_set_mpstate

Signed-off-by: Henry Wang <Henry.Wang@arm.com>

											
										
										
											2020-08-30 12:50:19 +00:00
+								        assert_eq!(vcpu.read_mpidr().unwrap(), 0x80000000);
-												arch: move test cases to vmm crate

This saves us from adding a "kvm" feature to arch crate merely for the
purpose of running tests.

Signed-off-by: Wei Liu <liuwe@microsoft.com>

											
										
										
											2020-07-08 12:48:46 +00:00
+								    }
-												AArch64: Preparation for vCPU save/restore

This commit ports code from firecracker and refactors the existing
AArch64 code as the preparation for implementing save/restore
AArch64 vCPU, including:

1. Modification of the `arm64_core_reg` macro to retrieve the index of
an arm64 core register and implementation of a helper to determine if
a register is a system register.

2. Move some macros and helpers in `arch` crate to the `hypervisor`
crate.

3. Added related unit tests for above functions and macros.

Signed-off-by: Henry Wang <Henry.Wang@arm.com>

											
										
										
											2020-08-28 09:06:54 +00:00
 								    /// Verifies that `is_system_register` rejects a core register id and accepts an id
 								    /// carrying the `KVM_REG_ARM64_SYSREG` bits.
 								    #[test]
 								    fn test_is_system_register() {
 								        // Core register id built from the `pc` field offset inside `user_pt_regs`.
 								        // The offset is bound to a local first and handed to the macro as a plain identifier.
 								        let pc_offset = offset__of!(user_pt_regs, pc);
 								        let core_reg_id = arm64_core_reg_id!(KVM_REG_SIZE_U64, pc_offset);
 								        assert!(!is_system_register(core_reg_id));
 								        // Id assembled by hand from the arm64, 64-bit size and sysreg constants.
 								        let sys_reg_id =
 								            KVM_REG_ARM64 as u64 | KVM_REG_SIZE_U64 as u64 | KVM_REG_ARM64_SYSREG as u64;
 								        assert!(is_system_register(sys_reg_id));
 								    }
-												tests: AArch64: Add unit test cases for vCPU save/restore

Adds 3 more unit test cases for AArch64:

*save_restore_core_regs
*save_restore_system_regs
*get_set_mpstate

Signed-off-by: Henry Wang <Henry.Wang@arm.com>

											
										
										
											2020-08-30 12:50:19 +00:00
 								    #[test]
 								    fn test_save_restore_core_regs() {
 								        let hv = hypervisor::new().unwrap();
 								        let vm = hv.create_vm().unwrap();
-												hypervisor, vmm: Remove shared ownership of VmmOps

This interface is used by the vCPU thread to delegate responsibility for
handling MMIO/PIO operations and to support different approaches than a
VM exit.

During profiling I found that we were spending 13.75% of the boot CPU
usage acquiring access to the object holding the VmmOps via
ArcSwap::load_full():

    13.75%     6.02%  vcpu0            cloud-hypervisor    [.] arc_swap::ArcSwapAny<T,S>::load_full
            |
            ---arc_swap::ArcSwapAny<T,S>::load_full
               |
                --13.43%--<hypervisor::kvm::KvmVcpu as hypervisor::cpu::Vcpu>::run
                          std::sys_common::backtrace::__rust_begin_short_backtrace
                          core::ops::function::FnOnce::call_once{{vtable-shim}}
                          std::sys::unix::thread::Thread::new::thread_start

However since the object implementing VmmOps does not need to be mutable
and it is only used from the vCPU side we can change the ownership to
being a simple Arc<> that is passed in when calling create_vcpu().

This completely removes the above CPU usage from subsequent profiles.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-11-18 16:37:52 +00:00
+								        let vcpu = vm.create_vcpu(0, None).unwrap();
-												tests: AArch64: Add unit test cases for vCPU save/restore

Adds 3 more unit test cases for AArch64:

*save_restore_core_regs
*save_restore_system_regs
*get_set_mpstate

Signed-off-by: Henry Wang <Henry.Wang@arm.com>

											
										
										
											2020-08-30 12:50:19 +00:00
+								        let mut kvi: kvm_vcpu_init = kvm_vcpu_init::default();
 								        vm.get_preferred_target(&mut kvi).unwrap();
 								        // Must fail when vcpu is not initialized yet.
 								        let mut state = kvm_regs::default();
 								        let res = vcpu.core_registers(&mut state);
 								        assert!(res.is_err());
 								        assert_eq!(
 								            format!("{}", res.unwrap_err()),
 								            "Failed to get core register: Exec format error (os error 8)"
 								        );
 								        let res = vcpu.set_core_registers(&mut state);
 								        assert!(res.is_err());
 								        assert_eq!(
 								            format!("{}", res.unwrap_err()),
 								            "Failed to set core register: Exec format error (os error 8)"
 								        );
 								        vcpu.vcpu_init(&kvi).unwrap();
 								        assert!(vcpu.core_registers(&mut state).is_ok());
 								        assert_eq!(state.regs.pstate, 0x3C5);
 								        assert!(vcpu.set_core_registers(&state).is_ok());
 								        let off = offset__of!(user_pt_regs, pstate);
 								        let pstate = vcpu
-												hypervisor, arch: rename "OneRegister" and relevant code

The OneRegister literally means "one (arbitrary) register". Just call it
"Register" instead. There is no need to inherit KVM's naming scheme in
the hypervisor agnostic code.

Signed-off-by: Wei Liu <liuwe@microsoft.com>

											
										
										
											2020-10-07 14:45:25 +00:00
+								            .get_reg(arm64_core_reg_id!(KVM_REG_SIZE_U64, off))
-												tests: AArch64: Add unit test cases for vCPU save/restore

Adds 3 more unit test cases for AArch64:

*save_restore_core_regs
*save_restore_system_regs
*get_set_mpstate

Signed-off-by: Henry Wang <Henry.Wang@arm.com>

											
										
										
											2020-08-30 12:50:19 +00:00
+								            .expect("Failed to call kvm get one reg");
 								        assert_eq!(state.regs.pstate, pstate);
 								    }
 								    #[test]
 								    fn test_save_restore_system_regs() {
 								        let hv = hypervisor::new().unwrap();
 								        let vm = hv.create_vm().unwrap();
-												hypervisor, vmm: Remove shared ownership of VmmOps

This interface is used by the vCPU thread to delegate responsibility for
handling MMIO/PIO operations and to support different approaches than a
VM exit.

During profiling I found that we were spending 13.75% of the boot CPU
usage acquiring access to the object holding the VmmOps via
ArcSwap::load_full():

    13.75%     6.02%  vcpu0            cloud-hypervisor    [.] arc_swap::ArcSwapAny<T,S>::load_full
            |
            ---arc_swap::ArcSwapAny<T,S>::load_full
               |
                --13.43%--<hypervisor::kvm::KvmVcpu as hypervisor::cpu::Vcpu>::run
                          std::sys_common::backtrace::__rust_begin_short_backtrace
                          core::ops::function::FnOnce::call_once{{vtable-shim}}
                          std::sys::unix::thread::Thread::new::thread_start

However since the object implementing VmmOps does not need to be mutable
and it is only used from the vCPU side we can change the ownership to
being a simple Arc<> that is passed in when calling create_vcpu().

This completely removes the above CPU usage from subsequent profiles.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-11-18 16:37:52 +00:00
+								        let vcpu = vm.create_vcpu(0, None).unwrap();
-												tests: AArch64: Add unit test cases for vCPU save/restore

Adds 3 more unit test cases for AArch64:

*save_restore_core_regs
*save_restore_system_regs
*get_set_mpstate

Signed-off-by: Henry Wang <Henry.Wang@arm.com>

											
										
										
											2020-08-30 12:50:19 +00:00
+								        let mut kvi: kvm_vcpu_init = kvm_vcpu_init::default();
 								        vm.get_preferred_target(&mut kvi).unwrap();
 								        // Must fail when vcpu is not initialized yet.
 								        let mut state: Vec<kvm_one_reg> = Vec::new();
 								        let res = vcpu.system_registers(&mut state);
 								        assert!(res.is_err());
 								        assert_eq!(
 								            format!("{}", res.unwrap_err()),
 								            "Failed to retrieve list of registers: Exec format error (os error 8)"
 								        );
 								        state.push(kvm_one_reg {
 								            id: MPIDR_EL1,
 								            addr: 0x00,
 								        });
 								        let res = vcpu.set_system_registers(&mut state);
 								        assert!(res.is_err());
 								        assert_eq!(
 								            format!("{}", res.unwrap_err()),
 								            "Failed to set system register: Exec format error (os error 8)"
 								        );
 								        vcpu.vcpu_init(&kvi).unwrap();
 								        assert!(vcpu.system_registers(&mut state).is_ok());
 								        let initial_mpidr: u64 = vcpu.read_mpidr().expect("Fail to read mpidr");
 								        assert!(state.contains(&kvm_one_reg {
 								            id: MPIDR_EL1,
 								            addr: initial_mpidr
 								        }));
 								        assert!(vcpu.set_system_registers(&state).is_ok());
 								        let mpidr: u64 = vcpu.read_mpidr().expect("Fail to read mpidr");
 								        assert_eq!(initial_mpidr, mpidr);
 								    }
 								    #[test]
 								    fn test_get_set_mpstate() {
 								        let hv = hypervisor::new().unwrap();
 								        let vm = hv.create_vm().unwrap();
-												hypervisor, vmm: Remove shared ownership of VmmOps

This interface is used by the vCPU thread to delegate responsibility for
handling MMIO/PIO operations and to support different approaches than a
VM exit.

During profiling I found that we were spending 13.75% of the boot CPU
usage acquiring access to the object holding the VmmOps via
ArcSwap::load_full():

    13.75%     6.02%  vcpu0            cloud-hypervisor    [.] arc_swap::ArcSwapAny<T,S>::load_full
            |
            ---arc_swap::ArcSwapAny<T,S>::load_full
               |
                --13.43%--<hypervisor::kvm::KvmVcpu as hypervisor::cpu::Vcpu>::run
                          std::sys_common::backtrace::__rust_begin_short_backtrace
                          core::ops::function::FnOnce::call_once{{vtable-shim}}
                          std::sys::unix::thread::Thread::new::thread_start

However since the object implementing VmmOps does not need to be mutable
and it is only used from the vCPU side we can change the ownership to
being a simple Arc<> that is passed in when calling create_vcpu().

This completely removes the above CPU usage from subsequent profiles.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-11-18 16:37:52 +00:00
+								        let vcpu = vm.create_vcpu(0, None).unwrap();
-												tests: AArch64: Add unit test cases for vCPU save/restore

Adds 3 more unit test cases for AArch64:

*save_restore_core_regs
*save_restore_system_regs
*get_set_mpstate

Signed-off-by: Henry Wang <Henry.Wang@arm.com>

											
										
										
											2020-08-30 12:50:19 +00:00
+								        let mut kvi: kvm_vcpu_init = kvm_vcpu_init::default();
 								        vm.get_preferred_target(&mut kvi).unwrap();
 								        let res = vcpu.get_mp_state();
 								        assert!(res.is_ok());
 								        assert!(vcpu.set_mp_state(res.unwrap()).is_ok());
 								    }
-												arch: move test cases to vmm crate

This saves us from adding a "kvm" feature to arch crate merely for the
purpose of running tests.

Signed-off-by: Wei Liu <liuwe@microsoft.com>

											
										
										
											2020-07-08 12:48:46 +00:00
+								}