cloud-hypervisor/vmm/src/cpu.rs

// Copyright © 2020, Oracle and/or its affiliates.
//
// Copyright 2018 Amazon.com, Inc. or its affiliates. All Rights Reserved.
//
// Portions Copyright 2017 The Chromium OS Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE-BSD-3-Clause file.
//
// Copyright © 2019 Intel Corporation
//
// SPDX-License-Identifier: Apache-2.0 AND BSD-3-Clause
//

use crate::config::CpusConfig;
use crate::device_manager::DeviceManager;
#[cfg(feature = "acpi")]
use acpi_tables::{aml, aml::Aml, sdt::SDT};
#[cfg(feature = "acpi")]
use arch::layout;
use arch::EntryPoint;
use devices::{ioapic, BusDevice};
use kvm_bindings::{
    kvm_fpu, kvm_lapic_state, kvm_mp_state, kvm_regs, kvm_sregs, kvm_vcpu_events, kvm_xcrs,
    kvm_xsave, CpuId, Msrs,
};
use kvm_ioctls::*;
use libc::{c_void, siginfo_t};
use serde_derive::{Deserialize, Serialize};
use std::cmp;
use std::os::unix::thread::JoinHandleExt;
use std::sync::atomic::{AtomicBool, Ordering};
use std::sync::{Arc, Barrier, Mutex};
use std::thread;
use std::{fmt, io, result};
use vm_memory::{Address, GuestAddress, GuestAddressSpace, GuestMemoryAtomic, GuestMemoryMmap};
use vm_migration::{Migratable, MigratableError, Pausable, Snapshottable, Transportable};
use vmm_sys_util::eventfd::EventFd;
use vmm_sys_util::signal::{register_signal_handler, SIGRTMIN};

// CPUID feature bits.
// Both values are bit positions inside the ECX register of a CPUID entry; they
// are used as `ecx_bit` patches for function 1 in `CpuManager::patch_cpuid`.
const TSC_DEADLINE_TIMER_ECX_BIT: u8 = 24; // tsc deadline timer ecx bit.
const HYPERVISOR_ECX_BIT: u8 = 31; // Hypervisor ecx bit.

// Debug I/O port: single-byte writes to this port are logged by the vCPU loop.
#[cfg(target_arch = "x86_64")]
const DEBUG_IOPORT: u16 = 0x80;
// Prefix shared by every `DebugIoPortRange` display string.
const DEBUG_IOPORT_PREFIX: &str = "Debug I/O port";

/// Category of a code written to the debug I/O port, see:
/// https://www.intel.com/content/www/us/en/support/articles/000005500/boards-and-kits.html
///
/// Since we're not a physical platform, we can freely assign code ranges for
/// debugging specific parts of our virtual platform.
pub enum DebugIoPortRange {
    /// Codes 0x00..=0x1f.
    Firmware,
    /// Codes 0x20..=0x3f.
    Bootloader,
    /// Codes 0x40..=0x5f.
    Kernel,
    /// Codes 0x60..=0x7f.
    Userspace,
    /// Every remaining code (0x80..=0xff).
    Custom,
}

impl DebugIoPortRange {
    /// Maps a raw debug code onto the range it belongs to.
    fn from_u8(value: u8) -> DebugIoPortRange {
        // Every named range spans 0x20 codes, so the range index is the code
        // divided by 0x20 (i.e. shifted right by five bits).
        match value >> 5 {
            0 => DebugIoPortRange::Firmware,
            1 => DebugIoPortRange::Bootloader,
            2 => DebugIoPortRange::Kernel,
            3 => DebugIoPortRange::Userspace,
            _ => DebugIoPortRange::Custom,
        }
    }
}

impl fmt::Display for DebugIoPortRange {
    /// Writes `"<prefix>: <range name>"`.
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        let range_name = match self {
            DebugIoPortRange::Firmware => "Firmware",
            DebugIoPortRange::Bootloader => "Bootloader",
            DebugIoPortRange::Kernel => "Kernel",
            DebugIoPortRange::Userspace => "Userspace",
            DebugIoPortRange::Custom => "Custom",
        };
        write!(f, "{}: {}", DEBUG_IOPORT_PREFIX, range_name)
    }
}

/// Errors reported by the vCPU and CPU manager code in this file.
///
/// Most variants wrap the underlying `kvm_ioctls`, `arch` or I/O error that
/// caused the failure.
#[derive(Debug)]
pub enum Error {
    /// Cannot open the VCPU file descriptor.
    VcpuFd(kvm_ioctls::Error),

    /// Cannot run the VCPUs.
    VcpuRun(kvm_ioctls::Error),

    /// Cannot spawn a new vCPU thread.
    VcpuSpawn(io::Error),

    /// Cannot patch the CPU ID
    PatchCpuId(kvm_ioctls::Error),

    #[cfg(target_arch = "x86_64")]
    /// Error configuring the general purpose registers
    REGSConfiguration(arch::x86_64::regs::Error),

    #[cfg(target_arch = "x86_64")]
    /// Error configuring the special registers
    SREGSConfiguration(arch::x86_64::regs::Error),

    #[cfg(target_arch = "x86_64")]
    /// Error configuring the floating point related registers
    FPUConfiguration(arch::x86_64::regs::Error),

    /// The call to KVM_SET_CPUID2 failed.
    SetSupportedCpusFailed(kvm_ioctls::Error),

    #[cfg(target_arch = "x86_64")]
    /// Cannot set the local interruption due to bad configuration.
    LocalIntConfiguration(arch::x86_64::interrupts::Error),

    #[cfg(target_arch = "x86_64")]
    /// Error configuring the MSR registers
    MSRSConfiguration(arch::x86_64::regs::Error),

    /// Unexpected KVM_RUN exit reason
    VcpuUnhandledKvmExit,

    /// Failed to join on vCPU threads
    ThreadCleanup(std::boxed::Box<dyn std::any::Any + std::marker::Send>),

    /// Cannot add legacy device to Bus.
    BusError(devices::BusError),

    /// Failed to allocate IO port
    AllocateIOPort,

    /// Asking for more vCPUs than we can have
    DesiredVCPUCountExceedsMax,

    /// Failed to get KVM vcpu lapic.
    VcpuGetLapic(kvm_ioctls::Error),

    /// Failed to set KVM vcpu lapic.
    VcpuSetLapic(kvm_ioctls::Error),

    /// Failed to get KVM vcpu MP state.
    VcpuGetMpState(kvm_ioctls::Error),

    /// Failed to set KVM vcpu MP state.
    VcpuSetMpState(kvm_ioctls::Error),

    /// Failed to get KVM vcpu msrs.
    VcpuGetMsrs(kvm_ioctls::Error),

    /// Failed to set KVM vcpu msrs.
    VcpuSetMsrs(kvm_ioctls::Error),

    /// Failed to get KVM vcpu regs.
    VcpuGetRegs(kvm_ioctls::Error),

    /// Failed to set KVM vcpu regs.
    VcpuSetRegs(kvm_ioctls::Error),

    /// Failed to get KVM vcpu sregs.
    VcpuGetSregs(kvm_ioctls::Error),

    /// Failed to set KVM vcpu sregs.
    VcpuSetSregs(kvm_ioctls::Error),

    /// Failed to get KVM vcpu events.
    VcpuGetVcpuEvents(kvm_ioctls::Error),

    /// Failed to set KVM vcpu events.
    VcpuSetVcpuEvents(kvm_ioctls::Error),

    /// Failed to get KVM vcpu FPU.
    VcpuGetFpu(kvm_ioctls::Error),

    /// Failed to set KVM vcpu FPU.
    VcpuSetFpu(kvm_ioctls::Error),

    /// Failed to get KVM vcpu XSAVE.
    VcpuGetXsave(kvm_ioctls::Error),

    /// Failed to set KVM vcpu XSAVE.
    VcpuSetXsave(kvm_ioctls::Error),

    /// Failed to get KVM vcpu XCRS.
    VcpuGetXcrs(kvm_ioctls::Error),

    /// Failed to set KVM vcpu XCRS.
    VcpuSetXcrs(kvm_ioctls::Error),
}
/// Result type used throughout this file, with `Error` as the error type.
pub type Result<T> = result::Result<T, Error>;

/// Selects which register of a CPUID entry `CpuidPatch::set_cpuid_reg`
/// overwrites.
// Not every variant is constructed in this file, hence the `dead_code` allowance.
#[allow(dead_code)]
#[derive(Copy, Clone)]
enum CpuidReg {
    EAX,
    EBX,
    ECX,
    EDX,
}

/// Describes bits to set in the CPUID entry identified by `function` and
/// `index`.
///
/// Each `*_bit` field is an optional bit position; when present,
/// `CpuidPatch::patch_cpuid` ORs `1 << bit` into the matching field of the
/// entry. `None` leaves that field untouched.
pub struct CpuidPatch {
    /// CPUID function (leaf) the patch applies to.
    pub function: u32,
    /// CPUID index (sub-leaf) the patch applies to.
    pub index: u32,
    /// Bit to set in the entry's `flags` field.
    pub flags_bit: Option<u8>,
    /// Bit to set in the entry's `eax` field.
    pub eax_bit: Option<u8>,
    /// Bit to set in the entry's `ebx` field.
    pub ebx_bit: Option<u8>,
    /// Bit to set in the entry's `ecx` field.
    pub ecx_bit: Option<u8>,
    /// Bit to set in the entry's `edx` field.
    pub edx_bit: Option<u8>,
}

impl CpuidPatch {
    /// Overwrites one register of every CPUID entry that matches.
    ///
    /// # Arguments
    ///
    /// * `cpuid` - CPUID table to modify in place.
    /// * `function` - CPUID function (leaf) an entry must have to be modified.
    /// * `index` - When `Some`, the entry's index must also match; when `None`
    ///   every entry of `function` is modified regardless of its index.
    /// * `reg` - Register of the entry to overwrite.
    /// * `value` - New value of that register (replaces the old value entirely).
    fn set_cpuid_reg(
        cpuid: &mut CpuId,
        function: u32,
        index: Option<u32>,
        reg: CpuidReg,
        value: u32,
    ) {
        let matching_entries = cpuid.as_mut_slice().iter_mut().filter(|entry| {
            entry.function == function && index.map_or(true, |wanted| wanted == entry.index)
        });

        for entry in matching_entries {
            match reg {
                CpuidReg::EAX => entry.eax = value,
                CpuidReg::EBX => entry.ebx = value,
                CpuidReg::ECX => entry.ecx = value,
                CpuidReg::EDX => entry.edx = value,
            }
        }
    }

    /// Applies every patch in `patches` to the entries of `cpuid` whose
    /// function and index both match the patch.
    ///
    /// Patches only ever set bits (`|=`); existing bits are never cleared.
    /// Bit positions are used as shift amounts on 32-bit fields, so they are
    /// expected to be below 32.
    pub fn patch_cpuid(cpuid: &mut CpuId, patches: Vec<CpuidPatch>) {
        for entry in cpuid.as_mut_slice().iter_mut() {
            for patch in patches.iter() {
                if entry.function != patch.function || entry.index != patch.index {
                    continue;
                }

                if let Some(flags_bit) = patch.flags_bit {
                    entry.flags |= 1 << flags_bit;
                }
                if let Some(eax_bit) = patch.eax_bit {
                    entry.eax |= 1 << eax_bit;
                }
                if let Some(ebx_bit) = patch.ebx_bit {
                    entry.ebx |= 1 << ebx_bit;
                }
                if let Some(ecx_bit) = patch.ecx_bit {
                    entry.ecx |= 1 << ecx_bit;
                }
                if let Some(edx_bit) = patch.edx_bit {
                    entry.edx |= 1 << edx_bit;
                }
            }
        }
    }
}

/// Local APIC entry, one per vCPU.
///
/// In this file it is appended to the MADT by `CpuManager::create_madt` and
/// copied into the `_MAT` buffer of each CPU device (both with `r#type` 0 and
/// `length` 8). `#[repr(packed)]` removes padding so the struct can be copied
/// byte-for-byte.
#[cfg(feature = "acpi")]
#[repr(packed)]
struct LocalAPIC {
    // Entry type; this file always uses 0.
    pub r#type: u8,
    // Entry length in bytes; this file always uses 8.
    pub length: u8,
    // Set to the vCPU number in this file.
    pub processor_id: u8,
    // Set to the vCPU number in this file.
    pub apic_id: u8,
    // Bit `MADT_CPU_ENABLE_FLAG` marks the CPU as enabled.
    pub flags: u32,
}

/// I/O APIC entry appended to the MADT by `CpuManager::create_madt`
/// (with `r#type` 1 and `length` 12).
#[repr(packed)]
#[derive(Default)]
struct IOAPIC {
    // Entry type; `create_madt` uses 1.
    pub r#type: u8,
    // Entry length in bytes; `create_madt` uses 12.
    pub length: u8,
    pub ioapic_id: u8,
    // Left at its default (zero) by `create_madt`.
    _reserved: u8,
    // `create_madt` stores `layout::IOAPIC_START` truncated to 32 bits here.
    pub apic_address: u32,
    pub gsi_base: u32,
}

/// Interrupt source override entry appended to the MADT by
/// `CpuManager::create_madt` (with `r#type` 2 and `length` 10).
#[repr(packed)]
#[derive(Default)]
struct InterruptSourceOverride {
    // Entry type; `create_madt` uses 2.
    pub r#type: u8,
    // Entry length in bytes; `create_madt` uses 10.
    pub length: u8,
    pub bus: u8,
    // Source interrupt being overridden.
    pub source: u8,
    // Global system interrupt the source is routed to.
    pub gsi: u32,
    pub flags: u16,
}

/// A wrapper around creating and using a kvm-based VCPU.
pub struct Vcpu {
    /// KVM handle of this vCPU; all register accesses and `run` go through it.
    fd: VcpuFd,
    /// vCPU number passed to `create_vcpu`; `configure` also writes it into
    /// EDX of CPUID function 0xb.
    id: u8,
    /// Bus that services port I/O exits (`IoIn` / `IoOut`).
    io_bus: Arc<devices::Bus>,
    /// Bus that services MMIO exits (`MmioRead` / `MmioWrite`).
    mmio_bus: Arc<devices::Bus>,
    /// Optional IOAPIC that is told about `IoapicEoi` exits.
    ioapic: Option<Arc<Mutex<ioapic::Ioapic>>>,
    /// Reference instant used to timestamp debug I/O port writes.
    vm_ts: std::time::Instant,
}

/// Snapshot of the KVM-side state of one vCPU.
///
/// Filled in by `Vcpu::kvm_state` (one field per KVM "get" call) and consumed
/// by `Vcpu::set_kvm_state`. Derives `Serialize`/`Deserialize` so it can be
/// stored or transferred.
#[derive(Clone, Serialize, Deserialize)]
pub struct VcpuKvmState {
    // Model specific registers; `kvm_state` reads the set returned by
    // `arch::x86_64::regs::boot_msr_entries()`.
    msrs: Msrs,
    vcpu_events: kvm_vcpu_events,
    // General purpose registers.
    regs: kvm_regs,
    // Special registers.
    sregs: kvm_sregs,
    fpu: kvm_fpu,
    lapic_state: kvm_lapic_state,
    xsave: kvm_xsave,
    xcrs: kvm_xcrs,
    mp_state: kvm_mp_state,
}

impl Vcpu {
    /// Constructs a new VCPU for `vm`.
    ///
    /// # Arguments
    ///
    /// * `id` - Represents the CPU number between [0, max vcpus).
    /// * `vm` - The virtual machine this vcpu will get attached to.
    pub fn new(
        id: u8,
        fd: &Arc<VmFd>,
        io_bus: Arc<devices::Bus>,
        mmio_bus: Arc<devices::Bus>,
        ioapic: Option<Arc<Mutex<ioapic::Ioapic>>>,
        creation_ts: std::time::Instant,
    ) -> Result<Arc<Mutex<Self>>> {
        let kvm_vcpu = fd.create_vcpu(id).map_err(Error::VcpuFd)?;
        // Initially the cpuid per vCPU is the one supported by this VM.
        Ok(Arc::new(Mutex::new(Vcpu {
            fd: kvm_vcpu,
            id,
            io_bus,
            mmio_bus,
            ioapic,
            vm_ts: creation_ts,
        })))
    }

    /// Configures a x86_64 specific vcpu and should be called once per vcpu from the vcpu's thread.
    ///
    /// # Arguments
    ///
    /// * `machine_config` - Specifies necessary info used for the CPUID configuration.
    /// * `kernel_entry_point` - Kernel entry point address in guest memory and boot protocol used.
    /// * `vm` - The virtual machine this vcpu will get attached to.
    pub fn configure(
        &mut self,
        kernel_entry_point: Option<EntryPoint>,
        vm_memory: &GuestMemoryAtomic<GuestMemoryMmap>,
        cpuid: CpuId,
    ) -> Result<()> {
        let mut cpuid = cpuid;
        CpuidPatch::set_cpuid_reg(&mut cpuid, 0xb, None, CpuidReg::EDX, u32::from(self.id));
        self.fd
            .set_cpuid2(&cpuid)
            .map_err(Error::SetSupportedCpusFailed)?;

        arch::x86_64::regs::setup_msrs(&self.fd).map_err(Error::MSRSConfiguration)?;
        if let Some(kernel_entry_point) = kernel_entry_point {
            // Safe to unwrap because this method is called after the VM is configured
            arch::x86_64::regs::setup_regs(
                &self.fd,
                kernel_entry_point.entry_addr.raw_value(),
                arch::x86_64::layout::BOOT_STACK_POINTER.raw_value(),
                arch::x86_64::layout::ZERO_PAGE_START.raw_value(),
                kernel_entry_point.protocol,
            )
            .map_err(Error::REGSConfiguration)?;
            arch::x86_64::regs::setup_fpu(&self.fd).map_err(Error::FPUConfiguration)?;
            arch::x86_64::regs::setup_sregs(
                &vm_memory.memory(),
                &self.fd,
                kernel_entry_point.protocol,
            )
            .map_err(Error::SREGSConfiguration)?;
        }
        arch::x86_64::interrupts::set_lint(&self.fd).map_err(Error::LocalIntConfiguration)?;
        Ok(())
    }

    /// Runs the VCPU until it exits, returning the reason.
    ///
    /// Note that the state of the VCPU and associated VM must be setup first for this to do
    /// anything useful.
    pub fn run(&self) -> Result<bool> {
        match self.fd.run() {
            Ok(run) => match run {
                VcpuExit::IoIn(addr, data) => {
                    self.io_bus.read(u64::from(addr), data);
                    Ok(true)
                }
                VcpuExit::IoOut(addr, data) => {
                    if addr == DEBUG_IOPORT && data.len() == 1 {
                        self.log_debug_ioport(data[0]);
                    }
                    self.io_bus.write(u64::from(addr), data);
                    Ok(true)
                }
                VcpuExit::MmioRead(addr, data) => {
                    self.mmio_bus.read(addr as u64, data);
                    Ok(true)
                }
                VcpuExit::MmioWrite(addr, data) => {
                    self.mmio_bus.write(addr as u64, data);
                    Ok(true)
                }
                VcpuExit::IoapicEoi(vector) => {
                    if let Some(ioapic) = &self.ioapic {
                        ioapic.lock().unwrap().end_of_interrupt(vector);
                    }
                    Ok(true)
                }
                VcpuExit::Shutdown => {
                    // Triple fault to trigger a reboot
                    Ok(false)
                }
                r => {
                    error!("Unexpected exit reason on vcpu run: {:?}", r);
                    Err(Error::VcpuUnhandledKvmExit)
                }
            },

            Err(ref e) => match e.errno() {
                libc::EAGAIN | libc::EINTR => Ok(true),
                _ => {
                    error!("VCPU {:?} error {:?}", self.id, e);
                    Err(Error::VcpuUnhandledKvmExit)
                }
            },
        }
    }

    /// Logs a code written to the debug I/O port together with the time
    /// elapsed since `vm_ts`, formatted as `<seconds>.<microseconds>`.
    fn log_debug_ioport(&self, code: u8) {
        let ts = self.vm_ts.elapsed();

        debug!(
            "[{} code 0x{:x}] {}.{:>06} seconds",
            DebugIoPortRange::from_u8(code),
            code,
            ts.as_secs(),
            // Only the sub-second part belongs after the decimal point;
            // `as_micros()` would repeat the whole seconds in microseconds.
            ts.subsec_micros()
        );
    }

    #[allow(unused)]
    fn kvm_state(&self) -> Result<VcpuKvmState> {
        let mut msrs = arch::x86_64::regs::boot_msr_entries();
        self.fd.get_msrs(&mut msrs).map_err(Error::VcpuGetMsrs)?;

        let vcpu_events = self
            .fd
            .get_vcpu_events()
            .map_err(Error::VcpuGetVcpuEvents)?;
        let regs = self.fd.get_regs().map_err(Error::VcpuGetRegs)?;
        let sregs = self.fd.get_sregs().map_err(Error::VcpuGetSregs)?;
        let lapic_state = self.fd.get_lapic().map_err(Error::VcpuGetLapic)?;
        let fpu = self.fd.get_fpu().map_err(Error::VcpuGetFpu)?;
        let xsave = self.fd.get_xsave().map_err(Error::VcpuGetXsave)?;
        let xcrs = self.fd.get_xcrs().map_err(Error::VcpuGetXsave)?;
        let mp_state = self.fd.get_mp_state().map_err(Error::VcpuGetMpState)?;

        Ok(VcpuKvmState {
            msrs,
            vcpu_events,
            regs,
            sregs,
            fpu,
            lapic_state,
            xsave,
            xcrs,
            mp_state,
        })
    }

    #[allow(unused)]
    fn set_kvm_state(&mut self, state: &VcpuKvmState) -> Result<()> {
        self.fd.set_regs(&state.regs).map_err(Error::VcpuSetRegs)?;

        self.fd.set_fpu(&state.fpu).map_err(Error::VcpuSetFpu)?;

        self.fd
            .set_xsave(&state.xsave)
            .map_err(Error::VcpuSetXsave)?;

        self.fd
            .set_sregs(&state.sregs)
            .map_err(Error::VcpuSetSregs)?;

        self.fd.set_xcrs(&state.xcrs).map_err(Error::VcpuSetXcrs)?;

        self.fd.set_msrs(&state.msrs).map_err(Error::VcpuSetMsrs)?;

        self.fd
            .set_lapic(&state.lapic_state)
            .map_err(Error::VcpuSetLapic)?;

        self.fd
            .set_mp_state(state.mp_state)
            .map_err(Error::VcpuSetMpState)?;

        Ok(())
    }
}

/// Owns the vCPUs of a VM: creates and starts their threads, handles
/// resizing and shutdown, and is itself registered on the I/O bus as the
/// device the guest uses to query and eject CPUs.
pub struct CpuManager {
    /// Number of vCPUs started by `start_boot_vcpus`.
    boot_vcpus: u8,
    /// Upper bound on the number of vCPUs; also the length `vcpu_states` is
    /// created with.
    max_vcpus: u8,
    /// Buses and IOAPIC handed to every `Vcpu` that gets created.
    io_bus: Arc<devices::Bus>,
    mmio_bus: Arc<devices::Bus>,
    ioapic: Option<Arc<Mutex<ioapic::Ioapic>>>,
    /// Guest memory passed to `Vcpu::configure`.
    vm_memory: GuestMemoryAtomic<GuestMemoryMmap>,
    /// Patched CPUID table (see `patch_cpuid`), cloned for each vCPU.
    cpuid: CpuId,
    /// VM handle used to create vCPUs.
    fd: Arc<VmFd>,
    /// Set by `shutdown` to make every vCPU thread leave its run loop.
    vcpus_kill_signalled: Arc<AtomicBool>,
    /// While set, vCPU threads park themselves instead of running.
    vcpus_pause_signalled: Arc<AtomicBool>,
    /// Written by a vCPU thread when the guest shuts down (triple fault).
    reset_evt: EventFd,
    /// Per-vCPU bookkeeping, indexed by vCPU id.
    vcpu_states: Vec<VcpuState>,
    /// vCPU id last written by the guest to the selection register.
    selected_cpu: u8,
    /// Every `Vcpu` created by `start_vcpu`, in creation order.
    vcpus: Vec<Arc<Mutex<Vcpu>>>,
}

// Bit positions inside the byte exchanged at `CPU_STATUS_OFFSET`.
// Reported on read when the selected vCPU has a running thread.
const CPU_ENABLE_FLAG: usize = 0;
// Reported on read while an insertion is pending; written back to acknowledge it.
const CPU_INSERTING_FLAG: usize = 1;
// Reported on read while a removal is pending; written back to acknowledge it.
const CPU_REMOVING_FLAG: usize = 2;
// Written by the guest to eject (stop) the selected vCPU.
const CPU_EJECT_FLAG: usize = 3;

// Register offsets, relative to the base the device is inserted at on the I/O bus.
const CPU_STATUS_OFFSET: u64 = 4;
const CPU_SELECTION_OFFSET: u64 = 0;

impl BusDevice for CpuManager {
    /// Handles a guest read from the CPU manager device.
    ///
    /// Only `CPU_STATUS_OFFSET` is readable: the first byte of `data`
    /// receives the enable/inserting/removing flags of the vCPU last chosen
    /// through the selection register. Any other offset only logs a warning.
    /// `data` is always zeroed first, so unset flags and unknown offsets read
    /// as zero.
    fn read(&mut self, _base: u64, offset: u64, data: &mut [u8]) {
        // The flags are OR-ed in below, so start from a known-zero buffer
        // instead of trusting whatever the caller left in it.
        for byte in data.iter_mut() {
            *byte = 0;
        }

        match offset {
            CPU_STATUS_OFFSET => {
                // Bound the lookup by the state table itself rather than by the
                // number of active vCPUs: ids stop being contiguous once a vCPU
                // in the middle has been ejected, and the selection is guest
                // controlled.
                let selected = self.vcpu_states.get(usize::from(self.selected_cpu));
                if let (Some(state), Some(status)) = (selected, data.first_mut()) {
                    if state.active() {
                        *status |= 1 << CPU_ENABLE_FLAG;
                    }
                    if state.inserting {
                        *status |= 1 << CPU_INSERTING_FLAG;
                    }
                    if state.removing {
                        *status |= 1 << CPU_REMOVING_FLAG;
                    }
                }
            }
            _ => {
                warn!(
                    "Unexpected offset for accessing CPU manager device: {:#}",
                    offset
                );
            }
        }
    }

    /// Handles a guest write to the CPU manager device.
    ///
    /// * `CPU_SELECTION_OFFSET` - selects the vCPU that later status accesses
    ///   refer to.
    /// * `CPU_STATUS_OFFSET` - acknowledges a pending insertion/removal and/or
    ///   requests ejection of the selected vCPU.
    ///
    /// Empty writes and status writes for a vCPU id outside the state table
    /// are ignored; the selection comes from the guest, so it must never be
    /// able to panic the VMM.
    fn write(&mut self, _base: u64, offset: u64, data: &[u8]) {
        let value = match data.first() {
            Some(value) => *value,
            None => return,
        };

        match offset {
            CPU_SELECTION_OFFSET => {
                self.selected_cpu = value;
            }
            CPU_STATUS_OFFSET => {
                let cpu_id = self.selected_cpu;
                let state = match self.vcpu_states.get_mut(usize::from(cpu_id)) {
                    Some(state) => state,
                    None => {
                        warn!("Ignoring status write for out of range vCPU {}", cpu_id);
                        return;
                    }
                };

                // The ACPI code writes back a 1 to acknowledge the insertion
                if (value & (1 << CPU_INSERTING_FLAG)) != 0 && state.inserting {
                    state.inserting = false;
                }
                // Ditto for removal
                if (value & (1 << CPU_REMOVING_FLAG)) != 0 && state.removing {
                    state.removing = false;
                }
                // Trigger removal of vCPU
                if (value & (1 << CPU_EJECT_FLAG)) != 0 {
                    if let Err(e) = self.remove_vcpu(cpu_id) {
                        error!("Error removing vCPU: {:?}", e);
                    }
                }
            }
            _ => {
                warn!(
                    "Unexpected offset for accessing CPU manager device: {:#}",
                    offset
                );
            }
        }
    }
}

/// Bookkeeping the `CpuManager` keeps for one vCPU slot.
#[derive(Default)]
struct VcpuState {
    // Set when the vCPU was hot-added; cleared once the guest acknowledges it.
    inserting: bool,
    // Set when the vCPU is marked for removal; cleared once the guest acknowledges it.
    removing: bool,
    // Join handle of the vCPU thread; `Some` means the vCPU is active.
    handle: Option<thread::JoinHandle<()>>,
    // Per-vCPU stop request, checked by the vCPU thread after every run.
    kill: Arc<AtomicBool>,
}

impl VcpuState {
    fn active(&self) -> bool {
        self.handle.is_some()
    }

    fn signal_thread(&self) {
        if let Some(handle) = self.handle.as_ref() {
            unsafe {
                libc::pthread_kill(handle.as_pthread_t(), SIGRTMIN());
            }
        }
    }

    fn join_thread(&mut self) -> Result<()> {
        if let Some(handle) = self.handle.take() {
            handle.join().map_err(Error::ThreadCleanup)?
        }

        Ok(())
    }

    fn unpark_thread(&self) {
        if let Some(handle) = self.handle.as_ref() {
            handle.thread().unpark()
        }
    }
}

impl CpuManager {
    pub fn new(
        config: &CpusConfig,
        device_manager: &Arc<Mutex<DeviceManager>>,
        guest_memory: GuestMemoryAtomic<GuestMemoryMmap>,
        kvm: &Kvm,
        fd: Arc<VmFd>,
        reset_evt: EventFd,
    ) -> Result<Arc<Mutex<CpuManager>>> {
        let mut vcpu_states = Vec::with_capacity(usize::from(config.max_vcpus));
        vcpu_states.resize_with(usize::from(config.max_vcpus), VcpuState::default);

        let device_manager = device_manager.lock().unwrap();
        let cpuid = CpuManager::patch_cpuid(kvm)?;
        let cpu_manager = Arc::new(Mutex::new(CpuManager {
            boot_vcpus: config.boot_vcpus,
            max_vcpus: config.max_vcpus,
            io_bus: device_manager.io_bus().clone(),
            mmio_bus: device_manager.mmio_bus().clone(),
            ioapic: device_manager.ioapic().clone(),
            vm_memory: guest_memory,
            cpuid,
            fd,
            vcpus_kill_signalled: Arc::new(AtomicBool::new(false)),
            vcpus_pause_signalled: Arc::new(AtomicBool::new(false)),
            vcpu_states,
            reset_evt,
            selected_cpu: 0,
            vcpus: Vec::with_capacity(usize::from(config.max_vcpus)),
        }));

        device_manager
            .allocator()
            .lock()
            .unwrap()
            .allocate_io_addresses(Some(GuestAddress(0x0cd8)), 0x8, None)
            .ok_or(Error::AllocateIOPort)?;

        cpu_manager
            .lock()
            .unwrap()
            .io_bus
            .insert(cpu_manager.clone(), 0x0cd8, 0xc)
            .map_err(Error::BusError)?;

        Ok(cpu_manager)
    }

    /// Returns the CPUID table supported by KVM with the TSC deadline timer
    /// and hypervisor bits (ECX of function 1, index 0) forced on.
    ///
    /// # Errors
    ///
    /// Returns `Error::PatchCpuId` when the supported CPUID cannot be queried.
    fn patch_cpuid(kvm: &Kvm) -> Result<CpuId> {
        // Supported CPUID
        let mut cpuid = kvm
            .get_supported_cpuid(kvm_bindings::KVM_MAX_CPUID_ENTRIES)
            .map_err(Error::PatchCpuId)?;

        // Both patches target the same entry and only differ by the ECX bit.
        let function_1_ecx_patch = |bit: u8| CpuidPatch {
            function: 1,
            index: 0,
            flags_bit: None,
            eax_bit: None,
            ebx_bit: None,
            ecx_bit: Some(bit),
            edx_bit: None,
        };

        let cpuid_patches = vec![
            // Patch tsc deadline timer bit
            function_1_ecx_patch(TSC_DEADLINE_TIMER_ECX_BIT),
            // Patch hypervisor bit
            function_1_ecx_patch(HYPERVISOR_ECX_BIT),
        ];

        CpuidPatch::patch_cpuid(&mut cpuid, cpuid_patches);

        Ok(cpuid)
    }

    /// Creates, configures and starts the thread of vCPU `cpu_id`.
    ///
    /// The spawned thread installs a no-op `SIGRTMIN` handler (the signal is
    /// only used to interrupt `KVM_RUN`), waits on `vcpu_thread_barrier` and
    /// then runs the vCPU in a loop until an error occurs, the guest shuts
    /// down (which also writes to the reset event) or a kill flag is set.
    /// While the pause flag is set the thread parks itself between runs.
    ///
    /// # Arguments
    ///
    /// * `cpu_id` - Id of the vCPU; also the index of its `VcpuState`.
    /// * `creation_ts` - Reference instant for debug I/O port timestamps.
    /// * `vcpu_thread_barrier` - Barrier the thread waits on before running.
    /// * `entry_point` - Kernel entry point, `None` for hotplugged vCPUs.
    /// * `inserting` - Value stored in the state's `inserting` flag.
    ///
    /// # Errors
    ///
    /// Returns `Error::VcpuFd` if the vCPU cannot be created and
    /// `Error::VcpuSpawn` if the thread cannot be spawned.
    ///
    /// # Panics
    ///
    /// Panics if the reset event cannot be cloned or the vCPU cannot be
    /// configured.
    // NOTE(review): `configure` already returns this file's `Result`; consider
    // propagating its error once callers can cope with threads that are
    // already waiting on the barrier.
    fn start_vcpu(
        &mut self,
        cpu_id: u8,
        creation_ts: std::time::Instant,
        vcpu_thread_barrier: Arc<Barrier>,
        entry_point: Option<EntryPoint>,
        inserting: bool,
    ) -> Result<()> {
        let vcpu = Vcpu::new(
            cpu_id,
            &self.fd,
            self.io_bus.clone(),
            self.mmio_bus.clone(),
            self.ioapic.clone(),
            creation_ts,
        )?;

        let reset_evt = self.reset_evt.try_clone().unwrap();
        let vcpu_kill_signalled = self.vcpus_kill_signalled.clone();
        let vcpu_pause_signalled = self.vcpus_pause_signalled.clone();

        let vcpu_kill = self.vcpu_states[usize::from(cpu_id)].kill.clone();
        let vm_memory = self.vm_memory.clone();

        vcpu.lock()
            .unwrap()
            .configure(entry_point, &vm_memory, self.cpuid.clone())
            .expect("Failed to configure vCPU");

        let vcpu_clone = Arc::clone(&vcpu);
        self.vcpus.push(vcpu_clone);

        let handle = Some(
            thread::Builder::new()
                .name(format!("vcpu{}", cpu_id))
                .spawn(move || {
                    extern "C" fn handle_signal(_: i32, _: *mut siginfo_t, _: *mut c_void) {}
                    // This uses an async signal safe handler to kill the vcpu handles.
                    register_signal_handler(SIGRTMIN(), handle_signal)
                        .expect("Failed to register vcpu signal handler");

                    // Block until all CPUs are ready.
                    vcpu_thread_barrier.wait();

                    loop {
                        // vcpu.run() returns false on a KVM_EXIT_SHUTDOWN (triple-fault) so trigger a reset
                        match vcpu.lock().unwrap().run() {
                            Err(e) => {
                                error!("VCPU generated error: {:?}", e);
                                break;
                            }
                            Ok(true) => {}
                            Ok(false) => {
                                reset_evt.write(1).unwrap();
                                break;
                            }
                        }

                        // We've been told to terminate
                        if vcpu_kill_signalled.load(Ordering::SeqCst)
                            || vcpu_kill.load(Ordering::SeqCst)
                        {
                            break;
                        }

                        // If we are being told to pause, we park the thread
                        // until the pause boolean is toggled.
                        // The resume operation is responsible for toggling
                        // the boolean and unpark the thread.
                        // We enter a loop because park() could spuriously
                        // return. We will then park() again unless the
                        // pause boolean has been toggled.
                        while vcpu_pause_signalled.load(Ordering::SeqCst) {
                            thread::park();
                        }
                    }
                })
                .map_err(Error::VcpuSpawn)?,
        );

        // On hot plug calls into this function entry_point is None. It is for
        // those hotplug CPU additions that we need to set the inserting flag.
        self.vcpu_states[usize::from(cpu_id)].handle = handle;
        self.vcpu_states[usize::from(cpu_id)].inserting = inserting;

        Ok(())
    }

    /// Starts vCPUs until `desired_vcpus` are present and waits until all
    /// newly spawned threads are ready to run.
    ///
    /// vCPUs started here get their `inserting` flag set when `entry_point`
    /// is `None`, i.e. when they are hotplugged rather than booted.
    ///
    /// # Errors
    ///
    /// Returns `Error::DesiredVCPUCountExceedsMax` when `desired_vcpus` is
    /// above `max_vcpus`, or the error of the first vCPU that fails to start.
    fn activate_vcpus(&mut self, desired_vcpus: u8, entry_point: Option<EntryPoint>) -> Result<()> {
        if desired_vcpus > self.max_vcpus {
            return Err(Error::DesiredVCPUCountExceedsMax);
        }

        let present_vcpus = self.present_vcpus();
        // Computed in `usize`: with 255 new vCPUs the "+ 1" for this thread
        // does not fit in a `u8`. The saturating subtraction keeps a request
        // for fewer vCPUs than present from underflowing (nothing is started).
        let new_vcpus = usize::from(desired_vcpus.saturating_sub(present_vcpus));

        let creation_ts = std::time::Instant::now();
        let vcpu_thread_barrier = Arc::new(Barrier::new(new_vcpus + 1));

        for cpu_id in present_vcpus..desired_vcpus {
            self.start_vcpu(
                cpu_id,
                creation_ts,
                vcpu_thread_barrier.clone(),
                entry_point,
                entry_point.is_none(),
            )?;
        }

        // Unblock all CPU threads.
        vcpu_thread_barrier.wait();
        Ok(())
    }

    /// Flags the vCPUs with ids in `desired_vcpus..present_vcpus()` as being
    /// removed. Nothing is stopped here; actual removal happens on ejection.
    fn mark_vcpus_for_removal(&mut self, desired_vcpus: u8) -> Result<()> {
        let kept = usize::from(desired_vcpus);
        let present = usize::from(self.present_vcpus());

        self.vcpu_states
            .iter_mut()
            .take(present)
            .skip(kept)
            .for_each(|state| state.removing = true);

        Ok(())
    }

    fn remove_vcpu(&mut self, cpu_id: u8) -> Result<()> {
        let mut state = &mut self.vcpu_states[usize::from(cpu_id)];
        state.kill.store(true, Ordering::SeqCst);
        state.signal_thread();
        state.join_thread()?;
        state.handle = None;
        Ok(())
    }

    /// Starts all the vCPUs that the VM is booting with, all of them entering
    /// the guest at `entry_point`. Blocks until all vCPU threads are ready.
    pub fn start_boot_vcpus(&mut self, entry_point: EntryPoint) -> Result<()> {
        let boot_vcpus = self.boot_vcpus;
        self.activate_vcpus(boot_vcpus, Some(entry_point))
    }

    pub fn resize(&mut self, desired_vcpus: u8) -> Result<bool> {
        match desired_vcpus.cmp(&self.present_vcpus()) {
            cmp::Ordering::Greater => self.activate_vcpus(desired_vcpus, None).and(Ok(true)),
            cmp::Ordering::Less => self.mark_vcpus_for_removal(desired_vcpus).and(Ok(true)),
            _ => Ok(false),
        }
    }

    pub fn shutdown(&mut self) -> Result<()> {
        // Tell the vCPUs to stop themselves next time they go through the loop
        self.vcpus_kill_signalled.store(true, Ordering::SeqCst);

        // Signal to the spawned threads (vCPUs and console signal handler). For the vCPU threads
        // this will interrupt the KVM_RUN ioctl() allowing the loop to check the boolean set
        // above.
        for state in self.vcpu_states.iter() {
            state.signal_thread();
        }

        // Wait for all the threads to finish. This removes the state from the vector.
        for mut state in self.vcpu_states.drain(..) {
            state.join_thread()?;
        }

        Ok(())
    }

    /// Number of vCPUs the VM boots with, as given in the configuration.
    pub fn boot_vcpus(&self) -> u8 {
        self.boot_vcpus
    }

    /// Maximum number of vCPUs the VM can have, as given in the configuration.
    pub fn max_vcpus(&self) -> u8 {
        self.max_vcpus
    }

    /// Number of vCPUs that currently have a thread attached.
    fn present_vcpus(&self) -> u8 {
        // The state table is sized from a `u8`, so the count always fits.
        self.vcpu_states
            .iter()
            .filter(|state| state.active())
            .count() as u8
    }

    /// Builds the "APIC" (MADT) table.
    ///
    /// The table contains one local APIC entry per possible vCPU (only the
    /// boot vCPUs are flagged as enabled), one I/O APIC entry and one
    /// interrupt source override for source 4.
    ///
    /// # Panics
    ///
    /// Panics if `boot_vcpus` is greater than `max_vcpus`.
    #[cfg(feature = "acpi")]
    pub fn create_madt(&self) -> SDT {
        // This is also checked in the commandline parsing.
        assert!(self.boot_vcpus <= self.max_vcpus);

        let mut madt = SDT::new(*b"APIC", 44, 5, *b"CLOUDH", *b"CHMADT  ", 1);
        madt.write(36, layout::APIC_START);

        for cpu in 0..self.max_vcpus {
            // Only CPUs present at boot are advertised as enabled.
            let flags: u32 = if cpu < self.boot_vcpus {
                1 << MADT_CPU_ENABLE_FLAG
            } else {
                0
            };

            madt.append(LocalAPIC {
                r#type: 0,
                length: 8,
                processor_id: cpu,
                apic_id: cpu,
                flags,
            });
        }

        let ioapic = IOAPIC {
            r#type: 1,
            length: 12,
            ioapic_id: 0,
            apic_address: layout::IOAPIC_START.0 as u32,
            gsi_base: 0,
            ..Default::default()
        };
        madt.append(ioapic);

        let source_override = InterruptSourceOverride {
            r#type: 2,
            length: 10,
            bus: 0,
            source: 4,
            gsi: 4,
            flags: 0,
        };
        madt.append(source_override);

        madt
    }
}

/// AML generator for the device object of a single vCPU (named `C` followed
/// by the zero-padded, three-digit `cpu_id`).
#[cfg(feature = "acpi")]
struct CPU {
    // Id of the vCPU; used for the device name, `_UID` and the LAPIC ids.
    cpu_id: u8,
}

// Bit position, within `LocalAPIC::flags`, that marks the CPU as enabled.
#[cfg(feature = "acpi")]
const MADT_CPU_ENABLE_FLAG: usize = 0;

#[cfg(feature = "acpi")]
impl Aml for CPU {
    /// Serializes the CPU device: `_HID`, `_UID`, a `_STA` method delegating
    /// to `CSTA`, a `_MAT` buffer holding this CPU's local APIC entry and an
    /// `_EJ0` method delegating to `CEJ0`.
    fn to_aml_bytes(&self) -> Vec<u8> {
        let lapic = LocalAPIC {
            r#type: 0,
            length: 8,
            processor_id: self.cpu_id,
            apic_id: self.cpu_id,
            flags: 1 << MADT_CPU_ENABLE_FLAG,
        };

        // Copy the raw bytes of the LAPIC entry into a buffer for `_MAT`.
        let mut mat_data: Vec<u8> = Vec::new();
        mat_data.resize(std::mem::size_of_val(&lapic), 0);
        // SAFETY: the buffer was just resized to exactly the size of `lapic`,
        // and `LocalAPIC` is `#[repr(packed)]`, so writing it through the
        // byte pointer has no alignment requirement.
        unsafe { *(mat_data.as_mut_ptr() as *mut LocalAPIC) = lapic };

        aml::Device::new(
            format!("C{:03}", self.cpu_id).as_str().into(),
            vec![
                &aml::Name::new("_HID".into(), &"ACPI0007"),
                &aml::Name::new("_UID".into(), &self.cpu_id),
                /*
                _STA return value:
                Bit [0] – Set if the device is present.
                Bit [1] – Set if the device is enabled and decoding its resources.
                Bit [2] – Set if the device should be shown in the UI.
                Bit [3] – Set if the device is functioning properly (cleared if device failed its diagnostics).
                Bit [4] – Set if the battery is present.
                Bits [31:5] – Reserved (must be cleared).
                */
                &aml::Method::new(
                    "_STA".into(),
                    0,
                    false,
                    // Call into CSTA method which will interrogate device
                    vec![&aml::Return::new(&aml::MethodCall::new(
                        "CSTA".into(),
                        vec![&self.cpu_id],
                    ))],
                ),
                // The Linux kernel expects every CPU device to have a _MAT entry
                // containing the LAPIC for this processor with the enabled bit set
                // even if it is disabled in the MADT (non-boot CPU)
                &aml::Name::new("_MAT".into(), &aml::Buffer::new(mat_data)),
                // Trigger CPU ejection
                &aml::Method::new(
                    "_EJ0".into(),
                    1,
                    false,
                    // Call into CEJ0 method which will actually eject device
                    vec![&aml::Return::new(&aml::MethodCall::new(
                        "CEJ0".into(),
                        vec![&self.cpu_id],
                    ))],
                ),
            ],
        )
        .to_aml_bytes()
    }
}

/// AML generator for the conditional notification of a single vCPU device.
#[cfg(feature = "acpi")]
struct CPUNotify {
    // Id of the vCPU whose device object gets notified.
    cpu_id: u8,
}

#[cfg(feature = "acpi")]
impl Aml for CPUNotify {
    fn to_aml_bytes(&self) -> Vec<u8> {
        let object = aml::Path::new(&format!("C{:03}", self.cpu_id));
        aml::If::new(
            &aml::Equal::new(&aml::Arg(0), &self.cpu_id),
            vec![&aml::Notify::new(&object, &aml::Arg(1))],
        )
        .to_aml_bytes()
    }
}

#[cfg(feature = "acpi")]
struct CPUMethods {
    max_vcpus: u8,
}

#[cfg(feature = "acpi")]
impl Aml for CPUMethods {
    fn to_aml_bytes(&self) -> Vec<u8> {
        let mut bytes = Vec::new();
        bytes.extend_from_slice(
            // CPU status method
            &aml::Method::new(
                "CSTA".into(),
                1,
                true,
                vec![
                    // Take lock defined above
                    &aml::Acquire::new("\\_SB_.PRES.CPLK".into(), 0xfff),
                    // Write CPU number (in first argument) to I/O port via field
                    &aml::Store::new(&aml::Path::new("\\_SB_.PRES.CSEL"), &aml::Arg(0)),
                    &aml::Store::new(&aml::Local(0), &aml::ZERO),
                    // Check if CPEN bit is set, if so make the local variable 0xf (see _STA for details of meaning)
                    &aml::If::new(
                        &aml::Equal::new(&aml::Path::new("\\_SB_.PRES.CPEN"), &aml::ONE),
                        vec![&aml::Store::new(&aml::Local(0), &0xfu8)],
                    ),
                    // Release lock
                    &aml::Release::new("\\_SB_.PRES.CPLK".into()),
                    // Return 0 or 0xf
                    &aml::Return::new(&aml::Local(0)),
                ],
            )
            .to_aml_bytes(),
        );

        let mut cpu_notifies = Vec::new();
        for cpu_id in 0..self.max_vcpus {
            cpu_notifies.push(CPUNotify { cpu_id });
        }

        let mut cpu_notifies_refs: Vec<&dyn aml::Aml> = Vec::new();
        for cpu_id in 0..self.max_vcpus {
            cpu_notifies_refs.push(&cpu_notifies[usize::from(cpu_id)]);
        }

        bytes.extend_from_slice(
            &aml::Method::new("CTFY".into(), 2, true, cpu_notifies_refs).to_aml_bytes(),
        );

        bytes.extend_from_slice(
            &aml::Method::new(
                "CEJ0".into(),
                1,
                true,
                vec![
                    &aml::Acquire::new("\\_SB_.PRES.CPLK".into(), 0xfff),
                    // Write CPU number (in first argument) to I/O port via field
                    &aml::Store::new(&aml::Path::new("\\_SB_.PRES.CSEL"), &aml::Arg(0)),
                    // Set CEJ0 bit
                    &aml::Store::new(&aml::Path::new("\\_SB_.PRES.CEJ0"), &aml::ONE),
                    &aml::Release::new("\\_SB_.PRES.CPLK".into()),
                ],
            )
            .to_aml_bytes(),
        );

        bytes.extend_from_slice(
            &aml::Method::new(
                "CSCN".into(),
                0,
                true,
                vec![
                    // Take lock defined above
                    &aml::Acquire::new("\\_SB_.PRES.CPLK".into(), 0xfff),
                    &aml::Store::new(&aml::Local(0), &aml::ZERO),
                    &aml::While::new(
                        &aml::LessThan::new(&aml::Local(0), &self.max_vcpus),
                        vec![
                            // Write CPU number (in first argument) to I/O port via field
                            &aml::Store::new(&aml::Path::new("\\_SB_.PRES.CSEL"), &aml::Local(0)),
                            // Check if CINS bit is set
                            &aml::If::new(
                                &aml::Equal::new(&aml::Path::new("\\_SB_.PRES.CINS"), &aml::ONE),
                                // Notify device if it is
                                vec![
                                    &aml::MethodCall::new(
                                        "CTFY".into(),
                                        vec![&aml::Local(0), &aml::ONE],
                                    ),
                                    // Reset CINS bit
                                    &aml::Store::new(
                                        &aml::Path::new("\\_SB_.PRES.CINS"),
                                        &aml::ONE,
                                    ),
                                ],
                            ),
                            // Check if CRMV bit is set
                            &aml::If::new(
                                &aml::Equal::new(&aml::Path::new("\\_SB_.PRES.CRMV"), &aml::ONE),
                                // Notify device if it is (with the eject constant 0x3)
                                vec![
                                    &aml::MethodCall::new(
                                        "CTFY".into(),
                                        vec![&aml::Local(0), &3u8],
                                    ),
                                    // Reset CRMV bit
                                    &aml::Store::new(
                                        &aml::Path::new("\\_SB_.PRES.CRMV"),
                                        &aml::ONE,
                                    ),
                                ],
                            ),
                            &aml::Add::new(&aml::Local(0), &aml::Local(0), &aml::ONE),
                        ],
                    ),
                    // Release lock
                    &aml::Release::new("\\_SB_.PRES.CPLK".into()),
                ],
            )
            .to_aml_bytes(),
        );
        bytes
    }
}

#[cfg(feature = "acpi")]
impl Aml for CpuManager {
    fn to_aml_bytes(&self) -> Vec<u8> {
        let mut bytes = Vec::new();
        // CPU hotplug controller
        bytes.extend_from_slice(
            &aml::Device::new(
                "_SB_.PRES".into(),
                vec![
                    &aml::Name::new("_HID".into(), &aml::EISAName::new("PNP0A06")),
                    // Mutex to protect concurrent access as we write to choose CPU and then read back status
                    &aml::Mutex::new("CPLK".into(), 0),
                    // I/O port for CPU controller
                    &aml::Name::new(
                        "_CRS".into(),
                        &aml::ResourceTemplate::new(vec![&aml::IO::new(
                            0x0cd8, 0x0cd8, 0x01, 0x0c,
                        )]),
                    ),
                    // OpRegion and Fields map I/O port into individual field values
                    &aml::OpRegion::new("PRST".into(), aml::OpRegionSpace::SystemIO, 0x0cd8, 0x0c),
                    &aml::Field::new(
                        "PRST".into(),
                        aml::FieldAccessType::Byte,
                        aml::FieldUpdateRule::WriteAsZeroes,
                        vec![
                            aml::FieldEntry::Reserved(32),
                            aml::FieldEntry::Named(*b"CPEN", 1),
                            aml::FieldEntry::Named(*b"CINS", 1),
                            aml::FieldEntry::Named(*b"CRMV", 1),
                            aml::FieldEntry::Named(*b"CEJ0", 1),
                            aml::FieldEntry::Reserved(4),
                            aml::FieldEntry::Named(*b"CCMD", 8),
                        ],
                    ),
                    &aml::Field::new(
                        "PRST".into(),
                        aml::FieldAccessType::DWord,
                        aml::FieldUpdateRule::Preserve,
                        vec![
                            aml::FieldEntry::Named(*b"CSEL", 32),
                            aml::FieldEntry::Reserved(32),
                            aml::FieldEntry::Named(*b"CDAT", 32),
                        ],
                    ),
                ],
            )
            .to_aml_bytes(),
        );

        // CPU devices
        let hid = aml::Name::new("_HID".into(), &"ACPI0010");
        let uid = aml::Name::new("_CID".into(), &aml::EISAName::new("PNP0A05"));
        // Bundle methods together under a common object
        let methods = CPUMethods {
            max_vcpus: self.max_vcpus,
        };
        let mut cpu_data_inner: Vec<&dyn aml::Aml> = vec![&hid, &uid, &methods];

        let mut cpu_devices = Vec::new();
        for cpu_id in 0..self.max_vcpus {
            let cpu_device = CPU { cpu_id };

            cpu_devices.push(cpu_device);
        }

        for cpu_device in cpu_devices.iter() {
            cpu_data_inner.push(cpu_device);
        }

        bytes.extend_from_slice(
            &aml::Device::new("_SB_.CPUS".into(), cpu_data_inner).to_aml_bytes(),
        );
        bytes
    }
}

impl Pausable for CpuManager {
    fn pause(&mut self) -> std::result::Result<(), MigratableError> {
        // Tell the vCPUs to pause themselves next time they exit
        self.vcpus_pause_signalled.store(true, Ordering::SeqCst);

        // Signal to the spawned threads (vCPUs and console signal handler). For the vCPU threads
        // this will interrupt the KVM_RUN ioctl() allowing the loop to check the boolean set
        // above.
        for state in self.vcpu_states.iter() {
            state.signal_thread();
        }

        Ok(())
    }

    fn resume(&mut self) -> std::result::Result<(), MigratableError> {
        // Toggle the vCPUs pause boolean
        self.vcpus_pause_signalled.store(false, Ordering::SeqCst);

        // Unpark all the VCPU threads.
        // Once unparked, the next thing they will do is checking for the pause
        // boolean. Since it'll be set to false, they will exit their pause loop
        // and go back to vmx root.
        for state in self.vcpu_states.iter() {
            state.unpark_thread();
        }
        Ok(())
    }
}

impl Snapshottable for CpuManager {}
impl Transportable for CpuManager {}
impl Migratable for CpuManager {}
-												pvh: Introduce EntryPoint struct

In order to properly initialize the kvm regs/sregs structs for
the guest, the load_kernel() return type must specify which
boot protocol to use with the entry point address it returns.

Make load_kernel() return an EntryPoint struct containing the
required information. This structure will later be used
in the vCPU configuration methods to setup the appropriate
initial conditions for the guest.

Signed-off-by: Alejandro Jimenez <alejandro.j.jimenez@oracle.com>

											
										
										
											2020-02-12 03:37:33 +00:00
+								// Copyright © 2020, Oracle and/or its affiliates.
 								//
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								// Copyright 2018 Amazon.com, Inc. or its affiliates. All Rights Reserved.
 								//
 								// Portions Copyright 2017 The Chromium OS Authors. All rights reserved.
 								// Use of this source code is governed by a BSD-style license that can be
 								// found in the LICENSE-BSD-3-Clause file.
 								//
 								// Copyright © 2019 Intel Corporation
 								//
 								// SPDX-License-Identifier: Apache-2.0 AND BSD-3-Clause
 								//
-												vmm: cpu: Pass CpusConfig to simplify the new() prototype

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-03-16 17:14:15 +00:00
 								use crate::config::CpusConfig;
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								use crate::device_manager::DeviceManager;
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								#[cfg(feature = "acpi")]
 								use acpi_tables::{aml, aml::Aml, sdt::SDT};
-												ci: Run clippy for each specific feature

The build is run against "--all-features", "pci,acpi", "pci" and "mmio"
separately. The clippy validation must be run against the same set of
features in order to validate the code is correct.

Because of these new checks, this commit includes multiple fixes
related to the errors generated when manually running the checks.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-01-21 08:32:50 +00:00
+								#[cfg(feature = "acpi")]
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								use arch::layout;
-												pvh: Introduce EntryPoint struct

In order to properly initialize the kvm regs/sregs structs for
the guest, the load_kernel() return type must specify which
boot protocol to use with the entry point address it returns.

Make load_kernel() return an EntryPoint struct containing the
required information. This structure will later be used
in the vCPU configuration methods to setup the appropriate
initial conditions for the guest.

Signed-off-by: Alejandro Jimenez <alejandro.j.jimenez@oracle.com>

											
										
										
											2020-02-12 03:37:33 +00:00
+								use arch::EntryPoint;
-												vmm: cpu: Add the CpuManager onto the IO bus

This allows the kernel (via ACPI based controls) to query and control
the CPU state.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 14:56:10 +00:00
+								use devices::{ioapic, BusDevice};
-												vmm: cpu: Get and set KVM vCPU state

These two new helpers will be useful to capture a vCPU state and being
able to restore it at a later time.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-16 20:42:42 +00:00
+								use kvm_bindings::{
 								    kvm_fpu, kvm_lapic_state, kvm_mp_state, kvm_regs, kvm_sregs, kvm_vcpu_events, kvm_xcrs,
 								    kvm_xsave, CpuId, Msrs,
 								};
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								use kvm_ioctls::*;
-												vm-virtio, vmm, vfio: Store GuestMemoryMmap in an Arc<ArcSwap<T>>

This allows us to change the memory map that is being used by the
devices via an atomic swap (by replacing the map with another one). The
ArcSwap provides the mechanism for atomically swapping from one to another
whilst still giving good read performance. It is inside an Arc so that we
can use a single ArcSwap for all users.

Not covered by this change is replacing the GuestMemoryMmap itself.

This change also removes some vertical whitespace from use blocks in the
files that this commit also changed. Vertical whitespace was being used
inconsistently and broke rustfmt's behaviour of ordering the imports as
it would only do it within the block.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-31 10:49:11 +00:00
+								use libc::{c_void, siginfo_t};
-												vmm: cpu: Get and set KVM vCPU state

These two new helpers will be useful to capture a vCPU state and being
able to restore it at a later time.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-16 20:42:42 +00:00
+								use serde_derive::{Deserialize, Serialize};
-												vm-virtio, vmm, vfio: Store GuestMemoryMmap in an Arc<ArcSwap<T>>

This allows us to change the memory map that is being used by the
devices via an atomic swap (by replacing the map with another one). The
ArcSwap provides the mechanism for atomically swapping from one to another
whilst still giving good read performance. It is inside an Arc so that we
can use a single ArcSwap for all users.

Not covered by this change is replacing the GuestMemoryMmap itself.

This change also removes some vertical whitespace from use blocks in the
files that this commit also changed. Vertical whitespace was being used
inconsistently and broke rustfmt's behaviour of ordering the imports as
it would only do it within the block.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-31 10:49:11 +00:00
+								use std::cmp;
 								use std::os::unix::thread::JoinHandleExt;
 								use std::sync::atomic::{AtomicBool, Ordering};
-												vmm: Remove all Weak references from CpuManager

Now that the BusDevice devices are stored as Weak references by the
IO and MMIO buses, there's no need to use Weak references from the
CpuManager anymore.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-03-04 15:19:37 +00:00
+								use std::sync::{Arc, Barrier, Mutex};
-												vm-virtio, vmm, vfio: Store GuestMemoryMmap in an Arc<ArcSwap<T>>

This allows us to change the memory map that is being used by the
devices via an atomic swap (by replacing the map with another one). The
ArcSwap provides the mechanism for atomically swapping from one to another
whilst still giving good read performance. It is inside an Arc so that we
can use a single ArcSwap for all users.

Not covered by this change is replacing the GuestMemoryMmap itself.

This change also removes some vertical whitespace from use blocks in the
files that this commit also changed. Vertical whitespace was being used
inconsistently and broke rustfmt's behaviour of ordering the imports as
it would only do it within the block.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-31 10:49:11 +00:00
+								use std::thread;
 								use std::{fmt, io, result};
-												vmm: Move codebase to GuestMemoryAtomic from vm-memory

Relying on the latest vm-memory version, including the freshly
introduced structure GuestMemoryAtomic, this patch replaces every
occurrence of Arc<ArcSwap<GuestMemoryMmap> with
GuestMemoryAtomic<GuestMemoryMmap>.

The point is to rely on the common RCU-like implementation from
vm-memory so that we don't have to do it from Cloud-Hypervisor.

Fixes #735

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-02-11 16:22:40 +00:00
+								use vm_memory::{Address, GuestAddress, GuestAddressSpace, GuestMemoryAtomic, GuestMemoryMmap};
-												vm-migration: Define the Snapshottable and Transportable traits

A Snapshottable component can snapshot itself and
provide a MigrationSnapshot payload as a result.

A MigrationSnapshot payload is a map of component IDs to a list of
migration sections (MigrationSection). As component can be made of
several Migratable sub-components (e.g. the DeviceManager and its
device objects), a migration snapshot can be made of multiple snapshot
itself.
A snapshot is a list of migration sections, each section being a
component state snapshot. Having multiple sections allows for easier and
backward compatible migration payload extensions.

Once created, a migratable component snapshot may be transported and this
is what the Transportable trait defines, through 2 methods: send and recv.

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>
Signed-off-by: Yi Sun <yi.y.sun@linux.intel.com>

											
										
										
											2019-05-01 16:59:51 +00:00
+								use vm_migration::{Migratable, MigratableError, Pausable, Snapshottable, Transportable};
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								use vmm_sys_util::eventfd::EventFd;
-												vmm: Port to latest vmm-sys-util

The signal handling for vCPU signals has changed in the latest release
so switch to the new API.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-11 13:02:07 +00:00
+								use vmm_sys_util::signal::{register_signal_handler, SIGRTMIN};
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
-												vmm: cpu: Move CPUID patching to CpuManager

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-03-16 15:15:38 +00:00
+								// CPUID feature bits
 								const TSC_DEADLINE_TIMER_ECX_BIT: u8 = 24; // tsc deadline timer ecx bit.
 								const HYPERVISOR_ECX_BIT: u8 = 31; // Hypervisor ecx bit.
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								// Debug I/O port
 								#[cfg(target_arch = "x86_64")]
 								const DEBUG_IOPORT: u16 = 0x80;
 								const DEBUG_IOPORT_PREFIX: &str = "Debug I/O port";
 								/// Debug I/O port, see:
 								/// https://www.intel.com/content/www/us/en/support/articles/000005500/boards-and-kits.html
 								///
 								/// Since we're not a physical platform, we can freely assign code ranges for
 								/// debugging specific parts of our virtual platform.
 								pub enum DebugIoPortRange {
 								    Firmware,
 								    Bootloader,
 								    Kernel,
 								    Userspace,
 								    Custom,
 								}
 								impl DebugIoPortRange {
 								    fn from_u8(value: u8) -> DebugIoPortRange {
 								        match value {
 								            0x00..=0x1f => DebugIoPortRange::Firmware,
 								            0x20..=0x3f => DebugIoPortRange::Bootloader,
 								            0x40..=0x5f => DebugIoPortRange::Kernel,
 								            0x60..=0x7f => DebugIoPortRange::Userspace,
 								            _ => DebugIoPortRange::Custom,
 								        }
 								    }
 								}
 								impl fmt::Display for DebugIoPortRange {
 								    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
 								        match self {
 								            DebugIoPortRange::Firmware => write!(f, "{}: Firmware", DEBUG_IOPORT_PREFIX),
 								            DebugIoPortRange::Bootloader => write!(f, "{}: Bootloader", DEBUG_IOPORT_PREFIX),
 								            DebugIoPortRange::Kernel => write!(f, "{}: Kernel", DEBUG_IOPORT_PREFIX),
 								            DebugIoPortRange::Userspace => write!(f, "{}: Userspace", DEBUG_IOPORT_PREFIX),
 								            DebugIoPortRange::Custom => write!(f, "{}: Custom", DEBUG_IOPORT_PREFIX),
 								        }
 								    }
 								}
 								#[derive(Debug)]
 								pub enum Error {
 								    /// Cannot open the VCPU file descriptor.
-												cargo: Bump the kvm and vmm-sys-util crates

Since the kvm crates now depend on vmm-sys-util, the bump must be
atomic.
The kvm-bindings and ioctls 0.2.0 and 0.4.0 crates come with a few API
changes, one of them being the use of a kvm_ioctls specific error type.
Porting our code to that type makes for a fairly large diff stat.

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2019-11-29 15:36:33 +00:00
+								    VcpuFd(kvm_ioctls::Error),
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
 								    /// Cannot run the VCPUs.
-												cargo: Bump the kvm and vmm-sys-util crates

Since the kvm crates now depend on vmm-sys-util, the bump must be
atomic.
The kvm-bindings and ioctls 0.2.0 and 0.4.0 crates come with a few API
changes, one of them being the use of a kvm_ioctls specific error type.
Porting our code to that type makes for a fairly large diff stat.

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2019-11-29 15:36:33 +00:00
+								    VcpuRun(kvm_ioctls::Error),
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
 								    /// Cannot spawn a new vCPU thread.
 								    VcpuSpawn(io::Error),
-												vmm: cpu: Move CPUID patching to CpuManager

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-03-16 15:15:38 +00:00
+								    /// Cannot patch the CPU ID
 								    PatchCpuId(kvm_ioctls::Error),
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								    #[cfg(target_arch = "x86_64")]
 								    /// Error configuring the general purpose registers
 								    REGSConfiguration(arch::x86_64::regs::Error),
 								    #[cfg(target_arch = "x86_64")]
 								    /// Error configuring the special registers
 								    SREGSConfiguration(arch::x86_64::regs::Error),
 								    #[cfg(target_arch = "x86_64")]
 								    /// Error configuring the floating point related registers
 								    FPUConfiguration(arch::x86_64::regs::Error),
 								    /// The call to KVM_SET_CPUID2 failed.
-												cargo: Bump the kvm and vmm-sys-util crates

Since the kvm crates now depend on vmm-sys-util, the bump must be
atomic.
The kvm-bindings and ioctls 0.2.0 and 0.4.0 crates come with a few API
changes, one of them being the use of a kvm_ioctls specific error type.
Porting our code to that type makes for a fairly large diff stat.

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2019-11-29 15:36:33 +00:00
+								    SetSupportedCpusFailed(kvm_ioctls::Error),
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
 								    #[cfg(target_arch = "x86_64")]
 								    /// Cannot set the local interruption due to bad configuration.
 								    LocalIntConfiguration(arch::x86_64::interrupts::Error),
 								    #[cfg(target_arch = "x86_64")]
 								    /// Error configuring the MSR registers
 								    MSRSConfiguration(arch::x86_64::regs::Error),
 								    /// Unexpected KVM_RUN exit reason
 								    VcpuUnhandledKvmExit,
 								    /// Failed to join on vCPU threads
-												vmm: Fix map_err losing the inner error

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-01-24 08:34:51 +00:00
+								    ThreadCleanup(std::boxed::Box<dyn std::any::Any + std::marker::Send>),
-												vmm: cpu: Add the CpuManager onto the IO bus

This allows the kernel (via ACPI based controls) to query and control
the CPU state.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 14:56:10 +00:00
 								    /// Cannot add legacy device to Bus.
 								    BusError(devices::BusError),
-												vmm: cpu: Allocate I/O port for the CPU manager

The CPU manager uses an I/O port and to prevent potential clashes with
assignment for PCI devices ensure that it is allocated by the allocator.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-20 14:16:14 +00:00
-												Revert "vmm: Move CpuManager device to MMIO region"

This reverts commit 980e03fa0ab3d217fe91fd60d8459507c903d88b.

											
										
										
											2020-01-24 10:36:39 +00:00
+								    /// Failed to allocate IO port
 								    AllocateIOPort,
-												vmm: cpu: Refactor vCPU thread starting

Refactor the vCPU thread starting so that there is the possibility to
bring on extra vCPU threads.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 13:06:24 +00:00
 								    /// Asking for more vCPUs than we can have
 								    DesiredVCPUCountExceedsMax,
-												vmm: cpu: Get and set KVM vCPU state

These two new helpers will be useful to capture a vCPU state and being
able to restore it at a later time.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-16 20:42:42 +00:00
 								    /// Failed to get KVM vcpu lapic.
 								    VcpuGetLapic(kvm_ioctls::Error),
 								    /// Failed to set KVM vcpu lapic.
 								    VcpuSetLapic(kvm_ioctls::Error),
 								    /// Failed to get KVM vcpu MP state.
 								    VcpuGetMpState(kvm_ioctls::Error),
 								    /// Failed to set KVM vcpu MP state.
 								    VcpuSetMpState(kvm_ioctls::Error),
 								    /// Failed to get KVM vcpu msrs.
 								    VcpuGetMsrs(kvm_ioctls::Error),
 								    /// Failed to set KVM vcpu msrs.
 								    VcpuSetMsrs(kvm_ioctls::Error),
 								    /// Failed to get KVM vcpu regs.
 								    VcpuGetRegs(kvm_ioctls::Error),
 								    /// Failed to set KVM vcpu regs.
 								    VcpuSetRegs(kvm_ioctls::Error),
 								    /// Failed to get KVM vcpu sregs.
 								    VcpuGetSregs(kvm_ioctls::Error),
 								    /// Failed to set KVM vcpu sregs.
 								    VcpuSetSregs(kvm_ioctls::Error),
 								    /// Failed to get KVM vcpu events.
 								    VcpuGetVcpuEvents(kvm_ioctls::Error),
 								    /// Failed to set KVM vcpu events.
 								    VcpuSetVcpuEvents(kvm_ioctls::Error),
 								    /// Failed to get KVM vcpu FPU.
 								    VcpuGetFpu(kvm_ioctls::Error),
 								    /// Failed to set KVM vcpu FPU.
 								    VcpuSetFpu(kvm_ioctls::Error),
 								    /// Failed to get KVM vcpu XSAVE.
 								    VcpuGetXsave(kvm_ioctls::Error),
 								    /// Failed to set KVM vcpu XSAVE.
 								    VcpuSetXsave(kvm_ioctls::Error),
 								    /// Failed to get KVM vcpu XCRS.
 								    VcpuGetXcrs(kvm_ioctls::Error),
 								    /// Failed to set KVM vcpu XCRS.
 								    VcpuSetXcrs(kvm_ioctls::Error),
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								}
 								pub type Result<T> = result::Result<T, Error>;
 								/// Selects which register field of a CPUID entry `CpuidPatch::set_cpuid_reg` overwrites.
 								// NOTE(review): dead_code is presumably allowed because not every variant is constructed
 								// (the only use visible nearby is `CpuidReg::EDX`) — confirm before removing.
 								#[allow(dead_code)]
 								#[derive(Copy, Clone)]
 								enum CpuidReg {
 								    /// Targets the entry's `eax` field.
 								    EAX,
 								    /// Targets the entry's `ebx` field.
 								    EBX,
 								    /// Targets the entry's `ecx` field.
 								    ECX,
 								    /// Targets the entry's `edx` field.
 								    EDX,
 								}
 								/// Describes bits to set in every CPUID entry whose `function` and `index` both match.
 								///
 								/// Each `Some(n)` field makes `CpuidPatch::patch_cpuid` OR `1 << n` into the corresponding
 								/// field of the matching entries; a `None` field leaves that part of the entry untouched.
 								pub struct CpuidPatch {
 								    /// CPUID function (leaf) an entry must have to be patched.
 								    pub function: u32,
 								    /// CPUID index (sub-leaf) an entry must have to be patched.
 								    pub index: u32,
 								    /// Bit position to set in the entry's `flags` field, if any.
 								    pub flags_bit: Option<u8>,
 								    /// Bit position to set in the entry's `eax` field, if any.
 								    pub eax_bit: Option<u8>,
 								    /// Bit position to set in the entry's `ebx` field, if any.
 								    pub ebx_bit: Option<u8>,
 								    /// Bit position to set in the entry's `ecx` field, if any.
 								    pub ecx_bit: Option<u8>,
 								    /// Bit position to set in the entry's `edx` field, if any.
 								    pub edx_bit: Option<u8>,
 								}
 								impl CpuidPatch {
 								    /// Overwrites one register of every matching CPUID entry with `value`.
 								    ///
 								    /// An entry matches when its `function` equals `function` and, if `index` is
 								    /// `Some`, its `index` equals that value; `None` matches every index of the
 								    /// function.
 								    fn set_cpuid_reg(
 								        cpuid: &mut CpuId,
 								        function: u32,
 								        index: Option<u32>,
 								        reg: CpuidReg,
 								        value: u32,
 								    ) {
 								        let matching = cpuid.as_mut_slice().iter_mut().filter(|entry| {
 								            entry.function == function && index.map_or(true, |i| i == entry.index)
 								        });
 								        for entry in matching {
 								            match reg {
 								                CpuidReg::EAX => entry.eax = value,
 								                CpuidReg::EBX => entry.ebx = value,
 								                CpuidReg::ECX => entry.ecx = value,
 								                CpuidReg::EDX => entry.edx = value,
 								            }
 								        }
 								    }
 								    /// Applies every patch in `patches` to the entries of `cpuid` it matches.
 								    ///
 								    /// A patch matches an entry when both `function` and `index` are equal. For each
 								    /// `Some(bit)` field of a matching patch, `1 << bit` is OR-ed into the corresponding
 								    /// field of the entry; existing bits are never cleared.
 								    pub fn patch_cpuid(cpuid: &mut CpuId, patches: Vec<CpuidPatch>) {
 								        for entry in cpuid.as_mut_slice().iter_mut() {
 								            // Copy the key fields so the filter below does not keep a borrow of `entry`
 								            // alive while its registers are being modified.
 								            let (function, index) = (entry.function, entry.index);
 								            let applicable = patches
 								                .iter()
 								                .filter(|patch| patch.function == function && patch.index == index);
 								            for patch in applicable {
 								                if let Some(bit) = patch.flags_bit {
 								                    entry.flags |= 1 << bit;
 								                }
 								                if let Some(bit) = patch.eax_bit {
 								                    entry.eax |= 1 << bit;
 								                }
 								                if let Some(bit) = patch.ebx_bit {
 								                    entry.ebx |= 1 << bit;
 								                }
 								                if let Some(bit) = patch.ecx_bit {
 								                    entry.ecx |= 1 << bit;
 								                }
 								                if let Some(bit) = patch.edx_bit {
 								                    entry.edx |= 1 << bit;
 								                }
 								            }
 								        }
 								    }
 								}
-												ci: Run clippy for each specific feature

The build is run against "--all-features", "pci,acpi", "pci" and "mmio"
separately. The clippy validation must be run against the same set of
features in order to validate the code is correct.

Because of these new checks, this commit includes multiple fixes
related to the errors generated when manually running the checks.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-01-21 08:32:50 +00:00
+								#[cfg(feature = "acpi")]
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								#[repr(packed)]
 								/// Fixed-layout record describing one local APIC (entry type, entry length, processor id,
 								/// APIC id and flags).
 								// NOTE(review): presumably an ACPI MADT entry whose bytes are emitted verbatim; note that
 								// `repr(packed)` without `C` does not by itself promise field order — confirm.
 								struct LocalAPIC {
 								    pub r#type: u8,
 								    pub length: u8,
 								    pub processor_id: u8,
 								    pub apic_id: u8,
 								    pub flags: u32,
 								}
 								/// Fixed-layout record describing one I/O APIC (entry type, entry length, I/O APIC id,
 								/// a reserved byte, the APIC address and the GSI base).
 								// NOTE(review): presumably an ACPI MADT entry whose bytes are emitted verbatim; note that
 								// `repr(packed)` without `C` does not by itself promise field order — confirm.
 								#[repr(packed)]
 								#[derive(Default)]
 								struct IOAPIC {
 								    pub r#type: u8,
 								    pub length: u8,
 								    pub ioapic_id: u8,
 								    // Private filler byte; only ever set through `Default` from outside this module.
 								    _reserved: u8,
 								    pub apic_address: u32,
 								    pub gsi_base: u32,
 								}
 								/// Fixed-layout record describing an interrupt source override (entry type, entry length,
 								/// bus, source, GSI and flags).
 								// NOTE(review): presumably an ACPI MADT entry whose bytes are emitted verbatim; note that
 								// `repr(packed)` without `C` does not by itself promise field order — confirm.
 								#[repr(packed)]
 								#[derive(Default)]
 								struct InterruptSourceOverride {
 								    pub r#type: u8,
 								    pub length: u8,
 								    pub bus: u8,
 								    pub source: u8,
 								    pub gsi: u32,
 								    pub flags: u16,
 								}
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								/// A wrapper around creating and using a kvm-based VCPU.
 								pub struct Vcpu {
 								    /// KVM vCPU handle used to run the vCPU and to get/set its state.
 								    fd: VcpuFd,
 								    /// vCPU number; passed to KVM at creation and written into CPUID leaf 0xb by `configure`.
 								    id: u8,
 								    /// Bus that services port I/O exits (`IoIn` / `IoOut`) in `run`.
 								    io_bus: Arc<devices::Bus>,
 								    /// Bus that services MMIO exits (`MmioRead` / `MmioWrite`) in `run`.
 								    mmio_bus: Arc<devices::Bus>,
 								    /// Optional IOAPIC that is told about end-of-interrupt exits in `run`.
 								    ioapic: Option<Arc<Mutex<ioapic::Ioapic>>>,
 								    /// Reference instant; debug I/O port logging reports the time elapsed since it.
 								    vm_ts: std::time::Instant,
 								}
-												vmm: cpu: Get and set KVM vCPU state

These two new helpers will be useful to capture a vCPU state and to be
able to restore it at a later time.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-16 20:42:42 +00:00
+								#[derive(Clone, Serialize, Deserialize)]
 								/// Per-vCPU KVM state as gathered by `Vcpu::kvm_state` and consumed by
 								/// `Vcpu::set_kvm_state`.
 								pub struct VcpuKvmState {
 								    /// Model specific registers read with `get_msrs`.
 								    msrs: Msrs,
 								    /// vCPU events read with `get_vcpu_events`.
 								    vcpu_events: kvm_vcpu_events,
 								    /// Registers read with `get_regs`.
 								    regs: kvm_regs,
 								    /// Special registers read with `get_sregs`.
 								    sregs: kvm_sregs,
 								    /// FPU state read with `get_fpu`.
 								    fpu: kvm_fpu,
 								    /// Local APIC state read with `get_lapic`.
 								    lapic_state: kvm_lapic_state,
 								    /// XSAVE area read with `get_xsave`.
 								    xsave: kvm_xsave,
 								    /// Extended control registers read with `get_xcrs`.
 								    xcrs: kvm_xcrs,
 								    /// Multiprocessing state read with `get_mp_state`.
 								    mp_state: kvm_mp_state,
 								}
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								impl Vcpu {
 								    /// Constructs a new VCPU on the VM referred to by `fd`.
 								    ///
 								    /// # Arguments
 								    ///
 								    /// * `id` - Represents the CPU number between [0, max vcpus).
 								    /// * `fd` - The virtual machine this vcpu will get attached to.
 								    /// * `io_bus` - Bus stored on the vcpu; `run` dispatches port I/O exits to it.
 								    /// * `mmio_bus` - Bus stored on the vcpu; `run` dispatches MMIO exits to it.
 								    /// * `ioapic` - Optional IOAPIC; `run` notifies it on end-of-interrupt exits.
 								    /// * `creation_ts` - Stored as `vm_ts`; debug I/O port logs report time elapsed since it.
 								    ///
 								    /// # Errors
 								    ///
 								    /// Returns `Error::VcpuFd` when creating the KVM vcpu fails.
 								    pub fn new(
 								        id: u8,
 								        fd: &Arc<VmFd>,
 								        io_bus: Arc<devices::Bus>,
 								        mmio_bus: Arc<devices::Bus>,
 								        ioapic: Option<Arc<Mutex<ioapic::Ioapic>>>,
 								        creation_ts: std::time::Instant,
-												vmm: cpu: Track all Vcpus through CpuManager

In anticipation for the CpuManager to aggregate all Vcpu snapshots
together, this change makes sure the CpuManager has a handle onto
every vCPU.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-18 15:58:51 +00:00
+								    ) -> Result<Arc<Mutex<Self>>> {
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								        let kvm_vcpu = fd.create_vcpu(id).map_err(Error::VcpuFd)?;
 								        // No CPUID is programmed here; `configure` applies it later through `set_cpuid2`.
-												vmm: cpu: Track all Vcpus through CpuManager

In anticipation for the CpuManager to aggregate all Vcpu snapshots
together, this change makes sure the CpuManager has a handle onto
every vCPU.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-18 15:58:51 +00:00
+								        Ok(Arc::new(Mutex::new(Vcpu {
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								            fd: kvm_vcpu,
 								            id,
 								            io_bus,
 								            mmio_bus,
 								            ioapic,
 								            vm_ts: creation_ts,
-												vmm: cpu: Track all Vcpus through CpuManager

In anticipation for the CpuManager to aggregate all Vcpu snapshots
together, this change makes sure the CpuManager has a handle onto
every vCPU.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-18 15:58:51 +00:00
+								        })))
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								    }
 								    /// Configures a x86_64 specific vcpu and should be called once per vcpu from the vcpu's thread.
 								    ///
 								    /// # Arguments
 								    ///
 								    /// * `cpuid` - CPUID entries programmed into this vcpu, after EDX of every leaf 0xb entry is set to the vcpu id.
-												pvh: Introduce EntryPoint struct

In order to properly initialize the kvm regs/sregs structs for
the guest, the load_kernel() return type must specify which
boot protocol to use with the entry point address it returns.

Make load_kernel() return an EntryPoint struct containing the
required information. This structure will later be used
in the vCPU configuration methods to setup the appropriate
initial conditions for the guest.

Signed-off-by: Alejandro Jimenez <alejandro.j.jimenez@oracle.com>

											
										
										
											2020-02-12 03:37:33 +00:00
+								    /// * `kernel_entry_point` - Kernel entry point address in guest memory and boot protocol used. When `None`, the general, FPU and segment registers are not set up.
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								    /// * `vm_memory` - Guest memory handed to the segment register setup.
 								    ///
 								    /// # Errors
 								    ///
 								    /// Propagates the first failing setup step as the matching `Error` variant.
 								    pub fn configure(
 								        &mut self,
-												pvh: Introduce EntryPoint struct

In order to properly initialize the kvm regs/sregs structs for
the guest, the load_kernel() return type must specify which
boot protocol to use with the entry point address it returns.

Make load_kernel() return an EntryPoint struct containing the
required information. This structure will later be used
in the vCPU configuration methods to setup the appropriate
initial conditions for the guest.

Signed-off-by: Alejandro Jimenez <alejandro.j.jimenez@oracle.com>

											
										
										
											2020-02-12 03:37:33 +00:00
+								        kernel_entry_point: Option<EntryPoint>,
-												vmm: Move codebase to GuestMemoryAtomic from vm-memory

Relying on the latest vm-memory version, including the freshly
introduced structure GuestMemoryAtomic, this patch replaces every
occurrence of Arc<ArcSwap<GuestMemoryMmap> with
GuestMemoryAtomic<GuestMemoryMmap>.

The point is to rely on the common RCU-like implementation from
vm-memory so that we don't have to do it from Cloud-Hypervisor.

Fixes #735

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-02-11 16:22:40 +00:00
+								        vm_memory: &GuestMemoryAtomic<GuestMemoryMmap>,
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								        cpuid: CpuId,
 								    ) -> Result<()> {
 								        // Rebind mutably so the per-vcpu patch below can be applied to the caller's copy.
 								        let mut cpuid = cpuid;
 								        // Write this vcpu's id into EDX of every leaf 0xb entry (`None` matches all indexes).
 								        CpuidPatch::set_cpuid_reg(&mut cpuid, 0xb, None, CpuidReg::EDX, u32::from(self.id));
 								        self.fd
 								            .set_cpuid2(&cpuid)
 								            .map_err(Error::SetSupportedCpusFailed)?;
 								        arch::x86_64::regs::setup_msrs(&self.fd).map_err(Error::MSRSConfiguration)?;
-												pvh: Introduce EntryPoint struct

In order to properly initialize the kvm regs/sregs structs for
the guest, the load_kernel() return type must specify which
boot protocol to use with the entry point address it returns.

Make load_kernel() return an EntryPoint struct containing the
required information. This structure will later be used
in the vCPU configuration methods to setup the appropriate
initial conditions for the guest.

Signed-off-by: Alejandro Jimenez <alejandro.j.jimenez@oracle.com>

											
										
										
											2020-02-12 03:37:33 +00:00
+								        if let Some(kernel_entry_point) = kernel_entry_point {
-												vmm: cpu: Support only partially configuring the vCPU

When configuring a processor after boot as a hotplug CPU we only
configure a subset of the CPU state. In particular we should not
configure the FPU, segment registers (or reconfigure the paging which is
a side-effect of that) nor the main registers. Achieve this by making
the function take an Option type for the start address.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-27 17:18:10 +00:00
+								            // Only vcpus given an entry point get their general, FPU and segment registers set up.
 								            arch::x86_64::regs::setup_regs(
 								                &self.fd,
-												pvh: Introduce EntryPoint struct

In order to properly initialize the kvm regs/sregs structs for
the guest, the load_kernel() return type must specify which
boot protocol to use with the entry point address it returns.

Make load_kernel() return an EntryPoint struct containing the
required information. This structure will later be used
in the vCPU configuration methods to setup the appropriate
initial conditions for the guest.

Signed-off-by: Alejandro Jimenez <alejandro.j.jimenez@oracle.com>

											
										
										
											2020-02-12 03:37:33 +00:00
+								                kernel_entry_point.entry_addr.raw_value(),
-												vmm: cpu: Support only partially configuring the vCPU

When configuring a processor after boot as a hotplug CPU we only
configure a subset of the CPU state. In particular we should not
configure the FPU, segment registers (or reconfigure the paging which is
a side-effect of that) nor the main registers. Achieve this by making
the function take an Option type for the start address.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-27 17:18:10 +00:00
+								                arch::x86_64::layout::BOOT_STACK_POINTER.raw_value(),
 								                arch::x86_64::layout::ZERO_PAGE_START.raw_value(),
-												pvh: Initialize vCPU regs/sregs for PVH boot

Set the initial values of the KVM vCPU registers as specified in
the PVH boot ABI:

https://xenbits.xen.org/docs/unstable/misc/pvh.html

Signed-off-by: Alejandro Jimenez <alejandro.j.jimenez@oracle.com>

											
										
										
											2020-02-12 04:48:09 +00:00
+								                kernel_entry_point.protocol,
-												vmm: cpu: Support only partially configuring the vCPU

When configuring a processor after boot as a hotplug CPU we only
configure a subset of the CPU state. In particular we should not
configure the FPU, segment registers (or reconfigure the paging which is
a side-effect of that) nor the main registers. Achieve this by making
the function take an Option type for the start address.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-27 17:18:10 +00:00
+								            )
 								            .map_err(Error::REGSConfiguration)?;
 								            arch::x86_64::regs::setup_fpu(&self.fd).map_err(Error::FPUConfiguration)?;
-												pvh: Initialize vCPU regs/sregs for PVH boot

Set the initial values of the KVM vCPU registers as specified in
the PVH boot ABI:

https://xenbits.xen.org/docs/unstable/misc/pvh.html

Signed-off-by: Alejandro Jimenez <alejandro.j.jimenez@oracle.com>

											
										
										
											2020-02-12 04:48:09 +00:00
+								            arch::x86_64::regs::setup_sregs(
 								                &vm_memory.memory(),
 								                &self.fd,
 								                kernel_entry_point.protocol,
 								            )
 								            .map_err(Error::SREGSConfiguration)?;
-												vmm: cpu: Support only partially configuring the vCPU

When configuring a processor after boot as a hotplug CPU we only
configure a subset of the CPU state. In particular we should not
configure the FPU, segment registers (or reconfigure the paging which is
a side-effect of that) nor the main registers. Achieve this by making
the function take an Option type for the start address.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-27 17:18:10 +00:00
+								        }
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								        arch::x86_64::interrupts::set_lint(&self.fd).map_err(Error::LocalIntConfiguration)?; // Runs with or without an entry point.
 								        Ok(())
 								    }
 								    /// Runs the VCPU until it exits and services the exit.
 								    ///
 								    /// Note that the state of the VCPU and associated VM must be setup first for this to do
 								    /// anything useful.
 								    ///
 								    /// # Returns
 								    ///
 								    /// * `Ok(true)` - the exit was handled (port I/O, MMIO, IOAPIC EOI) or the run was
 								    ///   interrupted with `EAGAIN` / `EINTR`.
 								    /// * `Ok(false)` - the vcpu reported a `Shutdown` exit.
 								    ///
 								    /// # Errors
 								    ///
 								    /// Returns `Error::VcpuUnhandledKvmExit` for any other exit reason or run error, after
 								    /// logging it.
 								    pub fn run(&self) -> Result<bool> {
 								        match self.fd.run() {
 								            Ok(run) => match run {
 								                VcpuExit::IoIn(addr, data) => {
 								                    self.io_bus.read(u64::from(addr), data);
 								                    Ok(true)
 								                }
 								                VcpuExit::IoOut(addr, data) => {
 								                    // Single-byte writes to the debug port are logged before being forwarded.
 								                    if addr == DEBUG_IOPORT && data.len() == 1 {
 								                        self.log_debug_ioport(data[0]);
 								                    }
 								                    self.io_bus.write(u64::from(addr), data);
 								                    Ok(true)
 								                }
 								                VcpuExit::MmioRead(addr, data) => {
 								                    self.mmio_bus.read(addr as u64, data);
 								                    Ok(true)
 								                }
 								                VcpuExit::MmioWrite(addr, data) => {
 								                    self.mmio_bus.write(addr as u64, data);
 								                    Ok(true)
 								                }
 								                VcpuExit::IoapicEoi(vector) => {
 								                    // Without an IOAPIC the exit is acknowledged and otherwise ignored.
 								                    if let Some(ioapic) = &self.ioapic {
 								                        ioapic.lock().unwrap().end_of_interrupt(vector);
 								                    }
 								                    Ok(true)
 								                }
 								                VcpuExit::Shutdown => {
 								                    // Triple fault to trigger a reboot
 								                    Ok(false)
 								                }
 								                r => {
 								                    error!("Unexpected exit reason on vcpu run: {:?}", r);
 								                    Err(Error::VcpuUnhandledKvmExit)
 								                }
 								            },
-												cargo: Bump the kvm and vmm-sys-util crates

Since the kvm crates now depend on vmm-sys-util, the bump must be
atomic.
The kvm-bindings and ioctls 0.2.0 and 0.4.0 crates come with a few API
changes, one of them being the use of a kvm_ioctls specific error type.
Porting our code to that type makes for a fairly large diff stat.

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2019-11-29 15:36:33 +00:00
+								            Err(ref e) => match e.errno() {
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								                libc::EAGAIN | libc::EINTR => Ok(true),
 								                _ => {
 								                    error!("VCPU {:?} error {:?}", self.id, e);
 								                    Err(Error::VcpuUnhandledKvmExit)
 								                }
 								            },
 								        }
 								    }
 								    /// Logs a code written to the debug I/O port together with the time elapsed since
 								    /// `vm_ts`, formatted as `<seconds>.<microseconds>`.
 								    fn log_debug_ioport(&self, code: u8) {
 								        let elapsed = self.vm_ts.elapsed();
 								        debug!(
 								            "[{} code 0x{:x}] {}.{:>06} seconds",
 								            DebugIoPortRange::from_u8(code),
 								            code,
 								            elapsed.as_secs(),
 								            // Fractional part only: `as_micros()` is the total duration in microseconds
 								            // and would repeat the whole seconds after the decimal point.
 								            elapsed.subsec_micros()
 								        );
 								    }
-												vmm: cpu: Get and set KVM vCPU state

These two new helpers will be useful to capture a vCPU state and to be
able to restore it at a later time.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-16 20:42:42 +00:00
 								    #[allow(unused)]
 								    fn kvm_state(&self) -> Result<VcpuKvmState> {
 								        let mut msrs = arch::x86_64::regs::boot_msr_entries();
 								        self.fd.get_msrs(&mut msrs).map_err(Error::VcpuGetMsrs)?;
 								        let vcpu_events = self
 								            .fd
 								            .get_vcpu_events()
 								            .map_err(Error::VcpuGetVcpuEvents)?;
 								        let regs = self.fd.get_regs().map_err(Error::VcpuGetRegs)?;
 								        let sregs = self.fd.get_sregs().map_err(Error::VcpuGetSregs)?;
 								        let lapic_state = self.fd.get_lapic().map_err(Error::VcpuGetLapic)?;
 								        let fpu = self.fd.get_fpu().map_err(Error::VcpuGetFpu)?;
 								        let xsave = self.fd.get_xsave().map_err(Error::VcpuGetXsave)?;
 								        let xcrs = self.fd.get_xcrs().map_err(Error::VcpuGetXsave)?;
 								        let mp_state = self.fd.get_mp_state().map_err(Error::VcpuGetMpState)?;
 								        Ok(VcpuKvmState {
 								            msrs,
 								            vcpu_events,
 								            regs,
 								            sregs,
 								            fpu,
 								            lapic_state,
 								            xsave,
 								            xcrs,
 								            mp_state,
 								        })
 								    }
 								    #[allow(unused)]
 								    fn set_kvm_state(&mut self, state: &VcpuKvmState) -> Result<()> {
 								        self.fd.set_regs(&state.regs).map_err(Error::VcpuSetRegs)?;
 								        self.fd.set_fpu(&state.fpu).map_err(Error::VcpuSetFpu)?;
 								        self.fd
 								            .set_xsave(&state.xsave)
 								            .map_err(Error::VcpuSetXsave)?;
 								        self.fd
 								            .set_sregs(&state.sregs)
 								            .map_err(Error::VcpuSetSregs)?;
 								        self.fd.set_xcrs(&state.xcrs).map_err(Error::VcpuSetXcrs)?;
 								        self.fd.set_msrs(&state.msrs).map_err(Error::VcpuSetMsrs)?;
 								        self.fd
 								            .set_lapic(&state.lapic_state)
 								            .map_err(Error::VcpuSetLapic)?;
 								        self.fd
 								            .set_mp_state(state.mp_state)
 								            .map_err(Error::VcpuSetMpState)?;
 								        Ok(())
 								    }
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								}
 								/// VM-wide vCPU bookkeeping. It also implements `BusDevice`, through which the status
 								/// flags of the currently selected vCPU can be read.
 								pub struct CpuManager {
 								    // NOTE(review): presumably the number of vCPUs started at boot — confirm.
 								    boot_vcpus: u8,
-												vmm: cpu: Introduce concept of maximum vs boot vCPUs in CpuManager

For now the max vCPUs is the same as the boot vCPUs.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-25 13:55:10 +00:00
+								    max_vcpus: u8, // NOTE(review): presumably the upper bound on vCPUs — confirm.
-												vmm: Remove all Weak references from CpuManager

Now that the BusDevice devices are stored as Weak references by the
IO and MMIO buses, there's no need to use Weak references from the
CpuManager anymore.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-03-04 15:19:37 +00:00
+								    io_bus: Arc<devices::Bus>, // Same type as the `io_bus` argument of `Vcpu::new`.
-												Revert "vmm: Move CpuManager device to MMIO region"

This reverts commit 980e03fa0ab3d217fe91fd60d8459507c903d88b.

											
										
										
											2020-01-24 10:36:39 +00:00
+								    mmio_bus: Arc<devices::Bus>, // Same type as the `mmio_bus` argument of `Vcpu::new`.
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								    ioapic: Option<Arc<Mutex<ioapic::Ioapic>>>, // Same type as the `ioapic` argument of `Vcpu::new`.
-												vmm: Move codebase to GuestMemoryAtomic from vm-memory

Relying on the latest vm-memory version, including the freshly
introduced structure GuestMemoryAtomic, this patch replaces every
occurrence of Arc<ArcSwap<GuestMemoryMmap> with
GuestMemoryAtomic<GuestMemoryMmap>.

The point is to rely on the common RCU-like implementation from
vm-memory so that we don't have to do it from Cloud-Hypervisor.

Fixes #735

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-02-11 16:22:40 +00:00
+								    vm_memory: GuestMemoryAtomic<GuestMemoryMmap>, // Same type `Vcpu::configure` borrows as `vm_memory`.
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								    cpuid: CpuId, // Same type `Vcpu::configure` takes as `cpuid`.
 								    // Handle to the VM; `Vcpu::new` takes a reference to a value of this type.
 								    fd: Arc<VmFd>,
 								    // NOTE(review): shared flags, presumably polled by the vCPU threads — confirm.
 								    vcpus_kill_signalled: Arc<AtomicBool>,
 								    vcpus_pause_signalled: Arc<AtomicBool>,
 								    // NOTE(review): presumably signalled to request a VM reset — confirm.
 								    reset_evt: EventFd,
-												vmm: cpu: Encapsulate vCPU state into its own struct

Currently this just holds the thread handle but will be enlarged to
encompass details such as whether the vCPU is currently being inserted
or ejected.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 11:32:36 +00:00
+								    vcpu_states: Vec<VcpuState>, // Per-vCPU state; the bus read handler indexes it by `selected_cpu`.
-												vmm: cpu & acpi: Query CPU manager for CPU status

Rather than hardcode the CPU status for all the CPUs instead query from
the CPU manager via the I/O port that is is on via the ACPI tables.

Each CPU device has a _STA method that calls into the CSTA method which
reads and writes the I/O ports via the PRST field which exposes the I/O
port through and OpRegion.

As we only support boot CPUS report that all the CPUs are enabled for
now.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-20 14:06:37 +00:00
+								    selected_cpu: u8, // Index of the vCPU whose status the bus read handler reports.
-												vmm: cpu: Track all Vcpus through CpuManager

In anticipation for the CpuManager to aggregate all Vcpu snapshots
together, this change makes sure the CpuManager has a handle onto
every vCPU.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-18 15:58:51 +00:00
+								    vcpus: Vec<Arc<Mutex<Vcpu>>>, // Shared handles to `Vcpu` values, the same type `Vcpu::new` returns.
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								}
-												vmm: cpu & acpi: Query CPU manager for CPU status

Rather than hardcode the CPU status for all the CPUs, instead query it from
the CPU manager, through the ACPI tables, via the I/O port that it is on.

Each CPU device has a _STA method that calls into the CSTA method which
reads and writes the I/O ports via the PRST field which exposes the I/O
port through an OpRegion.

As we only support boot CPUS report that all the CPUs are enabled for
now.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-20 14:06:37 +00:00
+								const CPU_ENABLE_FLAG: usize = 0; // Bit position set in the status byte when the selected vCPU is active.
-												vmm: cpu: Only do ACPI notify on newly added vCPUs

When we add a vCPU set an "inserting" boolean that is exposed as an ACPI
field that will be checked for and reset when the ACPI GED notification
for CPU devices happens.

This change is a precursor for CPU unplug.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:42:29 +00:00
+								const CPU_INSERTING_FLAG: usize = 1; // Bit position set in the status byte while the selected vCPU's `inserting` is true.
-												vmm: cpu: Notify guest OS that it should offline vCPUs

Allow the resizing of the number of vCPUs to less than the current
active vCPUs. This does not currently remove them from the system but
the kernel will take them offline.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-17 10:49:05 +00:00
+								const CPU_REMOVING_FLAG: usize = 2; // Bit position set in the status byte while the selected vCPU's `removing` is true.
-												vmm: cpu: Implement CPU removal

When the running OS has been told that a CPU should be removed it will
shut down the CPU and then signal to the hypervisor via the "_EJ0" method
on the device that ultimately writes into an I/O port that the vCPU
should be shut down. Upon notification the hypervisor signals to the
individual thread that it should shut down and waits for that thread to
end.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-17 11:22:33 +00:00
+								const CPU_EJECT_FLAG: usize = 3; // NOTE(review): usage is outside the visible code; presumably another bit position in the same status byte — confirm.
-												vmm: cpu & acpi: Query CPU manager for CPU status

Rather than hardcode the CPU status for all the CPUs, instead query it from
the CPU manager, through the ACPI tables, via the I/O port that it is on.

Each CPU device has a _STA method that calls into the CSTA method which
reads and writes the I/O ports via the PRST field which exposes the I/O
port through an OpRegion.

As we only support boot CPUS report that all the CPUs are enabled for
now.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-20 14:06:37 +00:00
 								// Offset, within the CpuManager bus device, at which a read returns the status flags of
 								// the selected vCPU.
 								const CPU_STATUS_OFFSET: u64 = 4;
 								// NOTE(review): usage is outside the visible code; presumably the offset used to choose
 								// `selected_cpu` — confirm.
 								const CPU_SELECTION_OFFSET: u64 = 0;
-												vmm: cpu: Add the CpuManager onto the IO bus

This allows the kernel (via ACPI based controls) to query and control
the CPU state.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 14:56:10 +00:00
+								impl BusDevice for CpuManager {
-												vmm: cpu & acpi: Query CPU manager for CPU status

Rather than hardcode the CPU status for all the CPUs, instead query it from
the CPU manager, through the ACPI tables, via the I/O port that it is on.

Each CPU device has a _STA method that calls into the CSTA method which
reads and writes the I/O ports via the PRST field which exposes the I/O
port through an OpRegion.

As we only support boot CPUS report that all the CPUs are enabled for
now.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-20 14:06:37 +00:00
+								    fn read(&mut self, _base: u64, offset: u64, data: &mut [u8]) {
 								        match offset {
 								            CPU_STATUS_OFFSET => {
-												vmm: cpu: Encapsulate vCPU state into its own struct

Currently this just holds the thread handle but will be enlarged to
encompass details such as whether the vCPU is currently being inserted
or ejected.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 11:32:36 +00:00
+								                if self.selected_cpu < self.present_vcpus() {
 								                    let state = &self.vcpu_states[usize::from(self.selected_cpu)];
 								                    if state.active() {
 								                        data[0] |= 1 << CPU_ENABLE_FLAG;
 								                    }
-												vmm: cpu: Only do ACPI notify on newly added vCPUs

When we add a vCPU set an "inserting" boolean that is exposed as an ACPI
field that will be checked for and reset when the ACPI GED notification
for CPU devices happens.

This change is a precursor for CPU unplug.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:42:29 +00:00
+								                    if state.inserting {
 								                        data[0] |= 1 << CPU_INSERTING_FLAG;
 								                    }
-												vmm: cpu: Notify guest OS that it should offline vCPUs

Allow the resizing of the number of vCPUs to less than the current
active vCPUs. This does not currently remove them from the system but
the kernel will take them offline.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-17 10:49:05 +00:00
+								                    if state.removing {
 								                        data[0] |= 1 << CPU_REMOVING_FLAG;
 								                    }
-												vmm: cpu: Encapsulate vCPU state into its own struct

Currently this just holds the thread handle but will be enlarged to
encompass details such as whether the vCPU is currently being inserted
or ejected.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 11:32:36 +00:00
+								                }
-												vmm: cpu & acpi: Query CPU manager for CPU status

Rather than hardcode the CPU status for all the CPUs, instead query it from
the CPU manager via the I/O port that it is on via the ACPI tables.

Each CPU device has a _STA method that calls into the CSTA method which
reads and writes the I/O ports via the PRST field which exposes the I/O
port through an OpRegion.

As we only support boot CPUs, report that all the CPUs are enabled for
now.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-20 14:06:37 +00:00
+								            }
 								            _ => {
 								                warn!(
 								                    "Unexpected offset for accessing CPU manager device: {:#}",
 								                    offset
 								                );
 								            }
 								        }
 								    }
-												vmm: cpu: Add the CpuManager onto the IO bus

This allows the kernel (via ACPI based controls) to query and control
the CPU state.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 14:56:10 +00:00
-												vmm: cpu & acpi: Query CPU manager for CPU status

Rather than hardcode the CPU status for all the CPUs, instead query it from
the CPU manager via the I/O port that it is on via the ACPI tables.

Each CPU device has a _STA method that calls into the CSTA method which
reads and writes the I/O ports via the PRST field which exposes the I/O
port through an OpRegion.

As we only support boot CPUs, report that all the CPUs are enabled for
now.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-20 14:06:37 +00:00
+								    fn write(&mut self, _base: u64, offset: u64, data: &[u8]) {
 								        match offset {
 								            CPU_SELECTION_OFFSET => {
 								                self.selected_cpu = data[0];
 								            }
-												vmm: cpu: Only do ACPI notify on newly added vCPUs

When we add a vCPU set an "inserting" boolean that is exposed as an ACPI
field that will be checked for and reset when the ACPI GED notification
for CPU devices happens.

This change is a precursor for CPU unplug.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:42:29 +00:00
+								            CPU_STATUS_OFFSET => {
 								                let state = &mut self.vcpu_states[usize::from(self.selected_cpu)];
 								                // The ACPI code writes back a 1 to acknowledge the insertion
 								                if (data[0] & (1 << CPU_INSERTING_FLAG) == 1 << CPU_INSERTING_FLAG)
 								                    && state.inserting
 								                {
 								                    state.inserting = false;
 								                }
-												vmm: cpu: Notify guest OS that it should offline vCPUs

Allow the resizing of the number of vCPUs to less than the current
active vCPUs. This does not currently remove them from the system but
the kernel will take them offline.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-17 10:49:05 +00:00
+								                // Ditto for removal
 								                if (data[0] & (1 << CPU_REMOVING_FLAG) == 1 << CPU_REMOVING_FLAG) && state.removing
 								                {
 								                    state.removing = false;
 								                }
-												vmm: cpu: Implement CPU removal

When the running OS has been told that a CPU should be removed it will
shut down the CPU and then signal to the hypervisor via the "_EJ0" method
on the device that ultimately writes into an I/O port that the vCPU
should be shut down. Upon notification the hypervisor signals to the
individual thread that it should shut down and waits for that thread to
end.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-17 11:22:33 +00:00
+								                // Trigger removal of vCPU
 								                if data[0] & (1 << CPU_EJECT_FLAG) == 1 << CPU_EJECT_FLAG {
 								                    if let Err(e) = self.remove_vcpu(self.selected_cpu) {
 								                        error!("Error removing vCPU: {:?}", e);
 								                    }
 								                }
-												vmm: cpu: Only do ACPI notify on newly added vCPUs

When we add a vCPU set an "inserting" boolean that is exposed as an ACPI
field that will be checked for and reset when the ACPI GED notification
for CPU devices happens.

This change is a precursor for CPU unplug.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:42:29 +00:00
+								            }
-												vmm: cpu & acpi: Query CPU manager for CPU status

Rather than hardcode the CPU status for all the CPUs, instead query it from
the CPU manager via the I/O port that it is on via the ACPI tables.

Each CPU device has a _STA method that calls into the CSTA method which
reads and writes the I/O ports via the PRST field which exposes the I/O
port through an OpRegion.

As we only support boot CPUs, report that all the CPUs are enabled for
now.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-20 14:06:37 +00:00
+								            _ => {
 								                warn!(
 								                    "Unexpected offset for accessing CPU manager device: {:#}",
 								                    offset
 								                );
 								            }
 								        }
 								    }
-												vmm: cpu: Add the CpuManager onto the IO bus

This allows the kernel (via ACPI based controls) to query and control
the CPU state.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 14:56:10 +00:00
+								}
-												vmm: cpu: Create vCPU state for all possible vCPUs

This will make it more straightforward when we attempt to remove vCPUs.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 17:15:25 +00:00
+								#[derive(Default)]
-												vmm: cpu: Encapsulate vCPU state into its own struct

Currently this just holds the thread handle but will be enlarged to
encompass details such as whether the vCPU is currently being inserted
or ejected.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 11:32:36 +00:00
+								struct VcpuState {
-												vmm: cpu: Only do ACPI notify on newly added vCPUs

When we add a vCPU set an "inserting" boolean that is exposed as an ACPI
field that will be checked for and reset when the ACPI GED notification
for CPU devices happens.

This change is a precursor for CPU unplug.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:42:29 +00:00
+								    inserting: bool,
-												vmm: cpu: Notify guest OS that it should offline vCPUs

Allow the resizing of the number of vCPUs to less than the current
active vCPUs. This does not currently remove them from the system but
the kernel will take them offline.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-17 10:49:05 +00:00
+								    removing: bool,
-												vmm: cpu: Encapsulate vCPU state into its own struct

Currently this just holds the thread handle but will be enlarged to
encompass details such as whether the vCPU is currently being inserted
or ejected.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 11:32:36 +00:00
+								    handle: Option<thread::JoinHandle<()>>,
-												vmm: cpu: Implement CPU removal

When the running OS has been told that a CPU should be removed it will
shut down the CPU and then signal to the hypervisor via the "_EJ0" method
on the device that ultimately writes into an I/O port that the vCPU
should be shut down. Upon notification the hypervisor signals to the
individual thread that it should shut down and waits for that thread to
end.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-17 11:22:33 +00:00
+								    kill: Arc<AtomicBool>,
-												vmm: cpu: Encapsulate vCPU state into its own struct

Currently this just holds the thread handle but will be enlarged to
encompass details such as whether the vCPU is currently being inserted
or ejected.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 11:32:36 +00:00
+								}
 								impl VcpuState {
 								    fn active(&self) -> bool {
 								        self.handle.is_some()
 								    }
 								    fn signal_thread(&self) {
 								        if let Some(handle) = self.handle.as_ref() {
 								            unsafe {
-												vmm: Port to latest vmm-sys-util

The signal handling for vCPU signals has changed in the latest release
so switch to the new API.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-11 13:02:07 +00:00
+								                libc::pthread_kill(handle.as_pthread_t(), SIGRTMIN());
-												vmm: cpu: Encapsulate vCPU state into its own struct

Currently this just holds the thread handle but will be enlarged to
encompass details such as whether the vCPU is currently being inserted
or ejected.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 11:32:36 +00:00
+								            }
 								        }
 								    }
 								    fn join_thread(&mut self) -> Result<()> {
 								        if let Some(handle) = self.handle.take() {
-												vmm: Fix map_err losing the inner error

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-01-24 08:34:51 +00:00
+								            handle.join().map_err(Error::ThreadCleanup)?
-												vmm: cpu: Encapsulate vCPU state into its own struct

Currently this just holds the thread handle but will be enlarged to
encompass details such as whether the vCPU is currently being inserted
or ejected.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 11:32:36 +00:00
+								        }
 								        Ok(())
 								    }
 								    fn unpark_thread(&self) {
 								        if let Some(handle) = self.handle.as_ref() {
 								            handle.thread().unpark()
 								        }
 								    }
 								}
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								impl CpuManager {
 								    pub fn new(
-												vmm: cpu: Pass CpusConfig to simplify the new() prototype

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-03-16 17:14:15 +00:00
+								        config: &CpusConfig,
-												vmm: Move DeviceManager into an Arc<Mutex<>>

In anticipation of the support for device hotplug, this commit moves the
DeviceManager object into an Arc<Mutex<>> when the DeviceManager is
being created. The reason is, we need the DeviceManager to implement the
BusDevice trait and then provide it to the IO bus, so that IO accesses
related to device hotplug can be handled correctly.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-02-27 09:29:03 +00:00
+								        device_manager: &Arc<Mutex<DeviceManager>>,
-												vmm: Move codebase to GuestMemoryAtomic from vm-memory

Relying on the latest vm-memory version, including the freshly
introduced structure GuestMemoryAtomic, this patch replaces every
occurrence of Arc<ArcSwap<GuestMemoryMmap>> with
GuestMemoryAtomic<GuestMemoryMmap>.

The point is to rely on the common RCU-like implementation from
vm-memory so that we don't have to do it from Cloud-Hypervisor.

Fixes #735

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-02-11 16:22:40 +00:00
+								        guest_memory: GuestMemoryAtomic<GuestMemoryMmap>,
-												vmm: cpu: Move CPUID patching to CpuManager

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-03-16 15:15:38 +00:00
+								        kvm: &Kvm,
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								        fd: Arc<VmFd>,
 								        reset_evt: EventFd,
-												vmm: cpu: Add the CpuManager onto the IO bus

This allows the kernel (via ACPI based controls) to query and control
the CPU state.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 14:56:10 +00:00
+								    ) -> Result<Arc<Mutex<CpuManager>>> {
-												vmm: cpu: Pass CpusConfig to simplify the new() prototype

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-03-16 17:14:15 +00:00
+								        let mut vcpu_states = Vec::with_capacity(usize::from(config.max_vcpus));
 								        vcpu_states.resize_with(usize::from(config.max_vcpus), VcpuState::default);
-												vmm: cpu: Create vCPU state for all possible vCPUs

This will make it more straightforward when we attempt to remove vCPUs.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 17:15:25 +00:00
-												vmm: Move DeviceManager into an Arc<Mutex<>>

In anticipation of the support for device hotplug, this commit moves the
DeviceManager object into an Arc<Mutex<>> when the DeviceManager is
being created. The reason is, we need the DeviceManager to implement the
BusDevice trait and then provide it to the IO bus, so that IO accesses
related to device hotplug can be handled correctly.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-02-27 09:29:03 +00:00
+								        let device_manager = device_manager.lock().unwrap();
-												vmm: cpu: Move CPUID patching to CpuManager

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-03-16 15:15:38 +00:00
+								        let cpuid = CpuManager::patch_cpuid(kvm)?;
-												vmm: Encase CpuManager within an Arc<Mutex<>>

This is necessary to be able to add the CpuManager onto the IO bus.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 14:31:11 +00:00
+								        let cpu_manager = Arc::new(Mutex::new(CpuManager {
-												vmm: cpu: Pass CpusConfig to simplify the new() prototype

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-03-16 17:14:15 +00:00
+								            boot_vcpus: config.boot_vcpus,
 								            max_vcpus: config.max_vcpus,
-												vmm: Remove all Weak references from DeviceManager

Now that the BusDevice devices are stored as Weak references by the
IO and MMIO buses, there's no need to use Weak references from the
DeviceManager anymore.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-03-04 15:24:15 +00:00
+								            io_bus: device_manager.io_bus().clone(),
-												Revert "vmm: Move CpuManager device to MMIO region"

This reverts commit 980e03fa0ab3d217fe91fd60d8459507c903d88b.

											
										
										
											2020-01-24 10:36:39 +00:00
+								            mmio_bus: device_manager.mmio_bus().clone(),
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								            ioapic: device_manager.ioapic().clone(),
 								            vm_memory: guest_memory,
 								            cpuid,
 								            fd,
 								            vcpus_kill_signalled: Arc::new(AtomicBool::new(false)),
 								            vcpus_pause_signalled: Arc::new(AtomicBool::new(false)),
-												vmm: cpu: Create vCPU state for all possible vCPUs

This will make it more straightforward when we attempt to remove vCPUs.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 17:15:25 +00:00
+								            vcpu_states,
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								            reset_evt,
-												vmm: cpu & acpi: Query CPU manager for CPU status

Rather than hardcode the CPU status for all the CPUs, instead query it from
the CPU manager via the I/O port that it is on via the ACPI tables.

Each CPU device has a _STA method that calls into the CSTA method which
reads and writes the I/O ports via the PRST field which exposes the I/O
port through an OpRegion.

As we only support boot CPUs, report that all the CPUs are enabled for
now.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-20 14:06:37 +00:00
+								            selected_cpu: 0,
-												vmm: cpu: Track all Vcpus through CpuManager

In anticipation for the CpuManager to aggregate all Vcpu snapshots
together, this change makes sure the CpuManager has a handle onto
every vCPU.

Signed-off-by: Cathy Zhang <cathy.zhang@intel.com>
Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-02-18 15:58:51 +00:00
+								            vcpus: Vec::with_capacity(usize::from(config.max_vcpus)),
-												vmm: Encase CpuManager within an Arc<Mutex<>>

This is necessary to be able to add the CpuManager onto the IO bus.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 14:31:11 +00:00
+								        }));
-												Revert "vmm: Move CpuManager device to MMIO region"

This reverts commit 980e03fa0ab3d217fe91fd60d8459507c903d88b.

											
										
										
											2020-01-24 10:36:39 +00:00
+								        device_manager
 								            .allocator()
 								            .lock()
 								            .unwrap()
 								            .allocate_io_addresses(Some(GuestAddress(0x0cd8)), 0x8, None)
 								            .ok_or(Error::AllocateIOPort)?;
-												vmm: Encase CpuManager within an Arc<Mutex<>>

This is necessary to be able to add the CpuManager onto the IO bus.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 14:31:11 +00:00
+								        cpu_manager
-												vmm: cpu: Add the CpuManager onto the IO bus

This allows the kernel (via ACPI based controls) to query and control
the CPU state.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 14:56:10 +00:00
+								            .lock()
 								            .unwrap()
-												Revert "vmm: Move CpuManager device to MMIO region"

This reverts commit 980e03fa0ab3d217fe91fd60d8459507c903d88b.

											
										
										
											2020-01-24 10:36:39 +00:00
+								            .io_bus
 								            .insert(cpu_manager.clone(), 0x0cd8, 0xc)
-												vmm: cpu: Add the CpuManager onto the IO bus

This allows the kernel (via ACPI based controls) to query and control
the CPU state.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 14:56:10 +00:00
+								            .map_err(Error::BusError)?;
 								        Ok(cpu_manager)
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								    }
-												vmm: cpu: Move CPUID patching to CpuManager

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2020-03-16 15:15:38 +00:00
+								    /// Builds the CPUID table used when configuring vCPUs.
 								    ///
 								    /// Queries the CPUID entries KVM reports as supported and applies two
 								    /// patches on top of them, both targeting an ECX bit of function 1,
 								    /// index 0: the TSC deadline timer bit and the hypervisor bit.
 								    ///
 								    /// # Errors
 								    ///
 								    /// Returns `Error::PatchCpuId` if querying the supported CPUID fails.
 								    fn patch_cpuid(kvm: &Kvm) -> Result<CpuId> {
 								        // Every patch here differs only in which ECX bit it targets.
 								        let ecx_patch = |bit: u8| CpuidPatch {
 								            function: 1,
 								            index: 0,
 								            flags_bit: None,
 								            eax_bit: None,
 								            ebx_bit: None,
 								            ecx_bit: Some(bit),
 								            edx_bit: None,
 								        };
 								        let patches = vec![
 								            // Patch tsc deadline timer bit
 								            ecx_patch(TSC_DEADLINE_TIMER_ECX_BIT),
 								            // Patch hypervisor bit
 								            ecx_patch(HYPERVISOR_ECX_BIT),
 								        ];
 								        // Start from the supported CPUID and patch it in place.
 								        let mut supported = kvm
 								            .get_supported_cpuid(kvm_bindings::KVM_MAX_CPUID_ENTRIES)
 								            .map_err(Error::PatchCpuId)?;
 								        CpuidPatch::patch_cpuid(&mut supported, patches);
 								        Ok(supported)
 								    }
-												vmm: cpu: Factorize vcpu starting code

Anticipating the need for a slightly different function for restoring
vCPUs, this patch factorizes most of the vCPU creation, so that it can
be reused for migration purposes.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-04-03 12:27:41 +00:00
+								    /// Creates, configures and starts the thread for a single vCPU.
 								    ///
 								    /// The new `Vcpu` is configured with `entry_point`, the guest memory and a
 								    /// copy of the patched CPUID, recorded in `self.vcpus`, and then run on a
 								    /// dedicated thread named `vcpu<cpu_id>`. The thread waits on
 								    /// `vcpu_thread_barrier` before entering its run loop, so the caller must
 								    /// also wait on that barrier to release it. The thread handle and the
 								    /// `inserting` flag are stored in `self.vcpu_states[cpu_id]`.
 								    ///
 								    /// # Errors
 								    ///
 								    /// Propagates any error from `Vcpu::new` and returns `Error::VcpuSpawn`
 								    /// if the thread cannot be spawned.
 								    ///
 								    /// # Panics
 								    ///
 								    /// Panics if the reset `EventFd` cannot be cloned, if configuring the
 								    /// vCPU fails, or if `cpu_id` is out of range for `self.vcpu_states`.
 								    fn start_vcpu(
 								        &mut self,
 								        cpu_id: u8,
 								        creation_ts: std::time::Instant,
 								        vcpu_thread_barrier: Arc<Barrier>,
 								        entry_point: Option<EntryPoint>,
 								        inserting: bool,
 								    ) -> Result<()> {
 								        // Cloning the Option clones the inner handle when there is one.
 								        let ioapic = self.ioapic.clone();
 								        let vcpu = Vcpu::new(
 								            cpu_id,
 								            &self.fd,
 								            self.io_bus.clone(),
 								            self.mmio_bus.clone(),
 								            ioapic,
 								            creation_ts,
 								        )?;
 								        // Everything the vCPU thread needs is cloned here because the
 								        // closure below is `move` and cannot borrow from `self`.
 								        let reset_evt = self.reset_evt.try_clone().unwrap();
 								        let vcpu_kill_signalled = self.vcpus_kill_signalled.clone();
 								        let vcpu_pause_signalled = self.vcpus_pause_signalled.clone();
 								        let vcpu_kill = self.vcpu_states[usize::from(cpu_id)].kill.clone();
 								        let vm_memory = self.vm_memory.clone();
 								        vcpu.lock()
 								            .unwrap()
 								            .configure(entry_point, &vm_memory, self.cpuid.clone())
 								            .expect("Failed to configure vCPU");
 								        // Keep a handle on the vCPU in the manager; the thread owns the other.
 								        let vcpu_clone = Arc::clone(&vcpu);
 								        self.vcpus.push(vcpu_clone);
 								        let handle = Some(
 								            thread::Builder::new()
 								                .name(format!("vcpu{}", cpu_id))
 								                .spawn(move || {
 								                    extern "C" fn handle_signal(_: i32, _: *mut siginfo_t, _: *mut c_void) {}
 								                    // This uses an async signal safe handler to kill the vcpu handles.
 								                    register_signal_handler(SIGRTMIN(), handle_signal)
 								                        .expect("Failed to register vcpu signal handler");
 								                    // Block until all CPUs are ready.
 								                    vcpu_thread_barrier.wait();
 								                    loop {
 								                        // vcpu.run() returns false on a KVM_EXIT_SHUTDOWN (triple-fault) so trigger a reset
 								                        match vcpu.lock().unwrap().run() {
 								                            Err(e) => {
 								                                error!("VCPU generated error: {:?}", e);
 								                                break;
 								                            }
 								                            Ok(true) => {}
 								                            Ok(false) => {
 								                                reset_evt.write(1).unwrap();
 								                                break;
 								                            }
 								                        }
 								                        // We've been told to terminate
 								                        if vcpu_kill_signalled.load(Ordering::SeqCst)
 								                            || vcpu_kill.load(Ordering::SeqCst)
 								                        {
 								                            break;
 								                        }
 								                        // If we are being told to pause, we park the thread
 								                        // until the pause boolean is toggled.
 								                        // The resume operation is responsible for toggling
 								                        // the boolean and unpark the thread.
 								                        // We enter a loop because park() could spuriously
 								                        // return. We will then park() again unless the
 								                        // pause boolean has been toggled.
 								                        while vcpu_pause_signalled.load(Ordering::SeqCst) {
 								                            thread::park();
 								                        }
 								                    }
 								                })
 								                .map_err(Error::VcpuSpawn)?,
 								        );
 								        // Record the running thread and whether this vCPU is being inserted.
 								        // The caller decides `inserting`: it is expected to be true for
 								        // hotplug additions, which are started without an entry point.
 								        self.vcpu_states[usize::from(cpu_id)].handle = handle;
 								        self.vcpu_states[usize::from(cpu_id)].inserting = inserting;
 								        Ok(())
 								    }
-												pvh: Introduce EntryPoint struct

In order to properly initialize the kvm regs/sregs structs for
the guest, the load_kernel() return type must specify which
boot protocol to use with the entry point address it returns.

Make load_kernel() return an EntryPoint struct containing the
required information. This structure will later be used
in the vCPU configuration methods to setup the appropriate
initial conditions for the guest.

Signed-off-by: Alejandro Jimenez <alejandro.j.jimenez@oracle.com>

											
										
										
											2020-02-12 03:37:33 +00:00
+								    fn activate_vcpus(&mut self, desired_vcpus: u8, entry_point: Option<EntryPoint>) -> Result<()> {
-												vmm: cpu: Refactor vCPU thread starting

Refactor the vCPU thread starting so that there is the possibility to
bring on extra vCPU threads.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 13:06:24 +00:00
+								        if desired_vcpus > self.max_vcpus {
 								            return Err(Error::DesiredVCPUCountExceedsMax);
 								        }
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
-												vmm: cpu: Refactor vCPU thread starting

Refactor the vCPU thread starting so that there is the possibility to
bring on extra vCPU threads.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 13:06:24 +00:00
+								        let creation_ts = std::time::Instant::now();
 								        let vcpu_thread_barrier = Arc::new(Barrier::new(
 								            (desired_vcpus - self.present_vcpus() + 1) as usize,
 								        ));
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
-												vmm: cpu: Refactor vCPU thread starting

Refactor the vCPU thread starting so that there is the possibility to
bring on extra vCPU threads.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 13:06:24 +00:00
+								        for cpu_id in self.present_vcpus()..desired_vcpus {
-												vmm: cpu: Factorize vcpu starting code

Anticipating the need for a slightly different function for restoring
vCPUs, this patch factorizes most of the vCPU creation, so that it can
be reused for migration purposes.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-04-03 12:27:41 +00:00
+								            self.start_vcpu(
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								                cpu_id,
 								                creation_ts,
-												vmm: cpu: Factorize vcpu starting code

Anticipating the need for a slightly different function for restoring
vCPUs, this patch factorizes most of the vCPU creation, so that it can
be reused for migration purposes.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-04-03 12:27:41 +00:00
+								                vcpu_thread_barrier.clone(),
 								                entry_point,
 								                entry_point.is_none(),
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								            )?;
 								        }
 								        // Unblock all CPU threads.
 								        vcpu_thread_barrier.wait();
 								        Ok(())
 								    }
-												vmm: cpu: Notify guest OS that it should offline vCPUs

Allow the resizing of the number of vCPUs to less than the current
active vCPUs. This does not currently remove them from the system but
the kernel will take them offline.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-17 10:49:05 +00:00
+								    fn mark_vcpus_for_removal(&mut self, desired_vcpus: u8) -> Result<()> {
 								        // Flags every vCPU state with an index in `desired_vcpus..present_vcpus()`
 								        // as `removing`. Nothing is torn down here: the actual removal happens
 								        // later, on ejection. Always returns `Ok(())`.
 								        let first = usize::from(desired_vcpus);
 								        let end = usize::from(self.present_vcpus());
 								        (first..end).for_each(|idx| self.vcpu_states[idx].removing = true);
 								        Ok(())
 								    }
-												vmm: cpu: Implement CPU removal

When the running OS has been told that a CPU should be removed it will
shut down the CPU and then signal to the hypervisor, via the "_EJ0" method
on the device (which ultimately writes into an I/O port), that the vCPU
should be shut down. Upon notification the hypervisor signals to the
individual thread that it should shut down and waits for that thread to
end.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-17 11:22:33 +00:00
+								    fn remove_vcpu(&mut self, cpu_id: u8) -> Result<()> {
 								        // Stops the thread backing vCPU `cpu_id`: raise its kill flag, signal the
 								        // thread, wait for it to finish, and finally clear the stored handle.
 								        // An error from joining the thread is propagated to the caller, in which
 								        // case the handle is left untouched.
 								        let idx = usize::from(cpu_id);
 								        let vcpu = &mut self.vcpu_states[idx];
 								        vcpu.kill.store(true, Ordering::SeqCst);
 								        vcpu.signal_thread();
 								        vcpu.join_thread()?;
 								        vcpu.handle = None;
 								        Ok(())
 								    }
-												vmm: cpu: Refactor vCPU thread starting

Refactor the vCPU thread starting so that there is the possibility to
bring on extra vCPU threads.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 13:06:24 +00:00
+								    // Starts all the vCPUs that the VM is booting with. Blocks until all vCPUs are running.
-												pvh: Introduce EntryPoint struct

In order to properly initialize the kvm regs/sregs structs for
the guest, the load_kernel() return type must specify which
boot protocol to use with the entry point address it returns.

Make load_kernel() return an EntryPoint struct containing the
required information. This structure will later be used
in the vCPU configuration methods to setup the appropriate
initial conditions for the guest.

Signed-off-by: Alejandro Jimenez <alejandro.j.jimenez@oracle.com>

											
										
										
											2020-02-12 03:37:33 +00:00
+								    pub fn start_boot_vcpus(&mut self, entry_point: EntryPoint) -> Result<()> {
 								        self.activate_vcpus(self.boot_vcpus(), Some(entry_point))
-												vmm: cpu: Add support for starting more vCPU threads

Add support for starting vCPU threads after the initial boot ones.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 15:56:16 +00:00
+								    }
-												vmm: Only generate GED interrupt when the number of vCPUs has changed

Avoid activity in the guest OS if the number of vCPUs has not
changed.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-01-17 16:48:46 +00:00
+								    pub fn resize(&mut self, desired_vcpus: u8) -> Result<bool> {
-												vmm: cpu: Rewrite if chain using match

Address updated clippy error:

error: `if` chain can be rewritten with `match`
   --> vmm/src/cpu.rs:668:9
    |
668 | /         if desired_vcpus > self.present_vcpus() {
669 | |             self.activate_vcpus(desired_vcpus, None)?;
670 | |         } else if desired_vcpus < self.present_vcpus() {
671 | |             self.mark_vcpus_for_removal(desired_vcpus)?;
672 | |         }
    | |_________^
    |
    = note: `-D clippy::comparison-chain` implied by `-D warnings`
    = help: Consider rewriting the `if` chain to use `cmp` and `match`.
    = help: for further information visit https://rust-lang.github.io/rust-clippy/master/index.html#comparison_chain

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-19 17:08:38 +00:00
+								        match desired_vcpus.cmp(&self.present_vcpus()) {
-												vmm: Only generate GED interrupt when the number of vCPUs has changed

Avoid activity in the guest OS if the number of vCPUs has not
changed.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2020-01-17 16:48:46 +00:00
+								            cmp::Ordering::Greater => self.activate_vcpus(desired_vcpus, None).and(Ok(true)),
 								            cmp::Ordering::Less => self.mark_vcpus_for_removal(desired_vcpus).and(Ok(true)),
 								            _ => Ok(false),
-												vmm: cpu: Notify guest OS that it should offline vCPUs

Allow the resizing of the number of vCPUs to less than the current
active vCPUs. This does not currently remove them from the system but
the kernel will take them offline.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-17 10:49:05 +00:00
+								        }
-												vmm: cpu: Refactor vCPU thread starting

Refactor the vCPU thread starting so that there is the possibility to
bring on extra vCPU threads.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 13:06:24 +00:00
+								    }
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								    pub fn shutdown(&mut self) -> Result<()> {
 								        // Tell the vCPUs to stop themselves next time they go through the loop
 								        self.vcpus_kill_signalled.store(true, Ordering::SeqCst);
 								        // Signal to the spawned threads (vCPUs and console signal handler). For the vCPU threads
 								        // this will interrupt the KVM_RUN ioctl() allowing the loop to check the boolean set
 								        // above.
-												vmm: cpu: Encapsulate vCPU state into its own struct

Currently this just holds the thread handle but will be enlarged to
encompass details such as whether the vCPU is currently being inserted
or ejected.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 11:32:36 +00:00
+								        for state in self.vcpu_states.iter() {
 								            state.signal_thread();
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								        }
-												vmm: cpu: Encapsulate vCPU state into its own struct

Currently this just holds the thread handle but will be enlarged to
encompass details such as whether the vCPU is currently being inserted
or ejected.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 11:32:36 +00:00
+								        // Wait for all the threads to finish. This removes the state from the vector.
 								        for mut state in self.vcpu_states.drain(..) {
 								            state.join_thread()?;
-												vmm: Move CPU management code to its own module

Move CpuManager, Vcpu and related functionality to its own module (and
file) inside the VMM crate

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-11 13:55:50 +00:00
+								        }
 								        Ok(())
 								    }
-												vmm: cpu: Introduce concept of maximum vs boot vCPUs in CpuManager

For now the max vCPUs is the same as the boot vCPUs.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-25 13:55:10 +00:00
+								    pub fn boot_vcpus(&self) -> u8 {
 								        // Number of vCPUs the VM boots with: this is the count passed to
 								        // `activate_vcpus` by `start_boot_vcpus`, and the vCPUs below it are the
 								        // ones marked enabled in the MADT.
 								        self.boot_vcpus
 								    }
 								    /// Returns the maximum number of vCPUs this manager allows. Activation
 								    /// requests above this value are rejected, and the MADT carries one Local
 								    /// APIC entry per vCPU in `0..max_vcpus`.
 								    pub fn max_vcpus(&self) -> u8 {
 								        self.max_vcpus
 								    }
-												vmm: cpu: Encapsulate vCPU state into its own struct

Currently this just holds the thread handle but will be enlarged to
encompass details such as whether the vCPU is currently being inserted
or ejected.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 11:32:36 +00:00
 								    fn present_vcpus(&self) -> u8 {
-												vmm: cpu: Create vCPU state for all possible vCPUs

This will make it more straightforward when we attempt to remove vCPUs.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 17:15:25 +00:00
+								        self.vcpu_states
 								            .iter()
 								            .fold(0, |acc, state| acc + state.active() as u8)
-												vmm: cpu: Encapsulate vCPU state into its own struct

Currently this just holds the thread handle but will be enlarged to
encompass details such as whether the vCPU is currently being inserted
or ejected.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-11-26 11:32:36 +00:00
+								    }
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
 								    #[cfg(feature = "acpi")]
 								    /// Builds the MADT (signature "APIC") ACPI table.
 								    ///
 								    /// The table contains, in order:
 								    /// * one Local APIC entry for every possible vCPU (`0..max_vcpus`), with
 								    ///   the enable flag set only for the vCPUs below `boot_vcpus`;
 								    /// * a single IOAPIC entry located at `layout::IOAPIC_START`;
 								    /// * an interrupt source override mapping bus 0, source 4 to GSI 4.
 								    ///
 								    /// # Panics
 								    ///
 								    /// Panics if `boot_vcpus` exceeds `max_vcpus`.
 								    pub fn create_madt(&self) -> SDT {
 								        // This is also checked in the commandline parsing.
 								        assert!(self.boot_vcpus <= self.max_vcpus);
 								        let mut madt = SDT::new(*b"APIC", 44, 5, *b"CLOUDH", *b"CHMADT  ", 1);
 								        // Offset 36 of the table receives the local APIC start address.
 								        madt.write(36, layout::APIC_START);
 								        for cpu in 0..self.max_vcpus {
 								            let lapic = LocalAPIC {
 								                r#type: 0,
 								                length: 8,
 								                processor_id: cpu,
 								                apic_id: cpu,
 								                // Only boot vCPUs are advertised as enabled; the remaining
 								                // entries describe vCPUs that are not started at boot.
 								                flags: if cpu < self.boot_vcpus {
 								                    1 << MADT_CPU_ENABLE_FLAG
 								                } else {
 								                    0
 								                },
 								            };
 								            madt.append(lapic);
 								        }
 								        madt.append(IOAPIC {
 								            r#type: 1,
 								            length: 12,
 								            ioapic_id: 0,
 								            apic_address: layout::IOAPIC_START.0 as u32,
 								            gsi_base: 0,
 								            ..Default::default()
 								        });
 								        madt.append(InterruptSourceOverride {
 								            r#type: 2,
 								            length: 10,
 								            bus: 0,
 								            source: 4,
 								            gsi: 4,
 								            flags: 0,
 								        });
 								        madt
 								    }
 								}
-												ci: Run clippy for each specific feature

The build is run against "--all-features", "pci,acpi", "pci" and "mmio"
separately. The clippy validation must be run against the same set of
features in order to validate the code is correct.

Because of these new checks, this commit includes multiple fixes
related to the errors generated when manually running the checks.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-01-21 08:32:50 +00:00
+								#[cfg(feature = "acpi")]
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								struct CPU {
 								    // Identifier of the vCPU described by this ACPI processor device. The
 								    // `Aml` impl uses it for the device name ("C" followed by three digits),
 								    // the `_UID`, the argument passed to CSTA/CEJ0, and the LAPIC
 								    // processor/APIC ids embedded in `_MAT`.
 								    cpu_id: u8,
 								}
-												ci: Run clippy for each specific feature

The build is run against "--all-features", "pci,acpi", "pci" and "mmio"
separately. The clippy validation must be run against the same set of
features in order to validate the code is correct.

Because of these new checks, this commit includes multiple fixes
related to the errors generated when manually running the checks.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-01-21 08:32:50 +00:00
+								#[cfg(feature = "acpi")]
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								const MADT_CPU_ENABLE_FLAG: usize = 0; // Bit position of the "enabled" flag in a Local APIC entry's `flags` field.
 								#[cfg(feature = "acpi")]
 								impl Aml for CPU {
 								    fn to_aml_bytes(&self) -> Vec<u8> {
 								        let lapic = LocalAPIC {
 								            r#type: 0,
 								            length: 8,
 								            processor_id: self.cpu_id,
 								            apic_id: self.cpu_id,
 								            flags: 1 << MADT_CPU_ENABLE_FLAG,
 								        };
 								        let mut mat_data: Vec<u8> = Vec::new();
 								        mat_data.resize(std::mem::size_of_val(&lapic), 0);
 								        unsafe { *(mat_data.as_mut_ptr() as *mut LocalAPIC) = lapic };
 								        aml::Device::new(
 								            format!("C{:03}", self.cpu_id).as_str().into(),
 								            vec![
 								                &aml::Name::new("_HID".into(), &"ACPI0007"),
 								                &aml::Name::new("_UID".into(), &self.cpu_id),
 								                /*
 								                _STA return value:
 								                Bit [0] – Set if the device is present.
 								                Bit [1] – Set if the device is enabled and decoding its resources.
 								                Bit [2] – Set if the device should be shown in the UI.
 								                Bit [3] – Set if the device is functioning properly (cleared if device failed its diagnostics).
 								                Bit [4] – Set if the battery is present.
 								                Bits [31:5] – Reserved (must be cleared).
 								                */
 								                &aml::Method::new(
 								                    "_STA".into(),
 ,
 								                    false,
 								                    // Call into CSTA method which will interrogate device
 								                    vec![&aml::Return::new(&aml::MethodCall::new(
 								                        "CSTA".into(),
 								                        vec![&self.cpu_id],
 								                    ))],
 								                ),
 								                // The Linux kernel expects every CPU device to have a _MAT entry
 								                // containing the LAPIC for this processor with the enabled bit set
 								                // even it if is disabled in the MADT (non-boot CPU)
 								                &aml::Name::new("_MAT".into(), &aml::Buffer::new(mat_data)),
-												vmm: cpu: Implement CPU removal

When the running OS has been told that a CPU should be removed it will
shut down the CPU and then signal to the hypervisor, via the "_EJ0" method
on the device (which ultimately writes into an I/O port), that the vCPU
should be shut down. Upon notification the hypervisor signals to the
individual thread that it should shut down and waits for that thread to
end.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-17 11:22:33 +00:00
+								                // Trigger CPU ejection
 								                &aml::Method::new(
 								                    "_EJ0".into(),
 ,
 								                    false,
 								                    // Call into CEJ0 method which will actually eject device
 								                    vec![&aml::Return::new(&aml::MethodCall::new(
 								                        "CEJ0".into(),
 								                        vec![&self.cpu_id],
 								                    ))],
 								                ),
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								            ],
 								        )
 								        .to_aml_bytes()
 								    }
 								}
-												ci: Run clippy for each specific feature

The build is run against "--all-features", "pci,acpi", "pci" and "mmio"
separately. The clippy validation must be run against the same set of
features in order to validate the code is correct.

Because of these new checks, this commit includes multiple fixes
related to the errors generated when manually running the checks.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-01-21 08:32:50 +00:00
+								#[cfg(feature = "acpi")]
-												vmm: acpi: Refactor ACPI CPU notification

Continue to notify on all vCPUs but instead separate the notification
functionality into two methods, CSCN that walks through all the CPUs
and CTFY which notifies based on the numerical CPU id. This is an
interim step towards only notifying on changed CPUs and ultimately CPU
removal.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:09:24 +00:00
+								struct CPUNotify {
 								    // vCPU this fragment targets: the generated AML compares the method's
 								    // first argument against this id and, on a match, notifies the matching
 								    // "Cnnn" device with the method's second argument.
 								    cpu_id: u8,
 								}
 								#[cfg(feature = "acpi")]
 								impl Aml for CPUNotify {
 								    // Emits `If (Arg0 == cpu_id) { Notify(Cnnn, Arg1) }`, where `Cnnn` is the
 								    // device path built from the zero-padded, three-digit vCPU id.
 								    fn to_aml_bytes(&self) -> Vec<u8> {
 								        let device_name = format!("C{:03}", self.cpu_id);
 								        let device = aml::Path::new(&device_name);
 								        let selected_cpu = aml::Arg(0);
 								        let event = aml::Arg(1);
 								        let is_this_cpu = aml::Equal::new(&selected_cpu, &self.cpu_id);
 								        let notify = aml::Notify::new(&device, &event);
 								        aml::If::new(&is_this_cpu, vec![&notify]).to_aml_bytes()
 								    }
 								}
-												ci: Run clippy for each specific feature

The build is run against "--all-features", "pci,acpi", "pci" and "mmio"
separately. The clippy validation must be run against the same set of
features in order to validate the code is correct.

Because of these new checks, this commit includes multiple fixes
related to the errors generated when manually running the checks.

Signed-off-by: Sebastien Boeuf <sebastien.boeuf@intel.com>

											
										
										
											2020-01-21 08:32:50 +00:00
+								#[cfg(feature = "acpi")]
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								struct CPUMethods {
 								    // Number of vCPU slots the generated methods cover: CTFY receives one
 								    // `CPUNotify` per id in `0..max_vcpus`, and the CSCN scan loop runs while
 								    // its counter is below this value.
 								    max_vcpus: u8,
 								}
 								#[cfg(feature = "acpi")]
 								impl Aml for CPUMethods {
 								    fn to_aml_bytes(&self) -> Vec<u8> {
 								        let mut bytes = Vec::new();
 								        bytes.extend_from_slice(
 								            // CPU status method
 								            &aml::Method::new(
 								                "CSTA".into(),
 ,
 								                true,
 								                vec![
 								                    // Take lock defined above
 								                    &aml::Acquire::new("\\_SB_.PRES.CPLK".into(), 0xfff),
-												Revert "vmm: Move CpuManager device to MMIO region"

This reverts commit 980e03fa0ab3d217fe91fd60d8459507c903d88b.

											
										
										
											2020-01-24 10:36:39 +00:00
+								                    // Write CPU number (in first argument) to I/O port via field
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								                    &aml::Store::new(&aml::Path::new("\\_SB_.PRES.CSEL"), &aml::Arg(0)),
 								                    &aml::Store::new(&aml::Local(0), &aml::ZERO),
 								                    // Check if CPEN bit is set, if so make the local variable 0xf (see _STA for details of meaning)
 								                    &aml::If::new(
 								                        &aml::Equal::new(&aml::Path::new("\\_SB_.PRES.CPEN"), &aml::ONE),
 								                        vec![&aml::Store::new(&aml::Local(0), &0xfu8)],
 								                    ),
 								                    // Release lock
 								                    &aml::Release::new("\\_SB_.PRES.CPLK".into()),
 								                    // Return 0 or 0xf
 								                    &aml::Return::new(&aml::Local(0)),
 								                ],
 								            )
 								            .to_aml_bytes(),
 								        );
-												vmm: acpi: Refactor ACPI CPU notification

Continue to notify on all vCPUs but instead separate the notification
functionality into two methods, CSCN that walks through all the CPUs
and CTFY which notifies based on the numerical CPU id. This is an
interim step towards only notifying on changed CPUs and ultimately CPU
removal.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:09:24 +00:00
+								        let mut cpu_notifies = Vec::new();
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								        for cpu_id in 0..self.max_vcpus {
-												vmm: acpi: Refactor ACPI CPU notification

Continue to notify on all vCPUs but instead separate the notification
functionality into two methods, CSCN that walks through all the CPUs
and CTFY which notifies based on the numerical CPU id. This is an
interim step towards only notifying on changed CPUs and ultimately CPU
removal.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:09:24 +00:00
+								            cpu_notifies.push(CPUNotify { cpu_id });
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								        }
-												vmm: acpi: Refactor ACPI CPU notification

Continue to notify on all vCPUs but instead separate the notification
functionality into two methods, CSCN that walks through all the CPUs
and CTFY which notifies based on the numerical CPU id. This is an
interim step towards only notifying on changed CPUs and ultimately CPU
removal.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:09:24 +00:00
+								        let mut cpu_notifies_refs: Vec<&dyn aml::Aml> = Vec::new();
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								        for cpu_id in 0..self.max_vcpus {
-												vmm: acpi: Refactor ACPI CPU notification

Continue to notify on all vCPUs but instead separate the notification
functionality into two methods, CSCN that walks through all the CPUs
and CTFY which notifies based on the numerical CPU id. This is an
interim step towards only notifying on changed CPUs and ultimately CPU
removal.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:09:24 +00:00
+								            cpu_notifies_refs.push(&cpu_notifies[usize::from(cpu_id)]);
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								        }
-												vmm: acpi: Refactor ACPI CPU notification

Continue to notify on all vCPUs but instead separate the notification
functionality into two methods, CSCN that walks through all the CPUs
and CTFY which notifies based on the numerical CPU id. This is an
interim step towards only notifying on changed CPUs and ultimately CPU
removal.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:09:24 +00:00
+								        bytes.extend_from_slice(
 								            &aml::Method::new("CTFY".into(), 2, true, cpu_notifies_refs).to_aml_bytes(),
 								        );
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
-												vmm: cpu: Implement CPU removal

When the running OS has been told that a CPU should be removed it will
shut down the CPU and then signal to the hypervisor, via the "_EJ0" method
on the device (which ultimately writes into an I/O port), that the vCPU
should be shut down. Upon notification the hypervisor signals to the
individual thread that it should shut down and waits for that thread to
end.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-17 11:22:33 +00:00
+								        bytes.extend_from_slice(
 								            &aml::Method::new(
 								                "CEJ0".into(),
 ,
 								                true,
 								                vec![
 								                    &aml::Acquire::new("\\_SB_.PRES.CPLK".into(), 0xfff),
-												Revert "vmm: Move CpuManager device to MMIO region"

This reverts commit 980e03fa0ab3d217fe91fd60d8459507c903d88b.

											
										
										
											2020-01-24 10:36:39 +00:00
+								                    // Write CPU number (in first argument) to I/O port via field
-												vmm: cpu: Implement CPU removal

When the running OS has been told that a CPU should be removed it will
shut down the CPU and then signal to the hypervisor, via the "_EJ0" method
on the device (which ultimately writes into an I/O port), that the vCPU
should be shut down. Upon notification the hypervisor signals to the
individual thread that it should shut down and waits for that thread to
end.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-17 11:22:33 +00:00
+								                    &aml::Store::new(&aml::Path::new("\\_SB_.PRES.CSEL"), &aml::Arg(0)),
 								                    // Set CEJ0 bit
 								                    &aml::Store::new(&aml::Path::new("\\_SB_.PRES.CEJ0"), &aml::ONE),
 								                    &aml::Release::new("\\_SB_.PRES.CPLK".into()),
 								                ],
 								            )
 								            .to_aml_bytes(),
 								        );
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								        bytes.extend_from_slice(
-												vmm: acpi: Refactor ACPI CPU notification

Continue to notify on all vCPUs but instead separate the notification
functionality into two methods, CSCN that walks through all the CPUs
and CTFY which notifies based on the numerical CPU id. This is an
interim step towards only notifying on changed CPUs and ultimately CPU
removal.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:09:24 +00:00
+								            &aml::Method::new(
 								                "CSCN".into(),
 ,
 								                true,
 								                vec![
-												vmm: cpu: Only do ACPI notify on newly added vCPUs

When we add a vCPU set an "inserting" boolean that is exposed as an ACPI
field that will be checked for and reset when the ACPI GED notification
for CPU devices happens.

This change is a precursor for CPU unplug.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:42:29 +00:00
+								                    // Take lock defined above
 								                    &aml::Acquire::new("\\_SB_.PRES.CPLK".into(), 0xfff),
-												vmm: acpi: Refactor ACPI CPU notification

Continue to notify on all vCPUs but instead separate the notification
functionality into two methods, CSCN that walks through all the CPUs
and CTFY which notifies based on the numerical CPU id. This is an
interim step towards only notifying on changed CPUs and ultimately CPU
removal.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:09:24 +00:00
+								                    &aml::Store::new(&aml::Local(0), &aml::ZERO),
 								                    &aml::While::new(
 								                        &aml::LessThan::new(&aml::Local(0), &self.max_vcpus),
 								                        vec![
-												Revert "vmm: Move CpuManager device to MMIO region"

This reverts commit 980e03fa0ab3d217fe91fd60d8459507c903d88b.

											
										
										
											2020-01-24 10:36:39 +00:00
+								                            // Write CPU number (in first argument) to I/O port via field
-												vmm: cpu: Only do ACPI notify on newly added vCPUs

When we add a vCPU set an "inserting" boolean that is exposed as an ACPI
field that will be checked for and reset when the ACPI GED notification
for CPU devices happens.

This change is a precursor for CPU unplug.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:42:29 +00:00
+								                            &aml::Store::new(&aml::Path::new("\\_SB_.PRES.CSEL"), &aml::Local(0)),
 								                            // Check if CINS bit is set
 								                            &aml::If::new(
 								                                &aml::Equal::new(&aml::Path::new("\\_SB_.PRES.CINS"), &aml::ONE),
 								                                // Notify device if it is
 								                                vec![
 								                                    &aml::MethodCall::new(
 								                                        "CTFY".into(),
 								                                        vec![&aml::Local(0), &aml::ONE],
 								                                    ),
 								                                    // Reset CINS bit
 								                                    &aml::Store::new(
 								                                        &aml::Path::new("\\_SB_.PRES.CINS"),
 								                                        &aml::ONE,
 								                                    ),
 								                                ],
 								                            ),
-												vmm: cpu: Notify guest OS that it should offline vCPUs

Allow the resizing of the number of vCPUs to less than the current
active vCPUs. This does not currently remove them from the system but
the kernel will take them offline.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-17 10:49:05 +00:00
+								                            // Check if CRMV bit is set
 								                            &aml::If::new(
 								                                &aml::Equal::new(&aml::Path::new("\\_SB_.PRES.CRMV"), &aml::ONE),
 								                                // Notify device if it is (with the eject constant 0x3)
 								                                vec![
 								                                    &aml::MethodCall::new(
 								                                        "CTFY".into(),
 								                                        vec![&aml::Local(0), &3u8],
 								                                    ),
 								                                    // Reset CRMV bit
 								                                    &aml::Store::new(
 								                                        &aml::Path::new("\\_SB_.PRES.CRMV"),
 								                                        &aml::ONE,
 								                                    ),
 								                                ],
 								                            ),
-												vmm: acpi: Refactor ACPI CPU notification

Continue to notify on all vCPUs but instead separate the notification
functionality into two methods, CSCN that walks through all the CPUs
and CTFY which notifies based on the numerical CPU id. This is an
interim step towards only notifying on changed CPUs and ultimately CPU
removal.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:09:24 +00:00
+								                            &aml::Add::new(&aml::Local(0), &aml::Local(0), &aml::ONE),
 								                        ],
 								                    ),
-												vmm: cpu: Only do ACPI notify on newly added vCPUs

When we add a vCPU set an "inserting" boolean that is exposed as an ACPI
field that will be checked for and reset when the ACPI GED notification
for CPU devices happens.

This change is a precursor for CPU unplug.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:42:29 +00:00
+								                    // Release lock
 								                    &aml::Release::new("\\_SB_.PRES.CPLK".into()),
-												vmm: acpi: Refactor ACPI CPU notification

Continue to notify on all vCPUs but instead separate the notification
functionality into two methods, CSCN that walks through all the CPUs
and CTFY which notifies based on the numerical CPU id. This is an
interim step towards only notifying on changed CPUs and ultimately CPU
removal.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-16 16:09:24 +00:00
+								                ],
 								            )
 								            .to_aml_bytes(),
-												vmm: Delegate CPU related ACPI tables to CpuManager

Move the code for generating the MADT (APIC) table and the DSDT
generation for CPU related functionality into the CpuManager.

There is no functional change, just code rearrangement.

Signed-off-by: Rob Bradford <robert.bradford@intel.com>

											
										
										
											2019-12-06 15:25:57 +00:00
+								        );
 								        bytes
 								    }
 								}
 								#[cfg(feature = "acpi")]
 								impl Aml for CpuManager {
 								    /// Builds the AML for the CPU hotplug controller and the CPU container.
 								    ///
 								    /// Two devices are appended to the returned byte vector, in this order:
 								    ///
 								    /// * `_SB_.PRES`: the hotplug controller. It declares the `CPLK` mutex,
 								    ///   an I/O port resource at `0x0cd8` (length `0x0c`), and the `PRST`
 								    ///   operation region over those ports together with its named fields.
 								    /// * `_SB_.CPUS`: holds the `_HID`/`_CID` names, the shared `CPUMethods`
 								    ///   object and one `CPU` object for every id in `0..max_vcpus`.
 								    fn to_aml_bytes(&self) -> Vec<u8> {
 								        let mut bytes = Vec::new();
 								        // CPU hotplug controller
 								        bytes.extend_from_slice(
 								            &aml::Device::new(
 								                "_SB_.PRES".into(),
 								                vec![
 								                    &aml::Name::new("_HID".into(), &aml::EISAName::new("PNP0A06")),
 								                    // Mutex to protect concurrent access as we write to choose CPU and then read back status
 								                    &aml::Mutex::new("CPLK".into(), 0),
 								                    // I/O port for CPU controller
 								                    &aml::Name::new(
 								                        "_CRS".into(),
 								                        &aml::ResourceTemplate::new(vec![&aml::IO::new(
 								                            0x0cd8, 0x0cd8, 0x01, 0x0c,
 								                        )]),
 								                    ),
 								                    // OpRegion and Fields map I/O port into individual field values
 								                    &aml::OpRegion::new("PRST".into(), aml::OpRegionSpace::SystemIO, 0x0cd8, 0x0c),
 								                    // Byte-wide view of PRST: skip the first 32 bits (exposed as CSEL by
 								                    // the DWord view below), then four one-bit flags, four reserved
 								                    // bits and the 8-bit CCMD field.
 								                    &aml::Field::new(
 								                        "PRST".into(),
 								                        aml::FieldAccessType::Byte,
 								                        aml::FieldUpdateRule::WriteAsZeroes,
 								                        vec![
 								                            aml::FieldEntry::Reserved(32),
 								                            aml::FieldEntry::Named(*b"CPEN", 1),
 								                            aml::FieldEntry::Named(*b"CINS", 1),
 								                            aml::FieldEntry::Named(*b"CRMV", 1),
 								                            aml::FieldEntry::Named(*b"CEJ0", 1),
 								                            aml::FieldEntry::Reserved(4),
 								                            aml::FieldEntry::Named(*b"CCMD", 8),
 								                        ],
 								                    ),
 								                    // DWord-wide view of the same region: CSEL in the first 32 bits,
 								                    // 32 reserved bits, then the 32-bit CDAT field.
 								                    &aml::Field::new(
 								                        "PRST".into(),
 								                        aml::FieldAccessType::DWord,
 								                        aml::FieldUpdateRule::Preserve,
 								                        vec![
 								                            aml::FieldEntry::Named(*b"CSEL", 32),
 								                            aml::FieldEntry::Reserved(32),
 								                            aml::FieldEntry::Named(*b"CDAT", 32),
 								                        ],
 								                    ),
 								                ],
 								            )
 								            .to_aml_bytes(),
 								        );
 								        // CPU devices
 								        let hid = aml::Name::new("_HID".into(), &"ACPI0010");
 								        let cid = aml::Name::new("_CID".into(), &aml::EISAName::new("PNP0A05"));
 								        // Bundle methods together under a common object
 								        let methods = CPUMethods {
 								            max_vcpus: self.max_vcpus,
 								        };
 								        // One CPU object per possible vCPU id. The objects are owned by this
 								        // vector so that the device's child list below can borrow them.
 								        let cpu_devices: Vec<CPU> = (0..self.max_vcpus)
 								            .map(|cpu_id| CPU { cpu_id })
 								            .collect();
 								        let mut cpu_data_inner: Vec<&dyn aml::Aml> = vec![&hid, &cid, &methods];
 								        for cpu_device in cpu_devices.iter() {
 								            cpu_data_inner.push(cpu_device);
 								        }
 								        bytes.extend_from_slice(
 								            &aml::Device::new("_SB_.CPUS".into(), cpu_data_inner).to_aml_bytes(),
 								        );
 								        bytes
 								    }
 								}
-												vmm: cpu_manager: Implement the Pausable trait

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2019-11-21 18:04:08 +00:00
 								impl Pausable for CpuManager {
 								    /// Asks every vCPU to pause.
 								    ///
 								    /// Raises the shared pause flag and then signals each thread tracked in
 								    /// `vcpu_states`. Always returns `Ok(())`.
 								    fn pause(&mut self) -> std::result::Result<(), MigratableError> {
 								        // Raise the flag first so that a thread woken by the signal below
 								        // already observes it.
 								        self.vcpus_pause_signalled.store(true, Ordering::SeqCst);
 								        // Poke the spawned threads (vCPUs and console signal handler). For a
 								        // vCPU thread the signal interrupts the KVM_RUN ioctl(), which lets
 								        // its loop check the flag raised above.
 								        self.vcpu_states.iter().for_each(|vcpu_state| {
 								            vcpu_state.signal_thread();
 								        });
 								        Ok(())
 								    }
 								    /// Lets paused vCPUs run again.
 								    ///
 								    /// Clears the shared pause flag and then unparks each thread tracked in
 								    /// `vcpu_states`. Always returns `Ok(())`.
 								    fn resume(&mut self) -> std::result::Result<(), MigratableError> {
 								        // Clear the pause flag before waking anyone up.
 								        self.vcpus_pause_signalled.store(false, Ordering::SeqCst);
 								        // Wake every vCPU thread. The first thing a woken thread does is
 								        // re-check the pause flag; as it is now false the thread leaves its
 								        // pause loop and carries on running.
 								        self.vcpu_states.iter().for_each(|vcpu_state| {
 								            vcpu_state.unpark_thread();
 								        });
 								        Ok(())
 								    }
 								}
-												vm-migration: Define the Snapshottable and Transportable traits

A Snapshottable component can snapshot itself and
provide a MigrationSnapshot payload as a result.

A MigrationSnapshot payload is a map of component IDs to a list of
migration sections (MigrationSection). As a component can be made of
several Migratable sub-components (e.g. the DeviceManager and its
device objects), a migration snapshot can itself be made of multiple
snapshots.
A snapshot is a list of migration sections, each section being a
component state snapshot. Having multiple sections allows for easier and
backward compatible migration payload extensions.

Once created, a migratable component snapshot may be transported and this
is what the Transportable trait defines, through 2 methods: send and recv.

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>
Signed-off-by: Yi Sun <yi.y.sun@linux.intel.com>

											
										
										
											2019-05-01 16:59:51 +00:00
 								// Both impls are empty: CpuManager overrides nothing from Snapshottable or
 								// Transportable here, so only whatever defaults those traits provide apply.
+								impl Snapshottable for CpuManager {}
 								impl Transportable for CpuManager {}
-												vmm: cpu_manager: Implement the Pausable trait

Signed-off-by: Samuel Ortiz <sameo@linux.intel.com>

											
										
										
											2019-11-21 18:04:08 +00:00
 								// Empty impl: no Migratable items are overridden for CpuManager.
+								impl Migratable for CpuManager {}