mirror of
https://github.com/cloud-hypervisor/cloud-hypervisor.git
synced 2024-11-05 03:21:13 +00:00
d57c49664f
Remove requirement for CpuManager to lock the Vcpu when starting the vCPU as the numerical id corresponds to the index in the the vector. This avoids a potential lock inversion between the Vcpu and CpuManager. WARNING: ThreadSanitizer: lock-order-inversion (potential deadlock) (pid=30497) Cycle in lock order graph: M48 (0x7b0c00001aa0) => M121 (0x7b0c000022b0) => M48 Mutex M121 acquired here while holding mutex M48 in thread T1: #0 pthread_mutex_lock /rustc/llvm/src/llvm-project/compiler-rt/lib/tsan/../sanitizer_common/sanitizer_common_interceptors.inc:4249:3 (cloud-hypervisor+0x9c368) #1 std::sys::unix::mutex::Mutex:🔒:hcd1b9aa06ff775d3 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/sys/unix/mutex.rs:63:17 (cloud-hypervisor+0x662ff4) #2 std::sys_common::mutex::MovableMutex::raw_lock::hff98d0b036469bca /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/sys_common/mutex.rs:76:18 (cloud-hypervisor+0x4915de) #3 std::sync::mutex::Mutex$LT$T$GT$:🔒:h14cfa3c8f5ba878a /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/sync/mutex.rs:267:13 (cloud-hypervisor+0x36ca3b) #4 vmm::cpu::CpuManager::start_vcpu::h290fdbb4b7124ec5 /home/rob/src/cloud-hypervisor/vmm/src/cpu.rs:710:22 (cloud-hypervisor+0x375023) #5 vmm::cpu::CpuManager::activate_vcpus::h2eab380826588391 /home/rob/src/cloud-hypervisor/vmm/src/cpu.rs:902:13 (cloud-hypervisor+0x376b7b) #6 vmm::cpu::CpuManager::start_boot_vcpus::hd80cafe6aa4e8279 /home/rob/src/cloud-hypervisor/vmm/src/cpu.rs:937:9 (cloud-hypervisor+0x3773af) #7 vmm::vm::Vm:👢:hc2ca6b16f996267b /home/rob/src/cloud-hypervisor/vmm/src/vm.rs:2063:9 (cloud-hypervisor+0x343d57) #8 vmm::Vmm::vm_boot::h06bdf54b95d5e14f /home/rob/src/cloud-hypervisor/vmm/src/lib.rs:397:13 (cloud-hypervisor+0x2e5f45) #9 vmm::Vmm::control_loop::h40c9b48c7b800bed /home/rob/src/cloud-hypervisor/vmm/src/lib.rs:1299:48 (cloud-hypervisor+0x2f44e0) #10 vmm::start_vmm_thread::_$u7b$$u7b$closure$u7d$$u7d$::h016d2f7cff698175 /home/rob/src/cloud-hypervisor/vmm/src/lib.rs:263:17 (cloud-hypervisor+0x1ddae0) #11 std::sys_common::backtrace::__rust_begin_short_backtrace::h7fd2df3e7cfba503 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/sys_common/backtrace.rs:123:18 (cloud-hypervisor+0x65926a) #12 std:🧵:Builder::spawn_unchecked::_$u7b$$u7b$closure$u7d$$u7d$::_$u7b$$u7b$closure$u7d$$u7d$::h89880b05fe892d7e /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/thread/mod.rs:477:17 (cloud-hypervisor+0x440a3e) #13 _$LT$core..panic..unwind_safe..AssertUnwindSafe$LT$F$GT$$u20$as$u20$core..ops..function..FnOnce$LT$$LP$$RP$$GT$$GT$::call_once::h487382524d80571f /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/core/src/panic/unwind_safe.rs:271:9 (cloud-hypervisor+0x6dd0fe) #14 std::panicking::try::do_call::h1d9c2ccdc39f3322 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/panicking.rs:406:40 (cloud-hypervisor+0x6d2d71) #15 __rust_try 3hkmq3dzyyv5ejsx (cloud-hypervisor+0x6d3db8) #16 std::panicking::try::h251306df23d21913 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/panicking.rs:370:19 (cloud-hypervisor+0x6d1af9) #17 std::panic::catch_unwind::h2a9ac2fb12c3c64e /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/panic.rs:133:14 (cloud-hypervisor+0x57b75e) #18 std:🧵:Builder::spawn_unchecked::_$u7b$$u7b$closure$u7d$$u7d$::h10f4c340611b55e4 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/thread/mod.rs:476:30 (cloud-hypervisor+0x43f343) #19 core::ops::function::FnOnce::call_once$u7b$$u7b$vtable.shim$u7d$$u7d$::hdd9b37241caf97b3 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/core/src/ops/function.rs:227:5 (cloud-hypervisor+0x3cef45) #20 _$LT$alloc..boxed..Box$LT$F$C$A$GT$$u20$as$u20$core..ops..function..FnOnce$LT$Args$GT$$GT$::call_once::ha5022a6bb7833f62 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/alloc/src/boxed.rs:1854:9 (cloud-hypervisor+0x119d692) #21 _$LT$alloc..boxed..Box$LT$F$C$A$GT$$u20$as$u20$core..ops..function..FnOnce$LT$Args$GT$$GT$::call_once::h481697829cbc6746 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/alloc/src/boxed.rs:1854:9 (cloud-hypervisor+0x119d692) #22 std::sys::unix:🧵:Thread:🆕:thread_start::h6fad62c4c393bbe7 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/sys/unix/thread.rs:108:17 (cloud-hypervisor+0x119d692) Mutex M48 previously acquired by the same thread here: #0 pthread_mutex_lock /rustc/llvm/src/llvm-project/compiler-rt/lib/tsan/../sanitizer_common/sanitizer_common_interceptors.inc:4249:3 (cloud-hypervisor+0x9c368) #1 std::sys::unix::mutex::Mutex:🔒:hcd1b9aa06ff775d3 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/sys/unix/mutex.rs:63:17 (cloud-hypervisor+0x662ff4) #2 std::sys_common::mutex::MovableMutex::raw_lock::hff98d0b036469bca /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/sys_common/mutex.rs:76:18 (cloud-hypervisor+0x4915de) #3 std::sync::mutex::Mutex$LT$T$GT$:🔒:hecf671add5fe1762 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/sync/mutex.rs:267:13 (cloud-hypervisor+0x36d1cb) #4 vmm::vm::Vm:👢:hc2ca6b16f996267b /home/rob/src/cloud-hypervisor/vmm/src/vm.rs:2063:9 (cloud-hypervisor+0x343cd1) #5 vmm::Vmm::vm_boot::h06bdf54b95d5e14f /home/rob/src/cloud-hypervisor/vmm/src/lib.rs:397:13 (cloud-hypervisor+0x2e5f45) #6 vmm::Vmm::control_loop::h40c9b48c7b800bed /home/rob/src/cloud-hypervisor/vmm/src/lib.rs:1299:48 (cloud-hypervisor+0x2f44e0) #7 vmm::start_vmm_thread::_$u7b$$u7b$closure$u7d$$u7d$::h016d2f7cff698175 /home/rob/src/cloud-hypervisor/vmm/src/lib.rs:263:17 (cloud-hypervisor+0x1ddae0) #8 std::sys_common::backtrace::__rust_begin_short_backtrace::h7fd2df3e7cfba503 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/sys_common/backtrace.rs:123:18 (cloud-hypervisor+0x65926a) #9 std:🧵:Builder::spawn_unchecked::_$u7b$$u7b$closure$u7d$$u7d$::_$u7b$$u7b$closure$u7d$$u7d$::h89880b05fe892d7e /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/thread/mod.rs:477:17 (cloud-hypervisor+0x440a3e) #10 _$LT$core..panic..unwind_safe..AssertUnwindSafe$LT$F$GT$$u20$as$u20$core..ops..function..FnOnce$LT$$LP$$RP$$GT$$GT$::call_once::h487382524d80571f /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/core/src/panic/unwind_safe.rs:271:9 (cloud-hypervisor+0x6dd0fe) #11 std::panicking::try::do_call::h1d9c2ccdc39f3322 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/panicking.rs:406:40 (cloud-hypervisor+0x6d2d71) #12 __rust_try 3hkmq3dzyyv5ejsx (cloud-hypervisor+0x6d3db8) #13 std::panicking::try::h251306df23d21913 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/panicking.rs:370:19 (cloud-hypervisor+0x6d1af9) #14 std::panic::catch_unwind::h2a9ac2fb12c3c64e /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/panic.rs:133:14 (cloud-hypervisor+0x57b75e) #15 std:🧵:Builder::spawn_unchecked::_$u7b$$u7b$closure$u7d$$u7d$::h10f4c340611b55e4 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/thread/mod.rs:476:30 (cloud-hypervisor+0x43f343) #16 core::ops::function::FnOnce::call_once$u7b$$u7b$vtable.shim$u7d$$u7d$::hdd9b37241caf97b3 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/core/src/ops/function.rs:227:5 (cloud-hypervisor+0x3cef45) #17 _$LT$alloc..boxed..Box$LT$F$C$A$GT$$u20$as$u20$core..ops..function..FnOnce$LT$Args$GT$$GT$::call_once::ha5022a6bb7833f62 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/alloc/src/boxed.rs:1854:9 (cloud-hypervisor+0x119d692) #18 _$LT$alloc..boxed..Box$LT$F$C$A$GT$$u20$as$u20$core..ops..function..FnOnce$LT$Args$GT$$GT$::call_once::h481697829cbc6746 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/alloc/src/boxed.rs:1854:9 (cloud-hypervisor+0x119d692) #19 std::sys::unix:🧵:Thread:🆕:thread_start::h6fad62c4c393bbe7 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/sys/unix/thread.rs:108:17 (cloud-hypervisor+0x119d692) Mutex M48 acquired here while holding mutex M121 in thread T4: #0 pthread_mutex_lock /rustc/llvm/src/llvm-project/compiler-rt/lib/tsan/../sanitizer_common/sanitizer_common_interceptors.inc:4249:3 (cloud-hypervisor+0x9c368) #1 std::sys::unix::mutex::Mutex:🔒:h967991d72ceb6eb0 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/sys/unix/mutex.rs:63:17 (cloud-hypervisor+0xd94df4) #2 std::sys_common::mutex::MovableMutex::raw_lock::h8779639163126a21 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/sys_common/mutex.rs:76:18 (cloud-hypervisor+0xd90cce) #3 std::sync::mutex::Mutex$LT$T$GT$:🔒:hd85239d207beb12f /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/sync/mutex.rs:267:13 (cloud-hypervisor+0xd6e9ba) #4 vm_device:🚌:Bus::write::hf20f991e71af3199 /home/rob/src/cloud-hypervisor/vm-device/src/bus.rs:235:16 (cloud-hypervisor+0xd8dd2d) #5 _$LT$vmm..vm..VmOps$u20$as$u20$hypervisor..vm..VmmOps$GT$::mmio_write::hc759194aaebc7399 /home/rob/src/cloud-hypervisor/vmm/src/vm.rs:424:15 (cloud-hypervisor+0x32db5f) #6 _$LT$hypervisor..kvm..KvmVcpu$u20$as$u20$hypervisor..cpu..Vcpu$GT$::run::h94762dfba6642fb2 /home/rob/src/cloud-hypervisor/hypervisor/src/kvm/mod.rs:1003:32 (cloud-hypervisor+0xcc3ed8) #7 vmm::cpu::Vcpu::run::hd5cf042157f95bea /home/rob/src/cloud-hypervisor/vmm/src/cpu.rs:327:9 (cloud-hypervisor+0x370234) #8 vmm::cpu::CpuManager::start_vcpu::_$u7b$$u7b$closure$u7d$$u7d$::_$u7b$$u7b$closure$u7d$$u7d$::h37e4dd8619b3a5e5 /home/rob/src/cloud-hypervisor/vmm/src/cpu.rs:813:35 (cloud-hypervisor+0x47785b) #9 std::panicking::try::do_call::h093e4d1434150d77 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/panicking.rs:406:40 (cloud-hypervisor+0x6d2aea) #10 __rust_try 3hkmq3dzyyv5ejsx (cloud-hypervisor+0x6d3db8) #11 std::panicking::try::hee9535cb997282b4 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/panicking.rs:370:19 (cloud-hypervisor+0x6d268f) #12 std::panic::catch_unwind::he3908c4d08a8a028 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/panic.rs:133:14 (cloud-hypervisor+0x57baf9) #13 vmm::cpu::CpuManager::start_vcpu::_$u7b$$u7b$closure$u7d$$u7d$::h29472aaa3a600231 /home/rob/src/cloud-hypervisor/vmm/src/cpu.rs:782:21 (cloud-hypervisor+0x477156) #14 std::sys_common::backtrace::__rust_begin_short_backtrace::hcfc2f02361c98808 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/sys_common/backtrace.rs:123:18 (cloud-hypervisor+0x65932b) #15 std:🧵:Builder::spawn_unchecked::_$u7b$$u7b$closure$u7d$$u7d$::_$u7b$$u7b$closure$u7d$$u7d$::h08b82db41d7af2f2 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/thread/mod.rs:477:17 (cloud-hypervisor+0x4408ef) #16 _$LT$core..panic..unwind_safe..AssertUnwindSafe$LT$F$GT$$u20$as$u20$core..ops..function..FnOnce$LT$$LP$$RP$$GT$$GT$::call_once::h7ebad9d94e64fa5f /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/core/src/panic/unwind_safe.rs:271:9 (cloud-hypervisor+0x6dd1df) #17 std::panicking::try::do_call::h121fafbdf5cf84af /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/panicking.rs:406:40 (cloud-hypervisor+0x6d2b81) #18 __rust_try 3hkmq3dzyyv5ejsx (cloud-hypervisor+0x6d3db8) #19 std::panicking::try::h79e25f019cd90522 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/panicking.rs:370:19 (cloud-hypervisor+0x6d1e1f) #20 std::panic::catch_unwind::h5a0619a53bbd611d /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/panic.rs:133:14 (cloud-hypervisor+0x57b8ff) #21 std:🧵:Builder::spawn_unchecked::_$u7b$$u7b$closure$u7d$$u7d$::h1cfd689c9d362e48 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/thread/mod.rs:476:30 (cloud-hypervisor+0x43fafb) #22 core::ops::function::FnOnce::call_once$u7b$$u7b$vtable.shim$u7d$$u7d$::h6642b1b3a2289640 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/core/src/ops/function.rs:227:5 (cloud-hypervisor+0x3ced55) #23 _$LT$alloc..boxed..Box$LT$F$C$A$GT$$u20$as$u20$core..ops..function..FnOnce$LT$Args$GT$$GT$::call_once::ha5022a6bb7833f62 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/alloc/src/boxed.rs:1854:9 (cloud-hypervisor+0x119d692) #24 _$LT$alloc..boxed..Box$LT$F$C$A$GT$$u20$as$u20$core..ops..function..FnOnce$LT$Args$GT$$GT$::call_once::h481697829cbc6746 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/alloc/src/boxed.rs:1854:9 (cloud-hypervisor+0x119d692) #25 std::sys::unix:🧵:Thread:🆕:thread_start::h6fad62c4c393bbe7 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/sys/unix/thread.rs:108:17 (cloud-hypervisor+0x119d692) Mutex M121 previously acquired by the same thread here: #0 pthread_mutex_lock /rustc/llvm/src/llvm-project/compiler-rt/lib/tsan/../sanitizer_common/sanitizer_common_interceptors.inc:4249:3 (cloud-hypervisor+0x9c368) #1 std::sys::unix::mutex::Mutex:🔒:hcd1b9aa06ff775d3 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/sys/unix/mutex.rs:63:17 (cloud-hypervisor+0x662ff4) #2 std::sys_common::mutex::MovableMutex::raw_lock::hff98d0b036469bca /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/sys_common/mutex.rs:76:18 (cloud-hypervisor+0x4915de) #3 std::sync::mutex::Mutex$LT$T$GT$:🔒:h14cfa3c8f5ba878a /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/sync/mutex.rs:267:13 (cloud-hypervisor+0x36ca3b) #4 vmm::cpu::CpuManager::start_vcpu::_$u7b$$u7b$closure$u7d$$u7d$::_$u7b$$u7b$closure$u7d$$u7d$::h37e4dd8619b3a5e5 /home/rob/src/cloud-hypervisor/vmm/src/cpu.rs:813:35 (cloud-hypervisor+0x4777c9) #5 std::panicking::try::do_call::h093e4d1434150d77 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/panicking.rs:406:40 (cloud-hypervisor+0x6d2aea) #6 __rust_try 3hkmq3dzyyv5ejsx (cloud-hypervisor+0x6d3db8) #7 std::panicking::try::hee9535cb997282b4 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/panicking.rs:370:19 (cloud-hypervisor+0x6d268f) #8 std::panic::catch_unwind::he3908c4d08a8a028 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/panic.rs:133:14 (cloud-hypervisor+0x57baf9) #9 vmm::cpu::CpuManager::start_vcpu::_$u7b$$u7b$closure$u7d$$u7d$::h29472aaa3a600231 /home/rob/src/cloud-hypervisor/vmm/src/cpu.rs:782:21 (cloud-hypervisor+0x477156) #10 std::sys_common::backtrace::__rust_begin_short_backtrace::hcfc2f02361c98808 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/sys_common/backtrace.rs:123:18 (cloud-hypervisor+0x65932b) #11 std:🧵:Builder::spawn_unchecked::_$u7b$$u7b$closure$u7d$$u7d$::_$u7b$$u7b$closure$u7d$$u7d$::h08b82db41d7af2f2 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/thread/mod.rs:477:17 (cloud-hypervisor+0x4408ef) #12 _$LT$core..panic..unwind_safe..AssertUnwindSafe$LT$F$GT$$u20$as$u20$core..ops..function..FnOnce$LT$$LP$$RP$$GT$$GT$::call_once::h7ebad9d94e64fa5f /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/core/src/panic/unwind_safe.rs:271:9 (cloud-hypervisor+0x6dd1df) #13 std::panicking::try::do_call::h121fafbdf5cf84af /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/panicking.rs:406:40 (cloud-hypervisor+0x6d2b81) #14 __rust_try 3hkmq3dzyyv5ejsx (cloud-hypervisor+0x6d3db8) #15 std::panicking::try::h79e25f019cd90522 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/panicking.rs:370:19 (cloud-hypervisor+0x6d1e1f) #16 std::panic::catch_unwind::h5a0619a53bbd611d /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/panic.rs:133:14 (cloud-hypervisor+0x57b8ff) #17 std:🧵:Builder::spawn_unchecked::_$u7b$$u7b$closure$u7d$$u7d$::h1cfd689c9d362e48 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/thread/mod.rs:476:30 (cloud-hypervisor+0x43fafb) #18 core::ops::function::FnOnce::call_once$u7b$$u7b$vtable.shim$u7d$$u7d$::h6642b1b3a2289640 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/core/src/ops/function.rs:227:5 (cloud-hypervisor+0x3ced55) #19 _$LT$alloc..boxed..Box$LT$F$C$A$GT$$u20$as$u20$core..ops..function..FnOnce$LT$Args$GT$$GT$::call_once::ha5022a6bb7833f62 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/alloc/src/boxed.rs:1854:9 (cloud-hypervisor+0x119d692) #20 _$LT$alloc..boxed..Box$LT$F$C$A$GT$$u20$as$u20$core..ops..function..FnOnce$LT$Args$GT$$GT$::call_once::h481697829cbc6746 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/alloc/src/boxed.rs:1854:9 (cloud-hypervisor+0x119d692) #21 std::sys::unix:🧵:Thread:🆕:thread_start::h6fad62c4c393bbe7 /rustc/7d6f948173ccb18822bab13d548c65632db5f0aa/library/std/src/sys/unix/thread.rs:108:17 (cloud-hypervisor+0x119d692) Signed-off-by: Rob Bradford <robert.bradford@intel.com>
1891 lines
66 KiB
Rust
1891 lines
66 KiB
Rust
// Copyright © 2020, Oracle and/or its affiliates.
|
||
//
|
||
// Copyright 2018 Amazon.com, Inc. or its affiliates. All Rights Reserved.
|
||
//
|
||
// Portions Copyright 2017 The Chromium OS Authors. All rights reserved.
|
||
// Use of this source code is governed by a BSD-style license that can be
|
||
// found in the LICENSE-BSD-3-Clause file.
|
||
//
|
||
// Copyright © 2019 Intel Corporation
|
||
//
|
||
// SPDX-License-Identifier: Apache-2.0 AND BSD-3-Clause
|
||
//
|
||
|
||
use crate::config::CpusConfig;
|
||
use crate::device_manager::DeviceManager;
|
||
use crate::memory_manager::MemoryManager;
|
||
use crate::seccomp_filters::{get_seccomp_filter, Thread};
|
||
#[cfg(target_arch = "x86_64")]
|
||
use crate::vm::physical_bits;
|
||
use crate::GuestMemoryMmap;
|
||
use crate::CPU_MANAGER_SNAPSHOT_ID;
|
||
#[cfg(feature = "acpi")]
|
||
use acpi_tables::{aml, aml::Aml, sdt::Sdt};
|
||
use anyhow::anyhow;
|
||
use arch::EntryPoint;
|
||
#[cfg(any(target_arch = "aarch64", feature = "acpi"))]
|
||
use arch::NumaNodes;
|
||
use devices::interrupt_controller::InterruptController;
|
||
#[cfg(target_arch = "aarch64")]
|
||
use hypervisor::kvm::kvm_bindings;
|
||
#[cfg(target_arch = "x86_64")]
|
||
use hypervisor::CpuId;
|
||
use hypervisor::{vm::VmmOps, CpuState, HypervisorCpuError, VmExit};
|
||
use libc::{c_void, siginfo_t};
|
||
use seccompiler::{apply_filter, SeccompAction};
|
||
use std::collections::BTreeMap;
|
||
use std::os::unix::thread::JoinHandleExt;
|
||
use std::sync::atomic::{AtomicBool, Ordering};
|
||
use std::sync::{Arc, Barrier, Mutex};
|
||
use std::{cmp, io, result, thread};
|
||
use vm_device::BusDevice;
|
||
#[cfg(feature = "acpi")]
|
||
use vm_memory::GuestAddress;
|
||
use vm_memory::GuestMemoryAtomic;
|
||
use vm_migration::{
|
||
Migratable, MigratableError, Pausable, Snapshot, SnapshotDataSection, Snapshottable,
|
||
Transportable,
|
||
};
|
||
use vmm_sys_util::eventfd::EventFd;
|
||
use vmm_sys_util::signal::{register_signal_handler, SIGRTMIN};
|
||
|
||
#[cfg(feature = "acpi")]
|
||
pub const CPU_MANAGER_ACPI_SIZE: usize = 0xc;
|
||
|
||
#[derive(Debug)]
|
||
pub enum Error {
|
||
/// Cannot create the vCPU.
|
||
VcpuCreate(anyhow::Error),
|
||
|
||
/// Cannot run the VCPUs.
|
||
VcpuRun(anyhow::Error),
|
||
|
||
/// Cannot spawn a new vCPU thread.
|
||
VcpuSpawn(io::Error),
|
||
|
||
/// Cannot generate common CPUID
|
||
CommonCpuId(arch::Error),
|
||
|
||
/// Error configuring VCPU
|
||
VcpuConfiguration(arch::Error),
|
||
|
||
#[cfg(target_arch = "aarch64")]
|
||
/// Error fetching prefered target
|
||
VcpuArmPreferredTarget(hypervisor::HypervisorVmError),
|
||
|
||
#[cfg(target_arch = "aarch64")]
|
||
/// Error doing vCPU init on Arm.
|
||
VcpuArmInit(hypervisor::HypervisorCpuError),
|
||
|
||
/// Failed to join on vCPU threads
|
||
ThreadCleanup(std::boxed::Box<dyn std::any::Any + std::marker::Send>),
|
||
|
||
/// Cannot add legacy device to Bus.
|
||
BusError(vm_device::BusError),
|
||
|
||
/// Asking for more vCPUs that we can have
|
||
DesiredVCpuCountExceedsMax,
|
||
|
||
/// Cannot create seccomp filter
|
||
CreateSeccompFilter(seccompiler::Error),
|
||
|
||
/// Cannot apply seccomp filter
|
||
ApplySeccompFilter(seccompiler::Error),
|
||
|
||
/// Error starting vCPU after restore
|
||
StartRestoreVcpu(anyhow::Error),
|
||
|
||
/// Error because an unexpected VmExit type was received.
|
||
UnexpectedVmExit,
|
||
|
||
/// Failed to allocate MMIO address
|
||
AllocateMmmioAddress,
|
||
|
||
#[cfg(feature = "tdx")]
|
||
InitializeTdx(hypervisor::HypervisorCpuError),
|
||
|
||
/// Failed scheduling the thread on the expected CPU set.
|
||
ScheduleCpuSet,
|
||
}
|
||
pub type Result<T> = result::Result<T, Error>;
|
||
|
||
#[cfg(all(target_arch = "x86_64", feature = "acpi"))]
|
||
#[allow(dead_code)]
|
||
#[repr(packed)]
|
||
struct LocalApic {
|
||
pub r#type: u8,
|
||
pub length: u8,
|
||
pub processor_id: u8,
|
||
pub apic_id: u8,
|
||
pub flags: u32,
|
||
}
|
||
|
||
#[allow(dead_code)]
|
||
#[repr(packed)]
|
||
#[derive(Default)]
|
||
struct Ioapic {
|
||
pub r#type: u8,
|
||
pub length: u8,
|
||
pub ioapic_id: u8,
|
||
_reserved: u8,
|
||
pub apic_address: u32,
|
||
pub gsi_base: u32,
|
||
}
|
||
|
||
#[cfg(all(target_arch = "aarch64", feature = "acpi"))]
|
||
#[allow(dead_code)]
|
||
#[repr(packed)]
|
||
struct GicC {
|
||
pub r#type: u8,
|
||
pub length: u8,
|
||
pub reserved0: u16,
|
||
pub cpu_interface_number: u32,
|
||
pub uid: u32,
|
||
pub flags: u32,
|
||
pub parking_version: u32,
|
||
pub performance_interrupt: u32,
|
||
pub parked_address: u64,
|
||
pub base_address: u64,
|
||
pub gicv_base_address: u64,
|
||
pub gich_base_address: u64,
|
||
pub vgic_interrupt: u32,
|
||
pub gicr_base_address: u64,
|
||
pub mpidr: u64,
|
||
pub proc_power_effi_class: u8,
|
||
pub reserved1: u8,
|
||
pub spe_overflow_interrupt: u16,
|
||
}
|
||
|
||
#[cfg(all(target_arch = "aarch64", feature = "acpi"))]
|
||
#[allow(dead_code)]
|
||
#[repr(packed)]
|
||
struct GicD {
|
||
pub r#type: u8,
|
||
pub length: u8,
|
||
pub reserved0: u16,
|
||
pub gic_id: u32,
|
||
pub base_address: u64,
|
||
pub global_irq_base: u32,
|
||
pub version: u8,
|
||
pub reserved1: [u8; 3],
|
||
}
|
||
|
||
#[cfg(all(target_arch = "aarch64", feature = "acpi"))]
|
||
#[allow(dead_code)]
|
||
#[repr(packed)]
|
||
struct GicR {
|
||
pub r#type: u8,
|
||
pub length: u8,
|
||
pub reserved: u16,
|
||
pub base_address: u64,
|
||
pub range_length: u32,
|
||
}
|
||
|
||
#[cfg(all(target_arch = "aarch64", feature = "acpi"))]
|
||
#[allow(dead_code)]
|
||
#[repr(packed)]
|
||
struct GicIts {
|
||
pub r#type: u8,
|
||
pub length: u8,
|
||
pub reserved0: u16,
|
||
pub translation_id: u32,
|
||
pub base_address: u64,
|
||
pub reserved1: u32,
|
||
}
|
||
|
||
#[cfg(all(target_arch = "aarch64", feature = "acpi"))]
|
||
#[allow(dead_code)]
|
||
#[repr(packed)]
|
||
struct ProcessorHierarchyNode {
|
||
pub r#type: u8,
|
||
pub length: u8,
|
||
pub reserved: u16,
|
||
pub flags: u32,
|
||
pub parent: u32,
|
||
pub acpi_processor_id: u32,
|
||
pub num_private_resources: u32,
|
||
}
|
||
|
||
#[allow(dead_code)]
|
||
#[repr(packed)]
|
||
#[derive(Default)]
|
||
struct InterruptSourceOverride {
|
||
pub r#type: u8,
|
||
pub length: u8,
|
||
pub bus: u8,
|
||
pub source: u8,
|
||
pub gsi: u32,
|
||
pub flags: u16,
|
||
}
|
||
|
||
/// A wrapper around creating and using a kvm-based VCPU.
|
||
pub struct Vcpu {
|
||
// The hypervisor abstracted CPU.
|
||
vcpu: Arc<dyn hypervisor::Vcpu>,
|
||
id: u8,
|
||
#[cfg(target_arch = "aarch64")]
|
||
mpidr: u64,
|
||
saved_state: Option<CpuState>,
|
||
}
|
||
|
||
impl Vcpu {
|
||
/// Constructs a new VCPU for `vm`.
|
||
///
|
||
/// # Arguments
|
||
///
|
||
/// * `id` - Represents the CPU number between [0, max vcpus).
|
||
/// * `vm` - The virtual machine this vcpu will get attached to.
|
||
/// * `vmmops` - Optional object for exit handling.
|
||
pub fn new(
|
||
id: u8,
|
||
vm: &Arc<dyn hypervisor::Vm>,
|
||
vmmops: Option<Arc<dyn VmmOps>>,
|
||
) -> Result<Self> {
|
||
let vcpu = vm
|
||
.create_vcpu(id, vmmops)
|
||
.map_err(|e| Error::VcpuCreate(e.into()))?;
|
||
// Initially the cpuid per vCPU is the one supported by this VM.
|
||
Ok(Vcpu {
|
||
vcpu,
|
||
id,
|
||
#[cfg(target_arch = "aarch64")]
|
||
mpidr: 0,
|
||
saved_state: None,
|
||
})
|
||
}
|
||
|
||
/// Configures a vcpu and should be called once per vcpu when created.
|
||
///
|
||
/// # Arguments
|
||
///
|
||
/// * `kernel_entry_point` - Kernel entry point address in guest memory and boot protocol used.
|
||
/// * `vm_memory` - Guest memory.
|
||
/// * `cpuid` - (x86_64) CpuId, wrapper over the `kvm_cpuid2` structure.
|
||
pub fn configure(
|
||
&mut self,
|
||
#[cfg(target_arch = "aarch64")] vm: &Arc<dyn hypervisor::Vm>,
|
||
kernel_entry_point: Option<EntryPoint>,
|
||
vm_memory: &GuestMemoryAtomic<GuestMemoryMmap>,
|
||
#[cfg(target_arch = "x86_64")] cpuid: CpuId,
|
||
#[cfg(target_arch = "x86_64")] kvm_hyperv: bool,
|
||
) -> Result<()> {
|
||
#[cfg(target_arch = "aarch64")]
|
||
{
|
||
self.init(vm)?;
|
||
self.mpidr = arch::configure_vcpu(&self.vcpu, self.id, kernel_entry_point, vm_memory)
|
||
.map_err(Error::VcpuConfiguration)?;
|
||
}
|
||
info!("Configuring vCPU: cpu_id = {}", self.id);
|
||
#[cfg(target_arch = "x86_64")]
|
||
arch::configure_vcpu(
|
||
&self.vcpu,
|
||
self.id,
|
||
kernel_entry_point,
|
||
vm_memory,
|
||
cpuid,
|
||
kvm_hyperv,
|
||
)
|
||
.map_err(Error::VcpuConfiguration)?;
|
||
|
||
Ok(())
|
||
}
|
||
|
||
/// Gets the MPIDR register value.
|
||
#[cfg(target_arch = "aarch64")]
|
||
pub fn get_mpidr(&self) -> u64 {
|
||
self.mpidr
|
||
}
|
||
|
||
/// Gets the saved vCPU state.
|
||
#[cfg(target_arch = "aarch64")]
|
||
pub fn get_saved_state(&self) -> Option<CpuState> {
|
||
self.saved_state.clone()
|
||
}
|
||
|
||
/// Initializes an aarch64 specific vcpu for booting Linux.
|
||
#[cfg(target_arch = "aarch64")]
|
||
pub fn init(&self, vm: &Arc<dyn hypervisor::Vm>) -> Result<()> {
|
||
let mut kvi: kvm_bindings::kvm_vcpu_init = kvm_bindings::kvm_vcpu_init::default();
|
||
|
||
// This reads back the kernel's preferred target type.
|
||
vm.get_preferred_target(&mut kvi)
|
||
.map_err(Error::VcpuArmPreferredTarget)?;
|
||
// We already checked that the capability is supported.
|
||
kvi.features[0] |= 1 << kvm_bindings::KVM_ARM_VCPU_PSCI_0_2;
|
||
// Non-boot cpus are powered off initially.
|
||
if self.id > 0 {
|
||
kvi.features[0] |= 1 << kvm_bindings::KVM_ARM_VCPU_POWER_OFF;
|
||
}
|
||
self.vcpu.vcpu_init(&kvi).map_err(Error::VcpuArmInit)
|
||
}
|
||
|
||
/// Runs the VCPU until it exits, returning the reason.
|
||
///
|
||
/// Note that the state of the VCPU and associated VM must be setup first for this to do
|
||
/// anything useful.
|
||
pub fn run(&self) -> std::result::Result<VmExit, HypervisorCpuError> {
|
||
self.vcpu.run()
|
||
}
|
||
}
|
||
|
||
const VCPU_SNAPSHOT_ID: &str = "vcpu";
|
||
impl Pausable for Vcpu {
|
||
fn pause(&mut self) -> std::result::Result<(), MigratableError> {
|
||
self.saved_state =
|
||
Some(self.vcpu.state().map_err(|e| {
|
||
MigratableError::Pause(anyhow!("Could not get vCPU state {:?}", e))
|
||
})?);
|
||
|
||
Ok(())
|
||
}
|
||
|
||
fn resume(&mut self) -> std::result::Result<(), MigratableError> {
|
||
if let Some(vcpu_state) = &self.saved_state {
|
||
self.vcpu.set_state(vcpu_state).map_err(|e| {
|
||
MigratableError::Pause(anyhow!("Could not set the vCPU state {:?}", e))
|
||
})?;
|
||
}
|
||
|
||
Ok(())
|
||
}
|
||
}
|
||
impl Snapshottable for Vcpu {
|
||
fn id(&self) -> String {
|
||
VCPU_SNAPSHOT_ID.to_string()
|
||
}
|
||
|
||
fn snapshot(&mut self) -> std::result::Result<Snapshot, MigratableError> {
|
||
let mut vcpu_snapshot = Snapshot::new(&format!("{}", self.id));
|
||
vcpu_snapshot.add_data_section(SnapshotDataSection::new_from_state(
|
||
VCPU_SNAPSHOT_ID,
|
||
&self.saved_state,
|
||
)?);
|
||
|
||
Ok(vcpu_snapshot)
|
||
}
|
||
|
||
fn restore(&mut self, snapshot: Snapshot) -> std::result::Result<(), MigratableError> {
|
||
self.saved_state = Some(snapshot.to_state(VCPU_SNAPSHOT_ID)?);
|
||
Ok(())
|
||
}
|
||
}
|
||
|
||
pub struct CpuManager {
|
||
config: CpusConfig,
|
||
#[cfg_attr(target_arch = "aarch64", allow(dead_code))]
|
||
interrupt_controller: Option<Arc<Mutex<dyn InterruptController>>>,
|
||
#[cfg_attr(target_arch = "aarch64", allow(dead_code))]
|
||
vm_memory: GuestMemoryAtomic<GuestMemoryMmap>,
|
||
#[cfg(target_arch = "x86_64")]
|
||
cpuid: CpuId,
|
||
#[cfg_attr(target_arch = "aarch64", allow(dead_code))]
|
||
vm: Arc<dyn hypervisor::Vm>,
|
||
vcpus_kill_signalled: Arc<AtomicBool>,
|
||
vcpus_pause_signalled: Arc<AtomicBool>,
|
||
exit_evt: EventFd,
|
||
#[cfg_attr(target_arch = "aarch64", allow(dead_code))]
|
||
reset_evt: EventFd,
|
||
vcpu_states: Vec<VcpuState>,
|
||
selected_cpu: u8,
|
||
vcpus: Vec<Arc<Mutex<Vcpu>>>,
|
||
seccomp_action: SeccompAction,
|
||
vmmops: Arc<dyn VmmOps>,
|
||
#[cfg(feature = "acpi")]
|
||
#[cfg_attr(target_arch = "aarch64", allow(dead_code))]
|
||
acpi_address: GuestAddress,
|
||
#[cfg(feature = "acpi")]
|
||
proximity_domain_per_cpu: BTreeMap<u8, u32>,
|
||
affinity: BTreeMap<u8, Vec<u8>>,
|
||
}
|
||
|
||
const CPU_ENABLE_FLAG: usize = 0;
|
||
const CPU_INSERTING_FLAG: usize = 1;
|
||
const CPU_REMOVING_FLAG: usize = 2;
|
||
const CPU_EJECT_FLAG: usize = 3;
|
||
|
||
const CPU_STATUS_OFFSET: u64 = 4;
|
||
const CPU_SELECTION_OFFSET: u64 = 0;
|
||
|
||
impl BusDevice for CpuManager {
|
||
fn read(&mut self, _base: u64, offset: u64, data: &mut [u8]) {
|
||
// The Linux kernel, quite reasonably, doesn't zero the memory it gives us.
|
||
data.fill(0);
|
||
|
||
match offset {
|
||
CPU_SELECTION_OFFSET => {
|
||
data[0] = self.selected_cpu;
|
||
}
|
||
CPU_STATUS_OFFSET => {
|
||
if self.selected_cpu < self.max_vcpus() {
|
||
let state = &self.vcpu_states[usize::from(self.selected_cpu)];
|
||
if state.active() {
|
||
data[0] |= 1 << CPU_ENABLE_FLAG;
|
||
}
|
||
if state.inserting {
|
||
data[0] |= 1 << CPU_INSERTING_FLAG;
|
||
}
|
||
if state.removing {
|
||
data[0] |= 1 << CPU_REMOVING_FLAG;
|
||
}
|
||
} else {
|
||
warn!("Out of range vCPU id: {}", self.selected_cpu);
|
||
}
|
||
}
|
||
_ => {
|
||
warn!(
|
||
"Unexpected offset for accessing CPU manager device: {:#}",
|
||
offset
|
||
);
|
||
}
|
||
}
|
||
}
|
||
|
||
fn write(&mut self, _base: u64, offset: u64, data: &[u8]) -> Option<Arc<Barrier>> {
|
||
match offset {
|
||
CPU_SELECTION_OFFSET => {
|
||
self.selected_cpu = data[0];
|
||
}
|
||
CPU_STATUS_OFFSET => {
|
||
if self.selected_cpu < self.max_vcpus() {
|
||
let state = &mut self.vcpu_states[usize::from(self.selected_cpu)];
|
||
// The ACPI code writes back a 1 to acknowledge the insertion
|
||
if (data[0] & (1 << CPU_INSERTING_FLAG) == 1 << CPU_INSERTING_FLAG)
|
||
&& state.inserting
|
||
{
|
||
state.inserting = false;
|
||
}
|
||
// Ditto for removal
|
||
if (data[0] & (1 << CPU_REMOVING_FLAG) == 1 << CPU_REMOVING_FLAG)
|
||
&& state.removing
|
||
{
|
||
state.removing = false;
|
||
}
|
||
// Trigger removal of vCPU
|
||
if data[0] & (1 << CPU_EJECT_FLAG) == 1 << CPU_EJECT_FLAG {
|
||
if let Err(e) = self.remove_vcpu(self.selected_cpu) {
|
||
error!("Error removing vCPU: {:?}", e);
|
||
}
|
||
}
|
||
} else {
|
||
warn!("Out of range vCPU id: {}", self.selected_cpu);
|
||
}
|
||
}
|
||
_ => {
|
||
warn!(
|
||
"Unexpected offset for accessing CPU manager device: {:#}",
|
||
offset
|
||
);
|
||
}
|
||
}
|
||
None
|
||
}
|
||
}
|
||
|
||
#[derive(Default)]
|
||
struct VcpuState {
|
||
inserting: bool,
|
||
removing: bool,
|
||
handle: Option<thread::JoinHandle<()>>,
|
||
kill: Arc<AtomicBool>,
|
||
vcpu_run_interrupted: Arc<AtomicBool>,
|
||
}
|
||
|
||
impl VcpuState {
|
||
fn active(&self) -> bool {
|
||
self.handle.is_some()
|
||
}
|
||
|
||
fn signal_thread(&self) {
|
||
if let Some(handle) = self.handle.as_ref() {
|
||
loop {
|
||
unsafe {
|
||
libc::pthread_kill(handle.as_pthread_t() as _, SIGRTMIN());
|
||
}
|
||
if self.vcpu_run_interrupted.load(Ordering::SeqCst) {
|
||
break;
|
||
} else {
|
||
// This is more effective than thread::yield_now() at
|
||
// avoiding a priority inversion with the vCPU thread
|
||
thread::sleep(std::time::Duration::from_millis(1));
|
||
}
|
||
}
|
||
}
|
||
}
|
||
|
||
fn join_thread(&mut self) -> Result<()> {
|
||
if let Some(handle) = self.handle.take() {
|
||
handle.join().map_err(Error::ThreadCleanup)?
|
||
}
|
||
|
||
Ok(())
|
||
}
|
||
|
||
fn unpark_thread(&self) {
|
||
if let Some(handle) = self.handle.as_ref() {
|
||
handle.thread().unpark()
|
||
}
|
||
}
|
||
}
|
||
|
||
impl CpuManager {
|
||
#[allow(unused_variables)]
|
||
#[allow(clippy::too_many_arguments)]
|
||
pub fn new(
|
||
config: &CpusConfig,
|
||
device_manager: &Arc<Mutex<DeviceManager>>,
|
||
memory_manager: &Arc<Mutex<MemoryManager>>,
|
||
vm: Arc<dyn hypervisor::Vm>,
|
||
exit_evt: EventFd,
|
||
reset_evt: EventFd,
|
||
hypervisor: Arc<dyn hypervisor::Hypervisor>,
|
||
seccomp_action: SeccompAction,
|
||
vmmops: Arc<dyn VmmOps>,
|
||
#[cfg(feature = "tdx")] tdx_enabled: bool,
|
||
#[cfg(any(target_arch = "aarch64", feature = "acpi"))] numa_nodes: &NumaNodes,
|
||
) -> Result<Arc<Mutex<CpuManager>>> {
|
||
let guest_memory = memory_manager.lock().unwrap().guest_memory();
|
||
let mut vcpu_states = Vec::with_capacity(usize::from(config.max_vcpus));
|
||
vcpu_states.resize_with(usize::from(config.max_vcpus), VcpuState::default);
|
||
|
||
#[cfg(target_arch = "x86_64")]
|
||
let sgx_epc_sections = memory_manager
|
||
.lock()
|
||
.unwrap()
|
||
.sgx_epc_region()
|
||
.as_ref()
|
||
.map(|sgx_epc_region| sgx_epc_region.epc_sections().values().cloned().collect());
|
||
#[cfg(target_arch = "x86_64")]
|
||
let cpuid = {
|
||
let phys_bits = physical_bits(config.max_phys_bits);
|
||
arch::generate_common_cpuid(
|
||
hypervisor,
|
||
config
|
||
.topology
|
||
.clone()
|
||
.map(|t| (t.threads_per_core, t.cores_per_die, t.dies_per_package)),
|
||
sgx_epc_sections,
|
||
phys_bits,
|
||
config.kvm_hyperv,
|
||
#[cfg(feature = "tdx")]
|
||
tdx_enabled,
|
||
)
|
||
.map_err(Error::CommonCpuId)?
|
||
};
|
||
|
||
let device_manager = device_manager.lock().unwrap();
|
||
#[cfg(feature = "acpi")]
|
||
let acpi_address = device_manager
|
||
.allocator()
|
||
.lock()
|
||
.unwrap()
|
||
.allocate_platform_mmio_addresses(None, CPU_MANAGER_ACPI_SIZE as u64, None)
|
||
.ok_or(Error::AllocateMmmioAddress)?;
|
||
|
||
#[cfg(feature = "acpi")]
|
||
let proximity_domain_per_cpu: BTreeMap<u8, u32> = {
|
||
let mut cpu_list = Vec::new();
|
||
for (proximity_domain, numa_node) in numa_nodes.iter() {
|
||
for cpu in numa_node.cpus.iter() {
|
||
cpu_list.push((*cpu, *proximity_domain))
|
||
}
|
||
}
|
||
cpu_list
|
||
}
|
||
.into_iter()
|
||
.collect();
|
||
|
||
let affinity = if let Some(cpu_affinity) = config.affinity.as_ref() {
|
||
cpu_affinity
|
||
.iter()
|
||
.map(|a| (a.vcpu, a.host_cpus.clone()))
|
||
.collect()
|
||
} else {
|
||
BTreeMap::new()
|
||
};
|
||
|
||
let cpu_manager = Arc::new(Mutex::new(CpuManager {
|
||
config: config.clone(),
|
||
interrupt_controller: device_manager.interrupt_controller().clone(),
|
||
vm_memory: guest_memory,
|
||
#[cfg(target_arch = "x86_64")]
|
||
cpuid,
|
||
vm,
|
||
vcpus_kill_signalled: Arc::new(AtomicBool::new(false)),
|
||
vcpus_pause_signalled: Arc::new(AtomicBool::new(false)),
|
||
vcpu_states,
|
||
exit_evt,
|
||
reset_evt,
|
||
selected_cpu: 0,
|
||
vcpus: Vec::with_capacity(usize::from(config.max_vcpus)),
|
||
seccomp_action,
|
||
vmmops,
|
||
#[cfg(feature = "acpi")]
|
||
acpi_address,
|
||
#[cfg(feature = "acpi")]
|
||
proximity_domain_per_cpu,
|
||
affinity,
|
||
}));
|
||
|
||
#[cfg(feature = "acpi")]
|
||
device_manager
|
||
.mmio_bus()
|
||
.insert(
|
||
cpu_manager.clone(),
|
||
acpi_address.0,
|
||
CPU_MANAGER_ACPI_SIZE as u64,
|
||
)
|
||
.map_err(Error::BusError)?;
|
||
|
||
Ok(cpu_manager)
|
||
}
|
||
|
||
fn create_vcpu(
|
||
&mut self,
|
||
cpu_id: u8,
|
||
entry_point: Option<EntryPoint>,
|
||
snapshot: Option<Snapshot>,
|
||
) -> Result<Arc<Mutex<Vcpu>>> {
|
||
info!("Creating vCPU: cpu_id = {}", cpu_id);
|
||
|
||
let mut vcpu = Vcpu::new(cpu_id, &self.vm, Some(self.vmmops.clone()))?;
|
||
|
||
if let Some(snapshot) = snapshot {
|
||
// AArch64 vCPUs should be initialized after created.
|
||
#[cfg(target_arch = "aarch64")]
|
||
vcpu.init(&self.vm)?;
|
||
|
||
vcpu.restore(snapshot).expect("Failed to restore vCPU");
|
||
} else {
|
||
let vm_memory = self.vm_memory.clone();
|
||
|
||
#[cfg(target_arch = "x86_64")]
|
||
vcpu.configure(
|
||
entry_point,
|
||
&vm_memory,
|
||
self.cpuid.clone(),
|
||
self.config.kvm_hyperv,
|
||
)
|
||
.expect("Failed to configure vCPU");
|
||
|
||
#[cfg(target_arch = "aarch64")]
|
||
vcpu.configure(&self.vm, entry_point, &vm_memory)
|
||
.expect("Failed to configure vCPU");
|
||
}
|
||
|
||
// Adding vCPU to the CpuManager's vCPU list.
|
||
let vcpu = Arc::new(Mutex::new(vcpu));
|
||
self.vcpus.push(Arc::clone(&vcpu));
|
||
|
||
Ok(vcpu)
|
||
}
|
||
|
||
/// Only create new vCPUs if there aren't any inactive ones to reuse
|
||
fn create_vcpus(&mut self, desired_vcpus: u8, entry_point: Option<EntryPoint>) -> Result<()> {
|
||
info!(
|
||
"Request to create new vCPUs: desired = {}, max = {}, allocated = {}, present = {}",
|
||
desired_vcpus,
|
||
self.config.max_vcpus,
|
||
self.vcpus.len(),
|
||
self.present_vcpus()
|
||
);
|
||
|
||
if desired_vcpus > self.config.max_vcpus {
|
||
return Err(Error::DesiredVCpuCountExceedsMax);
|
||
}
|
||
|
||
// Only create vCPUs in excess of all the allocated vCPUs.
|
||
for cpu_id in self.vcpus.len() as u8..desired_vcpus {
|
||
self.create_vcpu(cpu_id, entry_point, None)?;
|
||
}
|
||
|
||
Ok(())
|
||
}
|
||
|
||
fn start_vcpu(
|
||
&mut self,
|
||
vcpu: Arc<Mutex<Vcpu>>,
|
||
vcpu_id: u8,
|
||
vcpu_thread_barrier: Arc<Barrier>,
|
||
inserting: bool,
|
||
) -> Result<()> {
|
||
let reset_evt = self.reset_evt.try_clone().unwrap();
|
||
let exit_evt = self.exit_evt.try_clone().unwrap();
|
||
let panic_exit_evt = self.exit_evt.try_clone().unwrap();
|
||
let vcpu_kill_signalled = self.vcpus_kill_signalled.clone();
|
||
let vcpu_pause_signalled = self.vcpus_pause_signalled.clone();
|
||
|
||
let vcpu_kill = self.vcpu_states[usize::from(vcpu_id)].kill.clone();
|
||
let vcpu_run_interrupted = self.vcpu_states[usize::from(vcpu_id)]
|
||
.vcpu_run_interrupted
|
||
.clone();
|
||
let panic_vcpu_run_interrupted = vcpu_run_interrupted.clone();
|
||
|
||
// Prepare the CPU set the current vCPU is expected to run onto.
|
||
let cpuset = self.affinity.get(&vcpu_id).map(|host_cpus| {
|
||
let mut cpuset: libc::cpu_set_t = unsafe { std::mem::zeroed() };
|
||
unsafe { libc::CPU_ZERO(&mut cpuset) };
|
||
for host_cpu in host_cpus {
|
||
unsafe { libc::CPU_SET(*host_cpu as usize, &mut cpuset) };
|
||
}
|
||
cpuset
|
||
});
|
||
|
||
// Retrieve seccomp filter for vcpu thread
|
||
let vcpu_seccomp_filter = get_seccomp_filter(&self.seccomp_action, Thread::Vcpu)
|
||
.map_err(Error::CreateSeccompFilter)?;
|
||
|
||
#[cfg(target_arch = "x86_64")]
|
||
let interrupt_controller_clone = self.interrupt_controller.as_ref().cloned();
|
||
|
||
info!("Starting vCPU: cpu_id = {}", vcpu_id);
|
||
|
||
let handle = Some(
|
||
thread::Builder::new()
|
||
.name(format!("vcpu{}", vcpu_id))
|
||
.spawn(move || {
|
||
// Schedule the thread to run on the expected CPU set
|
||
if let Some(cpuset) = cpuset.as_ref() {
|
||
let ret = unsafe {
|
||
libc::sched_setaffinity(
|
||
0,
|
||
std::mem::size_of::<libc::cpu_set_t>(),
|
||
cpuset as *const libc::cpu_set_t,
|
||
)
|
||
};
|
||
|
||
if ret != 0 {
|
||
error!(
|
||
"Failed scheduling the vCPU {} on the expected CPU set: {}",
|
||
vcpu_id,
|
||
io::Error::last_os_error()
|
||
);
|
||
return;
|
||
}
|
||
}
|
||
|
||
// Apply seccomp filter for vcpu thread.
|
||
if !vcpu_seccomp_filter.is_empty() {
|
||
if let Err(e) =
|
||
apply_filter(&vcpu_seccomp_filter).map_err(Error::ApplySeccompFilter)
|
||
{
|
||
error!("Error applying seccomp filter: {:?}", e);
|
||
return;
|
||
}
|
||
}
|
||
extern "C" fn handle_signal(_: i32, _: *mut siginfo_t, _: *mut c_void) {}
|
||
// This uses an async signal safe handler to kill the vcpu handles.
|
||
register_signal_handler(SIGRTMIN(), handle_signal)
|
||
.expect("Failed to register vcpu signal handler");
|
||
// Block until all CPUs are ready.
|
||
vcpu_thread_barrier.wait();
|
||
|
||
std::panic::catch_unwind(move || {
|
||
loop {
|
||
// If we are being told to pause, we park the thread
|
||
// until the pause boolean is toggled.
|
||
// The resume operation is responsible for toggling
|
||
// the boolean and unpark the thread.
|
||
// We enter a loop because park() could spuriously
|
||
// return. We will then park() again unless the
|
||
// pause boolean has been toggled.
|
||
|
||
// Need to use Ordering::SeqCst as we have multiple
|
||
// loads and stores to different atomics and we need
|
||
// to see them in a consistent order in all threads
|
||
|
||
if vcpu_pause_signalled.load(Ordering::SeqCst) {
|
||
vcpu_run_interrupted.store(true, Ordering::SeqCst);
|
||
while vcpu_pause_signalled.load(Ordering::SeqCst) {
|
||
thread::park();
|
||
}
|
||
vcpu_run_interrupted.store(false, Ordering::SeqCst);
|
||
}
|
||
|
||
// We've been told to terminate
|
||
if vcpu_kill_signalled.load(Ordering::SeqCst)
|
||
|| vcpu_kill.load(Ordering::SeqCst)
|
||
{
|
||
vcpu_run_interrupted.store(true, Ordering::SeqCst);
|
||
break;
|
||
}
|
||
|
||
// vcpu.run() returns false on a triple-fault so trigger a reset
|
||
match vcpu.lock().unwrap().run() {
|
||
Ok(run) => match run {
|
||
#[cfg(target_arch = "x86_64")]
|
||
VmExit::IoapicEoi(vector) => {
|
||
if let Some(interrupt_controller) =
|
||
&interrupt_controller_clone
|
||
{
|
||
interrupt_controller
|
||
.lock()
|
||
.unwrap()
|
||
.end_of_interrupt(vector);
|
||
}
|
||
}
|
||
VmExit::Ignore => {}
|
||
VmExit::Hyperv => {}
|
||
VmExit::Reset => {
|
||
info!("VmExit::Reset");
|
||
vcpu_run_interrupted.store(true, Ordering::SeqCst);
|
||
reset_evt.write(1).unwrap();
|
||
break;
|
||
}
|
||
VmExit::Shutdown => {
|
||
info!("VmExit::Shutdown");
|
||
vcpu_run_interrupted.store(true, Ordering::SeqCst);
|
||
exit_evt.write(1).unwrap();
|
||
break;
|
||
}
|
||
_ => {
|
||
error!(
|
||
"VCPU generated error: {:?}",
|
||
Error::UnexpectedVmExit
|
||
);
|
||
break;
|
||
}
|
||
},
|
||
|
||
Err(e) => {
|
||
error!("VCPU generated error: {:?}", Error::VcpuRun(e.into()));
|
||
break;
|
||
}
|
||
}
|
||
|
||
// We've been told to terminate
|
||
if vcpu_kill_signalled.load(Ordering::SeqCst)
|
||
|| vcpu_kill.load(Ordering::SeqCst)
|
||
{
|
||
vcpu_run_interrupted.store(true, Ordering::SeqCst);
|
||
break;
|
||
}
|
||
}
|
||
})
|
||
.or_else(|_| {
|
||
panic_vcpu_run_interrupted.store(true, Ordering::SeqCst);
|
||
error!("vCPU thread panicked");
|
||
panic_exit_evt.write(1)
|
||
})
|
||
.ok();
|
||
})
|
||
.map_err(Error::VcpuSpawn)?,
|
||
);
|
||
|
||
// On hot plug calls into this function entry_point is None. It is for
|
||
// those hotplug CPU additions that we need to set the inserting flag.
|
||
self.vcpu_states[usize::from(vcpu_id)].handle = handle;
|
||
self.vcpu_states[usize::from(vcpu_id)].inserting = inserting;
|
||
|
||
Ok(())
|
||
}
|
||
|
||
/// Start up as many vCPUs threads as needed to reach `desired_vcpus`
|
||
fn activate_vcpus(&mut self, desired_vcpus: u8, inserting: bool) -> Result<()> {
|
||
if desired_vcpus > self.config.max_vcpus {
|
||
return Err(Error::DesiredVCpuCountExceedsMax);
|
||
}
|
||
|
||
let vcpu_thread_barrier = Arc::new(Barrier::new(
|
||
(desired_vcpus - self.present_vcpus() + 1) as usize,
|
||
));
|
||
|
||
info!(
|
||
"Starting vCPUs: desired = {}, allocated = {}, present = {}",
|
||
desired_vcpus,
|
||
self.vcpus.len(),
|
||
self.present_vcpus()
|
||
);
|
||
|
||
// This reuses any inactive vCPUs as well as any that were newly created
|
||
for vcpu_id in self.present_vcpus()..desired_vcpus {
|
||
let vcpu = Arc::clone(&self.vcpus[vcpu_id as usize]);
|
||
self.start_vcpu(vcpu, vcpu_id, vcpu_thread_barrier.clone(), inserting)?;
|
||
}
|
||
|
||
// Unblock all CPU threads.
|
||
vcpu_thread_barrier.wait();
|
||
Ok(())
|
||
}
|
||
|
||
fn mark_vcpus_for_removal(&mut self, desired_vcpus: u8) {
|
||
// Mark vCPUs for removal, actual removal happens on ejection
|
||
for cpu_id in desired_vcpus..self.present_vcpus() {
|
||
self.vcpu_states[usize::from(cpu_id)].removing = true;
|
||
}
|
||
}
|
||
|
||
fn remove_vcpu(&mut self, cpu_id: u8) -> Result<()> {
|
||
info!("Removing vCPU: cpu_id = {}", cpu_id);
|
||
let mut state = &mut self.vcpu_states[usize::from(cpu_id)];
|
||
state.kill.store(true, Ordering::SeqCst);
|
||
state.signal_thread();
|
||
state.join_thread()?;
|
||
state.handle = None;
|
||
|
||
// Once the thread has exited, clear the "kill" so that it can reused
|
||
state.kill.store(false, Ordering::SeqCst);
|
||
|
||
Ok(())
|
||
}
|
||
|
||
pub fn create_boot_vcpus(&mut self, entry_point: Option<EntryPoint>) -> Result<()> {
|
||
self.create_vcpus(self.boot_vcpus(), entry_point)
|
||
}
|
||
|
||
// Starts all the vCPUs that the VM is booting with. Blocks until all vCPUs are running.
|
||
pub fn start_boot_vcpus(&mut self) -> Result<()> {
|
||
self.activate_vcpus(self.boot_vcpus(), false)
|
||
}
|
||
|
||
pub fn start_restored_vcpus(&mut self) -> Result<()> {
|
||
let vcpu_numbers = self.vcpus.len() as u8;
|
||
let vcpu_thread_barrier = Arc::new(Barrier::new((vcpu_numbers + 1) as usize));
|
||
// Restore the vCPUs in "paused" state.
|
||
self.vcpus_pause_signalled.store(true, Ordering::SeqCst);
|
||
|
||
for vcpu_id in 0..vcpu_numbers {
|
||
let vcpu = Arc::clone(&self.vcpus[vcpu_id as usize]);
|
||
|
||
self.start_vcpu(vcpu, vcpu_id, vcpu_thread_barrier.clone(), false)
|
||
.map_err(|e| {
|
||
Error::StartRestoreVcpu(anyhow!("Failed to start restored vCPUs: {:#?}", e))
|
||
})?;
|
||
}
|
||
// Unblock all restored CPU threads.
|
||
vcpu_thread_barrier.wait();
|
||
Ok(())
|
||
}
|
||
|
||
pub fn resize(&mut self, desired_vcpus: u8) -> Result<bool> {
|
||
match desired_vcpus.cmp(&self.present_vcpus()) {
|
||
cmp::Ordering::Greater => {
|
||
self.create_vcpus(desired_vcpus, None)?;
|
||
self.activate_vcpus(desired_vcpus, true)?;
|
||
Ok(true)
|
||
}
|
||
cmp::Ordering::Less => {
|
||
self.mark_vcpus_for_removal(desired_vcpus);
|
||
Ok(true)
|
||
}
|
||
_ => Ok(false),
|
||
}
|
||
}
|
||
|
||
pub fn shutdown(&mut self) -> Result<()> {
|
||
// Tell the vCPUs to stop themselves next time they go through the loop
|
||
self.vcpus_kill_signalled.store(true, Ordering::SeqCst);
|
||
|
||
// Toggle the vCPUs pause boolean
|
||
self.vcpus_pause_signalled.store(false, Ordering::SeqCst);
|
||
|
||
// Unpark all the VCPU threads.
|
||
for state in self.vcpu_states.iter() {
|
||
state.unpark_thread();
|
||
}
|
||
|
||
// Signal to the spawned threads (vCPUs and console signal handler). For the vCPU threads
|
||
// this will interrupt the KVM_RUN ioctl() allowing the loop to check the boolean set
|
||
// above.
|
||
for state in self.vcpu_states.iter() {
|
||
state.signal_thread();
|
||
}
|
||
|
||
// Wait for all the threads to finish. This removes the state from the vector.
|
||
for mut state in self.vcpu_states.drain(..) {
|
||
state.join_thread()?;
|
||
}
|
||
|
||
Ok(())
|
||
}
|
||
|
||
#[cfg(feature = "tdx")]
|
||
pub fn initialize_tdx(&self, hob_address: u64) -> Result<()> {
|
||
for vcpu in &self.vcpus {
|
||
vcpu.lock()
|
||
.unwrap()
|
||
.vcpu
|
||
.tdx_init(hob_address)
|
||
.map_err(Error::InitializeTdx)?;
|
||
}
|
||
Ok(())
|
||
}
|
||
|
||
pub fn boot_vcpus(&self) -> u8 {
|
||
self.config.boot_vcpus
|
||
}
|
||
|
||
pub fn max_vcpus(&self) -> u8 {
|
||
self.config.max_vcpus
|
||
}
|
||
|
||
#[cfg(target_arch = "x86_64")]
|
||
pub fn common_cpuid(&self) -> CpuId {
|
||
self.cpuid.clone()
|
||
}
|
||
|
||
fn present_vcpus(&self) -> u8 {
|
||
self.vcpu_states
|
||
.iter()
|
||
.fold(0, |acc, state| acc + state.active() as u8)
|
||
}
|
||
|
||
#[cfg(target_arch = "aarch64")]
|
||
pub fn get_mpidrs(&self) -> Vec<u64> {
|
||
self.vcpus
|
||
.iter()
|
||
.map(|cpu| cpu.lock().unwrap().get_mpidr())
|
||
.collect()
|
||
}
|
||
|
||
#[cfg(target_arch = "aarch64")]
|
||
pub fn get_saved_states(&self) -> Vec<CpuState> {
|
||
self.vcpus
|
||
.iter()
|
||
.map(|cpu| cpu.lock().unwrap().get_saved_state().unwrap())
|
||
.collect()
|
||
}
|
||
|
||
#[cfg(target_arch = "aarch64")]
|
||
pub fn get_vcpu_topology(&self) -> Option<(u8, u8, u8)> {
|
||
self.config
|
||
.topology
|
||
.clone()
|
||
.map(|t| (t.threads_per_core, t.cores_per_die, t.packages))
|
||
}
|
||
|
||
#[cfg(feature = "acpi")]
|
||
pub fn create_madt(&self) -> Sdt {
|
||
use crate::acpi;
|
||
// This is also checked in the commandline parsing.
|
||
assert!(self.config.boot_vcpus <= self.config.max_vcpus);
|
||
|
||
let mut madt = Sdt::new(*b"APIC", 44, 5, *b"CLOUDH", *b"CHMADT ", 1);
|
||
#[cfg(target_arch = "x86_64")]
|
||
{
|
||
madt.write(36, arch::layout::APIC_START);
|
||
|
||
for cpu in 0..self.config.max_vcpus {
|
||
let lapic = LocalApic {
|
||
r#type: acpi::ACPI_APIC_PROCESSOR,
|
||
length: 8,
|
||
processor_id: cpu,
|
||
apic_id: cpu,
|
||
flags: if cpu < self.config.boot_vcpus {
|
||
1 << MADT_CPU_ENABLE_FLAG
|
||
} else {
|
||
0
|
||
},
|
||
};
|
||
madt.append(lapic);
|
||
}
|
||
|
||
madt.append(Ioapic {
|
||
r#type: acpi::ACPI_APIC_IO,
|
||
length: 12,
|
||
ioapic_id: 0,
|
||
apic_address: arch::layout::IOAPIC_START.0 as u32,
|
||
gsi_base: 0,
|
||
..Default::default()
|
||
});
|
||
|
||
madt.append(InterruptSourceOverride {
|
||
r#type: acpi::ACPI_APIC_XRUPT_OVERRIDE,
|
||
length: 10,
|
||
bus: 0,
|
||
source: 4,
|
||
gsi: 4,
|
||
flags: 0,
|
||
});
|
||
}
|
||
|
||
#[cfg(target_arch = "aarch64")]
|
||
{
|
||
/* Notes:
|
||
* Ignore Local Interrupt Controller Address at byte offset 36 of MADT table.
|
||
*/
|
||
|
||
// See section 5.2.12.14 GIC CPU Interface (GICC) Structure in ACPI spec.
|
||
for cpu in 0..self.config.boot_vcpus {
|
||
let vcpu = &self.vcpus[cpu as usize];
|
||
let mpidr = vcpu.lock().unwrap().get_mpidr();
|
||
/* ARMv8 MPIDR format:
|
||
Bits [63:40] Must be zero
|
||
Bits [39:32] Aff3 : Match Aff3 of target processor MPIDR
|
||
Bits [31:24] Must be zero
|
||
Bits [23:16] Aff2 : Match Aff2 of target processor MPIDR
|
||
Bits [15:8] Aff1 : Match Aff1 of target processor MPIDR
|
||
Bits [7:0] Aff0 : Match Aff0 of target processor MPIDR
|
||
*/
|
||
let mpidr_mask = 0xff_00ff_ffff;
|
||
let gicc = GicC {
|
||
r#type: acpi::ACPI_APIC_GENERIC_CPU_INTERFACE,
|
||
length: 80,
|
||
reserved0: 0,
|
||
cpu_interface_number: cpu as u32,
|
||
uid: cpu as u32,
|
||
flags: 1,
|
||
parking_version: 0,
|
||
performance_interrupt: 0,
|
||
parked_address: 0,
|
||
base_address: 0,
|
||
gicv_base_address: 0,
|
||
gich_base_address: 0,
|
||
vgic_interrupt: 0,
|
||
gicr_base_address: 0,
|
||
mpidr: mpidr & mpidr_mask,
|
||
proc_power_effi_class: 0,
|
||
reserved1: 0,
|
||
spe_overflow_interrupt: 0,
|
||
};
|
||
|
||
madt.append(gicc);
|
||
}
|
||
|
||
// GIC Distributor structure. See section 5.2.12.15 in ACPI spec.
|
||
let gicd = GicD {
|
||
r#type: acpi::ACPI_APIC_GENERIC_DISTRIBUTOR,
|
||
length: 24,
|
||
reserved0: 0,
|
||
gic_id: 0,
|
||
base_address: arch::layout::MAPPED_IO_START - 0x0001_0000,
|
||
global_irq_base: 0,
|
||
version: 3,
|
||
reserved1: [0; 3],
|
||
};
|
||
madt.append(gicd);
|
||
|
||
// See 5.2.12.17 GIC Redistributor (GICR) Structure in ACPI spec.
|
||
let gicr_size: u32 = 0x0001_0000 * 2 * (self.config.boot_vcpus as u32);
|
||
let gicr_base: u64 = arch::layout::MAPPED_IO_START - 0x0001_0000 - gicr_size as u64;
|
||
let gicr = GicR {
|
||
r#type: acpi::ACPI_APIC_GENERIC_REDISTRIBUTOR,
|
||
length: 16,
|
||
reserved: 0,
|
||
base_address: gicr_base,
|
||
range_length: gicr_size,
|
||
};
|
||
madt.append(gicr);
|
||
|
||
// See 5.2.12.18 GIC Interrupt Translation Service (ITS) Structure in ACPI spec.
|
||
let gicits = GicIts {
|
||
r#type: acpi::ACPI_APIC_GENERIC_TRANSLATOR,
|
||
length: 20,
|
||
reserved0: 0,
|
||
translation_id: 0,
|
||
base_address: gicr_base - 2 * 0x0001_0000,
|
||
reserved1: 0,
|
||
};
|
||
madt.append(gicits);
|
||
|
||
madt.update_checksum();
|
||
}
|
||
|
||
madt
|
||
}
|
||
|
||
#[cfg(all(target_arch = "aarch64", feature = "acpi"))]
|
||
pub fn create_pptt(&self) -> Sdt {
|
||
let pptt_start = 0;
|
||
let mut cpus = 0;
|
||
let mut uid = 0;
|
||
let threads_per_core = self.get_vcpu_topology().unwrap_or_default().0 as u8;
|
||
let cores_per_package = self.get_vcpu_topology().unwrap_or_default().1 as u8;
|
||
let packages = self.get_vcpu_topology().unwrap_or_default().2 as u8;
|
||
|
||
let mut pptt = Sdt::new(*b"PPTT", 36, 2, *b"CLOUDH", *b"CHPPTT ", 1);
|
||
|
||
for cluster_idx in 0..packages {
|
||
if cpus < self.config.boot_vcpus as usize {
|
||
let cluster_offset = pptt.len() - pptt_start;
|
||
let cluster_hierarchy_node = ProcessorHierarchyNode {
|
||
r#type: 0,
|
||
length: 20,
|
||
reserved: 0,
|
||
flags: 0x2,
|
||
parent: 0,
|
||
acpi_processor_id: cluster_idx as u32,
|
||
num_private_resources: 0,
|
||
};
|
||
pptt.append(cluster_hierarchy_node);
|
||
|
||
for core_idx in 0..cores_per_package {
|
||
let core_offset = pptt.len() - pptt_start;
|
||
|
||
if threads_per_core > 1 {
|
||
let core_hierarchy_node = ProcessorHierarchyNode {
|
||
r#type: 0,
|
||
length: 20,
|
||
reserved: 0,
|
||
flags: 0x2,
|
||
parent: cluster_offset as u32,
|
||
acpi_processor_id: core_idx as u32,
|
||
num_private_resources: 0,
|
||
};
|
||
pptt.append(core_hierarchy_node);
|
||
|
||
for _thread_idx in 0..threads_per_core {
|
||
let thread_hierarchy_node = ProcessorHierarchyNode {
|
||
r#type: 0,
|
||
length: 20,
|
||
reserved: 0,
|
||
flags: 0xE,
|
||
parent: core_offset as u32,
|
||
acpi_processor_id: uid as u32,
|
||
num_private_resources: 0,
|
||
};
|
||
pptt.append(thread_hierarchy_node);
|
||
uid += 1;
|
||
}
|
||
} else {
|
||
let thread_hierarchy_node = ProcessorHierarchyNode {
|
||
r#type: 0,
|
||
length: 20,
|
||
reserved: 0,
|
||
flags: 0xA,
|
||
parent: cluster_offset as u32,
|
||
acpi_processor_id: uid as u32,
|
||
num_private_resources: 0,
|
||
};
|
||
pptt.append(thread_hierarchy_node);
|
||
uid += 1;
|
||
}
|
||
}
|
||
cpus += (cores_per_package * threads_per_core) as usize;
|
||
}
|
||
}
|
||
|
||
pptt.update_checksum();
|
||
pptt
|
||
}
|
||
}
|
||
|
||
#[cfg(feature = "acpi")]
|
||
struct Cpu {
|
||
cpu_id: u8,
|
||
proximity_domain: u32,
|
||
}
|
||
|
||
#[cfg(all(target_arch = "x86_64", feature = "acpi"))]
|
||
const MADT_CPU_ENABLE_FLAG: usize = 0;
|
||
|
||
#[cfg(feature = "acpi")]
|
||
impl Cpu {
|
||
#[cfg(target_arch = "x86_64")]
|
||
fn generate_mat(&self) -> Vec<u8> {
|
||
let lapic = LocalApic {
|
||
r#type: 0,
|
||
length: 8,
|
||
processor_id: self.cpu_id,
|
||
apic_id: self.cpu_id,
|
||
flags: 1 << MADT_CPU_ENABLE_FLAG,
|
||
};
|
||
|
||
let mut mat_data: Vec<u8> = Vec::new();
|
||
mat_data.resize(std::mem::size_of_val(&lapic), 0);
|
||
unsafe { *(mat_data.as_mut_ptr() as *mut LocalApic) = lapic };
|
||
|
||
mat_data
|
||
}
|
||
}
|
||
|
||
#[cfg(feature = "acpi")]
|
||
impl Aml for Cpu {
|
||
fn append_aml_bytes(&self, bytes: &mut Vec<u8>) {
|
||
#[cfg(target_arch = "x86_64")]
|
||
let mat_data: Vec<u8> = self.generate_mat();
|
||
|
||
aml::Device::new(
|
||
format!("C{:03}", self.cpu_id).as_str().into(),
|
||
vec![
|
||
&aml::Name::new("_HID".into(), &"ACPI0007"),
|
||
&aml::Name::new("_UID".into(), &self.cpu_id),
|
||
// Currently, AArch64 cannot support following fields.
|
||
/*
|
||
_STA return value:
|
||
Bit [0] – Set if the device is present.
|
||
Bit [1] – Set if the device is enabled and decoding its resources.
|
||
Bit [2] – Set if the device should be shown in the UI.
|
||
Bit [3] – Set if the device is functioning properly (cleared if device failed its diagnostics).
|
||
Bit [4] – Set if the battery is present.
|
||
Bits [31:5] – Reserved (must be cleared).
|
||
*/
|
||
#[cfg(target_arch = "x86_64")]
|
||
&aml::Method::new(
|
||
"_STA".into(),
|
||
0,
|
||
false,
|
||
// Call into CSTA method which will interrogate device
|
||
vec![&aml::Return::new(&aml::MethodCall::new(
|
||
"CSTA".into(),
|
||
vec![&self.cpu_id],
|
||
))],
|
||
),
|
||
&aml::Method::new(
|
||
"_PXM".into(),
|
||
0,
|
||
false,
|
||
vec![&aml::Return::new(&self.proximity_domain)],
|
||
),
|
||
// The Linux kernel expects every CPU device to have a _MAT entry
|
||
// containing the LAPIC for this processor with the enabled bit set
|
||
// even it if is disabled in the MADT (non-boot CPU)
|
||
#[cfg(target_arch = "x86_64")]
|
||
&aml::Name::new("_MAT".into(), &aml::Buffer::new(mat_data)),
|
||
// Trigger CPU ejection
|
||
#[cfg(target_arch = "x86_64")]
|
||
&aml::Method::new(
|
||
"_EJ0".into(),
|
||
1,
|
||
false,
|
||
// Call into CEJ0 method which will actually eject device
|
||
vec![&aml::MethodCall::new("CEJ0".into(), vec![&self.cpu_id])],
|
||
),
|
||
],
|
||
)
|
||
.append_aml_bytes(bytes)
|
||
}
|
||
}
|
||
|
||
#[cfg(feature = "acpi")]
|
||
struct CpuNotify {
|
||
cpu_id: u8,
|
||
}
|
||
|
||
#[cfg(feature = "acpi")]
|
||
impl Aml for CpuNotify {
|
||
fn append_aml_bytes(&self, bytes: &mut Vec<u8>) {
|
||
let object = aml::Path::new(&format!("C{:03}", self.cpu_id));
|
||
aml::If::new(
|
||
&aml::Equal::new(&aml::Arg(0), &self.cpu_id),
|
||
vec![&aml::Notify::new(&object, &aml::Arg(1))],
|
||
)
|
||
.append_aml_bytes(bytes)
|
||
}
|
||
}
|
||
|
||
#[cfg(feature = "acpi")]
|
||
struct CpuMethods {
|
||
max_vcpus: u8,
|
||
}
|
||
|
||
#[cfg(feature = "acpi")]
|
||
impl Aml for CpuMethods {
|
||
fn append_aml_bytes(&self, bytes: &mut Vec<u8>) {
|
||
// CPU status method
|
||
aml::Method::new(
|
||
"CSTA".into(),
|
||
1,
|
||
true,
|
||
vec![
|
||
// Take lock defined above
|
||
&aml::Acquire::new("\\_SB_.PRES.CPLK".into(), 0xffff),
|
||
// Write CPU number (in first argument) to I/O port via field
|
||
&aml::Store::new(&aml::Path::new("\\_SB_.PRES.CSEL"), &aml::Arg(0)),
|
||
&aml::Store::new(&aml::Local(0), &aml::ZERO),
|
||
// Check if CPEN bit is set, if so make the local variable 0xf (see _STA for details of meaning)
|
||
&aml::If::new(
|
||
&aml::Equal::new(&aml::Path::new("\\_SB_.PRES.CPEN"), &aml::ONE),
|
||
vec![&aml::Store::new(&aml::Local(0), &0xfu8)],
|
||
),
|
||
// Release lock
|
||
&aml::Release::new("\\_SB_.PRES.CPLK".into()),
|
||
// Return 0 or 0xf
|
||
&aml::Return::new(&aml::Local(0)),
|
||
],
|
||
)
|
||
.append_aml_bytes(bytes);
|
||
|
||
let mut cpu_notifies = Vec::new();
|
||
for cpu_id in 0..self.max_vcpus {
|
||
cpu_notifies.push(CpuNotify { cpu_id });
|
||
}
|
||
|
||
let mut cpu_notifies_refs: Vec<&dyn aml::Aml> = Vec::new();
|
||
for cpu_id in 0..self.max_vcpus {
|
||
cpu_notifies_refs.push(&cpu_notifies[usize::from(cpu_id)]);
|
||
}
|
||
|
||
aml::Method::new("CTFY".into(), 2, true, cpu_notifies_refs).append_aml_bytes(bytes);
|
||
|
||
aml::Method::new(
|
||
"CEJ0".into(),
|
||
1,
|
||
true,
|
||
vec![
|
||
&aml::Acquire::new("\\_SB_.PRES.CPLK".into(), 0xffff),
|
||
// Write CPU number (in first argument) to I/O port via field
|
||
&aml::Store::new(&aml::Path::new("\\_SB_.PRES.CSEL"), &aml::Arg(0)),
|
||
// Set CEJ0 bit
|
||
&aml::Store::new(&aml::Path::new("\\_SB_.PRES.CEJ0"), &aml::ONE),
|
||
&aml::Release::new("\\_SB_.PRES.CPLK".into()),
|
||
],
|
||
)
|
||
.append_aml_bytes(bytes);
|
||
|
||
aml::Method::new(
|
||
"CSCN".into(),
|
||
0,
|
||
true,
|
||
vec![
|
||
// Take lock defined above
|
||
&aml::Acquire::new("\\_SB_.PRES.CPLK".into(), 0xffff),
|
||
&aml::Store::new(&aml::Local(0), &aml::ZERO),
|
||
&aml::While::new(
|
||
&aml::LessThan::new(&aml::Local(0), &self.max_vcpus),
|
||
vec![
|
||
// Write CPU number (in first argument) to I/O port via field
|
||
&aml::Store::new(&aml::Path::new("\\_SB_.PRES.CSEL"), &aml::Local(0)),
|
||
// Check if CINS bit is set
|
||
&aml::If::new(
|
||
&aml::Equal::new(&aml::Path::new("\\_SB_.PRES.CINS"), &aml::ONE),
|
||
// Notify device if it is
|
||
vec![
|
||
&aml::MethodCall::new(
|
||
"CTFY".into(),
|
||
vec![&aml::Local(0), &aml::ONE],
|
||
),
|
||
// Reset CINS bit
|
||
&aml::Store::new(&aml::Path::new("\\_SB_.PRES.CINS"), &aml::ONE),
|
||
],
|
||
),
|
||
// Check if CRMV bit is set
|
||
&aml::If::new(
|
||
&aml::Equal::new(&aml::Path::new("\\_SB_.PRES.CRMV"), &aml::ONE),
|
||
// Notify device if it is (with the eject constant 0x3)
|
||
vec![
|
||
&aml::MethodCall::new("CTFY".into(), vec![&aml::Local(0), &3u8]),
|
||
// Reset CRMV bit
|
||
&aml::Store::new(&aml::Path::new("\\_SB_.PRES.CRMV"), &aml::ONE),
|
||
],
|
||
),
|
||
&aml::Add::new(&aml::Local(0), &aml::Local(0), &aml::ONE),
|
||
],
|
||
),
|
||
// Release lock
|
||
&aml::Release::new("\\_SB_.PRES.CPLK".into()),
|
||
],
|
||
)
|
||
.append_aml_bytes(bytes)
|
||
}
|
||
}
|
||
|
||
#[cfg(feature = "acpi")]
|
||
impl Aml for CpuManager {
|
||
fn append_aml_bytes(&self, bytes: &mut Vec<u8>) {
|
||
// CPU hotplug controller
|
||
#[cfg(target_arch = "x86_64")]
|
||
aml::Device::new(
|
||
"_SB_.PRES".into(),
|
||
vec![
|
||
&aml::Name::new("_HID".into(), &aml::EisaName::new("PNP0A06")),
|
||
&aml::Name::new("_UID".into(), &"CPU Hotplug Controller"),
|
||
// Mutex to protect concurrent access as we write to choose CPU and then read back status
|
||
&aml::Mutex::new("CPLK".into(), 0),
|
||
&aml::Name::new(
|
||
"_CRS".into(),
|
||
&aml::ResourceTemplate::new(vec![&aml::AddressSpace::new_memory(
|
||
aml::AddressSpaceCachable::NotCacheable,
|
||
true,
|
||
self.acpi_address.0 as u64,
|
||
self.acpi_address.0 + CPU_MANAGER_ACPI_SIZE as u64 - 1,
|
||
)]),
|
||
),
|
||
// OpRegion and Fields map MMIO range into individual field values
|
||
&aml::OpRegion::new(
|
||
"PRST".into(),
|
||
aml::OpRegionSpace::SystemMemory,
|
||
self.acpi_address.0 as usize,
|
||
CPU_MANAGER_ACPI_SIZE,
|
||
),
|
||
&aml::Field::new(
|
||
"PRST".into(),
|
||
aml::FieldAccessType::Byte,
|
||
aml::FieldUpdateRule::WriteAsZeroes,
|
||
vec![
|
||
aml::FieldEntry::Reserved(32),
|
||
aml::FieldEntry::Named(*b"CPEN", 1),
|
||
aml::FieldEntry::Named(*b"CINS", 1),
|
||
aml::FieldEntry::Named(*b"CRMV", 1),
|
||
aml::FieldEntry::Named(*b"CEJ0", 1),
|
||
aml::FieldEntry::Reserved(4),
|
||
aml::FieldEntry::Named(*b"CCMD", 8),
|
||
],
|
||
),
|
||
&aml::Field::new(
|
||
"PRST".into(),
|
||
aml::FieldAccessType::DWord,
|
||
aml::FieldUpdateRule::Preserve,
|
||
vec![
|
||
aml::FieldEntry::Named(*b"CSEL", 32),
|
||
aml::FieldEntry::Reserved(32),
|
||
aml::FieldEntry::Named(*b"CDAT", 32),
|
||
],
|
||
),
|
||
],
|
||
)
|
||
.append_aml_bytes(bytes);
|
||
|
||
// CPU devices
|
||
let hid = aml::Name::new("_HID".into(), &"ACPI0010");
|
||
let uid = aml::Name::new("_CID".into(), &aml::EisaName::new("PNP0A05"));
|
||
// Bundle methods together under a common object
|
||
let methods = CpuMethods {
|
||
max_vcpus: self.config.max_vcpus,
|
||
};
|
||
let mut cpu_data_inner: Vec<&dyn aml::Aml> = vec![&hid, &uid, &methods];
|
||
|
||
let mut cpu_devices = Vec::new();
|
||
for cpu_id in 0..self.config.max_vcpus {
|
||
let proximity_domain = *self.proximity_domain_per_cpu.get(&cpu_id).unwrap_or(&0);
|
||
let cpu_device = Cpu {
|
||
cpu_id,
|
||
proximity_domain,
|
||
};
|
||
|
||
cpu_devices.push(cpu_device);
|
||
}
|
||
|
||
for cpu_device in cpu_devices.iter() {
|
||
cpu_data_inner.push(cpu_device);
|
||
}
|
||
|
||
aml::Device::new("_SB_.CPUS".into(), cpu_data_inner).append_aml_bytes(bytes)
|
||
}
|
||
}
|
||
|
||
impl Pausable for CpuManager {
|
||
fn pause(&mut self) -> std::result::Result<(), MigratableError> {
|
||
// Tell the vCPUs to pause themselves next time they exit
|
||
self.vcpus_pause_signalled.store(true, Ordering::SeqCst);
|
||
|
||
// Signal to the spawned threads (vCPUs and console signal handler). For the vCPU threads
|
||
// this will interrupt the KVM_RUN ioctl() allowing the loop to check the boolean set
|
||
// above.
|
||
for state in self.vcpu_states.iter() {
|
||
state.signal_thread();
|
||
}
|
||
|
||
for vcpu in self.vcpus.iter() {
|
||
let mut vcpu = vcpu.lock().unwrap();
|
||
vcpu.pause()?;
|
||
#[cfg(all(feature = "kvm", target_arch = "x86_64"))]
|
||
if !self.config.kvm_hyperv {
|
||
vcpu.vcpu.notify_guest_clock_paused().map_err(|e| {
|
||
MigratableError::Pause(anyhow!(
|
||
"Could not notify guest it has been paused {:?}",
|
||
e
|
||
))
|
||
})?;
|
||
}
|
||
}
|
||
|
||
Ok(())
|
||
}
|
||
|
||
fn resume(&mut self) -> std::result::Result<(), MigratableError> {
|
||
for vcpu in self.vcpus.iter() {
|
||
vcpu.lock().unwrap().resume()?;
|
||
}
|
||
|
||
// Toggle the vCPUs pause boolean
|
||
self.vcpus_pause_signalled.store(false, Ordering::SeqCst);
|
||
|
||
// Unpark all the VCPU threads.
|
||
// Once unparked, the next thing they will do is checking for the pause
|
||
// boolean. Since it'll be set to false, they will exit their pause loop
|
||
// and go back to vmx root.
|
||
for state in self.vcpu_states.iter() {
|
||
state.unpark_thread();
|
||
}
|
||
Ok(())
|
||
}
|
||
}
|
||
|
||
impl Snapshottable for CpuManager {
|
||
fn id(&self) -> String {
|
||
CPU_MANAGER_SNAPSHOT_ID.to_string()
|
||
}
|
||
|
||
fn snapshot(&mut self) -> std::result::Result<Snapshot, MigratableError> {
|
||
let mut cpu_manager_snapshot = Snapshot::new(CPU_MANAGER_SNAPSHOT_ID);
|
||
|
||
// The CpuManager snapshot is a collection of all vCPUs snapshots.
|
||
for vcpu in &self.vcpus {
|
||
let cpu_snapshot = vcpu.lock().unwrap().snapshot()?;
|
||
cpu_manager_snapshot.add_snapshot(cpu_snapshot);
|
||
}
|
||
|
||
Ok(cpu_manager_snapshot)
|
||
}
|
||
|
||
fn restore(&mut self, snapshot: Snapshot) -> std::result::Result<(), MigratableError> {
|
||
for (cpu_id, snapshot) in snapshot.snapshots.iter() {
|
||
info!("Restoring VCPU {}", cpu_id);
|
||
self.create_vcpu(cpu_id.parse::<u8>().unwrap(), None, Some(*snapshot.clone()))
|
||
.map_err(|e| MigratableError::Restore(anyhow!("Could not create vCPU {:?}", e)))?;
|
||
}
|
||
|
||
Ok(())
|
||
}
|
||
}
|
||
|
||
impl Transportable for CpuManager {}
|
||
impl Migratable for CpuManager {}
|
||
|
||
#[cfg(all(feature = "kvm", target_arch = "x86_64"))]
|
||
#[cfg(test)]
|
||
mod tests {
|
||
use arch::x86_64::interrupts::*;
|
||
use arch::x86_64::regs::*;
|
||
use hypervisor::x86_64::{FpuState, LapicState, StandardRegisters};
|
||
|
||
#[test]
|
||
fn test_setlint() {
|
||
let hv = hypervisor::new().unwrap();
|
||
let vm = hv.create_vm().expect("new VM fd creation failed");
|
||
assert!(hv.check_required_extensions().is_ok());
|
||
// Calling get_lapic will fail if there is no irqchip before hand.
|
||
assert!(vm.create_irq_chip().is_ok());
|
||
let vcpu = vm.create_vcpu(0, None).unwrap();
|
||
let klapic_before: LapicState = vcpu.get_lapic().unwrap();
|
||
|
||
// Compute the value that is expected to represent LVT0 and LVT1.
|
||
let lint0 = get_klapic_reg(&klapic_before, APIC_LVT0);
|
||
let lint1 = get_klapic_reg(&klapic_before, APIC_LVT1);
|
||
let lint0_mode_expected = set_apic_delivery_mode(lint0, APIC_MODE_EXTINT);
|
||
let lint1_mode_expected = set_apic_delivery_mode(lint1, APIC_MODE_NMI);
|
||
|
||
set_lint(&vcpu).unwrap();
|
||
|
||
// Compute the value that represents LVT0 and LVT1 after set_lint.
|
||
let klapic_actual: LapicState = vcpu.get_lapic().unwrap();
|
||
let lint0_mode_actual = get_klapic_reg(&klapic_actual, APIC_LVT0);
|
||
let lint1_mode_actual = get_klapic_reg(&klapic_actual, APIC_LVT1);
|
||
assert_eq!(lint0_mode_expected, lint0_mode_actual);
|
||
assert_eq!(lint1_mode_expected, lint1_mode_actual);
|
||
}
|
||
|
||
#[test]
|
||
fn test_setup_fpu() {
|
||
let hv = hypervisor::new().unwrap();
|
||
let vm = hv.create_vm().expect("new VM fd creation failed");
|
||
let vcpu = vm.create_vcpu(0, None).unwrap();
|
||
setup_fpu(&vcpu).unwrap();
|
||
|
||
let expected_fpu: FpuState = FpuState {
|
||
fcw: 0x37f,
|
||
mxcsr: 0x1f80,
|
||
..Default::default()
|
||
};
|
||
let actual_fpu: FpuState = vcpu.get_fpu().unwrap();
|
||
// TODO: auto-generate kvm related structures with PartialEq on.
|
||
assert_eq!(expected_fpu.fcw, actual_fpu.fcw);
|
||
// Setting the mxcsr register from FpuState inside setup_fpu does not influence anything.
|
||
// See 'kvm_arch_vcpu_ioctl_set_fpu' from arch/x86/kvm/x86.c.
|
||
// The mxcsr will stay 0 and the assert below fails. Decide whether or not we should
|
||
// remove it at all.
|
||
// assert!(expected_fpu.mxcsr == actual_fpu.mxcsr);
|
||
}
|
||
|
||
#[test]
|
||
fn test_setup_msrs() {
|
||
use hypervisor::arch::x86::msr_index;
|
||
use hypervisor::x86_64::{MsrEntries, MsrEntry};
|
||
|
||
let hv = hypervisor::new().unwrap();
|
||
let vm = hv.create_vm().expect("new VM fd creation failed");
|
||
let vcpu = vm.create_vcpu(0, None).unwrap();
|
||
setup_msrs(&vcpu).unwrap();
|
||
|
||
// This test will check against the last MSR entry configured (the tenth one).
|
||
// See create_msr_entries for details.
|
||
let mut msrs = MsrEntries::from_entries(&[MsrEntry {
|
||
index: msr_index::MSR_IA32_MISC_ENABLE,
|
||
..Default::default()
|
||
}])
|
||
.unwrap();
|
||
|
||
// get_msrs returns the number of msrs that it succeed in reading. We only want to read 1
|
||
// in this test case scenario.
|
||
let read_msrs = vcpu.get_msrs(&mut msrs).unwrap();
|
||
assert_eq!(read_msrs, 1);
|
||
|
||
// Official entries that were setup when we did setup_msrs. We need to assert that the
|
||
// tenth one (i.e the one with index msr_index::MSR_IA32_MISC_ENABLE has the data we
|
||
// expect.
|
||
let entry_vec = hypervisor::x86_64::boot_msr_entries();
|
||
assert_eq!(entry_vec.as_slice()[9], msrs.as_slice()[0]);
|
||
}
|
||
|
||
#[test]
|
||
fn test_setup_regs() {
|
||
let hv = hypervisor::new().unwrap();
|
||
let vm = hv.create_vm().expect("new VM fd creation failed");
|
||
let vcpu = vm.create_vcpu(0, None).unwrap();
|
||
|
||
let expected_regs: StandardRegisters = StandardRegisters {
|
||
rflags: 0x0000000000000002u64,
|
||
rbx: arch::layout::PVH_INFO_START.0,
|
||
rip: 1,
|
||
..Default::default()
|
||
};
|
||
|
||
setup_regs(&vcpu, expected_regs.rip).unwrap();
|
||
|
||
let actual_regs: StandardRegisters = vcpu.get_regs().unwrap();
|
||
assert_eq!(actual_regs, expected_regs);
|
||
}
|
||
}
|
||
|
||
#[cfg(target_arch = "aarch64")]
|
||
#[cfg(test)]
|
||
mod tests {
|
||
use crate::GuestMemoryMmap;
|
||
use arch::aarch64::layout;
|
||
use arch::aarch64::regs::*;
|
||
use hypervisor::kvm::aarch64::{is_system_register, MPIDR_EL1};
|
||
use hypervisor::kvm::kvm_bindings::{
|
||
kvm_one_reg, kvm_regs, kvm_vcpu_init, user_pt_regs, KVM_REG_ARM64, KVM_REG_ARM64_SYSREG,
|
||
KVM_REG_ARM_CORE, KVM_REG_SIZE_U64,
|
||
};
|
||
use hypervisor::{arm64_core_reg_id, offset__of};
|
||
use std::mem;
|
||
use vm_memory::GuestAddress;
|
||
|
||
#[test]
|
||
fn test_setup_regs() {
|
||
let hv = hypervisor::new().unwrap();
|
||
let vm = hv.create_vm().unwrap();
|
||
let vcpu = vm.create_vcpu(0, None).unwrap();
|
||
let regions = vec![(
|
||
GuestAddress(layout::RAM_64BIT_START),
|
||
(layout::FDT_MAX_SIZE + 0x1000) as usize,
|
||
)];
|
||
let mem = GuestMemoryMmap::from_ranges(®ions).expect("Cannot initialize memory");
|
||
|
||
let res = setup_regs(&vcpu, 0, 0x0, &mem);
|
||
// Must fail when vcpu is not initialized yet.
|
||
assert!(res.is_err());
|
||
|
||
let mut kvi: kvm_vcpu_init = kvm_vcpu_init::default();
|
||
vm.get_preferred_target(&mut kvi).unwrap();
|
||
vcpu.vcpu_init(&kvi).unwrap();
|
||
|
||
assert!(setup_regs(&vcpu, 0, 0x0, &mem).is_ok());
|
||
}
|
||
|
||
#[test]
|
||
fn test_read_mpidr() {
|
||
let hv = hypervisor::new().unwrap();
|
||
let vm = hv.create_vm().unwrap();
|
||
let vcpu = vm.create_vcpu(0, None).unwrap();
|
||
let mut kvi: kvm_vcpu_init = kvm_vcpu_init::default();
|
||
vm.get_preferred_target(&mut kvi).unwrap();
|
||
|
||
// Must fail when vcpu is not initialized yet.
|
||
assert!(vcpu.read_mpidr().is_err());
|
||
|
||
vcpu.vcpu_init(&kvi).unwrap();
|
||
assert_eq!(vcpu.read_mpidr().unwrap(), 0x80000000);
|
||
}
|
||
|
||
#[test]
|
||
fn test_is_system_register() {
|
||
let offset = offset__of!(user_pt_regs, pc);
|
||
let regid = arm64_core_reg_id!(KVM_REG_SIZE_U64, offset);
|
||
assert!(!is_system_register(regid));
|
||
let regid = KVM_REG_ARM64 as u64 | KVM_REG_SIZE_U64 as u64 | KVM_REG_ARM64_SYSREG as u64;
|
||
assert!(is_system_register(regid));
|
||
}
|
||
|
||
#[test]
|
||
fn test_save_restore_core_regs() {
|
||
let hv = hypervisor::new().unwrap();
|
||
let vm = hv.create_vm().unwrap();
|
||
let vcpu = vm.create_vcpu(0, None).unwrap();
|
||
let mut kvi: kvm_vcpu_init = kvm_vcpu_init::default();
|
||
vm.get_preferred_target(&mut kvi).unwrap();
|
||
|
||
// Must fail when vcpu is not initialized yet.
|
||
let mut state = kvm_regs::default();
|
||
let res = vcpu.core_registers(&mut state);
|
||
assert!(res.is_err());
|
||
assert_eq!(
|
||
format!("{}", res.unwrap_err()),
|
||
"Failed to get core register: Exec format error (os error 8)"
|
||
);
|
||
|
||
let res = vcpu.set_core_registers(&state);
|
||
assert!(res.is_err());
|
||
assert_eq!(
|
||
format!("{}", res.unwrap_err()),
|
||
"Failed to set core register: Exec format error (os error 8)"
|
||
);
|
||
|
||
vcpu.vcpu_init(&kvi).unwrap();
|
||
assert!(vcpu.core_registers(&mut state).is_ok());
|
||
assert_eq!(state.regs.pstate, 0x3C5);
|
||
|
||
assert!(vcpu.set_core_registers(&state).is_ok());
|
||
let off = offset__of!(user_pt_regs, pstate);
|
||
let pstate = vcpu
|
||
.get_reg(arm64_core_reg_id!(KVM_REG_SIZE_U64, off))
|
||
.expect("Failed to call kvm get one reg");
|
||
assert_eq!(state.regs.pstate, pstate);
|
||
}
|
||
|
||
#[test]
|
||
fn test_save_restore_system_regs() {
|
||
let hv = hypervisor::new().unwrap();
|
||
let vm = hv.create_vm().unwrap();
|
||
let vcpu = vm.create_vcpu(0, None).unwrap();
|
||
let mut kvi: kvm_vcpu_init = kvm_vcpu_init::default();
|
||
vm.get_preferred_target(&mut kvi).unwrap();
|
||
|
||
// Must fail when vcpu is not initialized yet.
|
||
let mut state: Vec<kvm_one_reg> = Vec::new();
|
||
let res = vcpu.system_registers(&mut state);
|
||
assert!(res.is_err());
|
||
assert_eq!(
|
||
format!("{}", res.unwrap_err()),
|
||
"Failed to retrieve list of registers: Exec format error (os error 8)"
|
||
);
|
||
|
||
state.push(kvm_one_reg {
|
||
id: MPIDR_EL1,
|
||
addr: 0x00,
|
||
});
|
||
let res = vcpu.set_system_registers(&state);
|
||
assert!(res.is_err());
|
||
assert_eq!(
|
||
format!("{}", res.unwrap_err()),
|
||
"Failed to set system register: Exec format error (os error 8)"
|
||
);
|
||
|
||
vcpu.vcpu_init(&kvi).unwrap();
|
||
assert!(vcpu.system_registers(&mut state).is_ok());
|
||
let initial_mpidr: u64 = vcpu.read_mpidr().expect("Fail to read mpidr");
|
||
assert!(state.contains(&kvm_one_reg {
|
||
id: MPIDR_EL1,
|
||
addr: initial_mpidr
|
||
}));
|
||
|
||
assert!(vcpu.set_system_registers(&state).is_ok());
|
||
let mpidr: u64 = vcpu.read_mpidr().expect("Fail to read mpidr");
|
||
assert_eq!(initial_mpidr, mpidr);
|
||
}
|
||
|
||
#[test]
|
||
fn test_get_set_mpstate() {
|
||
let hv = hypervisor::new().unwrap();
|
||
let vm = hv.create_vm().unwrap();
|
||
let vcpu = vm.create_vcpu(0, None).unwrap();
|
||
let mut kvi: kvm_vcpu_init = kvm_vcpu_init::default();
|
||
vm.get_preferred_target(&mut kvi).unwrap();
|
||
|
||
let res = vcpu.get_mp_state();
|
||
assert!(res.is_ok());
|
||
assert!(vcpu.set_mp_state(res.unwrap()).is_ok());
|
||
}
|
||
}
|