seoul: support to run VM outside VMM's PD

Issue #949

Related to issue #808 - one way to nearly double the maximum VM size for
VMs on 32bit Genode/Nova host if decreased performance is acceptable.
This commit is contained in:
Alexander Boettcher 2013-11-14 11:58:28 +01:00 committed by Norman Feske
parent 67c1ad4cdd
commit f00195e26d
3 changed files with 111 additions and 27 deletions

View File

@ -19,27 +19,89 @@
#include <base/thread.h> #include <base/thread.h>
#include <cap_session/connection.h> #include <cap_session/connection.h>
#include <nova_cpu_session/connection.h> #include <nova_cpu_session/connection.h>
#include <cpu_session/connection.h>
#include <pd_session/connection.h>
namespace Vmm { namespace Vmm {
using namespace Genode; using namespace Genode;
class Vcpu_thread; class Vcpu_thread;
class Vcpu_other_pd;
class Vcpu_same_pd;
} }
class Vmm::Vcpu_thread
{
public:
class Vmm::Vcpu_thread : Genode::Thread_base virtual Genode::addr_t exc_base() = 0;
virtual void start(Genode::addr_t) = 0;
};
class Vmm::Vcpu_other_pd : public Vmm::Vcpu_thread
{ {
private: private:
/** Genode::Pd_connection _pd_session;
* Log2 size of portal window used for virtualization events Genode::Cpu_connection _cpu_session;
*/
enum { VCPU_EXC_BASE_LOG2 = 8 }; Genode::addr_t _exc_pt_sel;
public: public:
Vcpu_thread(size_t stack_size) Vcpu_other_pd()
:
_pd_session("VM"), _cpu_session("vCPU"),
_exc_pt_sel(Genode::cap_map()->insert(Nova::NUM_INITIAL_VCPU_PT_LOG2))
{ }
void start(Genode::addr_t sel_ec)
{
using namespace Genode;
Thread_capability vcpu_vm = _cpu_session.create_thread("vCPU");
/* assign thread to protection domain */
_pd_session.bind_thread(vcpu_vm);
/* create new pager object and assign it to the new thread */
Pager_capability pager_cap = env()->rm_session()->add_client(vcpu_vm);
_cpu_session.set_pager(vcpu_vm, pager_cap);
/* tell parent that this will be a vCPU */
Thread_state state;
state.sel_exc_base = Native_thread::INVALID_INDEX;
state.is_vcpu = true;
_cpu_session.state(vcpu_vm, state);
/*
* Delegate parent the vCPU exception portals required during PD
* creation.
*/
delegate_vcpu_portals(pager_cap, exc_base());
/* start vCPU in separate PD */
_cpu_session.start(vcpu_vm, 0, 0);
/*
* Request native EC thread cap and put it next to the
* SM cap - see Vcpu_dispatcher->sel_sm_ec description
*/
request_native_ec_cap(pager_cap, sel_ec);
}
Genode::addr_t exc_base() { return _exc_pt_sel; }
};
class Vmm::Vcpu_same_pd : public Vmm::Vcpu_thread, Genode::Thread_base
{
public:
Vcpu_same_pd(size_t stack_size)
: :
Thread_base("vCPU", stack_size) Thread_base("vCPU", stack_size)
{ {
@ -47,18 +109,18 @@ class Vmm::Vcpu_thread : Genode::Thread_base
Genode::cap_map()->remove(tid().exc_pt_sel, Nova::NUM_INITIAL_PT_LOG2); Genode::cap_map()->remove(tid().exc_pt_sel, Nova::NUM_INITIAL_PT_LOG2);
/* allocate correct number of selectors */ /* allocate correct number of selectors */
this->tid().exc_pt_sel = cap_map()->insert(VCPU_EXC_BASE_LOG2); this->tid().exc_pt_sel = cap_map()->insert(Nova::NUM_INITIAL_VCPU_PT_LOG2);
/* tell generic thread code that this becomes a vCPU */ /* tell generic thread code that this becomes a vCPU */
this->tid().is_vcpu = true; this->tid().is_vcpu = true;
} }
~Vcpu_thread() ~Vcpu_same_pd()
{ {
using namespace Nova; using namespace Nova;
revoke(Nova::Obj_crd(this->tid().exc_pt_sel, VCPU_EXC_BASE_LOG2)); revoke(Nova::Obj_crd(this->tid().exc_pt_sel, NUM_INITIAL_VCPU_PT_LOG2));
cap_map()->remove(this->tid().exc_pt_sel, VCPU_EXC_BASE_LOG2, false); cap_map()->remove(this->tid().exc_pt_sel, NUM_INITIAL_VCPU_PT_LOG2, false);
/* allocate selectors for ~Thread */ /* allocate selectors for ~Thread */
this->tid().exc_pt_sel = cap_map()->insert(Nova::NUM_INITIAL_PT_LOG2); this->tid().exc_pt_sel = cap_map()->insert(Nova::NUM_INITIAL_PT_LOG2);

View File

@ -42,7 +42,7 @@ build $build_components
# write Seoul config file # write Seoul config file
set vm_cfg_fd [open "bin/vm_linux.cfg" w] set vm_cfg_fd [open "bin/vm_linux.cfg" w]
puts $vm_cfg_fd {<config> puts $vm_cfg_fd {<config colocate="1" >
<machine> <machine>
<mem start="0x0" end="0x9a000"/> <mem start="0x0" end="0x9a000"/>
<mem start="0x100000" end="0xfffff000"/> <mem start="0x100000" end="0xfffff000"/>

View File

@ -256,7 +256,7 @@ class Vcpu_dispatcher : public Vmm::Vcpu_dispatcher,
*/ */
Genode::Synced_interface<VCpu> _vcpu; Genode::Synced_interface<VCpu> _vcpu;
Vmm::Vcpu_thread _vcpu_thread; Vmm::Vcpu_thread *_vcpu_thread;
/** /**
* Guest-physical memory * Guest-physical memory
@ -669,9 +669,10 @@ class Vcpu_dispatcher : public Vmm::Vcpu_dispatcher,
PERR("could not register handler %lx", exc_base + EV); PERR("could not register handler %lx", exc_base + EV);
} }
public:
enum { STACK_SIZE = 1024*sizeof(Genode::addr_t) }; enum { STACK_SIZE = 1024*sizeof(Genode::addr_t) };
public:
Vcpu_dispatcher(Genode::Lock &vcpu_lock, Vcpu_dispatcher(Genode::Lock &vcpu_lock,
Genode::Cap_connection &cap_connection, Genode::Cap_connection &cap_connection,
@ -679,11 +680,12 @@ class Vcpu_dispatcher : public Vmm::Vcpu_dispatcher,
Guest_memory &guest_memory, Guest_memory &guest_memory,
Synced_motherboard &motherboard, Synced_motherboard &motherboard,
bool has_svm, bool has_svm,
bool has_vmx) bool has_vmx,
Vmm::Vcpu_thread *vcpu_thread)
: :
Vmm::Vcpu_dispatcher(STACK_SIZE, cap_connection), Vmm::Vcpu_dispatcher(STACK_SIZE, cap_connection),
_vcpu(vcpu_lock, unsynchronized_vcpu), _vcpu(vcpu_lock, unsynchronized_vcpu),
_vcpu_thread(STACK_SIZE), _vcpu_thread(vcpu_thread),
_guest_memory(guest_memory), _guest_memory(guest_memory),
_motherboard(motherboard) _motherboard(motherboard)
{ {
@ -698,11 +700,10 @@ class Vcpu_dispatcher : public Vmm::Vcpu_dispatcher,
/* /*
* Register vCPU event handlers * Register vCPU event handlers
*/ */
Genode::addr_t const exc_base = _vcpu_thread.exc_base(); Genode::addr_t const exc_base = _vcpu_thread->exc_base();
typedef Vcpu_dispatcher This; typedef Vcpu_dispatcher This;
if (has_svm) { if (has_svm) {
_register_handler<0x64, &This::_vmx_irqwin> _register_handler<0x64, &This::_vmx_irqwin>
(exc_base, MTD_IRQ); (exc_base, MTD_IRQ);
_register_handler<0x72, &This::_svm_cpuid> _register_handler<0x72, &This::_svm_cpuid>
@ -725,7 +726,6 @@ class Vcpu_dispatcher : public Vmm::Vcpu_dispatcher,
(exc_base, MTD_IRQ); (exc_base, MTD_IRQ);
} else if (has_vmx) { } else if (has_vmx) {
_register_handler<2, &This::_vmx_triple> _register_handler<2, &This::_vmx_triple>
(exc_base, MTD_ALL); (exc_base, MTD_ALL);
_register_handler<3, &This::_vmx_init> _register_handler<3, &This::_vmx_init>
@ -765,7 +765,7 @@ class Vcpu_dispatcher : public Vmm::Vcpu_dispatcher,
} }
/* let vCPU run */ /* let vCPU run */
_vcpu_thread.start(sel_sm_ec() + 1); _vcpu_thread->start(sel_sm_ec() + 1);
/* handle cpuid overrides */ /* handle cpuid overrides */
unsynchronized_vcpu->executor.add(this, receive_static<CpuMessage>); unsynchronized_vcpu->executor.add(this, receive_static<CpuMessage>);
@ -834,6 +834,7 @@ class Machine : public StaticReceiver<Machine>
Alarm_thread *_alarm_thread; Alarm_thread *_alarm_thread;
bool _alloc_fb_mem; /* For detecting FB alloc message */ bool _alloc_fb_mem; /* For detecting FB alloc message */
bool _colocate_vm_vmm;
Nic::Session *_nic; Nic::Session *_nic;
Rtc::Session *_rtc; Rtc::Session *_rtc;
@ -908,13 +909,21 @@ class Machine : public StaticReceiver<Machine>
if (verbose_debug) if (verbose_debug)
Logging::printf("OP_VCPU_CREATE_BACKEND\n"); Logging::printf("OP_VCPU_CREATE_BACKEND\n");
Vmm::Vcpu_thread * vcpu_thread;
if (_colocate_vm_vmm)
vcpu_thread = new Vmm::Vcpu_same_pd(Vcpu_dispatcher::STACK_SIZE);
else
vcpu_thread = new Vmm::Vcpu_other_pd();
Vcpu_dispatcher *vcpu_dispatcher = Vcpu_dispatcher *vcpu_dispatcher =
new Vcpu_dispatcher(_motherboard_lock, new Vcpu_dispatcher(_motherboard_lock,
_cap, _cap,
msg.vcpu, msg.vcpu,
_guest_memory, _guest_memory,
_motherboard, _motherboard,
_hip->has_feature_svm(), _hip->has_feature_vmx()); _hip->has_feature_svm(),
_hip->has_feature_vmx(),
vcpu_thread);
msg.value = vcpu_dispatcher->sel_sm_ec(); msg.value = vcpu_dispatcher->sel_sm_ec();
return true; return true;
@ -1190,7 +1199,8 @@ class Machine : public StaticReceiver<Machine>
/** /**
* Constructor * Constructor
*/ */
Machine(Boot_module_provider &boot_modules, Guest_memory &guest_memory) Machine(Boot_module_provider &boot_modules, Guest_memory &guest_memory,
bool colocate)
: :
_hip_rom("hypervisor_info_page"), _hip_rom("hypervisor_info_page"),
_hip(Genode::env()->rm_session()->attach(_hip_rom.dataspace())), _hip(Genode::env()->rm_session()->attach(_hip_rom.dataspace())),
@ -1200,7 +1210,8 @@ class Machine : public StaticReceiver<Machine>
_motherboard(_motherboard_lock, &_unsynchronized_motherboard), _motherboard(_motherboard_lock, &_unsynchronized_motherboard),
_timeouts(_timeouts_lock, &_unsynchronized_timeouts), _timeouts(_timeouts_lock, &_unsynchronized_timeouts),
_guest_memory(guest_memory), _guest_memory(guest_memory),
_boot_modules(boot_modules) _boot_modules(boot_modules),
_colocate_vm_vmm(colocate)
{ {
_timeouts()->init(); _timeouts()->init();
@ -1344,6 +1355,7 @@ int main(int argc, char **argv)
{ {
Genode::addr_t fb_size = 4*1024*1024; Genode::addr_t fb_size = 4*1024*1024;
Genode::addr_t vm_size; Genode::addr_t vm_size;
unsigned colocate = 1; /* by default co-locate VM and VMM in same PD */
{ {
/* /*
@ -1374,17 +1386,24 @@ int main(int argc, char **argv)
arg.value(&val); arg.value(&val);
fb_size = val*1024; fb_size = val*1024;
} catch (...) { } } catch (...) { }
/* read out whether VM and VMM should be colocated or not */
try {
Genode::config()->xml_node().attribute("colocate").value(&colocate);
} catch (...) { }
} }
/* re-adjust reservation to actual VM size */ if (colocate)
Vmm::Virtual_reservation reservation(vm_size); /* re-adjust reservation to actual VM size */
static Vmm::Virtual_reservation reservation(vm_size);
/* setup guest memory */ /* setup guest memory */
static Guest_memory guest_memory(vm_size, fb_size); static Guest_memory guest_memory(vm_size, fb_size);
/* diagnostic messages */ /* diagnostic messages */
Genode::printf("[0x%012lx, 0x%012lx) - %lu MiB - VM accessible memory\n", if (colocate)
0, vm_size, vm_size / 1024 / 1024); Genode::printf("[0x%012lx, 0x%012lx) - %lu MiB - VM accessible "
"memory\n", 0, vm_size, vm_size / 1024 / 1024);
if (guest_memory.backing_store_local_base()) if (guest_memory.backing_store_local_base())
Genode::printf("[0x%012p, 0x%012p) - %lu MiB - VMM accessible shadow " Genode::printf("[0x%012p, 0x%012p) - %lu MiB - VMM accessible shadow "
@ -1421,7 +1440,8 @@ int main(int argc, char **argv)
static Boot_module_provider static Boot_module_provider
boot_modules(Genode::config()->xml_node().sub_node("multiboot")); boot_modules(Genode::config()->xml_node().sub_node("multiboot"));
static Machine machine(boot_modules, guest_memory); /* create the PC machine based on the configuration given */
static Machine machine(boot_modules, guest_memory, colocate);
/* create console thread */ /* create console thread */
Vancouver_console vcon(machine.motherboard(), fb_size, guest_memory.fb_ds()); Vancouver_console vcon(machine.motherboard(), fb_size, guest_memory.fb_ds());
@ -1437,6 +1457,8 @@ int main(int argc, char **argv)
machine.setup_devices(Genode::config()->xml_node().sub_node("machine")); machine.setup_devices(Genode::config()->xml_node().sub_node("machine"));
PINF("VM and VMM %s.", colocate ? "co-located" : "not co-located");
Genode::printf("\n--- Booting VM ---\n"); Genode::printf("\n--- Booting VM ---\n");
machine.boot(); machine.boot();