1513 lines
42 KiB
C++
1513 lines
42 KiB
C++
/*
|
|
* \brief Vancouver main program for Genode
|
|
* \author Norman Feske
|
|
* \author Markus Partheymueller
|
|
* \date 2011-11-18
|
|
*
|
|
* Important remark about debugging output:
|
|
*
|
|
* Most of the code within this file is called during virtualization event
|
|
* handling. NOVA's virtualization fault mechanism carries information about
|
|
* the fault cause and fault resolution in the UTCB of the VCPU handler EC.
|
|
* Consequently, the code involved in the fault handling is expected to
|
|
* preserve the UTCB content. I.e., it must not involve the use of IPC, which
|
|
* employs the UTCB to carry IPC payload. Because Genode's debug-output macros
|
|
* use the remote LOG service via IPC as back end, those macros must not be
|
|
* used directly. Instead, the 'Logging::printf' function should be used, which
|
|
* takes care about saving and restoring the UTCB.
|
|
*/
|
|
|
|
/*
|
|
* Copyright (C) 2011-2013 Genode Labs GmbH
|
|
* Copyright (C) 2012 Intel Corporation
|
|
*
|
|
* This file is distributed under the terms of the GNU General Public License
|
|
* version 2.
|
|
*
|
|
* The code is partially based on the Vancouver VMM, which is distributed
|
|
* under the terms of the GNU General Public License version 2.
|
|
*
|
|
* Modifications by Intel Corporation are contributed under the terms and
|
|
* conditions of the GNU General Public License version 2.
|
|
*/
|
|
|
|
/* Genode includes */
|
|
#include <util/touch.h>
|
|
#include <base/sleep.h>
|
|
#include <base/rpc_server.h>
|
|
#include <base/native_types.h>
|
|
#include <util/misc_math.h>
|
|
#include <rom_session/connection.h>
|
|
#include <rm_session/connection.h>
|
|
#include <base/allocator_avl.h>
|
|
#include <nic_session/connection.h>
|
|
#include <nic/packet_allocator.h>
|
|
#include <os/config.h>
|
|
#include <os/alarm.h>
|
|
#include <base/synced_interface.h>
|
|
#include <timer_session/connection.h>
|
|
#include <rtc_session/connection.h>
|
|
|
|
/* VMM utilities includes */
|
|
#include <vmm/guest_memory.h>
|
|
#include <vmm/vcpu_thread.h>
|
|
#include <vmm/vcpu_dispatcher.h>
|
|
|
|
/* NOVA includes that come with Genode */
|
|
#include <nova/syscalls.h>
|
|
|
|
/* NOVA userland includes */
|
|
#include <nul/vcpu.h>
|
|
#include <nul/motherboard.h>
|
|
#include <sys/hip.h>
|
|
|
|
/* utilities includes */
|
|
#include <service/time.h>
|
|
|
|
/* local includes */
|
|
#include "synced_motherboard.h"
|
|
#include "device_model_registry.h"
|
|
#include "boot_module_provider.h"
|
|
#include "console.h"
|
|
#include "network.h"
|
|
#include "disk.h"
|
|
|
|
|
|
enum { verbose_debug = false };
|
|
enum { verbose_npt = false };
|
|
enum { verbose_io = false };
|
|
|
|
static Genode::Native_utcb utcb_backup;
|
|
Genode::Lock *utcb_lock()
|
|
{
|
|
static Genode::Lock inst;
|
|
return &inst;
|
|
}
|
|
|
|
|
|
/* timer service */
|
|
using Genode::Thread;
|
|
using Genode::Alarm_scheduler;
|
|
using Genode::Alarm;
|
|
|
|
typedef Genode::Synced_interface<TimeoutList<32, void> > Synced_timeout_list;
|
|
|
|
class Alarm_thread : Thread<4096>, public Alarm_scheduler
|
|
{
|
|
private:
|
|
|
|
Timer::Connection _timer;
|
|
Alarm::Time _curr_time; /* jiffies value */
|
|
|
|
Synced_motherboard &_motherboard;
|
|
Synced_timeout_list &_timeouts;
|
|
|
|
/**
|
|
* Thread entry function
|
|
*/
|
|
void entry()
|
|
{
|
|
while (true) {
|
|
unsigned long long now = _motherboard()->clock()->time();
|
|
unsigned nr;
|
|
|
|
while ((nr = _timeouts()->trigger(now))) {
|
|
|
|
MessageTimeout msg(nr, _timeouts()->timeout());
|
|
|
|
if (_timeouts()->cancel(nr) < 0)
|
|
Logging::printf("Timeout not cancelled.\n");
|
|
|
|
_motherboard()->bus_timeout.send(msg);
|
|
}
|
|
|
|
_timer.usleep(1000);
|
|
}
|
|
}
|
|
|
|
public:
|
|
|
|
/**
|
|
* Constructor
|
|
*/
|
|
Alarm_thread(Synced_motherboard &mb, Synced_timeout_list &timeouts)
|
|
: Thread("alarm"), _curr_time(0), _motherboard(mb), _timeouts(timeouts)
|
|
{ start(); }
|
|
|
|
Alarm::Time curr_time() { return _curr_time; }
|
|
unsigned long long curr_time_long() { return _motherboard()->clock()->time(); }
|
|
};
|
|
|
|
|
|
/**
|
|
* Representation of guest memory
|
|
*
|
|
* The VMM and the guest share the same PD. However, the guest's view on the PD
|
|
* is restricted to the guest-physical-to-VMM-local mappings installed by the
|
|
* VMM for the VCPU's EC.
|
|
*
|
|
* The guest memory is shadowed at the lower portion of the VMM's address
|
|
* space. If the guest (the VCPU EC) tries to access a page that has no mapping
|
|
* in the VMM's PD, NOVA does not generate a page-fault (which would be
|
|
* delivered to the pager of the VMM, i.e., core) but it produces a NPT
|
|
* virtualization event handled locally by the VMM. The NPT event handler is
|
|
* the '_svm_npt' function.
|
|
*/
|
|
class Guest_memory
|
|
{
|
|
private:
|
|
|
|
Genode::Ram_dataspace_capability _ds;
|
|
Genode::Ram_dataspace_capability _fb_ds;
|
|
|
|
Genode::size_t _backing_store_size;
|
|
Genode::size_t _fb_size;
|
|
|
|
char *_local_addr;
|
|
char *_fb_addr;
|
|
|
|
public:
|
|
|
|
/**
|
|
* Number of bytes that are available to the guest
|
|
*
|
|
* At startup time, some device models (i.e., the VGA controller) claim
|
|
* a bit of guest-physical memory for their respective devices (i.e.,
|
|
* the virtual frame buffer) by calling 'OP_ALLOC_FROM_GUEST'. This
|
|
* function allocates such blocks from the end of the backing store.
|
|
* The 'remaining_size' contains the number of bytes left at the lower
|
|
* part of the backing store for the use as normal guest-physical RAM.
|
|
* It is initialized with the actual backing store size and then
|
|
* managed by the 'OP_ALLOC_FROM_GUEST' handler.
|
|
*/
|
|
Genode::size_t remaining_size;
|
|
|
|
/**
|
|
* Constructor
|
|
*
|
|
* \param backing_store_size number of bytes of physical RAM to be
|
|
* used as guest-physical and device memory,
|
|
* allocated from core's RAM service
|
|
*/
|
|
Guest_memory(Genode::size_t backing_store_size, Genode::size_t fb_size)
|
|
:
|
|
_ds(Genode::env()->ram_session()->alloc(backing_store_size-fb_size)),
|
|
_fb_ds(Genode::env()->ram_session()->alloc(fb_size)),
|
|
_backing_store_size(backing_store_size),
|
|
_fb_size(fb_size),
|
|
_local_addr(0),
|
|
_fb_addr(0),
|
|
remaining_size(backing_store_size-fb_size)
|
|
{
|
|
try {
|
|
/*
|
|
* RAM used as backing store for guest-physical memory
|
|
*/
|
|
_local_addr = Genode::env()->rm_session()->attach(_ds);
|
|
_fb_addr = Genode::env()->rm_session()->attach_at(_fb_ds,
|
|
((Genode::addr_t) _local_addr)+backing_store_size-fb_size);
|
|
|
|
} catch (Genode::Rm_session::Region_conflict) {
|
|
PERR("region conflict");
|
|
}
|
|
}
|
|
|
|
~Guest_memory()
|
|
{
|
|
/* detach and free backing store */
|
|
Genode::env()->rm_session()->detach((void *)_local_addr);
|
|
Genode::env()->ram_session()->free(_ds);
|
|
|
|
Genode::env()->rm_session()->detach((void *)_fb_addr);
|
|
Genode::env()->ram_session()->free(_fb_ds);
|
|
}
|
|
|
|
/**
|
|
* Return pointer to locally mapped backing store
|
|
*/
|
|
char *backing_store_local_base()
|
|
{
|
|
return _local_addr;
|
|
}
|
|
|
|
Genode::size_t backing_store_size()
|
|
{
|
|
return _backing_store_size;
|
|
}
|
|
|
|
/**
|
|
* Return pointer to lo locally mapped fb backing store
|
|
*/
|
|
char *backing_store_fb_local_base()
|
|
{
|
|
return _fb_addr;
|
|
}
|
|
|
|
Genode::size_t fb_size() { return _fb_size; }
|
|
|
|
Genode::Dataspace_capability fb_ds() { return _fb_ds; }
|
|
};
|
|
|
|
|
|
typedef Vmm::Vcpu_dispatcher<Genode::Thread_base> Vcpu_handler;
|
|
|
|
class Vcpu_dispatcher : public Vcpu_handler,
|
|
public StaticReceiver<Vcpu_dispatcher>
|
|
{
|
|
private:
|
|
|
|
/**
|
|
* Pointer to corresponding VCPU model
|
|
*/
|
|
Genode::Synced_interface<VCpu> _vcpu;
|
|
|
|
Vmm::Vcpu_thread *_vcpu_thread;
|
|
|
|
/**
|
|
* Guest-physical memory
|
|
*/
|
|
Guest_memory &_guest_memory;
|
|
|
|
/**
|
|
* Motherboard representing the inter-connections of all device models
|
|
*/
|
|
Synced_motherboard &_motherboard;
|
|
|
|
|
|
/***************
|
|
** Shortcuts **
|
|
***************/
|
|
|
|
static ::Utcb *_utcb_of_myself() {
|
|
return (::Utcb *)Genode::Thread_base::myself()->utcb(); }
|
|
|
|
|
|
/***********************************
|
|
** Virtualization event handlers **
|
|
***********************************/
|
|
|
|
static void _skip_instruction(CpuMessage &msg)
|
|
{
|
|
/* advance EIP */
|
|
assert(msg.mtr_in & MTD_RIP_LEN);
|
|
msg.cpu->eip += msg.cpu->inst_len;
|
|
msg.mtr_out |= MTD_RIP_LEN;
|
|
|
|
/* cancel sti and mov-ss blocking as we emulated an instruction */
|
|
assert(msg.mtr_in & MTD_STATE);
|
|
if (msg.cpu->intr_state & 3) {
|
|
msg.cpu->intr_state &= ~3;
|
|
msg.mtr_out |= MTD_STATE;
|
|
}
|
|
}
|
|
|
|
enum Skip { SKIP = true, NO_SKIP = false };
|
|
|
|
void _handle_vcpu(Skip skip, CpuMessage::Type type)
|
|
{
|
|
Utcb *utcb = _utcb_of_myself();
|
|
|
|
CpuMessage msg(type, static_cast<CpuState *>(utcb), utcb->mtd);
|
|
|
|
if (skip == SKIP)
|
|
_skip_instruction(msg);
|
|
|
|
/**
|
|
* Send the message to the VCpu.
|
|
*/
|
|
if (!_vcpu()->executor.send(msg, true))
|
|
Logging::panic("nobody to execute %s at %x:%x\n",
|
|
__func__, msg.cpu->cs.sel, msg.cpu->eip);
|
|
|
|
/**
|
|
* Check whether we should inject something...
|
|
*/
|
|
if (msg.mtr_in & MTD_INJ && msg.type != CpuMessage::TYPE_CHECK_IRQ) {
|
|
msg.type = CpuMessage::TYPE_CHECK_IRQ;
|
|
if (!_vcpu()->executor.send(msg, true))
|
|
Logging::panic("nobody to execute %s at %x:%x\n",
|
|
__func__, msg.cpu->cs.sel, msg.cpu->eip);
|
|
}
|
|
|
|
/**
|
|
* If the IRQ injection is performed, recalc the IRQ window.
|
|
*/
|
|
if (msg.mtr_out & MTD_INJ) {
|
|
msg.type = CpuMessage::TYPE_CALC_IRQWINDOW;
|
|
if (!_vcpu()->executor.send(msg, true))
|
|
Logging::panic("nobody to execute %s at %x:%x\n",
|
|
__func__, msg.cpu->cs.sel, msg.cpu->eip);
|
|
}
|
|
|
|
msg.cpu->mtd = msg.mtr_out;
|
|
}
|
|
|
|
/**
|
|
* Get position of the least significant 1 bit.
|
|
* bsf is undefined for value == 0.
|
|
*/
|
|
Genode::addr_t bsf(Genode::addr_t value) {
|
|
return __builtin_ctz(value); }
|
|
|
|
bool max_map_crd(Nova::Mem_crd &crd, Genode::addr_t vmm_start,
|
|
Genode::addr_t vm_start, Genode::addr_t size,
|
|
Genode::addr_t vm_fault)
|
|
{
|
|
Nova::Mem_crd crd_save = crd;
|
|
|
|
retry:
|
|
|
|
/* lookup whether page is mapped and its size */
|
|
Nova::uint8_t ret = Nova::lookup(crd);
|
|
if (ret != Nova::NOVA_OK)
|
|
return false;
|
|
|
|
/* page is not mapped, touch it */
|
|
if (crd.is_null()) {
|
|
crd = crd_save;
|
|
Genode::touch_read((unsigned char volatile *)crd.addr());
|
|
goto retry;
|
|
}
|
|
|
|
/* cut-set crd region and vmm region */
|
|
Genode::addr_t cut_start = Genode::max(vmm_start, crd.base());
|
|
Genode::addr_t cut_size = Genode::min(vmm_start + size,
|
|
crd.base() + (1UL << crd.order())) -
|
|
cut_start;
|
|
|
|
/* calculate minimal order of page to be mapped */
|
|
Genode::addr_t map_page = vmm_start + vm_fault - vm_start;
|
|
Genode::addr_t map_order = bsf(vm_fault | map_page | cut_size);
|
|
|
|
Genode::addr_t hotspot = 0;
|
|
|
|
/* calculate maximal aligned order of page to be mapped */
|
|
do {
|
|
crd = Nova::Mem_crd(map_page, map_order,
|
|
crd_save.rights());
|
|
|
|
map_order += 1;
|
|
map_page &= ~((1UL << map_order) - 1);
|
|
hotspot = vm_start + map_page - vmm_start;
|
|
}
|
|
while (cut_start <= map_page &&
|
|
((map_page + (1UL << map_order)) <= (cut_start + cut_size)) &&
|
|
!(hotspot & ((1UL << map_order) - 1)));
|
|
|
|
return true;
|
|
}
|
|
|
|
bool _handle_map_memory(bool need_unmap)
|
|
{
|
|
Utcb *utcb = _utcb_of_myself();
|
|
Genode::addr_t const vm_fault_addr = utcb->qual[1];
|
|
|
|
if (verbose_npt)
|
|
Logging::printf("--> request mapping at 0x%lx\n", vm_fault_addr);
|
|
|
|
MessageMemRegion mem_region(vm_fault_addr >> Vmm::PAGE_SIZE_LOG2);
|
|
|
|
if (!_motherboard()->bus_memregion.send(mem_region, false) ||
|
|
!mem_region.ptr)
|
|
return false;
|
|
|
|
if (verbose_npt)
|
|
Logging::printf("VM page 0x%lx in [0x%lx:0x%lx),"
|
|
" VMM area: [0x%lx:0x%lx)\n",
|
|
mem_region.page, mem_region.start_page,
|
|
mem_region.start_page + mem_region.count,
|
|
(Genode::addr_t)mem_region.ptr >> Vmm::PAGE_SIZE_LOG2,
|
|
((Genode::addr_t)mem_region.ptr >> Vmm::PAGE_SIZE_LOG2)
|
|
+ mem_region.count);
|
|
|
|
Genode::addr_t vmm_memory_base =
|
|
reinterpret_cast<Genode::addr_t>(mem_region.ptr);
|
|
Genode::addr_t vmm_memory_fault = vmm_memory_base +
|
|
(vm_fault_addr - (mem_region.start_page << Vmm::PAGE_SIZE_LOG2));
|
|
|
|
bool read=true, write=true, execute=true;
|
|
/* XXX: Not yet supported by Vancouver.
|
|
if (mem_region.attr == (DESC_TYPE_MEM | DESC_RIGHT_R)) {
|
|
if (verbose_npt)
|
|
Logging::printf("Mapping readonly to %p (err:%x, attr:%x)\n",
|
|
vm_fault_addr, utcb->qual[0], mem_region.attr);
|
|
write = execute = false;
|
|
}*/
|
|
|
|
Nova::Mem_crd crd(vmm_memory_fault >> Vmm::PAGE_SIZE_LOG2, 0,
|
|
Nova::Rights(read, write, execute));
|
|
|
|
if (!max_map_crd(crd, vmm_memory_base >> Vmm::PAGE_SIZE_LOG2,
|
|
mem_region.start_page,
|
|
mem_region.count, mem_region.page))
|
|
Logging::panic("mapping failed");
|
|
|
|
if (need_unmap)
|
|
Logging::panic("_handle_map_memory: need_unmap not handled, yet\n");
|
|
|
|
Genode::addr_t hotspot = (mem_region.start_page << Vmm::PAGE_SIZE_LOG2)
|
|
+ crd.addr() - vmm_memory_base;
|
|
|
|
if (verbose_npt)
|
|
Logging::printf("NPT mapping (base=0x%lx, order=%lu, hotspot=0x%lx)\n",
|
|
crd.base(), crd.order(), hotspot);
|
|
|
|
utcb->mtd = 0;
|
|
|
|
/* EPT violation during IDT vectoring? */
|
|
if (utcb->inj_info & 0x80000000) {
|
|
utcb->mtd |= MTD_INJ;
|
|
Logging::printf("EPT violation during IDT vectoring.\n");
|
|
CpuMessage _win(CpuMessage::TYPE_CALC_IRQWINDOW,
|
|
static_cast<CpuState *>(utcb), utcb->mtd);
|
|
_win.mtr_out = MTD_INJ;
|
|
if (!_vcpu()->executor.send(_win, true))
|
|
Logging::panic("nobody to execute %s at %x:%x\n",
|
|
__func__, utcb->cs.sel, utcb->eip);
|
|
}
|
|
|
|
Nova::Utcb * u = (Nova::Utcb *)utcb;
|
|
u->set_msg_word(0);
|
|
if (!u->append_item(crd, hotspot, false, true))
|
|
Logging::printf("Could not map everything");
|
|
|
|
return true;
|
|
}
|
|
|
|
void _handle_io(bool is_in, unsigned io_order, unsigned port)
|
|
{
|
|
if (verbose_io)
|
|
Logging::printf("--> I/O is_in=%d, io_order=%d, port=%x\n",
|
|
is_in, io_order, port);
|
|
|
|
Utcb *utcb = _utcb_of_myself();
|
|
CpuMessage msg(is_in, static_cast<CpuState *>(utcb), io_order,
|
|
port, &utcb->eax, utcb->mtd);
|
|
_skip_instruction(msg);
|
|
{
|
|
if (!_vcpu()->executor.send(msg, true))
|
|
Logging::panic("nobody to execute %s at %x:%x\n",
|
|
__func__, msg.cpu->cs.sel, msg.cpu->eip);
|
|
}
|
|
|
|
utcb->mtd = msg.mtr_out;
|
|
}
|
|
|
|
/* SVM portal functions */
|
|
void _svm_startup()
|
|
{
|
|
_handle_vcpu(NO_SKIP, CpuMessage::TYPE_CHECK_IRQ);
|
|
}
|
|
|
|
void _svm_npt()
|
|
{
|
|
Utcb *utcb = _utcb_of_myself();
|
|
MessageMemRegion msg(utcb->qual[1] >> Vmm::PAGE_SIZE_LOG2);
|
|
if (!_handle_map_memory(utcb->qual[0] & 1))
|
|
_svm_invalid();
|
|
}
|
|
|
|
void _svm_invalid()
|
|
{
|
|
_handle_vcpu(NO_SKIP, CpuMessage::TYPE_SINGLE_STEP);
|
|
Utcb *utcb = _utcb_of_myself();
|
|
utcb->mtd |= MTD_CTRL;
|
|
utcb->ctrl[0] = 1 << 18; /* cpuid */
|
|
utcb->ctrl[1] = 1 << 0; /* vmrun */
|
|
}
|
|
|
|
void _svm_ioio()
|
|
{
|
|
Utcb *utcb = _utcb_of_myself();
|
|
|
|
if (utcb->qual[0] & 0x4) {
|
|
Logging::printf("invalid gueststate\n");
|
|
utcb->ctrl[1] = 0;
|
|
utcb->mtd = MTD_CTRL;
|
|
} else {
|
|
unsigned order = ((utcb->qual[0] >> 4) & 7) - 1;
|
|
|
|
if (order > 2)
|
|
order = 2;
|
|
|
|
utcb->inst_len = utcb->qual[1] - utcb->eip;
|
|
|
|
_handle_io(utcb->qual[0] & 1, order, utcb->qual[0] >> 16);
|
|
}
|
|
}
|
|
|
|
void _svm_cpuid()
|
|
{
|
|
Utcb *utcb = _utcb_of_myself();
|
|
utcb->inst_len = 2;
|
|
_handle_vcpu(SKIP, CpuMessage::TYPE_CPUID);
|
|
}
|
|
|
|
void _svm_hlt()
|
|
{
|
|
Utcb *utcb = _utcb_of_myself();
|
|
utcb->inst_len = 1;
|
|
_vmx_hlt();
|
|
}
|
|
|
|
void _svm_msr()
|
|
{
|
|
_svm_invalid();
|
|
}
|
|
|
|
void _recall()
|
|
{
|
|
_handle_vcpu(NO_SKIP, CpuMessage::TYPE_CHECK_IRQ);
|
|
}
|
|
|
|
/* VMX portal functions */
|
|
void _vmx_triple()
|
|
{
|
|
_handle_vcpu(NO_SKIP, CpuMessage::TYPE_TRIPLE);
|
|
}
|
|
|
|
void _vmx_init()
|
|
{
|
|
_handle_vcpu(NO_SKIP, CpuMessage::TYPE_INIT);
|
|
}
|
|
|
|
void _vmx_irqwin()
|
|
{
|
|
_handle_vcpu(NO_SKIP, CpuMessage::TYPE_CHECK_IRQ);
|
|
}
|
|
|
|
void _vmx_hlt()
|
|
{
|
|
_handle_vcpu(SKIP, CpuMessage::TYPE_HLT);
|
|
}
|
|
|
|
void _vmx_rdtsc()
|
|
{
|
|
_handle_vcpu(SKIP, CpuMessage::TYPE_RDTSC);
|
|
}
|
|
|
|
void _vmx_vmcall()
|
|
{
|
|
Utcb *utcb = _utcb_of_myself();
|
|
utcb->eip += utcb->inst_len;
|
|
}
|
|
|
|
void _vmx_pause()
|
|
{
|
|
Utcb *utcb = _utcb_of_myself();
|
|
CpuMessage msg(CpuMessage::TYPE_SINGLE_STEP,
|
|
static_cast<CpuState *>(utcb), utcb->mtd);
|
|
_skip_instruction(msg);
|
|
}
|
|
|
|
void _vmx_invalid()
|
|
{
|
|
Utcb *utcb = _utcb_of_myself();
|
|
utcb->efl |= 2;
|
|
_handle_vcpu(NO_SKIP, CpuMessage::TYPE_SINGLE_STEP);
|
|
utcb->mtd |= MTD_RFLAGS;
|
|
}
|
|
|
|
void _vmx_startup()
|
|
{
|
|
Utcb *utcb = _utcb_of_myself();
|
|
_handle_vcpu(NO_SKIP, CpuMessage::TYPE_HLT);
|
|
utcb->mtd |= MTD_CTRL;
|
|
utcb->ctrl[0] = 0;
|
|
utcb->ctrl[1] = 0;
|
|
}
|
|
|
|
void _vmx_recall()
|
|
{
|
|
_handle_vcpu(NO_SKIP, CpuMessage::TYPE_CHECK_IRQ);
|
|
}
|
|
|
|
void _vmx_ioio()
|
|
{
|
|
Utcb *utcb = _utcb_of_myself();
|
|
unsigned order = 0U;
|
|
if (utcb->qual[0] & 0x10) {
|
|
Logging::printf("invalid gueststate\n");
|
|
assert(utcb->mtd & MTD_RFLAGS);
|
|
utcb->efl &= ~2;
|
|
utcb->mtd = MTD_RFLAGS;
|
|
} else {
|
|
order = utcb->qual[0] & 7;
|
|
if (order > 2) order = 2;
|
|
}
|
|
|
|
_handle_io(utcb->qual[0] & 8, order, utcb->qual[0] >> 16);
|
|
}
|
|
|
|
void _vmx_ept()
|
|
{
|
|
Utcb *utcb = _utcb_of_myself();
|
|
|
|
if (!_handle_map_memory(utcb->qual[0] & 0x38))
|
|
/* this is an access to MMIO */
|
|
_handle_vcpu(NO_SKIP, CpuMessage::TYPE_SINGLE_STEP);
|
|
}
|
|
|
|
void _vmx_cpuid()
|
|
{
|
|
_handle_vcpu(SKIP, CpuMessage::TYPE_CPUID);
|
|
}
|
|
|
|
void _vmx_msr_read()
|
|
{
|
|
_handle_vcpu(SKIP, CpuMessage::TYPE_RDMSR);
|
|
}
|
|
|
|
void _vmx_msr_write()
|
|
{
|
|
_handle_vcpu(SKIP, CpuMessage::TYPE_WRMSR);
|
|
}
|
|
|
|
/*
|
|
* This VM exit is in part handled by the NOVA kernel (writing the CR
|
|
* register) and in part by Seoul (updating the PDPTE registers,
|
|
* which requires access to the guest physical memory).
|
|
* Intel manual sections 4.4.1 of Vol. 3A and 26.3.2.4 of Vol. 3C
|
|
* indicate the conditions when the PDPTE registers need to get
|
|
* updated.
|
|
*
|
|
* XXX: not implemented yet
|
|
*
|
|
*/
|
|
void _vmx_mov_crx()
|
|
{
|
|
Logging::panic("%s: not implemented, but needed for VMs using PAE "
|
|
"with nested paging.", __PRETTY_FUNCTION__);
|
|
}
|
|
|
|
/**
|
|
* Shortcut for calling 'Vmm::Vcpu_dispatcher::register_handler'
|
|
* with 'Vcpu_dispatcher' as template argument
|
|
*/
|
|
template <unsigned EV, void (Vcpu_dispatcher::*FUNC)()>
|
|
void _register_handler(Genode::addr_t exc_base, Nova::Mtd mtd)
|
|
{
|
|
if (!register_handler<EV, Vcpu_dispatcher, FUNC>(exc_base, mtd))
|
|
PERR("could not register handler %lx", exc_base + EV);
|
|
}
|
|
|
|
public:
|
|
|
|
enum { STACK_SIZE = 1024*sizeof(Genode::addr_t) };
|
|
|
|
|
|
Vcpu_dispatcher(Genode::Lock &vcpu_lock,
|
|
Genode::Cap_connection &cap_connection,
|
|
VCpu *unsynchronized_vcpu,
|
|
Guest_memory &guest_memory,
|
|
Synced_motherboard &motherboard,
|
|
bool has_svm,
|
|
bool has_vmx,
|
|
Vmm::Vcpu_thread *vcpu_thread,
|
|
Genode::Cpu_session *cpu_session,
|
|
Genode::Affinity::Location &location)
|
|
:
|
|
Vcpu_handler(STACK_SIZE, cap_connection, cpu_session, location),
|
|
_vcpu(vcpu_lock, unsynchronized_vcpu),
|
|
_vcpu_thread(vcpu_thread),
|
|
_guest_memory(guest_memory),
|
|
_motherboard(motherboard)
|
|
{
|
|
using namespace Genode;
|
|
using namespace Nova;
|
|
|
|
/* shortcuts for common message-transfer descriptors */
|
|
Mtd const mtd_all(Mtd::ALL);
|
|
Mtd const mtd_cpuid(Mtd::EIP | Mtd::ACDB | Mtd::IRQ);
|
|
Mtd const mtd_irq(Mtd::IRQ);
|
|
|
|
/*
|
|
* Register vCPU event handlers
|
|
*/
|
|
Genode::addr_t const exc_base = _vcpu_thread->exc_base();
|
|
typedef Vcpu_dispatcher This;
|
|
|
|
if (has_svm) {
|
|
_register_handler<0x64, &This::_vmx_irqwin>
|
|
(exc_base, MTD_IRQ);
|
|
_register_handler<0x72, &This::_svm_cpuid>
|
|
(exc_base, MTD_RIP_LEN | MTD_GPR_ACDB | MTD_IRQ);
|
|
_register_handler<0x78, &This::_svm_hlt>
|
|
(exc_base, MTD_RIP_LEN | MTD_IRQ);
|
|
_register_handler<0x7b, &This::_svm_ioio>
|
|
(exc_base, MTD_RIP_LEN | MTD_QUAL | MTD_GPR_ACDB | MTD_STATE);
|
|
_register_handler<0x7c, &This::_svm_msr>
|
|
(exc_base, MTD_ALL);
|
|
_register_handler<0x7f, &This::_vmx_triple>
|
|
(exc_base, MTD_ALL);
|
|
_register_handler<0xfc, &This::_svm_npt>
|
|
(exc_base, MTD_ALL);
|
|
_register_handler<0xfd, &This::_svm_invalid>
|
|
(exc_base, MTD_ALL);
|
|
_register_handler<0xfe, &This::_svm_startup>
|
|
(exc_base, MTD_ALL);
|
|
_register_handler<0xff, &This::_recall>
|
|
(exc_base, MTD_IRQ);
|
|
|
|
} else if (has_vmx) {
|
|
_register_handler<2, &This::_vmx_triple>
|
|
(exc_base, MTD_ALL);
|
|
_register_handler<3, &This::_vmx_init>
|
|
(exc_base, MTD_ALL);
|
|
_register_handler<7, &This::_vmx_irqwin>
|
|
(exc_base, MTD_IRQ);
|
|
_register_handler<10, &This::_vmx_cpuid>
|
|
(exc_base, MTD_RIP_LEN | MTD_GPR_ACDB | MTD_STATE);
|
|
_register_handler<12, &This::_vmx_hlt>
|
|
(exc_base, MTD_RIP_LEN | MTD_IRQ);
|
|
_register_handler<16, &This::_vmx_rdtsc>
|
|
(exc_base, MTD_RIP_LEN | MTD_GPR_ACDB | MTD_TSC | MTD_STATE);
|
|
_register_handler<18, &This::_vmx_vmcall>
|
|
(exc_base, MTD_RIP_LEN | MTD_GPR_ACDB);
|
|
_register_handler<28, &This::_vmx_mov_crx>
|
|
(exc_base, MTD_ALL);
|
|
_register_handler<30, &This::_vmx_ioio>
|
|
(exc_base, MTD_RIP_LEN | MTD_QUAL | MTD_GPR_ACDB | MTD_STATE | MTD_RFLAGS);
|
|
_register_handler<31, &This::_vmx_msr_read>
|
|
(exc_base, MTD_RIP_LEN | MTD_GPR_ACDB | MTD_TSC | MTD_SYSENTER | MTD_STATE);
|
|
_register_handler<32, &This::_vmx_msr_write>
|
|
(exc_base, MTD_RIP_LEN | MTD_GPR_ACDB | MTD_TSC | MTD_SYSENTER | MTD_STATE);
|
|
_register_handler<33, &This::_vmx_invalid>
|
|
(exc_base, MTD_ALL);
|
|
_register_handler<40, &This::_vmx_pause>
|
|
(exc_base, MTD_RIP_LEN | MTD_STATE);
|
|
_register_handler<48, &This::_vmx_ept>
|
|
(exc_base, MTD_ALL);
|
|
_register_handler<0xfe, &This::_vmx_startup>
|
|
(exc_base, MTD_IRQ);
|
|
_register_handler<0xff, &This::_vmx_recall>
|
|
(exc_base, MTD_IRQ | MTD_RIP_LEN | MTD_GPR_ACDB | MTD_GPR_BSD);
|
|
} else {
|
|
|
|
/*
|
|
* We need Hardware Virtualization Features.
|
|
*/
|
|
Logging::panic("no SVM/VMX available, sorry");
|
|
}
|
|
|
|
/* let vCPU run */
|
|
_vcpu_thread->start(sel_sm_ec() + 1);
|
|
|
|
/* handle cpuid overrides */
|
|
unsynchronized_vcpu->executor.add(this, receive_static<CpuMessage>);
|
|
}
|
|
|
|
/**
|
|
* Destructor
|
|
*/
|
|
~Vcpu_dispatcher() { }
|
|
|
|
|
|
/***********************************
|
|
** Handlers for 'StaticReceiver' **
|
|
***********************************/
|
|
|
|
bool receive(CpuMessage &msg)
|
|
{
|
|
if (msg.type != CpuMessage::TYPE_CPUID)
|
|
return false;
|
|
|
|
/*
|
|
* Linux kernels with guest KVM support compiled in, executed
|
|
* CPUID to query the presence of KVM.
|
|
*/
|
|
enum { CPUID_KVM_SIGNATURE = 0x40000000 };
|
|
|
|
switch (msg.cpuid_index) {
|
|
|
|
case CPUID_KVM_SIGNATURE:
|
|
|
|
msg.cpu->eax = 0;
|
|
msg.cpu->ebx = 0;
|
|
msg.cpu->ecx = 0;
|
|
msg.cpu->edx = 0;
|
|
break;
|
|
|
|
default:
|
|
PDBG("CpuMessage::TYPE_CPUID index %x ignored, return true)",
|
|
msg.cpuid_index);
|
|
}
|
|
|
|
return true;
|
|
}
|
|
};
|
|
|
|
|
|
const void * _forward_pkt;
|
|
|
|
|
|
class Machine : public StaticReceiver<Machine>
|
|
{
|
|
private:
|
|
|
|
Genode::Rom_connection _hip_rom;
|
|
Hip * const _hip;
|
|
Genode::Cap_connection _cap;
|
|
Clock _clock;
|
|
Genode::Lock _motherboard_lock;
|
|
Motherboard _unsynchronized_motherboard;
|
|
Synced_motherboard _motherboard;
|
|
Genode::Lock _timeouts_lock;
|
|
TimeoutList<32, void> _unsynchronized_timeouts;
|
|
Synced_timeout_list _timeouts;
|
|
Guest_memory &_guest_memory;
|
|
Boot_module_provider &_boot_modules;
|
|
Alarm_thread *_alarm_thread;
|
|
|
|
bool _alloc_fb_mem; /* For detecting FB alloc message */
|
|
bool _colocate_vm_vmm;
|
|
unsigned short _vcpus_up;
|
|
|
|
Nic::Session *_nic;
|
|
Rtc::Session *_rtc;
|
|
|
|
public:
|
|
|
|
/*********************************************
|
|
** Callbacks registered at the motherboard **
|
|
*********************************************/
|
|
|
|
bool receive(MessageHostOp &msg)
|
|
{
|
|
switch (msg.type) {
|
|
|
|
/**
|
|
* Request available guest memory starting at specified address
|
|
*/
|
|
case MessageHostOp::OP_GUEST_MEM:
|
|
|
|
if (verbose_debug)
|
|
Logging::printf("OP_GUEST_MEM value=0x%lx\n", msg.value);
|
|
|
|
if (_alloc_fb_mem) {
|
|
msg.len = _guest_memory.fb_size();
|
|
msg.ptr = _guest_memory.backing_store_local_base();
|
|
_alloc_fb_mem = false;
|
|
Logging::printf("_alloc_fb_mem -> len=0x%zx, ptr=0x%p\n",
|
|
msg.len, msg.ptr);
|
|
return true;
|
|
}
|
|
|
|
if (msg.value >= _guest_memory.remaining_size) {
|
|
msg.value = 0;
|
|
} else {
|
|
msg.len = _guest_memory.remaining_size - msg.value;
|
|
msg.ptr = _guest_memory.backing_store_local_base() + msg.value;
|
|
}
|
|
|
|
if (verbose_debug)
|
|
Logging::printf(" -> len=0x%zx, ptr=0x%p\n",
|
|
msg.len, msg.ptr);
|
|
return true;
|
|
|
|
/**
|
|
* Cut off upper range of guest memory by specified amount
|
|
*/
|
|
case MessageHostOp::OP_ALLOC_FROM_GUEST:
|
|
|
|
if (verbose_debug)
|
|
Logging::printf("OP_ALLOC_FROM_GUEST\n");
|
|
|
|
if (msg.value == _guest_memory.fb_size()) {
|
|
_alloc_fb_mem = true;
|
|
msg.phys = _guest_memory.remaining_size;
|
|
return true;
|
|
}
|
|
|
|
if (msg.value > _guest_memory.remaining_size)
|
|
return false;
|
|
|
|
_guest_memory.remaining_size -= msg.value;
|
|
|
|
msg.phys = _guest_memory.remaining_size;
|
|
|
|
if (verbose_debug)
|
|
Logging::printf("-> allocated from guest %08zx+%lx\n",
|
|
_guest_memory.remaining_size, msg.value);
|
|
return true;
|
|
|
|
case MessageHostOp::OP_VCPU_CREATE_BACKEND:
|
|
{
|
|
if (verbose_debug)
|
|
Logging::printf("OP_VCPU_CREATE_BACKEND\n");
|
|
|
|
_vcpus_up ++;
|
|
|
|
Vmm::Vcpu_thread * vcpu_thread;
|
|
Genode::Cpu_session * cpu_session = Genode::env()->cpu_session();
|
|
Genode::Affinity::Space cpu_space = cpu_session->affinity_space();
|
|
Genode::Affinity::Location location = cpu_space.location_of_index(_vcpus_up);
|
|
|
|
if (_colocate_vm_vmm)
|
|
vcpu_thread = new Vmm::Vcpu_same_pd(Vcpu_dispatcher::STACK_SIZE, cpu_session, location);
|
|
else
|
|
vcpu_thread = new Vmm::Vcpu_other_pd(cpu_session, location);
|
|
|
|
Vcpu_dispatcher *vcpu_dispatcher =
|
|
new Vcpu_dispatcher(_motherboard_lock,
|
|
_cap,
|
|
msg.vcpu,
|
|
_guest_memory,
|
|
_motherboard,
|
|
_hip->has_feature_svm(),
|
|
_hip->has_feature_vmx(),
|
|
vcpu_thread,
|
|
cpu_session,
|
|
location);
|
|
|
|
msg.value = vcpu_dispatcher->sel_sm_ec();
|
|
return true;
|
|
}
|
|
|
|
case MessageHostOp::OP_VCPU_RELEASE:
|
|
|
|
if (verbose_debug)
|
|
Logging::printf("OP_VCPU_RELEASE\n");
|
|
|
|
if (msg.len) {
|
|
if (Nova::sm_ctrl(msg.value, Nova::SEMAPHORE_UP) != 0) {
|
|
Logging::printf("vcpu release: sm_ctrl failed\n");
|
|
return false;
|
|
}
|
|
}
|
|
return (Nova::ec_ctrl(Nova::EC_RECALL, msg.value + 1) == 0);
|
|
|
|
case MessageHostOp::OP_VCPU_BLOCK:
|
|
{
|
|
if (verbose_debug)
|
|
Logging::printf("OP_VCPU_BLOCK\n");
|
|
|
|
_motherboard_lock.unlock();
|
|
bool res = (Nova::sm_ctrl(msg.value, Nova::SEMAPHORE_DOWN) == 0);
|
|
if (verbose_debug)
|
|
Logging::printf("woke up from vcpu sem, block on global_lock\n");
|
|
_motherboard_lock.lock();
|
|
return res;
|
|
}
|
|
|
|
case MessageHostOp::OP_GET_MODULE:
|
|
{
|
|
/*
|
|
* Module indices start with 1
|
|
*/
|
|
if (msg.module == 0)
|
|
return false;
|
|
|
|
/*
|
|
* Message arguments
|
|
*/
|
|
int const index = msg.module - 1;
|
|
char * const data_dst = msg.start;
|
|
Genode::size_t const dst_len = msg.size;
|
|
|
|
/*
|
|
* Copy module data to guest RAM
|
|
*/
|
|
Genode::size_t data_len = 0;
|
|
try {
|
|
data_len = _boot_modules.data(index, data_dst, dst_len);
|
|
} catch (Boot_module_provider::Destination_buffer_too_small) {
|
|
Logging::panic("could not load module, destination buffer too small\n");
|
|
return false;
|
|
} catch (Boot_module_provider::Module_loading_failed) {
|
|
Logging::panic("could not load module %d,"
|
|
" unknown reason\n", index);
|
|
return false;
|
|
}
|
|
|
|
/*
|
|
* Detect end of module list
|
|
*/
|
|
if (data_len == 0)
|
|
return false;
|
|
|
|
/*
|
|
* Determine command line offset relative to the start of
|
|
* the loaded boot module. The command line resides right
|
|
* behind the module data, aligned on a page boundary.
|
|
*/
|
|
Genode::addr_t const cmdline_offset =
|
|
Genode::align_addr(data_len, Vmm::PAGE_SIZE_LOG2);
|
|
|
|
if (cmdline_offset >= dst_len) {
|
|
Logging::printf("destination buffer too small for command line\n");
|
|
return false;
|
|
}
|
|
|
|
/*
|
|
* Copy command line to guest RAM
|
|
*/
|
|
Genode::size_t const cmdline_len =
|
|
_boot_modules.cmdline(index, data_dst + cmdline_offset,
|
|
dst_len - cmdline_offset);
|
|
|
|
/*
|
|
* Return module size (w/o the size of the command line,
|
|
* the 'vbios_multiboot' is aware of the one-page gap
|
|
* between modules.
|
|
*/
|
|
msg.size = data_len;
|
|
msg.cmdline = data_dst + cmdline_offset;
|
|
msg.cmdlen = cmdline_len;
|
|
|
|
return true;
|
|
}
|
|
case MessageHostOp::OP_GET_MAC:
|
|
{
|
|
Nic::Packet_allocator *tx_block_alloc =
|
|
new (Genode::env()->heap()) Nic::Packet_allocator(Genode::env()->heap());
|
|
|
|
enum {
|
|
PACKET_SIZE = Nic::Packet_allocator::DEFAULT_PACKET_SIZE,
|
|
BUF_SIZE = Nic::Session::QUEUE_SIZE * PACKET_SIZE,
|
|
};
|
|
|
|
try {
|
|
_nic = new Nic::Connection(tx_block_alloc, BUF_SIZE, BUF_SIZE);
|
|
} catch (...) {
|
|
Logging::printf("No NIC connection possible!\n");
|
|
return false;
|
|
}
|
|
|
|
PINF("Our mac address is %2x:%2x:%2x:%2x:%2x:%2x\n",
|
|
_nic->mac_address().addr[0],
|
|
_nic->mac_address().addr[1],
|
|
_nic->mac_address().addr[2],
|
|
_nic->mac_address().addr[3],
|
|
_nic->mac_address().addr[4],
|
|
_nic->mac_address().addr[5]
|
|
);
|
|
msg.mac = ((Genode::uint64_t)_nic->mac_address().addr[0] & 0xff) << 40 |
|
|
((Genode::uint64_t)_nic->mac_address().addr[1] & 0xff) << 32 |
|
|
((Genode::uint64_t)_nic->mac_address().addr[2] & 0xff) << 24 |
|
|
((Genode::uint64_t)_nic->mac_address().addr[3] & 0xff) << 16 |
|
|
((Genode::uint64_t)_nic->mac_address().addr[4] & 0xff) << 8 |
|
|
((Genode::uint64_t)_nic->mac_address().addr[5] & 0xff);
|
|
|
|
/* start receiver thread for this MAC */
|
|
Vancouver_network * netreceiver = new Vancouver_network(_motherboard, _nic);
|
|
assert(netreceiver);
|
|
|
|
return true;
|
|
}
|
|
default:
|
|
|
|
PWRN("HostOp %d not implemented", msg.type);
|
|
return false;
|
|
}
|
|
}
|
|
|
|
bool receive(MessageDisk &msg)
|
|
{
|
|
if (verbose_debug)
|
|
PDBG("MessageDisk");
|
|
return false;
|
|
}
|
|
|
|
bool receive(MessageTimer &msg)
|
|
{
|
|
switch (msg.type) {
|
|
case MessageTimer::TIMER_NEW:
|
|
|
|
if (verbose_debug)
|
|
Logging::printf("TIMER_NEW\n");
|
|
|
|
if (_alarm_thread == NULL) {
|
|
Logging::printf("Creating alarm thread\n");
|
|
_alarm_thread = new Alarm_thread(_motherboard, _timeouts);
|
|
}
|
|
|
|
msg.nr = _timeouts()->alloc();
|
|
|
|
return true;
|
|
|
|
case MessageTimer::TIMER_REQUEST_TIMEOUT:
|
|
|
|
if (_timeouts()->request(msg.nr, msg.abstime) < 0)
|
|
Logging::printf("Could not program timeout.\n");
|
|
|
|
return true;
|
|
|
|
default:
|
|
return false;
|
|
};
|
|
}
|
|
|
|
bool receive(MessageTime &msg)
|
|
{
|
|
Genode::Lock::Guard guard(*utcb_lock());
|
|
utcb_backup = *Genode::Thread_base::myself()->utcb();
|
|
|
|
if (!_rtc) {
|
|
try {
|
|
_rtc = new Rtc::Connection;
|
|
} catch (...) {
|
|
Logging::printf("No RTC present, returning dummy time.\n");
|
|
msg.wallclocktime = msg.timestamp = 0;
|
|
|
|
*Genode::Thread_base::myself()->utcb() = utcb_backup;
|
|
|
|
return true;
|
|
}
|
|
}
|
|
|
|
Rtc::Timestamp rtc_ts = _rtc->current_time();
|
|
tm_simple tms(rtc_ts.year, rtc_ts.month, rtc_ts.day, rtc_ts.hour,
|
|
rtc_ts.minute, rtc_ts.second);
|
|
|
|
msg.wallclocktime = mktime(&tms) * MessageTime::FREQUENCY;
|
|
Logging::printf("Got time %llx\n", msg.wallclocktime);
|
|
msg.timestamp = _unsynchronized_motherboard.clock()->clock(MessageTime::FREQUENCY);
|
|
|
|
*Genode::Thread_base::myself()->utcb() = utcb_backup;
|
|
|
|
return true;
|
|
}
|
|
|
|
bool receive(MessageNetwork &msg)
|
|
{
|
|
if (msg.type != MessageNetwork::PACKET) return false;
|
|
|
|
Genode::Lock::Guard guard(*utcb_lock());
|
|
utcb_backup = *Genode::Thread_base::myself()->utcb();
|
|
|
|
if (msg.buffer == _forward_pkt) {
|
|
/* don't end in an endless forwarding loop */
|
|
return false;
|
|
}
|
|
|
|
/* allocate transmit packet */
|
|
Nic::Packet_descriptor tx_packet;
|
|
try {
|
|
tx_packet = _nic->tx()->alloc_packet(msg.len);
|
|
} catch (Nic::Session::Tx::Source::Packet_alloc_failed) {
|
|
PERR("tx packet alloc failed");
|
|
return false;
|
|
}
|
|
|
|
/* fill packet with content */
|
|
char *tx_content = _nic->tx()->packet_content(tx_packet);
|
|
_forward_pkt = tx_content;
|
|
for (unsigned i = 0; i < msg.len; i++) {
|
|
tx_content[i] = msg.buffer[i];
|
|
}
|
|
_nic->tx()->submit_packet(tx_packet);
|
|
|
|
/* wait for acknowledgement */
|
|
Nic::Packet_descriptor ack_tx_packet = _nic->tx()->get_acked_packet();
|
|
|
|
if (ack_tx_packet.size() != tx_packet.size()
|
|
|| ack_tx_packet.offset() != tx_packet.offset()) {
|
|
PERR("unexpected acked packet");
|
|
}
|
|
|
|
/* release sent packet to free the space in the tx communication buffer */
|
|
_nic->tx()->release_packet(tx_packet);
|
|
|
|
*Genode::Thread_base::myself()->utcb() = utcb_backup;
|
|
|
|
return true;
|
|
}
|
|
|
|
bool receive(MessagePciConfig &msg)
|
|
{
|
|
if (verbose_debug)
|
|
PDBG("MessagePciConfig");
|
|
return false;
|
|
}
|
|
|
|
bool receive(MessageAcpi &msg)
|
|
{
|
|
if (verbose_debug)
|
|
PDBG("MessageAcpi");
|
|
return false;
|
|
}
|
|
|
|
bool receive(MessageLegacy &msg)
|
|
{
|
|
if (msg.type == MessageLegacy::RESET) {
|
|
Logging::printf("MessageLegacy::RESET requested\n");
|
|
return true;
|
|
}
|
|
return false;
|
|
}
|
|
|
|
/**
|
|
* Constructor
|
|
*/
|
|
Machine(Boot_module_provider &boot_modules, Guest_memory &guest_memory,
|
|
bool colocate)
|
|
:
|
|
_hip_rom("hypervisor_info_page"),
|
|
_hip(Genode::env()->rm_session()->attach(_hip_rom.dataspace())),
|
|
_clock(_hip->tsc_freq*1000),
|
|
_motherboard_lock(Genode::Lock::LOCKED),
|
|
_unsynchronized_motherboard(&_clock, _hip),
|
|
_motherboard(_motherboard_lock, &_unsynchronized_motherboard),
|
|
_timeouts(_timeouts_lock, &_unsynchronized_timeouts),
|
|
_guest_memory(guest_memory),
|
|
_boot_modules(boot_modules),
|
|
_colocate_vm_vmm(colocate),
|
|
_vcpus_up(0)
|
|
{
|
|
_timeouts()->init();
|
|
|
|
/* register host operations, called back by the VMM */
|
|
_unsynchronized_motherboard.bus_hostop.add (this, receive_static<MessageHostOp>);
|
|
_unsynchronized_motherboard.bus_disk.add (this, receive_static<MessageDisk>);
|
|
_unsynchronized_motherboard.bus_timer.add (this, receive_static<MessageTimer>);
|
|
_unsynchronized_motherboard.bus_time.add (this, receive_static<MessageTime>);
|
|
_unsynchronized_motherboard.bus_network.add (this, receive_static<MessageNetwork>);
|
|
_unsynchronized_motherboard.bus_hwpcicfg.add(this, receive_static<MessageHwPciConfig>);
|
|
_unsynchronized_motherboard.bus_acpi.add (this, receive_static<MessageAcpi>);
|
|
_unsynchronized_motherboard.bus_legacy.add (this, receive_static<MessageLegacy>);
|
|
}
|
|
|
|
|
|
/**
|
|
* Exception type thrown on configuration errors
|
|
*/
|
|
class Config_error { };
|
|
|
|
|
|
/**
|
|
* Configure virtual machine according to the provided XML description
|
|
*
|
|
* \param machine_node XML node containing device-model sub nodes
|
|
* \throw Config_error
|
|
*
|
|
* Device models are instantiated in the order of appearance in the XML
|
|
* configuration.
|
|
*/
|
|
void setup_devices(Genode::Xml_node machine_node)
|
|
{
|
|
using namespace Genode;
|
|
|
|
Xml_node node = machine_node.sub_node();
|
|
for (;; node = node.next()) {
|
|
|
|
enum { MODEL_NAME_MAX_LEN = 32 };
|
|
char name[MODEL_NAME_MAX_LEN];
|
|
node.type_name(name, sizeof(name));
|
|
|
|
PINF("device: %s", name);
|
|
Device_model_info *dmi = device_model_registry()->lookup(name);
|
|
|
|
if (!dmi) {
|
|
PERR("configuration error: device model '%s' does not exist", name);
|
|
throw Config_error();
|
|
}
|
|
|
|
/*
|
|
* Read device-model arguments into 'argv' array
|
|
*/
|
|
enum { MAX_ARGS = 8 };
|
|
unsigned long argv[MAX_ARGS];
|
|
|
|
for (int i = 0; i < MAX_ARGS; i++)
|
|
argv[i] = ~0UL;
|
|
|
|
for (int i = 0; dmi->arg_names[i] && (i < MAX_ARGS); i++) {
|
|
|
|
try {
|
|
Xml_node::Attribute arg = node.attribute(dmi->arg_names[i]);
|
|
arg.value(&argv[i]);
|
|
|
|
PINF(" arg[%d]: 0x%x", i, (int)argv[i]);
|
|
}
|
|
catch (Xml_node::Nonexistent_attribute) { }
|
|
}
|
|
|
|
/*
|
|
* Initialize new instance of device model
|
|
*
|
|
* We never pass any argument string to a device model because
|
|
* it is not examined by the existing device models.
|
|
*/
|
|
dmi->create(_unsynchronized_motherboard, argv, "", 0);
|
|
|
|
if (node.is_last())
|
|
break;
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Reset the machine and unblock the VCPUs
|
|
*/
|
|
void boot()
|
|
{
|
|
PINF("VM and VMM are %s. VM is starting with %u %s.",
|
|
_colocate_vm_vmm ? "co-located" : "not co-located",
|
|
_vcpus_up, _vcpus_up > 1 ? "vCPUs" : "vCPU");
|
|
|
|
/* init VCPUs */
|
|
for (VCpu *vcpu = _unsynchronized_motherboard.last_vcpu; vcpu; vcpu = vcpu->get_last()) {
|
|
|
|
/* init CPU strings */
|
|
const char *short_name = "NOVA microHV";
|
|
vcpu->set_cpuid(0, 1, reinterpret_cast<const unsigned *>(short_name)[0]);
|
|
vcpu->set_cpuid(0, 3, reinterpret_cast<const unsigned *>(short_name)[1]);
|
|
vcpu->set_cpuid(0, 2, reinterpret_cast<const unsigned *>(short_name)[2]);
|
|
const char *long_name = "Vancouver VMM proudly presents this VirtualCPU. ";
|
|
for (unsigned i=0; i<12; i++)
|
|
vcpu->set_cpuid(0x80000002 + (i / 4), i % 4, reinterpret_cast<const unsigned *>(long_name)[i]);
|
|
|
|
/* propagate feature flags from the host */
|
|
unsigned ebx_1=0, ecx_1=0, edx_1=0;
|
|
Cpu::cpuid(1, ebx_1, ecx_1, edx_1);
|
|
|
|
/* clflush size */
|
|
vcpu->set_cpuid(1, 1, ebx_1 & 0xff00, 0xff00ff00);
|
|
|
|
/* +SSE3,+SSSE3 */
|
|
vcpu->set_cpuid(1, 2, ecx_1, 0x00000201);
|
|
|
|
/* -PAE,-PSE36, -MTRR,+MMX,+SSE,+SSE2,+CLFLUSH,+SEP */
|
|
vcpu->set_cpuid(1, 3, edx_1, 0x0f88a9bf | (1 << 28));
|
|
}
|
|
|
|
Logging::printf("RESET device state\n");
|
|
MessageLegacy msg2(MessageLegacy::RESET, 0);
|
|
_unsynchronized_motherboard.bus_legacy.send_fifo(msg2);
|
|
|
|
Logging::printf("INIT done\n");
|
|
|
|
_motherboard_lock.unlock();
|
|
}
|
|
|
|
Synced_motherboard &motherboard() { return _motherboard; }
|
|
|
|
Motherboard &unsynchronized_motherboard() { return _unsynchronized_motherboard; }
|
|
|
|
Genode::Lock &motherboard_lock() { return _motherboard_lock; }
|
|
|
|
~Machine()
|
|
{
|
|
Genode::env()->rm_session()->detach(_hip);
|
|
}
|
|
};
|
|
|
|
|
|
extern unsigned long _prog_img_beg; /* begin of program image (link address) */
|
|
extern unsigned long _prog_img_end; /* end of program image */
|
|
|
|
|
|
int main(int argc, char **argv)
|
|
{
|
|
Genode::addr_t fb_size = 4*1024*1024;
|
|
Genode::addr_t vm_size;
|
|
unsigned colocate = 1; /* by default co-locate VM and VMM in same PD */
|
|
|
|
{
|
|
/*
|
|
* Reserve complete lower address space so that nobody else can take
|
|
* it. The context area is moved as far as possible to a high virtual
|
|
* address. So we can use its base address as upper bound. The
|
|
* reservation will be dropped when this scope is left and re-acquired
|
|
* with the actual VM size which is determined below inside this scope.
|
|
*/
|
|
Vmm::Virtual_reservation
|
|
reservation(Genode::Native_config::context_area_virtual_base());
|
|
|
|
Genode::printf("--- Vancouver VMM starting ---\n");
|
|
|
|
/* request max available memory */
|
|
vm_size = Genode::env()->ram_session()->avail();
|
|
/* reserve some memory for the VMM */
|
|
vm_size -= 8 * 1024 * 1024;
|
|
/* calculate max memory for the VM */
|
|
vm_size = vm_size & ~((1UL << Vmm::PAGE_SIZE_LOG2) - 1);
|
|
|
|
/* Find out framebuffer size (default: 4 MiB) */
|
|
try {
|
|
Genode::Xml_node node = Genode::config()->xml_node().sub_node("machine").sub_node("vga");
|
|
Genode::Xml_node::Attribute arg = node.attribute("fb_size");
|
|
|
|
unsigned long val;
|
|
arg.value(&val);
|
|
fb_size = val*1024;
|
|
} catch (...) { }
|
|
|
|
/* read out whether VM and VMM should be colocated or not */
|
|
try {
|
|
Genode::config()->xml_node().attribute("colocate").value(&colocate);
|
|
} catch (...) { }
|
|
}
|
|
|
|
if (colocate)
|
|
/* re-adjust reservation to actual VM size */
|
|
static Vmm::Virtual_reservation reservation(vm_size);
|
|
|
|
/* setup guest memory */
|
|
static Guest_memory guest_memory(vm_size, fb_size);
|
|
|
|
/* diagnostic messages */
|
|
if (colocate)
|
|
Genode::printf("[0x%012lx, 0x%012lx) - %lu MiB - VM accessible "
|
|
"memory\n", 0UL, vm_size, vm_size / 1024 / 1024);
|
|
|
|
if (guest_memory.backing_store_local_base())
|
|
Genode::printf("[0x%12p, 0x%12p) - %lu MiB - VMM accessible shadow "
|
|
"mapping of VM memory \n",
|
|
guest_memory.backing_store_local_base(),
|
|
guest_memory.backing_store_local_base() +
|
|
guest_memory.remaining_size, vm_size / 1024 / 1024);
|
|
|
|
if (guest_memory.backing_store_fb_local_base())
|
|
Genode::printf("[0x%12p, 0x%12p) - %lu MiB - VMM accessible "
|
|
"framebuffer memory of VM\n",
|
|
guest_memory.backing_store_fb_local_base(),
|
|
guest_memory.backing_store_fb_local_base() + fb_size,
|
|
fb_size / 1024 / 1024);
|
|
|
|
Genode::printf("[0x%012lx, 0x%012lx) - Genode thread context area\n",
|
|
Genode::Native_config::context_area_virtual_base(),
|
|
Genode::Native_config::context_area_virtual_base() +
|
|
Genode::Native_config::context_area_virtual_size());
|
|
|
|
Genode::printf("[0x%012lx, 0x%012lx) - VMM program image\n",
|
|
(Genode::addr_t)&_prog_img_beg,
|
|
(Genode::addr_t)&_prog_img_end);
|
|
|
|
if (!guest_memory.backing_store_local_base() ||
|
|
!guest_memory.backing_store_fb_local_base()) {
|
|
PERR("Not enough space left for %s - exit",
|
|
guest_memory.backing_store_local_base() ? "framebuffer" : "VMM");
|
|
return 1;
|
|
}
|
|
|
|
Genode::printf("\n--- Setup VM ---\n");
|
|
|
|
static Boot_module_provider
|
|
boot_modules(Genode::config()->xml_node().sub_node("multiboot"));
|
|
|
|
/* create the PC machine based on the configuration given */
|
|
static Machine machine(boot_modules, guest_memory, colocate);
|
|
|
|
/* create console thread */
|
|
Vancouver_console vcon(machine.motherboard(), fb_size, guest_memory.fb_ds());
|
|
|
|
vcon.register_host_operations(machine.unsynchronized_motherboard());
|
|
|
|
/* create disk thread */
|
|
Vancouver_disk vdisk(machine.motherboard(),
|
|
guest_memory.backing_store_local_base(),
|
|
guest_memory.backing_store_size());
|
|
|
|
vdisk.register_host_operations(machine.unsynchronized_motherboard());
|
|
|
|
machine.setup_devices(Genode::config()->xml_node().sub_node("machine"));
|
|
|
|
Genode::printf("\n--- Booting VM ---\n");
|
|
|
|
machine.boot();
|
|
|
|
Genode::sleep_forever();
|
|
return 0;
|
|
}
|