2018-02-14 06:09:43 +00:00
|
|
|
// Copyright 2018 The Chromium OS Authors. All rights reserved.
|
|
|
|
// Use of this source code is governed by a BSD-style license that can be
|
|
|
|
// found in the LICENSE file.
|
|
|
|
|
2018-12-22 00:01:56 +00:00
|
|
|
pub mod fdt;
|
|
|
|
|
2019-01-24 03:04:43 +00:00
|
|
|
use std::collections::BTreeMap;
|
2019-03-05 01:48:36 +00:00
|
|
|
use std::error::Error as StdError;
|
2019-03-02 02:07:56 +00:00
|
|
|
use std::fmt::{self, Display};
|
2018-02-14 06:09:43 +00:00
|
|
|
use std::fs::File;
|
2019-03-05 01:48:36 +00:00
|
|
|
use std::io::{self, Read, Seek, SeekFrom};
|
2018-10-15 21:32:30 +00:00
|
|
|
use std::os::unix::io::AsRawFd;
|
2018-12-04 07:37:46 +00:00
|
|
|
use std::sync::Arc;
|
2018-02-14 06:09:43 +00:00
|
|
|
|
2018-07-24 00:58:09 +00:00
|
|
|
use devices::virtio::VirtioDevice;
|
2018-10-03 17:22:32 +00:00
|
|
|
use devices::{
|
2018-10-18 23:45:13 +00:00
|
|
|
Bus, BusDevice, BusError, PciDevice, PciDeviceError, PciInterruptPin, PciRoot, ProxyDevice,
|
|
|
|
Serial,
|
2018-10-03 17:22:32 +00:00
|
|
|
};
|
2018-07-24 00:58:09 +00:00
|
|
|
use io_jail::Minijail;
|
2018-10-15 21:32:30 +00:00
|
|
|
use kvm::{IoeventAddress, Kvm, Vcpu, Vm};
|
2018-05-18 01:47:11 +00:00
|
|
|
use resources::SystemAllocator;
|
2018-12-04 07:37:46 +00:00
|
|
|
use sync::Mutex;
|
2018-12-12 23:20:30 +00:00
|
|
|
use sys_util::{syslog, EventFd, GuestAddress, GuestMemory, GuestMemoryError};
|
2018-02-14 06:09:43 +00:00
|
|
|
|
2018-07-24 00:58:09 +00:00
|
|
|
/// The collection of inputs from which a VM is assembled.
///
/// A value of this type is handed to `build_vm` of the `LinuxArch` trait, which consumes it to
/// produce a `RunnableLinuxVm`.
pub struct VmComponents {
    // NOTE(review): presumably the guest memory size in MiB, going by the `_mb` suffix - confirm.
    pub memory_mb: u64,
    // NOTE(review): presumably the number of VCPUs to create - confirm against `build_vm` impls.
    pub vcpu_count: u32,
    // NOTE(review): presumably host CPU indices the VCPU threads may run on - confirm.
    pub vcpu_affinity: Vec<usize>,
    /// Open file for the kernel image.
    pub kernel_image: File,
    /// Optional open file for an Android fstab.
    pub android_fstab: Option<File>,
    /// Optional open file for an initrd image.
    pub initrd_image: Option<File>,
    /// Additional kernel parameter strings supplied alongside the kernel image.
    pub extra_kernel_params: Vec<String>,
    // NOTE(review): presumably toggles Wayland dmabuf support - confirm with the consumer.
    pub wayland_dmabuf: bool,
}
|
|
|
|
|
|
|
|
/// Holds the elements needed to run a Linux VM. Created by `build_vm`.
|
|
|
|
pub struct RunnableLinuxVm {
|
|
|
|
pub vm: Vm,
|
|
|
|
pub kvm: Kvm,
|
|
|
|
pub resources: SystemAllocator,
|
|
|
|
pub stdio_serial: Arc<Mutex<Serial>>,
|
|
|
|
pub exit_evt: EventFd,
|
|
|
|
pub vcpus: Vec<Vcpu>,
|
2019-04-05 16:58:48 +00:00
|
|
|
pub vcpu_affinity: Vec<usize>,
|
2018-07-24 00:58:09 +00:00
|
|
|
pub irq_chip: Option<File>,
|
|
|
|
pub io_bus: Bus,
|
|
|
|
pub mmio_bus: Bus,
|
2019-01-24 03:04:43 +00:00
|
|
|
pub pid_debug_label_map: BTreeMap<u32, String>,
|
2018-07-24 00:58:09 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/// The device and optional jail.
|
|
|
|
pub struct VirtioDeviceStub {
|
2019-03-09 00:56:14 +00:00
|
|
|
pub dev: Box<dyn VirtioDevice>,
|
2018-07-24 00:58:09 +00:00
|
|
|
pub jail: Option<Minijail>,
|
|
|
|
}
|
|
|
|
|
2018-02-14 06:09:43 +00:00
|
|
|
/// Trait which is implemented for each Linux Architecture in order to
|
|
|
|
/// set up the memory, cpus, and system devices and to boot the kernel.
|
|
|
|
pub trait LinuxArch {
|
2019-03-05 01:48:36 +00:00
|
|
|
type Error: StdError;
|
|
|
|
|
2018-07-24 00:58:09 +00:00
|
|
|
/// Takes `VmComponents` and generates a `RunnableLinuxVm`.
|
2018-02-14 06:09:43 +00:00
|
|
|
///
|
|
|
|
/// # Arguments
|
|
|
|
///
|
2018-07-24 00:58:09 +00:00
|
|
|
/// * `components` - Parts to use to build the VM.
|
2019-01-30 05:21:48 +00:00
|
|
|
/// * `split_irqchip` - whether to use a split IRQ chip (i.e. userspace PIT/PIC/IOAPIC)
|
2019-02-20 21:50:42 +00:00
|
|
|
/// * `create_devices` - Function to generate a list of devices.
|
2019-03-05 01:48:36 +00:00
|
|
|
fn build_vm<F, E>(
|
2019-01-30 05:21:48 +00:00
|
|
|
components: VmComponents,
|
|
|
|
split_irqchip: bool,
|
2019-02-20 21:50:42 +00:00
|
|
|
create_devices: F,
|
2019-03-05 01:48:36 +00:00
|
|
|
) -> Result<RunnableLinuxVm, Self::Error>
|
2018-10-03 17:22:32 +00:00
|
|
|
where
|
2019-03-09 00:56:14 +00:00
|
|
|
F: FnOnce(&GuestMemory, &EventFd) -> Result<Vec<(Box<dyn PciDevice>, Option<Minijail>)>, E>,
|
2019-03-05 01:48:36 +00:00
|
|
|
E: StdError + 'static;
|
2018-07-24 00:58:09 +00:00
|
|
|
}
|
2018-02-14 06:09:43 +00:00
|
|
|
|
2018-07-24 00:58:09 +00:00
|
|
|
/// Errors for device manager.
|
|
|
|
#[derive(Debug)]
|
2018-07-09 22:39:34 +00:00
|
|
|
pub enum DeviceRegistrationError {
|
|
|
|
/// Could not allocate IO space for the device.
|
|
|
|
AllocateIoAddrs(PciDeviceError),
|
2019-02-21 02:56:22 +00:00
|
|
|
/// Could not allocate device address space for the device.
|
|
|
|
AllocateDeviceAddrs(PciDeviceError),
|
2018-07-09 22:39:34 +00:00
|
|
|
/// Could not allocate an IRQ number.
|
|
|
|
AllocateIrq,
|
2018-07-24 00:58:09 +00:00
|
|
|
/// Could not create the mmio device to wrap a VirtioDevice.
|
|
|
|
CreateMmioDevice(sys_util::Error),
|
2018-07-09 22:39:34 +00:00
|
|
|
/// Could not create an event fd.
|
|
|
|
EventFdCreate(sys_util::Error),
|
|
|
|
/// Could not add a device to the mmio bus.
|
|
|
|
MmioInsert(BusError),
|
2018-07-24 00:58:09 +00:00
|
|
|
/// Failed to register ioevent with VM.
|
|
|
|
RegisterIoevent(sys_util::Error),
|
|
|
|
/// Failed to register irq eventfd with VM.
|
|
|
|
RegisterIrqfd(sys_util::Error),
|
|
|
|
/// Failed to initialize proxy device for jailed device.
|
|
|
|
ProxyDeviceCreation(devices::ProxyError),
|
|
|
|
/// Appending to kernel command line failed.
|
|
|
|
Cmdline(kernel_cmdline::Error),
|
|
|
|
/// No more IRQs are available.
|
|
|
|
IrqsExhausted,
|
|
|
|
/// No more MMIO space available.
|
|
|
|
AddrsExhausted,
|
2019-03-15 20:13:08 +00:00
|
|
|
/// Could not register PCI device capabilities.
|
|
|
|
RegisterDeviceCapabilities(PciDeviceError),
|
2018-07-24 00:58:09 +00:00
|
|
|
}
|
2018-02-14 06:09:43 +00:00
|
|
|
|
2019-03-02 02:07:56 +00:00
|
|
|
impl Display for DeviceRegistrationError {
|
2018-07-24 00:58:09 +00:00
|
|
|
fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
|
2019-03-02 02:07:56 +00:00
|
|
|
use self::DeviceRegistrationError::*;
|
|
|
|
|
2018-07-24 00:58:09 +00:00
|
|
|
match self {
|
2019-03-02 02:07:56 +00:00
|
|
|
AllocateIoAddrs(e) => write!(f, "Allocating IO addresses: {}", e),
|
|
|
|
AllocateDeviceAddrs(e) => write!(f, "Allocating device addresses: {}", e),
|
|
|
|
AllocateIrq => write!(f, "Allocating IRQ number"),
|
|
|
|
CreateMmioDevice(e) => write!(f, "failed to create mmio device: {}", e),
|
|
|
|
Cmdline(e) => write!(f, "unable to add device to kernel command line: {}", e),
|
|
|
|
EventFdCreate(e) => write!(f, "failed to create eventfd: {}", e),
|
|
|
|
MmioInsert(e) => write!(f, "failed to add to mmio bus: {}", e),
|
|
|
|
RegisterIoevent(e) => write!(f, "failed to register ioevent to VM: {}", e),
|
|
|
|
RegisterIrqfd(e) => write!(f, "failed to register irq eventfd to VM: {}", e),
|
|
|
|
ProxyDeviceCreation(e) => write!(f, "failed to create proxy device: {}", e),
|
|
|
|
IrqsExhausted => write!(f, "no more IRQs are available"),
|
|
|
|
AddrsExhausted => write!(f, "no more addresses are available"),
|
2019-03-15 20:13:08 +00:00
|
|
|
RegisterDeviceCapabilities(e) => {
|
|
|
|
write!(f, "could not register PCI device capabilities: {}", e)
|
|
|
|
}
|
2018-07-09 22:39:34 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Creates a root PCI device for use by this Vm.
|
2018-10-03 17:22:32 +00:00
|
|
|
pub fn generate_pci_root(
|
2019-03-09 00:56:14 +00:00
|
|
|
devices: Vec<(Box<dyn PciDevice>, Option<Minijail>)>,
|
2018-10-03 17:22:32 +00:00
|
|
|
mmio_bus: &mut Bus,
|
|
|
|
resources: &mut SystemAllocator,
|
|
|
|
vm: &mut Vm,
|
2019-03-05 01:48:36 +00:00
|
|
|
) -> Result<(PciRoot, Vec<(u32, PciInterruptPin)>, BTreeMap<u32, String>), DeviceRegistrationError>
|
|
|
|
{
|
2018-07-09 22:39:34 +00:00
|
|
|
let mut root = PciRoot::new();
|
|
|
|
let mut pci_irqs = Vec::new();
|
2019-01-24 03:04:43 +00:00
|
|
|
let mut pid_labels = BTreeMap::new();
|
2018-07-09 22:39:34 +00:00
|
|
|
for (dev_idx, (mut device, jail)) in devices.into_iter().enumerate() {
|
2018-09-20 17:59:06 +00:00
|
|
|
let mut keep_fds = device.keep_fds();
|
2018-07-09 22:39:34 +00:00
|
|
|
syslog::push_fds(&mut keep_fds);
|
|
|
|
|
|
|
|
let irqfd = EventFd::new().map_err(DeviceRegistrationError::EventFdCreate)?;
|
2018-10-25 00:06:07 +00:00
|
|
|
let irq_resample_fd = EventFd::new().map_err(DeviceRegistrationError::EventFdCreate)?;
|
2018-07-09 20:35:40 +00:00
|
|
|
let irq_num = resources
|
|
|
|
.allocate_irq()
|
|
|
|
.ok_or(DeviceRegistrationError::AllocateIrq)? as u32;
|
2018-07-09 22:39:34 +00:00
|
|
|
let pci_irq_pin = match dev_idx % 4 {
|
|
|
|
0 => PciInterruptPin::IntA,
|
|
|
|
1 => PciInterruptPin::IntB,
|
|
|
|
2 => PciInterruptPin::IntC,
|
|
|
|
3 => PciInterruptPin::IntD,
|
|
|
|
_ => panic!(""), // Obviously not possible, but the compiler is not smart enough.
|
|
|
|
};
|
2018-10-25 00:06:07 +00:00
|
|
|
vm.register_irqfd_resample(&irqfd, &irq_resample_fd, irq_num)
|
2018-09-17 21:42:59 +00:00
|
|
|
.map_err(DeviceRegistrationError::RegisterIrqfd)?;
|
|
|
|
keep_fds.push(irqfd.as_raw_fd());
|
2018-10-25 00:06:07 +00:00
|
|
|
keep_fds.push(irq_resample_fd.as_raw_fd());
|
|
|
|
device.assign_irq(irqfd, irq_resample_fd, irq_num, pci_irq_pin);
|
2018-09-17 21:42:59 +00:00
|
|
|
pci_irqs.push((dev_idx as u32, pci_irq_pin));
|
2018-07-09 22:39:34 +00:00
|
|
|
|
|
|
|
let ranges = device
|
|
|
|
.allocate_io_bars(resources)
|
|
|
|
.map_err(DeviceRegistrationError::AllocateIoAddrs)?;
|
2019-02-21 02:56:22 +00:00
|
|
|
let device_ranges = device
|
|
|
|
.allocate_device_bars(resources)
|
|
|
|
.map_err(DeviceRegistrationError::AllocateDeviceAddrs)?;
|
2019-03-15 20:13:08 +00:00
|
|
|
device
|
|
|
|
.register_device_capabilities()
|
|
|
|
.map_err(DeviceRegistrationError::RegisterDeviceCapabilities)?;
|
2018-10-05 21:51:22 +00:00
|
|
|
for (event, addr, datamatch) in device.ioeventfds() {
|
2018-07-09 20:35:40 +00:00
|
|
|
let io_addr = IoeventAddress::Mmio(addr);
|
2018-10-05 21:51:22 +00:00
|
|
|
vm.register_ioevent(&event, io_addr, datamatch)
|
2018-07-09 20:35:40 +00:00
|
|
|
.map_err(DeviceRegistrationError::RegisterIoevent)?;
|
|
|
|
keep_fds.push(event.as_raw_fd());
|
|
|
|
}
|
2019-03-09 00:56:14 +00:00
|
|
|
let arced_dev: Arc<Mutex<dyn BusDevice>> = if let Some(jail) = jail {
|
2018-10-18 23:45:13 +00:00
|
|
|
let proxy = ProxyDevice::new(device, &jail, keep_fds)
|
|
|
|
.map_err(DeviceRegistrationError::ProxyDeviceCreation)?;
|
2019-01-24 03:04:43 +00:00
|
|
|
pid_labels.insert(proxy.pid() as u32, proxy.debug_label());
|
2018-10-18 23:45:13 +00:00
|
|
|
Arc::new(Mutex::new(proxy))
|
|
|
|
} else {
|
2019-03-09 04:41:57 +00:00
|
|
|
device.on_sandboxed();
|
2018-10-18 23:45:13 +00:00
|
|
|
Arc::new(Mutex::new(device))
|
|
|
|
};
|
2018-07-09 22:39:34 +00:00
|
|
|
root.add_device(arced_dev.clone());
|
|
|
|
for range in &ranges {
|
2018-10-03 17:22:32 +00:00
|
|
|
mmio_bus
|
|
|
|
.insert(arced_dev.clone(), range.0, range.1, true)
|
2018-07-09 22:39:34 +00:00
|
|
|
.map_err(DeviceRegistrationError::MmioInsert)?;
|
2018-07-24 00:58:09 +00:00
|
|
|
}
|
2019-02-21 02:56:22 +00:00
|
|
|
|
|
|
|
for range in &device_ranges {
|
|
|
|
mmio_bus
|
|
|
|
.insert(arced_dev.clone(), range.0, range.1, true)
|
|
|
|
.map_err(DeviceRegistrationError::MmioInsert)?;
|
|
|
|
}
|
2018-07-24 00:58:09 +00:00
|
|
|
}
|
2019-01-24 03:04:43 +00:00
|
|
|
Ok((root, pci_irqs, pid_labels))
|
2018-07-24 00:58:09 +00:00
|
|
|
}
|
2018-12-12 23:20:30 +00:00
|
|
|
|
|
|
|
/// Errors for image loading.
|
|
|
|
#[derive(Debug)]
|
|
|
|
pub enum LoadImageError {
|
2019-03-05 01:48:36 +00:00
|
|
|
Seek(io::Error),
|
2018-12-12 23:20:30 +00:00
|
|
|
ImageSizeTooLarge(u64),
|
|
|
|
ReadToMemory(GuestMemoryError),
|
|
|
|
}
|
|
|
|
|
2019-03-02 02:07:56 +00:00
|
|
|
impl Display for LoadImageError {
|
2018-12-12 23:20:30 +00:00
|
|
|
fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
|
2019-02-13 01:51:26 +00:00
|
|
|
use self::LoadImageError::*;
|
|
|
|
|
2018-12-12 23:20:30 +00:00
|
|
|
match self {
|
2019-02-13 01:51:26 +00:00
|
|
|
Seek(e) => write!(f, "Seek failed: {}", e),
|
|
|
|
ImageSizeTooLarge(size) => write!(f, "Image size too large: {}", size),
|
|
|
|
ReadToMemory(e) => write!(f, "Reading image into memory failed: {}", e),
|
2018-12-12 23:20:30 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Load an image from a file into guest memory.
|
|
|
|
///
|
|
|
|
/// # Arguments
|
|
|
|
///
|
|
|
|
/// * `guest_mem` - The memory to be used by the guest.
|
|
|
|
/// * `guest_addr` - The starting address to load the image in the guest memory.
|
|
|
|
/// * `max_size` - The amount of space in bytes available in the guest memory for the image.
|
|
|
|
/// * `image` - The file containing the image to be loaded.
|
|
|
|
///
|
|
|
|
/// The size in bytes of the loaded image is returned.
|
|
|
|
pub fn load_image<F>(
|
|
|
|
guest_mem: &GuestMemory,
|
|
|
|
image: &mut F,
|
|
|
|
guest_addr: GuestAddress,
|
|
|
|
max_size: u64,
|
2019-03-05 01:48:36 +00:00
|
|
|
) -> Result<usize, LoadImageError>
|
2018-12-12 23:20:30 +00:00
|
|
|
where
|
|
|
|
F: Read + Seek,
|
|
|
|
{
|
|
|
|
let size = image.seek(SeekFrom::End(0)).map_err(LoadImageError::Seek)?;
|
|
|
|
|
|
|
|
if size > usize::max_value() as u64 || size > max_size {
|
|
|
|
return Err(LoadImageError::ImageSizeTooLarge(size));
|
|
|
|
}
|
|
|
|
|
|
|
|
// This is safe due to the bounds check above.
|
|
|
|
let size = size as usize;
|
|
|
|
|
|
|
|
image
|
|
|
|
.seek(SeekFrom::Start(0))
|
|
|
|
.map_err(LoadImageError::Seek)?;
|
|
|
|
|
|
|
|
guest_mem
|
|
|
|
.read_to_memory(guest_addr, image, size)
|
|
|
|
.map_err(LoadImageError::ReadToMemory)?;
|
|
|
|
|
|
|
|
Ok(size)
|
|
|
|
}
|