/*
 * Copyright (c) 2018 Intel Corporation
 * Copyright (c) 2019 Red Hat, Inc.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2 or later, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License along with
 * this program.  If not, see <http://www.gnu.org/licenses/>.
 */

#include "qemu/osdep.h"
#include "qemu/error-report.h"
#include "qemu/cutils.h"
#include "qemu/units.h"
#include "qapi/error.h"
#include "qapi/visitor.h"
#include "qapi/qapi-visit-common.h"
#include "sysemu/sysemu.h"
#include "sysemu/cpus.h"
#include "sysemu/numa.h"
#include "sysemu/reset.h"
#include "sysemu/runstate.h"
#include "acpi-microvm.h"

#include "hw/loader.h"
#include "hw/irq.h"
#include "hw/kvm/clock.h"
#include "hw/i386/microvm.h"
#include "hw/i386/x86.h"
#include "target/i386/cpu.h"
#include "hw/intc/i8259.h"
#include "hw/timer/i8254.h"
#include "hw/rtc/mc146818rtc.h"
#include "hw/char/serial.h"
#include "hw/i386/topology.h"
#include "hw/i386/e820_memory_layout.h"
#include "hw/i386/fw_cfg.h"
#include "hw/virtio/virtio-mmio.h"
#include "hw/acpi/acpi.h"
#include "hw/acpi/generic_event_device.h"

#include "cpu.h"
#include "elf.h"
#include "kvm_i386.h"
#include "hw/xen/start_info.h"

#define MICROVM_QBOOT_FILENAME "qboot.rom"
#define MICROVM_BIOS_FILENAME  "bios-microvm.bin"

570ebf007dSSergio Lopez static void microvm_set_rtc(MicrovmMachineState *mms, ISADevice *s) 580ebf007dSSergio Lopez { 590ebf007dSSergio Lopez X86MachineState *x86ms = X86_MACHINE(mms); 600ebf007dSSergio Lopez int val; 610ebf007dSSergio Lopez 620ebf007dSSergio Lopez val = MIN(x86ms->below_4g_mem_size / KiB, 640); 630ebf007dSSergio Lopez rtc_set_memory(s, 0x15, val); 640ebf007dSSergio Lopez rtc_set_memory(s, 0x16, val >> 8); 650ebf007dSSergio Lopez /* extended memory (next 64MiB) */ 660ebf007dSSergio Lopez if (x86ms->below_4g_mem_size > 1 * MiB) { 670ebf007dSSergio Lopez val = (x86ms->below_4g_mem_size - 1 * MiB) / KiB; 680ebf007dSSergio Lopez } else { 690ebf007dSSergio Lopez val = 0; 700ebf007dSSergio Lopez } 710ebf007dSSergio Lopez if (val > 65535) { 720ebf007dSSergio Lopez val = 65535; 730ebf007dSSergio Lopez } 740ebf007dSSergio Lopez rtc_set_memory(s, 0x17, val); 750ebf007dSSergio Lopez rtc_set_memory(s, 0x18, val >> 8); 760ebf007dSSergio Lopez rtc_set_memory(s, 0x30, val); 770ebf007dSSergio Lopez rtc_set_memory(s, 0x31, val >> 8); 780ebf007dSSergio Lopez /* memory between 16MiB and 4GiB */ 790ebf007dSSergio Lopez if (x86ms->below_4g_mem_size > 16 * MiB) { 800ebf007dSSergio Lopez val = (x86ms->below_4g_mem_size - 16 * MiB) / (64 * KiB); 810ebf007dSSergio Lopez } else { 820ebf007dSSergio Lopez val = 0; 830ebf007dSSergio Lopez } 840ebf007dSSergio Lopez if (val > 65535) { 850ebf007dSSergio Lopez val = 65535; 860ebf007dSSergio Lopez } 870ebf007dSSergio Lopez rtc_set_memory(s, 0x34, val); 880ebf007dSSergio Lopez rtc_set_memory(s, 0x35, val >> 8); 890ebf007dSSergio Lopez /* memory above 4GiB */ 900ebf007dSSergio Lopez val = x86ms->above_4g_mem_size / 65536; 910ebf007dSSergio Lopez rtc_set_memory(s, 0x5b, val); 920ebf007dSSergio Lopez rtc_set_memory(s, 0x5c, val >> 8); 930ebf007dSSergio Lopez rtc_set_memory(s, 0x5d, val >> 16); 940ebf007dSSergio Lopez } 950ebf007dSSergio Lopez 960ebf007dSSergio Lopez static void microvm_gsi_handler(void *opaque, int n, int level) 
970ebf007dSSergio Lopez { 980ebf007dSSergio Lopez GSIState *s = opaque; 990ebf007dSSergio Lopez 1000ebf007dSSergio Lopez qemu_set_irq(s->ioapic_irq[n], level); 1010ebf007dSSergio Lopez } 1020ebf007dSSergio Lopez 1030ebf007dSSergio Lopez static void microvm_devices_init(MicrovmMachineState *mms) 1040ebf007dSSergio Lopez { 1050ebf007dSSergio Lopez X86MachineState *x86ms = X86_MACHINE(mms); 1060ebf007dSSergio Lopez ISABus *isa_bus; 1070ebf007dSSergio Lopez ISADevice *rtc_state; 1080ebf007dSSergio Lopez GSIState *gsi_state; 1090ebf007dSSergio Lopez int i; 1100ebf007dSSergio Lopez 1110ebf007dSSergio Lopez /* Core components */ 1120ebf007dSSergio Lopez 1130ebf007dSSergio Lopez gsi_state = g_malloc0(sizeof(*gsi_state)); 1140ebf007dSSergio Lopez if (mms->pic == ON_OFF_AUTO_ON || mms->pic == ON_OFF_AUTO_AUTO) { 1150ebf007dSSergio Lopez x86ms->gsi = qemu_allocate_irqs(gsi_handler, gsi_state, GSI_NUM_PINS); 1160ebf007dSSergio Lopez } else { 1170ebf007dSSergio Lopez x86ms->gsi = qemu_allocate_irqs(microvm_gsi_handler, 1180ebf007dSSergio Lopez gsi_state, GSI_NUM_PINS); 1190ebf007dSSergio Lopez } 1200ebf007dSSergio Lopez 1210ebf007dSSergio Lopez isa_bus = isa_bus_new(NULL, get_system_memory(), get_system_io(), 1220ebf007dSSergio Lopez &error_abort); 1230ebf007dSSergio Lopez isa_bus_irqs(isa_bus, x86ms->gsi); 1240ebf007dSSergio Lopez 1250ebf007dSSergio Lopez ioapic_init_gsi(gsi_state, "machine"); 1260ebf007dSSergio Lopez 1270ebf007dSSergio Lopez kvmclock_create(); 1280ebf007dSSergio Lopez 12955c4b069SGerd Hoffmann mms->virtio_irq_base = x86_machine_is_acpi_enabled(x86ms) ? 
16 : 5; 1300ebf007dSSergio Lopez for (i = 0; i < VIRTIO_NUM_TRANSPORTS; i++) { 1310ebf007dSSergio Lopez sysbus_create_simple("virtio-mmio", 1320ebf007dSSergio Lopez VIRTIO_MMIO_BASE + i * 512, 133d4e9d577SGerd Hoffmann x86ms->gsi[mms->virtio_irq_base + i]); 1340ebf007dSSergio Lopez } 1350ebf007dSSergio Lopez 1360ebf007dSSergio Lopez /* Optional and legacy devices */ 1378045df14SGerd Hoffmann if (x86_machine_is_acpi_enabled(x86ms)) { 1388045df14SGerd Hoffmann DeviceState *dev = qdev_new(TYPE_ACPI_GED_X86); 1398045df14SGerd Hoffmann qdev_prop_set_uint32(dev, "ged-event", ACPI_GED_PWR_DOWN_EVT); 1408045df14SGerd Hoffmann sysbus_mmio_map(SYS_BUS_DEVICE(dev), 0, GED_MMIO_BASE); 1418045df14SGerd Hoffmann /* sysbus_mmio_map(SYS_BUS_DEVICE(dev), 1, GED_MMIO_BASE_MEMHP); */ 1428045df14SGerd Hoffmann sysbus_mmio_map(SYS_BUS_DEVICE(dev), 2, GED_MMIO_BASE_REGS); 1438045df14SGerd Hoffmann sysbus_connect_irq(SYS_BUS_DEVICE(dev), 0, 1448045df14SGerd Hoffmann x86ms->gsi[GED_MMIO_IRQ]); 1458045df14SGerd Hoffmann sysbus_realize(SYS_BUS_DEVICE(dev), &error_fatal); 14650aef131SGerd Hoffmann x86ms->acpi_dev = HOTPLUG_HANDLER(dev); 1478045df14SGerd Hoffmann } 1480ebf007dSSergio Lopez 1490ebf007dSSergio Lopez if (mms->pic == ON_OFF_AUTO_ON || mms->pic == ON_OFF_AUTO_AUTO) { 1500ebf007dSSergio Lopez qemu_irq *i8259; 1510ebf007dSSergio Lopez 15289a289c7SPaolo Bonzini i8259 = i8259_init(isa_bus, x86_allocate_cpu_irq()); 1530ebf007dSSergio Lopez for (i = 0; i < ISA_NUM_IRQS; i++) { 1540ebf007dSSergio Lopez gsi_state->i8259_irq[i] = i8259[i]; 1550ebf007dSSergio Lopez } 1560ebf007dSSergio Lopez g_free(i8259); 1570ebf007dSSergio Lopez } 1580ebf007dSSergio Lopez 1590ebf007dSSergio Lopez if (mms->pit == ON_OFF_AUTO_ON || mms->pit == ON_OFF_AUTO_AUTO) { 1600ebf007dSSergio Lopez if (kvm_pit_in_kernel()) { 1610ebf007dSSergio Lopez kvm_pit_init(isa_bus, 0x40); 1620ebf007dSSergio Lopez } else { 1630ebf007dSSergio Lopez i8254_pit_init(isa_bus, 0x40, 0, NULL); 1640ebf007dSSergio Lopez } 
1650ebf007dSSergio Lopez } 1660ebf007dSSergio Lopez 1670ebf007dSSergio Lopez if (mms->rtc == ON_OFF_AUTO_ON || 1680ebf007dSSergio Lopez (mms->rtc == ON_OFF_AUTO_AUTO && !kvm_enabled())) { 1690ebf007dSSergio Lopez rtc_state = mc146818_rtc_init(isa_bus, 2000, NULL); 1700ebf007dSSergio Lopez microvm_set_rtc(mms, rtc_state); 1710ebf007dSSergio Lopez } 1720ebf007dSSergio Lopez 1730ebf007dSSergio Lopez if (mms->isa_serial) { 1740ebf007dSSergio Lopez serial_hds_isa_init(isa_bus, 0, 1); 1750ebf007dSSergio Lopez } 1760ebf007dSSergio Lopez 1770ebf007dSSergio Lopez if (bios_name == NULL) { 17867eb6a40SGerd Hoffmann bios_name = x86_machine_is_acpi_enabled(x86ms) 17967eb6a40SGerd Hoffmann ? MICROVM_BIOS_FILENAME 18067eb6a40SGerd Hoffmann : MICROVM_QBOOT_FILENAME; 1810ebf007dSSergio Lopez } 1820ebf007dSSergio Lopez x86_bios_rom_init(get_system_memory(), true); 1830ebf007dSSergio Lopez } 1840ebf007dSSergio Lopez 1850ebf007dSSergio Lopez static void microvm_memory_init(MicrovmMachineState *mms) 1860ebf007dSSergio Lopez { 1870ebf007dSSergio Lopez MachineState *machine = MACHINE(mms); 1880ebf007dSSergio Lopez X86MachineState *x86ms = X86_MACHINE(mms); 1899ad54686SIgor Mammedov MemoryRegion *ram_below_4g, *ram_above_4g; 1900ebf007dSSergio Lopez MemoryRegion *system_memory = get_system_memory(); 1910ebf007dSSergio Lopez FWCfgState *fw_cfg; 192e289655cSGerd Hoffmann ram_addr_t lowmem = 0xc0000000; /* 3G */ 1930ebf007dSSergio Lopez int i; 1940ebf007dSSergio Lopez 1950ebf007dSSergio Lopez if (machine->ram_size > lowmem) { 1960ebf007dSSergio Lopez x86ms->above_4g_mem_size = machine->ram_size - lowmem; 1970ebf007dSSergio Lopez x86ms->below_4g_mem_size = lowmem; 1980ebf007dSSergio Lopez } else { 1990ebf007dSSergio Lopez x86ms->above_4g_mem_size = 0; 2000ebf007dSSergio Lopez x86ms->below_4g_mem_size = machine->ram_size; 2010ebf007dSSergio Lopez } 2020ebf007dSSergio Lopez 2030ebf007dSSergio Lopez ram_below_4g = g_malloc(sizeof(*ram_below_4g)); 2049ad54686SIgor Mammedov 
memory_region_init_alias(ram_below_4g, NULL, "ram-below-4g", machine->ram, 2050ebf007dSSergio Lopez 0, x86ms->below_4g_mem_size); 2060ebf007dSSergio Lopez memory_region_add_subregion(system_memory, 0, ram_below_4g); 2070ebf007dSSergio Lopez 2080ebf007dSSergio Lopez e820_add_entry(0, x86ms->below_4g_mem_size, E820_RAM); 2090ebf007dSSergio Lopez 2100ebf007dSSergio Lopez if (x86ms->above_4g_mem_size > 0) { 2110ebf007dSSergio Lopez ram_above_4g = g_malloc(sizeof(*ram_above_4g)); 2129ad54686SIgor Mammedov memory_region_init_alias(ram_above_4g, NULL, "ram-above-4g", 2139ad54686SIgor Mammedov machine->ram, 2140ebf007dSSergio Lopez x86ms->below_4g_mem_size, 2150ebf007dSSergio Lopez x86ms->above_4g_mem_size); 2160ebf007dSSergio Lopez memory_region_add_subregion(system_memory, 0x100000000ULL, 2170ebf007dSSergio Lopez ram_above_4g); 2180ebf007dSSergio Lopez e820_add_entry(0x100000000ULL, x86ms->above_4g_mem_size, E820_RAM); 2190ebf007dSSergio Lopez } 2200ebf007dSSergio Lopez 2210ebf007dSSergio Lopez fw_cfg = fw_cfg_init_io_dma(FW_CFG_IO_BASE, FW_CFG_IO_BASE + 4, 2220ebf007dSSergio Lopez &address_space_memory); 2230ebf007dSSergio Lopez 2240ebf007dSSergio Lopez fw_cfg_add_i16(fw_cfg, FW_CFG_NB_CPUS, machine->smp.cpus); 2250ebf007dSSergio Lopez fw_cfg_add_i16(fw_cfg, FW_CFG_MAX_CPUS, machine->smp.max_cpus); 2260ebf007dSSergio Lopez fw_cfg_add_i64(fw_cfg, FW_CFG_RAM_SIZE, (uint64_t)machine->ram_size); 2270ebf007dSSergio Lopez fw_cfg_add_i32(fw_cfg, FW_CFG_IRQ0_OVERRIDE, kvm_allows_irq0_override()); 2280ebf007dSSergio Lopez fw_cfg_add_bytes(fw_cfg, FW_CFG_E820_TABLE, 2290ebf007dSSergio Lopez &e820_reserve, sizeof(e820_reserve)); 2300ebf007dSSergio Lopez fw_cfg_add_file(fw_cfg, "etc/e820", e820_table, 2310ebf007dSSergio Lopez sizeof(struct e820_entry) * e820_get_num_entries()); 2320ebf007dSSergio Lopez 2330ebf007dSSergio Lopez rom_set_fw(fw_cfg); 2340ebf007dSSergio Lopez 2350ebf007dSSergio Lopez if (machine->kernel_filename != NULL) { 2360ebf007dSSergio Lopez x86_load_linux(x86ms, 
fw_cfg, 0, true, true); 2370ebf007dSSergio Lopez } 2380ebf007dSSergio Lopez 2390ebf007dSSergio Lopez if (mms->option_roms) { 2400ebf007dSSergio Lopez for (i = 0; i < nb_option_roms; i++) { 2410ebf007dSSergio Lopez rom_add_option(option_rom[i].name, option_rom[i].bootindex); 2420ebf007dSSergio Lopez } 2430ebf007dSSergio Lopez } 2440ebf007dSSergio Lopez 2450ebf007dSSergio Lopez x86ms->fw_cfg = fw_cfg; 2460ebf007dSSergio Lopez x86ms->ioapic_as = &address_space_memory; 2470ebf007dSSergio Lopez } 2480ebf007dSSergio Lopez 249d4e9d577SGerd Hoffmann static gchar *microvm_get_mmio_cmdline(gchar *name, uint32_t virtio_irq_base) 2500ebf007dSSergio Lopez { 2510ebf007dSSergio Lopez gchar *cmdline; 2520ebf007dSSergio Lopez gchar *separator; 2530ebf007dSSergio Lopez long int index; 2540ebf007dSSergio Lopez int ret; 2550ebf007dSSergio Lopez 2560ebf007dSSergio Lopez separator = g_strrstr(name, "."); 2570ebf007dSSergio Lopez if (!separator) { 2580ebf007dSSergio Lopez return NULL; 2590ebf007dSSergio Lopez } 2600ebf007dSSergio Lopez 2610ebf007dSSergio Lopez if (qemu_strtol(separator + 1, NULL, 10, &index) != 0) { 2620ebf007dSSergio Lopez return NULL; 2630ebf007dSSergio Lopez } 2640ebf007dSSergio Lopez 2650ebf007dSSergio Lopez cmdline = g_malloc0(VIRTIO_CMDLINE_MAXLEN); 2660ebf007dSSergio Lopez ret = g_snprintf(cmdline, VIRTIO_CMDLINE_MAXLEN, 2670ebf007dSSergio Lopez " virtio_mmio.device=512@0x%lx:%ld", 2680ebf007dSSergio Lopez VIRTIO_MMIO_BASE + index * 512, 269d4e9d577SGerd Hoffmann virtio_irq_base + index); 2700ebf007dSSergio Lopez if (ret < 0 || ret >= VIRTIO_CMDLINE_MAXLEN) { 2710ebf007dSSergio Lopez g_free(cmdline); 2720ebf007dSSergio Lopez return NULL; 2730ebf007dSSergio Lopez } 2740ebf007dSSergio Lopez 2750ebf007dSSergio Lopez return cmdline; 2760ebf007dSSergio Lopez } 2770ebf007dSSergio Lopez 2780ebf007dSSergio Lopez static void microvm_fix_kernel_cmdline(MachineState *machine) 2790ebf007dSSergio Lopez { 2800ebf007dSSergio Lopez X86MachineState *x86ms = X86_MACHINE(machine); 
281d4e9d577SGerd Hoffmann MicrovmMachineState *mms = MICROVM_MACHINE(machine); 2820ebf007dSSergio Lopez BusState *bus; 2830ebf007dSSergio Lopez BusChild *kid; 2840ebf007dSSergio Lopez char *cmdline; 2850ebf007dSSergio Lopez 2860ebf007dSSergio Lopez /* 2870ebf007dSSergio Lopez * Find MMIO transports with attached devices, and add them to the kernel 2880ebf007dSSergio Lopez * command line. 2890ebf007dSSergio Lopez * 2900ebf007dSSergio Lopez * Yes, this is a hack, but one that heavily improves the UX without 2910ebf007dSSergio Lopez * introducing any significant issues. 2920ebf007dSSergio Lopez */ 2930ebf007dSSergio Lopez cmdline = g_strdup(machine->kernel_cmdline); 2940ebf007dSSergio Lopez bus = sysbus_get_default(); 2950ebf007dSSergio Lopez QTAILQ_FOREACH(kid, &bus->children, sibling) { 2960ebf007dSSergio Lopez DeviceState *dev = kid->child; 2970ebf007dSSergio Lopez ObjectClass *class = object_get_class(OBJECT(dev)); 2980ebf007dSSergio Lopez 2990ebf007dSSergio Lopez if (class == object_class_by_name(TYPE_VIRTIO_MMIO)) { 3000ebf007dSSergio Lopez VirtIOMMIOProxy *mmio = VIRTIO_MMIO(OBJECT(dev)); 3010ebf007dSSergio Lopez VirtioBusState *mmio_virtio_bus = &mmio->bus; 3020ebf007dSSergio Lopez BusState *mmio_bus = &mmio_virtio_bus->parent_obj; 3030ebf007dSSergio Lopez 3040ebf007dSSergio Lopez if (!QTAILQ_EMPTY(&mmio_bus->children)) { 305d4e9d577SGerd Hoffmann gchar *mmio_cmdline = microvm_get_mmio_cmdline 306d4e9d577SGerd Hoffmann (mmio_bus->name, mms->virtio_irq_base); 3070ebf007dSSergio Lopez if (mmio_cmdline) { 3080ebf007dSSergio Lopez char *newcmd = g_strjoin(NULL, cmdline, mmio_cmdline, NULL); 3090ebf007dSSergio Lopez g_free(mmio_cmdline); 3100ebf007dSSergio Lopez g_free(cmdline); 3110ebf007dSSergio Lopez cmdline = newcmd; 3120ebf007dSSergio Lopez } 3130ebf007dSSergio Lopez } 3140ebf007dSSergio Lopez } 3150ebf007dSSergio Lopez } 3160ebf007dSSergio Lopez 3170ebf007dSSergio Lopez fw_cfg_modify_i32(x86ms->fw_cfg, FW_CFG_CMDLINE_SIZE, strlen(cmdline) + 1); 
3180ebf007dSSergio Lopez fw_cfg_modify_string(x86ms->fw_cfg, FW_CFG_CMDLINE_DATA, cmdline); 319c3157b74SSergio Lopez 320c3157b74SSergio Lopez g_free(cmdline); 3210ebf007dSSergio Lopez } 3220ebf007dSSergio Lopez 323*e3ab9873SGerd Hoffmann static void microvm_device_pre_plug_cb(HotplugHandler *hotplug_dev, 324*e3ab9873SGerd Hoffmann DeviceState *dev, Error **errp) 325*e3ab9873SGerd Hoffmann { 326*e3ab9873SGerd Hoffmann x86_cpu_pre_plug(hotplug_dev, dev, errp); 327*e3ab9873SGerd Hoffmann } 328*e3ab9873SGerd Hoffmann 329*e3ab9873SGerd Hoffmann static void microvm_device_plug_cb(HotplugHandler *hotplug_dev, 330*e3ab9873SGerd Hoffmann DeviceState *dev, Error **errp) 331*e3ab9873SGerd Hoffmann { 332*e3ab9873SGerd Hoffmann x86_cpu_plug(hotplug_dev, dev, errp); 333*e3ab9873SGerd Hoffmann } 334*e3ab9873SGerd Hoffmann 335*e3ab9873SGerd Hoffmann static void microvm_device_unplug_request_cb(HotplugHandler *hotplug_dev, 336*e3ab9873SGerd Hoffmann DeviceState *dev, Error **errp) 337*e3ab9873SGerd Hoffmann { 338*e3ab9873SGerd Hoffmann error_setg(errp, "unplug not supported by microvm"); 339*e3ab9873SGerd Hoffmann } 340*e3ab9873SGerd Hoffmann 341*e3ab9873SGerd Hoffmann static void microvm_device_unplug_cb(HotplugHandler *hotplug_dev, 342*e3ab9873SGerd Hoffmann DeviceState *dev, Error **errp) 343*e3ab9873SGerd Hoffmann { 344*e3ab9873SGerd Hoffmann error_setg(errp, "unplug not supported by microvm"); 345*e3ab9873SGerd Hoffmann } 346*e3ab9873SGerd Hoffmann 347*e3ab9873SGerd Hoffmann static HotplugHandler *microvm_get_hotplug_handler(MachineState *machine, 348*e3ab9873SGerd Hoffmann DeviceState *dev) 349*e3ab9873SGerd Hoffmann { 350*e3ab9873SGerd Hoffmann if (object_dynamic_cast(OBJECT(dev), TYPE_CPU)) { 351*e3ab9873SGerd Hoffmann return HOTPLUG_HANDLER(machine); 352*e3ab9873SGerd Hoffmann } 353*e3ab9873SGerd Hoffmann return NULL; 354*e3ab9873SGerd Hoffmann } 355*e3ab9873SGerd Hoffmann 3560ebf007dSSergio Lopez static void microvm_machine_state_init(MachineState *machine) 
3570ebf007dSSergio Lopez { 3580ebf007dSSergio Lopez MicrovmMachineState *mms = MICROVM_MACHINE(machine); 3590ebf007dSSergio Lopez X86MachineState *x86ms = X86_MACHINE(machine); 3600ebf007dSSergio Lopez Error *local_err = NULL; 3610ebf007dSSergio Lopez 3620ebf007dSSergio Lopez microvm_memory_init(mms); 3630ebf007dSSergio Lopez 3640ebf007dSSergio Lopez x86_cpus_init(x86ms, CPU_VERSION_LATEST); 3650ebf007dSSergio Lopez if (local_err) { 3660ebf007dSSergio Lopez error_report_err(local_err); 3670ebf007dSSergio Lopez exit(1); 3680ebf007dSSergio Lopez } 3690ebf007dSSergio Lopez 3700ebf007dSSergio Lopez microvm_devices_init(mms); 3710ebf007dSSergio Lopez } 3720ebf007dSSergio Lopez 3730ebf007dSSergio Lopez static void microvm_machine_reset(MachineState *machine) 3740ebf007dSSergio Lopez { 3750ebf007dSSergio Lopez MicrovmMachineState *mms = MICROVM_MACHINE(machine); 3760ebf007dSSergio Lopez CPUState *cs; 3770ebf007dSSergio Lopez X86CPU *cpu; 3780ebf007dSSergio Lopez 379f6f7e2d8SGerd Hoffmann if (!x86_machine_is_acpi_enabled(X86_MACHINE(machine)) && 380f6f7e2d8SGerd Hoffmann machine->kernel_filename != NULL && 3810ebf007dSSergio Lopez mms->auto_kernel_cmdline && !mms->kernel_cmdline_fixed) { 3820ebf007dSSergio Lopez microvm_fix_kernel_cmdline(machine); 3830ebf007dSSergio Lopez mms->kernel_cmdline_fixed = true; 3840ebf007dSSergio Lopez } 3850ebf007dSSergio Lopez 3860ebf007dSSergio Lopez qemu_devices_reset(); 3870ebf007dSSergio Lopez 3880ebf007dSSergio Lopez CPU_FOREACH(cs) { 3890ebf007dSSergio Lopez cpu = X86_CPU(cs); 3900ebf007dSSergio Lopez 3910ebf007dSSergio Lopez if (cpu->apic_state) { 392f703a04cSDamien Hedde device_legacy_reset(cpu->apic_state); 3930ebf007dSSergio Lopez } 3940ebf007dSSergio Lopez } 3950ebf007dSSergio Lopez } 3960ebf007dSSergio Lopez 3970ebf007dSSergio Lopez static void microvm_machine_get_pic(Object *obj, Visitor *v, const char *name, 3980ebf007dSSergio Lopez void *opaque, Error **errp) 3990ebf007dSSergio Lopez { 4000ebf007dSSergio Lopez 
MicrovmMachineState *mms = MICROVM_MACHINE(obj); 4010ebf007dSSergio Lopez OnOffAuto pic = mms->pic; 4020ebf007dSSergio Lopez 4030ebf007dSSergio Lopez visit_type_OnOffAuto(v, name, &pic, errp); 4040ebf007dSSergio Lopez } 4050ebf007dSSergio Lopez 4060ebf007dSSergio Lopez static void microvm_machine_set_pic(Object *obj, Visitor *v, const char *name, 4070ebf007dSSergio Lopez void *opaque, Error **errp) 4080ebf007dSSergio Lopez { 4090ebf007dSSergio Lopez MicrovmMachineState *mms = MICROVM_MACHINE(obj); 4100ebf007dSSergio Lopez 4110ebf007dSSergio Lopez visit_type_OnOffAuto(v, name, &mms->pic, errp); 4120ebf007dSSergio Lopez } 4130ebf007dSSergio Lopez 4140ebf007dSSergio Lopez static void microvm_machine_get_pit(Object *obj, Visitor *v, const char *name, 4150ebf007dSSergio Lopez void *opaque, Error **errp) 4160ebf007dSSergio Lopez { 4170ebf007dSSergio Lopez MicrovmMachineState *mms = MICROVM_MACHINE(obj); 4180ebf007dSSergio Lopez OnOffAuto pit = mms->pit; 4190ebf007dSSergio Lopez 4200ebf007dSSergio Lopez visit_type_OnOffAuto(v, name, &pit, errp); 4210ebf007dSSergio Lopez } 4220ebf007dSSergio Lopez 4230ebf007dSSergio Lopez static void microvm_machine_set_pit(Object *obj, Visitor *v, const char *name, 4240ebf007dSSergio Lopez void *opaque, Error **errp) 4250ebf007dSSergio Lopez { 4260ebf007dSSergio Lopez MicrovmMachineState *mms = MICROVM_MACHINE(obj); 4270ebf007dSSergio Lopez 4280ebf007dSSergio Lopez visit_type_OnOffAuto(v, name, &mms->pit, errp); 4290ebf007dSSergio Lopez } 4300ebf007dSSergio Lopez 4310ebf007dSSergio Lopez static void microvm_machine_get_rtc(Object *obj, Visitor *v, const char *name, 4320ebf007dSSergio Lopez void *opaque, Error **errp) 4330ebf007dSSergio Lopez { 4340ebf007dSSergio Lopez MicrovmMachineState *mms = MICROVM_MACHINE(obj); 4350ebf007dSSergio Lopez OnOffAuto rtc = mms->rtc; 4360ebf007dSSergio Lopez 4370ebf007dSSergio Lopez visit_type_OnOffAuto(v, name, &rtc, errp); 4380ebf007dSSergio Lopez } 4390ebf007dSSergio Lopez 4400ebf007dSSergio Lopez 
static void microvm_machine_set_rtc(Object *obj, Visitor *v, const char *name, 4410ebf007dSSergio Lopez void *opaque, Error **errp) 4420ebf007dSSergio Lopez { 4430ebf007dSSergio Lopez MicrovmMachineState *mms = MICROVM_MACHINE(obj); 4440ebf007dSSergio Lopez 4450ebf007dSSergio Lopez visit_type_OnOffAuto(v, name, &mms->rtc, errp); 4460ebf007dSSergio Lopez } 4470ebf007dSSergio Lopez 4480ebf007dSSergio Lopez static bool microvm_machine_get_isa_serial(Object *obj, Error **errp) 4490ebf007dSSergio Lopez { 4500ebf007dSSergio Lopez MicrovmMachineState *mms = MICROVM_MACHINE(obj); 4510ebf007dSSergio Lopez 4520ebf007dSSergio Lopez return mms->isa_serial; 4530ebf007dSSergio Lopez } 4540ebf007dSSergio Lopez 4550ebf007dSSergio Lopez static void microvm_machine_set_isa_serial(Object *obj, bool value, 4560ebf007dSSergio Lopez Error **errp) 4570ebf007dSSergio Lopez { 4580ebf007dSSergio Lopez MicrovmMachineState *mms = MICROVM_MACHINE(obj); 4590ebf007dSSergio Lopez 4600ebf007dSSergio Lopez mms->isa_serial = value; 4610ebf007dSSergio Lopez } 4620ebf007dSSergio Lopez 4630ebf007dSSergio Lopez static bool microvm_machine_get_option_roms(Object *obj, Error **errp) 4640ebf007dSSergio Lopez { 4650ebf007dSSergio Lopez MicrovmMachineState *mms = MICROVM_MACHINE(obj); 4660ebf007dSSergio Lopez 4670ebf007dSSergio Lopez return mms->option_roms; 4680ebf007dSSergio Lopez } 4690ebf007dSSergio Lopez 4700ebf007dSSergio Lopez static void microvm_machine_set_option_roms(Object *obj, bool value, 4710ebf007dSSergio Lopez Error **errp) 4720ebf007dSSergio Lopez { 4730ebf007dSSergio Lopez MicrovmMachineState *mms = MICROVM_MACHINE(obj); 4740ebf007dSSergio Lopez 4750ebf007dSSergio Lopez mms->option_roms = value; 4760ebf007dSSergio Lopez } 4770ebf007dSSergio Lopez 4780ebf007dSSergio Lopez static bool microvm_machine_get_auto_kernel_cmdline(Object *obj, Error **errp) 4790ebf007dSSergio Lopez { 4800ebf007dSSergio Lopez MicrovmMachineState *mms = MICROVM_MACHINE(obj); 4810ebf007dSSergio Lopez 4820ebf007dSSergio 
Lopez return mms->auto_kernel_cmdline; 4830ebf007dSSergio Lopez } 4840ebf007dSSergio Lopez 4850ebf007dSSergio Lopez static void microvm_machine_set_auto_kernel_cmdline(Object *obj, bool value, 4860ebf007dSSergio Lopez Error **errp) 4870ebf007dSSergio Lopez { 4880ebf007dSSergio Lopez MicrovmMachineState *mms = MICROVM_MACHINE(obj); 4890ebf007dSSergio Lopez 4900ebf007dSSergio Lopez mms->auto_kernel_cmdline = value; 4910ebf007dSSergio Lopez } 4920ebf007dSSergio Lopez 4938045df14SGerd Hoffmann static void microvm_machine_done(Notifier *notifier, void *data) 4948045df14SGerd Hoffmann { 4958045df14SGerd Hoffmann MicrovmMachineState *mms = container_of(notifier, MicrovmMachineState, 4968045df14SGerd Hoffmann machine_done); 4978045df14SGerd Hoffmann 4988045df14SGerd Hoffmann acpi_setup_microvm(mms); 4998045df14SGerd Hoffmann } 5008045df14SGerd Hoffmann 5018045df14SGerd Hoffmann static void microvm_powerdown_req(Notifier *notifier, void *data) 5028045df14SGerd Hoffmann { 5038045df14SGerd Hoffmann MicrovmMachineState *mms = container_of(notifier, MicrovmMachineState, 5048045df14SGerd Hoffmann powerdown_req); 50550aef131SGerd Hoffmann X86MachineState *x86ms = X86_MACHINE(mms); 5068045df14SGerd Hoffmann 50750aef131SGerd Hoffmann if (x86ms->acpi_dev) { 50850aef131SGerd Hoffmann Object *obj = OBJECT(x86ms->acpi_dev); 5098045df14SGerd Hoffmann AcpiDeviceIfClass *adevc = ACPI_DEVICE_IF_GET_CLASS(obj); 51050aef131SGerd Hoffmann adevc->send_event(ACPI_DEVICE_IF(x86ms->acpi_dev), 51150aef131SGerd Hoffmann ACPI_POWER_DOWN_STATUS); 5128045df14SGerd Hoffmann } 5138045df14SGerd Hoffmann } 5148045df14SGerd Hoffmann 5150ebf007dSSergio Lopez static void microvm_machine_initfn(Object *obj) 5160ebf007dSSergio Lopez { 5170ebf007dSSergio Lopez MicrovmMachineState *mms = MICROVM_MACHINE(obj); 5180ebf007dSSergio Lopez 5190ebf007dSSergio Lopez /* Configuration */ 5200ebf007dSSergio Lopez mms->pic = ON_OFF_AUTO_AUTO; 5210ebf007dSSergio Lopez mms->pit = ON_OFF_AUTO_AUTO; 5220ebf007dSSergio Lopez 
mms->rtc = ON_OFF_AUTO_AUTO; 5230ebf007dSSergio Lopez mms->isa_serial = true; 5240ebf007dSSergio Lopez mms->option_roms = true; 5250ebf007dSSergio Lopez mms->auto_kernel_cmdline = true; 5260ebf007dSSergio Lopez 5270ebf007dSSergio Lopez /* State */ 5280ebf007dSSergio Lopez mms->kernel_cmdline_fixed = false; 5298045df14SGerd Hoffmann 5308045df14SGerd Hoffmann mms->machine_done.notify = microvm_machine_done; 5318045df14SGerd Hoffmann qemu_add_machine_init_done_notifier(&mms->machine_done); 5328045df14SGerd Hoffmann mms->powerdown_req.notify = microvm_powerdown_req; 5338045df14SGerd Hoffmann qemu_register_powerdown_notifier(&mms->powerdown_req); 5340ebf007dSSergio Lopez } 5350ebf007dSSergio Lopez 5360ebf007dSSergio Lopez static void microvm_class_init(ObjectClass *oc, void *data) 5370ebf007dSSergio Lopez { 5380ebf007dSSergio Lopez MachineClass *mc = MACHINE_CLASS(oc); 539*e3ab9873SGerd Hoffmann HotplugHandlerClass *hc = HOTPLUG_HANDLER_CLASS(oc); 5400ebf007dSSergio Lopez 5410ebf007dSSergio Lopez mc->init = microvm_machine_state_init; 5420ebf007dSSergio Lopez 5430ebf007dSSergio Lopez mc->family = "microvm_i386"; 5440ebf007dSSergio Lopez mc->desc = "microvm (i386)"; 5450ebf007dSSergio Lopez mc->units_per_default_bus = 1; 5460ebf007dSSergio Lopez mc->no_floppy = 1; 5470ebf007dSSergio Lopez mc->max_cpus = 288; 5480ebf007dSSergio Lopez mc->has_hotpluggable_cpus = false; 5490ebf007dSSergio Lopez mc->auto_enable_numa_with_memhp = false; 550195784a0SDavid Hildenbrand mc->auto_enable_numa_with_memdev = false; 5510ebf007dSSergio Lopez mc->default_cpu_type = TARGET_DEFAULT_CPU_TYPE; 5520ebf007dSSergio Lopez mc->nvdimm_supported = false; 5539ad54686SIgor Mammedov mc->default_ram_id = "microvm.ram"; 5540ebf007dSSergio Lopez 5550ebf007dSSergio Lopez /* Avoid relying too much on kernel components */ 5560ebf007dSSergio Lopez mc->default_kernel_irqchip_split = true; 5570ebf007dSSergio Lopez 5580ebf007dSSergio Lopez /* Machine class handlers */ 5590ebf007dSSergio Lopez mc->reset = 
microvm_machine_reset; 5600ebf007dSSergio Lopez 561*e3ab9873SGerd Hoffmann /* hotplug (for cpu coldplug) */ 562*e3ab9873SGerd Hoffmann mc->get_hotplug_handler = microvm_get_hotplug_handler; 563*e3ab9873SGerd Hoffmann hc->pre_plug = microvm_device_pre_plug_cb; 564*e3ab9873SGerd Hoffmann hc->plug = microvm_device_plug_cb; 565*e3ab9873SGerd Hoffmann hc->unplug_request = microvm_device_unplug_request_cb; 566*e3ab9873SGerd Hoffmann hc->unplug = microvm_device_unplug_cb; 567*e3ab9873SGerd Hoffmann 5680ebf007dSSergio Lopez object_class_property_add(oc, MICROVM_MACHINE_PIC, "OnOffAuto", 5690ebf007dSSergio Lopez microvm_machine_get_pic, 5700ebf007dSSergio Lopez microvm_machine_set_pic, 571d2623129SMarkus Armbruster NULL, NULL); 5720ebf007dSSergio Lopez object_class_property_set_description(oc, MICROVM_MACHINE_PIC, 5737eecec7dSMarkus Armbruster "Enable i8259 PIC"); 5740ebf007dSSergio Lopez 5750ebf007dSSergio Lopez object_class_property_add(oc, MICROVM_MACHINE_PIT, "OnOffAuto", 5760ebf007dSSergio Lopez microvm_machine_get_pit, 5770ebf007dSSergio Lopez microvm_machine_set_pit, 578d2623129SMarkus Armbruster NULL, NULL); 5790ebf007dSSergio Lopez object_class_property_set_description(oc, MICROVM_MACHINE_PIT, 5807eecec7dSMarkus Armbruster "Enable i8254 PIT"); 5810ebf007dSSergio Lopez 5820ebf007dSSergio Lopez object_class_property_add(oc, MICROVM_MACHINE_RTC, "OnOffAuto", 5830ebf007dSSergio Lopez microvm_machine_get_rtc, 5840ebf007dSSergio Lopez microvm_machine_set_rtc, 585d2623129SMarkus Armbruster NULL, NULL); 5860ebf007dSSergio Lopez object_class_property_set_description(oc, MICROVM_MACHINE_RTC, 5877eecec7dSMarkus Armbruster "Enable MC146818 RTC"); 5880ebf007dSSergio Lopez 5890ebf007dSSergio Lopez object_class_property_add_bool(oc, MICROVM_MACHINE_ISA_SERIAL, 5900ebf007dSSergio Lopez microvm_machine_get_isa_serial, 591d2623129SMarkus Armbruster microvm_machine_set_isa_serial); 5920ebf007dSSergio Lopez object_class_property_set_description(oc, MICROVM_MACHINE_ISA_SERIAL, 
5937eecec7dSMarkus Armbruster "Set off to disable the instantiation an ISA serial port"); 5940ebf007dSSergio Lopez 5950ebf007dSSergio Lopez object_class_property_add_bool(oc, MICROVM_MACHINE_OPTION_ROMS, 5960ebf007dSSergio Lopez microvm_machine_get_option_roms, 597d2623129SMarkus Armbruster microvm_machine_set_option_roms); 5980ebf007dSSergio Lopez object_class_property_set_description(oc, MICROVM_MACHINE_OPTION_ROMS, 5997eecec7dSMarkus Armbruster "Set off to disable loading option ROMs"); 6000ebf007dSSergio Lopez 6010ebf007dSSergio Lopez object_class_property_add_bool(oc, MICROVM_MACHINE_AUTO_KERNEL_CMDLINE, 6020ebf007dSSergio Lopez microvm_machine_get_auto_kernel_cmdline, 603d2623129SMarkus Armbruster microvm_machine_set_auto_kernel_cmdline); 6040ebf007dSSergio Lopez object_class_property_set_description(oc, 6050ebf007dSSergio Lopez MICROVM_MACHINE_AUTO_KERNEL_CMDLINE, 6067eecec7dSMarkus Armbruster "Set off to disable adding virtio-mmio devices to the kernel cmdline"); 6070ebf007dSSergio Lopez } 6080ebf007dSSergio Lopez 6090ebf007dSSergio Lopez static const TypeInfo microvm_machine_info = { 6100ebf007dSSergio Lopez .name = TYPE_MICROVM_MACHINE, 6110ebf007dSSergio Lopez .parent = TYPE_X86_MACHINE, 6120ebf007dSSergio Lopez .instance_size = sizeof(MicrovmMachineState), 6130ebf007dSSergio Lopez .instance_init = microvm_machine_initfn, 6140ebf007dSSergio Lopez .class_size = sizeof(MicrovmMachineClass), 6150ebf007dSSergio Lopez .class_init = microvm_class_init, 6160ebf007dSSergio Lopez .interfaces = (InterfaceInfo[]) { 617*e3ab9873SGerd Hoffmann { TYPE_HOTPLUG_HANDLER }, 6180ebf007dSSergio Lopez { } 6190ebf007dSSergio Lopez }, 6200ebf007dSSergio Lopez }; 6210ebf007dSSergio Lopez 6220ebf007dSSergio Lopez static void microvm_machine_init(void) 6230ebf007dSSergio Lopez { 6240ebf007dSSergio Lopez type_register_static(µvm_machine_info); 6250ebf007dSSergio Lopez } 6260ebf007dSSergio Lopez type_init(microvm_machine_init); 627