// Paravirtualization support. // // Copyright (C) 2013 Kevin O'Connor // Copyright (C) 2009 Red Hat Inc. // // Authors: // Gleb Natapov // // This file may be distributed under the terms of the GNU LGPLv3 license. #include "byteorder.h" // be32_to_cpu #include "config.h" // CONFIG_QEMU #include "e820map.h" // e820_add #include "hw/pci.h" // create_pirtable #include "hw/pci_regs.h" // PCI_DEVICE_ID #include "hw/rtc.h" // CMOS_* #include "malloc.h" // malloc_tmp #include "output.h" // dprintf #include "paravirt.h" // qemu_cfg_preinit #include "romfile.h" // romfile_loadint #include "romfile_loader.h" // romfile_loader_execute #include "string.h" // memset #include "util.h" // pci_setup #include "x86.h" // cpuid #include "xen.h" // xen_biostable_setup #include "stacks.h" // yield // Amount of continuous ram under 4Gig u32 RamSize; // Amount of continuous ram >4Gig u64 RamSizeOver4G; // Type of emulator platform. int PlatformRunningOn VARFSEG; // cfg_dma enabled int cfg_dma_enabled = 0; inline int qemu_cfg_dma_enabled(void) { return cfg_dma_enabled; } /* This CPUID returns the signature 'KVMKVMKVM' in ebx, ecx, and edx. It * should be used to determine that a VM is running under KVM. */ #define KVM_CPUID_SIGNATURE 0x40000000 static void kvm_detect(void) { unsigned int eax, ebx, ecx, edx; char signature[13]; cpuid(KVM_CPUID_SIGNATURE, &eax, &ebx, &ecx, &edx); memcpy(signature + 0, &ebx, 4); memcpy(signature + 4, &ecx, 4); memcpy(signature + 8, &edx, 4); signature[12] = 0; if (strcmp(signature, "KVMKVMKVM") == 0) { dprintf(1, "Running on KVM\n"); PlatformRunningOn |= PF_KVM; } } static void qemu_detect(void) { if (!CONFIG_QEMU_HARDWARE) return; // check northbridge @ 00:00.0 u16 v = pci_config_readw(0, PCI_VENDOR_ID); if (v == 0x0000 || v == 0xffff) return; u16 d = pci_config_readw(0, PCI_DEVICE_ID); u16 sv = pci_config_readw(0, PCI_SUBSYSTEM_VENDOR_ID); u16 sd = pci_config_readw(0, PCI_SUBSYSTEM_ID); if (sv != 0x1af4 || /* Red Hat, Inc */ sd != 0x1100) /* Qemu virtual machine */ return; PlatformRunningOn |= PF_QEMU; switch (d) { case 0x1237: dprintf(1, "Running on QEMU (i440fx)\n"); break; case 0x29c0: dprintf(1, "Running on QEMU (q35)\n"); break; default: dprintf(1, "Running on QEMU (unknown nb: %04x:%04x)\n", v, d); break; } kvm_detect(); } void qemu_preinit(void) { qemu_detect(); if (!CONFIG_QEMU) return; if (runningOnXen()) { xen_ramsize_preinit(); return; } if (!runningOnQEMU()) { dprintf(1, "Warning: No QEMU Northbridge found (isapc?)\n"); PlatformRunningOn |= PF_QEMU; kvm_detect(); } // On emulators, get memory size from nvram. u32 rs = ((rtc_read(CMOS_MEM_EXTMEM2_LOW) << 16) | (rtc_read(CMOS_MEM_EXTMEM2_HIGH) << 24)); if (rs) rs += 16 * 1024 * 1024; else rs = (((rtc_read(CMOS_MEM_EXTMEM_LOW) << 10) | (rtc_read(CMOS_MEM_EXTMEM_HIGH) << 18)) + 1 * 1024 * 1024); RamSize = rs; e820_add(0, rs, E820_RAM); /* reserve 256KB BIOS area at the end of 4 GB */ e820_add(0xfffc0000, 256*1024, E820_RESERVED); dprintf(1, "RamSize: 0x%08x [cmos]\n", RamSize); } void qemu_platform_setup(void) { if (!CONFIG_QEMU) return; if (runningOnXen()) { pci_probe_devices(); xen_hypercall_setup(); xen_biostable_setup(); return; } // Initialize pci pci_setup(); smm_device_setup(); smm_setup(); // Initialize mtrr and smp mtrr_setup(); smp_setup(); // Create bios tables pirtable_setup(); mptable_setup(); smbios_setup(); if (CONFIG_FW_ROMFILE_LOAD) { int loader_err; dprintf(3, "load ACPI tables\n"); loader_err = romfile_loader_execute("etc/table-loader"); RsdpAddr = find_acpi_rsdp(); if (RsdpAddr) return; /* If present, loader should have installed an RSDP. * Not installed? We might still be able to continue * using the builtin RSDP. */ if (!loader_err) warn_internalerror(); } acpi_setup(); } /**************************************************************** * QEMU firmware config (fw_cfg) interface ****************************************************************/ // List of QEMU fw_cfg entries. DO NOT ADD MORE. (All new content // should be passed via the fw_cfg "file" interface.) #define QEMU_CFG_SIGNATURE 0x00 #define QEMU_CFG_ID 0x01 #define QEMU_CFG_UUID 0x02 #define QEMU_CFG_NUMA 0x0d #define QEMU_CFG_BOOT_MENU 0x0e #define QEMU_CFG_MAX_CPUS 0x0f #define QEMU_CFG_FILE_DIR 0x19 #define QEMU_CFG_ARCH_LOCAL 0x8000 #define QEMU_CFG_ACPI_TABLES (QEMU_CFG_ARCH_LOCAL + 0) #define QEMU_CFG_SMBIOS_ENTRIES (QEMU_CFG_ARCH_LOCAL + 1) #define QEMU_CFG_IRQ0_OVERRIDE (QEMU_CFG_ARCH_LOCAL + 2) #define QEMU_CFG_E820_TABLE (QEMU_CFG_ARCH_LOCAL + 3) static void qemu_cfg_select(u16 f) { outw(f, PORT_QEMU_CFG_CTL); } static void qemu_cfg_dma_transfer(void *address, u32 length, u32 control) { QemuCfgDmaAccess access; access.address = cpu_to_be64((u64)(u32)address); access.length = cpu_to_be32(length); access.control = cpu_to_be32(control); barrier(); outl(cpu_to_be32((u32)&access), PORT_QEMU_CFG_DMA_ADDR_LOW); while(be32_to_cpu(access.control) & ~QEMU_CFG_DMA_CTL_ERROR) { yield(); } } static void qemu_cfg_read(void *buf, int len) { if (len == 0) { return; } if (qemu_cfg_dma_enabled()) { qemu_cfg_dma_transfer(buf, len, QEMU_CFG_DMA_CTL_READ); } else { insb(PORT_QEMU_CFG_DATA, buf, len); } } static void qemu_cfg_skip(int len) { if (len == 0) { return; } if (qemu_cfg_dma_enabled()) { qemu_cfg_dma_transfer(0, len, QEMU_CFG_DMA_CTL_SKIP); } else { while (len--) inb(PORT_QEMU_CFG_DATA); } } static void qemu_cfg_read_entry(void *buf, int e, int len) { if (qemu_cfg_dma_enabled()) { u32 control = (e << 16) | QEMU_CFG_DMA_CTL_SELECT | QEMU_CFG_DMA_CTL_READ; qemu_cfg_dma_transfer(buf, len, control); } else { qemu_cfg_select(e); qemu_cfg_read(buf, len); } } struct qemu_romfile_s { struct romfile_s file; int select, skip; }; static int qemu_cfg_read_file(struct romfile_s *file, void *dst, u32 maxlen) { if (file->size > maxlen) return -1; struct qemu_romfile_s *qfile; qfile = container_of(file, struct qemu_romfile_s, file); if (qfile->skip == 0) { /* Do it in one transfer */ qemu_cfg_read_entry(dst, qfile->select, file->size); } else { qemu_cfg_select(qfile->select); qemu_cfg_skip(qfile->skip); qemu_cfg_read(dst, file->size); } return file->size; } static void qemu_romfile_add(char *name, int select, int skip, int size) { struct qemu_romfile_s *qfile = malloc_tmp(sizeof(*qfile)); if (!qfile) { warn_noalloc(); return; } memset(qfile, 0, sizeof(*qfile)); strtcpy(qfile->file.name, name, sizeof(qfile->file.name)); qfile->file.size = size; qfile->select = select; qfile->skip = skip; qfile->file.copy = qemu_cfg_read_file; romfile_add(&qfile->file); } struct e820_reservation { u64 address; u64 length; u32 type; }; #define SMBIOS_FIELD_ENTRY 0 #define SMBIOS_TABLE_ENTRY 1 struct qemu_smbios_header { u16 length; u8 headertype; u8 tabletype; u16 fieldoffset; } PACKED; static void qemu_cfg_e820(void) { struct e820_reservation *table; int i, size; if (!CONFIG_QEMU) return; // "etc/e820" has both ram and reservations table = romfile_loadfile("etc/e820", &size); if (table) { for (i = 0; i < size / sizeof(struct e820_reservation); i++) { switch (table[i].type) { case E820_RAM: dprintf(1, "RamBlock: addr 0x%016llx len 0x%016llx [e820]\n", table[i].address, table[i].length); if (table[i].address < RamSize) // ignore, preinit got it from cmos already and // adding this again would ruin any reservations // done so far continue; if (table[i].address < 0x100000000LL) { // below 4g -- adjust RamSize to mark highest lowram addr if (RamSize < table[i].address + table[i].length) RamSize = table[i].address + table[i].length; } else { // above 4g -- adjust RamSizeOver4G to mark highest ram addr if (0x100000000LL + RamSizeOver4G < table[i].address + table[i].length) RamSizeOver4G = table[i].address + table[i].length - 0x100000000LL; } /* fall through */ case E820_RESERVED: e820_add(table[i].address, table[i].length, table[i].type); break; default: /* * Qemu 1.7 uses RAM + RESERVED only. Ignore * everything else, so we have the option to * extend this in the future without breakage. */ break; } } return; } // QEMU_CFG_E820_TABLE has reservations only u32 count32; qemu_cfg_read_entry(&count32, QEMU_CFG_E820_TABLE, sizeof(count32)); if (count32) { struct e820_reservation entry; int i; for (i = 0; i < count32; i++) { qemu_cfg_read(&entry, sizeof(entry)); e820_add(entry.address, entry.length, entry.type); } } else if (runningOnKVM()) { // Backwards compatibility - provide hard coded range. // 4 pages before the bios, 3 pages for vmx tss pages, the // other page for EPT real mode pagetable e820_add(0xfffbc000, 4*4096, E820_RESERVED); } // Check for memory over 4Gig in cmos u64 high = ((rtc_read(CMOS_MEM_HIGHMEM_LOW) << 16) | ((u32)rtc_read(CMOS_MEM_HIGHMEM_MID) << 24) | ((u64)rtc_read(CMOS_MEM_HIGHMEM_HIGH) << 32)); RamSizeOver4G = high; e820_add(0x100000000ull, high, E820_RAM); dprintf(1, "RamSizeOver4G: 0x%016llx [cmos]\n", RamSizeOver4G); } // Populate romfile entries for legacy fw_cfg ports (that predate the // "file" interface). static void qemu_cfg_legacy(void) { if (!CONFIG_QEMU) return; // Misc config items. qemu_romfile_add("etc/show-boot-menu", QEMU_CFG_BOOT_MENU, 0, 2); qemu_romfile_add("etc/irq0-override", QEMU_CFG_IRQ0_OVERRIDE, 0, 1); qemu_romfile_add("etc/max-cpus", QEMU_CFG_MAX_CPUS, 0, 2); // NUMA data u64 numacount; qemu_cfg_read_entry(&numacount, QEMU_CFG_NUMA, sizeof(numacount)); int max_cpu = romfile_loadint("etc/max-cpus", 0); qemu_romfile_add("etc/numa-cpu-map", QEMU_CFG_NUMA, sizeof(numacount) , max_cpu*sizeof(u64)); qemu_romfile_add("etc/numa-nodes", QEMU_CFG_NUMA , sizeof(numacount) + max_cpu*sizeof(u64) , numacount*sizeof(u64)); // ACPI tables char name[128]; u16 cnt; qemu_cfg_read_entry(&cnt, QEMU_CFG_ACPI_TABLES, sizeof(cnt)); int i, offset = sizeof(cnt); for (i = 0; i < cnt; i++) { u16 len; qemu_cfg_read(&len, sizeof(len)); offset += sizeof(len); snprintf(name, sizeof(name), "acpi/table%d", i); qemu_romfile_add(name, QEMU_CFG_ACPI_TABLES, offset, len); qemu_cfg_skip(len); offset += len; } // SMBIOS info qemu_cfg_read_entry(&cnt, QEMU_CFG_SMBIOS_ENTRIES, sizeof(cnt)); offset = sizeof(cnt); for (i = 0; i < cnt; i++) { struct qemu_smbios_header header; qemu_cfg_read(&header, sizeof(header)); if (header.headertype == SMBIOS_FIELD_ENTRY) { snprintf(name, sizeof(name), "smbios/field%d-%d" , header.tabletype, header.fieldoffset); qemu_romfile_add(name, QEMU_CFG_SMBIOS_ENTRIES , offset + sizeof(header) , header.length - sizeof(header)); } else { snprintf(name, sizeof(name), "smbios/table%d-%d" , header.tabletype, i); qemu_romfile_add(name, QEMU_CFG_SMBIOS_ENTRIES , offset + 3, header.length - 3); } qemu_cfg_skip(header.length - sizeof(header)); offset += header.length; } } struct QemuCfgFile { u32 size; /* file size */ u16 select; /* write this to 0x510 to read it */ u16 reserved; char name[56]; }; void qemu_cfg_init(void) { if (!runningOnQEMU()) return; // Detect fw_cfg interface. qemu_cfg_select(QEMU_CFG_SIGNATURE); char *sig = "QEMU"; int i; for (i = 0; i < 4; i++) if (inb(PORT_QEMU_CFG_DATA) != sig[i]) return; dprintf(1, "Found QEMU fw_cfg\n"); // Detect DMA interface. u32 id; qemu_cfg_read_entry(&id, QEMU_CFG_ID, sizeof(id)); if (id & QEMU_CFG_VERSION_DMA) { dprintf(1, "QEMU fw_cfg DMA interface supported\n"); cfg_dma_enabled = 1; } // Populate romfiles for legacy fw_cfg entries qemu_cfg_legacy(); // Load files found in the fw_cfg file directory u32 count; qemu_cfg_read_entry(&count, QEMU_CFG_FILE_DIR, sizeof(count)); count = be32_to_cpu(count); u32 e; for (e = 0; e < count; e++) { struct QemuCfgFile qfile; qemu_cfg_read(&qfile, sizeof(qfile)); qemu_romfile_add(qfile.name, be16_to_cpu(qfile.select) , 0, be32_to_cpu(qfile.size)); } qemu_cfg_e820(); if (romfile_find("etc/table-loader")) { acpi_pm_base = 0x0600; dprintf(1, "Moving pm_base to 0x%x\n", acpi_pm_base); } }