aboutsummaryrefslogtreecommitdiff
path: root/jslinux-2019-12-21/tinyemu-2019-12-21/x86_machine.c
diff options
context:
space:
mode:
Diffstat (limited to 'jslinux-2019-12-21/tinyemu-2019-12-21/x86_machine.c')
-rw-r--r--jslinux-2019-12-21/tinyemu-2019-12-21/x86_machine.c2569
1 files changed, 2569 insertions, 0 deletions
diff --git a/jslinux-2019-12-21/tinyemu-2019-12-21/x86_machine.c b/jslinux-2019-12-21/tinyemu-2019-12-21/x86_machine.c
new file mode 100644
index 0000000..db8f6bb
--- /dev/null
+++ b/jslinux-2019-12-21/tinyemu-2019-12-21/x86_machine.c
@@ -0,0 +1,2569 @@
+/*
+ * PC emulator
+ *
+ * Copyright (c) 2011-2017 Fabrice Bellard
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a copy
+ * of this software and associated documentation files (the "Software"), to deal
+ * in the Software without restriction, including without limitation the rights
+ * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+ * copies of the Software, and to permit persons to whom the Software is
+ * furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+ * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
+ * THE SOFTWARE.
+ */
+#include <stdlib.h>
+#include <stdio.h>
+#include <stdarg.h>
+#include <string.h>
+#include <inttypes.h>
+#include <assert.h>
+#include <fcntl.h>
+#include <errno.h>
+#include <unistd.h>
+#include <time.h>
+#include <sys/time.h>
+
+#include "cutils.h"
+#include "iomem.h"
+#include "virtio.h"
+#include "x86_cpu.h"
+#include "machine.h"
+#include "pci.h"
+#include "ide.h"
+#include "ps2.h"
+
+#if defined(__linux__) && (defined(__i386__) || defined(__x86_64__))
+#define USE_KVM
+#endif
+
+#ifdef USE_KVM
+#include <linux/kvm.h>
+#include <sys/mman.h>
+#include <sys/ioctl.h>
+#include <signal.h>
+#include <sys/time.h>
+#endif
+
+//#define DEBUG_BIOS
+//#define DUMP_IOPORT
+
+/***********************************************************/
+/* cmos emulation */
+
+//#define DEBUG_CMOS
+
+#define RTC_SECONDS 0
+#define RTC_SECONDS_ALARM 1
+#define RTC_MINUTES 2
+#define RTC_MINUTES_ALARM 3
+#define RTC_HOURS 4
+#define RTC_HOURS_ALARM 5
+#define RTC_ALARM_DONT_CARE 0xC0
+
+#define RTC_DAY_OF_WEEK 6
+#define RTC_DAY_OF_MONTH 7
+#define RTC_MONTH 8
+#define RTC_YEAR 9
+
+#define RTC_REG_A 10
+#define RTC_REG_B 11
+#define RTC_REG_C 12
+#define RTC_REG_D 13
+
+#define REG_A_UIP 0x80
+
+#define REG_B_SET 0x80
+#define REG_B_PIE 0x40
+#define REG_B_AIE 0x20
+#define REG_B_UIE 0x10
+
+typedef struct {
+ uint8_t cmos_index;
+ uint8_t cmos_data[128];
+ IRQSignal *irq;
+ BOOL use_local_time;
+ /* used for the periodic irq */
+ uint32_t irq_timeout;
+ uint32_t irq_period;
+} CMOSState;
+
+static void cmos_write(void *opaque, uint32_t offset,
+ uint32_t data, int size_log2);
+static uint32_t cmos_read(void *opaque, uint32_t offset, int size_log2);
+
+static int to_bcd(CMOSState *s, unsigned int a)
+{
+ if (s->cmos_data[RTC_REG_B] & 0x04) {
+ return a;
+ } else {
+ return ((a / 10) << 4) | (a % 10);
+ }
+}
+
+static void cmos_update_time(CMOSState *s, BOOL set_century)
+{
+ struct timeval tv;
+ struct tm tm;
+ time_t ti;
+ int val;
+
+ gettimeofday(&tv, NULL);
+ ti = tv.tv_sec;
+ if (s->use_local_time) {
+ localtime_r(&ti, &tm);
+ } else {
+ gmtime_r(&ti, &tm);
+ }
+
+ s->cmos_data[RTC_SECONDS] = to_bcd(s, tm.tm_sec);
+ s->cmos_data[RTC_MINUTES] = to_bcd(s, tm.tm_min);
+ if (s->cmos_data[RTC_REG_B] & 0x02) {
+ s->cmos_data[RTC_HOURS] = to_bcd(s, tm.tm_hour);
+ } else {
+ s->cmos_data[RTC_HOURS] = to_bcd(s, tm.tm_hour % 12);
+ if (tm.tm_hour >= 12)
+ s->cmos_data[RTC_HOURS] |= 0x80;
+ }
+ s->cmos_data[RTC_DAY_OF_WEEK] = to_bcd(s, tm.tm_wday);
+ s->cmos_data[RTC_DAY_OF_MONTH] = to_bcd(s, tm.tm_mday);
+ s->cmos_data[RTC_MONTH] = to_bcd(s, tm.tm_mon + 1);
+ s->cmos_data[RTC_YEAR] = to_bcd(s, tm.tm_year % 100);
+
+ if (set_century) {
+ /* not set by the hardware, but easier to do it here */
+ val = to_bcd(s, (tm.tm_year / 100) + 19);
+ s->cmos_data[0x32] = val;
+ s->cmos_data[0x37] = val;
+ }
+
+ /* update in progress flag: 8/32768 seconds after change */
+ if (tv.tv_usec < 244) {
+ s->cmos_data[RTC_REG_A] |= REG_A_UIP;
+ } else {
+ s->cmos_data[RTC_REG_A] &= ~REG_A_UIP;
+ }
+}
+
+CMOSState *cmos_init(PhysMemoryMap *port_map, int addr,
+ IRQSignal *irq, BOOL use_local_time)
+{
+ CMOSState *s;
+
+ s = mallocz(sizeof(*s));
+ s->use_local_time = use_local_time;
+
+ s->cmos_index = 0;
+
+ s->cmos_data[RTC_REG_A] = 0x26;
+ s->cmos_data[RTC_REG_B] = 0x02;
+ s->cmos_data[RTC_REG_C] = 0x00;
+ s->cmos_data[RTC_REG_D] = 0x80;
+
+ cmos_update_time(s, TRUE);
+
+ s->irq = irq;
+
+ cpu_register_device(port_map, addr, 2, s, cmos_read, cmos_write,
+ DEVIO_SIZE8);
+ return s;
+}
+
+#define CMOS_FREQ 32768
+
+static uint32_t cmos_get_timer(CMOSState *s)
+{
+ struct timespec ts;
+
+ clock_gettime(CLOCK_MONOTONIC, &ts);
+ return (uint32_t)ts.tv_sec * CMOS_FREQ +
+ ((uint64_t)ts.tv_nsec * CMOS_FREQ / 1000000000);
+}
+
+static void cmos_update_timer(CMOSState *s)
+{
+ int period_code;
+
+ period_code = s->cmos_data[RTC_REG_A] & 0x0f;
+ if ((s->cmos_data[RTC_REG_B] & REG_B_PIE) &&
+ period_code != 0) {
+ if (period_code <= 2)
+ period_code += 7;
+ s->irq_period = 1 << (period_code - 1);
+ s->irq_timeout = (cmos_get_timer(s) + s->irq_period) &
+ ~(s->irq_period - 1);
+ }
+}
+
+/* XXX: could return a delay, but we don't need high precision
+ (Windows 2000 uses it for delay calibration) */
+static void cmos_update_irq(CMOSState *s)
+{
+ uint32_t d;
+ if (s->cmos_data[RTC_REG_B] & REG_B_PIE) {
+ d = cmos_get_timer(s) - s->irq_timeout;
+ if ((int32_t)d >= 0) {
+ /* this is not what the real RTC does. Here we sent the IRQ
+ immediately */
+ s->cmos_data[RTC_REG_C] |= 0xc0;
+ set_irq(s->irq, 1);
+ /* update for the next irq */
+ s->irq_timeout += s->irq_period;
+ }
+ }
+}
+
+static void cmos_write(void *opaque, uint32_t offset,
+ uint32_t data, int size_log2)
+{
+ CMOSState *s = opaque;
+
+ if (offset == 0) {
+ s->cmos_index = data & 0x7f;
+ } else {
+#ifdef DEBUG_CMOS
+ printf("cmos_write: reg=0x%02x val=0x%02x\n", s->cmos_index, data);
+#endif
+ switch(s->cmos_index) {
+ case RTC_REG_A:
+ s->cmos_data[RTC_REG_A] = (data & ~REG_A_UIP) |
+ (s->cmos_data[RTC_REG_A] & REG_A_UIP);
+ cmos_update_timer(s);
+ break;
+ case RTC_REG_B:
+ s->cmos_data[s->cmos_index] = data;
+ cmos_update_timer(s);
+ break;
+ default:
+ s->cmos_data[s->cmos_index] = data;
+ break;
+ }
+ }
+}
+
+static uint32_t cmos_read(void *opaque, uint32_t offset, int size_log2)
+{
+ CMOSState *s = opaque;
+ int ret;
+
+ if (offset == 0) {
+ return 0xff;
+ } else {
+ switch(s->cmos_index) {
+ case RTC_SECONDS:
+ case RTC_MINUTES:
+ case RTC_HOURS:
+ case RTC_DAY_OF_WEEK:
+ case RTC_DAY_OF_MONTH:
+ case RTC_MONTH:
+ case RTC_YEAR:
+ case RTC_REG_A:
+ cmos_update_time(s, FALSE);
+ ret = s->cmos_data[s->cmos_index];
+ break;
+ case RTC_REG_C:
+ ret = s->cmos_data[s->cmos_index];
+ s->cmos_data[RTC_REG_C] = 0x00;
+ set_irq(s->irq, 0);
+ break;
+ default:
+ ret = s->cmos_data[s->cmos_index];
+ }
+#ifdef DEBUG_CMOS
+ printf("cmos_read: reg=0x%02x val=0x%02x\n", s->cmos_index, ret);
+#endif
+ return ret;
+ }
+}
+
+/***********************************************************/
+/* 8259 pic emulation */
+
+//#define DEBUG_PIC
+
+typedef void PICUpdateIRQFunc(void *opaque);
+
+typedef struct {
+ uint8_t last_irr; /* edge detection */
+ uint8_t irr; /* interrupt request register */
+ uint8_t imr; /* interrupt mask register */
+ uint8_t isr; /* interrupt service register */
+ uint8_t priority_add; /* used to compute irq priority */
+ uint8_t irq_base;
+ uint8_t read_reg_select;
+ uint8_t special_mask;
+ uint8_t init_state;
+ uint8_t auto_eoi;
+ uint8_t rotate_on_autoeoi;
+ uint8_t init4; /* true if 4 byte init */
+ uint8_t elcr; /* PIIX edge/trigger selection*/
+ uint8_t elcr_mask;
+ PICUpdateIRQFunc *update_irq;
+ void *opaque;
+} PICState;
+
+static void pic_reset(PICState *s);
+static void pic_write(void *opaque, uint32_t offset,
+ uint32_t val, int size_log2);
+static uint32_t pic_read(void *opaque, uint32_t offset, int size_log2);
+static void pic_elcr_write(void *opaque, uint32_t offset,
+ uint32_t val, int size_log2);
+static uint32_t pic_elcr_read(void *opaque, uint32_t offset, int size_log2);
+
+PICState *pic_init(PhysMemoryMap *port_map, int port, int elcr_port,
+ int elcr_mask,
+ PICUpdateIRQFunc *update_irq, void *opaque)
+{
+ PICState *s;
+
+ s = mallocz(sizeof(*s));
+ s->elcr_mask = elcr_mask;
+ s->update_irq = update_irq;
+ s->opaque = opaque;
+ cpu_register_device(port_map, port, 2, s,
+ pic_read, pic_write, DEVIO_SIZE8);
+ cpu_register_device(port_map, elcr_port, 1, s,
+ pic_elcr_read, pic_elcr_write, DEVIO_SIZE8);
+ pic_reset(s);
+ return s;
+}
+
+static void pic_reset(PICState *s)
+{
+ /* all 8 bit registers */
+ s->last_irr = 0; /* edge detection */
+ s->irr = 0; /* interrupt request register */
+ s->imr = 0; /* interrupt mask register */
+ s->isr = 0; /* interrupt service register */
+ s->priority_add = 0; /* used to compute irq priority */
+ s->irq_base = 0;
+ s->read_reg_select = 0;
+ s->special_mask = 0;
+ s->init_state = 0;
+ s->auto_eoi = 0;
+ s->rotate_on_autoeoi = 0;
+ s->init4 = 0; /* true if 4 byte init */
+}
+
+/* set irq level. If an edge is detected, then the IRR is set to 1 */
+static void pic_set_irq1(PICState *s, int irq, int level)
+{
+ int mask;
+ mask = 1 << irq;
+ if (s->elcr & mask) {
+ /* level triggered */
+ if (level) {
+ s->irr |= mask;
+ s->last_irr |= mask;
+ } else {
+ s->irr &= ~mask;
+ s->last_irr &= ~mask;
+ }
+ } else {
+ /* edge triggered */
+ if (level) {
+ if ((s->last_irr & mask) == 0)
+ s->irr |= mask;
+ s->last_irr |= mask;
+ } else {
+ s->last_irr &= ~mask;
+ }
+ }
+}
+
+static int pic_get_priority(PICState *s, int mask)
+{
+ int priority;
+ if (mask == 0)
+ return -1;
+ priority = 7;
+ while ((mask & (1 << ((priority + s->priority_add) & 7))) == 0)
+ priority--;
+ return priority;
+}
+
+/* return the pic wanted interrupt. return -1 if none */
+static int pic_get_irq(PICState *s)
+{
+ int mask, cur_priority, priority;
+
+ mask = s->irr & ~s->imr;
+ priority = pic_get_priority(s, mask);
+ if (priority < 0)
+ return -1;
+ /* compute current priority */
+ cur_priority = pic_get_priority(s, s->isr);
+ if (priority > cur_priority) {
+ /* higher priority found: an irq should be generated */
+ return priority;
+ } else {
+ return -1;
+ }
+}
+
+/* acknowledge interrupt 'irq' */
+static void pic_intack(PICState *s, int irq)
+{
+ if (s->auto_eoi) {
+ if (s->rotate_on_autoeoi)
+ s->priority_add = (irq + 1) & 7;
+ } else {
+ s->isr |= (1 << irq);
+ }
+ /* We don't clear a level sensitive interrupt here */
+ if (!(s->elcr & (1 << irq)))
+ s->irr &= ~(1 << irq);
+}
+
+static void pic_write(void *opaque, uint32_t offset,
+ uint32_t val, int size_log2)
+{
+ PICState *s = opaque;
+ int priority, addr;
+
+ addr = offset & 1;
+#ifdef DEBUG_PIC
+ console.log("pic_write: addr=" + toHex2(addr) + " val=" + toHex2(val));
+#endif
+ if (addr == 0) {
+ if (val & 0x10) {
+ /* init */
+ pic_reset(s);
+ s->init_state = 1;
+ s->init4 = val & 1;
+ if (val & 0x02)
+ abort(); /* "single mode not supported" */
+ if (val & 0x08)
+ abort(); /* "level sensitive irq not supported" */
+ } else if (val & 0x08) {
+ if (val & 0x02)
+ s->read_reg_select = val & 1;
+ if (val & 0x40)
+ s->special_mask = (val >> 5) & 1;
+ } else {
+ switch(val) {
+ case 0x00:
+ case 0x80:
+ s->rotate_on_autoeoi = val >> 7;
+ break;
+ case 0x20: /* end of interrupt */
+ case 0xa0:
+ priority = pic_get_priority(s, s->isr);
+ if (priority >= 0) {
+ s->isr &= ~(1 << ((priority + s->priority_add) & 7));
+ }
+ if (val == 0xa0)
+ s->priority_add = (s->priority_add + 1) & 7;
+ break;
+ case 0x60:
+ case 0x61:
+ case 0x62:
+ case 0x63:
+ case 0x64:
+ case 0x65:
+ case 0x66:
+ case 0x67:
+ priority = val & 7;
+ s->isr &= ~(1 << priority);
+ break;
+ case 0xc0:
+ case 0xc1:
+ case 0xc2:
+ case 0xc3:
+ case 0xc4:
+ case 0xc5:
+ case 0xc6:
+ case 0xc7:
+ s->priority_add = (val + 1) & 7;
+ break;
+ case 0xe0:
+ case 0xe1:
+ case 0xe2:
+ case 0xe3:
+ case 0xe4:
+ case 0xe5:
+ case 0xe6:
+ case 0xe7:
+ priority = val & 7;
+ s->isr &= ~(1 << priority);
+ s->priority_add = (priority + 1) & 7;
+ break;
+ }
+ }
+ } else {
+ switch(s->init_state) {
+ case 0:
+ /* normal mode */
+ s->imr = val;
+ s->update_irq(s->opaque);
+ break;
+ case 1:
+ s->irq_base = val & 0xf8;
+ s->init_state = 2;
+ break;
+ case 2:
+ if (s->init4) {
+ s->init_state = 3;
+ } else {
+ s->init_state = 0;
+ }
+ break;
+ case 3:
+ s->auto_eoi = (val >> 1) & 1;
+ s->init_state = 0;
+ break;
+ }
+ }
+}
+
+static uint32_t pic_read(void *opaque, uint32_t offset, int size_log2)
+{
+ PICState *s = opaque;
+ int addr, ret;
+
+ addr = offset & 1;
+ if (addr == 0) {
+ if (s->read_reg_select)
+ ret = s->isr;
+ else
+ ret = s->irr;
+ } else {
+ ret = s->imr;
+ }
+#ifdef DEBUG_PIC
+ console.log("pic_read: addr=" + toHex2(addr1) + " val=" + toHex2(ret));
+#endif
+ return ret;
+}
+
+static void pic_elcr_write(void *opaque, uint32_t offset,
+ uint32_t val, int size_log2)
+{
+ PICState *s = opaque;
+ s->elcr = val & s->elcr_mask;
+}
+
+static uint32_t pic_elcr_read(void *opaque, uint32_t offset, int size_log2)
+{
+ PICState *s = opaque;
+ return s->elcr;
+}
+
+typedef struct {
+ PICState *pics[2];
+ int irq_requested;
+ void (*cpu_set_irq)(void *opaque, int level);
+ void *opaque;
+#if defined(DEBUG_PIC)
+ uint8_t irq_level[16];
+#endif
+ IRQSignal *irqs;
+} PIC2State;
+
+static void pic2_update_irq(void *opaque);
+static void pic2_set_irq(void *opaque, int irq, int level);
+
+PIC2State *pic2_init(PhysMemoryMap *port_map, uint32_t addr0, uint32_t addr1,
+ uint32_t elcr_addr0, uint32_t elcr_addr1,
+ void (*cpu_set_irq)(void *opaque, int level),
+ void *opaque, IRQSignal *irqs)
+{
+ PIC2State *s;
+ int i;
+
+ s = mallocz(sizeof(*s));
+
+ for(i = 0; i < 16; i++) {
+ irq_init(&irqs[i], pic2_set_irq, s, i);
+ }
+ s->cpu_set_irq = cpu_set_irq;
+ s->opaque = opaque;
+ s->pics[0] = pic_init(port_map, addr0, elcr_addr0, 0xf8, pic2_update_irq, s);
+ s->pics[1] = pic_init(port_map, addr1, elcr_addr1, 0xde, pic2_update_irq, s);
+ s->irq_requested = 0;
+ return s;
+}
+
+void pic2_set_elcr(PIC2State *s, const uint8_t *elcr)
+{
+ int i;
+ for(i = 0; i < 2; i++) {
+ s->pics[i]->elcr = elcr[i] & s->pics[i]->elcr_mask;
+ }
+}
+
+/* raise irq to CPU if necessary. must be called every time the active
+ irq may change */
+static void pic2_update_irq(void *opaque)
+{
+ PIC2State *s = opaque;
+ int irq2, irq;
+
+ /* first look at slave pic */
+ irq2 = pic_get_irq(s->pics[1]);
+ if (irq2 >= 0) {
+ /* if irq request by slave pic, signal master PIC */
+ pic_set_irq1(s->pics[0], 2, 1);
+ pic_set_irq1(s->pics[0], 2, 0);
+ }
+ /* look at requested irq */
+ irq = pic_get_irq(s->pics[0]);
+#if 0
+ console.log("irr=" + toHex2(s->pics[0].irr) + " imr=" + toHex2(s->pics[0].imr) + " isr=" + toHex2(s->pics[0].isr) + " irq="+ irq);
+#endif
+ if (irq >= 0) {
+ /* raise IRQ request on the CPU */
+ s->cpu_set_irq(s->opaque, 1);
+ } else {
+ /* lower irq */
+ s->cpu_set_irq(s->opaque, 0);
+ }
+}
+
+static void pic2_set_irq(void *opaque, int irq, int level)
+{
+ PIC2State *s = opaque;
+#if defined(DEBUG_PIC)
+ if (irq != 0 && level != s->irq_level[irq]) {
+ console.log("pic_set_irq: irq=" + irq + " level=" + level);
+ s->irq_level[irq] = level;
+ }
+#endif
+ pic_set_irq1(s->pics[irq >> 3], irq & 7, level);
+ pic2_update_irq(s);
+}
+
+/* called from the CPU to get the hardware interrupt number */
+static int pic2_get_hard_intno(PIC2State *s)
+{
+ int irq, irq2, intno;
+
+ irq = pic_get_irq(s->pics[0]);
+ if (irq >= 0) {
+ pic_intack(s->pics[0], irq);
+ if (irq == 2) {
+ irq2 = pic_get_irq(s->pics[1]);
+ if (irq2 >= 0) {
+ pic_intack(s->pics[1], irq2);
+ } else {
+ /* spurious IRQ on slave controller */
+ irq2 = 7;
+ }
+ intno = s->pics[1]->irq_base + irq2;
+ irq = irq2 + 8;
+ } else {
+ intno = s->pics[0]->irq_base + irq;
+ }
+ } else {
+ /* spurious IRQ on host controller */
+ irq = 7;
+ intno = s->pics[0]->irq_base + irq;
+ }
+ pic2_update_irq(s);
+
+#if defined(DEBUG_PIC)
+ if (irq != 0 && irq != 14)
+ printf("pic_interrupt: irq=%d\n", irq);
+#endif
+ return intno;
+}
+
+/***********************************************************/
+/* 8253 PIT emulation */
+
+#define PIT_FREQ 1193182
+
+#define RW_STATE_LSB 0
+#define RW_STATE_MSB 1
+#define RW_STATE_WORD0 2
+#define RW_STATE_WORD1 3
+#define RW_STATE_LATCHED_WORD0 4
+#define RW_STATE_LATCHED_WORD1 5
+
+//#define DEBUG_PIT
+
+typedef int64_t PITGetTicksFunc(void *opaque);
+
+typedef struct PITState PITState;
+
+typedef struct {
+ PITState *pit_state;
+ uint32_t count;
+ uint32_t latched_count;
+ uint8_t rw_state;
+ uint8_t mode;
+ uint8_t bcd;
+ uint8_t gate;
+ int64_t count_load_time;
+ int64_t last_irq_time;
+} PITChannel;
+
+struct PITState {
+ PITChannel pit_channels[3];
+ uint8_t speaker_data_on;
+ PITGetTicksFunc *get_ticks;
+ IRQSignal *irq;
+ void *opaque;
+};
+
+static void pit_load_count(PITChannel *pc, int val);
+static void pit_write(void *opaque, uint32_t offset,
+ uint32_t val, int size_log2);
+static uint32_t pit_read(void *opaque, uint32_t offset, int size_log2);
+static void speaker_write(void *opaque, uint32_t offset,
+ uint32_t val, int size_log2);
+static uint32_t speaker_read(void *opaque, uint32_t offset, int size_log2);
+
+PITState *pit_init(PhysMemoryMap *port_map, int addr0, int addr1,
+ IRQSignal *irq,
+ PITGetTicksFunc *get_ticks, void *opaque)
+{
+ PITState *s;
+ PITChannel *pc;
+ int i;
+
+ s = mallocz(sizeof(*s));
+
+ s->irq = irq;
+ s->get_ticks = get_ticks;
+ s->opaque = opaque;
+
+ for(i = 0; i < 3; i++) {
+ pc = &s->pit_channels[i];
+ pc->pit_state = s;
+ pc->mode = 3;
+ pc->gate = (i != 2) >> 0;
+ pit_load_count(pc, 0);
+ }
+ s->speaker_data_on = 0;
+
+ cpu_register_device(port_map, addr0, 4, s, pit_read, pit_write,
+ DEVIO_SIZE8);
+
+ cpu_register_device(port_map, addr1, 1, s, speaker_read, speaker_write,
+ DEVIO_SIZE8);
+ return s;
+}
+
+/* unit = PIT frequency */
+static int64_t pit_get_time(PITChannel *pc)
+{
+ PITState *s = pc->pit_state;
+ return s->get_ticks(s->opaque);
+}
+
+static uint32_t pit_get_count(PITChannel *pc)
+{
+ uint32_t counter;
+ uint64_t d;
+
+ d = pit_get_time(pc) - pc->count_load_time;
+ switch(pc->mode) {
+ case 0:
+ case 1:
+ case 4:
+ case 5:
+ counter = (pc->count - d) & 0xffff;
+ break;
+ default:
+ counter = pc->count - (d % pc->count);
+ break;
+ }
+ return counter;
+}
+
+/* get pit output bit */
+static int pit_get_out(PITChannel *pc)
+{
+ int out;
+ int64_t d;
+
+ d = pit_get_time(pc) - pc->count_load_time;
+ switch(pc->mode) {
+ default:
+ case 0:
+ out = (d >= pc->count) >> 0;
+ break;
+ case 1:
+ out = (d < pc->count) >> 0;
+ break;
+ case 2:
+ /* mode used by Linux */
+ if ((d % pc->count) == 0 && d != 0)
+ out = 1;
+ else
+ out = 0;
+ break;
+ case 3:
+ out = ((d % pc->count) < (pc->count >> 1)) >> 0;
+ break;
+ case 4:
+ case 5:
+ out = (d == pc->count) >> 0;
+ break;
+ }
+ return out;
+}
+
+static void pit_load_count(PITChannel *s, int val)
+{
+ if (val == 0)
+ val = 0x10000;
+ s->count_load_time = pit_get_time(s);
+ s->last_irq_time = 0;
+ s->count = val;
+}
+
+static void pit_write(void *opaque, uint32_t offset,
+ uint32_t val, int size_log2)
+{
+ PITState *pit = opaque;
+ int channel, access, addr;
+ PITChannel *s;
+
+ addr = offset & 3;
+#ifdef DEBUG_PIT
+ printf("pit_write: off=%d val=0x%02x\n", addr, val);
+#endif
+ if (addr == 3) {
+ channel = val >> 6;
+ if (channel == 3)
+ return;
+ s = &pit->pit_channels[channel];
+ access = (val >> 4) & 3;
+ switch(access) {
+ case 0:
+ s->latched_count = pit_get_count(s);
+ s->rw_state = RW_STATE_LATCHED_WORD0;
+ break;
+ default:
+ s->mode = (val >> 1) & 7;
+ s->bcd = val & 1;
+ s->rw_state = access - 1 + RW_STATE_LSB;
+ break;
+ }
+ } else {
+ s = &pit->pit_channels[addr];
+ switch(s->rw_state) {
+ case RW_STATE_LSB:
+ pit_load_count(s, val);
+ break;
+ case RW_STATE_MSB:
+ pit_load_count(s, val << 8);
+ break;
+ case RW_STATE_WORD0:
+ case RW_STATE_WORD1:
+ if (s->rw_state & 1) {
+ pit_load_count(s, (s->latched_count & 0xff) | (val << 8));
+ } else {
+ s->latched_count = val;
+ }
+ s->rw_state ^= 1;
+ break;
+ }
+ }
+}
+
+static uint32_t pit_read(void *opaque, uint32_t offset, int size_log2)
+{
+ PITState *pit = opaque;
+ PITChannel *s;
+ int ret, count, addr;
+
+ addr = offset & 3;
+ if (addr == 3)
+ return 0xff;
+
+ s = &pit->pit_channels[addr];
+ switch(s->rw_state) {
+ case RW_STATE_LSB:
+ case RW_STATE_MSB:
+ case RW_STATE_WORD0:
+ case RW_STATE_WORD1:
+ count = pit_get_count(s);
+ if (s->rw_state & 1)
+ ret = (count >> 8) & 0xff;
+ else
+ ret = count & 0xff;
+ if (s->rw_state & 2)
+ s->rw_state ^= 1;
+ break;
+ default:
+ case RW_STATE_LATCHED_WORD0:
+ case RW_STATE_LATCHED_WORD1:
+ if (s->rw_state & 1)
+ ret = s->latched_count >> 8;
+ else
+ ret = s->latched_count & 0xff;
+ s->rw_state ^= 1;
+ break;
+ }
+#ifdef DEBUG_PIT
+ printf("pit_read: off=%d val=0x%02x\n", addr, ret);
+#endif
+ return ret;
+}
+
+static void speaker_write(void *opaque, uint32_t offset,
+ uint32_t val, int size_log2)
+{
+ PITState *pit = opaque;
+ pit->speaker_data_on = (val >> 1) & 1;
+ pit->pit_channels[2].gate = val & 1;
+}
+
+static uint32_t speaker_read(void *opaque, uint32_t offset, int size_log2)
+{
+ PITState *pit = opaque;
+ PITChannel *s;
+ int out, val;
+
+ s = &pit->pit_channels[2];
+ out = pit_get_out(s);
+ val = (pit->speaker_data_on << 1) | s->gate | (out << 5);
+#ifdef DEBUG_PIT
+ // console.log("speaker_read: addr=" + toHex2(addr) + " val=" + toHex2(val));
+#endif
+ return val;
+}
+
+/* set the IRQ if necessary and return the delay in ms until the next
+ IRQ. Note: The code does not handle all the PIT configurations. */
+static int pit_update_irq(PITState *pit)
+{
+ PITChannel *s;
+ int64_t d, delay;
+
+ s = &pit->pit_channels[0];
+
+ delay = PIT_FREQ; /* could be infinity delay */
+
+ d = pit_get_time(s) - s->count_load_time;
+ switch(s->mode) {
+ default:
+ case 0:
+ case 1:
+ case 4:
+ case 5:
+ if (s->last_irq_time == 0) {
+ delay = s->count - d;
+ if (delay <= 0) {
+ set_irq(pit->irq, 1);
+ set_irq(pit->irq, 0);
+ s->last_irq_time = d;
+ }
+ }
+ break;
+ case 2: /* mode used by Linux */
+ case 3:
+ delay = s->last_irq_time + s->count - d;
+ if (delay <= 0) {
+ set_irq(pit->irq, 1);
+ set_irq(pit->irq, 0);
+ s->last_irq_time += s->count;
+ }
+ break;
+ }
+
+ if (delay <= 0)
+ return 0;
+ else
+ return delay / (PIT_FREQ / 1000);
+}
+
+/***********************************************************/
+/* serial port emulation */
+
+#define UART_LCR_DLAB 0x80 /* Divisor latch access bit */
+
+#define UART_IER_MSI 0x08 /* Enable Modem status interrupt */
+#define UART_IER_RLSI 0x04 /* Enable receiver line status interrupt */
+#define UART_IER_THRI 0x02 /* Enable Transmitter holding register int. */
+#define UART_IER_RDI 0x01 /* Enable receiver data interrupt */
+
+#define UART_IIR_NO_INT 0x01 /* No interrupts pending */
+#define UART_IIR_ID 0x06 /* Mask for the interrupt ID */
+
+#define UART_IIR_MSI 0x00 /* Modem status interrupt */
+#define UART_IIR_THRI 0x02 /* Transmitter holding register empty */
+#define UART_IIR_RDI 0x04 /* Receiver data interrupt */
+#define UART_IIR_RLSI 0x06 /* Receiver line status interrupt */
+#define UART_IIR_FE 0xC0 /* Fifo enabled */
+
+#define UART_LSR_TEMT 0x40 /* Transmitter empty */
+#define UART_LSR_THRE 0x20 /* Transmit-hold-register empty */
+#define UART_LSR_BI 0x10 /* Break interrupt indicator */
+#define UART_LSR_FE 0x08 /* Frame error indicator */
+#define UART_LSR_PE 0x04 /* Parity error indicator */
+#define UART_LSR_OE 0x02 /* Overrun error indicator */
+#define UART_LSR_DR 0x01 /* Receiver data ready */
+
+#define UART_FCR_XFR 0x04 /* XMIT Fifo Reset */
+#define UART_FCR_RFR 0x02 /* RCVR Fifo Reset */
+#define UART_FCR_FE 0x01 /* FIFO Enable */
+
+#define UART_FIFO_LENGTH 16 /* 16550A Fifo Length */
+
+typedef struct {
+ uint8_t divider;
+ uint8_t rbr; /* receive register */
+ uint8_t ier;
+ uint8_t iir; /* read only */
+ uint8_t lcr;
+ uint8_t mcr;
+ uint8_t lsr; /* read only */
+ uint8_t msr;
+ uint8_t scr;
+ uint8_t fcr;
+ IRQSignal *irq;
+ void (*write_func)(void *opaque, const uint8_t *buf, int buf_len);
+ void *opaque;
+} SerialState;
+
+static void serial_write(void *opaque, uint32_t offset,
+ uint32_t val, int size_log2);
+static uint32_t serial_read(void *opaque, uint32_t offset, int size_log2);
+
+SerialState *serial_init(PhysMemoryMap *port_map, int addr,
+ IRQSignal *irq,
+ void (*write_func)(void *opaque, const uint8_t *buf, int buf_len), void *opaque)
+{
+ SerialState *s;
+ s = mallocz(sizeof(*s));
+
+ /* all 8 bit registers */
+ s->divider = 0;
+ s->rbr = 0; /* receive register */
+ s->ier = 0;
+ s->iir = UART_IIR_NO_INT; /* read only */
+ s->lcr = 0;
+ s->mcr = 0;
+ s->lsr = UART_LSR_TEMT | UART_LSR_THRE; /* read only */
+ s->msr = 0;
+ s->scr = 0;
+ s->fcr = 0;
+
+ s->irq = irq;
+ s->write_func = write_func;
+ s->opaque = opaque;
+
+ cpu_register_device(port_map, addr, 8, s, serial_read, serial_write,
+ DEVIO_SIZE8);
+ return s;
+}
+
+static void serial_update_irq(SerialState *s)
+{
+ if ((s->lsr & UART_LSR_DR) && (s->ier & UART_IER_RDI)) {
+ s->iir = UART_IIR_RDI;
+ } else if ((s->lsr & UART_LSR_THRE) && (s->ier & UART_IER_THRI)) {
+ s->iir = UART_IIR_THRI;
+ } else {
+ s->iir = UART_IIR_NO_INT;
+ }
+ if (s->iir != UART_IIR_NO_INT) {
+ set_irq(s->irq, 1);
+ } else {
+ set_irq(s->irq, 0);
+ }
+}
+
+#if 0
+/* send remainining chars in fifo */
+Serial.prototype.write_tx_fifo = function()
+{
+ if (s->tx_fifo != "") {
+ s->write_func(s->tx_fifo);
+ s->tx_fifo = "";
+
+ s->lsr |= UART_LSR_THRE;
+ s->lsr |= UART_LSR_TEMT;
+ s->update_irq();
+ }
+}
+#endif
+
+static void serial_write(void *opaque, uint32_t offset,
+ uint32_t val, int size_log2)
+{
+ SerialState *s = opaque;
+ int addr;
+
+ addr = offset & 7;
+ switch(addr) {
+ default:
+ case 0:
+ if (s->lcr & UART_LCR_DLAB) {
+ s->divider = (s->divider & 0xff00) | val;
+ } else {
+#if 0
+ if (s->fcr & UART_FCR_FE) {
+ s->tx_fifo += String.fromCharCode(val);
+ s->lsr &= ~UART_LSR_THRE;
+ serial_update_irq(s);
+ if (s->tx_fifo.length >= UART_FIFO_LENGTH) {
+ /* write to the terminal */
+ s->write_tx_fifo();
+ }
+ } else
+#endif
+ {
+ uint8_t ch;
+ s->lsr &= ~UART_LSR_THRE;
+ serial_update_irq(s);
+
+ /* write to the terminal */
+ ch = val;
+ s->write_func(s->opaque, &ch, 1);
+ s->lsr |= UART_LSR_THRE;
+ s->lsr |= UART_LSR_TEMT;
+ serial_update_irq(s);
+ }
+ }
+ break;
+ case 1:
+ if (s->lcr & UART_LCR_DLAB) {
+ s->divider = (s->divider & 0x00ff) | (val << 8);
+ } else {
+ s->ier = val;
+ serial_update_irq(s);
+ }
+ break;
+ case 2:
+#if 0
+ if ((s->fcr ^ val) & UART_FCR_FE) {
+ /* clear fifos */
+ val |= UART_FCR_XFR | UART_FCR_RFR;
+ }
+ if (val & UART_FCR_XFR)
+ s->tx_fifo = "";
+ if (val & UART_FCR_RFR)
+ s->rx_fifo = "";
+ s->fcr = val & UART_FCR_FE;
+#endif
+ break;
+ case 3:
+ s->lcr = val;
+ break;
+ case 4:
+ s->mcr = val;
+ break;
+ case 5:
+ break;
+ case 6:
+ s->msr = val;
+ break;
+ case 7:
+ s->scr = val;
+ break;
+ }
+}
+
+static uint32_t serial_read(void *opaque, uint32_t offset, int size_log2)
+{
+ SerialState *s = opaque;
+ int ret, addr;
+
+ addr = offset & 7;
+ switch(addr) {
+ default:
+ case 0:
+ if (s->lcr & UART_LCR_DLAB) {
+ ret = s->divider & 0xff;
+ } else {
+ ret = s->rbr;
+ s->lsr &= ~(UART_LSR_DR | UART_LSR_BI);
+ serial_update_irq(s);
+#if 0
+ /* try to receive next chars */
+ s->send_char_from_fifo();
+#endif
+ }
+ break;
+ case 1:
+ if (s->lcr & UART_LCR_DLAB) {
+ ret = (s->divider >> 8) & 0xff;
+ } else {
+ ret = s->ier;
+ }
+ break;
+ case 2:
+ ret = s->iir;
+ if (s->fcr & UART_FCR_FE)
+ ret |= UART_IIR_FE;
+ break;
+ case 3:
+ ret = s->lcr;
+ break;
+ case 4:
+ ret = s->mcr;
+ break;
+ case 5:
+ ret = s->lsr;
+ break;
+ case 6:
+ ret = s->msr;
+ break;
+ case 7:
+ ret = s->scr;
+ break;
+ }
+ return ret;
+}
+
+void serial_send_break(SerialState *s)
+{
+ s->rbr = 0;
+ s->lsr |= UART_LSR_BI | UART_LSR_DR;
+ serial_update_irq(s);
+}
+
+#if 0
+static void serial_send_char(SerialState *s, int ch)
+{
+ s->rbr = ch;
+ s->lsr |= UART_LSR_DR;
+ serial_update_irq(s);
+}
+
+Serial.prototype.send_char_from_fifo = function()
+{
+ var fifo;
+
+ fifo = s->rx_fifo;
+ if (fifo != "" && !(s->lsr & UART_LSR_DR)) {
+ s->send_char(fifo.charCodeAt(0));
+ s->rx_fifo = fifo.substr(1, fifo.length - 1);
+ }
+}
+
+/* queue the string in the UART receive fifo and send it ASAP */
+Serial.prototype.send_chars = function(str)
+{
+ s->rx_fifo += str;
+ s->send_char_from_fifo();
+}
+
+#endif
+
+#ifdef DEBUG_BIOS
+static void bios_debug_write(void *opaque, uint32_t offset,
+ uint32_t val, int size_log2)
+{
+#ifdef EMSCRIPTEN
+ static char line_buf[256];
+ static int line_buf_index;
+ line_buf[line_buf_index++] = val;
+ if (val == '\n' || line_buf_index >= sizeof(line_buf) - 1) {
+ line_buf[line_buf_index] = '\0';
+ printf("%s", line_buf);
+ line_buf_index = 0;
+ }
+#else
+ putchar(val & 0xff);
+#endif
+}
+
+static uint32_t bios_debug_read(void *opaque, uint32_t offset, int size_log2)
+{
+ return 0;
+}
+#endif
+
+typedef struct PCMachine {
+ VirtMachine common;
+ uint64_t ram_size;
+ PhysMemoryMap *mem_map;
+ PhysMemoryMap *port_map;
+
+ X86CPUState *cpu_state;
+ PIC2State *pic_state;
+ IRQSignal pic_irq[16];
+ PITState *pit_state;
+ I440FXState *i440fx_state;
+ CMOSState *cmos_state;
+ SerialState *serial_state;
+
+ /* input */
+ VIRTIODevice *keyboard_dev;
+ VIRTIODevice *mouse_dev;
+ KBDState *kbd_state;
+ PS2MouseState *ps2_mouse;
+ VMMouseState *vm_mouse;
+ PS2KbdState *ps2_kbd;
+
+#ifdef USE_KVM
+ BOOL kvm_enabled;
+ int kvm_fd;
+ int vm_fd;
+ int vcpu_fd;
+ int kvm_run_size;
+ struct kvm_run *kvm_run;
+#endif
+} PCMachine;
+
+static void copy_kernel(PCMachine *s, const uint8_t *buf, int buf_len,
+ const char *cmd_line);
+
+static void port80_write(void *opaque, uint32_t offset,
+ uint32_t val64, int size_log2)
+{
+}
+
+static uint32_t port80_read(void *opaque, uint32_t offset, int size_log2)
+{
+ return 0xff;
+}
+
+static void port92_write(void *opaque, uint32_t offset,
+ uint32_t val, int size_log2)
+{
+}
+
+static uint32_t port92_read(void *opaque, uint32_t offset, int size_log2)
+{
+ int a20 = 1; /* A20=0 is not supported */
+ return a20 << 1;
+}
+
+#define VMPORT_MAGIC 0x564D5868
+#define REG_EAX 0
+#define REG_EBX 1
+#define REG_ECX 2
+#define REG_EDX 3
+#define REG_ESI 4
+#define REG_EDI 5
+
+static uint32_t vmport_read(void *opaque, uint32_t addr, int size_log2)
+{
+ PCMachine *s = opaque;
+ uint32_t regs[6];
+
+#ifdef USE_KVM
+ if (s->kvm_enabled) {
+ struct kvm_regs r;
+
+ ioctl(s->vcpu_fd, KVM_GET_REGS, &r);
+ regs[REG_EAX] = r.rax;
+ regs[REG_EBX] = r.rbx;
+ regs[REG_ECX] = r.rcx;
+ regs[REG_EDX] = r.rdx;
+ regs[REG_ESI] = r.rsi;
+ regs[REG_EDI] = r.rdi;
+
+ if (regs[REG_EAX] == VMPORT_MAGIC) {
+
+ vmmouse_handler(s->vm_mouse, regs);
+
+ /* Note: in 64 bits the high parts are reset to zero
+ in all cases. */
+ r.rax = regs[REG_EAX];
+ r.rbx = regs[REG_EBX];
+ r.rcx = regs[REG_ECX];
+ r.rdx = regs[REG_EDX];
+ r.rsi = regs[REG_ESI];
+ r.rdi = regs[REG_EDI];
+ ioctl(s->vcpu_fd, KVM_SET_REGS, &r);
+ }
+ } else
+#endif
+ {
+ regs[REG_EAX] = x86_cpu_get_reg(s->cpu_state, 0);
+ regs[REG_EBX] = x86_cpu_get_reg(s->cpu_state, 3);
+ regs[REG_ECX] = x86_cpu_get_reg(s->cpu_state, 1);
+ regs[REG_EDX] = x86_cpu_get_reg(s->cpu_state, 2);
+ regs[REG_ESI] = x86_cpu_get_reg(s->cpu_state, 6);
+ regs[REG_EDI] = x86_cpu_get_reg(s->cpu_state, 7);
+
+ if (regs[REG_EAX] == VMPORT_MAGIC) {
+ vmmouse_handler(s->vm_mouse, regs);
+
+ x86_cpu_set_reg(s->cpu_state, 0, regs[REG_EAX]);
+ x86_cpu_set_reg(s->cpu_state, 3, regs[REG_EBX]);
+ x86_cpu_set_reg(s->cpu_state, 1, regs[REG_ECX]);
+ x86_cpu_set_reg(s->cpu_state, 2, regs[REG_EDX]);
+ x86_cpu_set_reg(s->cpu_state, 6, regs[REG_ESI]);
+ x86_cpu_set_reg(s->cpu_state, 7, regs[REG_EDI]);
+ }
+ }
+ return regs[REG_EAX];
+}
+
+static void vmport_write(void *opaque, uint32_t addr, uint32_t val,
+ int size_log2)
+{
+}
+
+static void pic_set_irq_cb(void *opaque, int level)
+{
+ PCMachine *s = opaque;
+ x86_cpu_set_irq(s->cpu_state, level);
+}
+
+static void serial_write_cb(void *opaque, const uint8_t *buf, int buf_len)
+{
+ PCMachine *s = opaque;
+ if (s->common.console) {
+ s->common.console->write_data(s->common.console->opaque, buf, buf_len);
+ }
+}
+
+static int get_hard_intno_cb(void *opaque)
+{
+ PCMachine *s = opaque;
+ return pic2_get_hard_intno(s->pic_state);
+}
+
+static int64_t pit_get_ticks_cb(void *opaque)
+{
+ struct timespec ts;
+
+ clock_gettime(CLOCK_MONOTONIC, &ts);
+ return (uint64_t)ts.tv_sec * PIT_FREQ +
+ ((uint64_t)ts.tv_nsec * PIT_FREQ / 1000000000);
+}
+
+#define FRAMEBUFFER_BASE_ADDR 0xf0400000
+
+static uint8_t *get_ram_ptr(PCMachine *s, uint64_t paddr)
+{
+ PhysMemoryRange *pr;
+ pr = get_phys_mem_range(s->mem_map, paddr);
+ if (!pr || !pr->is_ram)
+ return NULL;
+ return pr->phys_mem + (uintptr_t)(paddr - pr->addr);
+}
+
+#ifdef DUMP_IOPORT
+static BOOL dump_port(int port)
+{
+ return !((port >= 0x1f0 && port <= 0x1f7) ||
+ (port >= 0x20 && port <= 0x21) ||
+ (port >= 0xa0 && port <= 0xa1));
+}
+#endif
+
+static void st_port(void *opaque, uint32_t port, uint32_t val, int size_log2)
+{
+ PCMachine *s = opaque;
+ PhysMemoryRange *pr;
+#ifdef DUMP_IOPORT
+ if (dump_port(port))
+ printf("write port=0x%x val=0x%x s=%d\n", port, val, 1 << size_log2);
+#endif
+ pr = get_phys_mem_range(s->port_map, port);
+ if (!pr) {
+ return;
+ }
+ port -= pr->addr;
+ if ((pr->devio_flags >> size_log2) & 1) {
+ pr->write_func(pr->opaque, port, (uint32_t)val, size_log2);
+ } else if (size_log2 == 1 && (pr->devio_flags & DEVIO_SIZE8)) {
+ pr->write_func(pr->opaque, port, val & 0xff, 0);
+ pr->write_func(pr->opaque, port + 1, (val >> 8) & 0xff, 0);
+ }
+}
+
+static uint32_t ld_port(void *opaque, uint32_t port1, int size_log2)
+{
+ PCMachine *s = opaque;
+ PhysMemoryRange *pr;
+ uint32_t val, port;
+
+ port = port1;
+ pr = get_phys_mem_range(s->port_map, port);
+ if (!pr) {
+ val = -1;
+ } else {
+ port -= pr->addr;
+ if ((pr->devio_flags >> size_log2) & 1) {
+ val = pr->read_func(pr->opaque, port, size_log2);
+ } else if (size_log2 == 1 && (pr->devio_flags & DEVIO_SIZE8)) {
+ val = pr->read_func(pr->opaque, port, 0) & 0xff;
+ val |= (pr->read_func(pr->opaque, port + 1, 0) & 0xff) << 8;
+ } else {
+ val = -1;
+ }
+ }
+#ifdef DUMP_IOPORT
+ if (dump_port(port1))
+ printf("read port=0x%x val=0x%x s=%d\n", port1, val, 1 << size_log2);
+#endif
+ return val;
+}
+
+static void pc_machine_set_defaults(VirtMachineParams *p)
+{
+ p->accel_enable = TRUE;
+}
+
+#ifdef USE_KVM
+
+static void sigalrm_handler(int sig)
+{
+}
+
+#define CPUID_APIC (1 << 9)
+#define CPUID_ACPI (1 << 22)
+
+static void kvm_set_cpuid(PCMachine *s)
+{
+ struct kvm_cpuid2 *kvm_cpuid;
+ int n_ent_max, i;
+ struct kvm_cpuid_entry2 *ent;
+
+ n_ent_max = 128;
+ kvm_cpuid = mallocz(sizeof(struct kvm_cpuid2) + n_ent_max * sizeof(kvm_cpuid->entries[0]));
+
+ kvm_cpuid->nent = n_ent_max;
+ if (ioctl(s->kvm_fd, KVM_GET_SUPPORTED_CPUID, kvm_cpuid) < 0) {
+ perror("KVM_GET_SUPPORTED_CPUID");
+ exit(1);
+ }
+
+ for(i = 0; i < kvm_cpuid->nent; i++) {
+ ent = &kvm_cpuid->entries[i];
+ /* remove the APIC & ACPI to be in sync with the emulator */
+ if (ent->function == 1 || ent->function == 0x80000001) {
+ ent->edx &= ~(CPUID_APIC | CPUID_ACPI);
+ }
+ }
+
+ if (ioctl(s->vcpu_fd, KVM_SET_CPUID2, kvm_cpuid) < 0) {
+ perror("KVM_SET_CPUID2");
+ exit(1);
+ }
+ free(kvm_cpuid);
+}
+
+/* XXX: should check overlapping mappings */
+static void kvm_map_ram(PhysMemoryMap *mem_map, PhysMemoryRange *pr)
+{
+ PCMachine *s = mem_map->opaque;
+ struct kvm_userspace_memory_region region;
+ int flags;
+
+ region.slot = pr - mem_map->phys_mem_range;
+ flags = 0;
+ if (pr->devram_flags & DEVRAM_FLAG_ROM)
+ flags |= KVM_MEM_READONLY;
+ if (pr->devram_flags & DEVRAM_FLAG_DIRTY_BITS)
+ flags |= KVM_MEM_LOG_DIRTY_PAGES;
+ region.flags = flags;
+ region.guest_phys_addr = pr->addr;
+ region.memory_size = pr->size;
+#if 0
+ printf("map slot %d: %08lx %08lx\n",
+ region.slot, pr->addr, pr->size);
+#endif
+ region.userspace_addr = (uintptr_t)pr->phys_mem;
+ if (ioctl(s->vm_fd, KVM_SET_USER_MEMORY_REGION, &region) < 0) {
+ perror("KVM_SET_USER_MEMORY_REGION");
+ exit(1);
+ }
+}
+
+/* XXX: just for one region */
+static PhysMemoryRange *kvm_register_ram(PhysMemoryMap *mem_map, uint64_t addr,
+ uint64_t size, int devram_flags)
+{
+ PhysMemoryRange *pr;
+ uint8_t *phys_mem;
+
+ pr = register_ram_entry(mem_map, addr, size, devram_flags);
+
+ phys_mem = mmap(NULL, size, PROT_READ | PROT_WRITE,
+ MAP_SHARED | MAP_ANONYMOUS, -1, 0);
+ if (!phys_mem)
+ return NULL;
+ pr->phys_mem = phys_mem;
+ if (devram_flags & DEVRAM_FLAG_DIRTY_BITS) {
+ int n_pages = size >> 12;
+ pr->dirty_bits_size = ((n_pages + 63) / 64) * 8;
+ pr->dirty_bits = mallocz(pr->dirty_bits_size);
+ }
+
+ if (pr->size != 0) {
+ kvm_map_ram(mem_map, pr);
+ }
+ return pr;
+}
+
+static void kvm_set_ram_addr(PhysMemoryMap *mem_map,
+ PhysMemoryRange *pr, uint64_t addr, BOOL enabled)
+{
+ if (enabled) {
+ if (pr->size == 0 || addr != pr->addr) {
+ /* move or create the region */
+ pr->size = pr->org_size;
+ pr->addr = addr;
+ kvm_map_ram(mem_map, pr);
+ }
+ } else {
+ if (pr->size != 0) {
+ pr->addr = 0;
+ pr->size = 0;
+ /* map a zero size region to disable */
+ kvm_map_ram(mem_map, pr);
+ }
+ }
+}
+
+static const uint32_t *kvm_get_dirty_bits(PhysMemoryMap *mem_map,
+ PhysMemoryRange *pr)
+{
+ PCMachine *s = mem_map->opaque;
+ struct kvm_dirty_log dlog;
+
+ if (pr->size == 0) {
+ /* not mapped: we assume no modification was made */
+ memset(pr->dirty_bits, 0, pr->dirty_bits_size);
+ } else {
+ dlog.slot = pr - mem_map->phys_mem_range;
+ dlog.dirty_bitmap = pr->dirty_bits;
+ if (ioctl(s->vm_fd, KVM_GET_DIRTY_LOG, &dlog) < 0) {
+ perror("KVM_GET_DIRTY_LOG");
+ exit(1);
+ }
+ }
+ return pr->dirty_bits;
+}
+
+static void kvm_free_ram(PhysMemoryMap *mem_map, PhysMemoryRange *pr)
+{
+ /* XXX: do it */
+ munmap(pr->phys_mem, pr->org_size);
+ free(pr->dirty_bits);
+}
+
+static void kvm_pic_set_irq(void *opaque, int irq_num, int level)
+{
+ PCMachine *s = opaque;
+ struct kvm_irq_level irq_level;
+ irq_level.irq = irq_num;
+ irq_level.level = level;
+ if (ioctl(s->vm_fd, KVM_IRQ_LINE, &irq_level) < 0) {
+ perror("KVM_IRQ_LINE");
+ exit(1);
+ }
+}
+
+static void kvm_init(PCMachine *s)
+{
+ int ret, i;
+ struct sigaction act;
+ struct kvm_pit_config pit_config;
+ uint64_t base_addr;
+
+ s->kvm_enabled = FALSE;
+ s->kvm_fd = open("/dev/kvm", O_RDWR);
+ if (s->kvm_fd < 0) {
+ fprintf(stderr, "KVM not available\n");
+ return;
+ }
+ ret = ioctl(s->kvm_fd, KVM_GET_API_VERSION, 0);
+ if (ret < 0) {
+ perror("KVM_GET_API_VERSION");
+ exit(1);
+ }
+ if (ret != 12) {
+ fprintf(stderr, "Unsupported KVM version\n");
+ close(s->kvm_fd);
+ s->kvm_fd = -1;
+ return;
+ }
+ s->vm_fd = ioctl(s->kvm_fd, KVM_CREATE_VM, 0);
+ if (s->vm_fd < 0) {
+ perror("KVM_CREATE_VM");
+ exit(1);
+ }
+
+ /* just before the BIOS */
+ base_addr = 0xfffbc000;
+ if (ioctl(s->vm_fd, KVM_SET_IDENTITY_MAP_ADDR, &base_addr) < 0) {
+ perror("KVM_SET_IDENTITY_MAP_ADDR");
+ exit(1);
+ }
+
+ if (ioctl(s->vm_fd, KVM_SET_TSS_ADDR, (long)(base_addr + 0x1000)) < 0) {
+ perror("KVM_SET_TSS_ADDR");
+ exit(1);
+ }
+
+ if (ioctl(s->vm_fd, KVM_CREATE_IRQCHIP, 0) < 0) {
+ perror("KVM_CREATE_IRQCHIP");
+ exit(1);
+ }
+
+ memset(&pit_config, 0, sizeof(pit_config));
+ pit_config.flags = KVM_PIT_SPEAKER_DUMMY;
+ if (ioctl(s->vm_fd, KVM_CREATE_PIT2, &pit_config)) {
+ perror("KVM_CREATE_PIT2");
+ exit(1);
+ }
+
+ s->vcpu_fd = ioctl(s->vm_fd, KVM_CREATE_VCPU, 0);
+ if (s->vcpu_fd < 0) {
+ perror("KVM_CREATE_VCPU");
+ exit(1);
+ }
+
+ kvm_set_cpuid(s);
+
+ /* map the kvm_run structure */
+ s->kvm_run_size = ioctl(s->kvm_fd, KVM_GET_VCPU_MMAP_SIZE, NULL);
+ if (s->kvm_run_size < 0) {
+ perror("KVM_GET_VCPU_MMAP_SIZE");
+ exit(1);
+ }
+
+ s->kvm_run = mmap(NULL, s->kvm_run_size, PROT_READ | PROT_WRITE,
+ MAP_SHARED, s->vcpu_fd, 0);
+ if (!s->kvm_run) {
+ perror("mmap kvm_run");
+ exit(1);
+ }
+
+ for(i = 0; i < 16; i++) {
+ irq_init(&s->pic_irq[i], kvm_pic_set_irq, s, i);
+ }
+
+ act.sa_handler = sigalrm_handler;
+ sigemptyset(&act.sa_mask);
+ act.sa_flags = 0;
+ sigaction(SIGALRM, &act, NULL);
+
+ s->kvm_enabled = TRUE;
+
+ s->mem_map->register_ram = kvm_register_ram;
+ s->mem_map->free_ram = kvm_free_ram;
+ s->mem_map->get_dirty_bits = kvm_get_dirty_bits;
+ s->mem_map->set_ram_addr = kvm_set_ram_addr;
+ s->mem_map->opaque = s;
+}
+
+static void kvm_exit_io(PCMachine *s, struct kvm_run *run)
+{
+ uint8_t *ptr;
+ int i;
+
+ ptr = (uint8_t *)run + run->io.data_offset;
+ // printf("port: addr=%04x\n", run->io.port);
+
+ for(i = 0; i < run->io.count; i++) {
+ if (run->io.direction == KVM_EXIT_IO_OUT) {
+ switch(run->io.size) {
+ case 1:
+ st_port(s, run->io.port, *(uint8_t *)ptr, 0);
+ break;
+ case 2:
+ st_port(s, run->io.port, *(uint16_t *)ptr, 1);
+ break;
+ case 4:
+ st_port(s, run->io.port, *(uint32_t *)ptr, 2);
+ break;
+ default:
+ abort();
+ }
+ } else {
+ switch(run->io.size) {
+ case 1:
+ *(uint8_t *)ptr = ld_port(s, run->io.port, 0);
+ break;
+ case 2:
+ *(uint16_t *)ptr = ld_port(s, run->io.port, 1);
+ break;
+ case 4:
+ *(uint32_t *)ptr = ld_port(s, run->io.port, 2);
+ break;
+ default:
+ abort();
+ }
+ }
+ ptr += run->io.size;
+ }
+}
+
+static void kvm_exit_mmio(PCMachine *s, struct kvm_run *run)
+{
+ uint8_t *data = run->mmio.data;
+ PhysMemoryRange *pr;
+ uint64_t addr;
+
+ pr = get_phys_mem_range(s->mem_map, run->mmio.phys_addr);
+ if (run->mmio.is_write) {
+ if (!pr || pr->is_ram)
+ return;
+ addr = run->mmio.phys_addr - pr->addr;
+ switch(run->mmio.len) {
+ case 1:
+ if (pr->devio_flags & DEVIO_SIZE8) {
+ pr->write_func(pr->opaque, addr, *(uint8_t *)data, 0);
+ }
+ break;
+ case 2:
+ if (pr->devio_flags & DEVIO_SIZE16) {
+ pr->write_func(pr->opaque, addr, *(uint16_t *)data, 1);
+ }
+ break;
+ case 4:
+ if (pr->devio_flags & DEVIO_SIZE32) {
+ pr->write_func(pr->opaque, addr, *(uint32_t *)data, 2);
+ }
+ break;
+ case 8:
+ if (pr->devio_flags & DEVIO_SIZE32) {
+ pr->write_func(pr->opaque, addr, *(uint32_t *)data, 2);
+ pr->write_func(pr->opaque, addr + 4, *(uint32_t *)(data + 4), 2);
+ }
+ break;
+ default:
+ abort();
+ }
+ } else {
+ if (!pr || pr->is_ram)
+ goto no_dev;
+ addr = run->mmio.phys_addr - pr->addr;
+ switch(run->mmio.len) {
+ case 1:
+ if (!(pr->devio_flags & DEVIO_SIZE8))
+ goto no_dev;
+ *(uint8_t *)data = pr->read_func(pr->opaque, addr, 0);
+ break;
+ case 2:
+ if (!(pr->devio_flags & DEVIO_SIZE16))
+ goto no_dev;
+ *(uint16_t *)data = pr->read_func(pr->opaque, addr, 1);
+ break;
+ case 4:
+ if (!(pr->devio_flags & DEVIO_SIZE32))
+ goto no_dev;
+ *(uint32_t *)data = pr->read_func(pr->opaque, addr, 2);
+ break;
+ case 8:
+ if (pr->devio_flags & DEVIO_SIZE32) {
+ *(uint32_t *)data =
+ pr->read_func(pr->opaque, addr, 2);
+ *(uint32_t *)(data + 4) =
+ pr->read_func(pr->opaque, addr + 4, 2);
+ } else {
+ no_dev:
+ memset(run->mmio.data, 0, run->mmio.len);
+ }
+ break;
+ default:
+ abort();
+ }
+
+ }
+}
+
+static void kvm_exec(PCMachine *s)
+{
+ struct kvm_run *run = s->kvm_run;
+ struct itimerval ival;
+ int ret;
+
+ /* Not efficient but simple: we use a timer to interrupt the
+ execution after a given time */
+ ival.it_interval.tv_sec = 0;
+ ival.it_interval.tv_usec = 0;
+ ival.it_value.tv_sec = 0;
+ ival.it_value.tv_usec = 10 * 1000; /* 10 ms max */
+ setitimer(ITIMER_REAL, &ival, NULL);
+
+ ret = ioctl(s->vcpu_fd, KVM_RUN, 0);
+ if (ret < 0) {
+ if (errno == EINTR || errno == EAGAIN) {
+ /* timeout */
+ return;
+ }
+ perror("KVM_RUN");
+ exit(1);
+ }
+ // printf("exit=%d\n", run->exit_reason);
+ switch(run->exit_reason) {
+ case KVM_EXIT_HLT:
+ break;
+ case KVM_EXIT_IO:
+ kvm_exit_io(s, run);
+ break;
+ case KVM_EXIT_MMIO:
+ kvm_exit_mmio(s, run);
+ break;
+ case KVM_EXIT_FAIL_ENTRY:
+ fprintf(stderr, "KVM_EXIT_FAIL_ENTRY: reason=0x%" PRIx64 "\n",
+ (uint64_t)run->fail_entry.hardware_entry_failure_reason);
+#if 0
+ {
+ struct kvm_regs regs;
+ if (ioctl(s->vcpu_fd, KVM_GET_REGS, &regs) < 0) {
+ perror("KVM_SET_REGS");
+ exit(1);
+ }
+ printf("RIP=%016" PRIx64 "\n", (uint64_t)regs.rip);
+ }
+#endif
+ exit(1);
+ case KVM_EXIT_INTERNAL_ERROR:
+ fprintf(stderr, "KVM_EXIT_INTERNAL_ERROR: suberror=0x%x\n",
+ (uint32_t)run->internal.suberror);
+ exit(1);
+ default:
+ fprintf(stderr, "KVM: unsupported exit_reason=%d\n", run->exit_reason);
+ exit(1);
+ }
+}
+#endif
+
+#if defined(EMSCRIPTEN)
+/* with Javascript clock_gettime() is not enough precise enough to
+ have a reliable TSC counter. XXX: increment the cycles during the
+ power down time */
+static uint64_t cpu_get_tsc(void *opaque)
+{
+ PCMachine *s = opaque;
+ uint64_t c;
+ c = x86_cpu_get_cycles(s->cpu_state);
+ return c;
+}
+#else
+
+#define TSC_FREQ 100000000
+
+static uint64_t cpu_get_tsc(void *opaque)
+{
+ struct timespec ts;
+
+ clock_gettime(CLOCK_MONOTONIC, &ts);
+ return (uint64_t)ts.tv_sec * TSC_FREQ +
+ (ts.tv_nsec / (1000000000 / TSC_FREQ));
+}
+#endif
+
+static void pc_flush_tlb_write_range(void *opaque, uint8_t *ram_addr,
+ size_t ram_size)
+{
+ PCMachine *s = opaque;
+ x86_cpu_flush_tlb_write_range_ram(s->cpu_state, ram_addr, ram_size);
+}
+
+static VirtMachine *pc_machine_init(const VirtMachineParams *p)
+{
+ PCMachine *s;
+ int i, piix3_devfn;
+ PCIBus *pci_bus;
+ VIRTIOBusDef vbus_s, *vbus = &vbus_s;
+
+ if (strcmp(p->machine_name, "pc") != 0) {
+ vm_error("unsupported machine: %s\n", p->machine_name);
+ return NULL;
+ }
+
+ assert(p->ram_size >= (1 << 20));
+
+ s = mallocz(sizeof(*s));
+ s->common.vmc = p->vmc;
+ s->ram_size = p->ram_size;
+
+ s->port_map = phys_mem_map_init();
+ s->mem_map = phys_mem_map_init();
+
+#ifdef USE_KVM
+ if (p->accel_enable) {
+ kvm_init(s);
+ }
+#endif
+
+#ifdef USE_KVM
+ if (!s->kvm_enabled)
+#endif
+ {
+ s->cpu_state = x86_cpu_init(s->mem_map);
+ x86_cpu_set_get_tsc(s->cpu_state, cpu_get_tsc, s);
+ x86_cpu_set_port_io(s->cpu_state, ld_port, st_port, s);
+
+ /* needed to handle the RAM dirty bits */
+ s->mem_map->opaque = s;
+ s->mem_map->flush_tlb_write_range = pc_flush_tlb_write_range;
+ }
+
+ /* set the RAM mapping and leave the VGA addresses empty */
+ cpu_register_ram(s->mem_map, 0xc0000, p->ram_size - 0xc0000, 0);
+ cpu_register_ram(s->mem_map, 0, 0xa0000, 0);
+
+ /* devices */
+ cpu_register_device(s->port_map, 0x80, 2, s, port80_read, port80_write,
+ DEVIO_SIZE8);
+ cpu_register_device(s->port_map, 0x92, 2, s, port92_read, port92_write,
+ DEVIO_SIZE8);
+
+ /* setup the bios */
+ if (p->files[VM_FILE_BIOS].len > 0) {
+ int bios_size, bios_size1;
+ uint8_t *bios_buf, *ptr;
+ uint32_t bios_addr;
+
+ bios_size = p->files[VM_FILE_BIOS].len;
+ bios_buf = p->files[VM_FILE_BIOS].buf;
+ assert((bios_size % 65536) == 0 && bios_size != 0);
+ bios_addr = -bios_size;
+ /* at the top of the 4GB memory */
+ cpu_register_ram(s->mem_map, bios_addr, bios_size, DEVRAM_FLAG_ROM);
+ ptr = get_ram_ptr(s, bios_addr);
+ memcpy(ptr, bios_buf, bios_size);
+ /* in the lower 1MB memory (currently set as RAM) */
+ bios_size1 = min_int(bios_size, 128 * 1024);
+ ptr = get_ram_ptr(s, 0x100000 - bios_size1);
+ memcpy(ptr, bios_buf + bios_size - bios_size1, bios_size1);
+#ifdef DEBUG_BIOS
+ cpu_register_device(s->port_map, 0x402, 2, s,
+ bios_debug_read, bios_debug_write,
+ DEVIO_SIZE8);
+#endif
+ }
+
+#ifdef USE_KVM
+ if (!s->kvm_enabled)
+#endif
+ {
+ s->pic_state = pic2_init(s->port_map, 0x20, 0xa0,
+ 0x4d0, 0x4d1,
+ pic_set_irq_cb, s,
+ s->pic_irq);
+ x86_cpu_set_get_hard_intno(s->cpu_state, get_hard_intno_cb, s);
+ s->pit_state = pit_init(s->port_map, 0x40, 0x61, &s->pic_irq[0],
+ pit_get_ticks_cb, s);
+ }
+
+ s->cmos_state = cmos_init(s->port_map, 0x70, &s->pic_irq[8],
+ p->rtc_local_time);
+
+ /* various cmos data */
+ {
+ int size;
+ /* memory size */
+ size = min_int((s->ram_size - (1 << 20)) >> 10, 65535);
+ put_le16(s->cmos_state->cmos_data + 0x30, size);
+ if (s->ram_size >= (16 << 20)) {
+ size = min_int((s->ram_size - (16 << 20)) >> 16, 65535);
+ put_le16(s->cmos_state->cmos_data + 0x34, size);
+ }
+ s->cmos_state->cmos_data[0x14] = 0x06; /* mouse + FPU present */
+ }
+
+ s->i440fx_state = i440fx_init(&pci_bus, &piix3_devfn, s->mem_map,
+ s->port_map, s->pic_irq);
+
+ s->common.console = p->console;
+ /* serial console */
+ if (0) {
+ s->serial_state = serial_init(s->port_map, 0x3f8, &s->pic_irq[4],
+ serial_write_cb, s);
+ }
+
+ memset(vbus, 0, sizeof(*vbus));
+ vbus->pci_bus = pci_bus;
+
+ if (p->console) {
+ /* virtio console */
+ s->common.console_dev = virtio_console_init(vbus, p->console);
+ }
+
+ /* block devices */
+ for(i = 0; i < p->drive_count;) {
+ const VMDriveEntry *de = &p->tab_drive[i];
+
+ if (!de->device || !strcmp(de->device, "virtio")) {
+ virtio_block_init(vbus, p->tab_drive[i].block_dev);
+ i++;
+ } else if (!strcmp(de->device, "ide")) {
+ BlockDevice *tab_bs[2];
+
+ tab_bs[0] = p->tab_drive[i++].block_dev;
+ tab_bs[1] = NULL;
+ if (i < p->drive_count)
+ tab_bs[1] = p->tab_drive[i++].block_dev;
+ ide_init(s->port_map, 0x1f0, 0x3f6, &s->pic_irq[14], tab_bs);
+ piix3_ide_init(pci_bus, piix3_devfn + 1);
+ }
+ }
+
+ /* virtio filesystem */
+ for(i = 0; i < p->fs_count; i++) {
+ virtio_9p_init(vbus, p->tab_fs[i].fs_dev,
+ p->tab_fs[i].tag);
+ }
+
+ if (p->display_device) {
+ FBDevice *fb_dev;
+
+ fb_dev = mallocz(sizeof(*fb_dev));
+ s->common.fb_dev = fb_dev;
+ if (!strcmp(p->display_device, "vga")) {
+ int bios_size;
+ uint8_t *bios_buf;
+ bios_size = p->files[VM_FILE_VGA_BIOS].len;
+ bios_buf = p->files[VM_FILE_VGA_BIOS].buf;
+ pci_vga_init(pci_bus, fb_dev, p->width, p->height,
+ bios_buf, bios_size);
+ } else if (!strcmp(p->display_device, "simplefb")) {
+ simplefb_init(s->mem_map,
+ FRAMEBUFFER_BASE_ADDR,
+ fb_dev, p->width, p->height);
+ } else {
+ vm_error("unsupported display device: %s\n", p->display_device);
+ exit(1);
+ }
+ }
+
+ if (p->input_device) {
+ if (!strcmp(p->input_device, "virtio")) {
+ s->keyboard_dev = virtio_input_init(vbus, VIRTIO_INPUT_TYPE_KEYBOARD);
+
+ s->mouse_dev = virtio_input_init(vbus, VIRTIO_INPUT_TYPE_TABLET);
+ } else if (!strcmp(p->input_device, "ps2")) {
+ s->kbd_state = i8042_init(&s->ps2_kbd, &s->ps2_mouse,
+ s->port_map,
+ &s->pic_irq[1], &s->pic_irq[12], 0x60);
+ /* vmmouse */
+ cpu_register_device(s->port_map, 0x5658, 1, s,
+ vmport_read, vmport_write,
+ DEVIO_SIZE32);
+ s->vm_mouse = vmmouse_init(s->ps2_mouse);
+ } else {
+ vm_error("unsupported input device: %s\n", p->input_device);
+ exit(1);
+ }
+ }
+
+ /* virtio net device */
+ for(i = 0; i < p->eth_count; i++) {
+ virtio_net_init(vbus, p->tab_eth[i].net);
+ s->common.net = p->tab_eth[i].net;
+ }
+
+ if (p->files[VM_FILE_KERNEL].buf) {
+ copy_kernel(s, p->files[VM_FILE_KERNEL].buf,
+ p->files[VM_FILE_KERNEL].len,
+ p->cmdline ? p->cmdline : "");
+ }
+
+ return (VirtMachine *)s;
+}
+
+static void pc_machine_end(VirtMachine *s1)
+{
+ PCMachine *s = (PCMachine *)s1;
+ /* XXX: free all */
+ if (s->cpu_state) {
+ x86_cpu_end(s->cpu_state);
+ }
+ phys_mem_map_end(s->mem_map);
+ phys_mem_map_end(s->port_map);
+ free(s);
+}
+
+static void pc_vm_send_key_event(VirtMachine *s1, BOOL is_down, uint16_t key_code)
+{
+ PCMachine *s = (PCMachine *)s1;
+ if (s->keyboard_dev) {
+ virtio_input_send_key_event(s->keyboard_dev, is_down, key_code);
+ } else if (s->ps2_kbd) {
+ ps2_put_keycode(s->ps2_kbd, is_down, key_code);
+ }
+}
+
+static BOOL pc_vm_mouse_is_absolute(VirtMachine *s1)
+{
+ PCMachine *s = (PCMachine *)s1;
+ if (s->mouse_dev) {
+ return TRUE;
+ } else if (s->vm_mouse) {
+ return vmmouse_is_absolute(s->vm_mouse);
+ } else {
+ return FALSE;
+ }
+}
+
+static void pc_vm_send_mouse_event(VirtMachine *s1, int dx, int dy, int dz,
+ unsigned int buttons)
+{
+ PCMachine *s = (PCMachine *)s1;
+ if (s->mouse_dev) {
+ virtio_input_send_mouse_event(s->mouse_dev, dx, dy, dz, buttons);
+ } else if (s->vm_mouse) {
+ vmmouse_send_mouse_event(s->vm_mouse, dx, dy, dz, buttons);
+ }
+}
+
+struct screen_info {
+} __attribute__((packed));
+
+/* from plex86 (BSD license) */
+struct __attribute__ ((packed)) linux_params {
+ /* screen_info structure */
+ uint8_t orig_x; /* 0x00 */
+ uint8_t orig_y; /* 0x01 */
+ uint16_t ext_mem_k; /* 0x02 */
+ uint16_t orig_video_page; /* 0x04 */
+ uint8_t orig_video_mode; /* 0x06 */
+ uint8_t orig_video_cols; /* 0x07 */
+ uint8_t flags; /* 0x08 */
+ uint8_t unused2; /* 0x09 */
+ uint16_t orig_video_ega_bx;/* 0x0a */
+ uint16_t unused3; /* 0x0c */
+ uint8_t orig_video_lines; /* 0x0e */
+ uint8_t orig_video_isVGA; /* 0x0f */
+ uint16_t orig_video_points;/* 0x10 */
+
+ /* VESA graphic mode -- linear frame buffer */
+ uint16_t lfb_width; /* 0x12 */
+ uint16_t lfb_height; /* 0x14 */
+ uint16_t lfb_depth; /* 0x16 */
+ uint32_t lfb_base; /* 0x18 */
+ uint32_t lfb_size; /* 0x1c */
+ uint16_t cl_magic, cl_offset; /* 0x20 */
+ uint16_t lfb_linelength; /* 0x24 */
+ uint8_t red_size; /* 0x26 */
+ uint8_t red_pos; /* 0x27 */
+ uint8_t green_size; /* 0x28 */
+ uint8_t green_pos; /* 0x29 */
+ uint8_t blue_size; /* 0x2a */
+ uint8_t blue_pos; /* 0x2b */
+ uint8_t rsvd_size; /* 0x2c */
+ uint8_t rsvd_pos; /* 0x2d */
+ uint16_t vesapm_seg; /* 0x2e */
+ uint16_t vesapm_off; /* 0x30 */
+ uint16_t pages; /* 0x32 */
+ uint16_t vesa_attributes; /* 0x34 */
+ uint32_t capabilities; /* 0x36 */
+ uint32_t ext_lfb_base; /* 0x3a */
+ uint8_t _reserved[2]; /* 0x3e */
+
+ /* 0x040 */ uint8_t apm_bios_info[20]; // struct apm_bios_info
+ /* 0x054 */ uint8_t pad2[0x80 - 0x54];
+
+ // Following 2 from 'struct drive_info_struct' in drivers/block/cciss.h.
+ // Might be truncated?
+ /* 0x080 */ uint8_t hd0_info[16]; // hd0-disk-parameter from intvector 0x41
+ /* 0x090 */ uint8_t hd1_info[16]; // hd1-disk-parameter from intvector 0x46
+
+ // System description table truncated to 16 bytes
+ // From 'struct sys_desc_table_struct' in linux/arch/i386/kernel/setup.c.
+ /* 0x0a0 */ uint16_t sys_description_len;
+ /* 0x0a2 */ uint8_t sys_description_table[14];
+ // [0] machine id
+ // [1] machine submodel id
+ // [2] BIOS revision
+ // [3] bit1: MCA bus
+
+ /* 0x0b0 */ uint8_t pad3[0x1e0 - 0xb0];
+ /* 0x1e0 */ uint32_t alt_mem_k;
+ /* 0x1e4 */ uint8_t pad4[4];
+ /* 0x1e8 */ uint8_t e820map_entries;
+ /* 0x1e9 */ uint8_t eddbuf_entries; // EDD_NR
+ /* 0x1ea */ uint8_t pad5[0x1f1 - 0x1ea];
+ /* 0x1f1 */ uint8_t setup_sects; // size of setup.S, number of sectors
+ /* 0x1f2 */ uint16_t mount_root_rdonly; // MOUNT_ROOT_RDONLY (if !=0)
+ /* 0x1f4 */ uint16_t sys_size; // size of compressed kernel-part in the
+ // (b)zImage-file (in 16 byte units, rounded up)
+ /* 0x1f6 */ uint16_t swap_dev; // (unused AFAIK)
+ /* 0x1f8 */ uint16_t ramdisk_flags;
+ /* 0x1fa */ uint16_t vga_mode; // (old one)
+ /* 0x1fc */ uint16_t orig_root_dev; // (high=Major, low=minor)
+ /* 0x1fe */ uint8_t pad6[1];
+ /* 0x1ff */ uint8_t aux_device_info;
+ /* 0x200 */ uint16_t jump_setup; // Jump to start of setup code,
+ // aka "reserved" field.
+ /* 0x202 */ uint8_t setup_signature[4]; // Signature for SETUP-header, ="HdrS"
+ /* 0x206 */ uint16_t header_format_version; // Version number of header format;
+ /* 0x208 */ uint8_t setup_S_temp0[8]; // Used by setup.S for communication with
+ // boot loaders, look there.
+ /* 0x210 */ uint8_t loader_type;
+ // 0 for old one.
+ // else 0xTV:
+ // T=0: LILO
+ // T=1: Loadlin
+ // T=2: bootsect-loader
+ // T=3: SYSLINUX
+ // T=4: ETHERBOOT
+ // V=version
+ /* 0x211 */ uint8_t loadflags;
+ // bit0 = 1: kernel is loaded high (bzImage)
+ // bit7 = 1: Heap and pointer (see below) set by boot
+ // loader.
+ /* 0x212 */ uint16_t setup_S_temp1;
+ /* 0x214 */ uint32_t kernel_start;
+ /* 0x218 */ uint32_t initrd_start;
+ /* 0x21c */ uint32_t initrd_size;
+ /* 0x220 */ uint8_t setup_S_temp2[4];
+ /* 0x224 */ uint16_t setup_S_heap_end_pointer;
+ /* 0x226 */ uint16_t pad70;
+ /* 0x228 */ uint32_t cmd_line_ptr;
+ /* 0x22c */ uint8_t pad7[0x2d0 - 0x22c];
+
+ /* 0x2d0 : Int 15, ax=e820 memory map. */
+ // (linux/include/asm-i386/e820.h, 'struct e820entry')
+#define E820MAX 32
+#define E820_RAM 1
+#define E820_RESERVED 2
+#define E820_ACPI 3 /* usable as RAM once ACPI tables have been read */
+#define E820_NVS 4
+ struct {
+ uint64_t addr;
+ uint64_t size;
+ uint32_t type;
+ } e820map[E820MAX];
+
+ /* 0x550 */ uint8_t pad8[0x600 - 0x550];
+
+ // BIOS Enhanced Disk Drive Services.
+ // (From linux/include/asm-i386/edd.h, 'struct edd_info')
+ // Each 'struct edd_info is 78 bytes, times a max of 6 structs in array.
+ /* 0x600 */ uint8_t eddbuf[0x7d4 - 0x600];
+
+ /* 0x7d4 */ uint8_t pad9[0x800 - 0x7d4];
+ /* 0x800 */ uint8_t commandline[0x800];
+
+ uint64_t gdt_table[4];
+};
+
+#define KERNEL_PARAMS_ADDR 0x00090000
+
+static void copy_kernel(PCMachine *s, const uint8_t *buf, int buf_len,
+ const char *cmd_line)
+{
+ uint8_t *ram_ptr;
+ int setup_sects, header_len, copy_len, setup_hdr_start, setup_hdr_end;
+ uint32_t load_address;
+ struct linux_params *params;
+ FBDevice *fb_dev;
+
+ if (buf_len < 1024) {
+ too_small:
+ fprintf(stderr, "Kernel too small\n");
+ exit(1);
+ }
+ if (buf[0x1fe] != 0x55 || buf[0x1ff] != 0xaa) {
+ fprintf(stderr, "Invalid kernel magic\n");
+ exit(1);
+ }
+ setup_sects = buf[0x1f1];
+ if (setup_sects == 0)
+ setup_sects = 4;
+ header_len = (setup_sects + 1) * 512;
+ if (buf_len < header_len)
+ goto too_small;
+ if (memcmp(buf + 0x202, "HdrS", 4) != 0) {
+ fprintf(stderr, "Kernel too old\n");
+ exit(1);
+ }
+ load_address = 0x100000; /* we don't support older protocols */
+
+ ram_ptr = get_ram_ptr(s, load_address);
+ copy_len = buf_len - header_len;
+ if (copy_len > (s->ram_size - load_address)) {
+ fprintf(stderr, "Not enough RAM\n");
+ exit(1);
+ }
+ memcpy(ram_ptr, buf + header_len, copy_len);
+
+ params = (void *)get_ram_ptr(s, KERNEL_PARAMS_ADDR);
+
+ memset(params, 0, sizeof(struct linux_params));
+
+ /* copy the setup header */
+ setup_hdr_start = 0x1f1;
+ setup_hdr_end = 0x202 + buf[0x201];
+ memcpy((uint8_t *)params + setup_hdr_start, buf + setup_hdr_start,
+ setup_hdr_end - setup_hdr_start);
+
+ strcpy((char *)params->commandline, cmd_line);
+
+ params->mount_root_rdonly = 0;
+ params->cmd_line_ptr = KERNEL_PARAMS_ADDR +
+ offsetof(struct linux_params, commandline);
+ params->alt_mem_k = (s->ram_size / 1024) - 1024;
+ params->loader_type = 0x01;
+#if 0
+ if (initrd_size > 0) {
+ params->initrd_start = INITRD_LOAD_ADDR;
+ params->initrd_size = initrd_size;
+ }
+#endif
+ params->orig_video_lines = 0;
+ params->orig_video_cols = 0;
+
+ fb_dev = s->common.fb_dev;
+ if (fb_dev) {
+
+ params->orig_video_isVGA = 0x23; /* VIDEO_TYPE_VLFB */
+
+ params->lfb_depth = 32;
+ params->red_size = 8;
+ params->red_pos = 16;
+ params->green_size = 8;
+ params->green_pos = 8;
+ params->blue_size = 8;
+ params->blue_pos = 0;
+ params->rsvd_size = 8;
+ params->rsvd_pos = 24;
+
+ params->lfb_width = fb_dev->width;
+ params->lfb_height = fb_dev->height;
+ params->lfb_linelength = fb_dev->stride;
+ params->lfb_size = fb_dev->fb_size;
+ params->lfb_base = FRAMEBUFFER_BASE_ADDR;
+ }
+
+ params->gdt_table[2] = 0x00cf9b000000ffffLL; /* CS */
+ params->gdt_table[3] = 0x00cf93000000ffffLL; /* DS */
+
+#ifdef USE_KVM
+ if (s->kvm_enabled) {
+ struct kvm_sregs sregs;
+ struct kvm_segment seg;
+ struct kvm_regs regs;
+
+ /* init flat protected mode */
+
+ if (ioctl(s->vcpu_fd, KVM_GET_SREGS, &sregs) < 0) {
+ perror("KVM_GET_SREGS");
+ exit(1);
+ }
+
+ sregs.cr0 |= (1 << 0); /* CR0_PE */
+ sregs.gdt.base = KERNEL_PARAMS_ADDR +
+ offsetof(struct linux_params, gdt_table);
+ sregs.gdt.limit = sizeof(params->gdt_table) - 1;
+
+ memset(&seg, 0, sizeof(seg));
+ seg.limit = 0xffffffff;
+ seg.present = 1;
+ seg.db = 1;
+ seg.s = 1; /* code/data */
+ seg.g = 1; /* 4KB granularity */
+
+ seg.type = 0xb; /* code */
+ seg.selector = 2 << 3;
+ sregs.cs = seg;
+
+ seg.type = 0x3; /* data */
+ seg.selector = 3 << 3;
+ sregs.ds = seg;
+ sregs.es = seg;
+ sregs.ss = seg;
+ sregs.fs = seg;
+ sregs.gs = seg;
+
+ if (ioctl(s->vcpu_fd, KVM_SET_SREGS, &sregs) < 0) {
+ perror("KVM_SET_SREGS");
+ exit(1);
+ }
+
+ memset(&regs, 0, sizeof(regs));
+ regs.rip = load_address;
+ regs.rsi = KERNEL_PARAMS_ADDR;
+ regs.rflags = 0x2;
+ if (ioctl(s->vcpu_fd, KVM_SET_REGS, &regs) < 0) {
+ perror("KVM_SET_REGS");
+ exit(1);
+ }
+ } else
+#endif
+ {
+ int i;
+ X86CPUSeg sd;
+ uint32_t val;
+ val = x86_cpu_get_reg(s->cpu_state, X86_CPU_REG_CR0);
+ x86_cpu_set_reg(s->cpu_state, X86_CPU_REG_CR0, val | (1 << 0));
+
+ sd.base = KERNEL_PARAMS_ADDR +
+ offsetof(struct linux_params, gdt_table);
+ sd.limit = sizeof(params->gdt_table) - 1;
+ x86_cpu_set_seg(s->cpu_state, X86_CPU_SEG_GDT, &sd);
+ sd.sel = 2 << 3;
+ sd.base = 0;
+ sd.limit = 0xffffffff;
+ sd.flags = 0xc09b;
+ x86_cpu_set_seg(s->cpu_state, X86_CPU_SEG_CS, &sd);
+ sd.sel = 3 << 3;
+ sd.flags = 0xc093;
+ for(i = 0; i < 6; i++) {
+ if (i != X86_CPU_SEG_CS) {
+ x86_cpu_set_seg(s->cpu_state, i, &sd);
+ }
+ }
+
+ x86_cpu_set_reg(s->cpu_state, X86_CPU_REG_EIP, load_address);
+ x86_cpu_set_reg(s->cpu_state, 6, KERNEL_PARAMS_ADDR); /* esi */
+ }
+
+ /* map PCI interrupts (no BIOS, so we must do it) */
+ {
+ uint8_t elcr[2];
+ static const uint8_t pci_irqs[4] = { 9, 10, 11, 12 };
+
+ i440fx_map_interrupts(s->i440fx_state, elcr, pci_irqs);
+ /* XXX: KVM support */
+ if (s->pic_state) {
+ pic2_set_elcr(s->pic_state, elcr);
+ }
+ }
+}
+
+/* in ms */
+static int pc_machine_get_sleep_duration(VirtMachine *s1, int delay)
+{
+ PCMachine *s = (PCMachine *)s1;
+
+#ifdef USE_KVM
+ if (s->kvm_enabled) {
+ /* XXX: improve */
+ cmos_update_irq(s->cmos_state);
+ delay = 0;
+ } else
+#endif
+ {
+ cmos_update_irq(s->cmos_state);
+ delay = min_int(delay, pit_update_irq(s->pit_state));
+ if (!x86_cpu_get_power_down(s->cpu_state))
+ delay = 0;
+ }
+ return delay;
+}
+
+static void pc_machine_interp(VirtMachine *s1, int max_exec_cycles)
+{
+ PCMachine *s = (PCMachine *)s1;
+#ifdef USE_KVM
+ if (s->kvm_enabled) {
+ kvm_exec(s);
+ } else
+#endif
+ {
+ x86_cpu_interp(s->cpu_state, max_exec_cycles);
+ }
+}
+
+const VirtMachineClass pc_machine_class = {
+ "pc",
+ pc_machine_set_defaults,
+ pc_machine_init,
+ pc_machine_end,
+ pc_machine_get_sleep_duration,
+ pc_machine_interp,
+ pc_vm_mouse_is_absolute,
+ pc_vm_send_mouse_event,
+ pc_vm_send_key_event,
+};