2 * This file is part of the Palacios Virtual Machine Monitor developed
3 * by the V3VEE Project with funding from the United States National
4 * Science Foundation and the Department of Energy.
6 * The V3VEE Project is a joint project between Northwestern University
7 * and the University of New Mexico. You can find out more at
10 * Copyright (c) 2009, Lei Xia <lxia@northwestern.edu>
11 * Copyright (c) 2009, Chang Seok Bae <jhuell@gmail.com>
12 * Copyright (c) 2009, Jack Lange <jarusl@cs.northwestern.edu>
13 * Copyright (c) 2009, The V3VEE Project <http://www.v3vee.org>
14 * All rights reserved.
16 * Author: Lei Xia <lxia@northwestern.edu>
17 * Chang Seok Bae <jhuell@gmail.com>
18 * Jack Lange <jarusl@cs.northwestern.edu>
20 * This is free software. You are permitted to use,
21 * redistribute, and modify it as specified in the file "V3VEE_LICENSE".
26 #include <palacios/vmm.h>
27 #include <palacios/vmm_types.h>
28 #include <palacios/vmm_io.h>
29 #include <palacios/vmm_intr.h>
30 #include <palacios/vmm_rbtree.h>
32 #include <devices/pci.h>
33 #include <devices/pci_types.h>
// As defined on the next line, PrintDebug expands to nothing, so every PrintDebug call
// in this file compiles away.
37 #define PrintDebug(fmt, args...)
// Base I/O ports of the configuration address and data registers. pci_init_device hooks
// four consecutive ports starting at each base (base + 0 .. base + 3).
41 #define CONFIG_ADDR_PORT 0x0cf8
42 #define CONFIG_DATA_PORT 0x0cfc
// Number of entries in the bus_list array of the PCI state.
45 #define PCI_BUS_COUNT 1
// Upper limit on device numbers per bus; the per-bus allocation bitmap dev_map is sized
// as MAX_BUS_DEVICES / 8 bytes, hence the divisibility requirement below.
47 // This must always be a multiple of 8
48 #define MAX_BUS_DEVICES 32
// Closing lines of a nested packed definition whose opening lines and fields are not
// visible here; presumably the configuration address register type used for addr_reg
// below -- TODO confirm.
61 } __attribute__((packed));
62 } __attribute__((packed));
63 } __attribute__((packed));
// Per-bus state (these two members are reached through struct pci_bus pointers
// elsewhere in this file).
72 // Red Black tree containing all attached devices
73 struct rb_root devices;
// One bit per allocatable slot; scanned by get_free_dev_num and set by allocate_dev_num.
75 // Bitmap of the allocated device numbers
76 uint8_t dev_map[MAX_BUS_DEVICES / 8];
// Top-level PCI state (these two members are reached through the vm_device private_data
// pointer cast to struct pci_internal).
82 // Configuration address register
83 struct pci_addr_reg addr_reg;
// One entry per bus. The configuration data port handlers only consult bus_list[0].
86 struct pci_bus bus_list[PCI_BUS_COUNT];
// Debug helper: starting from v3_rb_first on the device tree of bus 0 and advancing with
// v3_rb_next, prints the device number, name, interrupt line, vendor ID and device ID of
// each device through PrintDebug.
// NOTE(review): the first node is handed to rb_entry before any NULL test (the loop
// condition only tests the result of v3_rb_next), so this looks unsafe on an empty
// tree -- confirm it is only called after at least one device has been added.
95 static void pci_dump_state(struct pci_internal * pci_state) {
96 struct rb_node * node = v3_rb_first(&(pci_state->bus_list[0].devices));
97 struct pci_device * tmp_dev = NULL;
99 PrintDebug("===PCI: Dumping state Begin ==========\n");
102 tmp_dev = rb_entry(node, struct pci_device, dev_tree_node);
104 PrintDebug("PCI Device Number: %d (%s):\n", tmp_dev->dev_num, tmp_dev->name);
105 PrintDebug("irq = %d\n", tmp_dev->config_header.intr_line);
106 PrintDebug("Vend ID: 0x%x\n", tmp_dev->config_header.vendor_id);
107 PrintDebug("Device ID: 0x%x\n", tmp_dev->config_header.device_id);
109 } while ((node = v3_rb_next(node)));
111 PrintDebug("====PCI: Dumping state End==========\n");
// Returns a device number for the first clear bit found in bus->dev_map. Bytes equal to
// 0xff are skipped; for byte i, bit j the value returned is ((i * 8) + j) * 8, i.e. the
// bit index scaled by 8, so every value returned from the loop is a multiple of 8.
// v3_pci_register_device treats a result of -1 as no free slot; the statement that
// produces it is not visible in these lines.
// NOTE(review): confirm that the scaling by 8 matches the numbering used for device
// numbers that callers pass explicitly and that the config port handlers look up.
119 // Scan the dev_map bitmap for the first '0' bit
120 static int get_free_dev_num(struct pci_bus * bus) {
123 for (i = 0; i < sizeof(bus->dev_map); i++) {
124 if (bus->dev_map[i] != 0xff) {
126 for (j = 0; j < 8; j++) {
127 if (!(bus->dev_map[i] & (0x1 << j))) {
128 return ((i * 8) + j) * 8;
137 static void allocate_dev_num(struct pci_bus * bus, int dev_num) {
138 int major = (dev_num / 8) / 8;
139 int minor = dev_num % 8;
141 bus->dev_map[major] |= (0x1 << minor);
// Locates the insertion point for dev in the device tree of the bus, comparing dev_num
// against the devices already in the tree, and links the new node there with
// rb_link_node. The caller add_device_to_bus follows up with v3_rb_insert_color.
// Returns a struct pci_device pointer; add_device_to_bus takes a separate path when the
// result is non-NULL -- presumably that is an existing device with the same dev_num,
// but the equal-key branch is not visible here (TODO confirm).
// NOTE(review): not declared static although it is only referenced from this file in
// the visible lines.
147 struct pci_device * __add_device_to_bus(struct pci_bus * bus, struct pci_device * dev) {
149 struct rb_node ** p = &(bus->devices.rb_node);
150 struct rb_node * parent = NULL;
151 struct pci_device * tmp_dev = NULL;
155 tmp_dev = rb_entry(parent, struct pci_device, dev_tree_node);
157 if (dev->dev_num < tmp_dev->dev_num) {
159 } else if (dev->dev_num > tmp_dev->dev_num) {
166 rb_link_node(&(dev->dev_tree_node), parent, p);
// Adds dev to the bus: links it into the device tree through __add_device_to_bus, calls
// v3_rb_insert_color on the new node, then records the device number in the bus bitmap
// with allocate_dev_num.
// A non-NULL result from __add_device_to_bus is handled inside the if below; the body of
// that branch and the final return are not visible here.
173 struct pci_device * add_device_to_bus(struct pci_bus * bus, struct pci_device * dev) {
175 struct pci_device * ret = NULL;
177 if ((ret = __add_device_to_bus(bus, dev))) {
181 v3_rb_insert_color(&(dev->dev_tree_node), &(bus->devices));
183 allocate_dev_num(bus, dev->dev_num);
// Looks up a device on the bus by device number, starting at the root of the device
// tree and comparing dev_num against each visited device.
// Callers in this file treat a NULL result as no device registered under that number.
// The loop header, the child-pointer steps and the return statements are not visible in
// these lines.
189 static struct pci_device * get_device(struct pci_bus * bus, int dev_num) {
190 struct rb_node * n = bus->devices.rb_node;
191 struct pci_device * dev = NULL;
194 dev = rb_entry(n, struct pci_device, dev_tree_node);
196 if (dev_num < dev->dev_num) {
198 } else if (dev_num > dev->dev_num) {
// I/O read handler hooked on the configuration address ports (see pci_init_device).
// The low two bits of the port give the byte offset into the 32-bit address register
// value, and the read is served from that offset:
//   - 32-bit copy: only at offset 0 (the length test for this branch is not visible;
//     presumably length == 4)
//   - length 2: rejected when the offset is greater than 2
//   - length 1: any offset
// Any other length is reported through PrintError. The return statements are not
// visible in these lines.
214 static int addr_port_read(ushort_t port, void * dst, uint_t length, struct vm_device * dev) {
215 struct pci_internal * pci_state = (struct pci_internal *)dev->private_data;
216 int reg_offset = port & 0x3;
217 uint8_t * reg_addr = ((uint8_t *)&(pci_state->addr_reg.val)) + reg_offset;
219 PrintDebug("Reading PCI Address Port (%x): %x\n", port, pci_state->addr_reg.val);
222 if (reg_offset != 0) {
223 PrintError("Invalid Address Port Read\n");
226 *(uint32_t *)dst = *(uint32_t *)reg_addr;
227 } else if (length == 2) {
228 if (reg_offset > 2) {
229 PrintError("Invalid Address Port Read\n");
232 *(uint16_t *)dst = *(uint16_t *)reg_addr;
233 } else if (length == 1) {
234 *(uint8_t *)dst = *(uint8_t *)reg_addr;
236 PrintError("Invalid read length (%d) for PCI address register\n", length);
// I/O write handler hooked on the configuration address ports (see pci_init_device).
// Mirrors addr_port_read: the low two bits of the port give the byte offset into the
// 32-bit address register value, and src is stored at that offset:
//   - 32-bit store: only at offset 0 (the length test for this branch is not visible;
//     presumably length == 4)
//   - length 2: rejected when the offset is greater than 2
//   - length 1: any offset
// Any other length is reported through PrintError. The return statements are not
// visible in these lines.
245 static int addr_port_write(ushort_t port, void * src, uint_t length, struct vm_device * dev) {
246 struct pci_internal * pci_state = (struct pci_internal *)dev->private_data;
247 int reg_offset = port & 0x3;
248 uint8_t * reg_addr = ((uint8_t *)&(pci_state->addr_reg.val)) + reg_offset;
252 if (reg_offset != 0) {
253 PrintError("Invalid Address Port Write\n");
257 PrintDebug("Writing PCI 4 bytes Val=%x\n", *(uint32_t *)src);
259 *(uint32_t *)reg_addr = *(uint32_t *)src;
260 } else if (length == 2) {
261 if (reg_offset > 2) {
262 PrintError("Invalid Address Port Write\n");
266 PrintDebug("Writing PCI 2 byte Val=%x\n", *(uint16_t *)src);
268 *(uint16_t *)reg_addr = *(uint16_t *)src;
269 } else if (length == 1) {
270 PrintDebug("Writing PCI 1 byte Val=%x\n", *(uint8_t *)src);
271 *(uint8_t *)reg_addr = *(uint8_t *)src;
273 PrintError("Invalid write length (%d) for PCI address register\n", length);
277 PrintDebug("Writing PCI Address Port(%x): %x\n", port, pci_state->addr_reg.val);
// I/O read handler hooked on the configuration data ports (see pci_init_device).
// The register to read is addr_reg.reg_num plus the low two bits of the port. The device
// is looked up on bus_list[0] by addr_reg.dev_num; addr_reg.bus_num is only printed.
// When no device is registered under that number every byte of dst is set to 0xff;
// otherwise length bytes are copied from the device config_space starting at reg_num.
// NOTE(review): no bound check on reg_num + i against the size of config_space is
// visible here -- confirm the register and length ranges keep the access in bounds.
284 static int data_port_read(ushort_t port, void * dst, uint_t length, struct vm_device * vmdev) {
285 struct pci_internal * pci_state = (struct pci_internal *)vmdev->private_data;;
286 struct pci_device * pci_dev = NULL;
287 uint_t reg_num = pci_state->addr_reg.reg_num + (port & 0x3);
290 PrintDebug("Reading PCI Data register. bus = %d, dev = %d, reg = %d (%x), cfg_reg = %x\n",
291 pci_state->addr_reg.bus_num,
292 pci_state->addr_reg.dev_num,
294 pci_state->addr_reg.val);
297 pci_dev = get_device(&(pci_state->bus_list[0]), pci_state->addr_reg.dev_num);
299 if (pci_dev == NULL) {
300 for (i = 0; i < length; i++) {
301 *((uint8_t *)dst + i) = 0xff;
307 for (i = 0; i < length; i++) {
308 *((uint8_t *)dst + i) = pci_dev->config_space[reg_num + i];
// Decides, from the header type and the register number, whether a configuration space
// byte may be written; data_port_write uses the result as a boolean.
// Only the header_type == 0x00 branch is visible here (its per-register rules are not).
// The existing comments name the bridge header types 0x01 and 0x02, and an unrecognised
// header type is reported through PrintError.
315 static inline int is_cfg_reg_writable(uchar_t header_type, int reg_num) {
316 if (header_type == 0x00) {
335 // PCI to PCI Bridge = 0x01
336 // CardBus Bridge = 0x02
339 PrintError("Invalid PCI Header type (0x%.2x)\n", header_type);
346 static int data_port_write(ushort_t port, void * src, uint_t length, struct vm_device * vmdev) {
347 struct pci_internal * pci_state = (struct pci_internal *)vmdev->private_data;
348 struct pci_device * pci_dev = NULL;
349 uint_t reg_num = pci_state->addr_reg.reg_num + (port & 0x3);
352 PrintDebug("Writing PCI Data register. bus = %d, dev = %d, reg = %d (%x) addr_reg = %x\n",
353 pci_state->addr_reg.bus_num,
354 pci_state->addr_reg.dev_num,
356 pci_state->addr_reg.val);
359 pci_dev = get_device(&(pci_state->bus_list[0]), pci_state->addr_reg.dev_num);
361 if (pci_dev == NULL) {
362 PrintError("Writing configuration space for non-present device (dev_num=%d)\n",
363 pci_state->addr_reg.dev_num);
368 for (i = 0; i < length; i++) {
369 uint_t cur_reg = reg_num + i;
371 if (is_cfg_reg_writable(pci_dev->config_header.header_type, cur_reg)) {
372 pci_dev->config_space[cur_reg] = *((uint8_t *)src + i);
374 if ((cur_reg >= 0x10) && (cur_reg < 0x28)) {
376 int bar_reg = (cur_reg & ~0x3) - 0x10;
378 if (pci_dev->bar[bar_reg].bar_update) {
379 pci_dev->bar_update_flag = 1;
380 pci_dev->bar[bar_reg].updated = 1;
382 } else if ((cur_reg >= 0x30) && (cur_reg < 0x34)) {
383 pci_dev->ext_rom_update_flag = 1;
384 } else if (cur_reg == 0x04) {
386 uint8_t command = *((uint8_t *)src + i);
388 pci_dev->config_space[cur_reg] = command;
390 if (pci_dev->cmd_update) {
391 pci_dev->cmd_update(pci_dev, (command & 0x01), (command & 0x02));
395 } else if (cur_reg == 0x0f) {
397 pci_dev->config_header.BIST = 0x00;
402 if (pci_dev->config_update) {
403 pci_dev->config_update(pci_dev, reg_num, length);
406 // Scan for BAR updated
407 if (pci_dev->bar_update_flag) {
408 for (i = 0; i < 6; i++) {
409 if (pci_dev->bar[i].updated) {
410 int bar_offset = 0x10 + 4 * i;
412 *(uint32_t *)(pci_dev->config_space + bar_offset) &= pci_dev->bar[i].mask;
414 if (pci_dev->bar[i].bar_update) {
415 pci_dev->bar[i].bar_update(pci_dev, i);
417 pci_dev->bar[i].updated = 0;
420 pci_dev->bar_update_flag = 0;
423 if ((pci_dev->ext_rom_update_flag) && (pci_dev->ext_rom_update)) {
424 pci_dev->ext_rom_update(pci_dev);
425 pci_dev->ext_rom_update_flag = 0;
// Reset callback registered in dev_ops. The visible body only emits a debug message;
// the return statement is not visible in these lines.
434 static int pci_reset_device(struct vm_device * dev) {
435 PrintDebug("pci: reset device\n");
// Start callback registered in dev_ops. The visible body only emits a debug message;
// the return statement is not visible in these lines.
440 static int pci_start_device(struct vm_device * dev) {
441 PrintDebug("pci: start device\n");
// Stop callback registered in dev_ops. The visible body only emits a debug message;
// the return statement is not visible in these lines.
446 static int pci_stop_device(struct vm_device * dev) {
447 PrintDebug("pci: stop device\n");
// Deinit callback registered in dev_ops: unhooks the four configuration address ports
// and the four configuration data ports (base + 0 .. base + 3), matching the hooks
// installed by pci_init_device.
// The results of v3_dev_unhook_io are not checked in the visible lines.
453 static int pci_deinit_device(struct vm_device * dev) {
456 for (i = 0; i < 4; i++){
457 v3_dev_unhook_io(dev, CONFIG_ADDR_PORT + i);
458 v3_dev_unhook_io(dev, CONFIG_DATA_PORT + i);
// Registers the i440FX device on the PCI device dev and fills in its identification.
// All six BAR descriptors are set to PCI_BAR_NONE with no memory hook, zero pages and
// no update callback; the device is registered as PCI_STD_DEVICE under the name i440FX
// with 0 for both numeric arguments and no callbacks or private data.
// The header is then given vendor ID 0x8086, device ID 0x1237, revision 2, class 0x06
// and subclass 0x00, and bus_num is set to 0.
// pci_init_device treats a return value of -1 as failure.
// NOTE(review): the lines between the registration call and the header stores are not
// visible; confirm the registration result is checked for NULL before it is used.
467 static int init_i440fx(struct vm_device * dev) {
468 struct pci_device * pci_dev = NULL;
469 struct v3_pci_bar bars[6];
472 for (i = 0; i < 6; i++) {
473 bars[i].type = PCI_BAR_NONE;
474 bars[i].mem_hook = 0;
475 bars[i].num_pages = 0;
476 bars[i].bar_update = NULL;
479 pci_dev = v3_pci_register_device(dev, PCI_STD_DEVICE, 0, "i440FX", 0, bars,
480 NULL, NULL, NULL, NULL);
486 pci_dev->config_header.vendor_id = 0x8086;
487 pci_dev->config_header.device_id = 0x1237;
488 pci_dev->config_header.revision = 0x0002;
489 pci_dev->config_header.subclass = 0x00; // SubClass: host2pci
490 pci_dev->config_header.class = 0x06; // Class: PCI bridge
492 pci_dev->bus_num = 0;
// Puts every entry of bus_list into its empty state: bus_num is set to the array index,
// the device tree root is cleared, and the allocation bitmap is zeroed.
498 static void init_pci_busses(struct pci_internal * pci_state) {
501 for (i = 0; i < PCI_BUS_COUNT; i++) {
502 pci_state->bus_list[i].bus_num = i;
503 pci_state->bus_list[i].devices.rb_node = NULL;
504 memset(pci_state->bus_list[i].dev_map, 0, sizeof(pci_state->bus_list[i].dev_map));
// Init callback registered in dev_ops. Clears the configuration address register,
// initialises the bus list, registers the i440FX device, and hooks the four address
// ports and four data ports (base + 0 .. base + 3) to the port handlers in this file.
// A result of -1 from init_i440fx is reported through PrintError; the statement that
// follows the message is not visible here.
// The results of v3_dev_hook_io are not checked in the visible lines.
510 static int pci_init_device(struct vm_device * dev) {
511 struct pci_internal * pci_state = (struct pci_internal *)dev->private_data;;
514 PrintDebug("pci: init_device\n");
517 // dev->vm->pci = dev; //should be in vmm_config.c
519 pci_state->addr_reg.val = 0;
521 init_pci_busses(pci_state);
523 if (init_i440fx(dev) == -1) {
524 PrintError("Could not intialize i440fx\n");
528 PrintDebug("Sizeof config header=%d\n", (int)sizeof(struct pci_config_header));
530 for (i = 0; i < 4; i++) {
531 v3_dev_hook_io(dev, CONFIG_ADDR_PORT + i, &addr_port_read, &addr_port_write);
532 v3_dev_hook_io(dev, CONFIG_DATA_PORT + i, &data_port_read, &data_port_write);
// Operation table for the PCI device; v3_create_pci passes it to v3_create_device.
// Each member points at the matching pci_*_device callback defined in this file.
539 static struct vm_device_ops dev_ops = {
540 .init = pci_init_device,
541 .deinit = pci_deinit_device,
542 .reset = pci_reset_device,
543 .start = pci_start_device,
544 .stop = pci_stop_device,
548 struct vm_device * v3_create_pci() {
549 struct pci_internal * pci_state = V3_Malloc(sizeof(struct pci_internal));
551 PrintDebug("PCI internal at %p\n",(void *)pci_state);
553 struct vm_device * device = v3_create_device("PCI", &dev_ops, pci_state);
// Initialises the mask and the config-space register of each of the six BARs of
// pci_dev according to the BAR type (register i lives at offset 0x10 + 4 * i):
//   - PCI_BAR_IO:    mask 0x0000fffd, register set to 0x00000001
//   - PCI_BAR_MEM32: mask covers the address bits above the region size
//                    (num_pages << 12) plus the low four flag bits; register set to
//                    0x00000008, with bit 3 cleared again when a mem_hook is present
//   - PCI_BAR_MEM16: reported as unsupported through PrintError
//   - PCI_BAR_NONE:  register set to 0
//   - anything else: reported as an invalid BAR type through PrintError
// v3_pci_register_device treats a return value of -1 as failure; the return statements
// are not visible in these lines.
// NOTE(review): with num_pages == 0 the MEM32 mask evaluates to just the flag bits --
// confirm callers never register a zero-sized memory BAR.
560 static inline int init_bars(struct pci_device * pci_dev) {
563 for (i = 0; i < 6; i++) {
564 int bar_offset = 0x10 + 4 * i;
566 if (pci_dev->bar[i].type == PCI_BAR_IO) {
567 pci_dev->bar[i].mask = 0x0000fffd;
568 *(uint32_t *)(pci_dev->config_space + bar_offset) = 0x00000001;
569 } else if (pci_dev->bar[i].type == PCI_BAR_MEM32) {
570 pci_dev->bar[i].mask = ~((pci_dev->bar[i].num_pages << 12) - 1);
571 pci_dev->bar[i].mask |= 0xf; // preserve the configuration flags
573 *(uint32_t *)(pci_dev->config_space + bar_offset) = 0x00000008;
575 if (pci_dev->bar[i].mem_hook) {
576 // clear the prefetchable flag...
577 *(uint8_t *)(pci_dev->config_space + bar_offset) &= ~0x00000008;
579 } else if (pci_dev->bar[i].type == PCI_BAR_MEM16) {
580 PrintError("16 Bit memory ranges not supported (reg: %d)\n", i);
581 } else if (pci_dev->bar[i].type == PCI_BAR_NONE) {
582 *(uint32_t *)(pci_dev->config_space + bar_offset) = 0x00000000;
584 PrintError("Invalid BAR type for bar #%d\n", i);
// Creates a pci_device, fills it from the arguments and attaches it to the selected bus
// of the PCI device pci.
// Visible steps: validate or auto-assign the device number (get_free_dev_num is used for
// auto assignment and -1 from it means the bus is full), refuse a number that
// get_device already finds on the bus, allocate and zero the pci_device, set the header
// type to 0x00, store bus and device number, name, owning vm_device, callbacks and
// private data, copy the six BAR descriptors and run init_bars, then insert the device
// with add_device_to_bus and dump the bus state for debugging.
// The parameter lines for bus_num, dev_num and name, the branch structure around the
// checks, and all return statements are not visible in these lines.
// NOTE(review): bus_num indexes bus_list with no range check visible here.
// NOTE(review): the dev_num > MAX_BUS_DEVICES test accepts dev_num == MAX_BUS_DEVICES --
// confirm whether that bound is intended.
// NOTE(review): strncpy with the full buffer size leaves name without a terminator when
// the source string fills the buffer.
// NOTE(review): cmd_update and ext_rom_update are stored twice with the same values.
// NOTE(review): if the error paths after the allocation (unhandled device type,
// init_bars failure) return without releasing pci_dev, the allocation leaks -- confirm.
// NOTE(review): the result of add_device_to_bus is not used in the visible lines.
596 // if dev_num == -1, auto assign
597 struct pci_device * v3_pci_register_device(struct vm_device * pci,
598 pci_device_type_t dev_type,
602 struct v3_pci_bar * bars,
603 int (*config_update)(struct pci_device * pci_dev, uint_t reg_num, int length),
604 int (*cmd_update)(struct pci_device *pci_dev, uchar_t io_enabled, uchar_t mem_enabled),
605 int (*ext_rom_update)(struct pci_device * pci_dev),
606 void * private_data) {
608 struct pci_internal * pci_state = (struct pci_internal *)pci->private_data;
609 struct pci_bus * bus = &(pci_state->bus_list[bus_num]);
610 struct pci_device * pci_dev = NULL;
613 if (dev_num > MAX_BUS_DEVICES) {
614 PrintError("Requested Invalid device number (%d)\n", dev_num);
619 if ((dev_num = get_free_dev_num(bus)) == -1) {
620 PrintError("No more available PCI slots on bus %d\n", bus->bus_num);
625 if (get_device(bus, dev_num) != NULL) {
626 PrintError("PCI Device already registered at slot %d on bus %d\n",
627 dev_num, bus->bus_num);
632 pci_dev = (struct pci_device *)V3_Malloc(sizeof(struct pci_device));
634 if (pci_dev == NULL) {
638 memset(pci_dev, 0, sizeof(struct pci_device));
643 pci_dev->config_header.header_type = 0x00;
646 PrintError("Unhandled PCI Device Type: %d\n", dev_type);
650 pci_dev->bus_num = bus_num;
651 pci_dev->dev_num = dev_num;
653 strncpy(pci_dev->name, name, sizeof(pci_dev->name));
654 pci_dev->vm_dev = pci;
656 // register update callbacks
657 pci_dev->config_update = config_update;
658 pci_dev->cmd_update = cmd_update;
659 pci_dev->ext_rom_update = ext_rom_update;
661 pci_dev->priv_data = private_data;
665 for (i = 0; i < 6; i ++){
666 pci_dev->bar[i].type = bars[i].type;
667 pci_dev->bar[i].num_pages = bars[i].num_pages;
668 pci_dev->bar[i].mem_hook = bars[i].mem_hook;
669 pci_dev->bar[i].bar_update = bars[i].bar_update;
672 if (init_bars(pci_dev) == -1) {
673 PrintError("could not initialize bar registers\n");
677 pci_dev->cmd_update = cmd_update;
678 pci_dev->ext_rom_update = ext_rom_update;
681 add_device_to_bus(bus, pci_dev);
685 pci_dump_state(pci_state);