/* * This file is part of the Palacios Virtual Machine Monitor developed * by the V3VEE Project with funding from the United States National * Science Foundation and the Department of Energy. * * The V3VEE Project is a joint project between Northwestern University * and the University of New Mexico. You can find out more at * http://www.v3vee.org * * Copyright (c) 2008, Jack Lange * Copyright (c) 2008, The V3VEE Project * All rights reserved. * * Author: Jack Lange * * This is free software. You are permitted to use, * redistribute, and modify it as specified in the file "V3VEE_LICENSE". */ #include #include #include void delete_page_tables_pde32(pde32_t * pde) { int i;//, j; if (pde == NULL) { return; } for (i = 0; (i < MAX_PDE32_ENTRIES); i++) { if (pde[i].present) { // We double cast, first to an addr_t to handle 64 bit issues, then to the pointer PrintDebug("PTE base addr %x \n", pde[i].pt_base_addr); pte32_t * pte = (pte32_t *)((addr_t)(uint_t)(pde[i].pt_base_addr << PAGE_POWER)); /* for (j = 0; (j < MAX_PTE32_ENTRIES); j++) { if ((pte[j].present)) { os_hooks->free_page((void *)(pte[j].page_base_addr << PAGE_POWER)); } } */ PrintDebug("Deleting PTE %d (%p)\n", i, pte); V3_FreePage(pte); } } PrintDebug("Deleting PDE (%p)\n", pde); V3_FreePage(V3_PAddr(pde)); } int pt32_lookup(pde32_t * pd, addr_t vaddr, addr_t * paddr) { addr_t pde_entry; pde32_entry_type_t pde_entry_type; if (pd == 0) { return -1; } pde_entry_type = pde32_lookup(pd, vaddr, &pde_entry); if (pde_entry_type == PDE32_ENTRY_PTE32) { return pte32_lookup((pte32_t *)pde_entry, vaddr, paddr); } else if (pde_entry_type == PDE32_ENTRY_LARGE_PAGE) { *paddr = pde_entry; return 0; } return -1; } /* We can't do a full lookup because we don't know what context the page tables are in... * The entry addresses could be pointing to either guest physical memory or host physical memory * Instead we just return the entry address, and a flag to show if it points to a pte or a large page... */ pde32_entry_type_t pde32_lookup(pde32_t * pd, addr_t addr, addr_t * entry) { pde32_t * pde_entry = &(pd[PDE32_INDEX(addr)]); if (!pde_entry->present) { *entry = 0; return PDE32_ENTRY_NOT_PRESENT; } else { if (pde_entry->large_page) { pde32_4MB_t * large_pde = (pde32_4MB_t *)pde_entry; *entry = PDE32_4MB_T_ADDR(*large_pde); *entry += PD32_4MB_PAGE_OFFSET(addr); return PDE32_ENTRY_LARGE_PAGE; } else { *entry = PDE32_T_ADDR(*pde_entry); return PDE32_ENTRY_PTE32; } } return PDE32_ENTRY_NOT_PRESENT; } /* Takes a virtual addr (addr) and returns the physical addr (entry) as defined in the page table */ int pte32_lookup(pte32_t * pt, addr_t addr, addr_t * entry) { pte32_t * pte_entry = &(pt[PTE32_INDEX(addr)]); if (!pte_entry->present) { *entry = 0; PrintDebug("Lookup at non present page (index=%d)\n", PTE32_INDEX(addr)); return -1; } else { *entry = PTE32_T_ADDR(*pte_entry) + PT32_PAGE_OFFSET(addr); return 0; } return -1; } pt_access_status_t can_access_pde32(pde32_t * pde, addr_t addr, pf_error_t access_type) { pde32_t * entry = &pde[PDE32_INDEX(addr)]; if (entry->present == 0) { return PT_ENTRY_NOT_PRESENT; } else if ((entry->writable == 0) && (access_type.write == 1)) { return PT_WRITE_ERROR; } else if ((entry->user_page == 0) && (access_type.user == 1)) { // Check CR0.WP? return PT_USER_ERROR; } return PT_ACCESS_OK; } pt_access_status_t can_access_pte32(pte32_t * pte, addr_t addr, pf_error_t access_type) { pte32_t * entry = &pte[PTE32_INDEX(addr)]; if (entry->present == 0) { return PT_ENTRY_NOT_PRESENT; } else if ((entry->writable == 0) && (access_type.write == 1)) { return PT_WRITE_ERROR; } else if ((entry->user_page == 0) && (access_type.user == 1)) { // Check CR0.WP? return PT_USER_ERROR; } return PT_ACCESS_OK; } /* We generate a page table to correspond to a given memory layout * pulling pages from the mem_list when necessary * If there are any gaps in the layout, we add them as unmapped pages */ pde32_t * create_passthrough_pts_32(struct guest_info * guest_info) { addr_t current_page_addr = 0; int i, j; struct shadow_map * map = &(guest_info->mem_map); pde32_t * pde = V3_VAddr(V3_AllocPages(1)); for (i = 0; i < MAX_PDE32_ENTRIES; i++) { int pte_present = 0; pte32_t * pte = V3_VAddr(V3_AllocPages(1)); for (j = 0; j < MAX_PTE32_ENTRIES; j++) { struct shadow_region * region = get_shadow_region_by_addr(map, current_page_addr); if (!region || (region->host_type == HOST_REGION_HOOK) || (region->host_type == HOST_REGION_UNALLOCATED) || (region->host_type == HOST_REGION_MEMORY_MAPPED_DEVICE) || (region->host_type == HOST_REGION_REMOTE) || (region->host_type == HOST_REGION_SWAPPED)) { pte[j].present = 0; pte[j].writable = 0; pte[j].user_page = 0; pte[j].write_through = 0; pte[j].cache_disable = 0; pte[j].accessed = 0; pte[j].dirty = 0; pte[j].pte_attr = 0; pte[j].global_page = 0; pte[j].vmm_info = 0; pte[j].page_base_addr = 0; } else { addr_t host_addr; pte[j].present = 1; pte[j].writable = 1; pte[j].user_page = 1; pte[j].write_through = 0; pte[j].cache_disable = 0; pte[j].accessed = 0; pte[j].dirty = 0; pte[j].pte_attr = 0; pte[j].global_page = 0; pte[j].vmm_info = 0; if (guest_pa_to_host_pa(guest_info, current_page_addr, &host_addr) == -1) { // BIG ERROR // PANIC return NULL; } pte[j].page_base_addr = host_addr >> 12; pte_present = 1; } current_page_addr += PAGE_SIZE; } if (pte_present == 0) { V3_FreePage(V3_PAddr(pte)); pde[i].present = 0; pde[i].writable = 0; pde[i].user_page = 0; pde[i].write_through = 0; pde[i].cache_disable = 0; pde[i].accessed = 0; pde[i].reserved = 0; pde[i].large_page = 0; pde[i].global_page = 0; pde[i].vmm_info = 0; pde[i].pt_base_addr = 0; } else { pde[i].present = 1; pde[i].writable = 1; pde[i].user_page = 1; pde[i].write_through = 0; pde[i].cache_disable = 0; pde[i].accessed = 0; pde[i].reserved = 0; pde[i].large_page = 0; pde[i].global_page = 0; pde[i].vmm_info = 0; pde[i].pt_base_addr = PAGE_ALIGNED_ADDR((addr_t)V3_PAddr(pte)); } } return pde; } pml4e64_t * create_passthrough_pts_64(struct guest_info * info) { addr_t current_page_addr = 0; int i, j, k, m; struct shadow_map * map = &(info->mem_map); pml4e64_t * pml = V3_VAddr(V3_AllocPages(1)); for (i = 0; i < 1; i++) { int pdpe_present = 0; pdpe64_t * pdpe = V3_VAddr(V3_AllocPages(1)); for (j = 0; j < 1; j++) { int pde_present = 0; pde64_t * pde = V3_VAddr(V3_AllocPages(1)); for (k = 0; k < MAX_PDE64_ENTRIES; k++) { int pte_present = 0; pte64_t * pte = V3_VAddr(V3_AllocPages(1)); for (m = 0; m < MAX_PTE64_ENTRIES; m++) { struct shadow_region * region = get_shadow_region_by_addr(map, current_page_addr); if (!region || (region->host_type == HOST_REGION_HOOK) || (region->host_type == HOST_REGION_UNALLOCATED) || (region->host_type == HOST_REGION_MEMORY_MAPPED_DEVICE) || (region->host_type == HOST_REGION_REMOTE) || (region->host_type == HOST_REGION_SWAPPED)) { pte[m].present = 0; pte[m].writable = 0; pte[m].user_page = 0; pte[m].write_through = 0; pte[m].cache_disable = 0; pte[m].accessed = 0; pte[m].dirty = 0; pte[m].pte_attr = 0; pte[m].global_page = 0; pte[m].vmm_info = 0; pte[m].page_base_addr = 0; } else { addr_t host_addr; pte[m].present = 1; pte[m].writable = 1; pte[m].user_page = 1; pte[m].write_through = 0; pte[m].cache_disable = 0; pte[m].accessed = 0; pte[m].dirty = 0; pte[m].pte_attr = 0; pte[m].global_page = 0; pte[m].vmm_info = 0; if (guest_pa_to_host_pa(info, current_page_addr, &host_addr) == -1) { // BIG ERROR // PANIC return NULL; } pte[m].page_base_addr = PTE64_BASE_ADDR(host_addr); //PrintPTE64(current_page_addr, &(pte[m])); pte_present = 1; } current_page_addr += PAGE_SIZE; } if (pte_present == 0) { V3_FreePage(V3_PAddr(pte)); pde[k].present = 0; pde[k].writable = 0; pde[k].user_page = 0; pde[k].write_through = 0; pde[k].cache_disable = 0; pde[k].accessed = 0; pde[k].reserved = 0; pde[k].large_page = 0; //pde[k].global_page = 0; pde[k].vmm_info = 0; pde[k].pt_base_addr = 0; } else { pde[k].present = 1; pde[k].writable = 1; pde[k].user_page = 1; pde[k].write_through = 0; pde[k].cache_disable = 0; pde[k].accessed = 0; pde[k].reserved = 0; pde[k].large_page = 0; //pde[k].global_page = 0; pde[k].vmm_info = 0; pde[k].pt_base_addr = PAGE_ALIGNED_ADDR((addr_t)V3_PAddr(pte)); pde_present = 1; } } if (pde_present == 0) { V3_FreePage(V3_PAddr(pde)); pdpe[j].present = 0; pdpe[j].writable = 0; pdpe[j].user_page = 0; pdpe[j].write_through = 0; pdpe[j].cache_disable = 0; pdpe[j].accessed = 0; pdpe[j].reserved = 0; pdpe[j].large_page = 0; //pdpe[j].global_page = 0; pdpe[j].vmm_info = 0; pdpe[j].pd_base_addr = 0; } else { pdpe[j].present = 1; pdpe[j].writable = 1; pdpe[j].user_page = 1; pdpe[j].write_through = 0; pdpe[j].cache_disable = 0; pdpe[j].accessed = 0; pdpe[j].reserved = 0; pdpe[j].large_page = 0; //pdpe[j].global_page = 0; pdpe[j].vmm_info = 0; pdpe[j].pd_base_addr = PAGE_ALIGNED_ADDR((addr_t)V3_PAddr(pde)); pdpe_present = 1; } } PrintDebug("PML index=%d\n", i); if (pdpe_present == 0) { V3_FreePage(V3_PAddr(pdpe)); pml[i].present = 0; pml[i].writable = 0; pml[i].user_page = 0; pml[i].write_through = 0; pml[i].cache_disable = 0; pml[i].accessed = 0; pml[i].reserved = 0; //pml[i].large_page = 0; //pml[i].global_page = 0; pml[i].vmm_info = 0; pml[i].pdp_base_addr = 0; } else { pml[i].present = 1; pml[i].writable = 1; pml[i].user_page = 1; pml[i].write_through = 0; pml[i].cache_disable = 0; pml[i].accessed = 0; pml[i].reserved = 0; //pml[i].large_page = 0; //pml[i].global_page = 0; pml[i].vmm_info = 0; pml[i].pdp_base_addr = PAGE_ALIGNED_ADDR((addr_t)V3_PAddr(pdpe)); } } return pml; } void PrintPDE32(addr_t virtual_address, pde32_t * pde) { PrintDebug("PDE %p -> %p : present=%x, writable=%x, user=%x, wt=%x, cd=%x, accessed=%x, reserved=%x, largePages=%x, globalPage=%x, kernelInfo=%x\n", (void *)virtual_address, (void *)(addr_t) (pde->pt_base_addr << PAGE_POWER), pde->present, pde->writable, pde->user_page, pde->write_through, pde->cache_disable, pde->accessed, pde->reserved, pde->large_page, pde->global_page, pde->vmm_info); } void PrintPTE32(addr_t virtual_address, pte32_t * pte) { PrintDebug("PTE %p -> %p : present=%x, writable=%x, user=%x, wt=%x, cd=%x, accessed=%x, dirty=%x, pteAttribute=%x, globalPage=%x, vmm_info=%x\n", (void *)virtual_address, (void*)(addr_t)(pte->page_base_addr << PAGE_POWER), pte->present, pte->writable, pte->user_page, pte->write_through, pte->cache_disable, pte->accessed, pte->dirty, pte->pte_attr, pte->global_page, pte->vmm_info); } void PrintPDE64(addr_t virtual_address, pde64_t * pde) { PrintDebug("PDE64 %p -> %p : present=%x, writable=%x, user=%x, wt=%x, cd=%x, accessed=%x, reserved=%x, largePages=%x, globalPage=%x, kernelInfo=%x\n", (void *)virtual_address, (void *)(addr_t) (pde->pt_base_addr << PAGE_POWER), pde->present, pde->writable, pde->user_page, pde->write_through, pde->cache_disable, pde->accessed, pde->reserved, pde->large_page, 0,//pde->global_page, pde->vmm_info); } void PrintPTE64(addr_t virtual_address, pte64_t * pte) { PrintDebug("PTE64 %p -> %p : present=%x, writable=%x, user=%x, wt=%x, cd=%x, accessed=%x, dirty=%x, pteAttribute=%x, globalPage=%x, vmm_info=%x\n", (void *)virtual_address, (void*)(addr_t)(pte->page_base_addr << PAGE_POWER), pte->present, pte->writable, pte->user_page, pte->write_through, pte->cache_disable, pte->accessed, pte->dirty, pte->pte_attr, pte->global_page, pte->vmm_info); } void PrintPD32(pde32_t * pde) { int i; PrintDebug("Page Directory at %p:\n", pde); for (i = 0; (i < MAX_PDE32_ENTRIES); i++) { if ( pde[i].present) { PrintPDE32((addr_t)(PAGE_SIZE * MAX_PTE32_ENTRIES * i), &(pde[i])); } } } void PrintPT32(addr_t starting_address, pte32_t * pte) { int i; PrintDebug("Page Table at %p:\n", pte); for (i = 0; (i < MAX_PTE32_ENTRIES) ; i++) { if (pte[i].present) { PrintPTE32(starting_address + (PAGE_SIZE * i), &(pte[i])); } } } void PrintDebugPageTables(pde32_t * pde) { int i; PrintDebug("Dumping the pages starting with the pde page at %p\n", pde); for (i = 0; (i < MAX_PDE32_ENTRIES); i++) { if (pde[i].present) { PrintPDE32((addr_t)(PAGE_SIZE * MAX_PTE32_ENTRIES * i), &(pde[i])); PrintPT32((addr_t)(PAGE_SIZE * MAX_PTE32_ENTRIES * i), (pte32_t *)V3_VAddr((void *)(addr_t)(pde[i].pt_base_addr << PAGE_POWER))); } } }