X-Git-Url: http://v3vee.org/palacios/gitweb/gitweb.cgi?a=blobdiff_plain;f=palacios%2Fsrc%2Fpalacios%2Fvmm_direct_paging_64.h;h=baae5d54d223b792df8f25e42b85bdfeaf574009;hb=2a9554f33cc3bdaab08d59ac54d6dd1f4472285d;hp=a840c2b94564b95a1af2a2577adf4d2f43cf7727;hpb=c255ba778677e2006f1d7ebad69a8f7005747907;p=palacios.git diff --git a/palacios/src/palacios/vmm_direct_paging_64.h b/palacios/src/palacios/vmm_direct_paging_64.h index a840c2b..baae5d5 100644 --- a/palacios/src/palacios/vmm_direct_paging_64.h +++ b/palacios/src/palacios/vmm_direct_paging_64.h @@ -27,104 +27,216 @@ #include #include +// Reference: AMD Software Developer Manual Vol.2 Ch.5 "Page Translation and Protection" + +static inline int handle_passthrough_pagefault_64(struct guest_info * core, addr_t fault_addr, pf_error_t error_code) { + pml4e64_t * pml = NULL; + pdpe64_t * pdpe = NULL; + pde64_t * pde = NULL; + pde64_2MB_t * pde2mb = NULL; + pte64_t * pte = NULL; + addr_t host_addr = 0; + + int pml_index = PML4E64_INDEX(fault_addr); + int pdpe_index = PDPE64_INDEX(fault_addr); + int pde_index = PDE64_INDEX(fault_addr); + int pte_index = PTE64_INDEX(fault_addr); + + struct v3_mem_region * region = v3_get_mem_region(core->vm_info, core->cpu_id, fault_addr); + int page_size = PAGE_SIZE_4KB; + + if (region == NULL) { + PrintError("%s: invalid region, addr=%p\n", __FUNCTION__, (void *)fault_addr); + return -1; + } -static inline int handle_passthrough_pagefault_64(struct guest_info * info, - addr_t fault_addr, - pf_error_t error_code) { - pml4e64_t * pml = CR3_TO_PML4E64_VA(info->ctrl_regs.cr3); - pdpe64_t * pdpe = NULL; - pde64_t * pde = NULL; - pte64_t * pte = NULL; - addr_t host_addr = 0; - - int pml_index = PML4E64_INDEX(fault_addr); - int pdpe_index = PDPE64_INDEX(fault_addr); - int pde_index = PDE64_INDEX(fault_addr); - int pte_index = PTE64_INDEX(fault_addr); - - struct v3_shadow_region * region = v3_get_shadow_region(info, fault_addr); - - if ((region == NULL) || - (region->host_type == SHDW_REGION_INVALID)) { - PrintError("Invalid region in passthrough page fault 64, addr=%p\n", - (void *)fault_addr); - return -1; - } - - host_addr = v3_get_shadow_addr(region, fault_addr); - - //Fix up the PML entry - if (pml[pml_index].present == 0) { - pdpe = (pdpe64_t *)create_generic_pt_page(); - - pml[pml_index].present = 1; - // Set default PML Flags... - pml[pml_index].pdp_base_addr = PAGE_BASE_ADDR((addr_t)V3_PAddr(pdpe)); - } else { - pdpe = V3_VAddr((void*)BASE_TO_PAGE_ADDR(pml[pml_index].pdp_base_addr)); - } + /* Check if: + * 1. the guest is configured to use large pages and + * 2. the memory regions can be referenced by a large page + */ + if ((core->use_large_pages == 1) || (core->use_giant_pages == 1)) { + page_size = v3_get_max_page_size(core, fault_addr, LONG); + } + + PrintDebug("Using page size of %dKB\n", page_size / 1024); - // Fix up the PDPE entry - if (pdpe[pdpe_index].present == 0) { - pde = (pde64_t *)create_generic_pt_page(); + + // Lookup the correct PML address based on the PAGING MODE + if (core->shdw_pg_mode == SHADOW_PAGING) { + pml = CR3_TO_PML4E64_VA(core->ctrl_regs.cr3); + } else { + pml = CR3_TO_PML4E64_VA(core->direct_map_pt); + } + + //Fix up the PML entry + if (pml[pml_index].present == 0) { + pdpe = (pdpe64_t *)create_generic_pt_page(); - pdpe[pdpe_index].present = 1; - // Set default PDPE Flags... - pdpe[pdpe_index].pd_base_addr = PAGE_BASE_ADDR((addr_t)V3_PAddr(pde)); - } else { - pde = V3_VAddr((void*)BASE_TO_PAGE_ADDR(pdpe[pdpe_index].pd_base_addr)); - } + // Set default PML Flags... + pml[pml_index].present = 1; + pml[pml_index].writable = 1; + pml[pml_index].user_page = 1; + pml[pml_index].pdp_base_addr = PAGE_BASE_ADDR_4KB((addr_t)V3_PAddr(pdpe)); + } else { + pdpe = V3_VAddr((void*)BASE_TO_PAGE_ADDR_4KB(pml[pml_index].pdp_base_addr)); + } - // Fix up the PDE entry - if (pde[pde_index].present == 0) { - pte = (pte64_t *)create_generic_pt_page(); + // Fix up the PDPE entry + if (pdpe[pdpe_index].present == 0) { + pde = (pde64_t *)create_generic_pt_page(); + + // Set default PDPE Flags... + pdpe[pdpe_index].present = 1; + pdpe[pdpe_index].writable = 1; + pdpe[pdpe_index].user_page = 1; - pde[pde_index].present = 1; - pde[pde_index].writable = 1; - pde[pde_index].user_page = 1; + pdpe[pdpe_index].pd_base_addr = PAGE_BASE_ADDR_4KB((addr_t)V3_PAddr(pde)); + } else { + pde = V3_VAddr((void*)BASE_TO_PAGE_ADDR_4KB(pdpe[pdpe_index].pd_base_addr)); + } - pde[pde_index].pt_base_addr = PAGE_BASE_ADDR((addr_t)V3_PAddr(pte)); - } else { - pte = V3_VAddr((void*)BASE_TO_PAGE_ADDR(pde[pde_index].pt_base_addr)); - } + // Fix up the 2MiB PDE and exit here + if (page_size == PAGE_SIZE_2MB) { + pde2mb = (pde64_2MB_t *)pde; // all but these two lines are the same for PTE + pde2mb[pde_index].large_page = 1; + + if (pde2mb[pde_index].present == 0) { + pde2mb[pde_index].user_page = 1; + + if ( (region->flags.alloced == 1) && + (region->flags.read == 1)) { + // Full access + pde2mb[pde_index].present = 1; + + if (region->flags.write == 1) { + pde2mb[pde_index].writable = 1; + } else { + pde2mb[pde_index].writable = 0; + } + + if (v3_gpa_to_hpa(core, fault_addr, &host_addr) == -1) { + PrintError("Error Could not translate fault addr (%p)\n", (void *)fault_addr); + return -1; + } + + pde2mb[pde_index].page_base_addr = PAGE_BASE_ADDR_2MB(host_addr); + } else { + return region->unhandled(core, fault_addr, fault_addr, region, error_code); + } + } else { + // We fix all permissions on the first pass, + // so we only get here if its an unhandled exception + + return region->unhandled(core, fault_addr, fault_addr, region, error_code); + } + + // All done + return 0; + } + + // Continue with the 4KiB page heirarchy + + // Fix up the PDE entry + if (pde[pde_index].present == 0) { + pte = (pte64_t *)create_generic_pt_page(); + + pde[pde_index].present = 1; + pde[pde_index].writable = 1; + pde[pde_index].user_page = 1; + + pde[pde_index].pt_base_addr = PAGE_BASE_ADDR_4KB((addr_t)V3_PAddr(pte)); + } else { + pte = V3_VAddr((void*)BASE_TO_PAGE_ADDR_4KB(pde[pde_index].pt_base_addr)); + } + // Fix up the PTE entry + if (pte[pte_index].present == 0) { + pte[pte_index].user_page = 1; + + if ((region->flags.alloced == 1) && + (region->flags.read == 1)) { + // Full access + pte[pte_index].present = 1; + + if (region->flags.write == 1) { + pte[pte_index].writable = 1; + } else { + pte[pte_index].writable = 0; + } + + if (v3_gpa_to_hpa(core, fault_addr, &host_addr) == -1) { + PrintError("Error Could not translate fault addr (%p)\n", (void *)fault_addr); + return -1; + } + + pte[pte_index].page_base_addr = PAGE_BASE_ADDR_4KB(host_addr); + } else { + return region->unhandled(core, fault_addr, fault_addr, region, error_code); + } + } else { + // We fix all permissions on the first pass, + // so we only get here if its an unhandled exception - // Fix up the PTE entry - if (pte[pte_index].present == 0) { - pte[pte_index].user_page = 1; + return region->unhandled(core, fault_addr, fault_addr, region, error_code); + } - if (region->host_type == SHDW_REGION_ALLOCATED) { - // Full access - pte[pte_index].present = 1; - pte[pte_index].writable = 1; + return 0; +} - pte[pte_index].page_base_addr = PAGE_BASE_ADDR(host_addr); +static inline int invalidate_addr_64(struct guest_info * core, addr_t inv_addr) { + pml4e64_t * pml = NULL; + pdpe64_t * pdpe = NULL; + pde64_t * pde = NULL; + pte64_t * pte = NULL; - } else if (region->host_type == SHDW_REGION_WRITE_HOOK) { - // Only trap writes - pte[pte_index].present = 1; - pte[pte_index].writable = 0; - pte[pte_index].page_base_addr = PAGE_BASE_ADDR(host_addr); + // TODO: + // Call INVLPGA - } else if (region->host_type == SHDW_REGION_FULL_HOOK) { - // trap all accesses - return v3_handle_mem_full_hook(info, fault_addr, fault_addr, region, error_code); + // clear the page table entry + int pml_index = PML4E64_INDEX(inv_addr); + int pdpe_index = PDPE64_INDEX(inv_addr); + int pde_index = PDE64_INDEX(inv_addr); + int pte_index = PTE64_INDEX(inv_addr); + + // Lookup the correct PDE address based on the PAGING MODE + if (core->shdw_pg_mode == SHADOW_PAGING) { + pml = CR3_TO_PML4E64_VA(core->ctrl_regs.cr3); } else { - PrintError("Unknown Region Type...\n"); - return -1; + pml = CR3_TO_PML4E64_VA(core->direct_map_pt); + } + + if (pml[pml_index].present == 0) { + return 0; + } + + pdpe = V3_VAddr((void*)BASE_TO_PAGE_ADDR(pml[pml_index].pdp_base_addr)); + + if (pdpe[pdpe_index].present == 0) { + return 0; + } else if (pdpe[pdpe_index].large_page == 1) { // 1GiB + pdpe[pdpe_index].present = 0; + return 0; } - } - - if ( (region->host_type == SHDW_REGION_WRITE_HOOK) && - (error_code.write == 1) ) { - return v3_handle_mem_wr_hook(info, fault_addr, fault_addr, region, error_code); - } - return 0; + pde = V3_VAddr((void*)BASE_TO_PAGE_ADDR(pdpe[pdpe_index].pd_base_addr)); + + if (pde[pde_index].present == 0) { + return 0; + } else if (pde[pde_index].large_page == 1) { // 2MiB + pde[pde_index].present = 0; + return 0; + } + + pte = V3_VAddr((void*)BASE_TO_PAGE_ADDR(pde[pde_index].pt_base_addr)); + + pte[pte_index].present = 0; // 4KiB + + return 0; } + #endif