Palacios Public Git Repository

To checkout Palacios execute

  git clone http://v3vee.org/palacios/palacios.web/palacios.git
This will give you the master branch. You probably want the devel branch or one of the release branches. To switch to the devel branch, simply execute
  cd palacios
  git checkout --track -b devel origin/devel
The other branches are similar.


minor changes to organization
[palacios.git] / palacios / src / palacios / svm_handler.c
index 4c4aa2c..da85eb2 100644 (file)
 #include <palacios/vmm_hypercall.h>
 #include <palacios/vmm_cpuid.h>
 #include <palacios/vmm_direct_paging.h>
+#include <palacios/vmm_syscall_hijack.h>
 
-#ifdef CONFIG_TELEMETRY
-#include <palacios/vmm_telemetry.h>
+#ifndef V3_CONFIG_DEBUG_SVM
+#undef PrintDebug
+#define PrintDebug(fmt, args...)
 #endif
 
-
-int v3_handle_svm_exit(struct guest_info * info) {
-    vmcb_ctrl_t * guest_ctrl = 0;
-    vmcb_saved_state_t * guest_state = 0;
-    ulong_t exit_code = 0;
-    
-    guest_ctrl = GET_VMCB_CTRL_AREA((vmcb_t*)(info->vmm_data));
-    guest_state = GET_VMCB_SAVE_STATE_AREA((vmcb_t*)(info->vmm_data));
-  
-    // Update the high level state 
-    info->rip = guest_state->rip;
-    info->vm_regs.rsp = guest_state->rsp;
-    info->vm_regs.rax = guest_state->rax;
-
-    info->cpl = guest_state->cpl;
-
-    info->ctrl_regs.cr0 = guest_state->cr0;
-    info->ctrl_regs.cr2 = guest_state->cr2;
-    info->ctrl_regs.cr3 = guest_state->cr3;
-    info->ctrl_regs.cr4 = guest_state->cr4;
-    info->dbg_regs.dr6 = guest_state->dr6;
-    info->dbg_regs.dr7 = guest_state->dr7;
-    info->ctrl_regs.cr8 = guest_ctrl->guest_ctrl.V_TPR;
-    info->ctrl_regs.rflags = guest_state->rflags;
-    info->ctrl_regs.efer = guest_state->efer;
-    
-    v3_get_vmcb_segments((vmcb_t*)(info->vmm_data), &(info->segments));
-    info->cpu_mode = v3_get_vm_cpu_mode(info);
-    info->mem_mode = v3_get_vm_mem_mode(info);
-
-    exit_code = guest_ctrl->exit_code;
-
-    //    PrintDebug("SVM Exit: %s (rip=%p) (info1=%p)\n", vmexit_code_to_str(exit_code), 
-    //        (void *)(addr_t)info->rip, (void *)(addr_t)guest_ctrl->exit_info1);
-
-    if ((info->intr_state.irq_pending == 1) && (guest_ctrl->guest_ctrl.V_IRQ == 0)) {
-
-#ifdef CONFIG_DEBUG_INTERRUPTS
-       PrintDebug("INTAK cycle completed for irq %d\n", info->intr_state.irq_vector);
+#ifdef V3_CONFIG_TELEMETRY
+#include <palacios/vmm_telemetry.h>
 #endif
 
-       info->intr_state.irq_started = 1;
-       info->intr_state.irq_pending = 0;
-
-       v3_injecting_intr(info, info->intr_state.irq_vector, V3_EXTERNAL_IRQ);
-    }
 
-    if ((info->intr_state.irq_started == 1) && (guest_ctrl->exit_int_info.valid == 0)) {
-#ifdef CONFIG_DEBUG_INTERRUPTS
-       PrintDebug("Interrupt %d taken by guest\n", info->intr_state.irq_vector);
-#endif
 
-       // Interrupt was taken fully vectored
-       info->intr_state.irq_started = 0;
+int v3_handle_svm_exit(struct guest_info * info, addr_t exit_code, addr_t exit_info1, addr_t exit_info2) {
 
-    } else {
-#ifdef CONFIG_DEBUG_INTERRUPTS
-       PrintDebug("EXIT INT INFO is set (vec=%d)\n", guest_ctrl->exit_int_info.vector);
-#endif
-    }
-
-
-#ifdef CONFIG_TELEMETRY
-    if (info->enable_telemetry) {
+#ifdef V3_CONFIG_TELEMETRY
+    if (info->vm_info->enable_telemetry) {
        v3_telemetry_start_exit(info);
     }
 #endif
@@ -111,16 +59,16 @@ int v3_handle_svm_exit(struct guest_info * info) {
 
     switch (exit_code) {
        case VMEXIT_IOIO: {
-           struct svm_io_info * io_info = (struct svm_io_info *)&(guest_ctrl->exit_info1);
+           struct svm_io_info * io_info = (struct svm_io_info *)&(exit_info1);
 
            if (io_info->type == 0) {
                if (io_info->str) {
 
-                   if (v3_handle_svm_io_outs(info) == -1 ) {
+                   if (v3_handle_svm_io_outs(info, io_info) == -1 ) {
                        return -1;
                    }
                } else {
-                   if (v3_handle_svm_io_out(info) == -1) {
+                   if (v3_handle_svm_io_out(info, io_info) == -1) {
                        return -1;
                    }
                }
@@ -128,24 +76,27 @@ int v3_handle_svm_exit(struct guest_info * info) {
            } else {
 
                if (io_info->str) {
-                   if (v3_handle_svm_io_ins(info) == -1) {
+                   if (v3_handle_svm_io_ins(info, io_info) == -1) {
                        return -1;
                    }
                } else {
-                   if (v3_handle_svm_io_in(info) == -1) {
+                   if (v3_handle_svm_io_in(info, io_info) == -1) {
                        return -1;
                    }
                }
            }
+
+           info->rip = exit_info2;
+
            break;
        }
        case VMEXIT_MSR:
 
-           if (guest_ctrl->exit_info1 == 0) {
+           if (exit_info1 == 0) {
                if (v3_handle_msr_read(info) == -1) {
                    return -1;
                }
-           } else if (guest_ctrl->exit_info1 == 1) {
+           } else if (exit_info1 == 1) {
                if (v3_handle_msr_write(info) == -1) {
                    return -1;
                }
@@ -164,7 +115,7 @@ int v3_handle_svm_exit(struct guest_info * info) {
 
            break;
        case VMEXIT_CR0_WRITE: 
-#ifdef CONFIG_DEBUG_CTRL_REGS
+#ifdef V3_CONFIG_DEBUG_CTRL_REGS
            PrintDebug("CR0 Write\n");
 #endif
            if (v3_handle_cr0_write(info) == -1) {
@@ -172,7 +123,7 @@ int v3_handle_svm_exit(struct guest_info * info) {
            }
            break;
        case VMEXIT_CR0_READ: 
-#ifdef CONFIG_DEBUG_CTRL_REGS
+#ifdef V3_CONFIG_DEBUG_CTRL_REGS
            PrintDebug("CR0 Read\n");
 #endif
            if (v3_handle_cr0_read(info) == -1) {
@@ -180,15 +131,16 @@ int v3_handle_svm_exit(struct guest_info * info) {
            }
            break;
        case VMEXIT_CR3_WRITE: 
-#ifdef CONFIG_DEBUG_CTRL_REGS
+#ifdef V3_CONFIG_DEBUG_CTRL_REGS
            PrintDebug("CR3 Write\n");
 #endif
            if (v3_handle_cr3_write(info) == -1) {
                return -1;
            }    
+
            break;
        case  VMEXIT_CR3_READ: 
-#ifdef CONFIG_DEBUG_CTRL_REGS
+#ifdef V3_CONFIG_DEBUG_CTRL_REGS
            PrintDebug("CR3 Read\n");
 #endif
            if (v3_handle_cr3_read(info) == -1) {
@@ -196,7 +148,7 @@ int v3_handle_svm_exit(struct guest_info * info) {
            }
            break;
        case VMEXIT_CR4_WRITE: 
-#ifdef CONFIG_DEBUG_CTRL_REGS
+#ifdef V3_CONFIG_DEBUG_CTRL_REGS
            PrintDebug("CR4 Write\n");
 #endif
            if (v3_handle_cr4_write(info) == -1) {
@@ -204,7 +156,7 @@ int v3_handle_svm_exit(struct guest_info * info) {
            }    
            break;
        case  VMEXIT_CR4_READ: 
-#ifdef CONFIG_DEBUG_CTRL_REGS
+#ifdef V3_CONFIG_DEBUG_CTRL_REGS
            PrintDebug("CR4 Read\n");
 #endif
            if (v3_handle_cr4_read(info) == -1) {
@@ -212,9 +164,9 @@ int v3_handle_svm_exit(struct guest_info * info) {
            }
            break;
        case VMEXIT_EXCP14: {
-           addr_t fault_addr = guest_ctrl->exit_info2;
-           pf_error_t * error_code = (pf_error_t *)&(guest_ctrl->exit_info1);
-#ifdef CONFIG_DEBUG_SHADOW_PAGING
+           addr_t fault_addr = exit_info2;
+           pf_error_t * error_code = (pf_error_t *)&(exit_info1);
+#ifdef V3_CONFIG_DEBUG_SHADOW_PAGING
            PrintDebug("PageFault at %p (error=%d)\n", 
                       (void *)fault_addr, *(uint_t *)error_code);
 #endif
@@ -229,8 +181,8 @@ int v3_handle_svm_exit(struct guest_info * info) {
            break;
        } 
        case VMEXIT_NPF: {
-           addr_t fault_addr = guest_ctrl->exit_info2;
-           pf_error_t * error_code = (pf_error_t *)&(guest_ctrl->exit_info1);
+           addr_t fault_addr = exit_info2;
+           pf_error_t * error_code = (pf_error_t *)&(exit_info1);
 
            if (info->shdw_pg_mode == NESTED_PAGING) {
                if (v3_handle_nested_pagefault(info, fault_addr, *error_code) == -1) {
@@ -242,9 +194,18 @@ int v3_handle_svm_exit(struct guest_info * info) {
                    }
            break;
            }
+    case VMEXIT_SWINT:
+#ifdef CONFIG_DEBUG_INTERRUPTS
+        PrintDebug("Intercepted SW Interrupt\n");
+#endif
+        if (v3_handle_swintr(info) == -1) {
+            PrintError("Error handling software interrupt\n");
+            return -1;
+        }
+        break;
        case VMEXIT_INVLPG: 
            if (info->shdw_pg_mode == SHADOW_PAGING) {
-#ifdef CONFIG_DEBUG_SHADOW_PAGING
+#ifdef V3_CONFIG_DEBUG_SHADOW_PAGING
                PrintDebug("Invlpg\n");
 #endif
                if (v3_handle_shadow_invlpg(info) == -1) {
@@ -256,14 +217,20 @@ int v3_handle_svm_exit(struct guest_info * info) {
            /* 
             * Hypercall 
             */
-               
+
+           // VMMCALL is a 3 byte op
+           // We do this early because some hypercalls can change the rip...
+           info->rip += 3;         
+
            if (v3_handle_hypercall(info) == -1) {
+               PrintError("Error handling Hypercall\n");
                return -1;
            }
-               
-           // VMMCALL is a 3 byte op
-           info->rip += 3;
-           break;          
+
+           break;      
+       case VMEXIT_NMI:
+           // handled by interrupt dispatcher
+           break;
        case VMEXIT_INTR:
            // handled by interrupt dispatch earlier
            break;
@@ -271,7 +238,7 @@ int v3_handle_svm_exit(struct guest_info * info) {
            //   handle_svm_smi(info); // ignored for now
            break;
        case VMEXIT_HLT:
-#ifdef CONFIG_DEBUG_HALT
+#ifdef V3_CONFIG_DEBUG_HALT
            PrintDebug("Guest halted\n");
 #endif
            if (v3_handle_halt(info) == -1) {
@@ -279,22 +246,45 @@ int v3_handle_svm_exit(struct guest_info * info) {
            }
            break;
        case VMEXIT_PAUSE:
-           //PrintDebug("Guest paused\n");
+           //      PrintDebug("Guest paused\n");
            if (v3_handle_svm_pause(info) == -1) { 
                return -1;
            }
            break;
        case VMEXIT_WBINVD:   
-#ifdef CONFIG_DEBUG_EMULATOR
+#ifdef V3_CONFIG_DEBUG_EMULATOR
            PrintDebug("WBINVD\n");
 #endif
            if (v3_handle_svm_wbinvd(info) == -1) { 
                return -1;
            }
            break;
-       
+        case VMEXIT_RDTSC:
+#ifdef V3_CONFIG_DEBUG_TIME
+           PrintDebug("RDTSC/RDTSCP\n");
+#endif 
+           if (v3_handle_rdtsc(info) == -1) {
+               PrintError("Error Handling RDTSC instruction\n");
+               return -1;
+           }
+           break;
+        case VMEXIT_RDTSCP:
+#ifdef V3_CONFIG_DEBUG_TIME
+           PrintDebug("RDTSCP\n");
+#endif 
+           if (v3_handle_rdtscp(info) == -1) {
+               PrintError("Error Handling RDTSCP instruction\n");
+               return -1;
+           }
+           break;
+       case VMEXIT_SHUTDOWN:
+           PrintDebug("Guest-initiated shutdown\n");
 
+           info->vm_info->run_state = VM_STOPPED;
 
+           // Force exit on other cores
+
+           break;
 
 
            /* Exits Following this line are NOT HANDLED */
@@ -304,22 +294,22 @@ int v3_handle_svm_exit(struct guest_info * info) {
 
            addr_t rip_addr;
            
-           PrintDebug("Unhandled SVM Exit: %s\n", vmexit_code_to_str(exit_code));
+           PrintError("Unhandled SVM Exit: %s\n", vmexit_code_to_str(exit_code));
            
-           rip_addr = get_addr_linear(info, guest_state->rip, &(info->segments.cs));
+           rip_addr = get_addr_linear(info, info->rip, &(info->segments.cs));
            
            
            PrintError("SVM Returned:(VMCB=%p)\n", (void *)(info->vmm_data)); 
-           PrintError("RIP: %p\n", (void *)(addr_t)(guest_state->rip));
+           PrintError("RIP: %p\n", (void *)(addr_t)(info->rip));
            PrintError("RIP Linear: %p\n", (void *)(addr_t)(rip_addr));
            
            PrintError("SVM Returned: Exit Code: %p\n", (void *)(addr_t)exit_code); 
            
-           PrintError("io_info1 low = 0x%.8x\n", *(uint_t*)&(guest_ctrl->exit_info1));
-           PrintError("io_info1 high = 0x%.8x\n", *(uint_t *)(((uchar_t *)&(guest_ctrl->exit_info1)) + 4));
+           PrintError("io_info1 low = 0x%.8x\n", *(uint_t*)&(exit_info1));
+           PrintError("io_info1 high = 0x%.8x\n", *(uint_t *)(((uchar_t *)&(exit_info1)) + 4));
            
-           PrintError("io_info2 low = 0x%.8x\n", *(uint_t*)&(guest_ctrl->exit_info2));
-           PrintError("io_info2 high = 0x%.8x\n", *(uint_t *)(((uchar_t *)&(guest_ctrl->exit_info2)) + 4));
+           PrintError("io_info2 low = 0x%.8x\n", *(uint_t*)&(exit_info2));
+           PrintError("io_info2 high = 0x%.8x\n", *(uint_t *)(((uchar_t *)&(exit_info2)) + 4));
            
            
            if (info->shdw_pg_mode == SHADOW_PAGING) {
@@ -332,102 +322,13 @@ int v3_handle_svm_exit(struct guest_info * info) {
     }
     // END OF SWITCH (EXIT_CODE)
 
-#ifdef CONFIG_TELEMETRY
-    if (info->enable_telemetry) {
+#ifdef V3_CONFIG_TELEMETRY
+    if (info->vm_info->enable_telemetry) {
        v3_telemetry_end_exit(info, exit_code);
     }
 #endif
 
 
-    if (v3_excp_pending(info)) {
-       uint_t excp = v3_get_excp_number(info);
-       
-       guest_ctrl->EVENTINJ.type = SVM_INJECTION_EXCEPTION;
-       
-       if (info->excp_state.excp_error_code_valid) {
-           guest_ctrl->EVENTINJ.error_code = info->excp_state.excp_error_code;
-           guest_ctrl->EVENTINJ.ev = 1;
-#ifdef CONFIG_DEBUG_INTERRUPTS
-           PrintDebug("Injecting exception %d with error code %x\n", excp, guest_ctrl->EVENTINJ.error_code);
-#endif
-       }
-       
-       guest_ctrl->EVENTINJ.vector = excp;
-       
-       guest_ctrl->EVENTINJ.valid = 1;
-#ifdef CONFIG_DEBUG_INTERRUPTS
-       PrintDebug("Injecting Exception %d (EIP=%p)\n", 
-                  guest_ctrl->EVENTINJ.vector, 
-                  (void *)(addr_t)info->rip);
-#endif
-       v3_injecting_excp(info, excp);
-    } else if (info->intr_state.irq_started == 1) {
-#ifdef CONFIG_DEBUG_INTERRUPTS
-       PrintDebug("IRQ pending from previous injection\n");
-#endif
-       guest_ctrl->guest_ctrl.V_IRQ = 1;
-       guest_ctrl->guest_ctrl.V_INTR_VECTOR = info->intr_state.irq_vector;
-       guest_ctrl->guest_ctrl.V_IGN_TPR = 1;
-       guest_ctrl->guest_ctrl.V_INTR_PRIO = 0xf;
-
-    } else {
-       switch (v3_intr_pending(info)) {
-           case V3_EXTERNAL_IRQ: {
-               uint32_t irq = v3_get_intr(info);
-
-               guest_ctrl->guest_ctrl.V_IRQ = 1;
-               guest_ctrl->guest_ctrl.V_INTR_VECTOR = irq;
-               guest_ctrl->guest_ctrl.V_IGN_TPR = 1;
-               guest_ctrl->guest_ctrl.V_INTR_PRIO = 0xf;
-
-#ifdef CONFIG_DEBUG_INTERRUPTS
-               PrintDebug("Injecting Interrupt %d (EIP=%p)\n", 
-                          guest_ctrl->guest_ctrl.V_INTR_VECTOR, 
-                          (void *)(addr_t)info->rip);
-#endif
-
-               info->intr_state.irq_pending = 1;
-               info->intr_state.irq_vector = irq;
-               
-               break;
-           }
-           case V3_NMI:
-               guest_ctrl->EVENTINJ.type = SVM_INJECTION_NMI;
-               break;
-           case V3_SOFTWARE_INTR:
-               guest_ctrl->EVENTINJ.type = SVM_INJECTION_SOFT_INTR;
-               break;
-           case V3_VIRTUAL_IRQ:
-               guest_ctrl->EVENTINJ.type = SVM_INJECTION_IRQ;
-               break;
-
-           case V3_INVALID_INTR:
-           default:
-               break;
-       }
-       
-    }
-
-
-    guest_state->cr0 = info->ctrl_regs.cr0;
-    guest_state->cr2 = info->ctrl_regs.cr2;
-    guest_state->cr3 = info->ctrl_regs.cr3;
-    guest_state->cr4 = info->ctrl_regs.cr4;
-    guest_state->dr6 = info->dbg_regs.dr6;
-    guest_state->dr7 = info->dbg_regs.dr7;
-    guest_ctrl->guest_ctrl.V_TPR = info->ctrl_regs.cr8 & 0xff;
-    guest_state->rflags = info->ctrl_regs.rflags;
-    guest_state->efer = info->ctrl_regs.efer;
-    
-    guest_state->cpl = info->cpl;
-
-    guest_state->rax = info->vm_regs.rax;
-    guest_state->rip = info->rip;
-    guest_state->rsp = info->vm_regs.rsp;
-
-
-    v3_set_vmcb_segments((vmcb_t*)(info->vmm_data), &(info->segments));
-
     if (exit_code == VMEXIT_INTR) {
        //PrintDebug("INTR ret IP = %x\n", guest_state->rip);
     }