1 | ; $Id: CPUMAllA.asm 5999 2007-12-07 15:05:06Z vboxsync $
|
---|
2 | ;; @file
|
---|
3 | ; CPUM - Guest Context Assembly Routines.
|
---|
4 | ;
|
---|
5 |
|
---|
6 | ;
|
---|
7 | ; Copyright (C) 2006-2007 innotek GmbH
|
---|
8 | ;
|
---|
9 | ; This file is part of VirtualBox Open Source Edition (OSE), as
|
---|
10 | ; available from http://www.virtualbox.org. This file is free software;
|
---|
11 | ; you can redistribute it and/or modify it under the terms of the GNU
|
---|
12 | ; General Public License (GPL) as published by the Free Software
|
---|
13 | ; Foundation, in version 2 as it comes in the "COPYING" file of the
|
---|
14 | ; VirtualBox OSE distribution. VirtualBox OSE is distributed in the
|
---|
15 | ; hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
|
---|
16 | ;
|
---|
17 |
|
---|
18 | ;*******************************************************************************
|
---|
19 | ;* Header Files *
|
---|
20 | ;*******************************************************************************
|
---|
21 | %include "VBox/asmdefs.mac"
|
---|
22 | %include "VBox/vm.mac"
|
---|
23 | %include "VBox/err.mac"
|
---|
24 | %include "VBox/stam.mac"
|
---|
25 | %include "CPUMInternal.mac"
|
---|
26 | %include "VBox/x86.mac"
|
---|
27 | %include "VBox/cpum.mac"
|
---|
28 |
|
---|
29 | %ifdef IN_RING3
|
---|
30 | %error "The jump table doesn't link on leopard."
|
---|
31 | %endif
|
---|
32 |
|
---|
33 | ;
|
---|
34 | ; Enables write protection of Hypervisor memory pages.
|
---|
35 | ; !note! Must be commented out for Trap8 debug handler.
|
---|
36 | ;
|
---|
37 | %define ENABLE_WRITE_PROTECTION 1
|
---|
38 |
|
---|
39 | ;; @def CPUM_REG
|
---|
40 | ; The register which we load the CPUM pointer into.
|
---|
41 | %ifdef RT_ARCH_AMD64
|
---|
42 | %define CPUM_REG rdx
|
---|
43 | %else
|
---|
44 | %define CPUM_REG edx
|
---|
45 | %endif
|
---|
46 |
|
---|
47 | BEGINCODE
|
---|
48 |
|
---|
49 |
|
---|
50 | ;;
|
---|
51 | ; Handles lazy FPU saving and restoring.
|
---|
52 | ;
|
---|
53 | ; This handler will implement lazy fpu (sse/mmx/stuff) saving.
|
---|
54 | ; Two actions may be taken in this handler since the Guest OS may
|
---|
55 | ; be doing lazy fpu switching. So, we'll have to generate those
|
---|
56 | ; traps which the Guest CPU CTX shall have according to the
|
---|
57 | ; its CR0 flags. If no traps for the Guest OS, we'll save the host
|
---|
58 | ; context and restore the guest context.
|
---|
59 | ;
|
---|
60 | ; @returns 0 if caller should continue execution.
|
---|
61 | ; @returns VINF_EM_RAW_GUEST_TRAP if a guest trap should be generated.
|
---|
62 | ; @param pCPUM x86:[esp+4] GCC:rdi MSC:rcx CPUM pointer
|
---|
63 | ;
|
---|
64 | align 16
|
---|
65 | BEGINPROC CPUMHandleLazyFPUAsm
|
---|
66 | ;
|
---|
67 | ; Figure out what to do.
|
---|
68 | ;
|
---|
69 | ; There are two basic actions:
|
---|
70 | ; 1. Save host fpu and restore guest fpu.
|
---|
71 | ; 2. Generate guest trap.
|
---|
72 | ;
|
---|
73 | ; When entering the hypervisor we'll always enable MP (for proper wait
|
---|
74 | ; trapping) and TS (for intercepting all fpu/mmx/sse stuff). The EM flag
|
---|
75 | ; is taken from the guest OS in order to get proper SSE handling.
|
---|
76 | ;
|
---|
77 | ;
|
---|
78 | ; Actions taken depending on the guest CR0 flags:
|
---|
79 | ;
|
---|
80 | ; 3 2 1
|
---|
81 | ; TS | EM | MP | FPUInstr | WAIT :: VMM Action
|
---|
82 | ; ------------------------------------------------------------------------
|
---|
83 | ; 0 | 0 | 0 | Exec | Exec :: Clear TS & MP, Save HC, Load GC.
|
---|
84 | ; 0 | 0 | 1 | Exec | Exec :: Clear TS, Save HC, Load GC.
|
---|
85 | ; 0 | 1 | 0 | #NM | Exec :: Clear TS & MP, Save HC, Load GC;
|
---|
86 | ; 0 | 1 | 1 | #NM | Exec :: Clear TS, Save HC, Load GC.
|
---|
87 | ; 1 | 0 | 0 | #NM | Exec :: Clear MP, Save HC, Load GC. (EM is already cleared.)
|
---|
88 | ; 1 | 0 | 1 | #NM | #NM :: Go to host taking trap there.
|
---|
89 | ; 1 | 1 | 0 | #NM | Exec :: Clear MP, Save HC, Load GC. (EM is already set.)
|
---|
90 | ; 1 | 1 | 1 | #NM | #NM :: Go to host taking trap there.
|
---|
91 |
|
---|
92 | ;
|
---|
93 | ; Before taking any of these actions we're checking if we have already
|
---|
94 | ; loaded the GC FPU. Because if we have, this is an trap for the guest - raw ring-3.
|
---|
95 | ;
|
---|
96 | %ifdef RT_ARCH_AMD64
|
---|
97 | %ifdef RT_OS_WINDOWS
|
---|
98 | mov xDX, rcx
|
---|
99 | %else
|
---|
100 | mov xDX, rdi
|
---|
101 | %endif
|
---|
102 | %else
|
---|
103 | mov xDX, dword [esp + 4]
|
---|
104 | %endif
|
---|
105 | test dword [xDX + CPUM.fUseFlags], CPUM_USED_FPU
|
---|
106 | jz hlfpua_not_loaded
|
---|
107 | jmp hlfpua_to_host
|
---|
108 |
|
---|
109 | ;
|
---|
110 | ; Take action.
|
---|
111 | ;
|
---|
112 | align 16
|
---|
113 | hlfpua_not_loaded:
|
---|
114 | mov eax, [xDX + CPUM.Guest.cr0]
|
---|
115 | and eax, X86_CR0_MP | X86_CR0_EM | X86_CR0_TS
|
---|
116 | %ifdef RT_ARCH_AMD64
|
---|
117 | lea r8, [hlfpuajmp1 wrt rip]
|
---|
118 | jmp qword [rax*4 + r8]
|
---|
119 | %else
|
---|
120 | jmp dword [eax*2 + hlfpuajmp1]
|
---|
121 | %endif
|
---|
122 | align 16
|
---|
123 | ;; jump table using fpu related cr0 flags as index.
|
---|
124 | hlfpuajmp1:
|
---|
125 | RTCCPTR_DEF hlfpua_switch_fpu_ctx
|
---|
126 | RTCCPTR_DEF hlfpua_switch_fpu_ctx
|
---|
127 | RTCCPTR_DEF hlfpua_switch_fpu_ctx
|
---|
128 | RTCCPTR_DEF hlfpua_switch_fpu_ctx
|
---|
129 | RTCCPTR_DEF hlfpua_switch_fpu_ctx
|
---|
130 | RTCCPTR_DEF hlfpua_to_host
|
---|
131 | RTCCPTR_DEF hlfpua_switch_fpu_ctx
|
---|
132 | RTCCPTR_DEF hlfpua_to_host
|
---|
133 | ;; and mask for cr0.
|
---|
134 | hlfpu_afFlags:
|
---|
135 | RTCCPTR_DEF ~(X86_CR0_TS | X86_CR0_MP)
|
---|
136 | RTCCPTR_DEF ~(X86_CR0_TS)
|
---|
137 | RTCCPTR_DEF ~(X86_CR0_TS | X86_CR0_MP)
|
---|
138 | RTCCPTR_DEF ~(X86_CR0_TS)
|
---|
139 | RTCCPTR_DEF ~(X86_CR0_MP)
|
---|
140 | RTCCPTR_DEF 0
|
---|
141 | RTCCPTR_DEF ~(X86_CR0_MP)
|
---|
142 | RTCCPTR_DEF 0
|
---|
143 |
|
---|
144 | ;
|
---|
145 | ; Action - switch FPU context and change cr0 flags.
|
---|
146 | ;
|
---|
147 | align 16
|
---|
148 | hlfpua_switch_fpu_ctx:
|
---|
149 | %ifndef IN_RING3 ; IN_GC or IN_RING0
|
---|
150 | mov xCX, cr0
|
---|
151 | %ifdef RT_ARCH_AMD64
|
---|
152 | lea r8, [hlfpu_afFlags wrt rip]
|
---|
153 | and rcx, [rax*4 + r8] ; calc the new cr0 flags.
|
---|
154 | %else
|
---|
155 | and ecx, [eax*2 + hlfpu_afFlags] ; calc the new cr0 flags.
|
---|
156 | %endif
|
---|
157 | mov xAX, cr0
|
---|
158 | and xAX, ~(X86_CR0_TS | X86_CR0_EM)
|
---|
159 | mov cr0, xAX ; clear flags so we don't trap here.
|
---|
160 | %endif
|
---|
161 | %ifndef RT_ARCH_AMD64
|
---|
162 | test dword [xDX + CPUM.CPUFeatures.edx], X86_CPUID_FEATURE_EDX_FXSR
|
---|
163 | jz short hlfpua_no_fxsave
|
---|
164 | %endif
|
---|
165 |
|
---|
166 | fxsave [xDX + CPUM.Host.fpu]
|
---|
167 | or dword [xDX + CPUM.fUseFlags], (CPUM_USED_FPU | CPUM_USED_FPU_SINCE_REM)
|
---|
168 | fxrstor [xDX + CPUM.Guest.fpu]
|
---|
169 | hlfpua_finished_switch:
|
---|
170 | %ifdef IN_GC
|
---|
171 | mov cr0, xCX ; load the new cr0 flags.
|
---|
172 | %endif
|
---|
173 | ; return continue execution.
|
---|
174 | xor eax, eax
|
---|
175 | ret
|
---|
176 |
|
---|
177 | %ifndef RT_ARCH_AMD64
|
---|
178 | ; legacy support.
|
---|
179 | hlfpua_no_fxsave:
|
---|
180 | fnsave [xDX + CPUM.Host.fpu]
|
---|
181 | or dword [xDX + CPUM.fUseFlags], dword (CPUM_USED_FPU | CPUM_USED_FPU_SINCE_REM) ; yasm / nasm
|
---|
182 | mov eax, [xDX + CPUM.Guest.fpu] ; control word
|
---|
183 | not eax ; 1 means exception ignored (6 LS bits)
|
---|
184 | and eax, byte 03Fh ; 6 LS bits only
|
---|
185 | test eax, [xDX + CPUM.Guest.fpu + 4]; status word
|
---|
186 | jz short hlfpua_no_exceptions_pending
|
---|
187 | ; technically incorrect, but we certainly don't want any exceptions now!!
|
---|
188 | and dword [xDX + CPUM.Guest.fpu + 4], ~03Fh
|
---|
189 | hlfpua_no_exceptions_pending:
|
---|
190 | frstor [xDX + CPUM.Guest.fpu]
|
---|
191 | jmp near hlfpua_finished_switch
|
---|
192 | %endif ; !RT_ARCH_AMD64
|
---|
193 |
|
---|
194 |
|
---|
195 | ;
|
---|
196 | ; Action - Generate Guest trap.
|
---|
197 | ;
|
---|
198 | hlfpua_action_4:
|
---|
199 | hlfpua_to_host:
|
---|
200 | mov eax, VINF_EM_RAW_GUEST_TRAP
|
---|
201 | ret
|
---|
202 | ENDPROC CPUMHandleLazyFPUAsm
|
---|
203 |
|
---|
204 |
|
---|
205 | ;;
|
---|
206 | ; Restores the host's FPU/XMM state
|
---|
207 | ;
|
---|
208 | ; @returns 0
|
---|
209 | ; @param pCPUM x86:[esp+4] GCC:rdi MSC:rcx CPUM pointer
|
---|
210 | ;
|
---|
211 | align 16
|
---|
212 | BEGINPROC CPUMRestoreHostFPUStateAsm
|
---|
213 | %ifdef RT_ARCH_AMD64
|
---|
214 | %ifdef RT_OS_WINDOWS
|
---|
215 | mov xDX, rcx
|
---|
216 | %else
|
---|
217 | mov xDX, rdi
|
---|
218 | %endif
|
---|
219 | %else
|
---|
220 | mov xDX, dword [esp + 4]
|
---|
221 | %endif
|
---|
222 |
|
---|
223 | ; Restore FPU if guest has used it.
|
---|
224 | ; Using fxrstor should ensure that we're not causing unwanted exception on the host.
|
---|
225 | test dword [xDX + CPUM.fUseFlags], CPUM_USED_FPU
|
---|
226 | jz short gth_fpu_no
|
---|
227 |
|
---|
228 | mov xAX, cr0
|
---|
229 | mov xCX, xAX ; save old CR0
|
---|
230 | and xAX, ~(X86_CR0_TS | X86_CR0_EM)
|
---|
231 | mov cr0, xAX
|
---|
232 |
|
---|
233 | fxsave [xDX + CPUM.Guest.fpu]
|
---|
234 | fxrstor [xDX + CPUM.Host.fpu]
|
---|
235 |
|
---|
236 | mov cr0, xCX ; and restore old CR0 again
|
---|
237 | and dword [xDX + CPUM.fUseFlags], ~CPUM_USED_FPU
|
---|
238 | gth_fpu_no:
|
---|
239 | xor eax, eax
|
---|
240 | ret
|
---|
241 | ENDPROC CPUMRestoreHostFPUStateAsm
|
---|
242 |
|
---|