VirtualBox

source: vbox/trunk/src/VBox/VMM/VMMAll/PGMAllPhys.cpp@ 90802

Last change on this file since 90802 was 90439, checked in by vboxsync, 3 years ago

VMM/PGM: Check PGMCritSectEnter status code when we don't return it. bugref:6695

  • Property svn:eol-style set to native
  • Property svn:keywords set to Id Revision
File size: 160.4 KB
Line 
1/* $Id: PGMAllPhys.cpp 90439 2021-07-30 16:41:49Z vboxsync $ */
2/** @file
3 * PGM - Page Manager and Monitor, Physical Memory Addressing.
4 */
5
6/*
7 * Copyright (C) 2006-2020 Oracle Corporation
8 *
9 * This file is part of VirtualBox Open Source Edition (OSE), as
10 * available from http://www.virtualbox.org. This file is free software;
11 * you can redistribute it and/or modify it under the terms of the GNU
12 * General Public License (GPL) as published by the Free Software
13 * Foundation, in version 2 as it comes in the "COPYING" file of the
14 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
15 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
16 */
17
18
19/*********************************************************************************************************************************
20* Header Files *
21*********************************************************************************************************************************/
22#define LOG_GROUP LOG_GROUP_PGM_PHYS
23#define VBOX_WITHOUT_PAGING_BIT_FIELDS /* 64-bit bitfields are just asking for trouble. See @bugref{9841} and others. */
24#include <VBox/vmm/pgm.h>
25#include <VBox/vmm/trpm.h>
26#include <VBox/vmm/vmm.h>
27#include <VBox/vmm/iom.h>
28#include <VBox/vmm/em.h>
29#include <VBox/vmm/nem.h>
30#include "PGMInternal.h"
31#include <VBox/vmm/vmcc.h>
32#include "PGMInline.h"
33#include <VBox/param.h>
34#include <VBox/err.h>
35#include <iprt/assert.h>
36#include <iprt/string.h>
37#include <iprt/asm-amd64-x86.h>
38#include <VBox/log.h>
39#ifdef IN_RING3
40# include <iprt/thread.h>
41#endif
42
43
44/*********************************************************************************************************************************
45* Defined Constants And Macros *
46*********************************************************************************************************************************/
47/** Enable the physical TLB. */
48#define PGM_WITH_PHYS_TLB
49
50/** @def PGM_HANDLER_PHYS_IS_VALID_STATUS
51 * Checks if valid physical access handler return code (normal handler, not PF).
52 *
53 * Checks if the given strict status code is one of the expected ones for a
54 * physical access handler in the current context.
55 *
56 * @returns true or false.
57 * @param a_rcStrict The status code.
58 * @param a_fWrite Whether it is a write or read being serviced.
59 *
60 * @remarks We wish to keep the list of statuses here as short as possible.
61 * When changing, please make sure to update the PGMPhysRead,
62 * PGMPhysWrite, PGMPhysReadGCPtr and PGMPhysWriteGCPtr docs too.
63 */
64#ifdef IN_RING3
65# define PGM_HANDLER_PHYS_IS_VALID_STATUS(a_rcStrict, a_fWrite) \
66 ( (a_rcStrict) == VINF_SUCCESS \
67 || (a_rcStrict) == VINF_PGM_HANDLER_DO_DEFAULT)
68#elif defined(IN_RING0)
69#define PGM_HANDLER_PHYS_IS_VALID_STATUS(a_rcStrict, a_fWrite) \
70 ( (a_rcStrict) == VINF_SUCCESS \
71 || (a_rcStrict) == VINF_PGM_HANDLER_DO_DEFAULT \
72 \
73 || (a_rcStrict) == ((a_fWrite) ? VINF_IOM_R3_MMIO_WRITE : VINF_IOM_R3_MMIO_READ) \
74 || (a_rcStrict) == VINF_IOM_R3_MMIO_READ_WRITE \
75 || ((a_rcStrict) == VINF_IOM_R3_MMIO_COMMIT_WRITE && (a_fWrite)) \
76 \
77 || (a_rcStrict) == VINF_EM_RAW_EMULATE_INSTR \
78 || (a_rcStrict) == VINF_EM_DBG_STOP \
79 || (a_rcStrict) == VINF_EM_DBG_EVENT \
80 || (a_rcStrict) == VINF_EM_DBG_BREAKPOINT \
81 || (a_rcStrict) == VINF_EM_OFF \
82 || (a_rcStrict) == VINF_EM_SUSPEND \
83 || (a_rcStrict) == VINF_EM_RESET \
84 )
85#else
86# error "Context?"
87#endif
88
89/** @def PGM_HANDLER_VIRT_IS_VALID_STATUS
90 * Checks if valid virtual access handler return code (normal handler, not PF).
91 *
92 * Checks if the given strict status code is one of the expected ones for a
93 * virtual access handler in the current context.
94 *
95 * @returns true or false.
96 * @param a_rcStrict The status code.
97 * @param a_fWrite Whether it is a write or read being serviced.
98 *
99 * @remarks We wish to keep the list of statuses here as short as possible.
100 * When changing, please make sure to update the PGMPhysRead,
101 * PGMPhysWrite, PGMPhysReadGCPtr and PGMPhysWriteGCPtr docs too.
102 */
103#ifdef IN_RING3
104# define PGM_HANDLER_VIRT_IS_VALID_STATUS(a_rcStrict, a_fWrite) \
105 ( (a_rcStrict) == VINF_SUCCESS \
106 || (a_rcStrict) == VINF_PGM_HANDLER_DO_DEFAULT)
107#elif defined(IN_RING0)
108# define PGM_HANDLER_VIRT_IS_VALID_STATUS(a_rcStrict, a_fWrite) \
109 (false /* no virtual handlers in ring-0! */ )
110#else
111# error "Context?"
112#endif
113
114
115
116#ifndef IN_RING3
117
118/**
119 * @callback_method_impl{FNPGMPHYSHANDLER,
120 * Dummy for forcing ring-3 handling of the access.}
121 */
122DECLEXPORT(VBOXSTRICTRC)
123pgmPhysHandlerRedirectToHC(PVMCC pVM, PVMCPUCC pVCpu, RTGCPHYS GCPhys, void *pvPhys, void *pvBuf, size_t cbBuf,
124 PGMACCESSTYPE enmAccessType, PGMACCESSORIGIN enmOrigin, void *pvUser)
125{
126 NOREF(pVM); NOREF(pVCpu); NOREF(GCPhys); NOREF(pvPhys); NOREF(pvBuf); NOREF(cbBuf);
127 NOREF(enmAccessType); NOREF(enmOrigin); NOREF(pvUser);
128 return VINF_EM_RAW_EMULATE_INSTR;
129}
130
131
132/**
133 * @callback_method_impl{FNPGMRZPHYSPFHANDLER,
134 * Dummy for forcing ring-3 handling of the access.}
135 */
136VMMDECL(VBOXSTRICTRC) pgmPhysPfHandlerRedirectToHC(PVMCC pVM, PVMCPUCC pVCpu, RTGCUINT uErrorCode, PCPUMCTXCORE pRegFrame,
137 RTGCPTR pvFault, RTGCPHYS GCPhysFault, void *pvUser)
138{
139 NOREF(pVM); NOREF(pVCpu); NOREF(uErrorCode); NOREF(pRegFrame); NOREF(pvFault); NOREF(GCPhysFault); NOREF(pvUser);
140 return VINF_EM_RAW_EMULATE_INSTR;
141}
142
143
144/**
145 * @callback_method_impl{FNPGMRZPHYSPFHANDLER,
146 * \#PF access handler callback for guest ROM range write access.}
147 *
148 * @remarks The @a pvUser argument points to the PGMROMRANGE.
149 */
150DECLEXPORT(VBOXSTRICTRC) pgmPhysRomWritePfHandler(PVMCC pVM, PVMCPUCC pVCpu, RTGCUINT uErrorCode, PCPUMCTXCORE pRegFrame,
151 RTGCPTR pvFault, RTGCPHYS GCPhysFault, void *pvUser)
152{
153 int rc;
154 PPGMROMRANGE pRom = (PPGMROMRANGE)pvUser;
155 uint32_t iPage = (GCPhysFault - pRom->GCPhys) >> PAGE_SHIFT;
156 NOREF(uErrorCode); NOREF(pvFault);
157
158 Assert(uErrorCode & X86_TRAP_PF_RW); /* This shall not be used for read access! */
159
160 Assert(iPage < (pRom->cb >> PAGE_SHIFT));
161 switch (pRom->aPages[iPage].enmProt)
162 {
163 case PGMROMPROT_READ_ROM_WRITE_IGNORE:
164 case PGMROMPROT_READ_RAM_WRITE_IGNORE:
165 {
166 /*
167 * If it's a simple instruction which doesn't change the cpu state
168 * we will simply skip it. Otherwise we'll have to defer it to REM.
169 */
170 uint32_t cbOp;
171 PDISCPUSTATE pDis = &pVCpu->pgm.s.DisState;
172 rc = EMInterpretDisasCurrent(pVM, pVCpu, pDis, &cbOp);
173 if ( RT_SUCCESS(rc)
174 && pDis->uCpuMode == DISCPUMODE_32BIT /** @todo why does this matter? */
175 && !(pDis->fPrefix & (DISPREFIX_REPNE | DISPREFIX_REP | DISPREFIX_SEG)))
176 {
177 switch (pDis->bOpCode)
178 {
179 /** @todo Find other instructions we can safely skip, possibly
180 * adding this kind of detection to DIS or EM. */
181 case OP_MOV:
182 pRegFrame->rip += cbOp;
183 STAM_COUNTER_INC(&pVCpu->pgm.s.CTX_SUFF(pStats)->StatRZGuestROMWriteHandled);
184 return VINF_SUCCESS;
185 }
186 }
187 break;
188 }
189
190 case PGMROMPROT_READ_RAM_WRITE_RAM:
191 pRom->aPages[iPage].LiveSave.fWrittenTo = true;
192 rc = PGMHandlerPhysicalPageTempOff(pVM, pRom->GCPhys, GCPhysFault & X86_PTE_PG_MASK);
193 AssertRC(rc);
194 break; /** @todo Must edit the shadow PT and restart the instruction, not use the interpreter! */
195
196 case PGMROMPROT_READ_ROM_WRITE_RAM:
197 /* Handle it in ring-3 because it's *way* easier there. */
198 pRom->aPages[iPage].LiveSave.fWrittenTo = true;
199 break;
200
201 default:
202 AssertMsgFailedReturn(("enmProt=%d iPage=%d GCPhysFault=%RGp\n",
203 pRom->aPages[iPage].enmProt, iPage, GCPhysFault),
204 VERR_IPE_NOT_REACHED_DEFAULT_CASE);
205 }
206
207 STAM_COUNTER_INC(&pVCpu->pgm.s.CTX_SUFF(pStats)->StatRZGuestROMWriteUnhandled);
208 return VINF_EM_RAW_EMULATE_INSTR;
209}
210
211#endif /* !IN_RING3 */
212
213
214/**
215 * @callback_method_impl{FNPGMPHYSHANDLER,
216 * Access handler callback for ROM write accesses.}
217 *
218 * @remarks The @a pvUser argument points to the PGMROMRANGE.
219 */
220PGM_ALL_CB2_DECL(VBOXSTRICTRC)
221pgmPhysRomWriteHandler(PVMCC pVM, PVMCPUCC pVCpu, RTGCPHYS GCPhys, void *pvPhys, void *pvBuf, size_t cbBuf,
222 PGMACCESSTYPE enmAccessType, PGMACCESSORIGIN enmOrigin, void *pvUser)
223{
224 PPGMROMRANGE pRom = (PPGMROMRANGE)pvUser;
225 const uint32_t iPage = (GCPhys - pRom->GCPhys) >> PAGE_SHIFT;
226 Assert(iPage < (pRom->cb >> PAGE_SHIFT));
227 PPGMROMPAGE pRomPage = &pRom->aPages[iPage];
228 Log5(("pgmPhysRomWriteHandler: %d %c %#08RGp %#04zx\n", pRomPage->enmProt, enmAccessType == PGMACCESSTYPE_READ ? 'R' : 'W', GCPhys, cbBuf));
229 NOREF(pVCpu); NOREF(pvPhys); NOREF(enmOrigin);
230
231 if (enmAccessType == PGMACCESSTYPE_READ)
232 {
233 switch (pRomPage->enmProt)
234 {
235 /*
236 * Take the default action.
237 */
238 case PGMROMPROT_READ_ROM_WRITE_IGNORE:
239 case PGMROMPROT_READ_RAM_WRITE_IGNORE:
240 case PGMROMPROT_READ_ROM_WRITE_RAM:
241 case PGMROMPROT_READ_RAM_WRITE_RAM:
242 return VINF_PGM_HANDLER_DO_DEFAULT;
243
244 default:
245 AssertMsgFailedReturn(("enmProt=%d iPage=%d GCPhys=%RGp\n",
246 pRom->aPages[iPage].enmProt, iPage, GCPhys),
247 VERR_IPE_NOT_REACHED_DEFAULT_CASE);
248 }
249 }
250 else
251 {
252 Assert(enmAccessType == PGMACCESSTYPE_WRITE);
253 switch (pRomPage->enmProt)
254 {
255 /*
256 * Ignore writes.
257 */
258 case PGMROMPROT_READ_ROM_WRITE_IGNORE:
259 case PGMROMPROT_READ_RAM_WRITE_IGNORE:
260 return VINF_SUCCESS;
261
262 /*
263 * Write to the RAM page.
264 */
265 case PGMROMPROT_READ_ROM_WRITE_RAM:
266 case PGMROMPROT_READ_RAM_WRITE_RAM: /* yes this will get here too, it's *way* simpler that way. */
267 {
268 /* This should be impossible now, pvPhys doesn't work cross page anylonger. */
269 Assert(((GCPhys - pRom->GCPhys + cbBuf - 1) >> PAGE_SHIFT) == iPage);
270
271 /*
272 * Take the lock, do lazy allocation, map the page and copy the data.
273 *
274 * Note that we have to bypass the mapping TLB since it works on
275 * guest physical addresses and entering the shadow page would
276 * kind of screw things up...
277 */
278 PGM_LOCK_VOID(pVM);
279
280 PPGMPAGE pShadowPage = &pRomPage->Shadow;
281 if (!PGMROMPROT_IS_ROM(pRomPage->enmProt))
282 {
283 pShadowPage = pgmPhysGetPage(pVM, GCPhys);
284 AssertLogRelReturn(pShadowPage, VERR_PGM_PHYS_PAGE_GET_IPE);
285 }
286
287 void *pvDstPage;
288 int rc = pgmPhysPageMakeWritableAndMap(pVM, pShadowPage, GCPhys & X86_PTE_PG_MASK, &pvDstPage);
289 if (RT_SUCCESS(rc))
290 {
291 memcpy((uint8_t *)pvDstPage + (GCPhys & PAGE_OFFSET_MASK), pvBuf, cbBuf);
292 pRomPage->LiveSave.fWrittenTo = true;
293
294 AssertMsg( rc == VINF_SUCCESS
295 || ( rc == VINF_PGM_SYNC_CR3
296 && VMCPU_FF_IS_ANY_SET(pVCpu, VMCPU_FF_PGM_SYNC_CR3 | VMCPU_FF_PGM_SYNC_CR3_NON_GLOBAL))
297 , ("%Rrc\n", rc));
298 rc = VINF_SUCCESS;
299 }
300
301 PGM_UNLOCK(pVM);
302 return rc;
303 }
304
305 default:
306 AssertMsgFailedReturn(("enmProt=%d iPage=%d GCPhys=%RGp\n",
307 pRom->aPages[iPage].enmProt, iPage, GCPhys),
308 VERR_IPE_NOT_REACHED_DEFAULT_CASE);
309 }
310 }
311}
312
313
314/**
315 * Invalidates the RAM range TLBs.
316 *
317 * @param pVM The cross context VM structure.
318 */
319void pgmPhysInvalidRamRangeTlbs(PVMCC pVM)
320{
321 PGM_LOCK_VOID(pVM);
322 RT_ZERO(pVM->pgm.s.apRamRangesTlbR3);
323 RT_ZERO(pVM->pgm.s.apRamRangesTlbR0);
324 PGM_UNLOCK(pVM);
325}
326
327
328/**
329 * Tests if a value of type RTGCPHYS is negative if the type had been signed
330 * instead of unsigned.
331 *
332 * @returns @c true if negative, @c false if positive or zero.
333 * @param a_GCPhys The value to test.
334 * @todo Move me to iprt/types.h.
335 */
336#define RTGCPHYS_IS_NEGATIVE(a_GCPhys) ((a_GCPhys) & ((RTGCPHYS)1 << (sizeof(RTGCPHYS)*8 - 1)))
337
338
339/**
340 * Slow worker for pgmPhysGetRange.
341 *
342 * @copydoc pgmPhysGetRange
343 */
344PPGMRAMRANGE pgmPhysGetRangeSlow(PVM pVM, RTGCPHYS GCPhys)
345{
346 STAM_COUNTER_INC(&pVM->pgm.s.CTX_SUFF(pStats)->CTX_MID_Z(Stat,RamRangeTlbMisses));
347
348 PPGMRAMRANGE pRam = pVM->pgm.s.CTX_SUFF(pRamRangeTree);
349 while (pRam)
350 {
351 RTGCPHYS off = GCPhys - pRam->GCPhys;
352 if (off < pRam->cb)
353 {
354 pVM->pgm.s.CTX_SUFF(apRamRangesTlb)[PGM_RAMRANGE_TLB_IDX(GCPhys)] = pRam;
355 return pRam;
356 }
357 if (RTGCPHYS_IS_NEGATIVE(off))
358 pRam = pRam->CTX_SUFF(pLeft);
359 else
360 pRam = pRam->CTX_SUFF(pRight);
361 }
362 return NULL;
363}
364
365
366/**
367 * Slow worker for pgmPhysGetRangeAtOrAbove.
368 *
369 * @copydoc pgmPhysGetRangeAtOrAbove
370 */
371PPGMRAMRANGE pgmPhysGetRangeAtOrAboveSlow(PVM pVM, RTGCPHYS GCPhys)
372{
373 STAM_COUNTER_INC(&pVM->pgm.s.CTX_SUFF(pStats)->CTX_MID_Z(Stat,RamRangeTlbMisses));
374
375 PPGMRAMRANGE pLastLeft = NULL;
376 PPGMRAMRANGE pRam = pVM->pgm.s.CTX_SUFF(pRamRangeTree);
377 while (pRam)
378 {
379 RTGCPHYS off = GCPhys - pRam->GCPhys;
380 if (off < pRam->cb)
381 {
382 pVM->pgm.s.CTX_SUFF(apRamRangesTlb)[PGM_RAMRANGE_TLB_IDX(GCPhys)] = pRam;
383 return pRam;
384 }
385 if (RTGCPHYS_IS_NEGATIVE(off))
386 {
387 pLastLeft = pRam;
388 pRam = pRam->CTX_SUFF(pLeft);
389 }
390 else
391 pRam = pRam->CTX_SUFF(pRight);
392 }
393 return pLastLeft;
394}
395
396
397/**
398 * Slow worker for pgmPhysGetPage.
399 *
400 * @copydoc pgmPhysGetPage
401 */
402PPGMPAGE pgmPhysGetPageSlow(PVM pVM, RTGCPHYS GCPhys)
403{
404 STAM_COUNTER_INC(&pVM->pgm.s.CTX_SUFF(pStats)->CTX_MID_Z(Stat,RamRangeTlbMisses));
405
406 PPGMRAMRANGE pRam = pVM->pgm.s.CTX_SUFF(pRamRangeTree);
407 while (pRam)
408 {
409 RTGCPHYS off = GCPhys - pRam->GCPhys;
410 if (off < pRam->cb)
411 {
412 pVM->pgm.s.CTX_SUFF(apRamRangesTlb)[PGM_RAMRANGE_TLB_IDX(GCPhys)] = pRam;
413 return &pRam->aPages[off >> PAGE_SHIFT];
414 }
415
416 if (RTGCPHYS_IS_NEGATIVE(off))
417 pRam = pRam->CTX_SUFF(pLeft);
418 else
419 pRam = pRam->CTX_SUFF(pRight);
420 }
421 return NULL;
422}
423
424
425/**
426 * Slow worker for pgmPhysGetPageEx.
427 *
428 * @copydoc pgmPhysGetPageEx
429 */
430int pgmPhysGetPageExSlow(PVM pVM, RTGCPHYS GCPhys, PPPGMPAGE ppPage)
431{
432 STAM_COUNTER_INC(&pVM->pgm.s.CTX_SUFF(pStats)->CTX_MID_Z(Stat,RamRangeTlbMisses));
433
434 PPGMRAMRANGE pRam = pVM->pgm.s.CTX_SUFF(pRamRangeTree);
435 while (pRam)
436 {
437 RTGCPHYS off = GCPhys - pRam->GCPhys;
438 if (off < pRam->cb)
439 {
440 pVM->pgm.s.CTX_SUFF(apRamRangesTlb)[PGM_RAMRANGE_TLB_IDX(GCPhys)] = pRam;
441 *ppPage = &pRam->aPages[off >> PAGE_SHIFT];
442 return VINF_SUCCESS;
443 }
444
445 if (RTGCPHYS_IS_NEGATIVE(off))
446 pRam = pRam->CTX_SUFF(pLeft);
447 else
448 pRam = pRam->CTX_SUFF(pRight);
449 }
450
451 *ppPage = NULL;
452 return VERR_PGM_INVALID_GC_PHYSICAL_ADDRESS;
453}
454
455
456/**
457 * Slow worker for pgmPhysGetPageAndRangeEx.
458 *
459 * @copydoc pgmPhysGetPageAndRangeEx
460 */
461int pgmPhysGetPageAndRangeExSlow(PVM pVM, RTGCPHYS GCPhys, PPPGMPAGE ppPage, PPGMRAMRANGE *ppRam)
462{
463 STAM_COUNTER_INC(&pVM->pgm.s.CTX_SUFF(pStats)->CTX_MID_Z(Stat,RamRangeTlbMisses));
464
465 PPGMRAMRANGE pRam = pVM->pgm.s.CTX_SUFF(pRamRangeTree);
466 while (pRam)
467 {
468 RTGCPHYS off = GCPhys - pRam->GCPhys;
469 if (off < pRam->cb)
470 {
471 pVM->pgm.s.CTX_SUFF(apRamRangesTlb)[PGM_RAMRANGE_TLB_IDX(GCPhys)] = pRam;
472 *ppRam = pRam;
473 *ppPage = &pRam->aPages[off >> PAGE_SHIFT];
474 return VINF_SUCCESS;
475 }
476
477 if (RTGCPHYS_IS_NEGATIVE(off))
478 pRam = pRam->CTX_SUFF(pLeft);
479 else
480 pRam = pRam->CTX_SUFF(pRight);
481 }
482
483 *ppRam = NULL;
484 *ppPage = NULL;
485 return VERR_PGM_INVALID_GC_PHYSICAL_ADDRESS;
486}
487
488
489/**
490 * Checks if Address Gate 20 is enabled or not.
491 *
492 * @returns true if enabled.
493 * @returns false if disabled.
494 * @param pVCpu The cross context virtual CPU structure.
495 */
496VMMDECL(bool) PGMPhysIsA20Enabled(PVMCPU pVCpu)
497{
498 LogFlow(("PGMPhysIsA20Enabled %d\n", pVCpu->pgm.s.fA20Enabled));
499 return pVCpu->pgm.s.fA20Enabled;
500}
501
502
503/**
504 * Validates a GC physical address.
505 *
506 * @returns true if valid.
507 * @returns false if invalid.
508 * @param pVM The cross context VM structure.
509 * @param GCPhys The physical address to validate.
510 */
511VMMDECL(bool) PGMPhysIsGCPhysValid(PVMCC pVM, RTGCPHYS GCPhys)
512{
513 PPGMPAGE pPage = pgmPhysGetPage(pVM, GCPhys);
514 return pPage != NULL;
515}
516
517
518/**
519 * Checks if a GC physical address is a normal page,
520 * i.e. not ROM, MMIO or reserved.
521 *
522 * @returns true if normal.
523 * @returns false if invalid, ROM, MMIO or reserved page.
524 * @param pVM The cross context VM structure.
525 * @param GCPhys The physical address to check.
526 */
527VMMDECL(bool) PGMPhysIsGCPhysNormal(PVMCC pVM, RTGCPHYS GCPhys)
528{
529 PPGMPAGE pPage = pgmPhysGetPage(pVM, GCPhys);
530 return pPage
531 && PGM_PAGE_GET_TYPE(pPage) == PGMPAGETYPE_RAM;
532}
533
534
535/**
536 * Converts a GC physical address to a HC physical address.
537 *
538 * @returns VINF_SUCCESS on success.
539 * @returns VERR_PGM_PHYS_PAGE_RESERVED it it's a valid GC physical
540 * page but has no physical backing.
541 * @returns VERR_PGM_INVALID_GC_PHYSICAL_ADDRESS if it's not a valid
542 * GC physical address.
543 *
544 * @param pVM The cross context VM structure.
545 * @param GCPhys The GC physical address to convert.
546 * @param pHCPhys Where to store the HC physical address on success.
547 */
548VMM_INT_DECL(int) PGMPhysGCPhys2HCPhys(PVMCC pVM, RTGCPHYS GCPhys, PRTHCPHYS pHCPhys)
549{
550 PGM_LOCK_VOID(pVM);
551 PPGMPAGE pPage;
552 int rc = pgmPhysGetPageEx(pVM, GCPhys, &pPage);
553 if (RT_SUCCESS(rc))
554 *pHCPhys = PGM_PAGE_GET_HCPHYS(pPage) | (GCPhys & PAGE_OFFSET_MASK);
555 PGM_UNLOCK(pVM);
556 return rc;
557}
558
559
560/**
561 * Invalidates all page mapping TLBs.
562 *
563 * @param pVM The cross context VM structure.
564 */
565void pgmPhysInvalidatePageMapTLB(PVMCC pVM)
566{
567 PGM_LOCK_VOID(pVM);
568 STAM_COUNTER_INC(&pVM->pgm.s.CTX_SUFF(pStats)->StatPageMapTlbFlushes);
569
570 /* Clear the R3 & R0 TLBs completely. */
571 for (unsigned i = 0; i < RT_ELEMENTS(pVM->pgm.s.PhysTlbR0.aEntries); i++)
572 {
573 pVM->pgm.s.PhysTlbR0.aEntries[i].GCPhys = NIL_RTGCPHYS;
574 pVM->pgm.s.PhysTlbR0.aEntries[i].pPage = 0;
575#ifndef VBOX_WITH_RAM_IN_KERNEL
576 pVM->pgm.s.PhysTlbR0.aEntries[i].pMap = 0;
577#endif
578 pVM->pgm.s.PhysTlbR0.aEntries[i].pv = 0;
579 }
580
581 for (unsigned i = 0; i < RT_ELEMENTS(pVM->pgm.s.PhysTlbR3.aEntries); i++)
582 {
583 pVM->pgm.s.PhysTlbR3.aEntries[i].GCPhys = NIL_RTGCPHYS;
584 pVM->pgm.s.PhysTlbR3.aEntries[i].pPage = 0;
585 pVM->pgm.s.PhysTlbR3.aEntries[i].pMap = 0;
586 pVM->pgm.s.PhysTlbR3.aEntries[i].pv = 0;
587 }
588
589 PGM_UNLOCK(pVM);
590}
591
592
593/**
594 * Invalidates a page mapping TLB entry
595 *
596 * @param pVM The cross context VM structure.
597 * @param GCPhys GCPhys entry to flush
598 */
599void pgmPhysInvalidatePageMapTLBEntry(PVMCC pVM, RTGCPHYS GCPhys)
600{
601 PGM_LOCK_ASSERT_OWNER(pVM);
602
603 STAM_COUNTER_INC(&pVM->pgm.s.CTX_SUFF(pStats)->StatPageMapTlbFlushEntry);
604
605 unsigned const idx = PGM_PAGER3MAPTLB_IDX(GCPhys);
606
607 pVM->pgm.s.PhysTlbR0.aEntries[idx].GCPhys = NIL_RTGCPHYS;
608 pVM->pgm.s.PhysTlbR0.aEntries[idx].pPage = 0;
609#ifndef VBOX_WITH_RAM_IN_KERNEL
610 pVM->pgm.s.PhysTlbR0.aEntries[idx].pMap = 0;
611#endif
612 pVM->pgm.s.PhysTlbR0.aEntries[idx].pv = 0;
613
614 pVM->pgm.s.PhysTlbR3.aEntries[idx].GCPhys = NIL_RTGCPHYS;
615 pVM->pgm.s.PhysTlbR3.aEntries[idx].pPage = 0;
616 pVM->pgm.s.PhysTlbR3.aEntries[idx].pMap = 0;
617 pVM->pgm.s.PhysTlbR3.aEntries[idx].pv = 0;
618}
619
620
621/**
622 * Makes sure that there is at least one handy page ready for use.
623 *
624 * This will also take the appropriate actions when reaching water-marks.
625 *
626 * @returns VBox status code.
627 * @retval VINF_SUCCESS on success.
628 * @retval VERR_EM_NO_MEMORY if we're really out of memory.
629 *
630 * @param pVM The cross context VM structure.
631 *
632 * @remarks Must be called from within the PGM critical section. It may
633 * nip back to ring-3/0 in some cases.
634 */
635static int pgmPhysEnsureHandyPage(PVMCC pVM)
636{
637 AssertMsg(pVM->pgm.s.cHandyPages <= RT_ELEMENTS(pVM->pgm.s.aHandyPages), ("%d\n", pVM->pgm.s.cHandyPages));
638
639 /*
640 * Do we need to do anything special?
641 */
642#ifdef IN_RING3
643 if (pVM->pgm.s.cHandyPages <= RT_MAX(PGM_HANDY_PAGES_SET_FF, PGM_HANDY_PAGES_R3_ALLOC))
644#else
645 if (pVM->pgm.s.cHandyPages <= RT_MAX(PGM_HANDY_PAGES_SET_FF, PGM_HANDY_PAGES_RZ_TO_R3))
646#endif
647 {
648 /*
649 * Allocate pages only if we're out of them, or in ring-3, almost out.
650 */
651#ifdef IN_RING3
652 if (pVM->pgm.s.cHandyPages <= PGM_HANDY_PAGES_R3_ALLOC)
653#else
654 if (pVM->pgm.s.cHandyPages <= PGM_HANDY_PAGES_RZ_ALLOC)
655#endif
656 {
657 Log(("PGM: cHandyPages=%u out of %u -> allocate more; VM_FF_PGM_NO_MEMORY=%RTbool\n",
658 pVM->pgm.s.cHandyPages, RT_ELEMENTS(pVM->pgm.s.aHandyPages), VM_FF_IS_SET(pVM, VM_FF_PGM_NO_MEMORY) ));
659#ifdef IN_RING3
660 int rc = PGMR3PhysAllocateHandyPages(pVM);
661#else
662 int rc = VMMRZCallRing3NoCpu(pVM, VMMCALLRING3_PGM_ALLOCATE_HANDY_PAGES, 0);
663#endif
664 if (RT_UNLIKELY(rc != VINF_SUCCESS))
665 {
666 if (RT_FAILURE(rc))
667 return rc;
668 AssertMsgReturn(rc == VINF_EM_NO_MEMORY, ("%Rrc\n", rc), VERR_IPE_UNEXPECTED_INFO_STATUS);
669 if (!pVM->pgm.s.cHandyPages)
670 {
671 LogRel(("PGM: no more handy pages!\n"));
672 return VERR_EM_NO_MEMORY;
673 }
674 Assert(VM_FF_IS_SET(pVM, VM_FF_PGM_NEED_HANDY_PAGES));
675 Assert(VM_FF_IS_SET(pVM, VM_FF_PGM_NO_MEMORY));
676#ifndef IN_RING3
677 VMCPU_FF_SET(VMMGetCpu(pVM), VMCPU_FF_TO_R3); /* paranoia */
678#endif
679 }
680 AssertMsgReturn( pVM->pgm.s.cHandyPages > 0
681 && pVM->pgm.s.cHandyPages <= RT_ELEMENTS(pVM->pgm.s.aHandyPages),
682 ("%u\n", pVM->pgm.s.cHandyPages),
683 VERR_PGM_HANDY_PAGE_IPE);
684 }
685 else
686 {
687 if (pVM->pgm.s.cHandyPages <= PGM_HANDY_PAGES_SET_FF)
688 VM_FF_SET(pVM, VM_FF_PGM_NEED_HANDY_PAGES);
689#ifndef IN_RING3
690 if (pVM->pgm.s.cHandyPages <= PGM_HANDY_PAGES_RZ_TO_R3)
691 {
692 Log(("PGM: VM_FF_TO_R3 - cHandyPages=%u out of %u\n", pVM->pgm.s.cHandyPages, RT_ELEMENTS(pVM->pgm.s.aHandyPages)));
693 VMCPU_FF_SET(VMMGetCpu(pVM), VMCPU_FF_TO_R3);
694 }
695#endif
696 }
697 }
698
699 return VINF_SUCCESS;
700}
701
702
703
704/**
705 * Replace a zero or shared page with new page that we can write to.
706 *
707 * @returns The following VBox status codes.
708 * @retval VINF_SUCCESS on success, pPage is modified.
709 * @retval VINF_PGM_SYNC_CR3 on success and a page pool flush is pending.
710 * @retval VERR_EM_NO_MEMORY if we're totally out of memory.
711 *
712 * @todo Propagate VERR_EM_NO_MEMORY up the call tree.
713 *
714 * @param pVM The cross context VM structure.
715 * @param pPage The physical page tracking structure. This will
716 * be modified on success.
717 * @param GCPhys The address of the page.
718 *
719 * @remarks Must be called from within the PGM critical section. It may
720 * nip back to ring-3/0 in some cases.
721 *
722 * @remarks This function shouldn't really fail, however if it does
723 * it probably means we've screwed up the size of handy pages and/or
724 * the low-water mark. Or, that some device I/O is causing a lot of
725 * pages to be allocated while while the host is in a low-memory
726 * condition. This latter should be handled elsewhere and in a more
727 * controlled manner, it's on the @bugref{3170} todo list...
728 */
729int pgmPhysAllocPage(PVMCC pVM, PPGMPAGE pPage, RTGCPHYS GCPhys)
730{
731 LogFlow(("pgmPhysAllocPage: %R[pgmpage] %RGp\n", pPage, GCPhys));
732
733 /*
734 * Prereqs.
735 */
736 PGM_LOCK_ASSERT_OWNER(pVM);
737 AssertMsg(PGM_PAGE_IS_ZERO(pPage) || PGM_PAGE_IS_SHARED(pPage), ("%R[pgmpage] %RGp\n", pPage, GCPhys));
738 Assert(!PGM_PAGE_IS_MMIO_OR_ALIAS(pPage));
739
740# ifdef PGM_WITH_LARGE_PAGES
741 /*
742 * Try allocate a large page if applicable.
743 */
744 if ( PGMIsUsingLargePages(pVM)
745 && PGM_PAGE_GET_TYPE(pPage) == PGMPAGETYPE_RAM
746 && !VM_IS_NEM_ENABLED(pVM)) /** @todo NEM: Implement large pages support. */
747 {
748 RTGCPHYS GCPhysBase = GCPhys & X86_PDE2M_PAE_PG_MASK;
749 PPGMPAGE pBasePage;
750
751 int rc = pgmPhysGetPageEx(pVM, GCPhysBase, &pBasePage);
752 AssertRCReturn(rc, rc); /* paranoia; can't happen. */
753 if (PGM_PAGE_GET_PDE_TYPE(pBasePage) == PGM_PAGE_PDE_TYPE_DONTCARE)
754 {
755 rc = pgmPhysAllocLargePage(pVM, GCPhys);
756 if (rc == VINF_SUCCESS)
757 return rc;
758 }
759 /* Mark the base as type page table, so we don't check over and over again. */
760 PGM_PAGE_SET_PDE_TYPE(pVM, pBasePage, PGM_PAGE_PDE_TYPE_PT);
761
762 /* fall back to 4KB pages. */
763 }
764# endif
765
766 /*
767 * Flush any shadow page table mappings of the page.
768 * When VBOX_WITH_NEW_LAZY_PAGE_ALLOC isn't defined, there shouldn't be any.
769 */
770 bool fFlushTLBs = false;
771 int rc = pgmPoolTrackUpdateGCPhys(pVM, GCPhys, pPage, true /*fFlushTLBs*/, &fFlushTLBs);
772 AssertMsgReturn(rc == VINF_SUCCESS || rc == VINF_PGM_SYNC_CR3, ("%Rrc\n", rc), RT_FAILURE(rc) ? rc : VERR_IPE_UNEXPECTED_STATUS);
773
774 /*
775 * Ensure that we've got a page handy, take it and use it.
776 */
777 int rc2 = pgmPhysEnsureHandyPage(pVM);
778 if (RT_FAILURE(rc2))
779 {
780 if (fFlushTLBs)
781 PGM_INVL_ALL_VCPU_TLBS(pVM);
782 Assert(rc2 == VERR_EM_NO_MEMORY);
783 return rc2;
784 }
785 /* re-assert preconditions since pgmPhysEnsureHandyPage may do a context switch. */
786 PGM_LOCK_ASSERT_OWNER(pVM);
787 AssertMsg(PGM_PAGE_IS_ZERO(pPage) || PGM_PAGE_IS_SHARED(pPage), ("%R[pgmpage] %RGp\n", pPage, GCPhys));
788 Assert(!PGM_PAGE_IS_MMIO_OR_ALIAS(pPage));
789
790 uint32_t iHandyPage = --pVM->pgm.s.cHandyPages;
791 AssertMsg(iHandyPage < RT_ELEMENTS(pVM->pgm.s.aHandyPages), ("%d\n", iHandyPage));
792 Assert(pVM->pgm.s.aHandyPages[iHandyPage].HCPhysGCPhys != NIL_RTHCPHYS);
793 Assert(!(pVM->pgm.s.aHandyPages[iHandyPage].HCPhysGCPhys & ~X86_PTE_PAE_PG_MASK));
794 Assert(pVM->pgm.s.aHandyPages[iHandyPage].idPage != NIL_GMM_PAGEID);
795 Assert(pVM->pgm.s.aHandyPages[iHandyPage].idSharedPage == NIL_GMM_PAGEID);
796
797 /*
798 * There are one or two action to be taken the next time we allocate handy pages:
799 * - Tell the GMM (global memory manager) what the page is being used for.
800 * (Speeds up replacement operations - sharing and defragmenting.)
801 * - If the current backing is shared, it must be freed.
802 */
803 const RTHCPHYS HCPhys = pVM->pgm.s.aHandyPages[iHandyPage].HCPhysGCPhys;
804 pVM->pgm.s.aHandyPages[iHandyPage].HCPhysGCPhys = GCPhys & ~(RTGCPHYS)PAGE_OFFSET_MASK;
805
806 void const *pvSharedPage = NULL;
807 if (PGM_PAGE_IS_SHARED(pPage))
808 {
809 /* Mark this shared page for freeing/dereferencing. */
810 pVM->pgm.s.aHandyPages[iHandyPage].idSharedPage = PGM_PAGE_GET_PAGEID(pPage);
811 Assert(PGM_PAGE_GET_PAGEID(pPage) != NIL_GMM_PAGEID);
812
813 Log(("PGM: Replaced shared page %#x at %RGp with %#x / %RHp\n", PGM_PAGE_GET_PAGEID(pPage),
814 GCPhys, pVM->pgm.s.aHandyPages[iHandyPage].idPage, HCPhys));
815 STAM_COUNTER_INC(&pVM->pgm.s.CTX_SUFF(pStats)->CTX_MID_Z(Stat,PageReplaceShared));
816 pVM->pgm.s.cSharedPages--;
817
818 /* Grab the address of the page so we can make a copy later on. (safe) */
819 rc = pgmPhysPageMapReadOnly(pVM, pPage, GCPhys, &pvSharedPage);
820 AssertRC(rc);
821 }
822 else
823 {
824 Log2(("PGM: Replaced zero page %RGp with %#x / %RHp\n", GCPhys, pVM->pgm.s.aHandyPages[iHandyPage].idPage, HCPhys));
825 STAM_COUNTER_INC(&pVM->pgm.s.CTX_SUFF(pStats)->StatRZPageReplaceZero);
826 pVM->pgm.s.cZeroPages--;
827 }
828
829 /*
830 * Do the PGMPAGE modifications.
831 */
832 pVM->pgm.s.cPrivatePages++;
833 PGM_PAGE_SET_HCPHYS(pVM, pPage, HCPhys);
834 PGM_PAGE_SET_PAGEID(pVM, pPage, pVM->pgm.s.aHandyPages[iHandyPage].idPage);
835 PGM_PAGE_SET_STATE(pVM, pPage, PGM_PAGE_STATE_ALLOCATED);
836 PGM_PAGE_SET_PDE_TYPE(pVM, pPage, PGM_PAGE_PDE_TYPE_PT);
837 pgmPhysInvalidatePageMapTLBEntry(pVM, GCPhys);
838
839 /* Copy the shared page contents to the replacement page. */
840 if (pvSharedPage)
841 {
842 /* Get the virtual address of the new page. */
843 PGMPAGEMAPLOCK PgMpLck;
844 void *pvNewPage;
845 rc = pgmPhysGCPhys2CCPtrInternal(pVM, pPage, GCPhys, &pvNewPage, &PgMpLck); AssertRC(rc);
846 if (RT_SUCCESS(rc))
847 {
848 memcpy(pvNewPage, pvSharedPage, PAGE_SIZE); /** @todo todo write ASMMemCopyPage */
849 pgmPhysReleaseInternalPageMappingLock(pVM, &PgMpLck);
850 }
851 }
852
853 if ( fFlushTLBs
854 && rc != VINF_PGM_GCPHYS_ALIASED)
855 PGM_INVL_ALL_VCPU_TLBS(pVM);
856
857 /*
858 * Notify NEM about the mapping change for this page.
859 *
860 * Note! Shadow ROM pages are complicated as they can definitely be
861 * allocated while not visible, so play safe.
862 */
863 if (VM_IS_NEM_ENABLED(pVM))
864 {
865 PGMPAGETYPE enmType = (PGMPAGETYPE)PGM_PAGE_GET_TYPE(pPage);
866 if ( enmType != PGMPAGETYPE_ROM_SHADOW
867 || pgmPhysGetPage(pVM, GCPhys) == pPage)
868 {
869 uint8_t u2State = PGM_PAGE_GET_NEM_STATE(pPage);
870 rc2 = NEMHCNotifyPhysPageAllocated(pVM, GCPhys & ~(RTGCPHYS)X86_PAGE_OFFSET_MASK, HCPhys,
871 pgmPhysPageCalcNemProtection(pPage, enmType), enmType, &u2State);
872 if (RT_SUCCESS(rc))
873 PGM_PAGE_SET_NEM_STATE(pPage, u2State);
874 else
875 rc = rc2;
876 }
877 }
878
879 return rc;
880}
881
882#ifdef PGM_WITH_LARGE_PAGES
883
884/**
885 * Replace a 2 MB range of zero pages with new pages that we can write to.
886 *
887 * @returns The following VBox status codes.
888 * @retval VINF_SUCCESS on success, pPage is modified.
889 * @retval VINF_PGM_SYNC_CR3 on success and a page pool flush is pending.
890 * @retval VERR_EM_NO_MEMORY if we're totally out of memory.
891 *
892 * @todo Propagate VERR_EM_NO_MEMORY up the call tree.
893 *
894 * @param pVM The cross context VM structure.
895 * @param GCPhys The address of the page.
896 *
897 * @remarks Must be called from within the PGM critical section. It may
898 * nip back to ring-3/0 in some cases.
899 */
900int pgmPhysAllocLargePage(PVMCC pVM, RTGCPHYS GCPhys)
901{
902 RTGCPHYS GCPhysBase = GCPhys & X86_PDE2M_PAE_PG_MASK;
903 LogFlow(("pgmPhysAllocLargePage: %RGp base %RGp\n", GCPhys, GCPhysBase));
904 Assert(!VM_IS_NEM_ENABLED(pVM)); /** @todo NEM: Large page support. */
905
906 /*
907 * Prereqs.
908 */
909 PGM_LOCK_ASSERT_OWNER(pVM);
910 Assert(PGMIsUsingLargePages(pVM));
911
912 PPGMPAGE pFirstPage;
913 int rc = pgmPhysGetPageEx(pVM, GCPhysBase, &pFirstPage);
914 if ( RT_SUCCESS(rc)
915 && PGM_PAGE_GET_TYPE(pFirstPage) == PGMPAGETYPE_RAM)
916 {
917 unsigned uPDEType = PGM_PAGE_GET_PDE_TYPE(pFirstPage);
918
919 /* Don't call this function for already allocated pages. */
920 Assert(uPDEType != PGM_PAGE_PDE_TYPE_PDE);
921
922 if ( uPDEType == PGM_PAGE_PDE_TYPE_DONTCARE
923 && PGM_PAGE_GET_STATE(pFirstPage) == PGM_PAGE_STATE_ZERO)
924 {
925 /* Lazy approach: check all pages in the 2 MB range.
926 * The whole range must be ram and unallocated. */
927 GCPhys = GCPhysBase;
928 unsigned iPage;
929 for (iPage = 0; iPage < _2M/PAGE_SIZE; iPage++)
930 {
931 PPGMPAGE pSubPage;
932 rc = pgmPhysGetPageEx(pVM, GCPhys, &pSubPage);
933 if ( RT_FAILURE(rc)
934 || PGM_PAGE_GET_TYPE(pSubPage) != PGMPAGETYPE_RAM /* Anything other than ram implies monitoring. */
935 || PGM_PAGE_GET_STATE(pSubPage) != PGM_PAGE_STATE_ZERO) /* Allocated, monitored or shared means we can't use a large page here */
936 {
937 LogFlow(("Found page %RGp with wrong attributes (type=%d; state=%d); cancel check. rc=%d\n", GCPhys, PGM_PAGE_GET_TYPE(pSubPage), PGM_PAGE_GET_STATE(pSubPage), rc));
938 break;
939 }
940 Assert(PGM_PAGE_GET_PDE_TYPE(pSubPage) == PGM_PAGE_PDE_TYPE_DONTCARE);
941 GCPhys += PAGE_SIZE;
942 }
943 if (iPage != _2M/PAGE_SIZE)
944 {
945 /* Failed. Mark as requiring a PT so we don't check the whole thing again in the future. */
946 STAM_REL_COUNTER_INC(&pVM->pgm.s.StatLargePageRefused);
947 PGM_PAGE_SET_PDE_TYPE(pVM, pFirstPage, PGM_PAGE_PDE_TYPE_PT);
948 return VERR_PGM_INVALID_LARGE_PAGE_RANGE;
949 }
950
951 /*
952 * Do the allocation.
953 */
954# ifdef IN_RING3
955 rc = PGMR3PhysAllocateLargeHandyPage(pVM, GCPhysBase);
956# else
957 rc = VMMRZCallRing3NoCpu(pVM, VMMCALLRING3_PGM_ALLOCATE_LARGE_HANDY_PAGE, GCPhysBase);
958# endif
959 if (RT_SUCCESS(rc))
960 {
961 Assert(PGM_PAGE_GET_STATE(pFirstPage) == PGM_PAGE_STATE_ALLOCATED);
962 pVM->pgm.s.cLargePages++;
963 return VINF_SUCCESS;
964 }
965
966 /* If we fail once, it most likely means the host's memory is too
967 fragmented; don't bother trying again. */
968 LogFlow(("pgmPhysAllocLargePage failed with %Rrc\n", rc));
969 PGMSetLargePageUsage(pVM, false);
970 return rc;
971 }
972 }
973 return VERR_PGM_INVALID_LARGE_PAGE_RANGE;
974}
975
976
977/**
978 * Recheck the entire 2 MB range to see if we can use it again as a large page.
979 *
980 * @returns The following VBox status codes.
981 * @retval VINF_SUCCESS on success, the large page can be used again
982 * @retval VERR_PGM_INVALID_LARGE_PAGE_RANGE if it can't be reused
983 *
984 * @param pVM The cross context VM structure.
985 * @param GCPhys The address of the page.
986 * @param pLargePage Page structure of the base page
987 */
988int pgmPhysRecheckLargePage(PVMCC pVM, RTGCPHYS GCPhys, PPGMPAGE pLargePage)
989{
990 STAM_REL_COUNTER_INC(&pVM->pgm.s.StatLargePageRecheck);
991
992 Assert(!VM_IS_NEM_ENABLED(pVM)); /** @todo NEM: Large page support. */
993
994 GCPhys &= X86_PDE2M_PAE_PG_MASK;
995
996 /* Check the base page. */
997 Assert(PGM_PAGE_GET_PDE_TYPE(pLargePage) == PGM_PAGE_PDE_TYPE_PDE_DISABLED);
998 if ( PGM_PAGE_GET_STATE(pLargePage) != PGM_PAGE_STATE_ALLOCATED
999 || PGM_PAGE_GET_TYPE(pLargePage) != PGMPAGETYPE_RAM
1000 || PGM_PAGE_GET_HNDL_PHYS_STATE(pLargePage) != PGM_PAGE_HNDL_PHYS_STATE_NONE)
1001 {
1002 LogFlow(("pgmPhysRecheckLargePage: checks failed for base page %x %x %x\n", PGM_PAGE_GET_STATE(pLargePage), PGM_PAGE_GET_TYPE(pLargePage), PGM_PAGE_GET_HNDL_PHYS_STATE(pLargePage)));
1003 return VERR_PGM_INVALID_LARGE_PAGE_RANGE;
1004 }
1005
1006 STAM_PROFILE_START(&pVM->pgm.s.CTX_SUFF(pStats)->CTX_MID_Z(Stat,IsValidLargePage), a);
1007 /* Check all remaining pages in the 2 MB range. */
1008 unsigned i;
1009 GCPhys += PAGE_SIZE;
1010 for (i = 1; i < _2M/PAGE_SIZE; i++)
1011 {
1012 PPGMPAGE pPage;
1013 int rc = pgmPhysGetPageEx(pVM, GCPhys, &pPage);
1014 AssertRCBreak(rc);
1015
1016 if ( PGM_PAGE_GET_STATE(pPage) != PGM_PAGE_STATE_ALLOCATED
1017 || PGM_PAGE_GET_PDE_TYPE(pPage) != PGM_PAGE_PDE_TYPE_PDE
1018 || PGM_PAGE_GET_TYPE(pPage) != PGMPAGETYPE_RAM
1019 || PGM_PAGE_GET_HNDL_PHYS_STATE(pPage) != PGM_PAGE_HNDL_PHYS_STATE_NONE)
1020 {
1021 LogFlow(("pgmPhysRecheckLargePage: checks failed for page %d; %x %x %x\n", i, PGM_PAGE_GET_STATE(pPage), PGM_PAGE_GET_TYPE(pPage), PGM_PAGE_GET_HNDL_PHYS_STATE(pPage)));
1022 break;
1023 }
1024
1025 GCPhys += PAGE_SIZE;
1026 }
1027 STAM_PROFILE_STOP(&pVM->pgm.s.CTX_SUFF(pStats)->CTX_MID_Z(Stat,IsValidLargePage), a);
1028
1029 if (i == _2M/PAGE_SIZE)
1030 {
1031 PGM_PAGE_SET_PDE_TYPE(pVM, pLargePage, PGM_PAGE_PDE_TYPE_PDE);
1032 pVM->pgm.s.cLargePagesDisabled--;
1033 Log(("pgmPhysRecheckLargePage: page %RGp can be reused!\n", GCPhys - _2M));
1034 return VINF_SUCCESS;
1035 }
1036
1037 return VERR_PGM_INVALID_LARGE_PAGE_RANGE;
1038}
1039
1040#endif /* PGM_WITH_LARGE_PAGES */
1041
1042
1043/**
1044 * Deal with a write monitored page.
1045 *
1046 * @returns VBox strict status code.
1047 *
1048 * @param pVM The cross context VM structure.
1049 * @param pPage The physical page tracking structure.
1050 * @param GCPhys The guest physical address of the page.
1051 * PGMPhysReleasePageMappingLock() passes NIL_RTGCPHYS in a
1052 * very unlikely situation where it is okay that we let NEM
1053 * fix the page access in a lazy fasion.
1054 *
1055 * @remarks Called from within the PGM critical section.
1056 */
1057void pgmPhysPageMakeWriteMonitoredWritable(PVMCC pVM, PPGMPAGE pPage, RTGCPHYS GCPhys)
1058{
1059 Assert(PGM_PAGE_GET_STATE(pPage) == PGM_PAGE_STATE_WRITE_MONITORED);
1060 PGM_PAGE_SET_WRITTEN_TO(pVM, pPage);
1061 PGM_PAGE_SET_STATE(pVM, pPage, PGM_PAGE_STATE_ALLOCATED);
1062 Assert(pVM->pgm.s.cMonitoredPages > 0);
1063 pVM->pgm.s.cMonitoredPages--;
1064 pVM->pgm.s.cWrittenToPages++;
1065
1066 /*
1067 * Notify NEM about the protection change so we won't spin forever.
1068 *
1069 * Note! NEM need to be handle to lazily correct page protection as we cannot
1070 * really get it 100% right here it seems. The page pool does this too.
1071 */
1072 if (VM_IS_NEM_ENABLED(pVM) && GCPhys != NIL_RTGCPHYS)
1073 {
1074 uint8_t u2State = PGM_PAGE_GET_NEM_STATE(pPage);
1075 PGMPAGETYPE enmType = (PGMPAGETYPE)PGM_PAGE_GET_TYPE(pPage);
1076 NEMHCNotifyPhysPageProtChanged(pVM, GCPhys, PGM_PAGE_GET_HCPHYS(pPage),
1077 pgmPhysPageCalcNemProtection(pPage, enmType), enmType, &u2State);
1078 PGM_PAGE_SET_NEM_STATE(pPage, u2State);
1079 }
1080}
1081
1082
1083/**
1084 * Deal with pages that are not writable, i.e. not in the ALLOCATED state.
1085 *
1086 * @returns VBox strict status code.
1087 * @retval VINF_SUCCESS on success.
1088 * @retval VINF_PGM_SYNC_CR3 on success and a page pool flush is pending.
1089 * @retval VERR_PGM_PHYS_PAGE_RESERVED it it's a valid page but has no physical backing.
1090 *
1091 * @param pVM The cross context VM structure.
1092 * @param pPage The physical page tracking structure.
1093 * @param GCPhys The address of the page.
1094 *
1095 * @remarks Called from within the PGM critical section.
1096 */
1097int pgmPhysPageMakeWritable(PVMCC pVM, PPGMPAGE pPage, RTGCPHYS GCPhys)
1098{
1099 PGM_LOCK_ASSERT_OWNER(pVM);
1100 switch (PGM_PAGE_GET_STATE(pPage))
1101 {
1102 case PGM_PAGE_STATE_WRITE_MONITORED:
1103 pgmPhysPageMakeWriteMonitoredWritable(pVM, pPage, GCPhys);
1104 RT_FALL_THRU();
1105 default: /* to shut up GCC */
1106 case PGM_PAGE_STATE_ALLOCATED:
1107 return VINF_SUCCESS;
1108
1109 /*
1110 * Zero pages can be dummy pages for MMIO or reserved memory,
1111 * so we need to check the flags before joining cause with
1112 * shared page replacement.
1113 */
1114 case PGM_PAGE_STATE_ZERO:
1115 if (PGM_PAGE_IS_MMIO(pPage))
1116 return VERR_PGM_PHYS_PAGE_RESERVED;
1117 RT_FALL_THRU();
1118 case PGM_PAGE_STATE_SHARED:
1119 return pgmPhysAllocPage(pVM, pPage, GCPhys);
1120
1121 /* Not allowed to write to ballooned pages. */
1122 case PGM_PAGE_STATE_BALLOONED:
1123 return VERR_PGM_PHYS_PAGE_BALLOONED;
1124 }
1125}
1126
1127
1128/**
1129 * Internal usage: Map the page specified by its GMM ID.
1130 *
1131 * This is similar to pgmPhysPageMap
1132 *
1133 * @returns VBox status code.
1134 *
1135 * @param pVM The cross context VM structure.
1136 * @param idPage The Page ID.
1137 * @param HCPhys The physical address (for SUPR0HCPhysToVirt).
1138 * @param ppv Where to store the mapping address.
1139 *
1140 * @remarks Called from within the PGM critical section. The mapping is only
1141 * valid while you are inside this section.
1142 */
1143int pgmPhysPageMapByPageID(PVMCC pVM, uint32_t idPage, RTHCPHYS HCPhys, void **ppv)
1144{
1145 /*
1146 * Validation.
1147 */
1148 PGM_LOCK_ASSERT_OWNER(pVM);
1149 AssertReturn(HCPhys && !(HCPhys & PAGE_OFFSET_MASK), VERR_INVALID_PARAMETER);
1150 const uint32_t idChunk = idPage >> GMM_CHUNKID_SHIFT;
1151 AssertReturn(idChunk != NIL_GMM_CHUNKID, VERR_INVALID_PARAMETER);
1152
1153#if defined(IN_RING0) && defined(VBOX_WITH_RAM_IN_KERNEL)
1154# ifdef VBOX_WITH_LINEAR_HOST_PHYS_MEM
1155 return SUPR0HCPhysToVirt(HCPhys & ~(RTHCPHYS)PAGE_OFFSET_MASK, ppv);
1156# else
1157 return GMMR0PageIdToVirt(pVM, idPage, ppv);
1158# endif
1159
1160#else
1161 /*
1162 * Find/make Chunk TLB entry for the mapping chunk.
1163 */
1164 PPGMCHUNKR3MAP pMap;
1165 PPGMCHUNKR3MAPTLBE pTlbe = &pVM->pgm.s.ChunkR3Map.Tlb.aEntries[PGM_CHUNKR3MAPTLB_IDX(idChunk)];
1166 if (pTlbe->idChunk == idChunk)
1167 {
1168 STAM_COUNTER_INC(&pVM->pgm.s.CTX_SUFF(pStats)->CTX_MID_Z(Stat,ChunkR3MapTlbHits));
1169 pMap = pTlbe->pChunk;
1170 }
1171 else
1172 {
1173 STAM_COUNTER_INC(&pVM->pgm.s.CTX_SUFF(pStats)->CTX_MID_Z(Stat,ChunkR3MapTlbMisses));
1174
1175 /*
1176 * Find the chunk, map it if necessary.
1177 */
1178 pMap = (PPGMCHUNKR3MAP)RTAvlU32Get(&pVM->pgm.s.ChunkR3Map.pTree, idChunk);
1179 if (pMap)
1180 pMap->iLastUsed = pVM->pgm.s.ChunkR3Map.iNow;
1181 else
1182 {
1183# ifdef IN_RING0
1184 int rc = VMMRZCallRing3NoCpu(pVM, VMMCALLRING3_PGM_MAP_CHUNK, idChunk);
1185 AssertRCReturn(rc, rc);
1186 pMap = (PPGMCHUNKR3MAP)RTAvlU32Get(&pVM->pgm.s.ChunkR3Map.pTree, idChunk);
1187 Assert(pMap);
1188# else
1189 int rc = pgmR3PhysChunkMap(pVM, idChunk, &pMap);
1190 if (RT_FAILURE(rc))
1191 return rc;
1192# endif
1193 }
1194
1195 /*
1196 * Enter it into the Chunk TLB.
1197 */
1198 pTlbe->idChunk = idChunk;
1199 pTlbe->pChunk = pMap;
1200 }
1201
1202 *ppv = (uint8_t *)pMap->pv + ((idPage &GMM_PAGEID_IDX_MASK) << PAGE_SHIFT);
1203 return VINF_SUCCESS;
1204#endif
1205}
1206
1207
1208/**
1209 * Maps a page into the current virtual address space so it can be accessed.
1210 *
1211 * @returns VBox status code.
1212 * @retval VINF_SUCCESS on success.
1213 * @retval VERR_PGM_PHYS_PAGE_RESERVED it it's a valid page but has no physical backing.
1214 *
1215 * @param pVM The cross context VM structure.
1216 * @param pPage The physical page tracking structure.
1217 * @param GCPhys The address of the page.
1218 * @param ppMap Where to store the address of the mapping tracking structure.
1219 * @param ppv Where to store the mapping address of the page. The page
1220 * offset is masked off!
1221 *
1222 * @remarks Called from within the PGM critical section.
1223 */
1224static int pgmPhysPageMapCommon(PVMCC pVM, PPGMPAGE pPage, RTGCPHYS GCPhys, PPPGMPAGEMAP ppMap, void **ppv)
1225{
1226 PGM_LOCK_ASSERT_OWNER(pVM);
1227 NOREF(GCPhys);
1228
1229 /*
1230 * Special cases: MMIO2, ZERO and specially aliased MMIO pages.
1231 */
1232 if ( PGM_PAGE_GET_TYPE(pPage) == PGMPAGETYPE_MMIO2
1233 || PGM_PAGE_GET_TYPE(pPage) == PGMPAGETYPE_MMIO2_ALIAS_MMIO)
1234 {
1235 /* Decode the page id to a page in a MMIO2 ram range. */
1236 uint8_t idMmio2 = PGM_MMIO2_PAGEID_GET_MMIO2_ID(PGM_PAGE_GET_PAGEID(pPage));
1237 uint32_t iPage = PGM_MMIO2_PAGEID_GET_IDX(PGM_PAGE_GET_PAGEID(pPage));
1238 AssertLogRelMsgReturn((uint8_t)(idMmio2 - 1U) < RT_ELEMENTS(pVM->pgm.s.CTX_SUFF(apMmio2Ranges)),
1239 ("idMmio2=%u size=%u type=%u GCPHys=%#RGp Id=%u State=%u", idMmio2,
1240 RT_ELEMENTS(pVM->pgm.s.CTX_SUFF(apMmio2Ranges)), PGM_PAGE_GET_TYPE(pPage), GCPhys,
1241 pPage->s.idPage, pPage->s.uStateY),
1242 VERR_PGM_PHYS_PAGE_MAP_MMIO2_IPE);
1243 PPGMREGMMIO2RANGE pMmio2Range = pVM->pgm.s.CTX_SUFF(apMmio2Ranges)[idMmio2 - 1];
1244 AssertLogRelReturn(pMmio2Range, VERR_PGM_PHYS_PAGE_MAP_MMIO2_IPE);
1245 AssertLogRelReturn(pMmio2Range->idMmio2 == idMmio2, VERR_PGM_PHYS_PAGE_MAP_MMIO2_IPE);
1246 AssertLogRelReturn(iPage < (pMmio2Range->RamRange.cb >> PAGE_SHIFT), VERR_PGM_PHYS_PAGE_MAP_MMIO2_IPE);
1247 *ppMap = NULL;
1248# if defined(IN_RING0) && defined(VBOX_WITH_RAM_IN_KERNEL) && defined(VBOX_WITH_LINEAR_HOST_PHYS_MEM)
1249 return SUPR0HCPhysToVirt(PGM_PAGE_GET_HCPHYS(pPage), ppv);
1250# elif defined(IN_RING0) && defined(VBOX_WITH_RAM_IN_KERNEL)
1251 *ppv = (uint8_t *)pMmio2Range->pvR0 + ((uintptr_t)iPage << PAGE_SHIFT);
1252 return VINF_SUCCESS;
1253# else
1254 *ppv = (uint8_t *)pMmio2Range->RamRange.pvR3 + ((uintptr_t)iPage << PAGE_SHIFT);
1255 return VINF_SUCCESS;
1256# endif
1257 }
1258
1259 const uint32_t idChunk = PGM_PAGE_GET_CHUNKID(pPage);
1260 if (idChunk == NIL_GMM_CHUNKID)
1261 {
1262 AssertMsgReturn(PGM_PAGE_GET_PAGEID(pPage) == NIL_GMM_PAGEID, ("pPage=%R[pgmpage]\n", pPage),
1263 VERR_PGM_PHYS_PAGE_MAP_IPE_1);
1264 if (!PGM_PAGE_IS_SPECIAL_ALIAS_MMIO(pPage))
1265 {
1266 AssertMsgReturn(PGM_PAGE_IS_ZERO(pPage), ("pPage=%R[pgmpage]\n", pPage),
1267 VERR_PGM_PHYS_PAGE_MAP_IPE_3);
1268 AssertMsgReturn(PGM_PAGE_GET_HCPHYS(pPage)== pVM->pgm.s.HCPhysZeroPg, ("pPage=%R[pgmpage]\n", pPage),
1269 VERR_PGM_PHYS_PAGE_MAP_IPE_4);
1270 *ppv = pVM->pgm.s.CTXALLSUFF(pvZeroPg);
1271 }
1272 else
1273 *ppv = pVM->pgm.s.CTXALLSUFF(pvZeroPg);
1274 *ppMap = NULL;
1275 return VINF_SUCCESS;
1276 }
1277
1278# if defined(IN_RING0) && defined(VBOX_WITH_RAM_IN_KERNEL) && defined(VBOX_WITH_LINEAR_HOST_PHYS_MEM)
1279 /*
1280 * Just use the physical address.
1281 */
1282 *ppMap = NULL;
1283 return SUPR0HCPhysToVirt(PGM_PAGE_GET_HCPHYS(pPage), ppv);
1284
1285# elif defined(IN_RING0) && defined(VBOX_WITH_RAM_IN_KERNEL)
1286 /*
1287 * Go by page ID thru GMMR0.
1288 */
1289 *ppMap = NULL;
1290 return GMMR0PageIdToVirt(pVM, PGM_PAGE_GET_PAGEID(pPage), ppv);
1291
1292# else
1293 /*
1294 * Find/make Chunk TLB entry for the mapping chunk.
1295 */
1296 PPGMCHUNKR3MAP pMap;
1297 PPGMCHUNKR3MAPTLBE pTlbe = &pVM->pgm.s.ChunkR3Map.Tlb.aEntries[PGM_CHUNKR3MAPTLB_IDX(idChunk)];
1298 if (pTlbe->idChunk == idChunk)
1299 {
1300 STAM_COUNTER_INC(&pVM->pgm.s.CTX_SUFF(pStats)->CTX_MID_Z(Stat,ChunkR3MapTlbHits));
1301 pMap = pTlbe->pChunk;
1302 AssertPtr(pMap->pv);
1303 }
1304 else
1305 {
1306 STAM_COUNTER_INC(&pVM->pgm.s.CTX_SUFF(pStats)->CTX_MID_Z(Stat,ChunkR3MapTlbMisses));
1307
1308 /*
1309 * Find the chunk, map it if necessary.
1310 */
1311 pMap = (PPGMCHUNKR3MAP)RTAvlU32Get(&pVM->pgm.s.ChunkR3Map.pTree, idChunk);
1312 if (pMap)
1313 {
1314 AssertPtr(pMap->pv);
1315 pMap->iLastUsed = pVM->pgm.s.ChunkR3Map.iNow;
1316 }
1317 else
1318 {
1319# ifdef IN_RING0
1320 int rc = VMMRZCallRing3NoCpu(pVM, VMMCALLRING3_PGM_MAP_CHUNK, idChunk);
1321 AssertRCReturn(rc, rc);
1322 pMap = (PPGMCHUNKR3MAP)RTAvlU32Get(&pVM->pgm.s.ChunkR3Map.pTree, idChunk);
1323 Assert(pMap);
1324# else
1325 int rc = pgmR3PhysChunkMap(pVM, idChunk, &pMap);
1326 if (RT_FAILURE(rc))
1327 return rc;
1328# endif
1329 AssertPtr(pMap->pv);
1330 }
1331
1332 /*
1333 * Enter it into the Chunk TLB.
1334 */
1335 pTlbe->idChunk = idChunk;
1336 pTlbe->pChunk = pMap;
1337 }
1338
1339 *ppv = (uint8_t *)pMap->pv + (PGM_PAGE_GET_PAGE_IN_CHUNK(pPage) << PAGE_SHIFT);
1340 *ppMap = pMap;
1341 return VINF_SUCCESS;
1342# endif /* !IN_RING0 || !VBOX_WITH_RAM_IN_KERNEL */
1343}
1344
1345
1346/**
1347 * Combination of pgmPhysPageMakeWritable and pgmPhysPageMapWritable.
1348 *
1349 * This is typically used is paths where we cannot use the TLB methods (like ROM
1350 * pages) or where there is no point in using them since we won't get many hits.
1351 *
1352 * @returns VBox strict status code.
1353 * @retval VINF_SUCCESS on success.
1354 * @retval VINF_PGM_SYNC_CR3 on success and a page pool flush is pending.
1355 * @retval VERR_PGM_PHYS_PAGE_RESERVED it it's a valid page but has no physical backing.
1356 *
1357 * @param pVM The cross context VM structure.
1358 * @param pPage The physical page tracking structure.
1359 * @param GCPhys The address of the page.
1360 * @param ppv Where to store the mapping address of the page. The page
1361 * offset is masked off!
1362 *
1363 * @remarks Called from within the PGM critical section. The mapping is only
1364 * valid while you are inside section.
1365 */
1366int pgmPhysPageMakeWritableAndMap(PVMCC pVM, PPGMPAGE pPage, RTGCPHYS GCPhys, void **ppv)
1367{
1368 int rc = pgmPhysPageMakeWritable(pVM, pPage, GCPhys);
1369 if (RT_SUCCESS(rc))
1370 {
1371 AssertMsg(rc == VINF_SUCCESS || rc == VINF_PGM_SYNC_CR3 /* returned */, ("%Rrc\n", rc));
1372 PPGMPAGEMAP pMapIgnore;
1373 int rc2 = pgmPhysPageMapCommon(pVM, pPage, GCPhys, &pMapIgnore, ppv);
1374 if (RT_FAILURE(rc2)) /* preserve rc */
1375 rc = rc2;
1376 }
1377 return rc;
1378}
1379
1380
1381/**
1382 * Maps a page into the current virtual address space so it can be accessed for
1383 * both writing and reading.
1384 *
1385 * This is typically used is paths where we cannot use the TLB methods (like ROM
1386 * pages) or where there is no point in using them since we won't get many hits.
1387 *
1388 * @returns VBox status code.
1389 * @retval VINF_SUCCESS on success.
1390 * @retval VERR_PGM_PHYS_PAGE_RESERVED it it's a valid page but has no physical backing.
1391 *
1392 * @param pVM The cross context VM structure.
1393 * @param pPage The physical page tracking structure. Must be in the
1394 * allocated state.
1395 * @param GCPhys The address of the page.
1396 * @param ppv Where to store the mapping address of the page. The page
1397 * offset is masked off!
1398 *
1399 * @remarks Called from within the PGM critical section. The mapping is only
1400 * valid while you are inside section.
1401 */
1402int pgmPhysPageMap(PVMCC pVM, PPGMPAGE pPage, RTGCPHYS GCPhys, void **ppv)
1403{
1404 Assert(PGM_PAGE_GET_STATE(pPage) == PGM_PAGE_STATE_ALLOCATED);
1405 PPGMPAGEMAP pMapIgnore;
1406 return pgmPhysPageMapCommon(pVM, pPage, GCPhys, &pMapIgnore, ppv);
1407}
1408
1409
1410/**
1411 * Maps a page into the current virtual address space so it can be accessed for
1412 * reading.
1413 *
1414 * This is typically used is paths where we cannot use the TLB methods (like ROM
1415 * pages) or where there is no point in using them since we won't get many hits.
1416 *
1417 * @returns VBox status code.
1418 * @retval VINF_SUCCESS on success.
1419 * @retval VERR_PGM_PHYS_PAGE_RESERVED it it's a valid page but has no physical backing.
1420 *
1421 * @param pVM The cross context VM structure.
1422 * @param pPage The physical page tracking structure.
1423 * @param GCPhys The address of the page.
1424 * @param ppv Where to store the mapping address of the page. The page
1425 * offset is masked off!
1426 *
1427 * @remarks Called from within the PGM critical section. The mapping is only
1428 * valid while you are inside this section.
1429 */
1430int pgmPhysPageMapReadOnly(PVMCC pVM, PPGMPAGE pPage, RTGCPHYS GCPhys, void const **ppv)
1431{
1432 PPGMPAGEMAP pMapIgnore;
1433 return pgmPhysPageMapCommon(pVM, pPage, GCPhys, &pMapIgnore, (void **)ppv);
1434}
1435
1436
1437/**
1438 * Load a guest page into the ring-3 physical TLB.
1439 *
1440 * @returns VBox status code.
1441 * @retval VINF_SUCCESS on success
1442 * @retval VERR_PGM_INVALID_GC_PHYSICAL_ADDRESS if it's not a valid physical address.
1443 * @param pVM The cross context VM structure.
1444 * @param GCPhys The guest physical address in question.
1445 */
1446int pgmPhysPageLoadIntoTlb(PVMCC pVM, RTGCPHYS GCPhys)
1447{
1448 PGM_LOCK_ASSERT_OWNER(pVM);
1449
1450 /*
1451 * Find the ram range and page and hand it over to the with-page function.
1452 * 99.8% of requests are expected to be in the first range.
1453 */
1454 PPGMPAGE pPage = pgmPhysGetPage(pVM, GCPhys);
1455 if (!pPage)
1456 {
1457 STAM_COUNTER_INC(&pVM->pgm.s.CTX_SUFF(pStats)->CTX_MID_Z(Stat,PageMapTlbMisses));
1458 return VERR_PGM_INVALID_GC_PHYSICAL_ADDRESS;
1459 }
1460
1461 return pgmPhysPageLoadIntoTlbWithPage(pVM, pPage, GCPhys);
1462}
1463
1464
1465/**
1466 * Load a guest page into the ring-3 physical TLB.
1467 *
1468 * @returns VBox status code.
1469 * @retval VINF_SUCCESS on success
1470 * @retval VERR_PGM_INVALID_GC_PHYSICAL_ADDRESS if it's not a valid physical address.
1471 *
1472 * @param pVM The cross context VM structure.
1473 * @param pPage Pointer to the PGMPAGE structure corresponding to
1474 * GCPhys.
1475 * @param GCPhys The guest physical address in question.
1476 */
1477int pgmPhysPageLoadIntoTlbWithPage(PVMCC pVM, PPGMPAGE pPage, RTGCPHYS GCPhys)
1478{
1479 PGM_LOCK_ASSERT_OWNER(pVM);
1480 STAM_COUNTER_INC(&pVM->pgm.s.CTX_SUFF(pStats)->CTX_MID_Z(Stat,PageMapTlbMisses));
1481
1482 /*
1483 * Map the page.
1484 * Make a special case for the zero page as it is kind of special.
1485 */
1486 PPGMPAGEMAPTLBE pTlbe = &pVM->pgm.s.CTX_SUFF(PhysTlb).aEntries[PGM_PAGEMAPTLB_IDX(GCPhys)];
1487 if ( !PGM_PAGE_IS_ZERO(pPage)
1488 && !PGM_PAGE_IS_BALLOONED(pPage))
1489 {
1490 void *pv;
1491 PPGMPAGEMAP pMap;
1492 int rc = pgmPhysPageMapCommon(pVM, pPage, GCPhys, &pMap, &pv);
1493 if (RT_FAILURE(rc))
1494 return rc;
1495# if !defined(IN_RING0) || !defined(VBOX_WITH_RAM_IN_KERNEL)
1496 pTlbe->pMap = pMap;
1497# endif
1498 pTlbe->pv = pv;
1499 Assert(!((uintptr_t)pTlbe->pv & PAGE_OFFSET_MASK));
1500 }
1501 else
1502 {
1503 AssertMsg(PGM_PAGE_GET_HCPHYS(pPage) == pVM->pgm.s.HCPhysZeroPg, ("%RGp/%R[pgmpage]\n", GCPhys, pPage));
1504# if !defined(IN_RING0) || !defined(VBOX_WITH_RAM_IN_KERNEL)
1505 pTlbe->pMap = NULL;
1506# endif
1507 pTlbe->pv = pVM->pgm.s.CTXALLSUFF(pvZeroPg);
1508 }
1509# ifdef PGM_WITH_PHYS_TLB
1510 if ( PGM_PAGE_GET_TYPE(pPage) < PGMPAGETYPE_ROM_SHADOW
1511 || PGM_PAGE_GET_TYPE(pPage) > PGMPAGETYPE_ROM)
1512 pTlbe->GCPhys = GCPhys & X86_PTE_PAE_PG_MASK;
1513 else
1514 pTlbe->GCPhys = NIL_RTGCPHYS; /* ROM: Problematic because of the two pages. :-/ */
1515# else
1516 pTlbe->GCPhys = NIL_RTGCPHYS;
1517# endif
1518 pTlbe->pPage = pPage;
1519 return VINF_SUCCESS;
1520}
1521
1522
1523/**
1524 * Internal version of PGMPhysGCPhys2CCPtr that expects the caller to
1525 * own the PGM lock and therefore not need to lock the mapped page.
1526 *
1527 * @returns VBox status code.
1528 * @retval VINF_SUCCESS on success.
1529 * @retval VERR_PGM_PHYS_PAGE_RESERVED it it's a valid page but has no physical backing.
1530 * @retval VERR_PGM_INVALID_GC_PHYSICAL_ADDRESS if it's not a valid physical address.
1531 *
1532 * @param pVM The cross context VM structure.
1533 * @param GCPhys The guest physical address of the page that should be mapped.
1534 * @param pPage Pointer to the PGMPAGE structure for the page.
1535 * @param ppv Where to store the address corresponding to GCPhys.
1536 *
1537 * @internal
1538 * @deprecated Use pgmPhysGCPhys2CCPtrInternalEx.
1539 */
1540int pgmPhysGCPhys2CCPtrInternalDepr(PVMCC pVM, PPGMPAGE pPage, RTGCPHYS GCPhys, void **ppv)
1541{
1542 int rc;
1543 AssertReturn(pPage, VERR_PGM_PHYS_NULL_PAGE_PARAM);
1544 PGM_LOCK_ASSERT_OWNER(pVM);
1545 pVM->pgm.s.cDeprecatedPageLocks++;
1546
1547 /*
1548 * Make sure the page is writable.
1549 */
1550 if (RT_UNLIKELY(PGM_PAGE_GET_STATE(pPage) != PGM_PAGE_STATE_ALLOCATED))
1551 {
1552 rc = pgmPhysPageMakeWritable(pVM, pPage, GCPhys);
1553 if (RT_FAILURE(rc))
1554 return rc;
1555 AssertMsg(rc == VINF_SUCCESS || rc == VINF_PGM_SYNC_CR3 /* not returned */, ("%Rrc\n", rc));
1556 }
1557 Assert(PGM_PAGE_GET_HCPHYS(pPage) != 0);
1558
1559 /*
1560 * Get the mapping address.
1561 */
1562 PPGMPAGEMAPTLBE pTlbe;
1563 rc = pgmPhysPageQueryTlbeWithPage(pVM, pPage, GCPhys, &pTlbe);
1564 if (RT_FAILURE(rc))
1565 return rc;
1566 *ppv = (void *)((uintptr_t)pTlbe->pv | (uintptr_t)(GCPhys & PAGE_OFFSET_MASK));
1567 return VINF_SUCCESS;
1568}
1569
1570
1571/**
1572 * Locks a page mapping for writing.
1573 *
1574 * @param pVM The cross context VM structure.
1575 * @param pPage The page.
1576 * @param pTlbe The mapping TLB entry for the page.
1577 * @param pLock The lock structure (output).
1578 */
1579DECLINLINE(void) pgmPhysPageMapLockForWriting(PVM pVM, PPGMPAGE pPage, PPGMPAGEMAPTLBE pTlbe, PPGMPAGEMAPLOCK pLock)
1580{
1581# if !defined(IN_RING0) || !defined(VBOX_WITH_RAM_IN_KERNEL)
1582 PPGMPAGEMAP pMap = pTlbe->pMap;
1583 if (pMap)
1584 pMap->cRefs++;
1585# else
1586 RT_NOREF(pTlbe);
1587# endif
1588
1589 unsigned cLocks = PGM_PAGE_GET_WRITE_LOCKS(pPage);
1590 if (RT_LIKELY(cLocks < PGM_PAGE_MAX_LOCKS - 1))
1591 {
1592 if (cLocks == 0)
1593 pVM->pgm.s.cWriteLockedPages++;
1594 PGM_PAGE_INC_WRITE_LOCKS(pPage);
1595 }
1596 else if (cLocks != PGM_PAGE_MAX_LOCKS)
1597 {
1598 PGM_PAGE_INC_WRITE_LOCKS(pPage);
1599 AssertMsgFailed(("%R[pgmpage] is entering permanent write locked state!\n", pPage));
1600# if !defined(IN_RING0) || !defined(VBOX_WITH_RAM_IN_KERNEL)
1601 if (pMap)
1602 pMap->cRefs++; /* Extra ref to prevent it from going away. */
1603# endif
1604 }
1605
1606 pLock->uPageAndType = (uintptr_t)pPage | PGMPAGEMAPLOCK_TYPE_WRITE;
1607# if !defined(IN_RING0) || !defined(VBOX_WITH_RAM_IN_KERNEL)
1608 pLock->pvMap = pMap;
1609# else
1610 pLock->pvMap = NULL;
1611# endif
1612}
1613
1614/**
1615 * Locks a page mapping for reading.
1616 *
1617 * @param pVM The cross context VM structure.
1618 * @param pPage The page.
1619 * @param pTlbe The mapping TLB entry for the page.
1620 * @param pLock The lock structure (output).
1621 */
1622DECLINLINE(void) pgmPhysPageMapLockForReading(PVM pVM, PPGMPAGE pPage, PPGMPAGEMAPTLBE pTlbe, PPGMPAGEMAPLOCK pLock)
1623{
1624# if !defined(IN_RING0) || !defined(VBOX_WITH_RAM_IN_KERNEL)
1625 PPGMPAGEMAP pMap = pTlbe->pMap;
1626 if (pMap)
1627 pMap->cRefs++;
1628# else
1629 RT_NOREF(pTlbe);
1630# endif
1631
1632 unsigned cLocks = PGM_PAGE_GET_READ_LOCKS(pPage);
1633 if (RT_LIKELY(cLocks < PGM_PAGE_MAX_LOCKS - 1))
1634 {
1635 if (cLocks == 0)
1636 pVM->pgm.s.cReadLockedPages++;
1637 PGM_PAGE_INC_READ_LOCKS(pPage);
1638 }
1639 else if (cLocks != PGM_PAGE_MAX_LOCKS)
1640 {
1641 PGM_PAGE_INC_READ_LOCKS(pPage);
1642 AssertMsgFailed(("%R[pgmpage] is entering permanent read locked state!\n", pPage));
1643# if !defined(IN_RING0) || !defined(VBOX_WITH_RAM_IN_KERNEL)
1644 if (pMap)
1645 pMap->cRefs++; /* Extra ref to prevent it from going away. */
1646# endif
1647 }
1648
1649 pLock->uPageAndType = (uintptr_t)pPage | PGMPAGEMAPLOCK_TYPE_READ;
1650# if !defined(IN_RING0) || !defined(VBOX_WITH_RAM_IN_KERNEL)
1651 pLock->pvMap = pMap;
1652# else
1653 pLock->pvMap = NULL;
1654# endif
1655}
1656
1657
1658/**
1659 * Internal version of PGMPhysGCPhys2CCPtr that expects the caller to
1660 * own the PGM lock and have access to the page structure.
1661 *
1662 * @returns VBox status code.
1663 * @retval VINF_SUCCESS on success.
1664 * @retval VERR_PGM_PHYS_PAGE_RESERVED it it's a valid page but has no physical backing.
1665 * @retval VERR_PGM_INVALID_GC_PHYSICAL_ADDRESS if it's not a valid physical address.
1666 *
1667 * @param pVM The cross context VM structure.
1668 * @param GCPhys The guest physical address of the page that should be mapped.
1669 * @param pPage Pointer to the PGMPAGE structure for the page.
1670 * @param ppv Where to store the address corresponding to GCPhys.
1671 * @param pLock Where to store the lock information that
1672 * pgmPhysReleaseInternalPageMappingLock needs.
1673 *
1674 * @internal
1675 */
1676int pgmPhysGCPhys2CCPtrInternal(PVMCC pVM, PPGMPAGE pPage, RTGCPHYS GCPhys, void **ppv, PPGMPAGEMAPLOCK pLock)
1677{
1678 int rc;
1679 AssertReturn(pPage, VERR_PGM_PHYS_NULL_PAGE_PARAM);
1680 PGM_LOCK_ASSERT_OWNER(pVM);
1681
1682 /*
1683 * Make sure the page is writable.
1684 */
1685 if (RT_UNLIKELY(PGM_PAGE_GET_STATE(pPage) != PGM_PAGE_STATE_ALLOCATED))
1686 {
1687 rc = pgmPhysPageMakeWritable(pVM, pPage, GCPhys);
1688 if (RT_FAILURE(rc))
1689 return rc;
1690 AssertMsg(rc == VINF_SUCCESS || rc == VINF_PGM_SYNC_CR3 /* not returned */, ("%Rrc\n", rc));
1691 }
1692 Assert(PGM_PAGE_GET_HCPHYS(pPage) != 0);
1693
1694 /*
1695 * Do the job.
1696 */
1697 PPGMPAGEMAPTLBE pTlbe;
1698 rc = pgmPhysPageQueryTlbeWithPage(pVM, pPage, GCPhys, &pTlbe);
1699 if (RT_FAILURE(rc))
1700 return rc;
1701 pgmPhysPageMapLockForWriting(pVM, pPage, pTlbe, pLock);
1702 *ppv = (void *)((uintptr_t)pTlbe->pv | (uintptr_t)(GCPhys & PAGE_OFFSET_MASK));
1703 return VINF_SUCCESS;
1704}
1705
1706
1707/**
1708 * Internal version of PGMPhysGCPhys2CCPtrReadOnly that expects the caller to
1709 * own the PGM lock and have access to the page structure.
1710 *
1711 * @returns VBox status code.
1712 * @retval VINF_SUCCESS on success.
1713 * @retval VERR_PGM_PHYS_PAGE_RESERVED it it's a valid page but has no physical backing.
1714 * @retval VERR_PGM_INVALID_GC_PHYSICAL_ADDRESS if it's not a valid physical address.
1715 *
1716 * @param pVM The cross context VM structure.
1717 * @param GCPhys The guest physical address of the page that should be mapped.
1718 * @param pPage Pointer to the PGMPAGE structure for the page.
1719 * @param ppv Where to store the address corresponding to GCPhys.
1720 * @param pLock Where to store the lock information that
1721 * pgmPhysReleaseInternalPageMappingLock needs.
1722 *
1723 * @internal
1724 */
1725int pgmPhysGCPhys2CCPtrInternalReadOnly(PVMCC pVM, PPGMPAGE pPage, RTGCPHYS GCPhys, const void **ppv, PPGMPAGEMAPLOCK pLock)
1726{
1727 AssertReturn(pPage, VERR_PGM_PHYS_NULL_PAGE_PARAM);
1728 PGM_LOCK_ASSERT_OWNER(pVM);
1729 Assert(PGM_PAGE_GET_HCPHYS(pPage) != 0);
1730
1731 /*
1732 * Do the job.
1733 */
1734 PPGMPAGEMAPTLBE pTlbe;
1735 int rc = pgmPhysPageQueryTlbeWithPage(pVM, pPage, GCPhys, &pTlbe);
1736 if (RT_FAILURE(rc))
1737 return rc;
1738 pgmPhysPageMapLockForReading(pVM, pPage, pTlbe, pLock);
1739 *ppv = (void *)((uintptr_t)pTlbe->pv | (uintptr_t)(GCPhys & PAGE_OFFSET_MASK));
1740 return VINF_SUCCESS;
1741}
1742
1743
1744/**
1745 * Requests the mapping of a guest page into the current context.
1746 *
1747 * This API should only be used for very short term, as it will consume scarse
1748 * resources (R0 and GC) in the mapping cache. When you're done with the page,
1749 * call PGMPhysReleasePageMappingLock() ASAP to release it.
1750 *
1751 * This API will assume your intention is to write to the page, and will
1752 * therefore replace shared and zero pages. If you do not intend to modify
1753 * the page, use the PGMPhysGCPhys2CCPtrReadOnly() API.
1754 *
1755 * @returns VBox status code.
1756 * @retval VINF_SUCCESS on success.
1757 * @retval VERR_PGM_PHYS_PAGE_RESERVED it it's a valid page but has no physical backing.
1758 * @retval VERR_PGM_INVALID_GC_PHYSICAL_ADDRESS if it's not a valid physical address.
1759 *
1760 * @param pVM The cross context VM structure.
1761 * @param GCPhys The guest physical address of the page that should be
1762 * mapped.
1763 * @param ppv Where to store the address corresponding to GCPhys.
1764 * @param pLock Where to store the lock information that
1765 * PGMPhysReleasePageMappingLock needs.
1766 *
1767 * @remarks The caller is responsible for dealing with access handlers.
1768 * @todo Add an informational return code for pages with access handlers?
1769 *
1770 * @remark Avoid calling this API from within critical sections (other than
1771 * the PGM one) because of the deadlock risk. External threads may
1772 * need to delegate jobs to the EMTs.
1773 * @remarks Only one page is mapped! Make no assumption about what's after or
1774 * before the returned page!
1775 * @thread Any thread.
1776 */
1777VMM_INT_DECL(int) PGMPhysGCPhys2CCPtr(PVMCC pVM, RTGCPHYS GCPhys, void **ppv, PPGMPAGEMAPLOCK pLock)
1778{
1779 int rc = PGM_LOCK(pVM);
1780 AssertRCReturn(rc, rc);
1781
1782 /*
1783 * Query the Physical TLB entry for the page (may fail).
1784 */
1785 PPGMPAGEMAPTLBE pTlbe;
1786 rc = pgmPhysPageQueryTlbe(pVM, GCPhys, &pTlbe);
1787 if (RT_SUCCESS(rc))
1788 {
1789 /*
1790 * If the page is shared, the zero page, or being write monitored
1791 * it must be converted to a page that's writable if possible.
1792 */
1793 PPGMPAGE pPage = pTlbe->pPage;
1794 if (RT_UNLIKELY(PGM_PAGE_GET_STATE(pPage) != PGM_PAGE_STATE_ALLOCATED))
1795 {
1796 rc = pgmPhysPageMakeWritable(pVM, pPage, GCPhys);
1797 if (RT_SUCCESS(rc))
1798 {
1799 AssertMsg(rc == VINF_SUCCESS || rc == VINF_PGM_SYNC_CR3 /* not returned */, ("%Rrc\n", rc));
1800 rc = pgmPhysPageQueryTlbeWithPage(pVM, pPage, GCPhys, &pTlbe);
1801 }
1802 }
1803 if (RT_SUCCESS(rc))
1804 {
1805 /*
1806 * Now, just perform the locking and calculate the return address.
1807 */
1808 pgmPhysPageMapLockForWriting(pVM, pPage, pTlbe, pLock);
1809 *ppv = (void *)((uintptr_t)pTlbe->pv | (uintptr_t)(GCPhys & PAGE_OFFSET_MASK));
1810 }
1811 }
1812
1813 PGM_UNLOCK(pVM);
1814 return rc;
1815}
1816
1817
1818/**
1819 * Requests the mapping of a guest page into the current context.
1820 *
1821 * This API should only be used for very short term, as it will consume scarse
1822 * resources (R0 and GC) in the mapping cache. When you're done with the page,
1823 * call PGMPhysReleasePageMappingLock() ASAP to release it.
1824 *
1825 * @returns VBox status code.
1826 * @retval VINF_SUCCESS on success.
1827 * @retval VERR_PGM_PHYS_PAGE_RESERVED it it's a valid page but has no physical backing.
1828 * @retval VERR_PGM_INVALID_GC_PHYSICAL_ADDRESS if it's not a valid physical address.
1829 *
1830 * @param pVM The cross context VM structure.
1831 * @param GCPhys The guest physical address of the page that should be
1832 * mapped.
1833 * @param ppv Where to store the address corresponding to GCPhys.
1834 * @param pLock Where to store the lock information that
1835 * PGMPhysReleasePageMappingLock needs.
1836 *
1837 * @remarks The caller is responsible for dealing with access handlers.
1838 * @todo Add an informational return code for pages with access handlers?
1839 *
1840 * @remarks Avoid calling this API from within critical sections (other than
1841 * the PGM one) because of the deadlock risk.
1842 * @remarks Only one page is mapped! Make no assumption about what's after or
1843 * before the returned page!
1844 * @thread Any thread.
1845 */
1846VMM_INT_DECL(int) PGMPhysGCPhys2CCPtrReadOnly(PVMCC pVM, RTGCPHYS GCPhys, void const **ppv, PPGMPAGEMAPLOCK pLock)
1847{
1848 int rc = PGM_LOCK(pVM);
1849 AssertRCReturn(rc, rc);
1850
1851 /*
1852 * Query the Physical TLB entry for the page (may fail).
1853 */
1854 PPGMPAGEMAPTLBE pTlbe;
1855 rc = pgmPhysPageQueryTlbe(pVM, GCPhys, &pTlbe);
1856 if (RT_SUCCESS(rc))
1857 {
1858 /* MMIO pages doesn't have any readable backing. */
1859 PPGMPAGE pPage = pTlbe->pPage;
1860 if (RT_UNLIKELY(PGM_PAGE_IS_MMIO_OR_SPECIAL_ALIAS(pPage)))
1861 rc = VERR_PGM_PHYS_PAGE_RESERVED;
1862 else
1863 {
1864 /*
1865 * Now, just perform the locking and calculate the return address.
1866 */
1867 pgmPhysPageMapLockForReading(pVM, pPage, pTlbe, pLock);
1868 *ppv = (void *)((uintptr_t)pTlbe->pv | (uintptr_t)(GCPhys & PAGE_OFFSET_MASK));
1869 }
1870 }
1871
1872 PGM_UNLOCK(pVM);
1873 return rc;
1874}
1875
1876
1877/**
1878 * Requests the mapping of a guest page given by virtual address into the current context.
1879 *
1880 * This API should only be used for very short term, as it will consume
1881 * scarse resources (R0 and GC) in the mapping cache. When you're done
1882 * with the page, call PGMPhysReleasePageMappingLock() ASAP to release it.
1883 *
1884 * This API will assume your intention is to write to the page, and will
1885 * therefore replace shared and zero pages. If you do not intend to modify
1886 * the page, use the PGMPhysGCPtr2CCPtrReadOnly() API.
1887 *
1888 * @returns VBox status code.
1889 * @retval VINF_SUCCESS on success.
1890 * @retval VERR_PAGE_TABLE_NOT_PRESENT if the page directory for the virtual address isn't present.
1891 * @retval VERR_PAGE_NOT_PRESENT if the page at the virtual address isn't present.
1892 * @retval VERR_PGM_PHYS_PAGE_RESERVED it it's a valid page but has no physical backing.
1893 * @retval VERR_PGM_INVALID_GC_PHYSICAL_ADDRESS if it's not a valid physical address.
1894 *
1895 * @param pVCpu The cross context virtual CPU structure.
1896 * @param GCPtr The guest physical address of the page that should be
1897 * mapped.
1898 * @param ppv Where to store the address corresponding to GCPhys.
1899 * @param pLock Where to store the lock information that PGMPhysReleasePageMappingLock needs.
1900 *
1901 * @remark Avoid calling this API from within critical sections (other than
1902 * the PGM one) because of the deadlock risk.
1903 * @thread EMT
1904 */
1905VMM_INT_DECL(int) PGMPhysGCPtr2CCPtr(PVMCPUCC pVCpu, RTGCPTR GCPtr, void **ppv, PPGMPAGEMAPLOCK pLock)
1906{
1907 VM_ASSERT_EMT(pVCpu->CTX_SUFF(pVM));
1908 RTGCPHYS GCPhys;
1909 int rc = PGMPhysGCPtr2GCPhys(pVCpu, GCPtr, &GCPhys);
1910 if (RT_SUCCESS(rc))
1911 rc = PGMPhysGCPhys2CCPtr(pVCpu->CTX_SUFF(pVM), GCPhys, ppv, pLock);
1912 return rc;
1913}
1914
1915
1916/**
1917 * Requests the mapping of a guest page given by virtual address into the current context.
1918 *
1919 * This API should only be used for very short term, as it will consume
1920 * scarse resources (R0 and GC) in the mapping cache. When you're done
1921 * with the page, call PGMPhysReleasePageMappingLock() ASAP to release it.
1922 *
1923 * @returns VBox status code.
1924 * @retval VINF_SUCCESS on success.
1925 * @retval VERR_PAGE_TABLE_NOT_PRESENT if the page directory for the virtual address isn't present.
1926 * @retval VERR_PAGE_NOT_PRESENT if the page at the virtual address isn't present.
1927 * @retval VERR_PGM_PHYS_PAGE_RESERVED it it's a valid page but has no physical backing.
1928 * @retval VERR_PGM_INVALID_GC_PHYSICAL_ADDRESS if it's not a valid physical address.
1929 *
1930 * @param pVCpu The cross context virtual CPU structure.
1931 * @param GCPtr The guest physical address of the page that should be
1932 * mapped.
1933 * @param ppv Where to store the address corresponding to GCPtr.
1934 * @param pLock Where to store the lock information that PGMPhysReleasePageMappingLock needs.
1935 *
1936 * @remark Avoid calling this API from within critical sections (other than
1937 * the PGM one) because of the deadlock risk.
1938 * @thread EMT
1939 */
1940VMM_INT_DECL(int) PGMPhysGCPtr2CCPtrReadOnly(PVMCPUCC pVCpu, RTGCPTR GCPtr, void const **ppv, PPGMPAGEMAPLOCK pLock)
1941{
1942 VM_ASSERT_EMT(pVCpu->CTX_SUFF(pVM));
1943 RTGCPHYS GCPhys;
1944 int rc = PGMPhysGCPtr2GCPhys(pVCpu, GCPtr, &GCPhys);
1945 if (RT_SUCCESS(rc))
1946 rc = PGMPhysGCPhys2CCPtrReadOnly(pVCpu->CTX_SUFF(pVM), GCPhys, ppv, pLock);
1947 return rc;
1948}
1949
1950
1951/**
1952 * Release the mapping of a guest page.
1953 *
1954 * This is the counter part of PGMPhysGCPhys2CCPtr, PGMPhysGCPhys2CCPtrReadOnly
1955 * PGMPhysGCPtr2CCPtr and PGMPhysGCPtr2CCPtrReadOnly.
1956 *
1957 * @param pVM The cross context VM structure.
1958 * @param pLock The lock structure initialized by the mapping function.
1959 */
1960VMMDECL(void) PGMPhysReleasePageMappingLock(PVMCC pVM, PPGMPAGEMAPLOCK pLock)
1961{
1962# if !defined(IN_RING0) || !defined(VBOX_WITH_RAM_IN_KERNEL)
1963 PPGMPAGEMAP pMap = (PPGMPAGEMAP)pLock->pvMap;
1964# endif
1965 PPGMPAGE pPage = (PPGMPAGE)(pLock->uPageAndType & ~PGMPAGEMAPLOCK_TYPE_MASK);
1966 bool fWriteLock = (pLock->uPageAndType & PGMPAGEMAPLOCK_TYPE_MASK) == PGMPAGEMAPLOCK_TYPE_WRITE;
1967
1968 pLock->uPageAndType = 0;
1969 pLock->pvMap = NULL;
1970
1971 PGM_LOCK_VOID(pVM);
1972 if (fWriteLock)
1973 {
1974 unsigned cLocks = PGM_PAGE_GET_WRITE_LOCKS(pPage);
1975 Assert(cLocks > 0);
1976 if (RT_LIKELY(cLocks > 0 && cLocks < PGM_PAGE_MAX_LOCKS))
1977 {
1978 if (cLocks == 1)
1979 {
1980 Assert(pVM->pgm.s.cWriteLockedPages > 0);
1981 pVM->pgm.s.cWriteLockedPages--;
1982 }
1983 PGM_PAGE_DEC_WRITE_LOCKS(pPage);
1984 }
1985
1986 if (PGM_PAGE_GET_STATE(pPage) != PGM_PAGE_STATE_WRITE_MONITORED)
1987 { /* probably extremely likely */ }
1988 else
1989 pgmPhysPageMakeWriteMonitoredWritable(pVM, pPage, NIL_RTGCPHYS);
1990 }
1991 else
1992 {
1993 unsigned cLocks = PGM_PAGE_GET_READ_LOCKS(pPage);
1994 Assert(cLocks > 0);
1995 if (RT_LIKELY(cLocks > 0 && cLocks < PGM_PAGE_MAX_LOCKS))
1996 {
1997 if (cLocks == 1)
1998 {
1999 Assert(pVM->pgm.s.cReadLockedPages > 0);
2000 pVM->pgm.s.cReadLockedPages--;
2001 }
2002 PGM_PAGE_DEC_READ_LOCKS(pPage);
2003 }
2004 }
2005
2006# if !defined(IN_RING0) || !defined(VBOX_WITH_RAM_IN_KERNEL)
2007 if (pMap)
2008 {
2009 Assert(pMap->cRefs >= 1);
2010 pMap->cRefs--;
2011 }
2012# endif
2013 PGM_UNLOCK(pVM);
2014}
2015
2016
2017#ifdef IN_RING3
2018/**
2019 * Release the mapping of multiple guest pages.
2020 *
2021 * This is the counter part to PGMR3PhysBulkGCPhys2CCPtrExternal() and
2022 * PGMR3PhysBulkGCPhys2CCPtrReadOnlyExternal().
2023 *
2024 * @param pVM The cross context VM structure.
2025 * @param cPages Number of pages to unlock.
2026 * @param paLocks Array of locks lock structure initialized by the mapping
2027 * function.
2028 */
2029VMMDECL(void) PGMPhysBulkReleasePageMappingLocks(PVMCC pVM, uint32_t cPages, PPGMPAGEMAPLOCK paLocks)
2030{
2031 Assert(cPages > 0);
2032 bool const fWriteLock = (paLocks[0].uPageAndType & PGMPAGEMAPLOCK_TYPE_MASK) == PGMPAGEMAPLOCK_TYPE_WRITE;
2033#ifdef VBOX_STRICT
2034 for (uint32_t i = 1; i < cPages; i++)
2035 {
2036 Assert(fWriteLock == ((paLocks[i].uPageAndType & PGMPAGEMAPLOCK_TYPE_MASK) == PGMPAGEMAPLOCK_TYPE_WRITE));
2037 AssertPtr(paLocks[i].uPageAndType);
2038 }
2039#endif
2040
2041 PGM_LOCK_VOID(pVM);
2042 if (fWriteLock)
2043 {
2044 /*
2045 * Write locks:
2046 */
2047 for (uint32_t i = 0; i < cPages; i++)
2048 {
2049 PPGMPAGE pPage = (PPGMPAGE)(paLocks[i].uPageAndType & ~PGMPAGEMAPLOCK_TYPE_MASK);
2050 unsigned cLocks = PGM_PAGE_GET_WRITE_LOCKS(pPage);
2051 Assert(cLocks > 0);
2052 if (RT_LIKELY(cLocks > 0 && cLocks < PGM_PAGE_MAX_LOCKS))
2053 {
2054 if (cLocks == 1)
2055 {
2056 Assert(pVM->pgm.s.cWriteLockedPages > 0);
2057 pVM->pgm.s.cWriteLockedPages--;
2058 }
2059 PGM_PAGE_DEC_WRITE_LOCKS(pPage);
2060 }
2061
2062 if (PGM_PAGE_GET_STATE(pPage) != PGM_PAGE_STATE_WRITE_MONITORED)
2063 { /* probably extremely likely */ }
2064 else
2065 pgmPhysPageMakeWriteMonitoredWritable(pVM, pPage, NIL_RTGCPHYS);
2066
2067 PPGMPAGEMAP pMap = (PPGMPAGEMAP)paLocks[i].pvMap;
2068 if (pMap)
2069 {
2070 Assert(pMap->cRefs >= 1);
2071 pMap->cRefs--;
2072 }
2073
2074 /* Yield the lock: */
2075 if ((i & 1023) == 1023 && i + 1 < cPages)
2076 {
2077 PGM_UNLOCK(pVM);
2078 PGM_LOCK_VOID(pVM);
2079 }
2080 }
2081 }
2082 else
2083 {
2084 /*
2085 * Read locks:
2086 */
2087 for (uint32_t i = 0; i < cPages; i++)
2088 {
2089 PPGMPAGE pPage = (PPGMPAGE)(paLocks[i].uPageAndType & ~PGMPAGEMAPLOCK_TYPE_MASK);
2090 unsigned cLocks = PGM_PAGE_GET_READ_LOCKS(pPage);
2091 Assert(cLocks > 0);
2092 if (RT_LIKELY(cLocks > 0 && cLocks < PGM_PAGE_MAX_LOCKS))
2093 {
2094 if (cLocks == 1)
2095 {
2096 Assert(pVM->pgm.s.cReadLockedPages > 0);
2097 pVM->pgm.s.cReadLockedPages--;
2098 }
2099 PGM_PAGE_DEC_READ_LOCKS(pPage);
2100 }
2101
2102 PPGMPAGEMAP pMap = (PPGMPAGEMAP)paLocks[i].pvMap;
2103 if (pMap)
2104 {
2105 Assert(pMap->cRefs >= 1);
2106 pMap->cRefs--;
2107 }
2108
2109 /* Yield the lock: */
2110 if ((i & 1023) == 1023 && i + 1 < cPages)
2111 {
2112 PGM_UNLOCK(pVM);
2113 PGM_LOCK_VOID(pVM);
2114 }
2115 }
2116 }
2117 PGM_UNLOCK(pVM);
2118
2119 RT_BZERO(paLocks, sizeof(paLocks[0]) * cPages);
2120}
2121#endif /* IN_RING3 */
2122
2123
2124/**
2125 * Release the internal mapping of a guest page.
2126 *
2127 * This is the counter part of pgmPhysGCPhys2CCPtrInternalEx and
2128 * pgmPhysGCPhys2CCPtrInternalReadOnly.
2129 *
2130 * @param pVM The cross context VM structure.
2131 * @param pLock The lock structure initialized by the mapping function.
2132 *
2133 * @remarks Caller must hold the PGM lock.
2134 */
2135void pgmPhysReleaseInternalPageMappingLock(PVMCC pVM, PPGMPAGEMAPLOCK pLock)
2136{
2137 PGM_LOCK_ASSERT_OWNER(pVM);
2138 PGMPhysReleasePageMappingLock(pVM, pLock); /* lazy for now */
2139}
2140
2141
2142/**
2143 * Converts a GC physical address to a HC ring-3 pointer.
2144 *
2145 * @returns VINF_SUCCESS on success.
2146 * @returns VERR_PGM_PHYS_PAGE_RESERVED it it's a valid GC physical
2147 * page but has no physical backing.
2148 * @returns VERR_PGM_INVALID_GC_PHYSICAL_ADDRESS if it's not a valid
2149 * GC physical address.
2150 * @returns VERR_PGM_GCPHYS_RANGE_CROSSES_BOUNDARY if the range crosses
2151 * a dynamic ram chunk boundary
2152 *
2153 * @param pVM The cross context VM structure.
2154 * @param GCPhys The GC physical address to convert.
2155 * @param pR3Ptr Where to store the R3 pointer on success.
2156 *
2157 * @deprecated Avoid when possible!
2158 */
2159int pgmPhysGCPhys2R3Ptr(PVMCC pVM, RTGCPHYS GCPhys, PRTR3PTR pR3Ptr)
2160{
2161/** @todo this is kind of hacky and needs some more work. */
2162#ifndef DEBUG_sandervl
2163 VM_ASSERT_EMT(pVM); /* no longer safe for use outside the EMT thread! */
2164#endif
2165
2166 Log(("pgmPhysGCPhys2R3Ptr(,%RGp,): dont use this API!\n", GCPhys)); /** @todo eliminate this API! */
2167 PGM_LOCK_VOID(pVM);
2168
2169 PPGMRAMRANGE pRam;
2170 PPGMPAGE pPage;
2171 int rc = pgmPhysGetPageAndRangeEx(pVM, GCPhys, &pPage, &pRam);
2172 if (RT_SUCCESS(rc))
2173 rc = pgmPhysGCPhys2CCPtrInternalDepr(pVM, pPage, GCPhys, (void **)pR3Ptr);
2174
2175 PGM_UNLOCK(pVM);
2176 Assert(rc <= VINF_SUCCESS);
2177 return rc;
2178}
2179
2180
2181/**
2182 * Converts a guest pointer to a GC physical address.
2183 *
2184 * This uses the current CR3/CR0/CR4 of the guest.
2185 *
2186 * @returns VBox status code.
2187 * @param pVCpu The cross context virtual CPU structure.
2188 * @param GCPtr The guest pointer to convert.
2189 * @param pGCPhys Where to store the GC physical address.
2190 */
2191VMMDECL(int) PGMPhysGCPtr2GCPhys(PVMCPUCC pVCpu, RTGCPTR GCPtr, PRTGCPHYS pGCPhys)
2192{
2193 int rc = PGMGstGetPage(pVCpu, (RTGCUINTPTR)GCPtr, NULL, pGCPhys);
2194 if (pGCPhys && RT_SUCCESS(rc))
2195 *pGCPhys |= (RTGCUINTPTR)GCPtr & PAGE_OFFSET_MASK;
2196 return rc;
2197}
2198
2199
2200/**
2201 * Converts a guest pointer to a HC physical address.
2202 *
2203 * This uses the current CR3/CR0/CR4 of the guest.
2204 *
2205 * @returns VBox status code.
2206 * @param pVCpu The cross context virtual CPU structure.
2207 * @param GCPtr The guest pointer to convert.
2208 * @param pHCPhys Where to store the HC physical address.
2209 */
2210VMM_INT_DECL(int) PGMPhysGCPtr2HCPhys(PVMCPUCC pVCpu, RTGCPTR GCPtr, PRTHCPHYS pHCPhys)
2211{
2212 PVMCC pVM = pVCpu->CTX_SUFF(pVM);
2213 RTGCPHYS GCPhys;
2214 int rc = PGMGstGetPage(pVCpu, (RTGCUINTPTR)GCPtr, NULL, &GCPhys);
2215 if (RT_SUCCESS(rc))
2216 rc = PGMPhysGCPhys2HCPhys(pVM, GCPhys | ((RTGCUINTPTR)GCPtr & PAGE_OFFSET_MASK), pHCPhys);
2217 return rc;
2218}
2219
2220
2221
2222#undef LOG_GROUP
2223#define LOG_GROUP LOG_GROUP_PGM_PHYS_ACCESS
2224
2225
2226#if defined(IN_RING3) && defined(SOME_UNUSED_FUNCTION)
2227/**
2228 * Cache PGMPhys memory access
2229 *
2230 * @param pVM The cross context VM structure.
2231 * @param pCache Cache structure pointer
2232 * @param GCPhys GC physical address
2233 * @param pbHC HC pointer corresponding to physical page
2234 *
2235 * @thread EMT.
2236 */
2237static void pgmPhysCacheAdd(PVM pVM, PGMPHYSCACHE *pCache, RTGCPHYS GCPhys, uint8_t *pbR3)
2238{
2239 uint32_t iCacheIndex;
2240
2241 Assert(VM_IS_EMT(pVM));
2242
2243 GCPhys = PHYS_PAGE_ADDRESS(GCPhys);
2244 pbR3 = (uint8_t *)PAGE_ADDRESS(pbR3);
2245
2246 iCacheIndex = ((GCPhys >> PAGE_SHIFT) & PGM_MAX_PHYSCACHE_ENTRIES_MASK);
2247
2248 ASMBitSet(&pCache->aEntries, iCacheIndex);
2249
2250 pCache->Entry[iCacheIndex].GCPhys = GCPhys;
2251 pCache->Entry[iCacheIndex].pbR3 = pbR3;
2252}
2253#endif /* IN_RING3 */
2254
2255
2256/**
2257 * Deals with reading from a page with one or more ALL access handlers.
2258 *
2259 * @returns Strict VBox status code in ring-0 and raw-mode, ignorable in ring-3.
2260 * See PGM_HANDLER_PHYS_IS_VALID_STATUS and
2261 * PGM_HANDLER_VIRT_IS_VALID_STATUS for details.
2262 *
2263 * @param pVM The cross context VM structure.
2264 * @param pPage The page descriptor.
2265 * @param GCPhys The physical address to start reading at.
2266 * @param pvBuf Where to put the bits we read.
2267 * @param cb How much to read - less or equal to a page.
2268 * @param enmOrigin The origin of this call.
2269 */
2270static VBOXSTRICTRC pgmPhysReadHandler(PVMCC pVM, PPGMPAGE pPage, RTGCPHYS GCPhys, void *pvBuf, size_t cb,
2271 PGMACCESSORIGIN enmOrigin)
2272{
2273 /*
2274 * The most frequent access here is MMIO and shadowed ROM.
2275 * The current code ASSUMES all these access handlers covers full pages!
2276 */
2277
2278 /*
2279 * Whatever we do we need the source page, map it first.
2280 */
2281 PGMPAGEMAPLOCK PgMpLck;
2282 const void *pvSrc = NULL;
2283 int rc = pgmPhysGCPhys2CCPtrInternalReadOnly(pVM, pPage, GCPhys, &pvSrc, &PgMpLck);
2284/** @todo Check how this can work for MMIO pages? */
2285 if (RT_FAILURE(rc))
2286 {
2287 AssertLogRelMsgFailed(("pgmPhysGCPhys2CCPtrInternalReadOnly failed on %RGp / %R[pgmpage] -> %Rrc\n",
2288 GCPhys, pPage, rc));
2289 memset(pvBuf, 0xff, cb);
2290 return VINF_SUCCESS;
2291 }
2292
2293 VBOXSTRICTRC rcStrict = VINF_PGM_HANDLER_DO_DEFAULT;
2294
2295 /*
2296 * Deal with any physical handlers.
2297 */
2298 PVMCPUCC pVCpu = VMMGetCpu(pVM);
2299 PPGMPHYSHANDLER pPhys = NULL;
2300 if ( PGM_PAGE_GET_HNDL_PHYS_STATE(pPage) == PGM_PAGE_HNDL_PHYS_STATE_ALL
2301 || PGM_PAGE_IS_MMIO_OR_SPECIAL_ALIAS(pPage))
2302 {
2303 pPhys = pgmHandlerPhysicalLookup(pVM, GCPhys);
2304 AssertReleaseMsg(pPhys, ("GCPhys=%RGp cb=%#x\n", GCPhys, cb));
2305 Assert(GCPhys >= pPhys->Core.Key && GCPhys <= pPhys->Core.KeyLast);
2306 Assert((pPhys->Core.Key & PAGE_OFFSET_MASK) == 0);
2307 Assert((pPhys->Core.KeyLast & PAGE_OFFSET_MASK) == PAGE_OFFSET_MASK);
2308#ifndef IN_RING3
2309 if (enmOrigin != PGMACCESSORIGIN_IEM)
2310 {
2311 /* Cannot reliably handle informational status codes in this context */
2312 pgmPhysReleaseInternalPageMappingLock(pVM, &PgMpLck);
2313 return VERR_PGM_PHYS_WR_HIT_HANDLER;
2314 }
2315#endif
2316 PFNPGMPHYSHANDLER pfnHandler = PGMPHYSHANDLER_GET_TYPE(pVM, pPhys)->CTX_SUFF(pfnHandler); Assert(pfnHandler);
2317 void *pvUser = pPhys->CTX_SUFF(pvUser);
2318
2319 Log5(("pgmPhysReadHandler: GCPhys=%RGp cb=%#x pPage=%R[pgmpage] phys %s\n", GCPhys, cb, pPage, R3STRING(pPhys->pszDesc) ));
2320 STAM_PROFILE_START(&pPhys->Stat, h);
2321 PGM_LOCK_ASSERT_OWNER(pVM);
2322
2323 /* Release the PGM lock as MMIO handlers take the IOM lock. (deadlock prevention) */
2324 PGM_UNLOCK(pVM);
2325 rcStrict = pfnHandler(pVM, pVCpu, GCPhys, (void *)pvSrc, pvBuf, cb, PGMACCESSTYPE_READ, enmOrigin, pvUser);
2326 PGM_LOCK_VOID(pVM);
2327
2328#ifdef VBOX_WITH_STATISTICS
2329 pPhys = pgmHandlerPhysicalLookup(pVM, GCPhys);
2330 if (pPhys)
2331 STAM_PROFILE_STOP(&pPhys->Stat, h);
2332#else
2333 pPhys = NULL; /* might not be valid anymore. */
2334#endif
2335 AssertLogRelMsg(PGM_HANDLER_PHYS_IS_VALID_STATUS(rcStrict, false),
2336 ("rcStrict=%Rrc GCPhys=%RGp\n", VBOXSTRICTRC_VAL(rcStrict), GCPhys));
2337 if ( rcStrict != VINF_PGM_HANDLER_DO_DEFAULT
2338 && !PGM_PHYS_RW_IS_SUCCESS(rcStrict))
2339 {
2340 pgmPhysReleaseInternalPageMappingLock(pVM, &PgMpLck);
2341 return rcStrict;
2342 }
2343 }
2344
2345 /*
2346 * Take the default action.
2347 */
2348 if (rcStrict == VINF_PGM_HANDLER_DO_DEFAULT)
2349 {
2350 memcpy(pvBuf, pvSrc, cb);
2351 rcStrict = VINF_SUCCESS;
2352 }
2353 pgmPhysReleaseInternalPageMappingLock(pVM, &PgMpLck);
2354 return rcStrict;
2355}
2356
2357
2358/**
2359 * Read physical memory.
2360 *
2361 * This API respects access handlers and MMIO. Use PGMPhysSimpleReadGCPhys() if you
2362 * want to ignore those.
2363 *
2364 * @returns Strict VBox status code in raw-mode and ring-0, normal VBox status
2365 * code in ring-3. Use PGM_PHYS_RW_IS_SUCCESS to check.
2366 * @retval VINF_SUCCESS in all context - read completed.
2367 *
2368 * @retval VINF_EM_OFF in RC and R0 - read completed.
2369 * @retval VINF_EM_SUSPEND in RC and R0 - read completed.
2370 * @retval VINF_EM_RESET in RC and R0 - read completed.
2371 * @retval VINF_EM_HALT in RC and R0 - read completed.
2372 * @retval VINF_SELM_SYNC_GDT in RC only - read completed.
2373 *
2374 * @retval VINF_EM_DBG_STOP in RC and R0 - read completed.
2375 * @retval VINF_EM_DBG_BREAKPOINT in RC and R0 - read completed.
2376 * @retval VINF_EM_RAW_EMULATE_INSTR in RC and R0 only.
2377 *
2378 * @retval VINF_IOM_R3_MMIO_READ in RC and R0.
2379 * @retval VINF_IOM_R3_MMIO_READ_WRITE in RC and R0.
2380 *
2381 * @retval VINF_PATM_CHECK_PATCH_PAGE in RC only.
2382 *
2383 * @retval VERR_PGM_PHYS_WR_HIT_HANDLER in RC and R0 for access origins that
2384 * haven't been cleared for strict status codes yet.
2385 *
2386 * @param pVM The cross context VM structure.
2387 * @param GCPhys Physical address start reading from.
2388 * @param pvBuf Where to put the read bits.
2389 * @param cbRead How many bytes to read.
2390 * @param enmOrigin The origin of this call.
2391 */
2392VMMDECL(VBOXSTRICTRC) PGMPhysRead(PVMCC pVM, RTGCPHYS GCPhys, void *pvBuf, size_t cbRead, PGMACCESSORIGIN enmOrigin)
2393{
2394 AssertMsgReturn(cbRead > 0, ("don't even think about reading zero bytes!\n"), VINF_SUCCESS);
2395 LogFlow(("PGMPhysRead: %RGp %d\n", GCPhys, cbRead));
2396
2397 STAM_COUNTER_INC(&pVM->pgm.s.CTX_SUFF(pStats)->CTX_MID_Z(Stat,PhysRead));
2398 STAM_COUNTER_ADD(&pVM->pgm.s.CTX_SUFF(pStats)->CTX_MID_Z(Stat,PhysReadBytes), cbRead);
2399
2400 PGM_LOCK_VOID(pVM);
2401
2402 /*
2403 * Copy loop on ram ranges.
2404 */
2405 VBOXSTRICTRC rcStrict = VINF_SUCCESS;
2406 PPGMRAMRANGE pRam = pgmPhysGetRangeAtOrAbove(pVM, GCPhys);
2407 for (;;)
2408 {
2409 /* Inside range or not? */
2410 if (pRam && GCPhys >= pRam->GCPhys)
2411 {
2412 /*
2413 * Must work our way thru this page by page.
2414 */
2415 RTGCPHYS off = GCPhys - pRam->GCPhys;
2416 while (off < pRam->cb)
2417 {
2418 unsigned iPage = off >> PAGE_SHIFT;
2419 PPGMPAGE pPage = &pRam->aPages[iPage];
2420 size_t cb = PAGE_SIZE - (off & PAGE_OFFSET_MASK);
2421 if (cb > cbRead)
2422 cb = cbRead;
2423
2424 /*
2425 * Normal page? Get the pointer to it.
2426 */
2427 if ( !PGM_PAGE_HAS_ACTIVE_ALL_HANDLERS(pPage)
2428 && !PGM_PAGE_IS_SPECIAL_ALIAS_MMIO(pPage))
2429 {
2430 /*
2431 * Get the pointer to the page.
2432 */
2433 PGMPAGEMAPLOCK PgMpLck;
2434 const void *pvSrc;
2435 int rc = pgmPhysGCPhys2CCPtrInternalReadOnly(pVM, pPage, pRam->GCPhys + off, &pvSrc, &PgMpLck);
2436 if (RT_SUCCESS(rc))
2437 {
2438 memcpy(pvBuf, pvSrc, cb);
2439 pgmPhysReleaseInternalPageMappingLock(pVM, &PgMpLck);
2440 }
2441 else
2442 {
2443 AssertLogRelMsgFailed(("pgmPhysGCPhys2CCPtrInternalReadOnly failed on %RGp / %R[pgmpage] -> %Rrc\n",
2444 pRam->GCPhys + off, pPage, rc));
2445 memset(pvBuf, 0xff, cb);
2446 }
2447 }
2448 /*
2449 * Have ALL/MMIO access handlers.
2450 */
2451 else
2452 {
2453 VBOXSTRICTRC rcStrict2 = pgmPhysReadHandler(pVM, pPage, pRam->GCPhys + off, pvBuf, cb, enmOrigin);
2454 if (PGM_PHYS_RW_IS_SUCCESS(rcStrict2))
2455 PGM_PHYS_RW_DO_UPDATE_STRICT_RC(rcStrict, rcStrict2);
2456 else
2457 {
2458 memset(pvBuf, 0xff, cb);
2459 PGM_UNLOCK(pVM);
2460 return rcStrict2;
2461 }
2462 }
2463
2464 /* next page */
2465 if (cb >= cbRead)
2466 {
2467 PGM_UNLOCK(pVM);
2468 return rcStrict;
2469 }
2470 cbRead -= cb;
2471 off += cb;
2472 pvBuf = (char *)pvBuf + cb;
2473 } /* walk pages in ram range. */
2474
2475 GCPhys = pRam->GCPhysLast + 1;
2476 }
2477 else
2478 {
2479 LogFlow(("PGMPhysRead: Unassigned %RGp size=%u\n", GCPhys, cbRead));
2480
2481 /*
2482 * Unassigned address space.
2483 */
2484 size_t cb = pRam ? pRam->GCPhys - GCPhys : ~(size_t)0;
2485 if (cb >= cbRead)
2486 {
2487 memset(pvBuf, 0xff, cbRead);
2488 break;
2489 }
2490 memset(pvBuf, 0xff, cb);
2491
2492 cbRead -= cb;
2493 pvBuf = (char *)pvBuf + cb;
2494 GCPhys += cb;
2495 }
2496
2497 /* Advance range if necessary. */
2498 while (pRam && GCPhys > pRam->GCPhysLast)
2499 pRam = pRam->CTX_SUFF(pNext);
2500 } /* Ram range walk */
2501
2502 PGM_UNLOCK(pVM);
2503 return rcStrict;
2504}
2505
2506
2507/**
2508 * Deals with writing to a page with one or more WRITE or ALL access handlers.
2509 *
2510 * @returns Strict VBox status code in ring-0 and raw-mode, ignorable in ring-3.
2511 * See PGM_HANDLER_PHYS_IS_VALID_STATUS and
2512 * PGM_HANDLER_VIRT_IS_VALID_STATUS for details.
2513 *
2514 * @param pVM The cross context VM structure.
2515 * @param pPage The page descriptor.
2516 * @param GCPhys The physical address to start writing at.
2517 * @param pvBuf What to write.
2518 * @param cbWrite How much to write - less or equal to a page.
2519 * @param enmOrigin The origin of this call.
2520 */
2521static VBOXSTRICTRC pgmPhysWriteHandler(PVMCC pVM, PPGMPAGE pPage, RTGCPHYS GCPhys, void const *pvBuf, size_t cbWrite,
2522 PGMACCESSORIGIN enmOrigin)
2523{
2524 PGMPAGEMAPLOCK PgMpLck;
2525 void *pvDst = NULL;
2526 VBOXSTRICTRC rcStrict;
2527
2528 /*
2529 * Give priority to physical handlers (like #PF does).
2530 *
2531 * Hope for a lonely physical handler first that covers the whole
2532 * write area. This should be a pretty frequent case with MMIO and
2533 * the heavy usage of full page handlers in the page pool.
2534 */
2535 PVMCPUCC pVCpu = VMMGetCpu(pVM);
2536 PPGMPHYSHANDLER pCur = pgmHandlerPhysicalLookup(pVM, GCPhys);
2537 if (pCur)
2538 {
2539 Assert(GCPhys >= pCur->Core.Key && GCPhys <= pCur->Core.KeyLast);
2540#ifndef IN_RING3
2541 if (enmOrigin != PGMACCESSORIGIN_IEM)
2542 /* Cannot reliably handle informational status codes in this context */
2543 return VERR_PGM_PHYS_WR_HIT_HANDLER;
2544#endif
2545 size_t cbRange = pCur->Core.KeyLast - GCPhys + 1;
2546 if (cbRange > cbWrite)
2547 cbRange = cbWrite;
2548
2549 Assert(PGMPHYSHANDLER_GET_TYPE(pVM, pCur)->CTX_SUFF(pfnHandler));
2550 Log5(("pgmPhysWriteHandler: GCPhys=%RGp cbRange=%#x pPage=%R[pgmpage] phys %s\n",
2551 GCPhys, cbRange, pPage, R3STRING(pCur->pszDesc) ));
2552 if (!PGM_PAGE_IS_MMIO_OR_SPECIAL_ALIAS(pPage))
2553 rcStrict = pgmPhysGCPhys2CCPtrInternal(pVM, pPage, GCPhys, &pvDst, &PgMpLck);
2554 else
2555 rcStrict = VINF_SUCCESS;
2556 if (RT_SUCCESS(rcStrict))
2557 {
2558 PFNPGMPHYSHANDLER pfnHandler = PGMPHYSHANDLER_GET_TYPE(pVM, pCur)->CTX_SUFF(pfnHandler);
2559 void *pvUser = pCur->CTX_SUFF(pvUser);
2560 STAM_PROFILE_START(&pCur->Stat, h);
2561
2562 /* Release the PGM lock as MMIO handlers take the IOM lock. (deadlock prevention) */
2563 PGM_LOCK_ASSERT_OWNER(pVM);
2564 PGM_UNLOCK(pVM);
2565 rcStrict = pfnHandler(pVM, pVCpu, GCPhys, pvDst, (void *)pvBuf, cbRange, PGMACCESSTYPE_WRITE, enmOrigin, pvUser);
2566 PGM_LOCK_VOID(pVM);
2567
2568#ifdef VBOX_WITH_STATISTICS
2569 pCur = pgmHandlerPhysicalLookup(pVM, GCPhys);
2570 if (pCur)
2571 STAM_PROFILE_STOP(&pCur->Stat, h);
2572#else
2573 pCur = NULL; /* might not be valid anymore. */
2574#endif
2575 if (rcStrict == VINF_PGM_HANDLER_DO_DEFAULT)
2576 {
2577 if (pvDst)
2578 memcpy(pvDst, pvBuf, cbRange);
2579 rcStrict = VINF_SUCCESS;
2580 }
2581 else
2582 AssertLogRelMsg(PGM_HANDLER_PHYS_IS_VALID_STATUS(rcStrict, true),
2583 ("rcStrict=%Rrc GCPhys=%RGp pPage=%R[pgmpage] %s\n",
2584 VBOXSTRICTRC_VAL(rcStrict), GCPhys, pPage, pCur ? R3STRING(pCur->pszDesc) : ""));
2585 }
2586 else
2587 AssertLogRelMsgFailedReturn(("pgmPhysGCPhys2CCPtrInternal failed on %RGp / %R[pgmpage] -> %Rrc\n",
2588 GCPhys, pPage, VBOXSTRICTRC_VAL(rcStrict)), rcStrict);
2589 if (RT_LIKELY(cbRange == cbWrite) || !PGM_PHYS_RW_IS_SUCCESS(rcStrict))
2590 {
2591 if (pvDst)
2592 pgmPhysReleaseInternalPageMappingLock(pVM, &PgMpLck);
2593 return rcStrict;
2594 }
2595
2596 /* more fun to be had below */
2597 cbWrite -= cbRange;
2598 GCPhys += cbRange;
2599 pvBuf = (uint8_t *)pvBuf + cbRange;
2600 pvDst = (uint8_t *)pvDst + cbRange;
2601 }
2602 else /* The handler is somewhere else in the page, deal with it below. */
2603 rcStrict = VINF_SUCCESS;
2604 Assert(!PGM_PAGE_IS_MMIO_OR_ALIAS(pPage)); /* MMIO handlers are all PAGE_SIZEed! */
2605
2606 /*
2607 * Deal with all the odd ends (used to be deal with virt+phys).
2608 */
2609 Assert(rcStrict != VINF_PGM_HANDLER_DO_DEFAULT);
2610
2611 /* We need a writable destination page. */
2612 if (!pvDst)
2613 {
2614 int rc2 = pgmPhysGCPhys2CCPtrInternal(pVM, pPage, GCPhys, &pvDst, &PgMpLck);
2615 AssertLogRelMsgReturn(RT_SUCCESS(rc2),
2616 ("pgmPhysGCPhys2CCPtrInternal failed on %RGp / %R[pgmpage] -> %Rrc\n", GCPhys, pPage, rc2),
2617 rc2);
2618 }
2619
2620 /* The loop state (big + ugly). */
2621 PPGMPHYSHANDLER pPhys = NULL;
2622 uint32_t offPhys = PAGE_SIZE;
2623 uint32_t offPhysLast = PAGE_SIZE;
2624 bool fMorePhys = PGM_PAGE_HAS_ACTIVE_PHYSICAL_HANDLERS(pPage);
2625
2626 /* The loop. */
2627 for (;;)
2628 {
2629 if (fMorePhys && !pPhys)
2630 {
2631 pPhys = pgmHandlerPhysicalLookup(pVM, GCPhys);
2632 if (pPhys)
2633 {
2634 offPhys = 0;
2635 offPhysLast = pPhys->Core.KeyLast - GCPhys; /* ASSUMES < 4GB handlers... */
2636 }
2637 else
2638 {
2639 pPhys = (PPGMPHYSHANDLER)RTAvlroGCPhysGetBestFit(&pVM->pgm.s.CTX_SUFF(pTrees)->PhysHandlers,
2640 GCPhys, true /* fAbove */);
2641 if ( pPhys
2642 && pPhys->Core.Key <= GCPhys + (cbWrite - 1))
2643 {
2644 offPhys = pPhys->Core.Key - GCPhys;
2645 offPhysLast = pPhys->Core.KeyLast - GCPhys; /* ASSUMES < 4GB handlers... */
2646 }
2647 else
2648 {
2649 pPhys = NULL;
2650 fMorePhys = false;
2651 offPhys = offPhysLast = PAGE_SIZE;
2652 }
2653 }
2654 }
2655
2656 /*
2657 * Handle access to space without handlers (that's easy).
2658 */
2659 VBOXSTRICTRC rcStrict2 = VINF_PGM_HANDLER_DO_DEFAULT;
2660 uint32_t cbRange = (uint32_t)cbWrite;
2661
2662 /*
2663 * Physical handler.
2664 */
2665 if (!offPhys)
2666 {
2667#ifndef IN_RING3
2668 if (enmOrigin != PGMACCESSORIGIN_IEM)
2669 /* Cannot reliably handle informational status codes in this context */
2670 return VERR_PGM_PHYS_WR_HIT_HANDLER;
2671#endif
2672 if (cbRange > offPhysLast + 1)
2673 cbRange = offPhysLast + 1;
2674
2675 PFNPGMPHYSHANDLER pfnHandler = PGMPHYSHANDLER_GET_TYPE(pVM, pPhys)->CTX_SUFF(pfnHandler);
2676 void *pvUser = pPhys->CTX_SUFF(pvUser);
2677
2678 Log5(("pgmPhysWriteHandler: GCPhys=%RGp cbRange=%#x pPage=%R[pgmpage] phys %s\n", GCPhys, cbRange, pPage, R3STRING(pPhys->pszDesc) ));
2679 STAM_PROFILE_START(&pPhys->Stat, h);
2680
2681 /* Release the PGM lock as MMIO handlers take the IOM lock. (deadlock prevention) */
2682 PGM_LOCK_ASSERT_OWNER(pVM);
2683 PGM_UNLOCK(pVM);
2684 rcStrict2 = pfnHandler(pVM, pVCpu, GCPhys, pvDst, (void *)pvBuf, cbRange, PGMACCESSTYPE_WRITE, enmOrigin, pvUser);
2685 PGM_LOCK_VOID(pVM);
2686
2687#ifdef VBOX_WITH_STATISTICS
2688 pPhys = pgmHandlerPhysicalLookup(pVM, GCPhys);
2689 if (pPhys)
2690 STAM_PROFILE_STOP(&pPhys->Stat, h);
2691#else
2692 pPhys = NULL; /* might not be valid anymore. */
2693#endif
2694 AssertLogRelMsg(PGM_HANDLER_PHYS_IS_VALID_STATUS(rcStrict2, true),
2695 ("rcStrict2=%Rrc (rcStrict=%Rrc) GCPhys=%RGp pPage=%R[pgmpage] %s\n", VBOXSTRICTRC_VAL(rcStrict2),
2696 VBOXSTRICTRC_VAL(rcStrict), GCPhys, pPage, pPhys ? R3STRING(pPhys->pszDesc) : ""));
2697 }
2698
2699 /*
2700 * Execute the default action and merge the status codes.
2701 */
2702 if (rcStrict2 == VINF_PGM_HANDLER_DO_DEFAULT)
2703 {
2704 memcpy(pvDst, pvBuf, cbRange);
2705 rcStrict2 = VINF_SUCCESS;
2706 }
2707 else if (!PGM_PHYS_RW_IS_SUCCESS(rcStrict2))
2708 {
2709 pgmPhysReleaseInternalPageMappingLock(pVM, &PgMpLck);
2710 return rcStrict2;
2711 }
2712 else
2713 PGM_PHYS_RW_DO_UPDATE_STRICT_RC(rcStrict, rcStrict2);
2714
2715 /*
2716 * Advance if we've got more stuff to do.
2717 */
2718 if (cbRange >= cbWrite)
2719 {
2720 pgmPhysReleaseInternalPageMappingLock(pVM, &PgMpLck);
2721 return rcStrict;
2722 }
2723
2724
2725 cbWrite -= cbRange;
2726 GCPhys += cbRange;
2727 pvBuf = (uint8_t *)pvBuf + cbRange;
2728 pvDst = (uint8_t *)pvDst + cbRange;
2729
2730 offPhys -= cbRange;
2731 offPhysLast -= cbRange;
2732 }
2733}
2734
2735
2736/**
2737 * Write to physical memory.
2738 *
2739 * This API respects access handlers and MMIO. Use PGMPhysSimpleWriteGCPhys() if you
2740 * want to ignore those.
2741 *
2742 * @returns Strict VBox status code in raw-mode and ring-0, normal VBox status
2743 * code in ring-3. Use PGM_PHYS_RW_IS_SUCCESS to check.
2744 * @retval VINF_SUCCESS in all context - write completed.
2745 *
2746 * @retval VINF_EM_OFF in RC and R0 - write completed.
2747 * @retval VINF_EM_SUSPEND in RC and R0 - write completed.
2748 * @retval VINF_EM_RESET in RC and R0 - write completed.
2749 * @retval VINF_EM_HALT in RC and R0 - write completed.
2750 * @retval VINF_SELM_SYNC_GDT in RC only - write completed.
2751 *
2752 * @retval VINF_EM_DBG_STOP in RC and R0 - write completed.
2753 * @retval VINF_EM_DBG_BREAKPOINT in RC and R0 - write completed.
2754 * @retval VINF_EM_RAW_EMULATE_INSTR in RC and R0 only.
2755 *
2756 * @retval VINF_IOM_R3_MMIO_WRITE in RC and R0.
2757 * @retval VINF_IOM_R3_MMIO_READ_WRITE in RC and R0.
2758 * @retval VINF_IOM_R3_MMIO_COMMIT_WRITE in RC and R0.
2759 *
2760 * @retval VINF_EM_RAW_EMULATE_INSTR_GDT_FAULT in RC only - write completed.
2761 * @retval VINF_EM_RAW_EMULATE_INSTR_LDT_FAULT in RC only.
2762 * @retval VINF_EM_RAW_EMULATE_INSTR_TSS_FAULT in RC only.
2763 * @retval VINF_EM_RAW_EMULATE_INSTR_IDT_FAULT in RC only.
2764 * @retval VINF_CSAM_PENDING_ACTION in RC only.
2765 * @retval VINF_PATM_CHECK_PATCH_PAGE in RC only.
2766 *
2767 * @retval VERR_PGM_PHYS_WR_HIT_HANDLER in RC and R0 for access origins that
2768 * haven't been cleared for strict status codes yet.
2769 *
2770 *
2771 * @param pVM The cross context VM structure.
2772 * @param GCPhys Physical address to write to.
2773 * @param pvBuf What to write.
2774 * @param cbWrite How many bytes to write.
2775 * @param enmOrigin Who is calling.
2776 */
2777VMMDECL(VBOXSTRICTRC) PGMPhysWrite(PVMCC pVM, RTGCPHYS GCPhys, const void *pvBuf, size_t cbWrite, PGMACCESSORIGIN enmOrigin)
2778{
2779 AssertMsg(!pVM->pgm.s.fNoMorePhysWrites, ("Calling PGMPhysWrite after pgmR3Save()! enmOrigin=%d\n", enmOrigin));
2780 AssertMsgReturn(cbWrite > 0, ("don't even think about writing zero bytes!\n"), VINF_SUCCESS);
2781 LogFlow(("PGMPhysWrite: %RGp %d\n", GCPhys, cbWrite));
2782
2783 STAM_COUNTER_INC(&pVM->pgm.s.CTX_SUFF(pStats)->CTX_MID_Z(Stat,PhysWrite));
2784 STAM_COUNTER_ADD(&pVM->pgm.s.CTX_SUFF(pStats)->CTX_MID_Z(Stat,PhysWriteBytes), cbWrite);
2785
2786 PGM_LOCK_VOID(pVM);
2787
2788 /*
2789 * Copy loop on ram ranges.
2790 */
2791 VBOXSTRICTRC rcStrict = VINF_SUCCESS;
2792 PPGMRAMRANGE pRam = pgmPhysGetRangeAtOrAbove(pVM, GCPhys);
2793 for (;;)
2794 {
2795 /* Inside range or not? */
2796 if (pRam && GCPhys >= pRam->GCPhys)
2797 {
2798 /*
2799 * Must work our way thru this page by page.
2800 */
2801 RTGCPTR off = GCPhys - pRam->GCPhys;
2802 while (off < pRam->cb)
2803 {
2804 RTGCPTR iPage = off >> PAGE_SHIFT;
2805 PPGMPAGE pPage = &pRam->aPages[iPage];
2806 size_t cb = PAGE_SIZE - (off & PAGE_OFFSET_MASK);
2807 if (cb > cbWrite)
2808 cb = cbWrite;
2809
2810 /*
2811 * Normal page? Get the pointer to it.
2812 */
2813 if ( !PGM_PAGE_HAS_ACTIVE_HANDLERS(pPage)
2814 && !PGM_PAGE_IS_SPECIAL_ALIAS_MMIO(pPage))
2815 {
2816 PGMPAGEMAPLOCK PgMpLck;
2817 void *pvDst;
2818 int rc = pgmPhysGCPhys2CCPtrInternal(pVM, pPage, pRam->GCPhys + off, &pvDst, &PgMpLck);
2819 if (RT_SUCCESS(rc))
2820 {
2821 Assert(!PGM_PAGE_IS_BALLOONED(pPage));
2822 memcpy(pvDst, pvBuf, cb);
2823 pgmPhysReleaseInternalPageMappingLock(pVM, &PgMpLck);
2824 }
2825 /* Ignore writes to ballooned pages. */
2826 else if (!PGM_PAGE_IS_BALLOONED(pPage))
2827 AssertLogRelMsgFailed(("pgmPhysGCPhys2CCPtrInternal failed on %RGp / %R[pgmpage] -> %Rrc\n",
2828 pRam->GCPhys + off, pPage, rc));
2829 }
2830 /*
2831 * Active WRITE or ALL access handlers.
2832 */
2833 else
2834 {
2835 VBOXSTRICTRC rcStrict2 = pgmPhysWriteHandler(pVM, pPage, pRam->GCPhys + off, pvBuf, cb, enmOrigin);
2836 if (PGM_PHYS_RW_IS_SUCCESS(rcStrict2))
2837 PGM_PHYS_RW_DO_UPDATE_STRICT_RC(rcStrict, rcStrict2);
2838 else
2839 {
2840 PGM_UNLOCK(pVM);
2841 return rcStrict2;
2842 }
2843 }
2844
2845 /* next page */
2846 if (cb >= cbWrite)
2847 {
2848 PGM_UNLOCK(pVM);
2849 return rcStrict;
2850 }
2851
2852 cbWrite -= cb;
2853 off += cb;
2854 pvBuf = (const char *)pvBuf + cb;
2855 } /* walk pages in ram range */
2856
2857 GCPhys = pRam->GCPhysLast + 1;
2858 }
2859 else
2860 {
2861 /*
2862 * Unassigned address space, skip it.
2863 */
2864 if (!pRam)
2865 break;
2866 size_t cb = pRam->GCPhys - GCPhys;
2867 if (cb >= cbWrite)
2868 break;
2869 cbWrite -= cb;
2870 pvBuf = (const char *)pvBuf + cb;
2871 GCPhys += cb;
2872 }
2873
2874 /* Advance range if necessary. */
2875 while (pRam && GCPhys > pRam->GCPhysLast)
2876 pRam = pRam->CTX_SUFF(pNext);
2877 } /* Ram range walk */
2878
2879 PGM_UNLOCK(pVM);
2880 return rcStrict;
2881}
2882
2883
2884/**
2885 * Read from guest physical memory by GC physical address, bypassing
2886 * MMIO and access handlers.
2887 *
2888 * @returns VBox status code.
2889 * @param pVM The cross context VM structure.
2890 * @param pvDst The destination address.
2891 * @param GCPhysSrc The source address (GC physical address).
2892 * @param cb The number of bytes to read.
2893 */
2894VMMDECL(int) PGMPhysSimpleReadGCPhys(PVMCC pVM, void *pvDst, RTGCPHYS GCPhysSrc, size_t cb)
2895{
2896 /*
2897 * Treat the first page as a special case.
2898 */
2899 if (!cb)
2900 return VINF_SUCCESS;
2901
2902 /* map the 1st page */
2903 void const *pvSrc;
2904 PGMPAGEMAPLOCK Lock;
2905 int rc = PGMPhysGCPhys2CCPtrReadOnly(pVM, GCPhysSrc, &pvSrc, &Lock);
2906 if (RT_FAILURE(rc))
2907 return rc;
2908
2909 /* optimize for the case where access is completely within the first page. */
2910 size_t cbPage = PAGE_SIZE - (GCPhysSrc & PAGE_OFFSET_MASK);
2911 if (RT_LIKELY(cb <= cbPage))
2912 {
2913 memcpy(pvDst, pvSrc, cb);
2914 PGMPhysReleasePageMappingLock(pVM, &Lock);
2915 return VINF_SUCCESS;
2916 }
2917
2918 /* copy to the end of the page. */
2919 memcpy(pvDst, pvSrc, cbPage);
2920 PGMPhysReleasePageMappingLock(pVM, &Lock);
2921 GCPhysSrc += cbPage;
2922 pvDst = (uint8_t *)pvDst + cbPage;
2923 cb -= cbPage;
2924
2925 /*
2926 * Page by page.
2927 */
2928 for (;;)
2929 {
2930 /* map the page */
2931 rc = PGMPhysGCPhys2CCPtrReadOnly(pVM, GCPhysSrc, &pvSrc, &Lock);
2932 if (RT_FAILURE(rc))
2933 return rc;
2934
2935 /* last page? */
2936 if (cb <= PAGE_SIZE)
2937 {
2938 memcpy(pvDst, pvSrc, cb);
2939 PGMPhysReleasePageMappingLock(pVM, &Lock);
2940 return VINF_SUCCESS;
2941 }
2942
2943 /* copy the entire page and advance */
2944 memcpy(pvDst, pvSrc, PAGE_SIZE);
2945 PGMPhysReleasePageMappingLock(pVM, &Lock);
2946 GCPhysSrc += PAGE_SIZE;
2947 pvDst = (uint8_t *)pvDst + PAGE_SIZE;
2948 cb -= PAGE_SIZE;
2949 }
2950 /* won't ever get here. */
2951}
2952
2953
2954/**
2955 * Write to guest physical memory referenced by GC pointer.
2956 * Write memory to GC physical address in guest physical memory.
2957 *
2958 * This will bypass MMIO and access handlers.
2959 *
2960 * @returns VBox status code.
2961 * @param pVM The cross context VM structure.
2962 * @param GCPhysDst The GC physical address of the destination.
2963 * @param pvSrc The source buffer.
2964 * @param cb The number of bytes to write.
2965 */
2966VMMDECL(int) PGMPhysSimpleWriteGCPhys(PVMCC pVM, RTGCPHYS GCPhysDst, const void *pvSrc, size_t cb)
2967{
2968 LogFlow(("PGMPhysSimpleWriteGCPhys: %RGp %zu\n", GCPhysDst, cb));
2969
2970 /*
2971 * Treat the first page as a special case.
2972 */
2973 if (!cb)
2974 return VINF_SUCCESS;
2975
2976 /* map the 1st page */
2977 void *pvDst;
2978 PGMPAGEMAPLOCK Lock;
2979 int rc = PGMPhysGCPhys2CCPtr(pVM, GCPhysDst, &pvDst, &Lock);
2980 if (RT_FAILURE(rc))
2981 return rc;
2982
2983 /* optimize for the case where access is completely within the first page. */
2984 size_t cbPage = PAGE_SIZE - (GCPhysDst & PAGE_OFFSET_MASK);
2985 if (RT_LIKELY(cb <= cbPage))
2986 {
2987 memcpy(pvDst, pvSrc, cb);
2988 PGMPhysReleasePageMappingLock(pVM, &Lock);
2989 return VINF_SUCCESS;
2990 }
2991
2992 /* copy to the end of the page. */
2993 memcpy(pvDst, pvSrc, cbPage);
2994 PGMPhysReleasePageMappingLock(pVM, &Lock);
2995 GCPhysDst += cbPage;
2996 pvSrc = (const uint8_t *)pvSrc + cbPage;
2997 cb -= cbPage;
2998
2999 /*
3000 * Page by page.
3001 */
3002 for (;;)
3003 {
3004 /* map the page */
3005 rc = PGMPhysGCPhys2CCPtr(pVM, GCPhysDst, &pvDst, &Lock);
3006 if (RT_FAILURE(rc))
3007 return rc;
3008
3009 /* last page? */
3010 if (cb <= PAGE_SIZE)
3011 {
3012 memcpy(pvDst, pvSrc, cb);
3013 PGMPhysReleasePageMappingLock(pVM, &Lock);
3014 return VINF_SUCCESS;
3015 }
3016
3017 /* copy the entire page and advance */
3018 memcpy(pvDst, pvSrc, PAGE_SIZE);
3019 PGMPhysReleasePageMappingLock(pVM, &Lock);
3020 GCPhysDst += PAGE_SIZE;
3021 pvSrc = (const uint8_t *)pvSrc + PAGE_SIZE;
3022 cb -= PAGE_SIZE;
3023 }
3024 /* won't ever get here. */
3025}
3026
3027
3028/**
3029 * Read from guest physical memory referenced by GC pointer.
3030 *
3031 * This function uses the current CR3/CR0/CR4 of the guest and will
3032 * bypass access handlers and not set any accessed bits.
3033 *
3034 * @returns VBox status code.
3035 * @param pVCpu The cross context virtual CPU structure of the calling EMT.
3036 * @param pvDst The destination address.
3037 * @param GCPtrSrc The source address (GC pointer).
3038 * @param cb The number of bytes to read.
3039 */
3040VMMDECL(int) PGMPhysSimpleReadGCPtr(PVMCPUCC pVCpu, void *pvDst, RTGCPTR GCPtrSrc, size_t cb)
3041{
3042 PVMCC pVM = pVCpu->CTX_SUFF(pVM);
3043/** @todo fix the macro / state handling: VMCPU_ASSERT_EMT_OR_GURU(pVCpu); */
3044
3045 /*
3046 * Treat the first page as a special case.
3047 */
3048 if (!cb)
3049 return VINF_SUCCESS;
3050
3051 STAM_COUNTER_INC(&pVM->pgm.s.CTX_SUFF(pStats)->CTX_MID_Z(Stat,PhysSimpleRead));
3052 STAM_COUNTER_ADD(&pVM->pgm.s.CTX_SUFF(pStats)->CTX_MID_Z(Stat,PhysSimpleReadBytes), cb);
3053
3054 /* Take the PGM lock here, because many called functions take the lock for a very short period. That's counter-productive
3055 * when many VCPUs are fighting for the lock.
3056 */
3057 PGM_LOCK_VOID(pVM);
3058
3059 /* map the 1st page */
3060 void const *pvSrc;
3061 PGMPAGEMAPLOCK Lock;
3062 int rc = PGMPhysGCPtr2CCPtrReadOnly(pVCpu, GCPtrSrc, &pvSrc, &Lock);
3063 if (RT_FAILURE(rc))
3064 {
3065 PGM_UNLOCK(pVM);
3066 return rc;
3067 }
3068
3069 /* optimize for the case where access is completely within the first page. */
3070 size_t cbPage = PAGE_SIZE - ((RTGCUINTPTR)GCPtrSrc & PAGE_OFFSET_MASK);
3071 if (RT_LIKELY(cb <= cbPage))
3072 {
3073 memcpy(pvDst, pvSrc, cb);
3074 PGMPhysReleasePageMappingLock(pVM, &Lock);
3075 PGM_UNLOCK(pVM);
3076 return VINF_SUCCESS;
3077 }
3078
3079 /* copy to the end of the page. */
3080 memcpy(pvDst, pvSrc, cbPage);
3081 PGMPhysReleasePageMappingLock(pVM, &Lock);
3082 GCPtrSrc = (RTGCPTR)((RTGCUINTPTR)GCPtrSrc + cbPage);
3083 pvDst = (uint8_t *)pvDst + cbPage;
3084 cb -= cbPage;
3085
3086 /*
3087 * Page by page.
3088 */
3089 for (;;)
3090 {
3091 /* map the page */
3092 rc = PGMPhysGCPtr2CCPtrReadOnly(pVCpu, GCPtrSrc, &pvSrc, &Lock);
3093 if (RT_FAILURE(rc))
3094 {
3095 PGM_UNLOCK(pVM);
3096 return rc;
3097 }
3098
3099 /* last page? */
3100 if (cb <= PAGE_SIZE)
3101 {
3102 memcpy(pvDst, pvSrc, cb);
3103 PGMPhysReleasePageMappingLock(pVM, &Lock);
3104 PGM_UNLOCK(pVM);
3105 return VINF_SUCCESS;
3106 }
3107
3108 /* copy the entire page and advance */
3109 memcpy(pvDst, pvSrc, PAGE_SIZE);
3110 PGMPhysReleasePageMappingLock(pVM, &Lock);
3111 GCPtrSrc = (RTGCPTR)((RTGCUINTPTR)GCPtrSrc + PAGE_SIZE);
3112 pvDst = (uint8_t *)pvDst + PAGE_SIZE;
3113 cb -= PAGE_SIZE;
3114 }
3115 /* won't ever get here. */
3116}
3117
3118
3119/**
3120 * Write to guest physical memory referenced by GC pointer.
3121 *
3122 * This function uses the current CR3/CR0/CR4 of the guest and will
3123 * bypass access handlers and not set dirty or accessed bits.
3124 *
3125 * @returns VBox status code.
3126 * @param pVCpu The cross context virtual CPU structure of the calling EMT.
3127 * @param GCPtrDst The destination address (GC pointer).
3128 * @param pvSrc The source address.
3129 * @param cb The number of bytes to write.
3130 */
3131VMMDECL(int) PGMPhysSimpleWriteGCPtr(PVMCPUCC pVCpu, RTGCPTR GCPtrDst, const void *pvSrc, size_t cb)
3132{
3133 PVMCC pVM = pVCpu->CTX_SUFF(pVM);
3134 VMCPU_ASSERT_EMT(pVCpu);
3135
3136 /*
3137 * Treat the first page as a special case.
3138 */
3139 if (!cb)
3140 return VINF_SUCCESS;
3141
3142 STAM_COUNTER_INC(&pVM->pgm.s.CTX_SUFF(pStats)->CTX_MID_Z(Stat,PhysSimpleWrite));
3143 STAM_COUNTER_ADD(&pVM->pgm.s.CTX_SUFF(pStats)->CTX_MID_Z(Stat,PhysSimpleWriteBytes), cb);
3144
3145 /* map the 1st page */
3146 void *pvDst;
3147 PGMPAGEMAPLOCK Lock;
3148 int rc = PGMPhysGCPtr2CCPtr(pVCpu, GCPtrDst, &pvDst, &Lock);
3149 if (RT_FAILURE(rc))
3150 return rc;
3151
3152 /* optimize for the case where access is completely within the first page. */
3153 size_t cbPage = PAGE_SIZE - ((RTGCUINTPTR)GCPtrDst & PAGE_OFFSET_MASK);
3154 if (RT_LIKELY(cb <= cbPage))
3155 {
3156 memcpy(pvDst, pvSrc, cb);
3157 PGMPhysReleasePageMappingLock(pVM, &Lock);
3158 return VINF_SUCCESS;
3159 }
3160
3161 /* copy to the end of the page. */
3162 memcpy(pvDst, pvSrc, cbPage);
3163 PGMPhysReleasePageMappingLock(pVM, &Lock);
3164 GCPtrDst = (RTGCPTR)((RTGCUINTPTR)GCPtrDst + cbPage);
3165 pvSrc = (const uint8_t *)pvSrc + cbPage;
3166 cb -= cbPage;
3167
3168 /*
3169 * Page by page.
3170 */
3171 for (;;)
3172 {
3173 /* map the page */
3174 rc = PGMPhysGCPtr2CCPtr(pVCpu, GCPtrDst, &pvDst, &Lock);
3175 if (RT_FAILURE(rc))
3176 return rc;
3177
3178 /* last page? */
3179 if (cb <= PAGE_SIZE)
3180 {
3181 memcpy(pvDst, pvSrc, cb);
3182 PGMPhysReleasePageMappingLock(pVM, &Lock);
3183 return VINF_SUCCESS;
3184 }
3185
3186 /* copy the entire page and advance */
3187 memcpy(pvDst, pvSrc, PAGE_SIZE);
3188 PGMPhysReleasePageMappingLock(pVM, &Lock);
3189 GCPtrDst = (RTGCPTR)((RTGCUINTPTR)GCPtrDst + PAGE_SIZE);
3190 pvSrc = (const uint8_t *)pvSrc + PAGE_SIZE;
3191 cb -= PAGE_SIZE;
3192 }
3193 /* won't ever get here. */
3194}
3195
3196
3197/**
3198 * Write to guest physical memory referenced by GC pointer and update the PTE.
3199 *
3200 * This function uses the current CR3/CR0/CR4 of the guest and will
3201 * bypass access handlers but will set any dirty and accessed bits in the PTE.
3202 *
3203 * If you don't want to set the dirty bit, use PGMPhysSimpleWriteGCPtr().
3204 *
3205 * @returns VBox status code.
3206 * @param pVCpu The cross context virtual CPU structure of the calling EMT.
3207 * @param GCPtrDst The destination address (GC pointer).
3208 * @param pvSrc The source address.
3209 * @param cb The number of bytes to write.
3210 */
3211VMMDECL(int) PGMPhysSimpleDirtyWriteGCPtr(PVMCPUCC pVCpu, RTGCPTR GCPtrDst, const void *pvSrc, size_t cb)
3212{
3213 PVMCC pVM = pVCpu->CTX_SUFF(pVM);
3214 VMCPU_ASSERT_EMT(pVCpu);
3215
3216 /*
3217 * Treat the first page as a special case.
3218 * Btw. this is the same code as in PGMPhyssimpleWriteGCPtr excep for the PGMGstModifyPage.
3219 */
3220 if (!cb)
3221 return VINF_SUCCESS;
3222
3223 /* map the 1st page */
3224 void *pvDst;
3225 PGMPAGEMAPLOCK Lock;
3226 int rc = PGMPhysGCPtr2CCPtr(pVCpu, GCPtrDst, &pvDst, &Lock);
3227 if (RT_FAILURE(rc))
3228 return rc;
3229
3230 /* optimize for the case where access is completely within the first page. */
3231 size_t cbPage = PAGE_SIZE - ((RTGCUINTPTR)GCPtrDst & PAGE_OFFSET_MASK);
3232 if (RT_LIKELY(cb <= cbPage))
3233 {
3234 memcpy(pvDst, pvSrc, cb);
3235 PGMPhysReleasePageMappingLock(pVM, &Lock);
3236 rc = PGMGstModifyPage(pVCpu, GCPtrDst, 1, X86_PTE_A | X86_PTE_D, ~(uint64_t)(X86_PTE_A | X86_PTE_D)); AssertRC(rc);
3237 return VINF_SUCCESS;
3238 }
3239
3240 /* copy to the end of the page. */
3241 memcpy(pvDst, pvSrc, cbPage);
3242 PGMPhysReleasePageMappingLock(pVM, &Lock);
3243 rc = PGMGstModifyPage(pVCpu, GCPtrDst, 1, X86_PTE_A | X86_PTE_D, ~(uint64_t)(X86_PTE_A | X86_PTE_D)); AssertRC(rc);
3244 GCPtrDst = (RTGCPTR)((RTGCUINTPTR)GCPtrDst + cbPage);
3245 pvSrc = (const uint8_t *)pvSrc + cbPage;
3246 cb -= cbPage;
3247
3248 /*
3249 * Page by page.
3250 */
3251 for (;;)
3252 {
3253 /* map the page */
3254 rc = PGMPhysGCPtr2CCPtr(pVCpu, GCPtrDst, &pvDst, &Lock);
3255 if (RT_FAILURE(rc))
3256 return rc;
3257
3258 /* last page? */
3259 if (cb <= PAGE_SIZE)
3260 {
3261 memcpy(pvDst, pvSrc, cb);
3262 PGMPhysReleasePageMappingLock(pVM, &Lock);
3263 rc = PGMGstModifyPage(pVCpu, GCPtrDst, 1, X86_PTE_A | X86_PTE_D, ~(uint64_t)(X86_PTE_A | X86_PTE_D)); AssertRC(rc);
3264 return VINF_SUCCESS;
3265 }
3266
3267 /* copy the entire page and advance */
3268 memcpy(pvDst, pvSrc, PAGE_SIZE);
3269 PGMPhysReleasePageMappingLock(pVM, &Lock);
3270 rc = PGMGstModifyPage(pVCpu, GCPtrDst, 1, X86_PTE_A | X86_PTE_D, ~(uint64_t)(X86_PTE_A | X86_PTE_D)); AssertRC(rc);
3271 GCPtrDst = (RTGCPTR)((RTGCUINTPTR)GCPtrDst + PAGE_SIZE);
3272 pvSrc = (const uint8_t *)pvSrc + PAGE_SIZE;
3273 cb -= PAGE_SIZE;
3274 }
3275 /* won't ever get here. */
3276}
3277
3278
3279/**
3280 * Read from guest physical memory referenced by GC pointer.
3281 *
3282 * This function uses the current CR3/CR0/CR4 of the guest and will
3283 * respect access handlers and set accessed bits.
3284 *
3285 * @returns Strict VBox status, see PGMPhysRead for details.
3286 * @retval VERR_PAGE_TABLE_NOT_PRESENT if there is no page mapped at the
3287 * specified virtual address.
3288 *
3289 * @param pVCpu The cross context virtual CPU structure of the calling EMT.
3290 * @param pvDst The destination address.
3291 * @param GCPtrSrc The source address (GC pointer).
3292 * @param cb The number of bytes to read.
3293 * @param enmOrigin Who is calling.
3294 * @thread EMT(pVCpu)
3295 */
3296VMMDECL(VBOXSTRICTRC) PGMPhysReadGCPtr(PVMCPUCC pVCpu, void *pvDst, RTGCPTR GCPtrSrc, size_t cb, PGMACCESSORIGIN enmOrigin)
3297{
3298 RTGCPHYS GCPhys;
3299 uint64_t fFlags;
3300 int rc;
3301 PVMCC pVM = pVCpu->CTX_SUFF(pVM);
3302 VMCPU_ASSERT_EMT(pVCpu);
3303
3304 /*
3305 * Anything to do?
3306 */
3307 if (!cb)
3308 return VINF_SUCCESS;
3309
3310 LogFlow(("PGMPhysReadGCPtr: %RGv %zu\n", GCPtrSrc, cb));
3311
3312 /*
3313 * Optimize reads within a single page.
3314 */
3315 if (((RTGCUINTPTR)GCPtrSrc & PAGE_OFFSET_MASK) + cb <= PAGE_SIZE)
3316 {
3317 /* Convert virtual to physical address + flags */
3318 rc = PGMGstGetPage(pVCpu, (RTGCUINTPTR)GCPtrSrc, &fFlags, &GCPhys);
3319 AssertMsgRCReturn(rc, ("GetPage failed with %Rrc for %RGv\n", rc, GCPtrSrc), rc);
3320 GCPhys |= (RTGCUINTPTR)GCPtrSrc & PAGE_OFFSET_MASK;
3321
3322 /* mark the guest page as accessed. */
3323 if (!(fFlags & X86_PTE_A))
3324 {
3325 rc = PGMGstModifyPage(pVCpu, GCPtrSrc, 1, X86_PTE_A, ~(uint64_t)(X86_PTE_A));
3326 AssertRC(rc);
3327 }
3328
3329 return PGMPhysRead(pVM, GCPhys, pvDst, cb, enmOrigin);
3330 }
3331
3332 /*
3333 * Page by page.
3334 */
3335 for (;;)
3336 {
3337 /* Convert virtual to physical address + flags */
3338 rc = PGMGstGetPage(pVCpu, (RTGCUINTPTR)GCPtrSrc, &fFlags, &GCPhys);
3339 AssertMsgRCReturn(rc, ("GetPage failed with %Rrc for %RGv\n", rc, GCPtrSrc), rc);
3340 GCPhys |= (RTGCUINTPTR)GCPtrSrc & PAGE_OFFSET_MASK;
3341
3342 /* mark the guest page as accessed. */
3343 if (!(fFlags & X86_PTE_A))
3344 {
3345 rc = PGMGstModifyPage(pVCpu, GCPtrSrc, 1, X86_PTE_A, ~(uint64_t)(X86_PTE_A));
3346 AssertRC(rc);
3347 }
3348
3349 /* copy */
3350 size_t cbRead = PAGE_SIZE - ((RTGCUINTPTR)GCPtrSrc & PAGE_OFFSET_MASK);
3351 if (cbRead < cb)
3352 {
3353 VBOXSTRICTRC rcStrict = PGMPhysRead(pVM, GCPhys, pvDst, cbRead, enmOrigin);
3354 if (RT_LIKELY(rcStrict == VINF_SUCCESS))
3355 { /* likely */ }
3356 else
3357 return rcStrict;
3358 }
3359 else /* Last page (cbRead is PAGE_SIZE, we only need cb!) */
3360 return PGMPhysRead(pVM, GCPhys, pvDst, cb, enmOrigin);
3361
3362 /* next */
3363 Assert(cb > cbRead);
3364 cb -= cbRead;
3365 pvDst = (uint8_t *)pvDst + cbRead;
3366 GCPtrSrc += cbRead;
3367 }
3368}
3369
3370
3371/**
3372 * Write to guest physical memory referenced by GC pointer.
3373 *
3374 * This function uses the current CR3/CR0/CR4 of the guest and will
3375 * respect access handlers and set dirty and accessed bits.
3376 *
3377 * @returns Strict VBox status, see PGMPhysWrite for details.
3378 * @retval VERR_PAGE_TABLE_NOT_PRESENT if there is no page mapped at the
3379 * specified virtual address.
3380 *
3381 * @param pVCpu The cross context virtual CPU structure of the calling EMT.
3382 * @param GCPtrDst The destination address (GC pointer).
3383 * @param pvSrc The source address.
3384 * @param cb The number of bytes to write.
3385 * @param enmOrigin Who is calling.
3386 */
3387VMMDECL(VBOXSTRICTRC) PGMPhysWriteGCPtr(PVMCPUCC pVCpu, RTGCPTR GCPtrDst, const void *pvSrc, size_t cb, PGMACCESSORIGIN enmOrigin)
3388{
3389 RTGCPHYS GCPhys;
3390 uint64_t fFlags;
3391 int rc;
3392 PVMCC pVM = pVCpu->CTX_SUFF(pVM);
3393 VMCPU_ASSERT_EMT(pVCpu);
3394
3395 /*
3396 * Anything to do?
3397 */
3398 if (!cb)
3399 return VINF_SUCCESS;
3400
3401 LogFlow(("PGMPhysWriteGCPtr: %RGv %zu\n", GCPtrDst, cb));
3402
3403 /*
3404 * Optimize writes within a single page.
3405 */
3406 if (((RTGCUINTPTR)GCPtrDst & PAGE_OFFSET_MASK) + cb <= PAGE_SIZE)
3407 {
3408 /* Convert virtual to physical address + flags */
3409 rc = PGMGstGetPage(pVCpu, (RTGCUINTPTR)GCPtrDst, &fFlags, &GCPhys);
3410 AssertMsgRCReturn(rc, ("GetPage failed with %Rrc for %RGv\n", rc, GCPtrDst), rc);
3411 GCPhys |= (RTGCUINTPTR)GCPtrDst & PAGE_OFFSET_MASK;
3412
3413 /* Mention when we ignore X86_PTE_RW... */
3414 if (!(fFlags & X86_PTE_RW))
3415 Log(("PGMPhysWriteGCPtr: Writing to RO page %RGv %#x\n", GCPtrDst, cb));
3416
3417 /* Mark the guest page as accessed and dirty if necessary. */
3418 if ((fFlags & (X86_PTE_A | X86_PTE_D)) != (X86_PTE_A | X86_PTE_D))
3419 {
3420 rc = PGMGstModifyPage(pVCpu, GCPtrDst, 1, X86_PTE_A | X86_PTE_D, ~(uint64_t)(X86_PTE_A | X86_PTE_D));
3421 AssertRC(rc);
3422 }
3423
3424 return PGMPhysWrite(pVM, GCPhys, pvSrc, cb, enmOrigin);
3425 }
3426
3427 /*
3428 * Page by page.
3429 */
3430 for (;;)
3431 {
3432 /* Convert virtual to physical address + flags */
3433 rc = PGMGstGetPage(pVCpu, (RTGCUINTPTR)GCPtrDst, &fFlags, &GCPhys);
3434 AssertMsgRCReturn(rc, ("GetPage failed with %Rrc for %RGv\n", rc, GCPtrDst), rc);
3435 GCPhys |= (RTGCUINTPTR)GCPtrDst & PAGE_OFFSET_MASK;
3436
3437 /* Mention when we ignore X86_PTE_RW... */
3438 if (!(fFlags & X86_PTE_RW))
3439 Log(("PGMPhysWriteGCPtr: Writing to RO page %RGv %#x\n", GCPtrDst, cb));
3440
3441 /* Mark the guest page as accessed and dirty if necessary. */
3442 if ((fFlags & (X86_PTE_A | X86_PTE_D)) != (X86_PTE_A | X86_PTE_D))
3443 {
3444 rc = PGMGstModifyPage(pVCpu, GCPtrDst, 1, X86_PTE_A | X86_PTE_D, ~(uint64_t)(X86_PTE_A | X86_PTE_D));
3445 AssertRC(rc);
3446 }
3447
3448 /* copy */
3449 size_t cbWrite = PAGE_SIZE - ((RTGCUINTPTR)GCPtrDst & PAGE_OFFSET_MASK);
3450 if (cbWrite < cb)
3451 {
3452 VBOXSTRICTRC rcStrict = PGMPhysWrite(pVM, GCPhys, pvSrc, cbWrite, enmOrigin);
3453 if (RT_LIKELY(rcStrict == VINF_SUCCESS))
3454 { /* likely */ }
3455 else
3456 return rcStrict;
3457 }
3458 else /* Last page (cbWrite is PAGE_SIZE, we only need cb!) */
3459 return PGMPhysWrite(pVM, GCPhys, pvSrc, cb, enmOrigin);
3460
3461 /* next */
3462 Assert(cb > cbWrite);
3463 cb -= cbWrite;
3464 pvSrc = (uint8_t *)pvSrc + cbWrite;
3465 GCPtrDst += cbWrite;
3466 }
3467}
3468
3469
3470/**
3471 * Performs a read of guest virtual memory for instruction emulation.
3472 *
3473 * This will check permissions, raise exceptions and update the access bits.
3474 *
3475 * The current implementation will bypass all access handlers. It may later be
3476 * changed to at least respect MMIO.
3477 *
3478 *
3479 * @returns VBox status code suitable to scheduling.
3480 * @retval VINF_SUCCESS if the read was performed successfully.
3481 * @retval VINF_EM_RAW_GUEST_TRAP if an exception was raised but not dispatched yet.
3482 * @retval VINF_TRPM_XCPT_DISPATCHED if an exception was raised and dispatched.
3483 *
3484 * @param pVCpu The cross context virtual CPU structure of the calling EMT.
3485 * @param pCtxCore The context core.
3486 * @param pvDst Where to put the bytes we've read.
3487 * @param GCPtrSrc The source address.
3488 * @param cb The number of bytes to read. Not more than a page.
3489 *
3490 * @remark This function will dynamically map physical pages in GC. This may unmap
3491 * mappings done by the caller. Be careful!
3492 */
3493VMMDECL(int) PGMPhysInterpretedRead(PVMCPUCC pVCpu, PCPUMCTXCORE pCtxCore, void *pvDst, RTGCUINTPTR GCPtrSrc, size_t cb)
3494{
3495 NOREF(pCtxCore);
3496 PVMCC pVM = pVCpu->CTX_SUFF(pVM);
3497 Assert(cb <= PAGE_SIZE);
3498 VMCPU_ASSERT_EMT(pVCpu);
3499
3500/** @todo r=bird: This isn't perfect!
3501 * -# It's not checking for reserved bits being 1.
3502 * -# It's not correctly dealing with the access bit.
3503 * -# It's not respecting MMIO memory or any other access handlers.
3504 */
3505 /*
3506 * 1. Translate virtual to physical. This may fault.
3507 * 2. Map the physical address.
3508 * 3. Do the read operation.
3509 * 4. Set access bits if required.
3510 */
3511 int rc;
3512 unsigned cb1 = PAGE_SIZE - (GCPtrSrc & PAGE_OFFSET_MASK);
3513 if (cb <= cb1)
3514 {
3515 /*
3516 * Not crossing pages.
3517 */
3518 RTGCPHYS GCPhys;
3519 uint64_t fFlags;
3520 rc = PGMGstGetPage(pVCpu, GCPtrSrc, &fFlags, &GCPhys);
3521 if (RT_SUCCESS(rc))
3522 {
3523 /** @todo we should check reserved bits ... */
3524 PGMPAGEMAPLOCK PgMpLck;
3525 void const *pvSrc;
3526 rc = PGMPhysGCPhys2CCPtrReadOnly(pVM, GCPhys, &pvSrc, &PgMpLck);
3527 switch (rc)
3528 {
3529 case VINF_SUCCESS:
3530 Log(("PGMPhysInterpretedRead: pvDst=%p pvSrc=%p cb=%d\n", pvDst, (uint8_t *)pvSrc + (GCPtrSrc & PAGE_OFFSET_MASK), cb));
3531 memcpy(pvDst, (uint8_t *)pvSrc + (GCPtrSrc & PAGE_OFFSET_MASK), cb);
3532 PGMPhysReleasePageMappingLock(pVM, &PgMpLck);
3533 break;
3534 case VERR_PGM_PHYS_PAGE_RESERVED:
3535 case VERR_PGM_INVALID_GC_PHYSICAL_ADDRESS:
3536 memset(pvDst, 0xff, cb);
3537 break;
3538 default:
3539 Assert(RT_FAILURE_NP(rc));
3540 return rc;
3541 }
3542
3543 /** @todo access bit emulation isn't 100% correct. */
3544 if (!(fFlags & X86_PTE_A))
3545 {
3546 rc = PGMGstModifyPage(pVCpu, GCPtrSrc, 1, X86_PTE_A, ~(uint64_t)X86_PTE_A);
3547 AssertRC(rc);
3548 }
3549 return VINF_SUCCESS;
3550 }
3551 }
3552 else
3553 {
3554 /*
3555 * Crosses pages.
3556 */
3557 size_t cb2 = cb - cb1;
3558 uint64_t fFlags1;
3559 RTGCPHYS GCPhys1;
3560 uint64_t fFlags2;
3561 RTGCPHYS GCPhys2;
3562 rc = PGMGstGetPage(pVCpu, GCPtrSrc, &fFlags1, &GCPhys1);
3563 if (RT_SUCCESS(rc))
3564 {
3565 rc = PGMGstGetPage(pVCpu, GCPtrSrc + cb1, &fFlags2, &GCPhys2);
3566 if (RT_SUCCESS(rc))
3567 {
3568 /** @todo we should check reserved bits ... */
3569 AssertMsgFailed(("cb=%d cb1=%d cb2=%d GCPtrSrc=%RGv\n", cb, cb1, cb2, GCPtrSrc));
3570 PGMPAGEMAPLOCK PgMpLck;
3571 void const *pvSrc1;
3572 rc = PGMPhysGCPhys2CCPtrReadOnly(pVM, GCPhys1, &pvSrc1, &PgMpLck);
3573 switch (rc)
3574 {
3575 case VINF_SUCCESS:
3576 memcpy(pvDst, (uint8_t *)pvSrc1 + (GCPtrSrc & PAGE_OFFSET_MASK), cb1);
3577 PGMPhysReleasePageMappingLock(pVM, &PgMpLck);
3578 break;
3579 case VERR_PGM_INVALID_GC_PHYSICAL_ADDRESS:
3580 memset(pvDst, 0xff, cb1);
3581 break;
3582 default:
3583 Assert(RT_FAILURE_NP(rc));
3584 return rc;
3585 }
3586
3587 void const *pvSrc2;
3588 rc = PGMPhysGCPhys2CCPtrReadOnly(pVM, GCPhys2, &pvSrc2, &PgMpLck);
3589 switch (rc)
3590 {
3591 case VINF_SUCCESS:
3592 memcpy((uint8_t *)pvDst + cb1, pvSrc2, cb2);
3593 PGMPhysReleasePageMappingLock(pVM, &PgMpLck);
3594 break;
3595 case VERR_PGM_INVALID_GC_PHYSICAL_ADDRESS:
3596 memset((uint8_t *)pvDst + cb1, 0xff, cb2);
3597 break;
3598 default:
3599 Assert(RT_FAILURE_NP(rc));
3600 return rc;
3601 }
3602
3603 if (!(fFlags1 & X86_PTE_A))
3604 {
3605 rc = PGMGstModifyPage(pVCpu, GCPtrSrc, 1, X86_PTE_A, ~(uint64_t)X86_PTE_A);
3606 AssertRC(rc);
3607 }
3608 if (!(fFlags2 & X86_PTE_A))
3609 {
3610 rc = PGMGstModifyPage(pVCpu, GCPtrSrc + cb1, 1, X86_PTE_A, ~(uint64_t)X86_PTE_A);
3611 AssertRC(rc);
3612 }
3613 return VINF_SUCCESS;
3614 }
3615 }
3616 }
3617
3618 /*
3619 * Raise a #PF.
3620 */
3621 uint32_t uErr;
3622
3623 /* Get the current privilege level. */
3624 uint32_t cpl = CPUMGetGuestCPL(pVCpu);
3625 switch (rc)
3626 {
3627 case VINF_SUCCESS:
3628 uErr = (cpl >= 2) ? X86_TRAP_PF_RSVD | X86_TRAP_PF_US : X86_TRAP_PF_RSVD;
3629 break;
3630
3631 case VERR_PAGE_NOT_PRESENT:
3632 case VERR_PAGE_TABLE_NOT_PRESENT:
3633 uErr = (cpl >= 2) ? X86_TRAP_PF_US : 0;
3634 break;
3635
3636 default:
3637 AssertMsgFailed(("rc=%Rrc GCPtrSrc=%RGv cb=%#x\n", rc, GCPtrSrc, cb));
3638 return rc;
3639 }
3640 Log(("PGMPhysInterpretedRead: GCPtrSrc=%RGv cb=%#x -> #PF(%#x)\n", GCPtrSrc, cb, uErr));
3641 rc = TRPMAssertXcptPF(pVCpu, GCPtrSrc, uErr);
3642 if (RT_SUCCESS(rc))
3643 return VINF_EM_RAW_GUEST_TRAP;
3644 return rc;
3645}
3646
3647
3648/**
3649 * Performs a read of guest virtual memory for instruction emulation.
3650 *
3651 * This will check permissions, raise exceptions and update the access bits.
3652 *
3653 * The current implementation will bypass all access handlers. It may later be
3654 * changed to at least respect MMIO.
3655 *
3656 *
3657 * @returns VBox status code suitable to scheduling.
3658 * @retval VINF_SUCCESS if the read was performed successfully.
3659 * @retval VINF_EM_RAW_GUEST_TRAP if an exception was raised but not dispatched yet.
3660 * @retval VINF_TRPM_XCPT_DISPATCHED if an exception was raised and dispatched.
3661 *
3662 * @param pVCpu The cross context virtual CPU structure of the calling EMT.
3663 * @param pCtxCore The context core.
3664 * @param pvDst Where to put the bytes we've read.
3665 * @param GCPtrSrc The source address.
3666 * @param cb The number of bytes to read. Not more than a page.
3667 * @param fRaiseTrap If set the trap will be raised on as per spec, if clear
3668 * an appropriate error status will be returned (no
3669 * informational at all).
3670 *
3671 *
3672 * @remarks Takes the PGM lock.
3673 * @remarks A page fault on the 2nd page of the access will be raised without
3674 * writing the bits on the first page since we're ASSUMING that the
3675 * caller is emulating an instruction access.
3676 * @remarks This function will dynamically map physical pages in GC. This may
3677 * unmap mappings done by the caller. Be careful!
3678 */
3679VMMDECL(int) PGMPhysInterpretedReadNoHandlers(PVMCPUCC pVCpu, PCPUMCTXCORE pCtxCore, void *pvDst, RTGCUINTPTR GCPtrSrc, size_t cb,
3680 bool fRaiseTrap)
3681{
3682 NOREF(pCtxCore);
3683 PVMCC pVM = pVCpu->CTX_SUFF(pVM);
3684 Assert(cb <= PAGE_SIZE);
3685 VMCPU_ASSERT_EMT(pVCpu);
3686
3687 /*
3688 * 1. Translate virtual to physical. This may fault.
3689 * 2. Map the physical address.
3690 * 3. Do the read operation.
3691 * 4. Set access bits if required.
3692 */
3693 int rc;
3694 unsigned cb1 = PAGE_SIZE - (GCPtrSrc & PAGE_OFFSET_MASK);
3695 if (cb <= cb1)
3696 {
3697 /*
3698 * Not crossing pages.
3699 */
3700 RTGCPHYS GCPhys;
3701 uint64_t fFlags;
3702 rc = PGMGstGetPage(pVCpu, GCPtrSrc, &fFlags, &GCPhys);
3703 if (RT_SUCCESS(rc))
3704 {
3705 if (1) /** @todo we should check reserved bits ... */
3706 {
3707 const void *pvSrc;
3708 PGMPAGEMAPLOCK Lock;
3709 rc = PGMPhysGCPhys2CCPtrReadOnly(pVM, GCPhys, &pvSrc, &Lock);
3710 switch (rc)
3711 {
3712 case VINF_SUCCESS:
3713 Log(("PGMPhysInterpretedReadNoHandlers: pvDst=%p pvSrc=%p (%RGv) cb=%d\n",
3714 pvDst, (const uint8_t *)pvSrc + (GCPtrSrc & PAGE_OFFSET_MASK), GCPtrSrc, cb));
3715 memcpy(pvDst, (const uint8_t *)pvSrc + (GCPtrSrc & PAGE_OFFSET_MASK), cb);
3716 PGMPhysReleasePageMappingLock(pVM, &Lock);
3717 break;
3718 case VERR_PGM_PHYS_PAGE_RESERVED:
3719 case VERR_PGM_INVALID_GC_PHYSICAL_ADDRESS:
3720 memset(pvDst, 0xff, cb);
3721 break;
3722 default:
3723 AssertMsgFailed(("%Rrc\n", rc));
3724 AssertReturn(RT_FAILURE(rc), VERR_IPE_UNEXPECTED_INFO_STATUS);
3725 return rc;
3726 }
3727
3728 if (!(fFlags & X86_PTE_A))
3729 {
3730 /** @todo access bit emulation isn't 100% correct. */
3731 rc = PGMGstModifyPage(pVCpu, GCPtrSrc, 1, X86_PTE_A, ~(uint64_t)X86_PTE_A);
3732 AssertRC(rc);
3733 }
3734 return VINF_SUCCESS;
3735 }
3736 }
3737 }
3738 else
3739 {
3740 /*
3741 * Crosses pages.
3742 */
3743 size_t cb2 = cb - cb1;
3744 uint64_t fFlags1;
3745 RTGCPHYS GCPhys1;
3746 uint64_t fFlags2;
3747 RTGCPHYS GCPhys2;
3748 rc = PGMGstGetPage(pVCpu, GCPtrSrc, &fFlags1, &GCPhys1);
3749 if (RT_SUCCESS(rc))
3750 {
3751 rc = PGMGstGetPage(pVCpu, GCPtrSrc + cb1, &fFlags2, &GCPhys2);
3752 if (RT_SUCCESS(rc))
3753 {
3754 if (1) /** @todo we should check reserved bits ... */
3755 {
3756 const void *pvSrc;
3757 PGMPAGEMAPLOCK Lock;
3758 rc = PGMPhysGCPhys2CCPtrReadOnly(pVM, GCPhys1, &pvSrc, &Lock);
3759 switch (rc)
3760 {
3761 case VINF_SUCCESS:
3762 Log(("PGMPhysInterpretedReadNoHandlers: pvDst=%p pvSrc=%p (%RGv) cb=%d [2]\n",
3763 pvDst, (const uint8_t *)pvSrc + (GCPtrSrc & PAGE_OFFSET_MASK), GCPtrSrc, cb1));
3764 memcpy(pvDst, (const uint8_t *)pvSrc + (GCPtrSrc & PAGE_OFFSET_MASK), cb1);
3765 PGMPhysReleasePageMappingLock(pVM, &Lock);
3766 break;
3767 case VERR_PGM_PHYS_PAGE_RESERVED:
3768 case VERR_PGM_INVALID_GC_PHYSICAL_ADDRESS:
3769 memset(pvDst, 0xff, cb1);
3770 break;
3771 default:
3772 AssertMsgFailed(("%Rrc\n", rc));
3773 AssertReturn(RT_FAILURE(rc), VERR_IPE_UNEXPECTED_INFO_STATUS);
3774 return rc;
3775 }
3776
3777 rc = PGMPhysGCPhys2CCPtrReadOnly(pVM, GCPhys2, &pvSrc, &Lock);
3778 switch (rc)
3779 {
3780 case VINF_SUCCESS:
3781 memcpy((uint8_t *)pvDst + cb1, pvSrc, cb2);
3782 PGMPhysReleasePageMappingLock(pVM, &Lock);
3783 break;
3784 case VERR_PGM_PHYS_PAGE_RESERVED:
3785 case VERR_PGM_INVALID_GC_PHYSICAL_ADDRESS:
3786 memset((uint8_t *)pvDst + cb1, 0xff, cb2);
3787 break;
3788 default:
3789 AssertMsgFailed(("%Rrc\n", rc));
3790 AssertReturn(RT_FAILURE(rc), VERR_IPE_UNEXPECTED_INFO_STATUS);
3791 return rc;
3792 }
3793
3794 if (!(fFlags1 & X86_PTE_A))
3795 {
3796 rc = PGMGstModifyPage(pVCpu, GCPtrSrc, 1, X86_PTE_A, ~(uint64_t)X86_PTE_A);
3797 AssertRC(rc);
3798 }
3799 if (!(fFlags2 & X86_PTE_A))
3800 {
3801 rc = PGMGstModifyPage(pVCpu, GCPtrSrc + cb1, 1, X86_PTE_A, ~(uint64_t)X86_PTE_A);
3802 AssertRC(rc);
3803 }
3804 return VINF_SUCCESS;
3805 }
3806 /* sort out which page */
3807 }
3808 else
3809 GCPtrSrc += cb1; /* fault on 2nd page */
3810 }
3811 }
3812
3813 /*
3814 * Raise a #PF if we're allowed to do that.
3815 */
3816 /* Calc the error bits. */
3817 uint32_t cpl = CPUMGetGuestCPL(pVCpu);
3818 uint32_t uErr;
3819 switch (rc)
3820 {
3821 case VINF_SUCCESS:
3822 uErr = (cpl >= 2) ? X86_TRAP_PF_RSVD | X86_TRAP_PF_US : X86_TRAP_PF_RSVD;
3823 rc = VERR_ACCESS_DENIED;
3824 break;
3825
3826 case VERR_PAGE_NOT_PRESENT:
3827 case VERR_PAGE_TABLE_NOT_PRESENT:
3828 uErr = (cpl >= 2) ? X86_TRAP_PF_US : 0;
3829 break;
3830
3831 default:
3832 AssertMsgFailed(("rc=%Rrc GCPtrSrc=%RGv cb=%#x\n", rc, GCPtrSrc, cb));
3833 AssertReturn(RT_FAILURE(rc), VERR_IPE_UNEXPECTED_INFO_STATUS);
3834 return rc;
3835 }
3836 if (fRaiseTrap)
3837 {
3838 Log(("PGMPhysInterpretedReadNoHandlers: GCPtrSrc=%RGv cb=%#x -> Raised #PF(%#x)\n", GCPtrSrc, cb, uErr));
3839 rc = TRPMAssertXcptPF(pVCpu, GCPtrSrc, uErr);
3840 if (RT_SUCCESS(rc))
3841 return VINF_EM_RAW_GUEST_TRAP;
3842 return rc;
3843 }
3844 Log(("PGMPhysInterpretedReadNoHandlers: GCPtrSrc=%RGv cb=%#x -> #PF(%#x) [!raised]\n", GCPtrSrc, cb, uErr));
3845 return rc;
3846}
3847
3848
3849/**
3850 * Performs a write to guest virtual memory for instruction emulation.
3851 *
3852 * This will check permissions, raise exceptions and update the dirty and access
3853 * bits.
3854 *
3855 * @returns VBox status code suitable to scheduling.
3856 * @retval VINF_SUCCESS if the read was performed successfully.
3857 * @retval VINF_EM_RAW_GUEST_TRAP if an exception was raised but not dispatched yet.
3858 * @retval VINF_TRPM_XCPT_DISPATCHED if an exception was raised and dispatched.
3859 *
3860 * @param pVCpu The cross context virtual CPU structure of the calling EMT.
3861 * @param pCtxCore The context core.
3862 * @param GCPtrDst The destination address.
3863 * @param pvSrc What to write.
3864 * @param cb The number of bytes to write. Not more than a page.
3865 * @param fRaiseTrap If set the trap will be raised on as per spec, if clear
3866 * an appropriate error status will be returned (no
3867 * informational at all).
3868 *
3869 * @remarks Takes the PGM lock.
3870 * @remarks A page fault on the 2nd page of the access will be raised without
3871 * writing the bits on the first page since we're ASSUMING that the
3872 * caller is emulating an instruction access.
3873 * @remarks This function will dynamically map physical pages in GC. This may
3874 * unmap mappings done by the caller. Be careful!
3875 */
3876VMMDECL(int) PGMPhysInterpretedWriteNoHandlers(PVMCPUCC pVCpu, PCPUMCTXCORE pCtxCore, RTGCPTR GCPtrDst, const void *pvSrc,
3877 size_t cb, bool fRaiseTrap)
3878{
3879 NOREF(pCtxCore);
3880 Assert(cb <= PAGE_SIZE);
3881 PVMCC pVM = pVCpu->CTX_SUFF(pVM);
3882 VMCPU_ASSERT_EMT(pVCpu);
3883
3884 /*
3885 * 1. Translate virtual to physical. This may fault.
3886 * 2. Map the physical address.
3887 * 3. Do the write operation.
3888 * 4. Set access bits if required.
3889 */
3890 /** @todo Since this method is frequently used by EMInterpret or IOM
3891 * upon a write fault to an write access monitored page, we can
3892 * reuse the guest page table walking from the \#PF code. */
3893 int rc;
3894 unsigned cb1 = PAGE_SIZE - (GCPtrDst & PAGE_OFFSET_MASK);
3895 if (cb <= cb1)
3896 {
3897 /*
3898 * Not crossing pages.
3899 */
3900 RTGCPHYS GCPhys;
3901 uint64_t fFlags;
3902 rc = PGMGstGetPage(pVCpu, GCPtrDst, &fFlags, &GCPhys);
3903 if (RT_SUCCESS(rc))
3904 {
3905 if ( (fFlags & X86_PTE_RW) /** @todo Also check reserved bits. */
3906 || ( !(CPUMGetGuestCR0(pVCpu) & X86_CR0_WP)
3907 && CPUMGetGuestCPL(pVCpu) <= 2) ) /** @todo it's 2, right? Check cpl check below as well. */
3908 {
3909 void *pvDst;
3910 PGMPAGEMAPLOCK Lock;
3911 rc = PGMPhysGCPhys2CCPtr(pVM, GCPhys, &pvDst, &Lock);
3912 switch (rc)
3913 {
3914 case VINF_SUCCESS:
3915 Log(("PGMPhysInterpretedWriteNoHandlers: pvDst=%p (%RGv) pvSrc=%p cb=%d\n",
3916 (uint8_t *)pvDst + (GCPtrDst & PAGE_OFFSET_MASK), GCPtrDst, pvSrc, cb));
3917 memcpy((uint8_t *)pvDst + (GCPtrDst & PAGE_OFFSET_MASK), pvSrc, cb);
3918 PGMPhysReleasePageMappingLock(pVM, &Lock);
3919 break;
3920 case VERR_PGM_PHYS_PAGE_RESERVED:
3921 case VERR_PGM_INVALID_GC_PHYSICAL_ADDRESS:
3922 /* bit bucket */
3923 break;
3924 default:
3925 AssertMsgFailed(("%Rrc\n", rc));
3926 AssertReturn(RT_FAILURE(rc), VERR_IPE_UNEXPECTED_INFO_STATUS);
3927 return rc;
3928 }
3929
3930 if (!(fFlags & (X86_PTE_A | X86_PTE_D)))
3931 {
3932 /** @todo dirty & access bit emulation isn't 100% correct. */
3933 rc = PGMGstModifyPage(pVCpu, GCPtrDst, 1, X86_PTE_A | X86_PTE_D, ~(uint64_t)(X86_PTE_A | X86_PTE_D));
3934 AssertRC(rc);
3935 }
3936 return VINF_SUCCESS;
3937 }
3938 rc = VERR_ACCESS_DENIED;
3939 }
3940 }
3941 else
3942 {
3943 /*
3944 * Crosses pages.
3945 */
3946 size_t cb2 = cb - cb1;
3947 uint64_t fFlags1;
3948 RTGCPHYS GCPhys1;
3949 uint64_t fFlags2;
3950 RTGCPHYS GCPhys2;
3951 rc = PGMGstGetPage(pVCpu, GCPtrDst, &fFlags1, &GCPhys1);
3952 if (RT_SUCCESS(rc))
3953 {
3954 rc = PGMGstGetPage(pVCpu, GCPtrDst + cb1, &fFlags2, &GCPhys2);
3955 if (RT_SUCCESS(rc))
3956 {
3957 if ( ( (fFlags1 & X86_PTE_RW) /** @todo Also check reserved bits. */
3958 && (fFlags2 & X86_PTE_RW))
3959 || ( !(CPUMGetGuestCR0(pVCpu) & X86_CR0_WP)
3960 && CPUMGetGuestCPL(pVCpu) <= 2) )
3961 {
3962 void *pvDst;
3963 PGMPAGEMAPLOCK Lock;
3964 rc = PGMPhysGCPhys2CCPtr(pVM, GCPhys1, &pvDst, &Lock);
3965 switch (rc)
3966 {
3967 case VINF_SUCCESS:
3968 Log(("PGMPhysInterpretedWriteNoHandlers: pvDst=%p (%RGv) pvSrc=%p cb=%d\n",
3969 (uint8_t *)pvDst + (GCPtrDst & PAGE_OFFSET_MASK), GCPtrDst, pvSrc, cb1));
3970 memcpy((uint8_t *)pvDst + (GCPtrDst & PAGE_OFFSET_MASK), pvSrc, cb1);
3971 PGMPhysReleasePageMappingLock(pVM, &Lock);
3972 break;
3973 case VERR_PGM_PHYS_PAGE_RESERVED:
3974 case VERR_PGM_INVALID_GC_PHYSICAL_ADDRESS:
3975 /* bit bucket */
3976 break;
3977 default:
3978 AssertMsgFailed(("%Rrc\n", rc));
3979 AssertReturn(RT_FAILURE(rc), VERR_IPE_UNEXPECTED_INFO_STATUS);
3980 return rc;
3981 }
3982
3983 rc = PGMPhysGCPhys2CCPtr(pVM, GCPhys2, &pvDst, &Lock);
3984 switch (rc)
3985 {
3986 case VINF_SUCCESS:
3987 memcpy(pvDst, (const uint8_t *)pvSrc + cb1, cb2);
3988 PGMPhysReleasePageMappingLock(pVM, &Lock);
3989 break;
3990 case VERR_PGM_PHYS_PAGE_RESERVED:
3991 case VERR_PGM_INVALID_GC_PHYSICAL_ADDRESS:
3992 /* bit bucket */
3993 break;
3994 default:
3995 AssertMsgFailed(("%Rrc\n", rc));
3996 AssertReturn(RT_FAILURE(rc), VERR_IPE_UNEXPECTED_INFO_STATUS);
3997 return rc;
3998 }
3999
4000 if (!(fFlags1 & (X86_PTE_A | X86_PTE_RW)))
4001 {
4002 rc = PGMGstModifyPage(pVCpu, GCPtrDst, 1, (X86_PTE_A | X86_PTE_RW), ~(uint64_t)(X86_PTE_A | X86_PTE_RW));
4003 AssertRC(rc);
4004 }
4005 if (!(fFlags2 & (X86_PTE_A | X86_PTE_RW)))
4006 {
4007 rc = PGMGstModifyPage(pVCpu, GCPtrDst + cb1, 1, (X86_PTE_A | X86_PTE_RW), ~(uint64_t)(X86_PTE_A | X86_PTE_RW));
4008 AssertRC(rc);
4009 }
4010 return VINF_SUCCESS;
4011 }
4012 if ((fFlags1 & (X86_PTE_RW)) == X86_PTE_RW)
4013 GCPtrDst += cb1; /* fault on the 2nd page. */
4014 rc = VERR_ACCESS_DENIED;
4015 }
4016 else
4017 GCPtrDst += cb1; /* fault on the 2nd page. */
4018 }
4019 }
4020
4021 /*
4022 * Raise a #PF if we're allowed to do that.
4023 */
4024 /* Calc the error bits. */
4025 uint32_t uErr;
4026 uint32_t cpl = CPUMGetGuestCPL(pVCpu);
4027 switch (rc)
4028 {
4029 case VINF_SUCCESS:
4030 uErr = (cpl >= 2) ? X86_TRAP_PF_RSVD | X86_TRAP_PF_US : X86_TRAP_PF_RSVD;
4031 rc = VERR_ACCESS_DENIED;
4032 break;
4033
4034 case VERR_ACCESS_DENIED:
4035 uErr = (cpl >= 2) ? X86_TRAP_PF_RW | X86_TRAP_PF_US : X86_TRAP_PF_RW;
4036 break;
4037
4038 case VERR_PAGE_NOT_PRESENT:
4039 case VERR_PAGE_TABLE_NOT_PRESENT:
4040 uErr = (cpl >= 2) ? X86_TRAP_PF_US : 0;
4041 break;
4042
4043 default:
4044 AssertMsgFailed(("rc=%Rrc GCPtrDst=%RGv cb=%#x\n", rc, GCPtrDst, cb));
4045 AssertReturn(RT_FAILURE(rc), VERR_IPE_UNEXPECTED_INFO_STATUS);
4046 return rc;
4047 }
4048 if (fRaiseTrap)
4049 {
4050 Log(("PGMPhysInterpretedWriteNoHandlers: GCPtrDst=%RGv cb=%#x -> Raised #PF(%#x)\n", GCPtrDst, cb, uErr));
4051 rc = TRPMAssertXcptPF(pVCpu, GCPtrDst, uErr);
4052 if (RT_SUCCESS(rc))
4053 return VINF_EM_RAW_GUEST_TRAP;
4054 return rc;
4055 }
4056 Log(("PGMPhysInterpretedWriteNoHandlers: GCPtrDst=%RGv cb=%#x -> #PF(%#x) [!raised]\n", GCPtrDst, cb, uErr));
4057 return rc;
4058}
4059
4060
4061/**
4062 * Return the page type of the specified physical address.
4063 *
4064 * @returns The page type.
4065 * @param pVM The cross context VM structure.
4066 * @param GCPhys Guest physical address
4067 */
4068VMM_INT_DECL(PGMPAGETYPE) PGMPhysGetPageType(PVMCC pVM, RTGCPHYS GCPhys)
4069{
4070 PGM_LOCK_VOID(pVM);
4071 PPGMPAGE pPage = pgmPhysGetPage(pVM, GCPhys);
4072 PGMPAGETYPE enmPgType = pPage ? (PGMPAGETYPE)PGM_PAGE_GET_TYPE(pPage) : PGMPAGETYPE_INVALID;
4073 PGM_UNLOCK(pVM);
4074
4075 return enmPgType;
4076}
4077
4078
4079/**
4080 * Converts a GC physical address to a HC ring-3 pointer, with some
4081 * additional checks.
4082 *
4083 * @returns VBox status code (no informational statuses).
4084 *
4085 * @param pVM The cross context VM structure.
4086 * @param pVCpu The cross context virtual CPU structure of the
4087 * calling EMT.
4088 * @param GCPhys The GC physical address to convert. This API mask
4089 * the A20 line when necessary.
4090 * @param puTlbPhysRev Where to read the physical TLB revision. Needs to
4091 * be done while holding the PGM lock.
4092 * @param ppb Where to store the pointer corresponding to GCPhys
4093 * on success.
4094 * @param pfTlb The TLB flags and revision. We only add stuff.
4095 *
4096 * @remarks This is more or a less a copy of PGMR3PhysTlbGCPhys2Ptr and
4097 * PGMPhysIemGCPhys2Ptr.
4098 *
4099 * @thread EMT(pVCpu).
4100 */
4101VMM_INT_DECL(int) PGMPhysIemGCPhys2PtrNoLock(PVMCC pVM, PVMCPUCC pVCpu, RTGCPHYS GCPhys, uint64_t const volatile *puTlbPhysRev,
4102 R3R0PTRTYPE(uint8_t *) *ppb,
4103 uint64_t *pfTlb)
4104{
4105 PGM_A20_APPLY_TO_VAR(pVCpu, GCPhys);
4106 Assert(!(GCPhys & X86_PAGE_OFFSET_MASK));
4107
4108 PGM_LOCK_VOID(pVM);
4109
4110 PPGMRAMRANGE pRam;
4111 PPGMPAGE pPage;
4112 int rc = pgmPhysGetPageAndRangeEx(pVM, GCPhys, &pPage, &pRam);
4113 if (RT_SUCCESS(rc))
4114 {
4115 if (!PGM_PAGE_IS_BALLOONED(pPage))
4116 {
4117 if (!PGM_PAGE_IS_SPECIAL_ALIAS_MMIO(pPage))
4118 {
4119 if (!PGM_PAGE_HAS_ANY_HANDLERS(pPage))
4120 {
4121 /*
4122 * No access handler.
4123 */
4124 switch (PGM_PAGE_GET_STATE(pPage))
4125 {
4126 case PGM_PAGE_STATE_ALLOCATED:
4127 *pfTlb |= *puTlbPhysRev;
4128 break;
4129 case PGM_PAGE_STATE_BALLOONED:
4130 AssertFailed();
4131 RT_FALL_THRU();
4132 case PGM_PAGE_STATE_ZERO:
4133 case PGM_PAGE_STATE_SHARED:
4134 case PGM_PAGE_STATE_WRITE_MONITORED:
4135 *pfTlb |= *puTlbPhysRev | PGMIEMGCPHYS2PTR_F_NO_WRITE;
4136 break;
4137 }
4138
4139 PPGMPAGEMAPTLBE pTlbe;
4140 rc = pgmPhysPageQueryTlbeWithPage(pVM, pPage, GCPhys, &pTlbe);
4141 AssertLogRelRCReturn(rc, rc);
4142 *ppb = (uint8_t *)pTlbe->pv;
4143 }
4144 else if (PGM_PAGE_HAS_ACTIVE_ALL_HANDLERS(pPage))
4145 {
4146 /*
4147 * MMIO or similar all access handler: Catch all access.
4148 */
4149 *pfTlb |= *puTlbPhysRev
4150 | PGMIEMGCPHYS2PTR_F_NO_WRITE | PGMIEMGCPHYS2PTR_F_NO_READ | PGMIEMGCPHYS2PTR_F_NO_MAPPINGR3;
4151 *ppb = NULL;
4152 }
4153 else
4154 {
4155 /*
4156 * Write access handler: Catch write accesses if active.
4157 */
4158 if (PGM_PAGE_HAS_ACTIVE_HANDLERS(pPage))
4159 *pfTlb |= *puTlbPhysRev | PGMIEMGCPHYS2PTR_F_NO_WRITE;
4160 else
4161 switch (PGM_PAGE_GET_STATE(pPage))
4162 {
4163 case PGM_PAGE_STATE_ALLOCATED:
4164 *pfTlb |= *puTlbPhysRev;
4165 break;
4166 case PGM_PAGE_STATE_BALLOONED:
4167 AssertFailed();
4168 RT_FALL_THRU();
4169 case PGM_PAGE_STATE_ZERO:
4170 case PGM_PAGE_STATE_SHARED:
4171 case PGM_PAGE_STATE_WRITE_MONITORED:
4172 *pfTlb |= *puTlbPhysRev | PGMIEMGCPHYS2PTR_F_NO_WRITE;
4173 break;
4174 }
4175
4176 PPGMPAGEMAPTLBE pTlbe;
4177 rc = pgmPhysPageQueryTlbeWithPage(pVM, pPage, GCPhys, &pTlbe);
4178 AssertLogRelRCReturn(rc, rc);
4179 *ppb = (uint8_t *)pTlbe->pv;
4180 }
4181 }
4182 else
4183 {
4184 /* Alias MMIO: For now, we catch all access. */
4185 *pfTlb |= *puTlbPhysRev
4186 | PGMIEMGCPHYS2PTR_F_NO_WRITE | PGMIEMGCPHYS2PTR_F_NO_READ | PGMIEMGCPHYS2PTR_F_NO_MAPPINGR3;
4187 *ppb = NULL;
4188 }
4189 }
4190 else
4191 {
4192 /* Ballooned: Shouldn't get here, but we read zero page via PGMPhysRead and writes goes to /dev/null. */
4193 *pfTlb |= *puTlbPhysRev | PGMIEMGCPHYS2PTR_F_NO_WRITE | PGMIEMGCPHYS2PTR_F_NO_READ | PGMIEMGCPHYS2PTR_F_NO_MAPPINGR3;
4194 *ppb = NULL;
4195 }
4196 Log6(("PGMPhysIemGCPhys2PtrNoLock: GCPhys=%RGp *ppb=%p *pfTlb=%#RX64 pPage=%R[pgmpage]\n", GCPhys, *ppb, *pfTlb, pPage));
4197 }
4198 else
4199 {
4200 *pfTlb |= *puTlbPhysRev | PGMIEMGCPHYS2PTR_F_NO_WRITE | PGMIEMGCPHYS2PTR_F_NO_READ | PGMIEMGCPHYS2PTR_F_NO_MAPPINGR3;
4201 *ppb = NULL;
4202 Log6(("PGMPhysIemGCPhys2PtrNoLock: GCPhys=%RGp *ppb=%p *pfTlb=%#RX64 (rc=%Rrc)\n", GCPhys, *ppb, *pfTlb, rc));
4203 }
4204
4205 PGM_UNLOCK(pVM);
4206 return VINF_SUCCESS;
4207}
4208
4209
4210/**
4211 * Converts a GC physical address to a HC ring-3 pointer, with some
4212 * additional checks.
4213 *
4214 * @returns VBox status code (no informational statuses).
4215 * @retval VINF_SUCCESS on success.
4216 * @retval VERR_PGM_PHYS_TLB_CATCH_WRITE and *ppv set if the page has a write
4217 * access handler of some kind.
4218 * @retval VERR_PGM_PHYS_TLB_CATCH_ALL if the page has a handler catching all
4219 * accesses or is odd in any way.
4220 * @retval VERR_PGM_PHYS_TLB_UNASSIGNED if the page doesn't exist.
4221 *
4222 * @param pVM The cross context VM structure.
4223 * @param pVCpu The cross context virtual CPU structure of the
4224 * calling EMT.
4225 * @param GCPhys The GC physical address to convert. This API mask
4226 * the A20 line when necessary.
4227 * @param fWritable Whether write access is required.
4228 * @param fByPassHandlers Whether to bypass access handlers.
4229 * @param ppv Where to store the pointer corresponding to GCPhys
4230 * on success.
4231 * @param pLock
4232 *
4233 * @remarks This is more or a less a copy of PGMR3PhysTlbGCPhys2Ptr.
4234 * @thread EMT(pVCpu).
4235 */
4236VMM_INT_DECL(int) PGMPhysIemGCPhys2Ptr(PVMCC pVM, PVMCPUCC pVCpu, RTGCPHYS GCPhys, bool fWritable, bool fByPassHandlers,
4237 void **ppv, PPGMPAGEMAPLOCK pLock)
4238{
4239 PGM_A20_APPLY_TO_VAR(pVCpu, GCPhys);
4240
4241 PGM_LOCK_VOID(pVM);
4242
4243 PPGMRAMRANGE pRam;
4244 PPGMPAGE pPage;
4245 int rc = pgmPhysGetPageAndRangeEx(pVM, GCPhys, &pPage, &pRam);
4246 if (RT_SUCCESS(rc))
4247 {
4248 if (PGM_PAGE_IS_BALLOONED(pPage))
4249 rc = VERR_PGM_PHYS_TLB_CATCH_WRITE;
4250 else if (PGM_PAGE_IS_SPECIAL_ALIAS_MMIO(pPage))
4251 rc = VERR_PGM_PHYS_TLB_CATCH_ALL;
4252 else if ( !PGM_PAGE_HAS_ANY_HANDLERS(pPage)
4253 || (fByPassHandlers && !PGM_PAGE_IS_MMIO(pPage)) )
4254 rc = VINF_SUCCESS;
4255 else
4256 {
4257 if (PGM_PAGE_HAS_ACTIVE_ALL_HANDLERS(pPage)) /* catches MMIO */
4258 {
4259 Assert(!fByPassHandlers || PGM_PAGE_IS_MMIO(pPage));
4260 rc = VERR_PGM_PHYS_TLB_CATCH_ALL;
4261 }
4262 else if (PGM_PAGE_HAS_ACTIVE_HANDLERS(pPage) && fWritable)
4263 {
4264 Assert(!fByPassHandlers);
4265 rc = VERR_PGM_PHYS_TLB_CATCH_WRITE;
4266 }
4267 }
4268 if (RT_SUCCESS(rc))
4269 {
4270 int rc2;
4271
4272 /* Make sure what we return is writable. */
4273 if (fWritable)
4274 switch (PGM_PAGE_GET_STATE(pPage))
4275 {
4276 case PGM_PAGE_STATE_ALLOCATED:
4277 break;
4278 case PGM_PAGE_STATE_BALLOONED:
4279 AssertFailed();
4280 break;
4281 case PGM_PAGE_STATE_ZERO:
4282 case PGM_PAGE_STATE_SHARED:
4283 case PGM_PAGE_STATE_WRITE_MONITORED:
4284 rc2 = pgmPhysPageMakeWritable(pVM, pPage, GCPhys & ~(RTGCPHYS)PAGE_OFFSET_MASK);
4285 AssertLogRelRCReturn(rc2, rc2);
4286 break;
4287 }
4288
4289 /* Get a ring-3 mapping of the address. */
4290 PPGMPAGEMAPTLBE pTlbe;
4291 rc2 = pgmPhysPageQueryTlbeWithPage(pVM, pPage, GCPhys, &pTlbe);
4292 AssertLogRelRCReturn(rc2, rc2);
4293
4294 /* Lock it and calculate the address. */
4295 if (fWritable)
4296 pgmPhysPageMapLockForWriting(pVM, pPage, pTlbe, pLock);
4297 else
4298 pgmPhysPageMapLockForReading(pVM, pPage, pTlbe, pLock);
4299 *ppv = (void *)((uintptr_t)pTlbe->pv | (uintptr_t)(GCPhys & PAGE_OFFSET_MASK));
4300
4301 Log6(("PGMPhysIemGCPhys2Ptr: GCPhys=%RGp rc=%Rrc pPage=%R[pgmpage] *ppv=%p\n", GCPhys, rc, pPage, *ppv));
4302 }
4303 else
4304 Log6(("PGMPhysIemGCPhys2Ptr: GCPhys=%RGp rc=%Rrc pPage=%R[pgmpage]\n", GCPhys, rc, pPage));
4305
4306 /* else: handler catching all access, no pointer returned. */
4307 }
4308 else
4309 rc = VERR_PGM_PHYS_TLB_UNASSIGNED;
4310
4311 PGM_UNLOCK(pVM);
4312 return rc;
4313}
4314
4315
4316/**
4317 * Checks if the give GCPhys page requires special handling for the given access
4318 * because it's MMIO or otherwise monitored.
4319 *
4320 * @returns VBox status code (no informational statuses).
4321 * @retval VINF_SUCCESS on success.
4322 * @retval VERR_PGM_PHYS_TLB_CATCH_WRITE and *ppv set if the page has a write
4323 * access handler of some kind.
4324 * @retval VERR_PGM_PHYS_TLB_CATCH_ALL if the page has a handler catching all
4325 * accesses or is odd in any way.
4326 * @retval VERR_PGM_PHYS_TLB_UNASSIGNED if the page doesn't exist.
4327 *
4328 * @param pVM The cross context VM structure.
4329 * @param GCPhys The GC physical address to convert. Since this is
4330 * only used for filling the REM TLB, the A20 mask must
4331 * be applied before calling this API.
4332 * @param fWritable Whether write access is required.
4333 * @param fByPassHandlers Whether to bypass access handlers.
4334 *
4335 * @remarks This is a watered down version PGMPhysIemGCPhys2Ptr and really just
4336 * a stop gap thing that should be removed once there is a better TLB
4337 * for virtual address accesses.
4338 */
4339VMM_INT_DECL(int) PGMPhysIemQueryAccess(PVMCC pVM, RTGCPHYS GCPhys, bool fWritable, bool fByPassHandlers)
4340{
4341 PGM_LOCK_VOID(pVM);
4342 PGM_A20_ASSERT_MASKED(VMMGetCpu(pVM), GCPhys);
4343
4344 PPGMRAMRANGE pRam;
4345 PPGMPAGE pPage;
4346 int rc = pgmPhysGetPageAndRangeEx(pVM, GCPhys, &pPage, &pRam);
4347 if (RT_SUCCESS(rc))
4348 {
4349 if (PGM_PAGE_IS_BALLOONED(pPage))
4350 rc = VERR_PGM_PHYS_TLB_CATCH_WRITE;
4351 else if (PGM_PAGE_IS_SPECIAL_ALIAS_MMIO(pPage))
4352 rc = VERR_PGM_PHYS_TLB_CATCH_ALL;
4353 else if ( !PGM_PAGE_HAS_ANY_HANDLERS(pPage)
4354 || (fByPassHandlers && !PGM_PAGE_IS_MMIO(pPage)) )
4355 rc = VINF_SUCCESS;
4356 else
4357 {
4358 if (PGM_PAGE_HAS_ACTIVE_ALL_HANDLERS(pPage)) /* catches MMIO */
4359 {
4360 Assert(!fByPassHandlers || PGM_PAGE_IS_MMIO(pPage));
4361 rc = VERR_PGM_PHYS_TLB_CATCH_ALL;
4362 }
4363 else if (PGM_PAGE_HAS_ACTIVE_HANDLERS(pPage) && fWritable)
4364 {
4365 Assert(!fByPassHandlers);
4366 rc = VERR_PGM_PHYS_TLB_CATCH_WRITE;
4367 }
4368 }
4369 }
4370
4371 PGM_UNLOCK(pVM);
4372 return rc;
4373}
4374
4375
4376/**
4377 * Interface used by NEM to check what to do on a memory access exit.
4378 *
4379 * @returns VBox status code.
4380 * @param pVM The cross context VM structure.
4381 * @param pVCpu The cross context per virtual CPU structure.
4382 * Optional.
4383 * @param GCPhys The guest physical address.
4384 * @param fMakeWritable Whether to try make the page writable or not. If it
4385 * cannot be made writable, NEM_PAGE_PROT_WRITE won't
4386 * be returned and the return code will be unaffected
4387 * @param pInfo Where to return the page information. This is
4388 * initialized even on failure.
4389 * @param pfnChecker Page in-sync checker callback. Optional.
4390 * @param pvUser User argument to pass to pfnChecker.
4391 */
4392VMM_INT_DECL(int) PGMPhysNemPageInfoChecker(PVMCC pVM, PVMCPUCC pVCpu, RTGCPHYS GCPhys, bool fMakeWritable, PPGMPHYSNEMPAGEINFO pInfo,
4393 PFNPGMPHYSNEMCHECKPAGE pfnChecker, void *pvUser)
4394{
4395 PGM_LOCK_VOID(pVM);
4396
4397 PPGMPAGE pPage;
4398 int rc = pgmPhysGetPageEx(pVM, GCPhys, &pPage);
4399 if (RT_SUCCESS(rc))
4400 {
4401 /* Try make it writable if requested. */
4402 pInfo->u2OldNemState = PGM_PAGE_GET_NEM_STATE(pPage);
4403 if (fMakeWritable)
4404 switch (PGM_PAGE_GET_STATE(pPage))
4405 {
4406 case PGM_PAGE_STATE_SHARED:
4407 case PGM_PAGE_STATE_WRITE_MONITORED:
4408 case PGM_PAGE_STATE_ZERO:
4409 rc = pgmPhysPageMakeWritable(pVM, pPage, GCPhys);
4410 if (rc == VERR_PGM_PHYS_PAGE_RESERVED)
4411 rc = VINF_SUCCESS;
4412 break;
4413 }
4414
4415 /* Fill in the info. */
4416 pInfo->HCPhys = PGM_PAGE_GET_HCPHYS(pPage);
4417 pInfo->u2NemState = PGM_PAGE_GET_NEM_STATE(pPage);
4418 pInfo->fHasHandlers = PGM_PAGE_HAS_ACTIVE_HANDLERS(pPage) ? 1 : 0;
4419 PGMPAGETYPE const enmType = (PGMPAGETYPE)PGM_PAGE_GET_TYPE(pPage);
4420 pInfo->enmType = enmType;
4421 pInfo->fNemProt = pgmPhysPageCalcNemProtection(pPage, enmType);
4422 switch (PGM_PAGE_GET_STATE(pPage))
4423 {
4424 case PGM_PAGE_STATE_ALLOCATED:
4425 pInfo->fZeroPage = 0;
4426 break;
4427
4428 case PGM_PAGE_STATE_ZERO:
4429 pInfo->fZeroPage = 1;
4430 break;
4431
4432 case PGM_PAGE_STATE_WRITE_MONITORED:
4433 pInfo->fZeroPage = 0;
4434 break;
4435
4436 case PGM_PAGE_STATE_SHARED:
4437 pInfo->fZeroPage = 0;
4438 break;
4439
4440 case PGM_PAGE_STATE_BALLOONED:
4441 pInfo->fZeroPage = 1;
4442 break;
4443
4444 default:
4445 pInfo->fZeroPage = 1;
4446 AssertFailedStmt(rc = VERR_PGM_PHYS_PAGE_GET_IPE);
4447 }
4448
4449 /* Call the checker and update NEM state. */
4450 if (pfnChecker)
4451 {
4452 rc = pfnChecker(pVM, pVCpu, GCPhys, pInfo, pvUser);
4453 PGM_PAGE_SET_NEM_STATE(pPage, pInfo->u2NemState);
4454 }
4455
4456 /* Done. */
4457 PGM_UNLOCK(pVM);
4458 }
4459 else
4460 {
4461 PGM_UNLOCK(pVM);
4462
4463 pInfo->HCPhys = NIL_RTHCPHYS;
4464 pInfo->fNemProt = NEM_PAGE_PROT_NONE;
4465 pInfo->u2NemState = 0;
4466 pInfo->fHasHandlers = 0;
4467 pInfo->fZeroPage = 0;
4468 pInfo->enmType = PGMPAGETYPE_INVALID;
4469 }
4470
4471 return rc;
4472}
4473
4474
4475/**
4476 * NEM helper that performs @a pfnCallback on pages with NEM state @a uMinState
4477 * or higher.
4478 *
4479 * @returns VBox status code from callback.
4480 * @param pVM The cross context VM structure.
4481 * @param pVCpu The cross context per CPU structure. This is
4482 * optional as its only for passing to callback.
4483 * @param uMinState The minimum NEM state value to call on.
4484 * @param pfnCallback The callback function.
4485 * @param pvUser User argument for the callback.
4486 */
4487VMM_INT_DECL(int) PGMPhysNemEnumPagesByState(PVMCC pVM, PVMCPUCC pVCpu, uint8_t uMinState,
4488 PFNPGMPHYSNEMENUMCALLBACK pfnCallback, void *pvUser)
4489{
4490 /*
4491 * Just brute force this problem.
4492 */
4493 PGM_LOCK_VOID(pVM);
4494 int rc = VINF_SUCCESS;
4495 for (PPGMRAMRANGE pRam = pVM->pgm.s.CTX_SUFF(pRamRangesX); pRam; pRam = pRam->CTX_SUFF(pNext))
4496 {
4497 uint32_t const cPages = pRam->cb >> X86_PAGE_SHIFT;
4498 for (uint32_t iPage = 0; iPage < cPages; iPage++)
4499 {
4500 uint8_t u2State = PGM_PAGE_GET_NEM_STATE(&pRam->aPages[iPage]);
4501 if (u2State < uMinState)
4502 { /* likely */ }
4503 else
4504 {
4505 rc = pfnCallback(pVM, pVCpu, pRam->GCPhys + ((RTGCPHYS)iPage << X86_PAGE_SHIFT), &u2State, pvUser);
4506 if (RT_SUCCESS(rc))
4507 PGM_PAGE_SET_NEM_STATE(&pRam->aPages[iPage], u2State);
4508 else
4509 break;
4510 }
4511 }
4512 }
4513 PGM_UNLOCK(pVM);
4514
4515 return rc;
4516}
4517
Note: See TracBrowser for help on using the repository browser.

© 2024 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette