]> git.saurik.com Git - apple/xnu.git/blame - osfmk/i386/pmap.h
xnu-1486.2.11.tar.gz
[apple/xnu.git] / osfmk / i386 / pmap.h
CommitLineData
1c79356b 1/*
0c530ab8 2 * Copyright (c) 2000-2007 Apple Inc. All rights reserved.
1c79356b 3 *
2d21ac55 4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
8f6c56a5 5 *
2d21ac55
A
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
8f6c56a5 14 *
2d21ac55
A
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
17 *
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
8f6c56a5
A
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
2d21ac55
A
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
8f6c56a5 25 *
2d21ac55 26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
1c79356b
A
27 */
28/*
29 * @OSF_COPYRIGHT@
30 */
31/*
32 * Mach Operating System
33 * Copyright (c) 1991,1990,1989,1988 Carnegie Mellon University
34 * All Rights Reserved.
35 *
36 * Permission to use, copy, modify and distribute this software and its
37 * documentation is hereby granted, provided that both the copyright
38 * notice and this permission notice appear in all copies of the
39 * software, derivative works or modified versions, and any portions
40 * thereof, and that both notices appear in supporting documentation.
41 *
42 * CARNEGIE MELLON ALLOWS FREE USE OF THIS SOFTWARE IN ITS "AS IS"
43 * CONDITION. CARNEGIE MELLON DISCLAIMS ANY LIABILITY OF ANY KIND FOR
44 * ANY DAMAGES WHATSOEVER RESULTING FROM THE USE OF THIS SOFTWARE.
45 *
46 * Carnegie Mellon requests users of this software to return to
47 *
48 * Software Distribution Coordinator or Software.Distribution@CS.CMU.EDU
49 * School of Computer Science
50 * Carnegie Mellon University
51 * Pittsburgh PA 15213-3890
52 *
53 * any improvements or extensions that they make and grant Carnegie Mellon
54 * the rights to redistribute these changes.
55 */
56/*
57 */
58
59/*
60 * File: pmap.h
61 *
62 * Authors: Avadis Tevanian, Jr., Michael Wayne Young
63 * Date: 1985
64 *
65 * Machine-dependent structures for the physical map module.
66 */
0c530ab8 67#ifdef KERNEL_PRIVATE
1c79356b
A
68#ifndef _PMAP_MACHINE_
69#define _PMAP_MACHINE_ 1
70
71#ifndef ASSEMBLER
72
73#include <platforms.h>
1c79356b
A
74
75#include <mach/kern_return.h>
76#include <mach/machine/vm_types.h>
77#include <mach/vm_prot.h>
78#include <mach/vm_statistics.h>
79#include <mach/machine/vm_param.h>
80#include <kern/kern_types.h>
91447636 81#include <kern/thread.h>
1c79356b 82#include <kern/lock.h>
0c530ab8
A
83
84#include <i386/mp.h>
85#include <i386/proc_reg.h>
1c79356b
A
86
87/*
88 * Define the generic in terms of the specific
89 */
90
91#define INTEL_PGBYTES I386_PGBYTES
92#define INTEL_PGSHIFT I386_PGSHIFT
93#define intel_btop(x) i386_btop(x)
94#define intel_ptob(x) i386_ptob(x)
95#define intel_round_page(x) i386_round_page(x)
96#define intel_trunc_page(x) i386_trunc_page(x)
97#define trunc_intel_to_vm(x) trunc_i386_to_vm(x)
98#define round_intel_to_vm(x) round_i386_to_vm(x)
99#define vm_to_intel(x) vm_to_i386(x)
100
101/*
102 * i386/i486/i860 Page Table Entry
103 */
104
1c79356b
A
105#endif /* ASSEMBLER */
106
91447636
A
107#define NPGPTD 4
108#define PDESHIFT 21
109#define PTEMASK 0x1ff
110#define PTEINDX 3
0c530ab8 111
91447636
A
112#define PTESHIFT 12
113
b0d623f7
A
114
115#define INITPT_SEG_BASE 0x100000
116#define INITGDT_SEG_BASE 0x106000
117#define SLEEP_SEG_BASE 0x107000
118
119#ifdef __x86_64__
120#define LOW_4GB_MASK ((vm_offset_t)0x00000000FFFFFFFFUL)
121#endif
122
91447636
A
123#define PDESIZE sizeof(pd_entry_t) /* for assembly files */
124#define PTESIZE sizeof(pt_entry_t) /* for assembly files */
125
126#define INTEL_OFFMASK (I386_PGBYTES - 1)
b0d623f7 127#define INTEL_LOFFMASK (I386_LPGBYTES - 1)
0c530ab8 128#define PG_FRAME 0x000FFFFFFFFFF000ULL
91447636 129#define NPTEPG (PAGE_SIZE/(sizeof (pt_entry_t)))
0c530ab8 130#define NPTDPG (PAGE_SIZE/(sizeof (pd_entry_t)))
1c79356b 131
91447636
A
132#define NBPTD (NPGPTD << PAGE_SHIFT)
133#define NPDEPTD (NBPTD / (sizeof (pd_entry_t)))
134#define NPDEPG (PAGE_SIZE/(sizeof (pd_entry_t)))
135#define NBPDE (1 << PDESHIFT)
136#define PDEMASK (NBPDE - 1)
9bccf70c 137
b0d623f7
A
138#define PTE_PER_PAGE 512 /* number of PTE's per page on any level */
139
0c530ab8
A
140 /* cleanly define parameters for all the page table levels */
141typedef uint64_t pml4_entry_t;
142#define NPML4PG (PAGE_SIZE/(sizeof (pml4_entry_t)))
143#define PML4SHIFT 39
144#define PML4PGSHIFT 9
145#define NBPML4 (1ULL << PML4SHIFT)
146#define PML4MASK (NBPML4-1)
147#define PML4_ENTRY_NULL ((pml4_entry_t *) 0)
148
149typedef uint64_t pdpt_entry_t;
150#define NPDPTPG (PAGE_SIZE/(sizeof (pdpt_entry_t)))
151#define PDPTSHIFT 30
152#define PDPTPGSHIFT 9
153#define NBPDPT (1 << PDPTSHIFT)
154#define PDPTMASK (NBPDPT-1)
155#define PDPT_ENTRY_NULL ((pdpt_entry_t *) 0)
156
157typedef uint64_t pd_entry_t;
158#define NPDPG (PAGE_SIZE/(sizeof (pd_entry_t)))
159#define PDSHIFT 21
160#define PDPGSHIFT 9
161#define NBPD (1 << PDSHIFT)
162#define PDMASK (NBPD-1)
163#define PD_ENTRY_NULL ((pd_entry_t *) 0)
164
165typedef uint64_t pt_entry_t;
166#define NPTPG (PAGE_SIZE/(sizeof (pt_entry_t)))
167#define PTSHIFT 12
168#define PTPGSHIFT 9
169#define NBPT (1 << PTSHIFT)
170#define PTMASK (NBPT-1)
171#define PT_ENTRY_NULL ((pt_entry_t *) 0)
172
173typedef uint64_t pmap_paddr_t;
174
b0d623f7
A
175/* superpages */
176#ifdef __x86_64__
177#define SUPERPAGE_NBASEPAGES 512
178#else
179#define SUPERPAGE_NBASEPAGES 1 /* we don't support superpages on i386 */
180#endif
181
0c530ab8
A
182/*
183 * Atomic 64-bit store of a page table entry.
184 */
185static inline void
186pmap_store_pte(pt_entry_t *entryp, pt_entry_t value)
187{
b0d623f7 188#ifdef __i386__
0c530ab8
A
189 /*
190 * Load the new value into %ecx:%ebx
191 * Load the old value into %edx:%eax
192 * Compare-exchange-8bytes at address entryp (loaded in %edi)
193 * If the compare succeeds, the new value will have been stored.
194 * Otherwise, the old value changed and reloaded, so try again.
195 */
2d21ac55 196 __asm__ volatile(
0c530ab8
A
197 " movl (%0), %%eax \n\t"
198 " movl 4(%0), %%edx \n\t"
199 "1: \n\t"
200 " cmpxchg8b (%0) \n\t"
201 " jnz 1b"
202 :
203 : "D" (entryp),
204 "b" ((uint32_t)value),
205 "c" ((uint32_t)(value >> 32))
206 : "eax", "edx", "memory");
b0d623f7
A
207#else
208 /*
209 * In the 32-bit kernel a compare-and-exchange loop was
210 * required to provide atomicity. For K64, life is easier:
211 */
212 *entryp = value;
213#endif
0c530ab8
A
214}
215
216/*
217 * Atomic 64-bit compare and exchange of a page table entry.
218 */
219static inline boolean_t
220pmap_cmpx_pte(pt_entry_t *entryp, pt_entry_t old, pt_entry_t new)
221{
222 boolean_t ret;
223
b0d623f7 224#ifdef __i386__
0c530ab8
A
225 /*
226 * Load the old value into %edx:%eax
227 * Load the new value into %ecx:%ebx
228 * Compare-exchange-8bytes at address entryp (loaded in %edi)
229 * If the compare succeeds, the new value is stored, return TRUE.
230 * Otherwise, no swap is made, return FALSE.
231 */
232 asm volatile(
233 " lock; cmpxchg8b (%1) \n\t"
234 " setz %%al \n\t"
235 " movzbl %%al,%0"
236 : "=a" (ret)
237 : "D" (entryp),
238 "a" ((uint32_t)old),
239 "d" ((uint32_t)(old >> 32)),
240 "b" ((uint32_t)new),
241 "c" ((uint32_t)(new >> 32))
242 : "memory");
b0d623f7
A
243#else
244 /*
245 * Load the old value into %rax
246 * Load the new value into another register
247 * Compare-exchange-quad at address entryp
248 * If the compare succeeds, the new value is stored, return TRUE.
249 * Otherwise, no swap is made, return FALSE.
250 */
251 asm volatile(
252 " lock; cmpxchgq %2,(%3) \n\t"
253 " setz %%al \n\t"
254 " movzbl %%al,%0"
255 : "=a" (ret)
256 : "a" (old),
257 "r" (new),
258 "r" (entryp)
259 : "memory");
260#endif
0c530ab8
A
261 return ret;
262}
263
264#define pmap_update_pte(entryp, old, new) \
265 while (!pmap_cmpx_pte((entryp), (old), (new)))
266
2d21ac55 267
0c530ab8
A
268/* in 64 bit spaces, the number of each type of page in the page tables */
269#define NPML4PGS (1ULL * (PAGE_SIZE/(sizeof (pml4_entry_t))))
270#define NPDPTPGS (NPML4PGS * (PAGE_SIZE/(sizeof (pdpt_entry_t))))
271#define NPDEPGS (NPDPTPGS * (PAGE_SIZE/(sizeof (pd_entry_t))))
272#define NPTEPGS (NPDEPGS * (PAGE_SIZE/(sizeof (pt_entry_t))))
273
b0d623f7 274#ifdef __i386__
0c530ab8
A
275/*
276 * The 64-bit kernel is remapped in uber-space which is at the base
277 * the highest 4th-level directory (KERNEL_UBER_PML4_INDEX). That is,
278 * 512GB from the top of virtual space (or zero).
279 */
280#define KERNEL_UBER_PML4_INDEX 511
281#define KERNEL_UBER_BASE (0ULL - NBPML4)
282#define KERNEL_UBER_BASE_HI32 ((uint32_t)(KERNEL_UBER_BASE >> 32))
b0d623f7
A
283#else
284#define KERNEL_PML4_INDEX 511
285#define KERNEL_KEXTS_INDEX 510 /* Home of KEXTs - the basement */
286#define KERNEL_PHYSMAP_INDEX 509 /* virtual to physical map */
287#define KERNEL_BASE (0ULL - NBPML4)
288#define KERNEL_BASEMENT (KERNEL_BASE - NBPML4)
289#endif
0c530ab8 290
55e303ae 291#define VM_WIMG_COPYBACK VM_MEM_COHERENT
9bccf70c 292#define VM_WIMG_DEFAULT VM_MEM_COHERENT
55e303ae
A
293/* ?? intel ?? */
294#define VM_WIMG_IO (VM_MEM_COHERENT | \
295 VM_MEM_NOT_CACHEABLE | VM_MEM_GUARDED)
296#define VM_WIMG_WTHRU (VM_MEM_WRITE_THROUGH | VM_MEM_COHERENT | VM_MEM_GUARDED)
297/* write combining mode, aka store gather */
298#define VM_WIMG_WCOMB (VM_MEM_NOT_CACHEABLE | VM_MEM_COHERENT)
9bccf70c 299
0c530ab8
A
300/*
301 * Pte related macros
302 */
b0d623f7 303#ifdef __i386__
0c530ab8
A
304#define VADDR(pdi, pti) ((vm_offset_t)(((pdi)<<PDESHIFT)|((pti)<<PTESHIFT)))
305#define VADDR64(pmi, pdi, pti) ((vm_offset_t)(((pmi)<<PLM4SHIFT))((pdi)<<PDESHIFT)|((pti)<<PTESHIFT))
b0d623f7
A
306#else
307#define KVADDR(pmi, pdpi, pdi, pti) \
308 ((vm_offset_t) \
309 ((uint64_t) -1 << 47) | \
310 ((uint64_t)(pmi) << PML4SHIFT) | \
311 ((uint64_t)(pdpi) << PDPTSHIFT) | \
312 ((uint64_t)(pdi) << PDESHIFT) | \
313 ((uint64_t)(pti) << PTESHIFT))
314#endif
0c530ab8 315
1c79356b 316/*
91447636
A
317 * Size of Kernel address space. This is the number of page table pages
318 * (4MB each) to use for the kernel. 256 pages == 1 Gigabyte.
319 * This **MUST** be a multiple of 4 (eg: 252, 256, 260, etc).
1c79356b 320 */
91447636 321#ifndef KVA_PAGES
0c530ab8 322#define KVA_PAGES 1024
91447636 323#endif
1c79356b 324
91447636 325#ifndef NKPT
91447636 326#define NKPT 500 /* actual number of kernel page tables */
91447636
A
327#endif
328#ifndef NKPDE
329#define NKPDE (KVA_PAGES - 1) /* addressable number of page tables/pde's */
330#endif
331
0c530ab8 332
b0d623f7 333#ifdef __i386__
0c530ab8
A
334enum high_cpu_types {
335 HIGH_CPU_ISS0,
336 HIGH_CPU_ISS1,
337 HIGH_CPU_DESC,
338 HIGH_CPU_LDT_BEGIN,
339 HIGH_CPU_LDT_END = HIGH_CPU_LDT_BEGIN + (LDTSZ / 512) - 1,
340 HIGH_CPU_END
341};
342
343enum high_fixed_addresses {
344 HIGH_FIXED_TRAMPS, /* must be first */
345 HIGH_FIXED_TRAMPS_END,
346 HIGH_FIXED_GDT,
347 HIGH_FIXED_IDT,
348 HIGH_FIXED_LDT_BEGIN,
349 HIGH_FIXED_LDT_END = HIGH_FIXED_LDT_BEGIN + (LDTSZ / 512) - 1,
350 HIGH_FIXED_KTSS,
351 HIGH_FIXED_DFTSS,
352 HIGH_FIXED_DBTSS,
353 HIGH_FIXED_CPUS_BEGIN,
354 HIGH_FIXED_CPUS_END = HIGH_FIXED_CPUS_BEGIN + (HIGH_CPU_END * MAX_CPUS) - 1,
355};
356
357
358/* XXX64 below PTDI values need cleanup */
91447636
A
359/*
360 * The *PTDI values control the layout of virtual memory
361 *
362 */
0c530ab8 363#define KPTDI (0x000)/* start of kernel virtual pde's */
91447636
A
364#define PTDPTDI (0x7F4) /* ptd entry that points to ptd! */
365#define APTDPTDI (0x7F8) /* alt ptd entry that points to APTD */
0c530ab8 366#define UMAXPTDI (0x7F8) /* ptd entry for user space end */
6601e61a 367#define UMAXPTEOFF (NPTEPG) /* pte entry for user space end */
91447636
A
368
369#define KERNBASE VADDR(KPTDI,0)
1c79356b 370
0c530ab8
A
371/*
372 * Convert address offset to directory address
373 * containing the page table pointer - legacy
374 */
375/*#define pmap_pde(m,v) (&((m)->dirbase[(vm_offset_t)(v) >> PDESHIFT]))*/
376
377#define HIGH_MEM_BASE ((uint32_t)( -NBPDE) ) /* shared gdt etc seg addr */ /* XXX64 ?? */
378#define pmap_index_to_virt(x) (HIGH_MEM_BASE | ((unsigned)(x) << PAGE_SHIFT))
b0d623f7 379#endif
0c530ab8 380
1c79356b
A
381/*
382 * Convert address offset to page descriptor index
383 */
b0d623f7
A
384#define pdptnum(pmap, a) (((vm_offset_t)(a) >> PDPTSHIFT) & PDPTMASK)
385#define pdenum(pmap, a) (((vm_offset_t)(a) >> PDESHIFT) & PDEMASK)
386#define PMAP_INVALID_PDPTNUM (~0ULL)
91447636 387
b0d623f7 388#ifdef __i386__
0c530ab8
A
389#define pdeidx(pmap, a) (((a) >> PDSHIFT) & ((1ULL<<(48 - PDSHIFT)) -1))
390#define pdptidx(pmap, a) (((a) >> PDPTSHIFT) & ((1ULL<<(48 - PDPTSHIFT)) -1))
391#define pml4idx(pmap, a) (((a) >> PML4SHIFT) & ((1ULL<<(48 - PML4SHIFT)) -1))
b0d623f7
A
392#else
393#define VAMASK ((1ULL<<48)-1)
394#define pml4idx(pmap, a) ((((a) & VAMASK) >> PML4SHIFT) & \
395 ((1ULL<<(48 - PML4SHIFT))-1))
396#define pdptidx(pmap, a) ((((a) & PML4MASK) >> PDPTSHIFT) & \
397 ((1ULL<<(48 - PDPTSHIFT))-1))
398#define pdeidx(pmap, a) ((((a) & PML4MASK) >> PDSHIFT) & \
399 ((1ULL<<(48 - PDSHIFT)) - 1))
400#endif
1c79356b
A
401
402/*
403 * Convert page descriptor index to user virtual address
404 */
405#define pdetova(a) ((vm_offset_t)(a) << PDESHIFT)
406
407/*
408 * Convert address offset to page table index
409 */
0c530ab8 410#define ptenum(a) (((vm_offset_t)(a) >> PTESHIFT) & PTEMASK)
1c79356b 411
1c79356b
A
412/*
413 * Hardware pte bit definitions (to be used directly on the ptes
414 * without using the bit fields).
415 */
416
417#define INTEL_PTE_VALID 0x00000001
418#define INTEL_PTE_WRITE 0x00000002
91447636 419#define INTEL_PTE_RW 0x00000002
1c79356b
A
420#define INTEL_PTE_USER 0x00000004
421#define INTEL_PTE_WTHRU 0x00000008
422#define INTEL_PTE_NCACHE 0x00000010
423#define INTEL_PTE_REF 0x00000020
424#define INTEL_PTE_MOD 0x00000040
b0d623f7
A
425#define INTEL_PTE_PS 0x00000080
426#define INTEL_PTE_PTA 0x00000080
427#define INTEL_PTE_GLOBAL 0x00000100
1c79356b 428#define INTEL_PTE_WIRED 0x00000200
b0d623f7 429#define INTEL_PDPTE_NESTED 0x00000400
0c530ab8 430#define INTEL_PTE_PFN PG_FRAME
1c79356b 431
0c530ab8
A
432#define INTEL_PTE_NX (1ULL << 63)
433
434#define INTEL_PTE_INVALID 0
435
91447636
A
436#define pa_to_pte(a) ((a) & INTEL_PTE_PFN) /* XXX */
437#define pte_to_pa(p) ((p) & INTEL_PTE_PFN) /* XXX */
1c79356b
A
438#define pte_increment_pa(p) ((p) += INTEL_OFFMASK+1)
439
0c530ab8
A
440#define pte_kernel_rw(p) ((pt_entry_t)(pa_to_pte(p) | INTEL_PTE_VALID|INTEL_PTE_RW))
441#define pte_kernel_ro(p) ((pt_entry_t)(pa_to_pte(p) | INTEL_PTE_VALID))
442#define pte_user_rw(p) ((pt_entry)t)(pa_to_pte(p) | INTEL_PTE_VALID|INTEL_PTE_USER|INTEL_PTE_RW))
443#define pte_user_ro(p) ((pt_entry_t)(pa_to_pte(p) | INTEL_PTE_VALID|INTEL_PTE_USER))
444
9bccf70c
A
445#define PMAP_DEFAULT_CACHE 0
446#define PMAP_INHIBIT_CACHE 1
447#define PMAP_GUARDED_CACHE 2
448#define PMAP_ACTIVATE_CACHE 4
449#define PMAP_NO_GUARD_CACHE 8
450
451
91447636
A
452#ifndef ASSEMBLER
453
454#include <sys/queue.h>
455
1c79356b 456/*
91447636
A
457 * Address of current and alternate address space page table maps
458 * and directories.
1c79356b 459 */
1c79356b 460
b0d623f7
A
461#ifdef __i386__
462extern pt_entry_t PTmap[], APTmap[], Upte;
463extern pd_entry_t PTD[], APTD[], PTDpde[], APTDpde[], Upde;
464extern pmap_paddr_t lo_kernel_cr3;
465extern pdpt_entry_t *IdlePDPT64;
466#else
467extern pt_entry_t *PTmap;
468#endif
469extern boolean_t no_shared_cr3;
470extern addr64_t kernel64_cr3;
471extern pd_entry_t *IdlePTD; /* physical addr of "Idle" state PTD */
472extern pdpt_entry_t IdlePDPT[];
473extern pml4_entry_t IdlePML4[];
474
475extern uint64_t pmap_pv_hashlist_walks;
476extern uint64_t pmap_pv_hashlist_cnts;
477extern uint32_t pmap_pv_hashlist_max;
478extern uint32_t pmap_kernel_text_ps;
479
480#ifdef __i386__
91447636 481/*
b0d623f7 482 * ** i386 **
91447636
A
483 * virtual address to page table entry and
484 * to physical address. Likewise for alternate address space.
485 * Note: these work recursively, thus vtopte of a pte will give
486 * the corresponding pde that in turn maps it.
487 */
b0d623f7 488
0c530ab8 489#define vtopte(va) (PTmap + i386_btop((vm_offset_t)va))
b0d623f7
A
490#endif
491
492#ifdef __x86_64__
493#define ID_MAP_VTOP(x) ((void *)(((uint64_t)(x)) & LOW_4GB_MASK))
91447636 494
b0d623f7
A
495#define PHYSMAP_BASE KVADDR(KERNEL_PHYSMAP_INDEX,0,0,0)
496#define PHYSMAP_PTOV(x) ((void *)(((uint64_t)(x)) + PHYSMAP_BASE))
497#endif
91447636 498
1c79356b
A
499typedef volatile long cpu_set; /* set of CPUs - must be <= 32 */
500 /* changed by other processors */
91447636
A
501struct md_page {
502 int pv_list_count;
503 TAILQ_HEAD(,pv_entry) pv_list;
504};
505
506#include <vm/vm_page.h>
507
508/*
509 * For each vm_page_t, there is a list of all currently
510 * valid virtual mappings of that page. An entry is
511 * a pv_entry_t; the list is the pv_table.
512 */
1c79356b
A
513
514struct pmap {
0c530ab8 515 pd_entry_t *dirbase; /* page directory pointer */
b0d623f7 516#ifdef __i386__
0c530ab8 517 pmap_paddr_t pdirbase; /* phys. address of dirbase */
b0d623f7 518#endif
0c530ab8 519 vm_object_t pm_obj; /* object to hold pde's */
1c79356b 520 int ref_count; /* reference count */
0c530ab8 521 int nx_enabled;
2d21ac55 522 task_map_t pm_task_map;
1c79356b
A
523 decl_simple_lock_data(,lock) /* lock on map */
524 struct pmap_statistics stats; /* map statistics */
b0d623f7 525#ifdef __i386__
91447636 526 vm_offset_t pm_hold; /* true pdpt zalloc addr */
b0d623f7 527#endif
0c530ab8
A
528 pmap_paddr_t pm_cr3; /* physical addr */
529 pdpt_entry_t *pm_pdpt; /* KVA of 3rd level page */
530 pml4_entry_t *pm_pml4; /* VKA of top level */
531 vm_object_t pm_obj_pdpt; /* holds pdpt pages */
532 vm_object_t pm_obj_pml4; /* holds pml4 pages */
533 vm_object_t pm_obj_top; /* holds single top level page */
2d21ac55 534 boolean_t pm_shared;
1c79356b
A
535};
536
0c530ab8 537
b0d623f7 538#if NCOPY_WINDOWS > 0
0c530ab8
A
539#define PMAP_PDPT_FIRST_WINDOW 0
540#define PMAP_PDPT_NWINDOWS 4
541#define PMAP_PDE_FIRST_WINDOW (PMAP_PDPT_NWINDOWS)
542#define PMAP_PDE_NWINDOWS 4
543#define PMAP_PTE_FIRST_WINDOW (PMAP_PDE_FIRST_WINDOW + PMAP_PDE_NWINDOWS)
544#define PMAP_PTE_NWINDOWS 4
545
546#define PMAP_NWINDOWS_FIRSTFREE (PMAP_PTE_FIRST_WINDOW + PMAP_PTE_NWINDOWS)
547#define PMAP_WINDOW_SIZE 8
548#define PMAP_NWINDOWS (PMAP_NWINDOWS_FIRSTFREE + PMAP_WINDOW_SIZE)
549
91447636
A
550typedef struct {
551 pt_entry_t *prv_CMAP;
552 caddr_t prv_CADDR;
553} mapwindow_t;
554
555typedef struct cpu_pmap {
0c530ab8
A
556 int pdpt_window_index;
557 int pde_window_index;
558 int pte_window_index;
91447636 559 mapwindow_t mapwindow[PMAP_NWINDOWS];
91447636
A
560} cpu_pmap_t;
561
0c530ab8
A
562
563extern mapwindow_t *pmap_get_mapwindow(pt_entry_t pentry);
2d21ac55 564extern void pmap_put_mapwindow(mapwindow_t *map);
b0d623f7 565#endif
91447636
A
566
567typedef struct pmap_memory_regions {
568 ppnum_t base;
569 ppnum_t end;
570 ppnum_t alloc;
571 uint32_t type;
572} pmap_memory_region_t;
573
b0d623f7
A
574extern unsigned pmap_memory_region_count;
575extern unsigned pmap_memory_region_current;
91447636 576
0c530ab8 577#define PMAP_MEMORY_REGIONS_SIZE 128
91447636
A
578
579extern pmap_memory_region_t pmap_memory_regions[];
580
b0d623f7
A
581static inline void
582set_dirbase(pmap_t tpmap, __unused thread_t thread) {
583 current_cpu_datap()->cpu_task_cr3 = tpmap->pm_cr3;
2d21ac55 584 current_cpu_datap()->cpu_task_map = tpmap->pm_task_map;
b0d623f7
A
585#ifndef __i386__
586 /*
587 * Switch cr3 if necessary
588 * - unless running with no_shared_cr3 debugging mode
589 * and we're not on the kernel's cr3 (after pre-empted copyio)
590 */
591 if (!no_shared_cr3) {
592 if (get_cr3() != tpmap->pm_cr3)
593 set_cr3(tpmap->pm_cr3);
594 } else {
595 if (get_cr3() != current_cpu_datap()->cpu_kernel_cr3)
596 set_cr3(current_cpu_datap()->cpu_kernel_cr3);
597 }
598#endif
1c79356b
A
599}
600
1c79356b
A
601/*
602 * External declarations for PMAP_ACTIVATE.
603 */
604
0c530ab8 605extern void process_pmap_updates(void);
1c79356b 606extern void pmap_update_interrupt(void);
1c79356b
A
607
608/*
609 * Machine dependent routines that are used only for i386/i486/i860.
610 */
1c79356b 611
0c530ab8 612extern addr64_t (kvtophys)(
1c79356b
A
613 vm_offset_t addr);
614
2d21ac55
A
615extern void pmap_expand(
616 pmap_t pmap,
617 vm_map_offset_t addr);
618
1c79356b
A
619extern pt_entry_t *pmap_pte(
620 struct pmap *pmap,
0c530ab8
A
621 vm_map_offset_t addr);
622
623extern pd_entry_t *pmap_pde(
624 struct pmap *pmap,
625 vm_map_offset_t addr);
626
627extern pd_entry_t *pmap64_pde(
628 struct pmap *pmap,
629 vm_map_offset_t addr);
630
631extern pdpt_entry_t *pmap64_pdpt(
632 struct pmap *pmap,
633 vm_map_offset_t addr);
1c79356b
A
634
635extern vm_offset_t pmap_map(
636 vm_offset_t virt,
0c530ab8
A
637 vm_map_offset_t start,
638 vm_map_offset_t end,
639 vm_prot_t prot,
640 unsigned int flags);
1c79356b
A
641
642extern vm_offset_t pmap_map_bd(
643 vm_offset_t virt,
0c530ab8
A
644 vm_map_offset_t start,
645 vm_map_offset_t end,
646 vm_prot_t prot,
647 unsigned int flags);
1c79356b
A
648
649extern void pmap_bootstrap(
0c530ab8
A
650 vm_offset_t load_start,
651 boolean_t IA32e);
1c79356b
A
652
653extern boolean_t pmap_valid_page(
91447636 654 ppnum_t pn);
1c79356b
A
655
656extern int pmap_list_resident_pages(
657 struct pmap *pmap,
658 vm_offset_t *listp,
659 int space);
660
b0d623f7 661#ifdef __i386__
0c530ab8 662extern void pmap_commpage32_init(
91447636
A
663 vm_offset_t kernel,
664 vm_offset_t user,
665 int count);
0c530ab8
A
666extern void pmap_commpage64_init(
667 vm_offset_t kernel,
668 vm_map_offset_t user,
669 int count);
670
b0d623f7
A
671#endif
672
673#if NCOPY_WINDOWS > 0
91447636
A
674extern struct cpu_pmap *pmap_cpu_alloc(
675 boolean_t is_boot_cpu);
676extern void pmap_cpu_free(
677 struct cpu_pmap *cp);
b0d623f7 678#endif
0c530ab8
A
679
680extern void pmap_map_block(
681 pmap_t pmap,
682 addr64_t va,
683 ppnum_t pa,
684 uint32_t size,
685 vm_prot_t prot,
686 int attr,
687 unsigned int flags);
91447636 688
1c79356b
A
689extern void invalidate_icache(vm_offset_t addr, unsigned cnt, int phys);
690extern void flush_dcache(vm_offset_t addr, unsigned count, int phys);
55e303ae 691extern ppnum_t pmap_find_phys(pmap_t map, addr64_t va);
1c79356b 692
2d21ac55 693extern void pmap_cpu_init(void);
0c530ab8 694extern void pmap_disable_NX(pmap_t pmap);
b0d623f7 695#ifdef __i386__
0c530ab8
A
696extern void pmap_set_4GB_pagezero(pmap_t pmap);
697extern void pmap_clear_4GB_pagezero(pmap_t pmap);
698extern void pmap_load_kernel_cr3(void);
699extern vm_offset_t pmap_cpu_high_map_vaddr(int, enum high_cpu_types);
700extern vm_offset_t pmap_high_map_vaddr(enum high_cpu_types);
701extern vm_offset_t pmap_high_map(pt_entry_t, enum high_cpu_types);
702extern vm_offset_t pmap_cpu_high_shared_remap(int, enum high_cpu_types, vm_offset_t, int);
703extern vm_offset_t pmap_high_shared_remap(enum high_fixed_addresses, vm_offset_t, int);
b0d623f7 704#endif
0c530ab8
A
705
706extern void pt_fake_zone_info(int *, vm_size_t *, vm_size_t *, vm_size_t *, vm_size_t *, int *, int *);
707
708
709
1c79356b
A
710/*
711 * Macros for speed.
712 */
713
1c79356b
A
714
715#include <kern/spl.h>
716
b0d623f7
A
717
718#define PMAP_ACTIVATE_MAP(map, thread) { \
55e303ae 719 register pmap_t tpmap; \
0c530ab8
A
720 \
721 tpmap = vm_map_pmap(map); \
b0d623f7 722 set_dirbase(tpmap, thread); \
1c79356b
A
723}
724
b0d623f7
A
725#ifdef __i386__
726#define PMAP_DEACTIVATE_MAP(map, thread) \
2d21ac55
A
727 if (vm_map_pmap(map)->pm_task_map == TASK_MAP_64BIT_SHARED) \
728 pmap_load_kernel_cr3();
b0d623f7
A
729#else
730#define PMAP_DEACTIVATE_MAP(map, my_cpu)
731#endif
1c79356b 732
b0d623f7 733#if defined(__i386__)
0c530ab8 734
1c79356b
A
735#define PMAP_SWITCH_CONTEXT(old_th, new_th, my_cpu) { \
736 spl_t spl; \
0c530ab8
A
737 pt_entry_t *kpdp; \
738 pt_entry_t *updp; \
739 int i; \
740 int need_flush; \
741 \
742 need_flush = 0; \
743 spl = splhigh(); \
b0d623f7
A
744 if ((old_th->map != new_th->map) || (new_th->task != old_th->task)) { \
745 PMAP_DEACTIVATE_MAP(old_th->map, old_th); \
746 PMAP_ACTIVATE_MAP(new_th->map, new_th); \
1c79356b 747 } \
0c530ab8
A
748 kpdp = current_cpu_datap()->cpu_copywindow_pdp; \
749 for (i = 0; i < NCOPY_WINDOWS; i++) { \
750 if (new_th->machine.copy_window[i].user_base != (user_addr_t)-1) { \
751 updp = pmap_pde(new_th->map->pmap, \
752 new_th->machine.copy_window[i].user_base);\
2d21ac55 753 pmap_store_pte(kpdp, updp ? *updp : 0); \
0c530ab8
A
754 } \
755 kpdp++; \
756 } \
757 splx(spl); \
758 if (new_th->machine.copyio_state == WINDOWS_OPENED) \
759 need_flush = 1; \
760 else \
761 new_th->machine.copyio_state = WINDOWS_DIRTY; \
762 if (new_th->machine.physwindow_pte) { \
2d21ac55
A
763 pmap_store_pte((current_cpu_datap()->cpu_physwindow_ptep), \
764 new_th->machine.physwindow_pte); \
0c530ab8
A
765 if (need_flush == 0) \
766 invlpg((uintptr_t)current_cpu_datap()->cpu_physwindow_base);\
767 } \
768 if (need_flush) \
769 flush_tlb(); \
1c79356b
A
770}
771
b0d623f7
A
772#else /* __x86_64__ */
773#define PMAP_SWITCH_CONTEXT(old_th, new_th, my_cpu) { \
774 spl_t spl; \
775 \
776 spl = splhigh(); \
777 if (old_th->map != new_th->map) { \
778 PMAP_DEACTIVATE_MAP(old_th->map, old_th); \
779 PMAP_ACTIVATE_MAP(new_th->map, new_th); \
780 } \
781 splx(spl); \
782}
783#endif /* __i386__ */
784
785#ifdef __i386__
1c79356b
A
786#define PMAP_SWITCH_USER(th, new_map, my_cpu) { \
787 spl_t spl; \
788 \
0c530ab8 789 spl = splhigh(); \
b0d623f7 790 PMAP_DEACTIVATE_MAP(th->map, th); \
1c79356b 791 th->map = new_map; \
b0d623f7 792 PMAP_ACTIVATE_MAP(th->map, th); \
1c79356b 793 splx(spl); \
0c530ab8 794 inval_copy_windows(th); \
1c79356b 795}
b0d623f7
A
796#else
797#define PMAP_SWITCH_USER(th, new_map, my_cpu) { \
798 spl_t spl; \
799 \
800 spl = splhigh(); \
801 PMAP_DEACTIVATE_MAP(th->map, th); \
802 th->map = new_map; \
803 PMAP_ACTIVATE_MAP(th->map, th); \
804 splx(spl); \
805}
806#endif
1c79356b 807
0c530ab8
A
808/*
809 * Marking the current cpu's cr3 inactive is achieved by setting its lsb.
810 * Marking the current cpu's cr3 active once more involves clearng this bit.
811 * Note that valid page tables are page-aligned and so the bottom 12 bits
812 * are noramlly zero.
813 * We can only mark the current cpu active/inactive but we can test any cpu.
814 */
815#define CPU_CR3_MARK_INACTIVE() \
816 current_cpu_datap()->cpu_active_cr3 |= 1
817
818#define CPU_CR3_MARK_ACTIVE() \
819 current_cpu_datap()->cpu_active_cr3 &= ~1
820
821#define CPU_CR3_IS_ACTIVE(cpu) \
822 ((cpu_datap(cpu)->cpu_active_cr3 & 1) == 0)
823
2d21ac55
A
824#define CPU_GET_ACTIVE_CR3(cpu) \
825 (cpu_datap(cpu)->cpu_active_cr3 & ~1)
0c530ab8 826
b0d623f7
A
827#define CPU_GET_TASK_CR3(cpu) \
828 (cpu_datap(cpu)->cpu_task_cr3)
829
830/*
831 * Mark this cpu idle, and remove it from the active set,
832 * since it is not actively using any pmap. Signal_cpus
833 * will notice that it is idle, and avoid signaling it,
834 * but will queue the update request for when the cpu
835 * becomes active.
836 */
837#if defined(__x86_64__)
838#define MARK_CPU_IDLE(my_cpu) { \
839 int s = splhigh(); \
840 CPU_CR3_MARK_INACTIVE(); \
841 __asm__ volatile("mfence"); \
842 splx(s); \
843}
844#else /* __i386__ native */
1c79356b
A
845#define MARK_CPU_IDLE(my_cpu) { \
846 /* \
847 * Mark this cpu idle, and remove it from the active set, \
848 * since it is not actively using any pmap. Signal_cpus \
849 * will notice that it is idle, and avoid signaling it, \
850 * but will queue the update request for when the cpu \
851 * becomes active. \
852 */ \
853 int s = splhigh(); \
0c530ab8
A
854 if (!cpu_mode_is64bit() || no_shared_cr3) \
855 process_pmap_updates(); \
856 else \
857 pmap_load_kernel_cr3(); \
858 CPU_CR3_MARK_INACTIVE(); \
859 __asm__ volatile("mfence"); \
1c79356b 860 splx(s); \
1c79356b 861}
b0d623f7 862#endif /* __i386__ */
1c79356b 863
0c530ab8 864#define MARK_CPU_ACTIVE(my_cpu) { \
1c79356b
A
865 \
866 int s = splhigh(); \
867 /* \
868 * If a kernel_pmap update was requested while this cpu \
869 * was idle, process it as if we got the interrupt. \
870 * Before doing so, remove this cpu from the idle set. \
871 * Since we do not grab any pmap locks while we flush \
872 * our TLB, another cpu may start an update operation \
873 * before we finish. Removing this cpu from the idle \
874 * set assures that we will receive another update \
875 * interrupt if this happens. \
876 */ \
0c530ab8
A
877 CPU_CR3_MARK_ACTIVE(); \
878 __asm__ volatile("mfence"); \
55e303ae 879 \
0c530ab8
A
880 if (current_cpu_datap()->cpu_tlb_invalid) \
881 process_pmap_updates(); \
1c79356b 882 splx(s); \
1c79356b
A
883}
884
1c79356b
A
885#define PMAP_CONTEXT(pmap, thread)
886
887#define pmap_kernel_va(VA) \
0c530ab8
A
888 ((((vm_offset_t) (VA)) >= vm_min_kernel_address) && \
889 (((vm_offset_t) (VA)) <= vm_max_kernel_address))
890
1c79356b
A
891
892#define pmap_resident_count(pmap) ((pmap)->stats.resident_count)
2d21ac55 893#define pmap_resident_max(pmap) ((pmap)->stats.resident_max)
1c79356b
A
894#define pmap_copy(dst_pmap,src_pmap,dst_addr,len,src_addr)
895#define pmap_attribute(pmap,addr,size,attr,value) \
896 (KERN_INVALID_ADDRESS)
9bccf70c
A
897#define pmap_attribute_cache_sync(addr,size,attr,value) \
898 (KERN_INVALID_ADDRESS)
765c9de3 899
2d21ac55
A
900#define MACHINE_PMAP_IS_EMPTY 1
901extern boolean_t pmap_is_empty(pmap_t pmap,
902 vm_map_offset_t start,
903 vm_map_offset_t end);
904
b0d623f7 905
1c79356b
A
906#endif /* ASSEMBLER */
907
0c530ab8 908
1c79356b 909#endif /* _PMAP_MACHINE_ */
0c530ab8
A
910
911
912#endif /* KERNEL_PRIVATE */