osfmk/ppc/pmap.c

   1 /*
   2  * Copyright (c) 2000 Apple Computer, Inc. All rights reserved.
   3  *
   4  * @APPLE_LICENSE_HEADER_START@
   5  *
   6  * Copyright (c) 1999-2003 Apple Computer, Inc.  All Rights Reserved.
   7  *
   8  * This file contains Original Code and/or Modifications of Original Code
   9  * as defined in and that are subject to the Apple Public Source License
  10  * Version 2.0 (the 'License'). You may not use this file except in
  11  * compliance with the License. Please obtain a copy of the License at
  12  * http://www.opensource.apple.com/apsl/ and read it before using this
  13  * file.
  14  *
  15  * The Original Code and all software distributed under the License are
  16  * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
  17  * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
  18  * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
  19  * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
  20  * Please see the License for the specific language governing rights and
  21  * limitations under the License.
  22  *
  23  * @APPLE_LICENSE_HEADER_END@
  24  */
  25 /*
  26  * @OSF_COPYRIGHT@
  27  */
  28 /*
  29  * Mach Operating System
  30  * Copyright (c) 1990,1991,1992 The University of Utah and
  31  * the Center for Software Science (CSS).
  32  * Copyright (c) 1991,1987 Carnegie Mellon University.
  33  * All rights reserved.
  34  *
  35  * Permission to use, copy, modify and distribute this software and its
  36  * documentation is hereby granted, provided that both the copyright
  37  * notice and this permission notice appear in all copies of the
  38  * software, derivative works or modified versions, and any portions
  39  * thereof, and that both notices appear in supporting documentation,
  40  * and that all advertising materials mentioning features or use of
  41  * this software display the following acknowledgement: ``This product
  42  * includes software developed by the Center for Software Science at
  43  * the University of Utah.''
  44  *
  45  * CARNEGIE MELLON, THE UNIVERSITY OF UTAH AND CSS ALLOW FREE USE OF
  46  * THIS SOFTWARE IN ITS "AS IS" CONDITION, AND DISCLAIM ANY LIABILITY
  47  * OF ANY KIND FOR ANY DAMAGES WHATSOEVER RESULTING FROM THE USE OF
  48  * THIS SOFTWARE.
  49  *
  50  * CSS requests users of this software to return to css-dist@cs.utah.edu any
  51  * improvements that they make and grant CSS redistribution rights.
  52  *
  53  * Carnegie Mellon requests users of this software to return to
  54  *  Software Distribution Coordinator  or  Software.Distribution@CS.CMU.EDU
  55  *  School of Computer Science
  56  *  Carnegie Mellon University
  57  *  Pittsburgh PA 15213-3890
  58  * any improvements or extensions that they make and grant Carnegie Mellon
  59  * the rights to redistribute these changes.
  60  *
  61  *      Utah $Hdr: pmap.c 1.28 92/06/23$
  62  *      Author: Mike Hibler, Bob Wheeler, University of Utah CSS, 10/90
  63  */
  64
  65 /*
  66  *      Manages physical address maps for powerpc.
  67  *
  68  *      In addition to hardware address maps, this
  69  *      module is called upon to provide software-use-only
  70  *      maps which may or may not be stored in the same
  71  *      form as hardware maps.  These pseudo-maps are
  72  *      used to store intermediate results from copy
  73  *      operations to and from address spaces.
  74  *
  75  *      Since the information managed by this module is
  76  *      also stored by the logical address mapping module,
  77  *      this module may throw away valid virtual-to-physical
  78  *      mappings at almost any time.  However, invalidations
  79  *      of virtual-to-physical mappings must be done as
  80  *      requested.
  81  *
  82  *      In order to cope with hardware architectures which
  83  *      make virtual-to-physical map invalidates expensive,
  84  *      this module may delay invalidate or reduced protection
  85  *      operations until such time as they are actually
   86  *      necessary.  This module is given full information as to
   87  *      when physical maps must be made correct.
  88  *
  89  */
  90
  91 #include <zone_debug.h>
  92 #include <cpus.h>
  93 #include <debug.h>
  94 #include <mach_kgdb.h>
  95 #include <mach_vm_debug.h>
  96 #include <db_machine_commands.h>
  97
  98 #include <kern/thread.h>
  99 #include <kern/simple_lock.h>
 100 #include <mach/vm_attributes.h>
 101 #include <mach/vm_param.h>
 102 #include <vm/vm_kern.h>
 103 #include <kern/spl.h>
 104
 105 #include <kern/misc_protos.h>
 106 #include <ppc/misc_protos.h>
 107 #include <ppc/proc_reg.h>
 108
 109 #include <vm/pmap.h>
 110 #include <vm/vm_map.h>
 111 #include <vm/vm_page.h>
 112
 113 #include <ppc/pmap.h>
 114 #include <ppc/mem.h>
 115 #include <ppc/mappings.h>
 116
 117 #include <ppc/new_screen.h>
 118 #include <ppc/Firmware.h>
 119 #include <ppc/savearea.h>
 120 #include <ppc/exception.h>
 121 #include <ppc/low_trace.h>
 122 #include <ddb/db_output.h>
 123
  124 extern unsigned int     avail_remaining;                                        /* Free physical pages left for pmap_next_page to hand out */
  125 extern unsigned int     mappingdeb0;
  126 extern  struct  Saveanchor saveanchor;                                          /* Aligned savearea anchor */
  127 extern int              real_ncpus;                                                                     /* Number of actual CPUs */
  128 unsigned int    debugbackpocket;                                                        /* (TEST/DEBUG) */
  129
  130 vm_offset_t             first_free_virt;                                        /* First free virtual address; set at the end of pmap_bootstrap */
  131 int             current_free_region;                                            /* Index of the memory region pmap_next_page is allocating from */
  132
  133 pmapTransTab *pmapTrans;                                                                        /* Points to the table, indexed by address space ID, giving each pmap's physical and virtual address */
  134 struct phys_entry *phys_table;
  135
  136 /* Forward declarations */
  137 void pmap_activate(pmap_t pmap, thread_t th, int which_cpu);
  138 void pmap_deactivate(pmap_t pmap, thread_t th, int which_cpu);
  139 void copy_to_phys(vm_offset_t sva, vm_offset_t dpa, int bytecount);
  140
  141 #if MACH_VM_DEBUG
  142 int pmap_list_resident_pages(pmap_t pmap, vm_offset_t *listp, int space);
  143 #endif
  144
  145 /*  NOTE:  kernel_pmap_store must be in V=R storage and aligned!!!!!!!!!!!!!! */
  146
  147 extern struct pmap      kernel_pmap_store;
  148 pmap_t          kernel_pmap;                    /* Pointer to kernel pmap and anchor for in-use pmaps */
  149 addr64_t        kernel_pmap_phys;               /* Physical address of the kernel pmap (the anchor for in-use pmaps) */
  150 pmap_t          cursor_pmap;                    /* Pointer to last pmap allocated or previous if removed from in-use list */
  151 pmap_t          sharedPmap;                             /* Pointer to common pmap for 64-bit address spaces */
  152 struct zone     *pmap_zone;                             /* Zone of pmap structures */
  153 boolean_t       pmap_initialized = FALSE;               /* Set to TRUE by pmap_init */
  154
  155 int ppc_max_pmaps;                                      /* Maximum number of concurrent address spaces allowed. This is machine dependent */
  156 addr64_t vm_max_address;                        /* Maximum effective address supported */
  157 addr64_t vm_max_physical;                       /* Maximum physical address supported */
  158
  159 /*
  160  * Physical-to-virtual translations are handled by inverted page table
  161  * structures, phys_tables.  Multiple mappings of a single page are handled
  162  * by linking the affected mapping structures. We initialise one region
  163  * for phys_tables of the physical memory we know about, but more may be
  164  * added as it is discovered (e.g. by drivers).
  165  */
  166
  167 /*
  168  *      Free pmap list: caches the first free_pmap_max pmaps that are freed up.
  169  */
  170 int             free_pmap_max = 32;             /* Maximum number of pmaps kept on the free list */
  171 int             free_pmap_count;                /* Number of pmaps currently on the free list */
  172 pmap_t  free_pmap_list;                         /* Head of the free list; entries are chained through freepmap */
  173 decl_simple_lock_data(,free_pmap_lock)
 174
 175 /*
 176  * Function to get index into phys_table for a given physical address
 177  */
 178
 179 struct phys_entry *pmap_find_physentry(ppnum_t pa)
 180 {
 181         int i;
 182         unsigned int entry;
 183
 184         for (i = pmap_mem_regions_count - 1; i >= 0; i--) {
 185                 if (pa < pmap_mem_regions[i].mrStart) continue; /* See if we fit in this region */
 186                 if (pa > pmap_mem_regions[i].mrEnd) continue;   /* Check the end too */
 187
 188                 entry = (unsigned int)pmap_mem_regions[i].mrPhysTab + ((pa - pmap_mem_regions[i].mrStart) * sizeof(phys_entry));
 189                 return (struct phys_entry *)entry;
 190         }
 191 //      kprintf("DEBUG - pmap_find_physentry: page 0x%08X not found\n", pa);
 192         return 0;
 193 }
 194
 195 /*
 196  * kern_return_t
 197  * pmap_add_physical_memory(vm_offset_t spa, vm_offset_t epa,
 198  *                          boolean_t available, unsigned int attr)
 199  *
 200  *      THIS IS NOT SUPPORTED
 201  */
 202 kern_return_t pmap_add_physical_memory(vm_offset_t spa, vm_offset_t epa,
 203                                        boolean_t available, unsigned int attr)
 204 {
 205
 206         panic("Forget it! You can't map no more memory, you greedy puke!\n");
 207         return KERN_SUCCESS;
 208 }
 209
 210 /*
 211  * pmap_map(va, spa, epa, prot)
 212  *      is called during boot to map memory in the kernel's address map.
 213  *      A virtual address range starting at "va" is mapped to the physical
 214  *      address range "spa" to "epa" with machine independent protection
 215  *      "prot".
 216  *
 217  *      "va", "spa", and "epa" are byte addresses and must be on machine
 218  *      independent page boundaries.
 219  *
 220  *      Pages with a contiguous virtual address range, the same protection, and attributes.
 221  *      therefore, we map it with a single block.
 222  *
 223  *      Note that this call will only map into 32-bit space
 224  *
 225  */
 226
 227 vm_offset_t
 228 pmap_map(
 229         vm_offset_t va,
 230         vm_offset_t spa,
 231         vm_offset_t epa,
 232         vm_prot_t prot)
 233 {
 234
 235         addr64_t colladr;
 236
 237         if (spa == epa) return(va);
 238
 239         assert(epa > spa);
 240
 241         colladr = mapping_make(kernel_pmap, (addr64_t)va, (ppnum_t)(spa >> 12), (mmFlgBlock | mmFlgPerm), (epa - spa) >> 12, prot & VM_PROT_ALL);
 242
 243         if(colladr) {                                                                                   /* Was something already mapped in the range? */
 244                 panic("pmap_map: attempt to map previously mapped range - va = %08X, pa = %08X, epa = %08X, collision = %016llX\n",
 245                         va, spa, epa, colladr);
 246         }
 247         return(va);
 248 }
 249
 250 /*
 251  *      Bootstrap the system enough to run with virtual memory.
 252  *      Map the kernel's code and data, and allocate the system page table.
 253  *      Called with mapping done by BATs. Page_size must already be set.
 254  *
 255  *      Parameters:
 256  *      msize:  Total memory present
 257  *      first_avail:    First virtual address available
 258  *      kmapsize:       Size of kernel text and data
 259  */
 260 void
 261 pmap_bootstrap(uint64_t msize, vm_offset_t *first_avail, unsigned int kmapsize)
 262 {
 263         register struct mapping *mp;
 264         vm_offset_t     addr;
 265         vm_size_t               size;
 266         int                     i, num, j, rsize, mapsize, vmpagesz, vmmapsz, bank, nbits;
 267         uint64_t                tmemsize;
 268         uint_t                  htslop;
 269         vm_offset_t             first_used_addr, PCAsize;
 270         struct phys_entry *phys_table;
 271
 272         *first_avail = round_page_32(*first_avail);                             /* Make sure we start out on a page boundary */
 273         vm_last_addr = VM_MAX_KERNEL_ADDRESS;                                   /* Set the highest address know to VM */
 274
 275         /*
 276          * Initialize kernel pmap
 277          */
 278         kernel_pmap = &kernel_pmap_store;
 279         kernel_pmap_phys = (addr64_t)&kernel_pmap_store;
 280         cursor_pmap = &kernel_pmap_store;
 281
 282         simple_lock_init(&kernel_pmap->lock, ETAP_VM_PMAP_KERNEL);
 283
 284         kernel_pmap->pmap_link.next = (queue_t)kernel_pmap;             /* Set up anchor forward */
 285         kernel_pmap->pmap_link.prev = (queue_t)kernel_pmap;             /* Set up anchor reverse */
 286         kernel_pmap->ref_count = 1;
 287         kernel_pmap->pmapFlags = pmapKeyDef;                                    /* Set the default keys */
 288         kernel_pmap->pmapCCtl = pmapCCtlVal;                                    /* Initialize cache control */
 289         kernel_pmap->space = PPC_SID_KERNEL;
 290         kernel_pmap->pmapvr = 0;                                                                /* Virtual = Real  */
 291
 292 /*
 293  *      The hash table wants to have one pteg for every 2 physical pages.
 294  *      We will allocate this in physical RAM, outside of kernel virtual memory,
 295  *      at the top of the highest bank that will contain it.
 296  *      Note that "bank" doesn't refer to a physical memory slot here, it is a range of
 297  *      physically contiguous memory.
 298  *
 299  *      The PCA will go there as well, immediately before the hash table.
 300  */
 301
 302         nbits = cntlzw(((msize << 1) - 1) >> 32);                               /* Get first bit in upper half */
 303         if(nbits == 32) nbits = nbits + cntlzw((uint_t)((msize << 1) - 1));     /* If upper half was empty, find bit in bottom half */
 304         tmemsize = 0x8000000000000000ULL >> nbits;                                      /* Get memory size rounded up to power of 2 */
 305
 306         if(tmemsize > 0x0000002000000000ULL) tmemsize = 0x0000002000000000ULL;  /* Make sure we don't make an unsupported hash table size */
 307
 308         hash_table_size = (uint_t)(tmemsize >> 13) * per_proc_info[0].pf.pfPTEG;        /* Get provisional hash_table_size */
 309         if(hash_table_size < (256 * 1024)) hash_table_size = (256 * 1024);      /* Make sure we are at least minimum size */
 310
 311         while(1) {                                                                                              /* Try to fit hash table in PCA into contiguous memory */
 312
 313                 if(hash_table_size < (256 * 1024)) {                            /* Have we dropped too short? This should never, ever happen */
 314                         panic("pmap_bootstrap: Can't find space for hash table\n");     /* This will never print, system isn't up far enough... */
 315                 }
 316
 317                 PCAsize = (hash_table_size / per_proc_info[0].pf.pfPTEG) * sizeof(PCA); /* Get total size of PCA table */
 318                 PCAsize = round_page_32(PCAsize);                                       /* Make sure it is at least a page long */
 319
 320                 for(bank = pmap_mem_regions_count - 1; bank >= 0; bank--) {     /* Search backwards through banks */
 321
 322                         hash_table_base = ((addr64_t)pmap_mem_regions[bank].mrEnd << 12) - hash_table_size + PAGE_SIZE; /* Get tenative address */
 323
 324                         htslop = hash_table_base & (hash_table_size - 1);       /* Get the extra that we will round down when we align */
 325                         hash_table_base = hash_table_base & -(addr64_t)hash_table_size; /* Round down to correct boundary */
 326
 327                         if((hash_table_base - round_page_32(PCAsize)) >= ((addr64_t)pmap_mem_regions[bank].mrStart << 12)) break;       /* Leave if we fit */
 328                 }
 329
 330                 if(bank >= 0) break;                                                            /* We are done if we found a suitable bank */
 331
 332                 hash_table_size = hash_table_size >> 1;                         /* Try the next size down */
 333         }
 334
 335         if(htslop) {                                                                                    /* If there was slop (i.e., wasted pages for alignment) add a new region */
 336                 for(i = pmap_mem_regions_count - 1; i >= bank; i--) {   /* Copy from end to our bank, including our bank */
 337                         pmap_mem_regions[i + 1].mrStart  = pmap_mem_regions[i].mrStart; /* Set the start of the bank */
 338                         pmap_mem_regions[i + 1].mrAStart = pmap_mem_regions[i].mrAStart;        /* Set the start of allocatable area */
 339                         pmap_mem_regions[i + 1].mrEnd    = pmap_mem_regions[i].mrEnd;   /* Set the end address of bank */
 340                         pmap_mem_regions[i + 1].mrAEnd   = pmap_mem_regions[i].mrAEnd;  /* Set the end address of allocatable area */
 341                 }
 342
 343                 pmap_mem_regions[i + 1].mrStart  = (hash_table_base + hash_table_size) >> 12;   /* Set the start of the next bank to the start of the slop area */
 344                 pmap_mem_regions[i + 1].mrAStart = (hash_table_base + hash_table_size) >> 12;   /* Set the start of allocatable area to the start of the slop area */
 345                 pmap_mem_regions[i].mrEnd        = (hash_table_base + hash_table_size - 4096) >> 12;    /* Set the end of our bank to the end of the hash table */
 346
 347         }
 348
 349         pmap_mem_regions[bank].mrAEnd = (hash_table_base - PCAsize - 4096) >> 12;       /* Set the maximum allocatable in this bank */
 350
 351         hw_hash_init();                                                                                 /* Initiaize the hash table and PCA */
 352         hw_setup_trans();                                                                               /* Set up hardware registers needed for translation */
 353
 354 /*
 355  *      The hash table is now all initialized and so is the PCA.  Go on to do the rest of it.
 356  *      This allocation is from the bottom up.
 357  */
 358
 359         num = atop_64(msize);                                                                           /* Get number of pages in all of memory */
 360
 361 /* Figure out how much we need to allocate */
 362
 363         size = (vm_size_t) (
 364                 (InitialSaveBloks * PAGE_SIZE) +                                        /* Allow space for the initial context saveareas */
 365                 (BackPocketSaveBloks * PAGE_SIZE) +                                     /* For backpocket saveareas */
 366                 trcWork.traceSize +                                                             /* Size of trace table */
 367                 ((((1 << maxAdrSpb) * sizeof(pmapTransTab)) + 4095) & -4096) +  /* Size of pmap translate table */
 368                 (((num * sizeof(struct phys_entry)) + 4095) & -4096)    /* For the physical entries */
 369         );
 370
 371         mapsize = size = round_page_32(size);                                           /* Get size of area to map that we just calculated */
 372         mapsize = mapsize + kmapsize;                                                   /* Account for the kernel text size */
 373
 374         vmpagesz = round_page_32(num * sizeof(struct vm_page)); /* Allow for all vm_pages needed to map physical mem */
 375         vmmapsz = round_page_32((num / 8) * sizeof(struct vm_map_entry));       /* Allow for vm_maps */
 376
 377         mapsize = mapsize + vmpagesz + vmmapsz;                                 /* Add the VM system estimates into the grand total */
 378
 379         mapsize = mapsize + (4 * 1024 * 1024);                                  /* Allow for 4 meg of extra mappings */
 380         mapsize = ((mapsize / PAGE_SIZE) + MAPPERBLOK - 1) / MAPPERBLOK;        /* Get number of blocks of mappings we need */
 381         mapsize = mapsize + ((mapsize  + MAPPERBLOK - 1) / MAPPERBLOK); /* Account for the mappings themselves */
 382
 383         size = size + (mapsize * PAGE_SIZE);                                    /* Get the true size we need */
 384
 385         /* hash table must be aligned to its size */
 386
 387         addr = *first_avail;                                                                    /* Set the address to start allocations */
 388         first_used_addr = addr;                                                                 /* Remember where we started */
 389
 390         bzero((char *)addr, size);                                                              /* Clear everything that we are allocating */
 391
 392         savearea_init(addr);                                                                    /* Initialize the savearea chains and data */
 393
 394         addr = (vm_offset_t)((unsigned int)addr + ((InitialSaveBloks + BackPocketSaveBloks) * PAGE_SIZE));      /* Point past saveareas */
 395
 396         trcWork.traceCurr = (unsigned int)addr;                                 /* Set first trace slot to use */
 397         trcWork.traceStart = (unsigned int)addr;                                /* Set start of trace table */
 398         trcWork.traceEnd = (unsigned int)addr + trcWork.traceSize;              /* Set end of trace table */
 399
 400         addr = (vm_offset_t)trcWork.traceEnd;                                   /* Set next allocatable location */
 401
 402         pmapTrans = (pmapTransTab *)addr;                                               /* Point to the pmap to hash translation table */
 403
 404         pmapTrans[PPC_SID_KERNEL].pmapPAddr = (addr64_t)((uintptr_t)kernel_pmap);       /* Initialize the kernel pmap in the translate table */
 405         pmapTrans[PPC_SID_KERNEL].pmapVAddr = CAST_DOWN(unsigned int, kernel_pmap);  /* Initialize the kernel pmap in the translate table */
 406
 407         addr += ((((1 << maxAdrSpb) * sizeof(pmapTransTab)) + 4095) & -4096);   /* Point past pmap translate table */
 408
 409 /*      NOTE: the phys_table must be within the first 2GB of physical RAM. This makes sure we only need to do 32-bit arithmetic */
 410
 411         phys_table = (struct phys_entry *) addr;                                /* Get pointer to physical table */
 412
 413         for (bank = 0; bank < pmap_mem_regions_count; bank++) { /* Set pointer and initialize all banks of ram */
 414
 415                 pmap_mem_regions[bank].mrPhysTab = phys_table;          /* Set pointer to the physical table for this bank */
 416
 417                 phys_table = phys_table + (pmap_mem_regions[bank].mrEnd - pmap_mem_regions[bank].mrStart + 1);  /* Point to the next */
 418         }
 419
 420         addr += (((num * sizeof(struct phys_entry)) + 4095) & -4096);   /* Step on past the physical entries */
 421
 422 /*
 423  *              Remaining space is for mapping entries.  Tell the initializer routine that
 424  *              the mapping system can't release this block because it's permanently assigned
 425  */
 426
 427         mapping_init();                                                                                 /* Initialize the mapping tables */
 428
 429         for(i = addr; i < first_used_addr + size; i += PAGE_SIZE) {     /* Add initial mapping blocks */
 430                 mapping_free_init(i, 1, 0);                                                     /* Pass block address and say that this one is not releasable */
 431         }
 432         mapCtl.mapcmin = MAPPERBLOK;                                                    /* Make sure we only adjust one at a time */
 433
 434         /* Map V=R the page tables */
 435         pmap_map(first_used_addr, first_used_addr,
 436                  round_page_32(first_used_addr + size), VM_PROT_READ | VM_PROT_WRITE);
 437
 438         *first_avail = round_page_32(first_used_addr + size);           /* Set next available page */
 439         first_free_virt = *first_avail;                                                 /* Ditto */
 440
 441         /* All the rest of memory is free - add it to the free
 442          * regions so that it can be allocated by pmap_steal
 443          */
 444
 445         pmap_mem_regions[0].mrAStart = (*first_avail >> 12);    /* Set up the free area to start allocations (always in the first bank) */
 446
 447         current_free_region = 0;                                                                /* Set that we will start allocating in bank 0 */
 448         avail_remaining = 0;                                                                    /* Clear free page count */
 449         for(bank = 0; bank < pmap_mem_regions_count; bank++) {  /* Total up all of the pages in the system that are available */
 450                 avail_remaining += (pmap_mem_regions[bank].mrAEnd - pmap_mem_regions[bank].mrAStart) + 1;       /* Add in allocatable pages in this bank */
 451         }
 452
 453
 454 }
 455
 456 /*
 457  * pmap_init(spa, epa)
 458  *      finishes the initialization of the pmap module.
 459  *      This procedure is called from vm_mem_init() in vm/vm_init.c
 460  *      to initialize any remaining data structures that the pmap module
 461  *      needs to map virtual memory (VM is already ON).
 462  *
 463  *      Note that the pmap needs to be sized and aligned to
 464  *      a power of two.  This is because it is used both in virtual and
 465  *      real so it can't span a page boundary.
 466  */
 467
 468 void
 469 pmap_init(void)
 470 {
 471
 472         addr64_t cva;
 473
 474         pmap_zone = zinit(pmapSize, 400 * pmapSize, 4096, "pmap");
 475 #if     ZONE_DEBUG
 476         zone_debug_disable(pmap_zone);          /* Can't debug this one 'cause it messes with size and alignment */
 477 #endif  /* ZONE_DEBUG */
 478
 479         pmap_initialized = TRUE;
 480
 481         /*
 482          *      Initialize list of freed up pmaps
 483          */
 484         free_pmap_list = 0;                                     /* Set that there are no free pmaps */
 485         free_pmap_count = 0;
 486         simple_lock_init(&free_pmap_lock, ETAP_VM_PMAP_CACHE);
 487
 488 }
 489
 490 unsigned int pmap_free_pages(void)
 491 {
 492         return avail_remaining;
 493 }
 494
 495 /*
 496  *      This function allocates physical pages.
 497  */
 498
 499 /* Non-optimal, but only used for virtual memory startup.
 500  * Allocate memory from a table of free physical addresses
 501  * If there are no more free entries, too bad.
 502  */
 503
 504 boolean_t pmap_next_page(ppnum_t *addrp)
 505 {
 506                 int i;
 507
 508         if(current_free_region >= pmap_mem_regions_count) return FALSE; /* Return failure if we have used everything... */
 509
 510         for(i = current_free_region; i < pmap_mem_regions_count; i++) { /* Find the next bank with free pages */
 511                 if(pmap_mem_regions[i].mrAStart <= pmap_mem_regions[i].mrAEnd) break;   /* Found one */
 512         }
 513
 514         current_free_region = i;                                                                                /* Set our current bank */
 515         if(i >= pmap_mem_regions_count) return FALSE;                                   /* Couldn't find a free page */
 516
 517         *addrp = pmap_mem_regions[i].mrAStart;                                  /* Allocate the page */
 518         pmap_mem_regions[i].mrAStart = pmap_mem_regions[i].mrAStart + 1;        /* Set the next one to go */
 519         avail_remaining--;                                                                                              /* Drop free count */
 520
 521         return TRUE;
 522 }
 523
 524 void pmap_virtual_space(
 525         vm_offset_t *startp,
 526         vm_offset_t *endp)
 527 {
 528         *startp = round_page_32(first_free_virt);
 529         *endp   = vm_last_addr;
 530 }
 531
 532 /*
 533  * pmap_create
 534  *
 535  * Create and return a physical map.
 536  *
 537  * If the size specified for the map is zero, the map is an actual physical
 538  * map, and may be referenced by the hardware.
 539  *
 540  * A pmap is either in the free list or in the in-use list.  The only use
 541  * of the in-use list (aside from debugging) is to handle the VSID wrap situation.
 542  * Whenever a new pmap is allocated (i.e., not recovered from the free list). The
 543  * in-use list is matched until a hole in the VSID sequence is found. (Note
 544  * that the in-use pmaps are queued in VSID sequence order.) This is all done
 545  * while free_pmap_lock is held.
 546  *
 547  * If the size specified is non-zero, the map will be used in software
 548  * only, and is bounded by that size.
 549  */
 550 pmap_t
 551 pmap_create(vm_size_t size)
 552 {
 553         pmap_t pmap, ckpmap, fore, aft;
 554         int s, i;
 555         unsigned int currSID, hspace;
 556         addr64_t physpmap;
 557
 558         /*
 559          * A software use-only map doesn't even need a pmap structure.
 560          */
 561         if (size)
 562                 return(PMAP_NULL);
 563
 564         /*
 565          * If there is a pmap in the pmap free list, reuse it.
 566          * Note that we use free_pmap_list for all chaining of pmaps, both to
 567          * the free list and the in use chain (anchored from kernel_pmap).
 568          */
 569         s = splhigh();
 570         simple_lock(&free_pmap_lock);
 571
 572         if(free_pmap_list) {                                                    /* Any free? */
 573                 pmap = free_pmap_list;                                          /* Yes, allocate it */
 574                 free_pmap_list = (pmap_t)pmap->freepmap;        /* Dequeue this one (we chain free ones through freepmap) */
 575                 free_pmap_count--;
 576         }
 577         else {
 578                 simple_unlock(&free_pmap_lock);                         /* Unlock just in case */
 579                 splx(s);
 580
 581                 pmap = (pmap_t) zalloc(pmap_zone);                      /* Get one */
 582                 if (pmap == PMAP_NULL) return(PMAP_NULL);       /* Handle out-of-memory condition */
 583
 584                 bzero((char *)pmap, pmapSize);                          /* Clean up the pmap */
 585
 586                 s = splhigh();
 587                 simple_lock(&free_pmap_lock);                           /* Lock it back up      */
 588
 589                 ckpmap = cursor_pmap;                                           /* Get starting point for free ID search */
 590                 currSID = ckpmap->spaceNum;                                     /* Get the actual space ID number */
 591
 592                 while(1) {                                                                      /* Keep trying until something happens */
 593
 594                         currSID = (currSID + 1) & (maxAdrSp - 1);       /* Get the next in the sequence */
 595                         if(((currSID * incrVSID) & (maxAdrSp - 1)) == invalSpace) continue;     /* Skip the space we have reserved */
 596                         ckpmap = (pmap_t)ckpmap->pmap_link.next;        /* On to the next in-use pmap */
 597
 598                         if(ckpmap->spaceNum != currSID) break;  /* If we are out of sequence, this is free */
 599
 600                         if(ckpmap == cursor_pmap) {                             /* See if we have 2^20 already allocated */
 601                                 panic("pmap_create: Maximum number (%d) active address spaces reached\n", maxAdrSp);    /* Die pig dog */
 602                         }
 603                 }
 604
 605                 pmap->space = (currSID * incrVSID) & (maxAdrSp - 1);    /* Calculate the actual VSID */
 606                 pmap->spaceNum = currSID;                                       /* Set the space ID number */
 607 /*
 608  *              Now we link into the chain just before the out of sequence guy.
 609  */
 610
 611                 fore = (pmap_t)ckpmap->pmap_link.prev;          /* Get the current's previous */
 612                 pmap->pmap_link.next = (queue_t)ckpmap;         /* My next points to the current */
 613                 fore->pmap_link.next = (queue_t)pmap;           /* Current's previous's next points to me */
 614                 pmap->pmap_link.prev = (queue_t)fore;           /* My prev points to what the current pointed to */
 615                 ckpmap->pmap_link.prev = (queue_t)pmap;         /* Current's prev points to me */
 616
 617                 simple_lock_init(&pmap->lock, ETAP_VM_PMAP);
 618
 619                 physpmap = ((addr64_t)pmap_find_phys(kernel_pmap, (addr64_t)((uintptr_t)pmap)) << 12) | (addr64_t)((unsigned int)pmap & 0xFFF); /* Get the physical address of the pmap */
 620
 621                 pmap->pmapvr = (addr64_t)((uintptr_t)pmap) ^ physpmap;  /* Make V to R translation mask */
 622
 623                 pmapTrans[pmap->space].pmapPAddr = physpmap;    /* Set translate table physical to point to us */
 624                 pmapTrans[pmap->space].pmapVAddr = CAST_DOWN(unsigned int, pmap);       /* Set translate table virtual to point to us */
 625         }
 626
 627         pmap->pmapFlags = pmapKeyDef;                                   /* Set default key */
 628         pmap->pmapCCtl = pmapCCtlVal;                                   /* Initialize cache control */
 629         pmap->ref_count = 1;
 630         pmap->stats.resident_count = 0;
 631         pmap->stats.wired_count = 0;
 632         pmap->pmapSCSubTag = 0x0000000000000000ULL;             /* Make sure this is clean an tidy */
 633         simple_unlock(&free_pmap_lock);
 634
 635         splx(s);
 636         return(pmap);
 637 }
 638
 639 /*
 640  * pmap_destroy
 641  *
 642  * Gives up a reference to the specified pmap.  When the reference count
 643  * reaches zero the pmap structure is added to the pmap free list.
 644  *
 645  * Should only be called if the map contains no valid mappings.
 646  */
 647 void
 648 pmap_destroy(pmap_t pmap)
 649 {
 650         int ref_count;
 651         spl_t s;
 652         pmap_t fore, aft;
 653
 654         if (pmap == PMAP_NULL)
 655                 return;
 656
 657         ref_count=hw_atomic_sub(&pmap->ref_count, 1);                   /* Back off the count */
 658         if(ref_count>0) return;                                                                 /* Still more users, leave now... */
 659
 660         if(ref_count < 0)                                                                               /* Did we go too far? */
 661                 panic("pmap_destroy(): ref_count < 0");
 662
 663 #ifdef notdef
 664         if(pmap->stats.resident_count != 0)
 665                 panic("PMAP_DESTROY: pmap not empty");
 666 #else
 667         if(pmap->stats.resident_count != 0) {
 668                 pmap_remove(pmap, 0, 0xFFFFFFFFFFFFF000ULL);
 669         }
 670 #endif
 671
 672         /*
 673          * Add the pmap to the pmap free list.
 674          */
 675
 676         s = splhigh();
 677         /*
 678          * Add the pmap to the pmap free list.
 679          */
 680         simple_lock(&free_pmap_lock);
 681
 682         if (free_pmap_count <= free_pmap_max) {         /* Do we have enough spares? */
 683
 684                 pmap->freepmap = free_pmap_list;                /* Queue in front */
 685                 free_pmap_list = pmap;
 686                 free_pmap_count++;
 687                 simple_unlock(&free_pmap_lock);
 688
 689         } else {
 690                 if(cursor_pmap == pmap) cursor_pmap = (pmap_t)pmap->pmap_link.prev;     /* If we are releasing the cursor, back up */
 691                 fore = (pmap_t)pmap->pmap_link.prev;
 692                 aft  = (pmap_t)pmap->pmap_link.next;
 693                 fore->pmap_link.next = pmap->pmap_link.next;    /* My previous's next is my next */
 694                 aft->pmap_link.prev = pmap->pmap_link.prev;             /* My next's previous is my previous */
 695                 simple_unlock(&free_pmap_lock);
 696                 pmapTrans[pmap->space].pmapPAddr = -1;                  /* Invalidate the translate table physical */
 697                 pmapTrans[pmap->space].pmapVAddr = -1;                  /* Invalidate the translate table virtual */
 698                 zfree(pmap_zone, (vm_offset_t) pmap);
 699         }
 700         splx(s);
 701 }
 702
 703 /*
 704  * pmap_reference(pmap)
 705  *      gains a reference to the specified pmap.
 706  */
 707 void
 708 pmap_reference(pmap_t pmap)
 709 {
 710         spl_t s;
 711
 712         if (pmap != PMAP_NULL) hw_atomic_add(&pmap->ref_count, 1);      /* Bump the count */
 713 }
 714
 715 /*
 716  * pmap_remove_some_phys
 717  *
 718  *      Removes mappings of the associated page from the specified pmap
 719  *
 720  */
 721 void pmap_remove_some_phys(
 722              pmap_t pmap,
 723              vm_offset_t pa)
 724 {
 725         register struct phys_entry      *pp;
 726         register struct mapping         *mp;
 727         unsigned int pindex;
 728
 729         if (pmap == PMAP_NULL) {                                        /* This should never be called with a null pmap */
 730                 panic("pmap_remove_some_phys: null pmap\n");
 731         }
 732
 733         pp = mapping_phys_lookup(pa, &pindex);          /* Get physical entry */
 734         if (pp == 0) return;                                            /* Leave if not in physical RAM */
 735
 736         while(1) {                                                                      /* Keep going until we toss all pages from this pmap */
 737                 if (pmap->pmapFlags & pmapVMhost) {
 738                         mp = hw_purge_phys(pp);                         /* Toss a map */
 739                         if(!mp ) return;
 740                         if((unsigned int)mp & mapRetCode) {             /* Was there a failure? */
 741                                 panic("pmap_remove_some_phys: hw_purge_phys failed - pp = %08X, pmap = %08X, code = %08X\n",
 742                                         pp, pmap, mp);
 743                         }
 744                 } else {
 745                         mp = hw_purge_space(pp, pmap);                  /* Toss a map */
 746                         if(!mp ) return;
 747                         if((unsigned int)mp & mapRetCode) {             /* Was there a failure? */
 748                                 panic("pmap_remove_some_phys: hw_purge_pmap failed - pp = %08X, pmap = %08X, code = %08X\n",
 749                                         pp, pmap, mp);
 750                         }
 751                 }
 752                 mapping_free(mp);                                               /* Toss the mapping */
 753         }
 754
 755         return;                                                                         /* Leave... */
 756 }
 757
 758 /*
 759  * pmap_remove(pmap, s, e)
 760  *      unmaps all virtual addresses v in the virtual address
 761  *      range determined by [s, e) and pmap.
 762  *      s and e must be on machine independent page boundaries and
 763  *      s must be less than or equal to e.
 764  *
 765  *      Note that pmap_remove does not remove any mappings in nested pmaps. We just
 766  *      skip those segments.
 767  */
 768 void
 769 pmap_remove(
 770             pmap_t pmap,
 771             addr64_t sva,
 772             addr64_t eva)
 773 {
 774         addr64_t                va, endva;
 775
 776         if (pmap == PMAP_NULL) return;                                  /* Leave if software pmap */
 777
 778
 779         /* It is just possible that eva might have wrapped around to zero,
 780          * and sometimes we get asked to liberate something of size zero
 781          * even though it's dumb (eg. after zero length read_overwrites)
 782          */
 783         assert(eva >= sva);
 784
 785         /* If these are not page aligned the loop might not terminate */
 786         assert((sva == trunc_page_64(sva)) && (eva == trunc_page_64(eva)));
 787
 788         va = sva & -4096LL;                                                     /* Round start down to a page */
 789         endva = eva & -4096LL;                                          /* Round end down to a page */
 790
 791         while(1) {                                                                      /* Go until we finish the range */
 792                 va = mapping_remove(pmap, va);                  /* Remove the mapping and see what's next */
 793                 va = va & -4096LL;                                              /* Make sure the "not found" indication is clear */
 794                 if((va == 0) || (va >= endva)) break;   /* End loop if we finish range or run off the end */
 795         }
 796
 797 }
 798
 799 /*
 800  *      Routine:
 801  *              pmap_page_protect
 802  *
 803  *      Function:
 804  *              Lower the permission for all mappings to a given page.
 805  */
 806 void
 807 pmap_page_protect(
 808         ppnum_t pa,
 809         vm_prot_t prot)
 810 {
 811         register struct phys_entry      *pp;
 812         boolean_t                       remove;
 813         unsigned int            pindex;
 814         mapping                         *mp;
 815
 816
 817         switch (prot) {
 818                 case VM_PROT_READ:
 819                 case VM_PROT_READ|VM_PROT_EXECUTE:
 820                         remove = FALSE;
 821                         break;
 822                 case VM_PROT_ALL:
 823                         return;
 824                 default:
 825                         remove = TRUE;
 826                         break;
 827         }
 828
 829
 830         pp = mapping_phys_lookup(pa, &pindex);  /* Get physical entry */
 831         if (pp == 0) return;                                            /* Leave if not in physical RAM */
 832
 833         if (remove) {                                                           /* If the protection was set to none, we'll remove all mappings */
 834
 835                 while(1) {                                                              /* Keep going until we toss all pages from this physical page */
 836                         mp = hw_purge_phys(pp);                         /* Toss a map */
 837                         if(!mp ) return;
 838                         if((unsigned int)mp & mapRetCode) {     /* Was there a failure? */
 839                                 panic("pmap_page_protect: hw_purge_phys failed - pp = %08X, code = %08X\n",
 840                                         pp, mp);
 841                         }
 842                         mapping_free(mp);                                       /* Toss the mapping */
 843                 }
 844
 845                 return;                                                                 /* Leave... */
 846         }
 847
 848 /*      When we get here, it means that we are to change the protection for a
 849  *      physical page.
 850  */
 851
 852         mapping_protect_phys(pa, prot & VM_PROT_ALL);   /* Change protection of all mappings to page. */
 853
 854 }
 855
 856 /*
 857  * pmap_protect(pmap, s, e, prot)
 858  *      changes the protection on all virtual addresses v in the
 859  *      virtual address range determined by [s, e] and pmap to prot.
 860  *      s and e must be on machine independent page boundaries and
 861  *      s must be less than or equal to e.
 862  *
 863  *      Note that any requests to change the protection of a nested pmap are
 864  *      ignored. Those changes MUST be done by calling this with the correct pmap.
 865  */
 866 void pmap_protect(
 867              pmap_t pmap,
 868              vm_offset_t sva,
 869              vm_offset_t eva,
 870              vm_prot_t prot)
 871 {
 872
 873         addr64_t va, endva, nextva;
 874
 875         if (pmap == PMAP_NULL) return;                          /* Do nothing if no pmap */
 876
 877         if (prot == VM_PROT_NONE) {                                     /* Should we kill the address range?? */
 878                 pmap_remove(pmap, (addr64_t)sva, (addr64_t)eva);        /* Yeah, dump 'em */
 879                 return;                                                                 /* Leave... */
 880         }
 881
 882         va = sva & -4096LL;                                                     /* Round start down to a page */
 883         endva = eva & -4096LL;                                          /* Round end down to a page */
 884
 885         while(1) {                                                                      /* Go until we finish the range */
 886                 (void)mapping_protect(pmap, va, prot & VM_PROT_ALL, &va);       /* Change the protection and see what's next */
 887                 if((va == 0) || (va >= endva)) break;   /* End loop if we finish range or run off the end */
 888         }
 889
 890 }
 891
 892
 893
 894 /*
 895  * pmap_enter
 896  *
 897  * Create a translation for the virtual address (virt) to the physical
 898  * address (phys) in the pmap with the protection requested. If the
 899  * translation is wired then we can not allow a full page fault, i.e.,
 900  * the mapping control block is not eligible to be stolen in a low memory
 901  * condition.
 902  *
 903  * NB: This is the only routine which MAY NOT lazy-evaluate
 904  *     or lose information.  That is, this routine must actually
 905  *     insert this page into the given map NOW.
 906  */
 907 void
 908 pmap_enter(pmap_t pmap, vm_offset_t va, ppnum_t pa, vm_prot_t prot,
 909                 unsigned int flags, boolean_t wired)
 910 {
 911         int                                     memattr;
 912         pmap_t                          opmap;
 913         unsigned int            mflags;
 914         addr64_t                        colva;
 915
 916         if (pmap == PMAP_NULL) return;                                  /* Leave if software pmap */
 917
 918         disable_preemption();                                                   /* Don't change threads */
 919
 920         mflags = 0;                                                                             /* Make sure this is initialized to nothing special */
 921         if(!(flags & VM_WIMG_USE_DEFAULT)) {                    /* Are they supplying the attributes? */
 922                 mflags = mmFlgUseAttr | (flags & VM_MEM_GUARDED) | ((flags & VM_MEM_NOT_CACHEABLE) >> 1);       /* Convert to our mapping_make flags */
 923         }
 924
 925 /*
 926  *      It is possible to hang here if another processor is remapping any pages we collide with and are removing
 927  */
 928
 929         while(1) {                                                                              /* Keep trying the enter until it goes in */
 930
 931                 colva = mapping_make(pmap, va, pa, mflags, 1, prot & VM_PROT_ALL);      /* Enter the mapping into the pmap */
 932
 933                 if(!colva) break;                                                       /* If there were no collisions, we are done... */
 934
 935                 mapping_remove(pmap, colva);                            /* Remove the mapping that collided */
 936         }
 937
 938         enable_preemption();                                                    /* Thread change ok */
 939
 940 }
 941
 942 /*
 943  *              Enters translations for odd-sized V=F blocks.
 944  *
 945  *              The higher level VM map should be locked to insure that we don't have a
 946  *              double diddle here.
 947  *
 *              We panic if we get a block that overlaps with another. We do not merge adjacent
 *              blocks because removing any address within a block removes the entire block and it
 *              would really mess things up if we trashed too much.
 *
 *              Once a block is mapped, it is immutable, that is, protection, cache mode, etc. can
 *              not be changed.  The block must be unmapped and then remapped with the new stuff.
 954  *              We also do not keep track of reference or change flags.
 955  *
 956  *              Note that pmap_map_block_rc is the same but doesn't panic if collision.
 957  *
 958  */
 959
 960 void pmap_map_block(pmap_t pmap, addr64_t va, ppnum_t pa, vm_size_t size, vm_prot_t prot, int attr, unsigned int flags) {       /* Map an autogenned block */
 961
 962         int                                     memattr;
 963         unsigned int            mflags;
 964         addr64_t                        colva;
 965
 966
 967         if (pmap == PMAP_NULL) {                                                /* Did they give us a pmap? */
 968                 panic("pmap_map_block: null pmap\n");           /* No, like that's dumb... */
 969         }
 970
 971 //      kprintf("pmap_map_block: (%08X) va = %016llX, pa = %08X, size = %08X, prot = %08X, attr = %08X, flags = %08X\n",        /* (BRINGUP) */
 972 //              current_act(), va, pa, size, prot, attr, flags);        /* (BRINGUP) */
 973
 974
 975         mflags = mmFlgBlock | mmFlgUseAttr | (attr & VM_MEM_GUARDED) | ((attr & VM_MEM_NOT_CACHEABLE) >> 1);    /* Convert to our mapping_make flags */
 976         if(flags) mflags |= mmFlgPerm;                                  /* Mark permanent if requested */
 977
 978         colva = mapping_make(pmap, va, pa, mflags, (size >> 12), prot); /* Enter the mapping into the pmap */
 979
 980         if(colva) {                                                                             /* If there was a collision, panic */
 981                 panic("pmap_map_block: collision at %016llX, pmap = %08X\n", colva, pmap);
 982         }
 983
 984         return;                                                                                 /* Return */
 985 }
 986
 987 int pmap_map_block_rc(pmap_t pmap, addr64_t va, ppnum_t pa, vm_size_t size, vm_prot_t prot, int attr, unsigned int flags) {     /* Map an autogenned block */
 988
 989         int                                     memattr;
 990         unsigned int            mflags;
 991         addr64_t                        colva;
 992
 993
 994         if (pmap == PMAP_NULL) {                                                /* Did they give us a pmap? */
 995                 panic("pmap_map_block_rc: null pmap\n");        /* No, like that's dumb... */
 996         }
 997
 998         mflags = mmFlgBlock | mmFlgUseAttr | (attr & VM_MEM_GUARDED) | ((attr & VM_MEM_NOT_CACHEABLE) >> 1);    /* Convert to our mapping_make flags */
 999         if(flags) mflags |= mmFlgPerm;                                  /* Mark permanent if requested */
1000
1001         colva = mapping_make(pmap, va, pa, mflags, (size >> 12), prot); /* Enter the mapping into the pmap */
1002
1003         if(colva) return 0;                                                             /* If there was a collision, fail */
1004
1005         return 1;                                                                               /* Return true of we worked */
1006 }
1007
1008 /*
1009  * pmap_extract(pmap, va)
 *      returns the physical address corresponding to the
1011  *      virtual address specified by pmap and va if the
1012  *      virtual address is mapped and 0 if it is not.
1013  *      Note: we assume nothing is ever mapped to phys 0.
1014  *
1015  *      NOTE: This call always will fail for physical addresses greater than 0xFFFFF000.
1016  */
1017 vm_offset_t pmap_extract(pmap_t pmap, vm_offset_t va) {
1018
1019         spl_t                                   spl;
1020         register struct mapping *mp;
1021         register vm_offset_t    pa;
1022         addr64_t                                nextva;
1023         ppnum_t                                 ppoffset;
1024         unsigned int                    gva;
1025
1026 #ifdef BOGUSCOMPAT
1027         panic("pmap_extract: THIS CALL IS BOGUS. NEVER USE IT EVER. So there...\n");    /* Don't use this */
1028 #else
1029
1030         gva = (unsigned int)va;                                                 /* Make sure we don't have a sign */
1031
1032         spl = splhigh();                                                                /* We can't allow any loss of control here */
1033
1034         mp = mapping_find(pmap, (addr64_t)gva, &nextva,1);      /* Find the mapping for this address */
1035
1036         if(!mp) {                                                                               /* Is the page mapped? */
1037                 splx(spl);                                                                      /* Enable interrupts */
1038                 return 0;                                                                       /* Pass back 0 if not found */
1039         }
1040
1041         ppoffset = (ppnum_t)(((gva & -4096LL) - (mp->mpVAddr & -4096LL)) >> 12);        /* Get offset from va to base va */
1042
1043
1044         pa = mp->mpPAddr + ppoffset;                                    /* Remember ppage because mapping may vanish after drop call */
1045
1046         mapping_drop_busy(mp);                                                  /* We have everything we need from the mapping */
1047         splx(spl);                                                                              /* Restore 'rupts */
1048
1049         if(pa > maxPPage32) return 0;                                   /* Force large addresses to fail */
1050
1051         pa = (pa << 12) | (va & 0xFFF);                                 /* Convert physical page number to address */
1052
1053 #endif
1054         return pa;                                                                              /* Return physical address or 0 */
1055 }
1056
1057 /*
1058  * ppnum_t pmap_find_phys(pmap, addr64_t va)
 *      returns the physical page corresponding to the
1060  *      virtual address specified by pmap and va if the
1061  *      virtual address is mapped and 0 if it is not.
1062  *      Note: we assume nothing is ever mapped to phys 0.
1063  *
1064  */
1065 ppnum_t pmap_find_phys(pmap_t pmap, addr64_t va) {
1066
1067         spl_t                                   spl;
1068         register struct mapping *mp;
1069         ppnum_t                                 pa, ppoffset;
1070         addr64_t                                nextva, curva;
1071
1072         spl = splhigh();                                                                /* We can't allow any loss of control here */
1073
1074         mp = mapping_find(pmap, va, &nextva, 1);                /* Find the mapping for this address */
1075
1076         if(!mp) {                                                                               /* Is the page mapped? */
1077                 splx(spl);                                                                      /* Enable interrupts */
1078                 return 0;                                                                       /* Pass back 0 if not found */
1079         }
1080
1081
1082         ppoffset = (ppnum_t)(((va & -4096LL) - (mp->mpVAddr & -4096LL)) >> 12); /* Get offset from va to base va */
1083
1084         pa = mp->mpPAddr + ppoffset;                                    /* Get the actual physical address */
1085
1086         mapping_drop_busy(mp);                                                  /* We have everything we need from the mapping */
1087
1088         splx(spl);                                                                              /* Restore 'rupts */
1089         return pa;                                                                              /* Return physical address or 0 */
1090 }
1091
1092
1093 /*
 *      pmap_attribute:
1095  *
1096  *      Set/Get special memory attributes; not implemented.
1097  *
1098  *      Note: 'VAL_GET_INFO' is used to return info about a page.
1099  *        If less than 1 page is specified, return the physical page
1100  *        mapping and a count of the number of mappings to that page.
1101  *        If more than one page is specified, return the number
1102  *        of resident pages and the number of shared (more than
1103  *        one mapping) pages in the range;
1104  *
1105  *
1106  */
1107 kern_return_t
1108 pmap_attribute(pmap, address, size, attribute, value)
1109         pmap_t                  pmap;
1110         vm_offset_t             address;
1111         vm_size_t               size;
1112         vm_machine_attribute_t  attribute;
1113         vm_machine_attribute_val_t* value;
1114 {
1115
1116         return KERN_INVALID_ARGUMENT;
1117
1118 }
1119
1120 /*
 * pmap_attribute_cache_sync(ppnum_t pp, vm_size_t size, attribute, value)
 *
 * Invalidates all of the instruction cache on each physical page of the range
 * starting at page pp and pushes any dirty data from the data cache for the
 * same physical pages
1125  */
1126
1127 kern_return_t pmap_attribute_cache_sync(ppnum_t pp, vm_size_t size,
1128                                 vm_machine_attribute_t  attribute,
1129                                 vm_machine_attribute_val_t* value) {
1130
1131         spl_t s;
1132         unsigned int i, npages;
1133
1134         npages = round_page_32(size) >> 12;                     /* Get the number of pages to do */
1135
1136         for(i = 0; i < npages; i++) {                           /* Do all requested pages */
1137                 s = splhigh();                                                  /* No interruptions here */
1138                 sync_ppage(pp + i);                                             /* Go flush data cache and invalidate icache */
1139                 splx(s);                                                                /* Allow interruptions */
1140         }
1141
1142         return KERN_SUCCESS;
1143 }
1144
1145 /*
1146  * pmap_sync_caches_phys(ppnum_t pa)
1147  *
1148  * Invalidates all of the instruction cache on a physical page and
1149  * pushes any dirty data from the data cache for the same physical page
1150  */
1151
1152 void pmap_sync_caches_phys(ppnum_t pa) {
1153
1154         spl_t s;
1155
1156         s = splhigh();                                                          /* No interruptions here */
1157         sync_ppage(pa);                                                         /* Sync up dem caches */
1158         splx(s);                                                                        /* Allow interruptions */
1159         return;
1160 }
1161
1162 /*
1163  * pmap_collect
1164  *
1165  * Garbage collects the physical map system for pages that are no longer used.
1166  * It isn't implemented or needed or wanted.
1167  */
1168 void
1169 pmap_collect(pmap_t pmap)
1170 {
1171         return;
1172 }
1173
1174 /*
1175  *      Routine:        pmap_activate
1176  *      Function:
1177  *              Binds the given physical map to the given
1178  *              processor, and returns a hardware map description.
1179  *              It isn't implemented or needed or wanted.
1180  */
1181 void
1182 pmap_activate(
1183         pmap_t pmap,
1184         thread_t th,
1185         int which_cpu)
1186 {
1187         return;
1188 }
1189 /*
1190  * pmap_deactivate:
1191  * It isn't implemented or needed or wanted.
1192  */
1193 void
1194 pmap_deactivate(
1195         pmap_t pmap,
1196         thread_t th,
1197         int which_cpu)
1198 {
1199         return;
1200 }
1201
1202
1203 /*
1204  * pmap_pageable(pmap, s, e, pageable)
1205  *      Make the specified pages (by pmap, offset)
1206  *      pageable (or not) as requested.
1207  *
1208  *      A page which is not pageable may not take
1209  *      a fault; therefore, its page table entry
1210  *      must remain valid for the duration.
1211  *
1212  *      This routine is merely advisory; pmap_enter()
1213  *      will specify that these pages are to be wired
1214  *      down (or not) as appropriate.
1215  *
1216  *      (called from vm/vm_fault.c).
1217  */
1218 void
1219 pmap_pageable(
1220         pmap_t          pmap,
1221         vm_offset_t     start,
1222         vm_offset_t     end,
1223         boolean_t       pageable)
1224 {
1225
1226         return;                                                                                         /* This is not used... */
1227
1228 }
1229 /*
1230  *      Routine:        pmap_change_wiring
1231  *      NOT USED ANYMORE.
1232  */
1233 void
1234 pmap_change_wiring(
1235         register pmap_t pmap,
1236         vm_offset_t     va,
1237         boolean_t       wired)
1238 {
1239         return;                                                                                         /* This is not used... */
1240 }
1241
1242 /*
1243  * pmap_modify_pages(pmap, s, e)
1244  *      sets the modified bit on all virtual addresses v in the
1245  *      virtual address range determined by [s, e] and pmap,
1246  *      s and e must be on machine independent page boundaries and
1247  *      s must be less than or equal to e.
1248  *
1249  *  Note that this function will not descend nested pmaps.
1250  */
1251 void
1252 pmap_modify_pages(
1253              pmap_t pmap,
1254              vm_offset_t sva,
1255              vm_offset_t eva)
1256 {
1257         spl_t           spl;
1258         mapping         *mp;
1259         ppnum_t         pa;
1260         addr64_t                va, endva, nextva;
1261         unsigned int    saveflags;
1262
1263         if (pmap == PMAP_NULL) return;                                  /* If no pmap, can't do it... */
1264
1265         va = sva & -4096;                                                               /* Round to page */
1266         endva = eva & -4096;                                                    /* Round to page */
1267
1268         while (va < endva) {                                                    /* Walk through all pages */
1269
1270                 spl = splhigh();                                                        /* We can't allow any loss of control here */
1271
1272                 mp = mapping_find(pmap, (addr64_t)va, &va, 0);  /* Find the mapping for this address */
1273
1274                 if(!mp) {                                                                       /* Is the page mapped? */
1275                         splx(spl);                                                              /* Page not mapped, restore interruptions */
1276                         if((va == 0) || (va >= endva)) break;   /* We are done if there are no more or we hit the end... */
1277                         continue;                                                               /* We are not done and there is more to check... */
1278                 }
1279
1280                 saveflags = mp->mpFlags;                                        /* Remember the flags */
1281                 pa = mp->mpPAddr;                                                       /* Remember ppage because mapping may vanish after drop call */
1282
1283                 mapping_drop_busy(mp);                                          /* We have everything we need from the mapping */
1284
1285                 splx(spl);                                                                      /* Restore 'rupts */
1286
1287                 if(saveflags & (mpNest | mpBlock)) continue;    /* Can't mess around with these guys... */
1288
1289                 mapping_set_mod(pa);                                            /* Set the modfied bit for this page */
1290
1291                 if(va == 0) break;                                                      /* We hit the end of the pmap, might as well leave now... */
1292         }
1293         return;                                                                                 /* Leave... */
1294 }
1295
1296 /*
1297  * pmap_clear_modify(phys)
1298  *      clears the hardware modified ("dirty") bit for one
1299  *      machine independant page starting at the given
1300  *      physical address.  phys must be aligned on a machine
1301  *      independant page boundary.
1302  */
1303 void
1304 pmap_clear_modify(vm_offset_t pa)
1305 {
1306
1307         mapping_clr_mod((ppnum_t)pa);                           /* Clear all change bits for physical page */
1308
1309 }
1310
1311 /*
1312  * pmap_is_modified(phys)
1313  *      returns TRUE if the given physical page has been modified
1314  *      since the last call to pmap_clear_modify().
1315  */
1316 boolean_t
1317 pmap_is_modified(register vm_offset_t pa)
1318 {
1319         return mapping_tst_mod((ppnum_t)pa);    /* Check for modified */
1320
1321 }
1322
1323 /*
1324  * pmap_clear_reference(phys)
1325  *      clears the hardware referenced bit in the given machine
1326  *      independant physical page.
1327  *
1328  */
1329 void
1330 pmap_clear_reference(vm_offset_t pa)
1331 {
1332         mapping_clr_ref((ppnum_t)pa);                   /* Check for modified */
1333 }
1334
1335 /*
1336  * pmap_is_referenced(phys)
1337  *      returns TRUE if the given physical page has been referenced
1338  *      since the last call to pmap_clear_reference().
1339  */
1340 boolean_t
1341 pmap_is_referenced(vm_offset_t pa)
1342 {
1343         return mapping_tst_ref((ppnum_t)pa);    /* Check for referenced */
1344 }
1345
1346 /*
1347  * pmap_canExecute(ppnum_t pa)
1348  *  returns 1 if instructions can execute
1349  *  returns 0 if know not (i.e. guarded and/or non-executable set)
1350  *  returns -1 if we don't know (i.e., the page is no RAM)
1351  */
1352 int
1353 pmap_canExecute(ppnum_t pa)
1354 {
1355         phys_entry *physent;
1356         unsigned int pindex;
1357
1358         physent = mapping_phys_lookup(pa, &pindex);                             /* Get physical entry */
1359
1360         if(!physent) return -1;                                                                 /* If there is no physical entry, we don't know... */
1361
1362         if((physent->ppLink & (ppN | ppG))) return 0;                   /* If we are marked non-executable or guarded, say we can not execute */
1363         return 1;                                                                                               /* Good to go... */
1364 }
1365
#if	MACH_VM_DEBUG
/*
 * pmap_list_resident_pages(pmap, listp, space)
 *	Stub: always returns 0 without examining any of its arguments.
 */
int
pmap_list_resident_pages(register pmap_t pmap, register vm_offset_t *listp, register int space)
{
	return 0;				/* Nothing is ever listed */
}
#endif	/* MACH_VM_DEBUG */
1376
1377 /*
1378  * Locking:
1379  *      spl: VM
1380  */
1381 void
1382 pmap_copy_part_page(
1383         vm_offset_t     src,
1384         vm_offset_t     src_offset,
1385         vm_offset_t     dst,
1386         vm_offset_t     dst_offset,
1387         vm_size_t       len)
1388 {
1389         register struct phys_entry *pp_src, *pp_dst;
1390         spl_t   s;
1391         addr64_t fsrc, fdst;
1392
1393         assert(((dst <<12) & PAGE_MASK+dst_offset+len) <= PAGE_SIZE);
1394         assert(((src <<12) & PAGE_MASK+src_offset+len) <= PAGE_SIZE);
1395
1396         fsrc = ((addr64_t)src << 12) + src_offset;
1397         fdst = ((addr64_t)dst << 12) + dst_offset;
1398
1399         phys_copy(fsrc, fdst, len);                                                             /* Copy the stuff physically */
1400 }
1401
1402 void
1403 pmap_zero_part_page(
1404         vm_offset_t     p,
1405         vm_offset_t     offset,
1406         vm_size_t       len)
1407 {
1408     panic("pmap_zero_part_page");
1409 }
1410
1411 boolean_t pmap_verify_free(ppnum_t pa) {
1412
1413         struct phys_entry       *pp;
1414         unsigned int pindex;
1415
1416         pp = mapping_phys_lookup(pa, &pindex);  /* Get physical entry */
1417         if (pp == 0) return FALSE;                                      /* If there isn't one, show no mapping... */
1418
1419         if(pp->ppLink & ~(ppLock | ppN | ppFlags)) return TRUE; /* We have at least one mapping */
1420         return FALSE;                                                           /* No mappings */
1421 }
1422
1423
1424 /* Determine if we need to switch space and set up for it if so */
1425
1426 void pmap_switch(pmap_t map)
1427 {
1428         unsigned int i;
1429
1430
1431         hw_blow_seg(copyIOaddr);                                        /* Blow off the first segment */
1432         hw_blow_seg(copyIOaddr + 0x10000000ULL);        /* Blow off the second segment */
1433
1434 /* when changing to kernel space, don't bother
1435  * doing anything, the kernel is mapped from here already.
1436  */
1437         if (map->space == PPC_SID_KERNEL) {                     /* Are we switching into kernel space? */
1438                 return;                                                                 /* If so, we don't do anything... */
1439         }
1440
1441         hw_set_user_space(map);                                         /* Indicate if we need to load the SRs or not */
1442         return;                                                                         /* Bye, bye, butterfly... */
1443 }
1444
1445 /*
1446  *      kern_return_t pmap_nest(grand, subord, vstart, size)
1447  *
1448  *      grand  = the pmap that we will nest subord into
1449  *      subord = the pmap that goes into the grand
1450  *      vstart  = start of range in pmap to be inserted
1451  *      nstart  = start of range in pmap nested pmap
1452  *      size   = Size of nest area (up to 16TB)
1453  *
1454  *      Inserts a pmap into another.  This is used to implement shared segments.
1455  *      On the current PPC processors, this is limited to segment (256MB) aligned
1456  *      segment sized ranges.
1457  *
1458  *      We actually kinda allow recursive nests.  The gating factor is that we do not allow
1459  *      nesting on top of something that is already mapped, i.e., the range must be empty.
1460  *
1461  *
1462  *
1463  *      Note that we depend upon higher level VM locks to insure that things don't change while
1464  *      we are doing this.  For example, VM should not be doing any pmap enters while it is nesting
1465  *      or do 2 nests at once.
1466  */
1467
1468 kern_return_t pmap_nest(pmap_t grand, pmap_t subord, addr64_t vstart, addr64_t nstart, uint64_t size) {
1469
1470         addr64_t nextva, vend, colladdr;
1471         unsigned int msize;
1472         int i, nlists, asize;
1473         spl_t   s;
1474         mapping *mp;
1475
1476
1477         if(size & 0x0FFFFFFFULL) return KERN_INVALID_VALUE;     /* We can only do this for multiples of 256MB */
1478         if((size >> 28) > 65536)  return KERN_INVALID_VALUE;    /* Max size we can nest is 16TB */
1479         if(vstart & 0x0FFFFFFFULL) return KERN_INVALID_VALUE;   /* We can only do this aligned to 256MB */
1480         if(nstart & 0x0FFFFFFFULL) return KERN_INVALID_VALUE;   /* We can only do this aligned to 256MB */
1481
1482         if(size == 0) {                                                         /*      Is the size valid? */
1483                 panic("pmap_nest: size is invalid - %016llX\n", size);
1484         }
1485
1486         msize = (size >> 28) - 1;                                                       /* Change size to blocks of 256MB */
1487
1488         nlists = mapSetLists(grand);                                            /* Set number of lists this will be on */
1489
1490         mp = mapping_alloc(nlists);                                                     /* Get a spare mapping block */
1491
1492         mp->mpFlags = 0x01000000 | mpNest | nlists;                     /* Set the flags. Make sure busy count is 1 */
1493         mp->mpSpace = subord->space;                                            /* Set the address space/pmap lookup ID */
1494         mp->mpBSize = msize;                                                            /* Set the size */
1495         mp->mpPte = 0;                                                                          /* Set the PTE invalid */
1496         mp->mpPAddr = 0;                                                                        /* Set the physical page number */
1497         mp->mpVAddr = vstart;                                                           /* Set the address */
1498         mp->mpNestReloc = nstart - vstart;                                      /* Set grand to nested vaddr relocation value */
1499
1500         colladdr = hw_add_map(grand, mp);                                       /* Go add the mapping to the pmap */
1501
1502         if(colladdr) {                                                                          /* Did it collide? */
1503                 vend = vstart + size - 4096;                                    /* Point to the last page we would cover in nest */
1504                 panic("pmap_nest: attempt to nest into a non-empty range - pmap = %08X, start = %016llX, end = %016llX\n",
1505                         grand, vstart, vend);
1506         }
1507
1508         return KERN_SUCCESS;
1509 }
1510
1511 /*
1512  *      kern_return_t pmap_unnest(grand, vaddr)
1513  *
1514  *      grand  = the pmap that we will nest subord into
1515  *      vaddr  = start of range in pmap to be unnested
1516  *
1517  *      Removes a pmap from another.  This is used to implement shared segments.
1518  *      On the current PPC processors, this is limited to segment (256MB) aligned
1519  *      segment sized ranges.
1520  */
1521
1522 kern_return_t pmap_unnest(pmap_t grand, addr64_t vaddr) {
1523
1524         unsigned int oflags, seg, grandr, tstamp;
1525         int i, tcpu, mycpu;
1526         addr64_t nextva;
1527         spl_t s;
1528         mapping *mp;
1529
1530         s = splhigh();                                                                          /* Make sure interruptions are disabled */
1531
1532         mp = mapping_find(grand, vaddr, &nextva, 0);            /* Find the nested map */
1533
1534         if(((unsigned int)mp & mapRetCode) != mapRtOK) {        /* See if it was even nested */
1535                 panic("pmap_unnest: Attempt to unnest an unnested segment - va = %016llX\n", vaddr);
1536         }
1537
1538         if(!(mp->mpFlags & mpNest)) {                                           /* Did we find something other than a nest? */
1539                 panic("pmap_unnest: Attempt to unnest something that is not a nest - va = %016llX\n", vaddr);
1540         }
1541
1542         if(mp->mpVAddr != vaddr) {                                                      /* Make sure the address is the same */
1543                 panic("pmap_unnest: Attempt to unnest something that is not at start of nest - va = %016llX\n", vaddr);
1544         }
1545
1546         (void)hw_atomic_or(&mp->mpFlags, mpRemovable);          /* Show that this mapping is now removable */
1547
1548         mapping_drop_busy(mp);                                                          /* Go ahead and relase the mapping now */
1549
1550         disable_preemption();                                                           /* It's all for me! */
1551         splx(s);                                                                                        /* Restore 'rupts */
1552
1553         (void)mapping_remove(grand, vaddr);                                     /* Toss the nested pmap mapping */
1554
1555         invalidateSegs(grand);                                                          /* Invalidate the pmap segment cache */
1556
1557 /*
1558  *      Note that the following will force the segment registers to be reloaded
1559  *      on all processors (if they are using the pmap we just changed) before returning.
1560  *
1561  *      This is needed.  The reason is that until the segment register is
1562  *      reloaded, another thread in the same task on a different processor will
1563  *      be able to access memory that it isn't allowed to anymore.  That can happen
1564  *      because access to the subordinate pmap is being removed, but the pmap is still
1565  *      valid.
1566  *
1567  *      Note that we only kick the other processor if we see that it was using the pmap while we
1568  *      were changing it.
1569  */
1570
1571
1572         mycpu = cpu_number();                                                           /* Who am I? Am I just a dream? */
1573         for(i=0; i < real_ncpus; i++) {                                         /* Cycle through processors */
1574                 if((unsigned int)grand == per_proc_info[i].ppUserPmapVirt) {    /* Is this guy using the changed pmap? */
1575
1576                         per_proc_info[i].ppInvSeg = 1;                          /* Show that we need to invalidate the segments */
1577
1578                         if(i == mycpu) continue;                                        /* Don't diddle ourselves */
1579
1580                         tstamp = per_proc_info[i].ruptStamp[1];         /* Save the processor's last interrupt time stamp */
1581                         if(cpu_signal(i, SIGPcpureq, CPRQsegload, 0) != KERN_SUCCESS) { /* Make sure we see the pmap change */
1582                                 continue;
1583                         }
1584
1585                         if(!hw_cpu_wcng(&per_proc_info[i].ruptStamp[1], tstamp, LockTimeOut)) { /* Wait for the other processors to enter debug */
1586                                 panic("pmap_unnest: Other processor (%d) did not see interruption request\n", i);
1587                         }
1588                 }
1589         }
1590
1591         enable_preemption();                                                            /* Others can run now */
1592         return KERN_SUCCESS;                                                            /* Bye, bye, butterfly... */
1593 }
1594
1595
1596 /*
1597  *      void MapUserAddressSpaceInit(void)
1598  *
1599  *      Initialized anything we need to in order to map user address space slices into
1600  *      the kernel.  Primarily used for copy in/out.
1601  *
1602  *      Currently we only support one 512MB slot for this purpose.  There are two special
1603  *      mappings defined for the purpose: the special pmap nest, and linkage mapping.
1604  *
1605  *      The special pmap nest (which is allocated in this function) is used as a place holder
1606  *      in the kernel's pmap search list. It is 512MB long and covers the address range
1607  *      starting at copyIOaddr.  It points to no actual memory and when the fault handler
1608  *      hits in it, it knows to look in the per_proc and start using the linkage
1609  *      mapping contained therin.
1610  *
1611  *      The linkage mapping is used to glue the user address space slice into the
1612  *      kernel.  It contains the relocation information used to transform the faulting
1613  *      kernel address into the user address space.  It also provides the link to the
1614  *      user's pmap.  This is pointed to by the per_proc and is switched in and out
1615  *      whenever there is a context switch.
1616  *
1617  */
1618
1619 void MapUserAddressSpaceInit(void) {
1620
1621         addr64_t colladdr;
1622         int nlists, asize;
1623         mapping *mp;
1624
1625         nlists = mapSetLists(kernel_pmap);                                      /* Set number of lists this will be on */
1626
1627         mp = mapping_alloc(nlists);                                                     /* Get a spare mapping block */
1628
1629         mp->mpFlags = 0x01000000 |mpNest | mpSpecial | nlists;  /* Set the flags. Make sure busy count is 1 */
1630         mp->mpSpace = kernel_pmap->space;                                       /* Set the address space/pmap lookup ID */
1631         mp->mpBSize = 1;                                                                        /* Set the size to 2 segments */
1632         mp->mpPte = 0;                                                                          /* Means nothing */
1633         mp->mpPAddr = 0;                                                                        /* Means nothing */
1634         mp->mpVAddr = copyIOaddr;                                                       /* Set the address range we cover */
1635         mp->mpNestReloc = 0;                                                            /* Means nothing */
1636
1637         colladdr = hw_add_map(kernel_pmap, mp);                         /* Go add the mapping to the pmap */
1638
1639         if(colladdr) {                                                                          /* Did it collide? */
1640                 panic("MapUserAddressSpaceInit: MapUserAddressSpace range already mapped\n");
1641         }
1642
1643         return;
1644 }
1645
1646 /*
1647  *      addr64_t MapUserAddressSpace(vm_map_t map, vm_offset_t va, size)
1648  *
1649  *      map  = the vm_map that we are mapping into the kernel
1650  *      va = start of the address range we are mapping
1651  *      size  = size of the range.  No greater than 256MB and not 0.
1652  *      Note that we do not test validty, we chose to trust our fellows...
1653  *
1654  *      Maps a slice of a user address space into a predefined kernel range
1655  *      on a per-thread basis.  In the future, the restriction of a predefined
1656  *      range will be loosened.
1657  *
1658  *      Builds the proper linkage map to map the user range
1659  *  We will round this down to the previous segment boundary and calculate
1660  *      the relocation to the kernel slot
1661  *
1662  *      We always make a segment table entry here if we need to.  This is mainly because of
1663  *      copyin/out and if we don't, there will be multiple segment faults for
1664  *      each system call.  I have seen upwards of 30000 per second.
1665  *
1666  *      We do check, however, to see if the slice is already mapped and if so,
1667  *      we just exit.  This is done for performance reasons.  It was found that
1668  *      there was a considerable boost in copyin/out performance if we did not
1669  *      invalidate the segment at ReleaseUserAddressSpace time, so we dumped the
1670  *      restriction that you had to bracket MapUserAddressSpace.  Further, there
1671  *      is a yet further boost if you didn't need to map it each time.  The theory
1672  *      behind this is that many times copies are to or from the same segment and
1673  *      done multiple times within the same system call.  To take advantage of that,
1674  *      we check cioSpace and cioRelo to see if we've already got it.
1675  *
1676  *      We also need to half-invalidate the slice when we context switch or go
1677  *      back to user state.  A half-invalidate does not clear the actual mapping,
1678  *      but it does force the MapUserAddressSpace function to reload the segment
1679  *      register/SLBE.  If this is not done, we can end up some pretty severe
1680  *      performance penalties. If we map a slice, and the cached space/relocation is
1681  *      the same, we won't reload the segment registers.  Howver, since we ran someone else,
1682  *      our SR is cleared and we will take a fault.  This is reasonable if we block
1683  *      while copying (e.g., we took a page fault), but it is not reasonable when we
1684  *      just start.  For this reason, we half-invalidate to make sure that the SR is
1685  *      explicitly reloaded.
1686  *
1687  *      Note that we do not go to the trouble of making a pmap segment cache
1688  *      entry for these guys because they are very short term -- 99.99% of the time
1689  *      they will be unmapped before the next context switch.
1690  *
1691  */
1692
1693 addr64_t MapUserAddressSpace(vm_map_t map, addr64_t va, unsigned int size) {
1694
1695         addr64_t baddrs, reladd;
1696         thread_act_t act;
1697         mapping *mp;
1698         struct per_proc_info *perproc;
1699
1700         baddrs = va & 0xFFFFFFFFF0000000ULL;                            /* Isolate the segment */
1701         act = current_act();                                                            /* Remember our activation */
1702
1703         reladd = baddrs - copyIOaddr;                                           /* Get the relocation from user to kernel */
1704
1705         if((act->mact.cioSpace == map->pmap->space) && (act->mact.cioRelo == reladd)) { /* Already mapped? */
1706                 return ((va & 0x0FFFFFFFULL) | copyIOaddr);             /* Pass back the kernel address we are to use */
1707         }
1708
1709         disable_preemption();                                                           /* Don't move... */
1710         perproc = getPerProc();                                                         /* Get our per_proc_block */
1711
1712         mp = (mapping *)&perproc->ppCIOmp;                                      /* Make up for C */
1713         act->mact.cioRelo = reladd;                                                     /* Relocation from user to kernel */
1714         mp->mpNestReloc = reladd;                                                       /* Relocation from user to kernel */
1715
1716         act->mact.cioSpace = map->pmap->space;                          /* Set the address space/pmap lookup ID */
1717         mp->mpSpace = map->pmap->space;                                         /* Set the address space/pmap lookup ID */
1718
1719 /*
1720  *      Here we make an assumption that we are going to be using the base pmap's address space.
1721  *      If we are wrong, and that would be very, very, very rare, the fault handler will fix us up.
1722  */
1723
1724         hw_map_seg(map->pmap,  copyIOaddr, baddrs);                     /* Make the entry for the first segment */
1725
1726         enable_preemption();                                                            /* Let's move */
1727         return ((va & 0x0FFFFFFFULL) | copyIOaddr);                     /* Pass back the kernel address we are to use */
1728 }
1729
1730 /*
1731  *      void ReleaseUserAddressMapping(addr64_t kva)
1732  *
1733  *      kva = kernel address of the user copy in/out slice
1734  *
1735  */
1736
1737 void ReleaseUserAddressSpace(addr64_t kva) {
1738
1739         int i;
1740         addr64_t nextva, vend, kaddr, baddrs;
1741         unsigned int msize;
1742         thread_act_t act;
1743         mapping *mp;
1744
1745         if(kva == 0) return;                                                            /* Handle a 0 */
1746
1747         disable_preemption();                                                           /* Don't move... */
1748
1749         act = current_act();                                                            /* Remember our activation */
1750
1751         if(act->mact.cioSpace == invalSpace) {                          /* We only support one at a time */
1752                 panic("ReleaseUserAddressMapping: attempt release undefined copy in/out user address space slice\n");
1753         }
1754
1755         act->mact.cioSpace = invalSpace;                                        /* Invalidate space */
1756         mp = (mapping *)&per_proc_info[cpu_number()].ppCIOmp;   /* Make up for C */
1757         mp->mpSpace = invalSpace;                                                       /* Trash it in the per_proc as well */
1758
1759         hw_blow_seg(copyIOaddr);                                                        /* Blow off the first segment */
1760         hw_blow_seg(copyIOaddr + 0x10000000ULL);                        /* Blow off the second segment */
1761
1762         enable_preemption();                                                            /* Let's move */
1763
1764         return;                                                                                         /* Let's leave */
1765 }
1766
1767
1768
1769 /*
1770  *      kern_return_t pmap_boot_map(size)
1771  *
1772  *      size   = size of virtual address range to be mapped
1773  *
1774  *      This function is used to assign a range of virtual addresses before VM in
1775  *      initialized.  It starts at VM_MAX_KERNEL_ADDRESS and works downward.
1776  *      The variable vm_last_addr contains the current highest possible VM
1777  *      assignable address.  It is a panic to attempt to call this after VM has
1778  *      started up.  The only problem is, is that we may not have the serial or
1779  *      framebuffer mapped, so we'll never know we died.........
1780  */
1781
1782 vm_offset_t pmap_boot_map(vm_size_t size) {
1783
1784         if(kernel_map != VM_MAP_NULL) {                         /* Has VM already started? */
1785                 panic("pmap_boot_map: VM started\n");
1786         }
1787
1788         size = round_page_32(size);                                     /* Make sure this is in pages */
1789         vm_last_addr = vm_last_addr - size;                     /* Allocate the memory */
1790         return (vm_last_addr + 1);                                      /* Return the vaddr we just allocated */
1791
1792 }
1793
1794
1795
1796 /* temporary workaround */
1797 boolean_t
1798 coredumpok(vm_map_t map, vm_offset_t va)
1799 {
1800   return TRUE;
1801 }