2 * Copyright (c) 2004 Apple Computer, Inc. All rights reserved.
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
29 * Copyright (c) 1988 University of Utah.
30 * Copyright (c) 1990, 1993
31 * The Regents of the University of California. All rights reserved.
33 * This code is derived from software contributed to Berkeley by
34 * the Systems Programming Group of the University of Utah Computer
37 * Redistribution and use in source and binary forms, with or without
38 * modification, are permitted provided that the following conditions
40 * 1. Redistributions of source code must retain the above copyright
41 * notice, this list of conditions and the following disclaimer.
42 * 2. Redistributions in binary form must reproduce the above copyright
43 * notice, this list of conditions and the following disclaimer in the
44 * documentation and/or other materials provided with the distribution.
45 * 3. All advertising materials mentioning features or use of this software
46 * must display the following acknowledgement:
47 * This product includes software developed by the University of
48 * California, Berkeley and its contributors.
49 * 4. Neither the name of the University nor the names of its contributors
50 * may be used to endorse or promote products derived from this software
51 * without specific prior written permission.
53 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
54 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
55 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
56 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
57 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
58 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
59 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
60 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
61 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
62 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
65 * from: Utah Hdr: vn.c 1.13 94/04/02
67 * from: @(#)vn.c 8.6 (Berkeley) 4/1/94
68 * $FreeBSD: src/sys/dev/vn/vn.c,v 1.105.2.4 2001/11/18 07:11:00 dillon Exp $
74 * Block interface to a ramdisk.
78 #include <sys/param.h>
79 #include <sys/kernel.h>
80 #include <sys/mount.h>
81 #include <sys/namei.h>
84 #include <sys/malloc.h>
85 #include <sys/mount.h>
86 #include <sys/fcntl.h>
91 #include <sys/uio_internal.h>
92 #include <libkern/libkern.h>
95 #include <vm/vm_pager.h>
96 #include <mach/memory_object_types.h>
98 #include <miscfs/devfs/devfs.h>
101 void mdevinit(int the_cnt
);
103 static open_close_fcn_t mdevopen
;
104 static open_close_fcn_t mdevclose
;
105 static psize_fcn_t mdevsize
;
106 static strategy_fcn_t mdevstrategy
;
107 static int mdevbioctl(dev_t dev
, u_long cmd
, caddr_t data
, int flag
, struct proc
*p
);
108 static int mdevcioctl(dev_t dev
, u_long cmd
, caddr_t data
, int flag
, struct proc
*p
);
109 static int mdevrw(dev_t dev
, struct uio
*uio
, int ioflag
);
110 static char * nonspace(char *pos
, char *end
);
111 static char * getspace(char *pos
, char *end
);
112 static char * cvtnum(char *pos
, char *end
, unsigned int *num
);
114 extern void bcopy_phys(addr64_t from
, addr64_t to
, vm_size_t bytes
);
115 extern void mapping_set_mod(ppnum_t pn
);
116 extern ppnum_t
pmap_find_phys(pmap_t pmap
, addr64_t va
);
/*
 * Device switch flags:
 *	D_DISK		we want to look like a disk
 *	D_CANFREE	we support B_FREEBUF
 */
125 static struct bdevsw mdevbdevsw
= {
127 /* close */ mdevclose
,
128 /* strategy */ mdevstrategy
,
129 /* ioctl */ mdevbioctl
,
131 /* psize */ mdevsize
,
135 static struct cdevsw mdevcdevsw
= {
137 /* close */ mdevclose
,
140 /* ioctl */ mdevcioctl
,
142 /* reset */ eno_reset
,
144 /* select */ eno_select
,
146 /* strategy */ eno_strat
,
153 vm_offset_t mdBase
; /* file size in bytes */
154 uint32_t mdSize
; /* file size in bytes */
155 int mdFlags
; /* flags */
156 int mdSecsize
; /* sector size */
157 int mdBDev
; /* Block device number */
158 int mdCDev
; /* Character device number */
164 #define mdInited 0x01 /* This device defined */
165 #define mdRO 0x02 /* This device is read-only */
166 #define mdPhys 0x04 /* This device is in physical memory */
171 static int mdevioctl(dev_t dev
, u_long cmd
, caddr_t data
, int flag
, struct proc
*p
, int is_char
);
172 dev_t
mdevadd(int devid
, ppnum_t base
, unsigned int size
, int phys
);
173 dev_t
mdevlookup(int devid
);
175 static int mdevclose(__unused dev_t dev
, __unused
int flags
,
176 __unused
int devtype
, __unused
struct proc
*p
) {
181 static int mdevopen(dev_t dev
, int flags
, __unused
int devtype
, __unused
struct proc
*p
) {
185 devid
= minor(dev
); /* Get minor device number */
187 if (devid
> 16) return (ENXIO
); /* Not valid */
189 if ((flags
& FWRITE
) && (mdev
[devid
].mdFlags
& mdRO
)) return (EACCES
); /* Currently mounted RO */
194 static int mdevrw(dev_t dev
, struct uio
*uio
, __unused
int ioflag
) {
198 enum uio_seg saveflag
;
200 devid
= minor(dev
); /* Get minor device number */
202 if (devid
> 16) return (ENXIO
); /* Not valid */
203 if (!(mdev
[devid
].mdFlags
& mdInited
)) return (ENXIO
); /* Have we actually been defined yet? */
205 mdata
= ((addr64_t
)mdev
[devid
].mdBase
<< 12) + uio
->uio_offset
; /* Point to the area in "file" */
207 saveflag
= uio
->uio_segflg
; /* Remember what the request is */
209 if (IS_VALID_UIO_SEGFLG(uio
->uio_segflg
) == 0) {
210 panic("mdevrw - invalid uio_segflg\n");
212 #endif /* LP64_DEBUG */
213 /* Make sure we are moving from physical ram if physical device */
214 if (mdev
[devid
].mdFlags
& mdPhys
) {
215 if (uio
->uio_segflg
== UIO_USERSPACE64
)
216 uio
->uio_segflg
= UIO_PHYS_USERSPACE64
;
217 else if (uio
->uio_segflg
== UIO_USERSPACE32
)
218 uio
->uio_segflg
= UIO_PHYS_USERSPACE32
;
220 uio
->uio_segflg
= UIO_PHYS_USERSPACE
;
222 status
= uiomove64(mdata
, uio_resid(uio
), uio
); /* Move the data */
223 uio
->uio_segflg
= saveflag
; /* Restore the flag */
228 static void mdevstrategy(struct buf
*bp
) {
229 unsigned int left
, lop
, csize
;
230 vm_offset_t vaddr
, blkoff
;
232 addr64_t paddr
, fvaddr
;
235 devid
= minor(buf_device(bp
)); /* Get minor device number */
237 if ((mdev
[devid
].mdFlags
& mdInited
) == 0) { /* Have we actually been defined yet? */
238 buf_seterror(bp
, ENXIO
);
243 buf_setresid(bp
, buf_count(bp
)); /* Set byte count */
245 blkoff
= buf_blkno(bp
) * mdev
[devid
].mdSecsize
; /* Get offset into file */
248 * Note that reading past end is an error, but reading at end is an EOF. For these
249 * we just return with resid == count.
252 if (blkoff
>= (mdev
[devid
].mdSize
<< 12)) { /* Are they trying to read/write at/after end? */
253 if(blkoff
!= (mdev
[devid
].mdSize
<< 12)) { /* Are we trying to read after EOF? */
254 buf_seterror(bp
, EINVAL
); /* Yeah, this is an error */
256 buf_biodone(bp
); /* Return */
260 if ((blkoff
+ buf_count(bp
)) > (mdev
[devid
].mdSize
<< 12)) { /* Will this read go past end? */
261 buf_setcount(bp
, ((mdev
[devid
].mdSize
<< 12) - blkoff
)); /* Yes, trim to max */
264 * make sure the buffer's data area is
267 if (buf_map(bp
, (caddr_t
*)&vaddr
))
268 panic("ramstrategy: buf_map failed\n");
270 fvaddr
= (mdev
[devid
].mdBase
<< 12) + blkoff
; /* Point to offset into ram disk */
272 if (buf_flags(bp
) & B_READ
) { /* Is this a read? */
273 if(!(mdev
[devid
].mdFlags
& mdPhys
)) { /* Physical mapped disk? */
274 bcopy((void *)((uintptr_t)fvaddr
),
275 (void *)vaddr
, (size_t)buf_count(bp
)); /* This is virtual, just get the data */
278 left
= buf_count(bp
); /* Init the amount left to copy */
279 while(left
) { /* Go until it is all copied */
281 lop
= min((4096 - (vaddr
& 4095)), (4096 - (fvaddr
& 4095))); /* Get smallest amount left on sink and source */
282 csize
= min(lop
, left
); /* Don't move more than we need to */
284 pp
= pmap_find_phys(kernel_pmap
, (addr64_t
)((unsigned int)vaddr
)); /* Get the sink physical address */
285 if(!pp
) { /* Not found, what gives? */
286 panic("mdevstrategy: sink address %016llX not mapped\n", (addr64_t
)((unsigned int)vaddr
));
288 paddr
= (addr64_t
)(((addr64_t
)pp
<< 12) | (addr64_t
)(vaddr
& 4095)); /* Get actual address */
289 bcopy_phys(fvaddr
, paddr
, csize
); /* Copy this on in */
290 mapping_set_mod(paddr
>> 12); /* Make sure we know that it is modified */
292 left
= left
- csize
; /* Calculate what is left */
293 vaddr
= vaddr
+ csize
; /* Move to next sink address */
294 fvaddr
= fvaddr
+ csize
; /* Bump to next physical address */
298 else { /* This is a write */
299 if(!(mdev
[devid
].mdFlags
& mdPhys
)) { /* Physical mapped disk? */
300 bcopy((void *)vaddr
, (void *)((uintptr_t)fvaddr
),
301 (size_t)buf_count(bp
)); /* This is virtual, just put the data */
304 left
= buf_count(bp
); /* Init the amount left to copy */
305 while(left
) { /* Go until it is all copied */
307 lop
= min((4096 - (vaddr
& 4095)), (4096 - (fvaddr
& 4095))); /* Get smallest amount left on sink and source */
308 csize
= min(lop
, left
); /* Don't move more than we need to */
310 pp
= pmap_find_phys(kernel_pmap
, (addr64_t
)((unsigned int)vaddr
)); /* Get the source physical address */
311 if(!pp
) { /* Not found, what gives? */
312 panic("mdevstrategy: source address %016llX not mapped\n", (addr64_t
)((unsigned int)vaddr
));
314 paddr
= (addr64_t
)(((addr64_t
)pp
<< 12) | (addr64_t
)(vaddr
& 4095)); /* Get actual address */
316 bcopy_phys(paddr
, fvaddr
, csize
); /* Move this on out */
318 left
= left
- csize
; /* Calculate what is left */
319 vaddr
= vaddr
+ csize
; /* Move to next sink address */
320 fvaddr
= fvaddr
+ csize
; /* Bump to next physical address */
325 * buf_unmap takes care of all the cases
326 * it will unmap the buffer from kernel
327 * virtual space if that was the state
332 buf_setresid(bp
, 0); /* Nothing more to do */
333 buf_biodone(bp
); /* Say we've finished */
336 static int mdevbioctl(dev_t dev
, u_long cmd
, caddr_t data
, int flag
, struct proc
*p
) {
337 return (mdevioctl(dev
, cmd
, data
, flag
, p
, 0));
340 static int mdevcioctl(dev_t dev
, u_long cmd
, caddr_t data
, int flag
, struct proc
*p
) {
341 return (mdevioctl(dev
, cmd
, data
, flag
, p
, 1));
344 static int mdevioctl(dev_t dev
, u_long cmd
, caddr_t data
, __unused
int flag
,
345 struct proc
*p
, int is_char
) {
351 devid
= minor(dev
); /* Get minor device number */
353 if (devid
> 16) return (ENXIO
); /* Not valid */
355 error
= proc_suser(p
); /* Are we superman? */
356 if (error
) return (error
); /* Nope... */
359 o
= (u_int64_t
*)data
;
363 case DKIOCGETMAXBLOCKCOUNTREAD
:
367 case DKIOCGETMAXBLOCKCOUNTWRITE
:
371 case DKIOCGETMAXSEGMENTCOUNTREAD
:
375 case DKIOCGETMAXSEGMENTCOUNTWRITE
:
379 case DKIOCGETBLOCKSIZE
:
380 *f
= mdev
[devid
].mdSecsize
;
383 case DKIOCSETBLOCKSIZE
:
384 if (is_char
) return (ENODEV
); /* We can only do this for a block */
386 if (*f
< DEV_BSIZE
) return (EINVAL
); /* Too short? */
388 mdev
[devid
].mdSecsize
= *f
; /* set the new block size */
391 case DKIOCISWRITABLE
:
395 case DKIOCGETBLOCKCOUNT32
:
396 if(!(mdev
[devid
].mdFlags
& mdInited
)) return (ENXIO
);
397 *f
= ((mdev
[devid
].mdSize
<< 12) + mdev
[devid
].mdSecsize
- 1) / mdev
[devid
].mdSecsize
;
400 case DKIOCGETBLOCKCOUNT
:
401 if(!(mdev
[devid
].mdFlags
& mdInited
)) return (ENXIO
);
402 *o
= ((mdev
[devid
].mdSize
<< 12) + mdev
[devid
].mdSecsize
- 1) / mdev
[devid
].mdSecsize
;
413 static int mdevsize(dev_t dev
) {
417 devid
= minor(dev
); /* Get minor device number */
418 if (devid
> 16) return (ENXIO
); /* Not valid */
420 if ((mdev
[devid
].mdFlags
& mdInited
) == 0) return(-1); /* Not inited yet */
422 return(mdev
[devid
].mdSecsize
);
425 #include <pexpert/pexpert.h>
427 void mdevinit(__unused
int the_cnt
) {
436 ba
= PE_boot_args(); /* Get the boot arguments */
437 lp
= ba
+ 256; /* Point to the end */
439 while(1) { /* Step through, looking for our keywords */
440 phys
= 0; /* Assume virtual memory device */
441 ba
= nonspace(ba
, lp
); /* Find non-space */
442 if(ba
>= lp
) return; /* We are done if no more... */
443 if(((ba
[0] != 'v') && (ba
[0] != 'p'))
444 || (ba
[1] != 'm') || (ba
[2] != 'd') || (ba
[4] != '=')
445 || (ba
[3] < '0') || (ba
[3] > 'f')
446 || ((ba
[3] > '9') && (ba
[3] < 'a'))) { /* Is this of form "vmdx=" or "pmdx=" where x is hex digit? */
448 ba
= getspace(ba
, lp
); /* Find next white space or end */
449 continue; /* Start looking for the next one */
452 if(ba
[0] == 'p') phys
= 1; /* Set physical memory disk */
454 devid
= ba
[3] & 0xF; /* Assume digit */
455 if(ba
[3] > '9') devid
+= 9; /* Adjust for hex digits */
457 ba
= &ba
[5]; /* Step past keyword */
458 ba
= cvtnum(ba
, lp
, &base
); /* Convert base of memory disk */
459 if(ba
>= lp
) return; /* Malformed one at the end, leave */
460 if(ba
[0] != '.') continue; /* If not length separater, try next... */
461 if(base
& 0xFFF) continue; /* Only allow page aligned stuff */
463 ba
++; /* Step past '.' */
464 ba
= cvtnum(ba
, lp
, &size
); /* Try to convert it */
465 if(!size
|| (size
& 0xFFF)) continue; /* Allow only non-zer page size multiples */
466 if(ba
< lp
) { /* If we are not at end, check end character */
467 if((ba
[0] != ' ') && (ba
[0] != 0)) continue; /* End must be null or space */
470 dev
= mdevadd(devid
, base
>> 12, size
>> 12, phys
); /* Go add the device */
/*
 * Find the next character that is not a space.
 *
 * Returns end when pos is already at or past end, when pos points at a
 * NUL, or when only spaces remain before end; otherwise returns a
 * pointer to the first non-space character at or after pos.  A NUL that
 * follows one or more spaces counts as a non-space and is returned as
 * found.
 */
char *nonspace(char *pos, char *end) {
	char *scan;

	if ((pos >= end) || (*pos == 0)) return end;		/* Nothing to look at */

	for (scan = pos; *scan == ' '; ) {			/* Skip over the spaces */
		scan++;
		if (scan >= end) return end;			/* Ran off the end */
	}
	return scan;						/* Found one */
}
/*
 * Find the next space.
 *
 * Returns a pointer to the first space at or after pos.  Returns end
 * when a NUL is met first or when end is reached without finding one.
 */
char *getspace(char *pos, char *end) {
	char *scan;

	for (scan = pos; scan < end; scan++) {			/* Don't go past end */
		if (*scan == 0) return end;			/* Leave if we hit null */
		if (*scan == ' ') return scan;			/* Leave if we found one */
	}
	return end;
}
/*
 * Convert the unsigned number at pos and store it in *num.
 *
 * A leading "0x" or "0X" selects hexadecimal (digits 0-9, a-f, A-F);
 * otherwise the number is decimal.  Conversion stops at the first
 * character that is not a digit of the selected radix.  The value wraps
 * modulo the range of unsigned int on overflow.
 *
 * Returns a pointer to the character that stopped the conversion, or
 * end when the conversion ran into a NUL or reached end.  *num is always
 * written; it is 0 when no digit was converted.
 *
 * Changes from the previous version:
 * - an upper-case "0X" prefix is accepted (the test compared against
 *   'x' twice);
 * - pos[1] is only examined when it lies before end.
 */
char *cvtnum(char *pos, char *end, unsigned int *num) {

	unsigned int rad, dig;

	*num = 0;						/* Set answer to 0 to start */
	rad = 10;						/* Assume decimal */

	if (pos >= end) return end;				/* Don't go past end */
	if (pos[0] == 0) return end;				/* If at null, make end */

	if (((end - pos) >= 2) && (pos[0] == '0')
	 && ((pos[1] == 'x') || (pos[1] == 'X'))) {		/* A hex constant? */
		rad = 16;
		pos += 2;					/* Point to the number */
	}

	while (1) {						/* Convert it */

		if (pos >= end) return end;			/* Don't go past end */
		if (pos[0] == 0) return end;			/* If at null, make end */
		if (pos[0] < '0') return pos;			/* Leave if non-digit */
		dig = pos[0] & 0xF;				/* Extract digit */
		if (pos[0] > '9') {				/* Is it bigger than 9? */
			if (rad == 10) return pos;		/* Leave if not base 10 */
			if (!(((pos[0] >= 'A') && (pos[0] <= 'F'))
			   || ((pos[0] >= 'a') && (pos[0] <= 'f')))) return pos;	/* Leave if bogus char */
			dig = dig + 9;				/* Adjust for character */
		}
		*num = (*num * rad) + dig;			/* Accumulate the number */
		pos++;						/* Step on */
	}
}
531 dev_t
mdevadd(int devid
, ppnum_t base
, unsigned int size
, int phys
) {
538 for(i
= 0; i
< 16; i
++) { /* Search all known memory devices */
539 if(!(mdev
[i
].mdFlags
& mdInited
)) { /* Is this a free one? */
540 if(devid
< 0)devid
= i
; /* Remember first free one */
541 continue; /* Skip check */
543 if(!(((base
+ size
-1 ) < mdev
[i
].mdBase
) || ((mdev
[i
].mdBase
+ mdev
[i
].mdSize
- 1) < base
))) { /* Is there any overlap? */
544 panic("mdevadd: attempt to add overlapping memory device at %08X-%08X\n", mdev
[i
].mdBase
, mdev
[i
].mdBase
+ mdev
[i
].mdSize
- 1);
547 if(devid
< 0) { /* Do we have free slots? */
548 panic("mdevadd: attempt to add more than 16 memory devices\n");
552 if(devid
>= 16) { /* Giving us something bogus? */
553 panic("mdevadd: attempt to explicitly add a bogus memory device: &08X\n", devid
);
555 if(mdev
[devid
].mdFlags
&mdInited
) { /* Already there? */
556 panic("mdevadd: attempt to explicitly add a previously defined memory device: &08X\n", devid
);
560 if(mdevBMajor
< 0) { /* Have we gotten a major number yet? */
561 mdevBMajor
= bdevsw_add(-1, &mdevbdevsw
); /* Add to the table and figure out a major number */
562 if (mdevBMajor
< 0) {
563 printf("mdevadd: error - bdevsw_add() returned %d\n", mdevBMajor
);
568 if(mdevCMajor
< 0) { /* Have we gotten a major number yet? */
569 mdevCMajor
= cdevsw_add_with_bdev(-1, &mdevcdevsw
, mdevBMajor
); /* Add to the table and figure out a major number */
570 if (mdevCMajor
< 0) {
571 printf("ramdevice_init: error - cdevsw_add() returned %d\n", mdevCMajor
);
576 mdev
[devid
].mdBDev
= makedev(mdevBMajor
, devid
); /* Get the device number */
577 mdev
[devid
].mdbdevb
= devfs_make_node(mdev
[devid
].mdBDev
, DEVFS_BLOCK
, /* Make the node */
578 UID_ROOT
, GID_OPERATOR
,
579 0600, "md%d", devid
);
580 if (mdev
[devid
].mdbdevb
== NULL
) { /* Did we make one? */
581 printf("mdevadd: devfs_make_node for block failed!\n");
582 return -1; /* Nope... */
585 mdev
[devid
].mdCDev
= makedev(mdevCMajor
, devid
); /* Get the device number */
586 mdev
[devid
].mdcdevb
= devfs_make_node(mdev
[devid
].mdCDev
, DEVFS_CHAR
, /* Make the node */
587 UID_ROOT
, GID_OPERATOR
,
588 0600, "rmd%d", devid
);
589 if (mdev
[devid
].mdcdevb
== NULL
) { /* Did we make one? */
590 printf("mdevadd: devfs_make_node for character failed!\n");
591 return -1; /* Nope... */
594 mdev
[devid
].mdBase
= base
; /* Set the base address of ram disk */
595 mdev
[devid
].mdSize
= size
; /* Set the length of the ram disk */
596 mdev
[devid
].mdSecsize
= DEV_BSIZE
; /* Set starting block size */
597 if(phys
) mdev
[devid
].mdFlags
|= mdPhys
; /* Show that we are in physical memory */
598 mdev
[devid
].mdFlags
|= mdInited
; /* Show we are all set up */
599 printf("Added memory device md%x/rmd%x (%08X/%08X) at %08X for %08X\n",
600 devid
, devid
, mdev
[devid
].mdBDev
, mdev
[devid
].mdCDev
, base
<< 12, size
<< 12);
601 return mdev
[devid
].mdBDev
;
605 dev_t
mdevlookup(int devid
) {
607 if((devid
< 0) || (devid
> 15)) return -1; /* Filter any bogus requests */
608 if(!(mdev
[devid
].mdFlags
& mdInited
)) return -1; /* This one hasn't been defined */
609 return mdev
[devid
].mdBDev
; /* Return the device number */