2 * Copyright (c) 1988 University of Utah.
3 * Copyright (c) 1990, 1993
4 * The Regents of the University of California. All rights reserved.
6 * This code is derived from software contributed to Berkeley by
7 * the Systems Programming Group of the University of Utah Computer
10 * Redistribution and use in source and binary forms, with or without
11 * modification, are permitted provided that the following conditions
13 * 1. Redistributions of source code must retain the above copyright
14 * notice, this list of conditions and the following disclaimer.
15 * 2. Redistributions in binary form must reproduce the above copyright
16 * notice, this list of conditions and the following disclaimer in the
17 * documentation and/or other materials provided with the distribution.
18 * 3. All advertising materials mentioning features or use of this software
19 * must display the following acknowledgement:
20 * This product includes software developed by the University of
21 * California, Berkeley and its contributors.
22 * 4. Neither the name of the University nor the names of its contributors
23 * may be used to endorse or promote products derived from this software
24 * without specific prior written permission.
26 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
27 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
28 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
29 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
30 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
31 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
32 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
33 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
34 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
35 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
38 * from: Utah Hdr: vn.c 1.13 94/04/02
40 * from: @(#)vn.c 8.6 (Berkeley) 4/1/94
41 * $FreeBSD: src/sys/dev/vn/vn.c,v 1.105.2.4 2001/11/18 07:11:00 dillon Exp $
47 * Block interface to a ramdisk.
52 #include <sys/param.h>
53 #include <sys/systm.h>
54 #include <sys/kernel.h>
55 #include <sys/mount.h>
56 #include <sys/namei.h>
59 #include <sys/malloc.h>
60 #include <sys/mount.h>
61 #include <sys/vnode.h>
62 #include <sys/fcntl.h>
69 #include <vm/vm_pager.h>
70 #include <vm/vm_pageout.h>
71 #include <mach/memory_object_types.h>
73 #include <miscfs/devfs/devfs.h>
75 static open_close_fcn_t mdevopen
;
76 static open_close_fcn_t mdevclose
;
77 static psize_fcn_t mdevsize
;
78 static strategy_fcn_t mdevstrategy
;
79 static int mdevbioctl(dev_t dev
, u_long cmd
, caddr_t data
, int flag
, struct proc
*p
);
80 static int mdevcioctl(dev_t dev
, u_long cmd
, caddr_t data
, int flag
, struct proc
*p
);
81 static int mdevrw(dev_t dev
, struct uio
*uio
, int ioflag
);
82 static char *nonspace(char *pos
, char *end
);
83 static char *getspace(char *pos
, char *end
);
84 static char *cvtnum(char *pos
, char *end
, unsigned int *num
);
88 * D_DISK we want to look like a disk
89 * D_CANFREE We support B_FREEBUF
92 static struct bdevsw mdevbdevsw
= {
94 /* close */ mdevclose
,
95 /* strategy */ mdevstrategy
,
96 /* ioctl */ mdevbioctl
,
102 static struct cdevsw mdevcdevsw
= {
104 /* close */ mdevclose
,
107 /* ioctl */ mdevcioctl
,
109 /* reset */ eno_reset
,
111 /* select */ eno_select
,
113 /* strategy */ eno_strat
,
120 vm_offset_t mdBase
; /* base of the ram disk as a page number (shifted left by 12 to form an address) */
121 uint32_t mdSize
; /* size of the ram disk in 4096-byte pages (shifted left by 12 to form a byte count) */
122 int mdFlags
; /* flags */
123 int mdSecsize
; /* sector size */
124 int mdBDev
; /* Block device number */
125 int mdCDev
; /* Character device number */
131 #define mdInited 0x01 /* This device defined */
132 #define mdRO 0x02 /* This device is read-only */
133 #define mdPhys 0x04 /* This device is in physical memory */
138 static int mdevioctl(dev_t dev
, u_long cmd
, caddr_t data
, int flag
, struct proc
*p
, int is_char
);
139 dev_t
mdevadd(int devid
, ppnum_t base
, unsigned int size
, int phys
);
140 dev_t
mdevlookup(int devid
);
142 static int mdevclose(dev_t dev
, int flags
, int devtype
, struct proc
*p
) {
146 static int mdevopen(dev_t dev
, int flags
, int devtype
, struct proc
*p
) {
150 devid
= minor(dev
); /* Get minor device number */
152 if (devid
> 16) return (ENXIO
); /* Not valid */
154 if ((flags
& FWRITE
) && (mdev
[devid
].mdFlags
& mdRO
)) return (EACCES
); /* Currently mounted RO */
159 static int mdevrw(dev_t dev
, struct uio
*uio
, int ioflag
) {
164 enum uio_seg saveflag
;
166 devid
= minor(dev
); /* Get minor device number */
168 if (devid
> 16) return (ENXIO
); /* Not valid */
169 if (!(mdev
[devid
].mdFlags
& mdInited
)) return (ENXIO
); /* Have we actually been defined yet? */
171 mdata
= ((addr64_t
)mdev
[devid
].mdBase
<< 12) + uio
->uio_offset
; /* Point to the area in "file" */
173 saveflag
= uio
->uio_segflg
; /* Remember what the request is */
174 if (mdev
[devid
].mdFlags
& mdPhys
) uio
->uio_segflg
= UIO_PHYS_USERSPACE
; /* Make sure we are moving from physical ram if physical device */
175 status
= uiomove64(mdata
, uio
->uio_resid
, uio
); /* Move the data */
176 uio
->uio_segflg
= saveflag
; /* Restore the flag */
/*
 * mdevstrategy - block I/O entry point: copy between a buf and the ram disk.
 *
 * The device slot is the minor number of bp->b_dev.  A request against a
 * slot that is not flagged mdInited is marked B_ERROR.  The byte offset into
 * the disk is b_blkno * mdSecsize.  A request that starts beyond the end of
 * the disk gets EINVAL with B_ERROR | B_INVAL; a request that would cross the
 * end has b_bcount trimmed to what is left.
 *
 * The caller's buffer address is bp->b_data, or, when B_VECTORLIST is set,
 * either an address that is already mapped (tbuf->b_data) or one obtained
 * from ubc_upl_map() (unmapped again before completion), plus b_uploffset.
 *
 * For a device without mdPhys the whole transfer is a single bcopy().  For an
 * mdPhys device the transfer is done in pieces that never cross a 4096-byte
 * boundary on either side: the buffer address is translated with
 * pmap_find_phys() and the piece is moved with bcopy_phys().  After a read
 * the destination page is flagged with mapping_set_mod().
 *
 * On completion b_resid is set to 0 and biodone() is called.
 *
 * NOTE(review): no range check on devid is visible before mdev[devid] is
 * indexed, unlike the other entry points.
 * NOTE(review): mdSize is a uint32_t, so "mdSize << 12" presumably wraps for
 * disks of 4 GB or more - confirm the intended maximum size.
 * NOTE(review): "vaddr = vaddr += bp->b_uploffset" modifies vaddr twice in
 * one expression; a plain "vaddr += bp->b_uploffset" states the same intent.
 * NOTE(review): the "Physical mapped disk?" comments sit on a negated mdPhys
 * test, so the branch they annotate is the virtual (bcopy) one.
 * NOTE(review): the ubc_upl_map panic text names "ramstrategy", not this
 * function.
 */
181 static void mdevstrategy(struct buf
*bp
) {
183 unsigned int sz
, left
, lop
, csize
;
185 vm_offset_t vaddr
, blkoff
;
188 addr64_t paddr
, fvaddr
;
191 devid
= minor(bp
->b_dev
); /* Get minor device number */
193 if ((mdev
[devid
].mdFlags
& mdInited
) == 0) { /* Have we actually been defined yet? */
195 bp
->b_flags
|= B_ERROR
;
200 bp
->b_resid
= bp
->b_bcount
; /* Set byte count */
202 blkoff
= bp
->b_blkno
* mdev
[devid
].mdSecsize
; /* Get offset into file */
205 * Note that reading past end is an error, but reading at end is an EOF. For these
206 * we just return with b_resid == b_bcount.
209 if (blkoff
>= (mdev
[devid
].mdSize
<< 12)) { /* Are they trying to read/write at/after end? */
210 if(blkoff
!= (mdev
[devid
].mdSize
<< 12)) { /* Are we trying to read after EOF? */
211 bp
->b_error
= EINVAL
; /* Yeah, this is an error */
212 bp
->b_flags
|= B_ERROR
| B_INVAL
;
214 biodone(bp
); /* Return */
218 if ((blkoff
+ bp
->b_bcount
) > (mdev
[devid
].mdSize
<< 12)) { /* Will this read go past end? */
219 bp
->b_bcount
= ((mdev
[devid
].mdSize
<< 12) - blkoff
); /* Yes, trim to max */
222 vaddr
= 0; /* Assume not mapped yet */
225 if (bp
->b_flags
& B_VECTORLIST
) { /* Do we have a list of UPLs? */
226 tbuf
= (struct buf
*)bp
->b_real_bp
; /* Get this for C's inadequacies */
227 if((bp
->b_flags
& B_NEED_IODONE
) && /* If we have a UPL, is it already mapped? */
230 vaddr
= tbuf
->b_data
; /* We already have this mapped in, get base address */
232 else { /* Not mapped yet */
233 ret
= ubc_upl_map(bp
->b_pagelist
, &vaddr
); /* Map it in */
234 if(ret
!= KERN_SUCCESS
) panic("ramstrategy: ubc_upl_map failed, rc = %08X\n", ret
);
235 unmap
= 1; /* Remember to unmap later */
237 vaddr
= vaddr
+= bp
->b_uploffset
; /* Calculate actual vaddr */
239 else vaddr
= bp
->b_data
; /* No UPL, we already have address */
241 fvaddr
= (mdev
[devid
].mdBase
<< 12) + blkoff
; /* Point to offset into ram disk */
243 if(bp
->b_flags
& B_READ
) { /* Is this a read? */
244 if(!(mdev
[devid
].mdFlags
& mdPhys
)) { /* Physical mapped disk? */
245 bcopy((void *)fvaddr
, (void *)vaddr
, bp
->b_bcount
); /* This is virtual, just get the data */
248 left
= bp
->b_bcount
; /* Init the amount left to copy */
249 while(left
) { /* Go until it is all copied */
251 lop
= min((4096 - (vaddr
& 4095)), (4096 - (fvaddr
& 4095))); /* Get smallest amount left on sink and source */
252 csize
= min(lop
, left
); /* Don't move more than we need to */
254 pp
= pmap_find_phys(kernel_pmap
, (addr64_t
)((unsigned int)vaddr
)); /* Get the sink physical address */
255 if(!pp
) { /* Not found, what gives? */
256 panic("mdevstrategy: sink address %016llX not mapped\n", (addr64_t
)((unsigned int)vaddr
));
258 paddr
= (addr64_t
)(((addr64_t
)pp
<< 12) | (addr64_t
)(vaddr
& 4095)); /* Get actual address */
259 bcopy_phys(fvaddr
, paddr
, csize
); /* Copy this on in */
260 mapping_set_mod(paddr
>> 12); /* Make sure we know that it is modified */
262 left
= left
- csize
; /* Calculate what is left */
263 vaddr
= vaddr
+ csize
; /* Move to next sink address */
264 fvaddr
= fvaddr
+ csize
; /* Bump to next physical address */
268 else { /* This is a write */
269 if(!(mdev
[devid
].mdFlags
& mdPhys
)) { /* Physical mapped disk? */
270 bcopy((void *)vaddr
, (void *)fvaddr
, bp
->b_bcount
); /* This is virtual, just put the data */
273 left
= bp
->b_bcount
; /* Init the amount left to copy */
274 while(left
) { /* Go until it is all copied */
276 lop
= min((4096 - (vaddr
& 4095)), (4096 - (fvaddr
& 4095))); /* Get smallest amount left on sink and source */
277 csize
= min(lop
, left
); /* Don't move more than we need to */
279 pp
= pmap_find_phys(kernel_pmap
, (addr64_t
)((unsigned int)vaddr
)); /* Get the source physical address */
280 if(!pp
) { /* Not found, what gives? */
281 panic("mdevstrategy: source address %016llX not mapped\n", (addr64_t
)((unsigned int)vaddr
));
283 paddr
= (addr64_t
)(((addr64_t
)pp
<< 12) | (addr64_t
)(vaddr
& 4095)); /* Get actual address */
285 bcopy_phys(paddr
, fvaddr
, csize
); /* Move this on out */
287 left
= left
- csize
; /* Calculate what is left */
288 vaddr
= vaddr
+ csize
; /* Move to next sink address */
289 fvaddr
= fvaddr
+ csize
; /* Bump to next physical address */
294 if (unmap
) { /* Do we need to unmap this? */
295 ubc_upl_unmap(bp
->b_pagelist
); /* Yes, unmap it */
298 bp
->b_resid
= 0; /* Nothing more to do */
299 biodone(bp
); /* Say we've finished */
302 static int mdevbioctl(dev_t dev
, u_long cmd
, caddr_t data
, int flag
, struct proc
*p
) {
303 return (mdevioctl(dev
, cmd
, data
, flag
, p
, 0));
306 static int mdevcioctl(dev_t dev
, u_long cmd
, caddr_t data
, int flag
, struct proc
*p
) {
307 return (mdevioctl(dev
, cmd
, data
, flag
, p
, 1));
/*
 * mdevioctl - common ioctl handler behind mdevbioctl() and mdevcioctl().
 *
 *	dev	device number; its minor number selects the memory device slot
 *	cmd	one of the DKIOC* requests handled by the cases below
 *	data	request argument; accessed as a u_int64_t through "o" and
 *		through "f" (presumably a 32-bit view of the same pointer -
 *		its assignment is not among the statements below)
 *	flag	not referenced by the statements below
 *	p	calling process, used for the suser() privilege check
 *	is_char	non-zero when called for the character device
 *
 * Returns ENXIO for an out-of-range minor number, or the suser() error when
 * the caller is not privileged.  Per request:
 *   DKIOCGETBLOCKSIZE     stores mdSecsize in *f
 *   DKIOCSETBLOCKSIZE     ENODEV on the character device, EINVAL when *f is
 *                         below DEV_BSIZE, otherwise *f becomes mdSecsize
 *   DKIOCGETBLOCKCOUNT32  ENXIO if the device is not defined, else *f gets
 *                         the disk size in mdSecsize units, rounded up
 *   DKIOCGETBLOCKCOUNT64  as above, stored in *o
 *
 * NOTE(review): "devid > 16" lets 16 through, while mdevadd() and
 * mdevlookup() treat 0..15 as the valid range; ">= 16" looks intended.
 * NOTE(review): the block counts use "mdSize << 12" on a uint32_t, which
 * presumably wraps for disks of 4 GB or more, including in the 64-bit case.
 */
310 static int mdevioctl(dev_t dev
, u_long cmd
, caddr_t data
, int flag
, struct proc
*p
, int is_char
) {
317 devid
= minor(dev
); /* Get minor device number */
319 if (devid
> 16) return (ENXIO
); /* Not valid */
321 error
= suser(p
->p_ucred
, &p
->p_acflag
); /* Are we superman? */
322 if (error
) return (error
); /* Nope... */
325 o
= (u_int64_t
*)data
;
329 case DKIOCGETMAXBLOCKCOUNTREAD
:
333 case DKIOCGETMAXBLOCKCOUNTWRITE
:
337 case DKIOCGETMAXSEGMENTCOUNTREAD
:
341 case DKIOCGETMAXSEGMENTCOUNTWRITE
:
345 case DKIOCGETBLOCKSIZE
:
346 *f
= mdev
[devid
].mdSecsize
;
349 case DKIOCSETBLOCKSIZE
:
350 if (is_char
) return (ENODEV
); /* We can only do this for a block */
352 if (*f
< DEV_BSIZE
) return (EINVAL
); /* Too short? */
354 mdev
[devid
].mdSecsize
= *f
; /* set the new block size */
357 case DKIOCISWRITABLE
:
361 case DKIOCGETBLOCKCOUNT32
:
362 if(!(mdev
[devid
].mdFlags
& mdInited
)) return (ENXIO
);
363 *f
= ((mdev
[devid
].mdSize
<< 12) + mdev
[devid
].mdSecsize
- 1) / mdev
[devid
].mdSecsize
;
366 case DKIOCGETBLOCKCOUNT64
:
367 if(!(mdev
[devid
].mdFlags
& mdInited
)) return (ENXIO
);
368 *o
= ((mdev
[devid
].mdSize
<< 12) + mdev
[devid
].mdSecsize
- 1) / mdev
[devid
].mdSecsize
;
379 static int mdevsize(dev_t dev
) {
383 devid
= minor(dev
); /* Get minor device number */
384 if (devid
> 16) return (ENXIO
); /* Not valid */
386 if ((mdev
[devid
].mdFlags
& mdInited
) == 0) return(-1); /* Not inited yet */
388 return(mdev
[devid
].mdSecsize
);
/*
 * mdevinit - define memory devices named in the boot arguments.
 *
 *	cnt	not referenced by the statements below
 *
 * Walks the string returned by PE_boot_args(), looking no further than 256
 * bytes from its start, for space-separated entries of the form
 *
 *	vmdX=base.size		or	pmdX=base.size
 *
 * where X is a single hex digit (0-9 or lower-case a-f) giving the device
 * id, "v" selects a virtual and "p" a physical memory device, and base and
 * size are numbers converted by cvtnum().  Both numbers must be multiples of
 * 0x1000, size must be non-zero, and the entry must be followed by a space,
 * a NUL or the end of the scanned area.  Entries that do not match are
 * skipped.  Each accepted entry is handed to mdevadd() with base and size
 * converted to page counts (>> 12).
 *
 * NOTE(review): the keyword test reads ba[1]..ba[4] without first checking
 * that those positions lie below lp.
 */
392 void mdevinit(int cnt
) {
401 ba
= PE_boot_args(); /* Get the boot arguments */
402 lp
= ba
+ 256; /* Point to the end */
404 while(1) { /* Step through, looking for our keywords */
405 phys
= 0; /* Assume virtual memory device */
406 ba
= nonspace(ba
, lp
); /* Find non-space */
407 if(ba
>= lp
) return; /* We are done if no more... */
408 if(((ba
[0] != 'v') && (ba
[0] != 'p'))
409 || (ba
[1] != 'm') || (ba
[2] != 'd') || (ba
[4] != '=')
410 || (ba
[3] < '0') || (ba
[3] > 'f')
411 || ((ba
[3] > '9') && (ba
[3] < 'a'))) { /* Is this of form "vmdx=" or "pmdx=" where x is hex digit? */
413 ba
= getspace(ba
, lp
); /* Find next white space or end */
414 continue; /* Start looking for the next one */
417 if(ba
[0] == 'p') phys
= 1; /* Set physical memory disk */
419 devid
= ba
[3] & 0xF; /* Assume digit */
420 if(ba
[3] > '9') devid
+= 9; /* Adjust for hex digits */
422 ba
= &ba
[5]; /* Step past keyword */
423 ba
= cvtnum(ba
, lp
, &base
); /* Convert base of memory disk */
424 if(ba
>= lp
) return; /* Malformed one at the end, leave */
425 if(ba
[0] != '.') continue; /* If not length separator, try next... */
426 if(base
& 0xFFF) continue; /* Only allow page aligned stuff */
428 ba
++; /* Step past '.' */
429 ba
= cvtnum(ba
, lp
, &size
); /* Try to convert it */
430 if(!size
|| (size
& 0xFFF)) continue; /* Allow only non-zero page size multiples */
431 if(ba
< lp
) { /* If we are not at end, check end character */
432 if((ba
[0] != ' ') && (ba
[0] != 0)) continue; /* End must be null or space */
435 dev
= mdevadd(devid
, base
>> 12, size
>> 12, phys
); /* Go add the device */
/*
 * nonspace - find the next character that is not a space.
 *
 *	pos	where to start looking
 *	end	one past the last character that may be examined
 *
 * Returns a pointer to the first character in [pos, end) that is not ' ',
 * or end when pos is already at or beyond end, when only spaces remain, or
 * when a NUL is reached first.  A NUL always means "nothing more here",
 * whether it is the first character or follows leading spaces.
 */
char *nonspace(char *pos, char *end) {

	while ((pos < end) && (pos[0] != 0)) {		/* Stay inside the area and the string */
		if (pos[0] != ' ') return pos;		/* Leave if we found one */
		pos++;					/* Step over the space */
	}

	return end;					/* Ran off the end or hit the null */
}
/*
 * getspace - find the next space.
 *
 *	pos	where to start looking
 *	end	one past the last character that may be examined
 *
 * Returns a pointer to the first ' ' in [pos, end), or end when pos is at or
 * beyond end, when a NUL is reached first, or when no space is found.
 */
char *getspace(char *pos, char *end) {

	for (; pos < end; pos++) {			/* Don't go past end */
		if (pos[0] == 0) return end;		/* Leave if we hit null */
		if (pos[0] == ' ') return pos;		/* Leave if we found one */
	}

	return end;					/* No space before the end */
}
/*
 * cvtnum - convert a decimal or hexadecimal number.
 *
 *	pos	first character of the number
 *	end	one past the last character that may be examined
 *	num	receives the converted value; always written, 0 if no digits
 *
 * A leading "0x" or "0X" selects base 16 (digits 0-9, a-f, A-F); otherwise
 * the number is base 10.  Conversion stops at the first character that is
 * not a digit of the selected base.
 *
 * Returns a pointer to the character that stopped the conversion, or end
 * when the area was exhausted or a NUL was reached.  The value wraps
 * silently if it does not fit in an unsigned int.
 */
char *cvtnum(char *pos, char *end, unsigned int *num) {

	unsigned int rad, dig;

	*num = 0;							/* Set answer to 0 to start */
	rad = 10;							/* Assume decimal */

	if (pos >= end) return end;					/* Don't go past end */
	if (pos[0] == 0) return end;					/* If at null, make end */

	/* Only look at the second prefix character if it is inside the area */
	if (((pos + 1) < end) && (pos[0] == '0')
	    && ((pos[1] == 'x') || (pos[1] == 'X'))) {			/* A hex constant? */
		rad = 16;						/* Switch to hex */
		pos += 2;						/* Point to the number */
	}

	while (1) {							/* Convert it */

		if (pos >= end) return end;				/* Don't go past end */
		if (pos[0] == 0) return end;				/* If at null, make end */
		if (pos[0] < '0') return pos;				/* Leave if non-digit */
		dig = pos[0] & 0xF;					/* Extract digit */
		if (pos[0] > '9') {					/* Is it bigger than 9? */
			if (rad == 10) return pos;			/* Leave if not base 16 */
			if (!(((pos[0] >= 'A') && (pos[0] <= 'F'))
			    || ((pos[0] >= 'a') && (pos[0] <= 'f')))) return pos;	/* Leave if bogus char */
			dig = dig + 9;					/* 'A'/'a' have low nibble 1, so +9 gives 10..15 */
		}
		*num = (*num * rad) + dig;				/* Accumulate the number */
		pos++;							/* Step to the next character */
	}
}
/*
 * mdevadd - define a memory device and create its device nodes.
 *
 *	devid	slot to use; a negative value is replaced by the first slot
 *		found free while scanning the 16-entry table
 *	base	start of the ram disk, as a page number (stored in mdBase and
 *		shifted left by 12 wherever an address is needed)
 *	size	length of the ram disk in pages (stored in mdSize)
 *	phys	non-zero marks the device mdPhys (physical memory)
 *
 * Panics when the new range overlaps a device that is already defined, when
 * no slot is free, when devid is 16 or more, or when the requested slot is
 * already defined.
 *
 * The block and character major numbers are obtained once, through
 * bdevsw_add() and cdevsw_add_with_bdev(), and kept in mdevBMajor and
 * mdevCMajor.  Two devfs nodes are then made for the slot, "md<devid>"
 * (block) and "rmd<devid>" (character), owned by UID_ROOT/GID_OPERATOR with
 * mode 0600.
 *
 * Returns the block device number on success, or -1 if either devfs node
 * could not be made.  The slot starts out with a sector size of DEV_BSIZE
 * and is flagged mdInited last.
 *
 * NOTE(review): the two "explicitly add" panic strings contain "&08X",
 * which looks like a typo for "%08X"; as written devid is never formatted.
 * NOTE(review): the character-side failure message names "ramdevice_init"
 * and "cdevsw_add()", but the call made is cdevsw_add_with_bdev() from this
 * function.
 * NOTE(review): when a devfs node cannot be made, -1 is returned without any
 * visible undo of the work already done - confirm that is intended.
 */
496 dev_t
mdevadd(int devid
, ppnum_t base
, unsigned int size
, int phys
) {
503 for(i
= 0; i
< 16; i
++) { /* Search all known memory devices */
504 if(!(mdev
[i
].mdFlags
& mdInited
)) { /* Is this a free one? */
505 if(devid
< 0)devid
= i
; /* Remember first free one */
506 continue; /* Skip check */
508 if(!(((base
+ size
-1 ) < mdev
[i
].mdBase
) || ((mdev
[i
].mdBase
+ mdev
[i
].mdSize
- 1) < base
))) { /* Is there any overlap? */
509 panic("mdevadd: attempt to add overlapping memory device at %08X-%08X\n", mdev
[i
].mdBase
, mdev
[i
].mdBase
+ mdev
[i
].mdSize
- 1);
512 if(devid
< 0) { /* Do we have free slots? */
513 panic("mdevadd: attempt to add more than 16 memory devices\n");
517 if(devid
>= 16) { /* Giving us something bogus? */
518 panic("mdevadd: attempt to explicitly add a bogus memory device: &08X\n", devid
);
520 if(mdev
[devid
].mdFlags
&mdInited
) { /* Already there? */
521 panic("mdevadd: attempt to explicitly add a previously defined memory device: &08X\n", devid
);
525 if(mdevBMajor
< 0) { /* Have we gotten a major number yet? */
526 mdevBMajor
= bdevsw_add(-1, &mdevbdevsw
); /* Add to the table and figure out a major number */
527 if (mdevBMajor
< 0) {
528 printf("mdevadd: error - bdevsw_add() returned %d\n", mdevBMajor
);
533 if(mdevCMajor
< 0) { /* Have we gotten a major number yet? */
534 mdevCMajor
= cdevsw_add_with_bdev(-1, &mdevcdevsw
, mdevBMajor
); /* Add to the table and figure out a major number */
535 if (mdevCMajor
< 0) {
536 printf("ramdevice_init: error - cdevsw_add() returned %d\n", mdevCMajor
);
541 mdev
[devid
].mdBDev
= makedev(mdevBMajor
, devid
); /* Get the device number */
542 mdev
[devid
].mdbdevb
= devfs_make_node(mdev
[devid
].mdBDev
, DEVFS_BLOCK
, /* Make the node */
543 UID_ROOT
, GID_OPERATOR
,
544 0600, "md%d", devid
);
545 if (mdev
[devid
].mdbdevb
== NULL
) { /* Did we make one? */
546 printf("mdevadd: devfs_make_node for block failed!\n");
547 return -1; /* Nope... */
550 mdev
[devid
].mdCDev
= makedev(mdevCMajor
, devid
); /* Get the device number */
551 mdev
[devid
].mdcdevb
= devfs_make_node(mdev
[devid
].mdCDev
, DEVFS_CHAR
, /* Make the node */
552 UID_ROOT
, GID_OPERATOR
,
553 0600, "rmd%d", devid
);
554 if (mdev
[devid
].mdcdevb
== NULL
) { /* Did we make one? */
555 printf("mdevadd: devfs_make_node for character failed!\n");
556 return -1; /* Nope... */
559 mdev
[devid
].mdBase
= base
; /* Set the base address of ram disk */
560 mdev
[devid
].mdSize
= size
; /* Set the length of the ram disk */
561 mdev
[devid
].mdSecsize
= DEV_BSIZE
; /* Set starting block size */
562 if(phys
) mdev
[devid
].mdFlags
|= mdPhys
; /* Show that we are in physical memory */
563 mdev
[devid
].mdFlags
|= mdInited
; /* Show we are all set up */
564 printf("Added memory device md%x/rmd%x (%08X/%08X) at %08X for %08X\n",
565 devid
, devid
, mdev
[devid
].mdBDev
, mdev
[devid
].mdCDev
, base
<< 12, size
<< 12);
566 return mdev
[devid
].mdBDev
;
570 dev_t
mdevlookup(int devid
) {
572 if((devid
< 0) || (devid
> 15)) return -1; /* Filter any bogus requests */
573 if(!(mdev
[devid
].mdFlags
& mdInited
)) return -1; /* This one hasn't been defined */
574 return mdev
[devid
].mdBDev
; /* Return the device number */