]>
Commit | Line | Data |
---|---|---|
1c79356b A |
1 | /* |
2 | * Copyright (c) 2000 Apple Computer, Inc. All rights reserved. | |
3 | * | |
4 | * @APPLE_LICENSE_HEADER_START@ | |
5 | * | |
de355530 A |
6 | * The contents of this file constitute Original Code as defined in and |
7 | * are subject to the Apple Public Source License Version 1.1 (the | |
8 | * "License"). You may not use this file except in compliance with the | |
9 | * License. Please obtain a copy of the License at | |
10 | * http://www.apple.com/publicsource and read it before using this file. | |
1c79356b | 11 | * |
de355530 A |
12 | * This Original Code and all software distributed under the License are |
13 | * distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY KIND, EITHER | |
1c79356b A |
14 | * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES, |
15 | * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY, | |
de355530 A |
16 | * FITNESS FOR A PARTICULAR PURPOSE OR NON-INFRINGEMENT. Please see the |
17 | * License for the specific language governing rights and limitations | |
18 | * under the License. | |
1c79356b A |
19 | * |
20 | * @APPLE_LICENSE_HEADER_END@ | |
21 | */ | |
22 | /* Copyright (c) 1995 NeXT Computer, Inc. All Rights Reserved */ | |
23 | /* | |
24 | * Copyright (c) 1989, 1991, 1993, 1994 | |
25 | * The Regents of the University of California. All rights reserved. | |
26 | * | |
27 | * Redistribution and use in source and binary forms, with or without | |
28 | * modification, are permitted provided that the following conditions | |
29 | * are met: | |
30 | * 1. Redistributions of source code must retain the above copyright | |
31 | * notice, this list of conditions and the following disclaimer. | |
32 | * 2. Redistributions in binary form must reproduce the above copyright | |
33 | * notice, this list of conditions and the following disclaimer in the | |
34 | * documentation and/or other materials provided with the distribution. | |
35 | * 3. All advertising materials mentioning features or use of this software | |
36 | * must display the following acknowledgement: | |
37 | * This product includes software developed by the University of | |
38 | * California, Berkeley and its contributors. | |
39 | * 4. Neither the name of the University nor the names of its contributors | |
40 | * may be used to endorse or promote products derived from this software | |
41 | * without specific prior written permission. | |
42 | * | |
43 | * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND | |
44 | * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | |
45 | * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | |
46 | * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE | |
47 | * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL | |
48 | * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS | |
49 | * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) | |
50 | * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT | |
51 | * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY | |
52 | * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF | |
53 | * SUCH DAMAGE. | |
54 | * | |
55 | * @(#)ffs_vfsops.c 8.31 (Berkeley) 5/20/95 | |
56 | */ | |
57 | ||
58 | #include <rev_endian_fs.h> | |
59 | #include <sys/param.h> | |
60 | #include <sys/systm.h> | |
61 | #include <sys/namei.h> | |
62 | #include <sys/proc.h> | |
63 | #include <sys/kernel.h> | |
64 | #include <sys/vnode.h> | |
65 | #include <sys/socket.h> | |
66 | #include <sys/mount.h> | |
67 | #include <sys/buf.h> | |
68 | #include <sys/mbuf.h> | |
69 | #include <sys/file.h> | |
70 | #include <dev/disk.h> | |
71 | #include <sys/ioctl.h> | |
72 | #include <sys/errno.h> | |
73 | #include <sys/malloc.h> | |
74 | #include <sys/ubc.h> | |
9bccf70c | 75 | #include <sys/quota.h> |
1c79356b A |
76 | |
77 | #include <miscfs/specfs/specdev.h> | |
78 | ||
79 | #include <ufs/ufs/quota.h> | |
80 | #include <ufs/ufs/ufsmount.h> | |
81 | #include <ufs/ufs/inode.h> | |
82 | #include <ufs/ufs/ufs_extern.h> | |
83 | ||
84 | #include <ufs/ffs/fs.h> | |
85 | #include <ufs/ffs/ffs_extern.h> | |
86 | #if REV_ENDIAN_FS | |
87 | #include <ufs/ufs/ufs_byte_order.h> | |
88 | #include <architecture/byte_order.h> | |
89 | #endif /* REV_ENDIAN_FS */ | |
90 | ||
91 | int ffs_sbupdate __P((struct ufsmount *, int)); | |
92 | ||
93 | struct vfsops ufs_vfsops = { | |
94 | ffs_mount, | |
95 | ufs_start, | |
96 | ffs_unmount, | |
97 | ufs_root, | |
98 | ufs_quotactl, | |
99 | ffs_statfs, | |
100 | ffs_sync, | |
101 | ffs_vget, | |
102 | ffs_fhtovp, | |
103 | ffs_vptofh, | |
104 | ffs_init, | |
105 | ffs_sysctl, | |
106 | }; | |
107 | ||
108 | extern u_long nextgennumber; | |
109 | ||
110 | /* | |
111 | * Called by main() when ufs is going to be mounted as root. | |
112 | */ | |
113 | ffs_mountroot() | |
114 | { | |
115 | extern struct vnode *rootvp; | |
116 | struct fs *fs; | |
117 | struct mount *mp; | |
118 | struct proc *p = current_proc(); /* XXX */ | |
119 | struct ufsmount *ump; | |
120 | u_int size; | |
121 | int error; | |
122 | ||
123 | /* | |
124 | * Get vnode for rootdev. | |
125 | */ | |
126 | if (error = bdevvp(rootdev, &rootvp)) { | |
127 | printf("ffs_mountroot: can't setup bdevvp"); | |
128 | return (error); | |
129 | } | |
9bccf70c A |
130 | if (error = vfs_rootmountalloc("ufs", "root_device", &mp)) { |
131 | vrele(rootvp); /* release the reference from bdevvp() */ | |
1c79356b | 132 | return (error); |
9bccf70c | 133 | } |
1c79356b A |
134 | |
135 | /* Must set the MNT_ROOTFS flag before doing the actual mount */ | |
136 | mp->mnt_flag |= MNT_ROOTFS; | |
137 | ||
138 | if (error = ffs_mountfs(rootvp, mp, p)) { | |
139 | mp->mnt_vfc->vfc_refcount--; | |
140 | vfs_unbusy(mp, p); | |
9bccf70c | 141 | vrele(rootvp); /* release the reference from bdevvp() */ |
1c79356b A |
142 | _FREE_ZONE(mp, sizeof (struct mount), M_MOUNT); |
143 | return (error); | |
144 | } | |
145 | simple_lock(&mountlist_slock); | |
146 | CIRCLEQ_INSERT_TAIL(&mountlist, mp, mnt_list); | |
147 | simple_unlock(&mountlist_slock); | |
148 | ump = VFSTOUFS(mp); | |
149 | fs = ump->um_fs; | |
150 | (void) copystr(mp->mnt_stat.f_mntonname, fs->fs_fsmnt, MNAMELEN - 1, 0); | |
151 | (void)ffs_statfs(mp, &mp->mnt_stat, p); | |
152 | vfs_unbusy(mp, p); | |
153 | inittodr(fs->fs_time); | |
154 | return (0); | |
155 | } | |
156 | ||
157 | /* | |
158 | * VFS Operations. | |
159 | * | |
160 | * mount system call | |
161 | */ | |
162 | int | |
163 | ffs_mount(mp, path, data, ndp, p) | |
164 | register struct mount *mp; | |
165 | char *path; | |
166 | caddr_t data; | |
167 | struct nameidata *ndp; | |
168 | struct proc *p; | |
169 | { | |
170 | struct vnode *devvp; | |
171 | struct ufs_args args; | |
172 | struct ufsmount *ump; | |
173 | register struct fs *fs; | |
174 | u_int size; | |
175 | int error, flags; | |
176 | mode_t accessmode; | |
177 | int ronly; | |
178 | int reload = 0; | |
179 | ||
180 | if (error = copyin(data, (caddr_t)&args, sizeof (struct ufs_args))) | |
181 | return (error); | |
182 | /* | |
183 | * If updating, check whether changing from read-only to | |
184 | * read/write; if there is no device name, that's all we do. | |
185 | */ | |
186 | if (mp->mnt_flag & MNT_UPDATE) { | |
187 | ump = VFSTOUFS(mp); | |
188 | fs = ump->um_fs; | |
189 | if (fs->fs_ronly == 0 && (mp->mnt_flag & MNT_RDONLY)) { | |
190 | flags = WRITECLOSE; | |
191 | if (mp->mnt_flag & MNT_FORCE) | |
192 | flags |= FORCECLOSE; | |
193 | if (error = ffs_flushfiles(mp, flags, p)) | |
194 | return (error); | |
195 | fs->fs_clean = 1; | |
196 | fs->fs_ronly = 1; | |
197 | if (error = ffs_sbupdate(ump, MNT_WAIT)) { | |
198 | fs->fs_clean = 0; | |
199 | fs->fs_ronly = 0; | |
200 | return (error); | |
201 | } | |
202 | } | |
203 | /* save fs_ronly to later use */ | |
204 | ronly = fs->fs_ronly; | |
205 | if ((mp->mnt_flag & MNT_RELOAD) || ronly) | |
206 | reload = 1; | |
207 | if ((reload) && | |
208 | (error = ffs_reload(mp, ndp->ni_cnd.cn_cred, p))) | |
209 | return (error); | |
210 | /* replace the ronly after load */ | |
211 | fs->fs_ronly = ronly; | |
212 | /* | |
213 | * Do not update the file system if the user was in singleuser | |
214 | * and then tries to mount -uw without fscking | |
215 | */ | |
216 | if (!fs->fs_clean && ronly) { | |
217 | printf("WARNING: trying to mount a dirty file system\n"); | |
218 | if (issingleuser() && (mp->mnt_flag & MNT_ROOTFS)) { | |
219 | printf("WARNING: R/W mount of %s denied. Filesystem is not clean - run fsck\n",fs->fs_fsmnt); | |
220 | /* | |
221 | * Reset the readonly bit as reload might have | |
222 | * modified this bit | |
223 | */ | |
224 | fs->fs_ronly = 1; | |
225 | return(EPERM); | |
226 | } | |
227 | } | |
228 | ||
229 | if (ronly && (mp->mnt_kern_flag & MNTK_WANTRDWR)) { | |
230 | /* | |
231 | * If upgrade to read-write by non-root, then verify | |
232 | * that user has necessary permissions on the device. | |
233 | */ | |
234 | if (p->p_ucred->cr_uid != 0) { | |
235 | devvp = ump->um_devvp; | |
236 | vn_lock(devvp, LK_EXCLUSIVE | LK_RETRY, p); | |
237 | if (error = VOP_ACCESS(devvp, VREAD | VWRITE, | |
238 | p->p_ucred, p)) { | |
239 | VOP_UNLOCK(devvp, 0, p); | |
240 | return (error); | |
241 | } | |
242 | VOP_UNLOCK(devvp, 0, p); | |
243 | } | |
244 | fs->fs_ronly = 0; | |
245 | fs->fs_clean = 0; | |
246 | (void) ffs_sbupdate(ump, MNT_WAIT); | |
247 | } | |
248 | if (args.fspec == 0) { | |
249 | /* | |
250 | * Process export requests. | |
251 | */ | |
252 | return (vfs_export(mp, &ump->um_export, &args.export)); | |
253 | } | |
254 | } | |
255 | /* | |
256 | * Not an update, or updating the name: look up the name | |
257 | * and verify that it refers to a sensible block device. | |
258 | */ | |
259 | NDINIT(ndp, LOOKUP, FOLLOW, UIO_USERSPACE, args.fspec, p); | |
260 | if (error = namei(ndp)) | |
261 | return (error); | |
262 | devvp = ndp->ni_vp; | |
263 | ||
264 | if (devvp->v_type != VBLK) { | |
265 | vrele(devvp); | |
266 | return (ENOTBLK); | |
267 | } | |
268 | if (major(devvp->v_rdev) >= nblkdev) { | |
269 | vrele(devvp); | |
270 | return (ENXIO); | |
271 | } | |
272 | /* | |
273 | * If mount by non-root, then verify that user has necessary | |
274 | * permissions on the device. | |
275 | */ | |
276 | if (p->p_ucred->cr_uid != 0) { | |
277 | accessmode = VREAD; | |
278 | if ((mp->mnt_flag & MNT_RDONLY) == 0) | |
279 | accessmode |= VWRITE; | |
280 | vn_lock(devvp, LK_EXCLUSIVE | LK_RETRY, p); | |
281 | if (error = VOP_ACCESS(devvp, accessmode, p->p_ucred, p)) { | |
282 | vput(devvp); | |
283 | return (error); | |
284 | } | |
285 | VOP_UNLOCK(devvp, 0, p); | |
286 | } | |
287 | if ((mp->mnt_flag & MNT_UPDATE) == 0) | |
288 | error = ffs_mountfs(devvp, mp, p); | |
289 | else { | |
290 | if (devvp != ump->um_devvp) | |
291 | error = EINVAL; /* needs translation */ | |
292 | else | |
293 | vrele(devvp); | |
294 | } | |
295 | if (error) { | |
296 | vrele(devvp); | |
297 | return (error); | |
298 | } | |
299 | ump = VFSTOUFS(mp); | |
300 | fs = ump->um_fs; | |
301 | (void) copyinstr(path, fs->fs_fsmnt, sizeof(fs->fs_fsmnt) - 1, &size); | |
302 | bzero(fs->fs_fsmnt + size, sizeof(fs->fs_fsmnt) - size); | |
303 | bcopy((caddr_t)fs->fs_fsmnt, (caddr_t)mp->mnt_stat.f_mntonname, | |
304 | MNAMELEN); | |
305 | (void) copyinstr(args.fspec, mp->mnt_stat.f_mntfromname, MNAMELEN - 1, | |
306 | &size); | |
307 | bzero(mp->mnt_stat.f_mntfromname + size, MNAMELEN - size); | |
308 | (void)ffs_statfs(mp, &mp->mnt_stat, p); | |
309 | return (0); | |
310 | } | |
311 | ||
312 | /* | |
313 | * Reload all incore data for a filesystem (used after running fsck on | |
314 | * the root filesystem and finding things to fix). The filesystem must | |
315 | * be mounted read-only. | |
316 | * | |
317 | * Things to do to update the mount: | |
318 | * 1) invalidate all cached meta-data. | |
319 | * 2) re-read superblock from disk. | |
320 | * 3) re-read summary information from disk. | |
321 | * 4) invalidate all inactive vnodes. | |
322 | * 5) invalidate all cached file data. | |
323 | * 6) re-read inode data for all active vnodes. | |
324 | */ | |
325 | ffs_reload(mountp, cred, p) | |
326 | register struct mount *mountp; | |
327 | struct ucred *cred; | |
328 | struct proc *p; | |
329 | { | |
330 | register struct vnode *vp, *nvp, *devvp; | |
331 | struct inode *ip; | |
9bccf70c | 332 | void *space; |
1c79356b A |
333 | struct buf *bp; |
334 | struct fs *fs, *newfs; | |
335 | int i, blks, size, error; | |
0b4e3aa0 | 336 | u_int64_t maxfilesize; /* XXX */ |
1c79356b A |
337 | int32_t *lp; |
338 | #if REV_ENDIAN_FS | |
339 | int rev_endian = (mountp->mnt_flag & MNT_REVEND); | |
340 | #endif /* REV_ENDIAN_FS */ | |
341 | ||
342 | if ((mountp->mnt_flag & MNT_RDONLY) == 0) | |
343 | return (EINVAL); | |
344 | /* | |
345 | * Step 1: invalidate all cached meta-data. | |
346 | */ | |
347 | devvp = VFSTOUFS(mountp)->um_devvp; | |
348 | if (vinvalbuf(devvp, 0, cred, p, 0, 0)) | |
349 | panic("ffs_reload: dirty1"); | |
350 | /* | |
351 | * Step 2: re-read superblock from disk. | |
352 | */ | |
353 | VOP_DEVBLOCKSIZE(devvp,&size); | |
354 | ||
355 | if (error = bread(devvp, (ufs_daddr_t)(SBOFF/size), SBSIZE, NOCRED,&bp)) { | |
356 | brelse(bp); | |
357 | return (error); | |
358 | } | |
359 | newfs = (struct fs *)bp->b_data; | |
360 | #if REV_ENDIAN_FS | |
361 | if (rev_endian) { | |
362 | byte_swap_sbin(newfs); | |
363 | } | |
364 | #endif /* REV_ENDIAN_FS */ | |
365 | if (newfs->fs_magic != FS_MAGIC || newfs->fs_bsize > MAXBSIZE || | |
366 | newfs->fs_bsize < sizeof(struct fs)) { | |
367 | #if REV_ENDIAN_FS | |
368 | if (rev_endian) | |
369 | byte_swap_sbout(newfs); | |
370 | #endif /* REV_ENDIAN_FS */ | |
371 | ||
372 | brelse(bp); | |
373 | return (EIO); /* XXX needs translation */ | |
374 | } | |
375 | fs = VFSTOUFS(mountp)->um_fs; | |
376 | /* | |
377 | * Copy pointer fields back into superblock before copying in XXX | |
378 | * new superblock. These should really be in the ufsmount. XXX | |
379 | * Note that important parameters (eg fs_ncg) are unchanged. | |
380 | */ | |
9bccf70c | 381 | newfs->fs_csp = fs->fs_csp; |
1c79356b A |
382 | newfs->fs_maxcluster = fs->fs_maxcluster; |
383 | bcopy(newfs, fs, (u_int)fs->fs_sbsize); | |
384 | if (fs->fs_sbsize < SBSIZE) | |
385 | bp->b_flags |= B_INVAL; | |
386 | #if REV_ENDIAN_FS | |
387 | if (rev_endian) | |
388 | byte_swap_sbout(newfs); | |
389 | #endif /* REV_ENDIAN_FS */ | |
390 | brelse(bp); | |
391 | mountp->mnt_maxsymlinklen = fs->fs_maxsymlinklen; | |
392 | ffs_oldfscompat(fs); | |
0b4e3aa0 A |
393 | maxfilesize = (u_int64_t)0x100000000; /* 4GB */ |
394 | if (fs->fs_maxfilesize > maxfilesize) /* XXX */ | |
395 | fs->fs_maxfilesize = maxfilesize; /* XXX */ | |
1c79356b A |
396 | /* |
397 | * Step 3: re-read summary information from disk. | |
398 | */ | |
399 | blks = howmany(fs->fs_cssize, fs->fs_fsize); | |
9bccf70c | 400 | space = fs->fs_csp; |
1c79356b A |
401 | for (i = 0; i < blks; i += fs->fs_frag) { |
402 | size = fs->fs_bsize; | |
403 | if (i + fs->fs_frag > blks) | |
404 | size = (blks - i) * fs->fs_fsize; | |
405 | if (error = bread(devvp, fsbtodb(fs, fs->fs_csaddr + i), size, | |
406 | NOCRED, &bp)) { | |
407 | brelse(bp); | |
408 | return (error); | |
409 | } | |
410 | #if REV_ENDIAN_FS | |
411 | if (rev_endian) { | |
412 | /* csum swaps */ | |
413 | byte_swap_ints((int *)bp->b_data, size / sizeof(int)); | |
414 | } | |
415 | #endif /* REV_ENDIAN_FS */ | |
9bccf70c | 416 | bcopy(bp->b_data, space, (u_int)size); |
1c79356b A |
417 | #if REV_ENDIAN_FS |
418 | if (rev_endian) { | |
419 | /* csum swaps */ | |
420 | byte_swap_ints((int *)bp->b_data, size / sizeof(int)); | |
421 | } | |
422 | #endif /* REV_ENDIAN_FS */ | |
423 | brelse(bp); | |
424 | } | |
425 | /* | |
426 | * We no longer know anything about clusters per cylinder group. | |
427 | */ | |
428 | if (fs->fs_contigsumsize > 0) { | |
429 | lp = fs->fs_maxcluster; | |
430 | for (i = 0; i < fs->fs_ncg; i++) | |
431 | *lp++ = fs->fs_contigsumsize; | |
432 | } | |
433 | ||
434 | loop: | |
435 | simple_lock(&mntvnode_slock); | |
436 | for (vp = mountp->mnt_vnodelist.lh_first; vp != NULL; vp = nvp) { | |
437 | if (vp->v_mount != mountp) { | |
438 | simple_unlock(&mntvnode_slock); | |
439 | goto loop; | |
440 | } | |
441 | nvp = vp->v_mntvnodes.le_next; | |
442 | /* | |
443 | * Step 4: invalidate all inactive vnodes. | |
444 | */ | |
445 | if (vrecycle(vp, &mntvnode_slock, p)) | |
446 | goto loop; | |
447 | /* | |
448 | * Step 5: invalidate all cached file data. | |
449 | */ | |
450 | simple_lock(&vp->v_interlock); | |
451 | simple_unlock(&mntvnode_slock); | |
452 | if (vget(vp, LK_EXCLUSIVE | LK_INTERLOCK, p)) { | |
453 | goto loop; | |
454 | } | |
455 | if (vinvalbuf(vp, 0, cred, p, 0, 0)) | |
456 | panic("ffs_reload: dirty2"); | |
457 | /* | |
458 | * Step 6: re-read inode data for all active vnodes. | |
459 | */ | |
460 | ip = VTOI(vp); | |
461 | if (error = | |
462 | bread(devvp, fsbtodb(fs, ino_to_fsba(fs, ip->i_number)), | |
463 | (int)fs->fs_bsize, NOCRED, &bp)) { | |
464 | brelse(bp); | |
465 | vput(vp); | |
466 | return (error); | |
467 | } | |
468 | #if REV_ENDIAN_FS | |
469 | if (rev_endian) { | |
470 | byte_swap_inode_in(((struct dinode *)bp->b_data + | |
471 | ino_to_fsbo(fs, ip->i_number)), ip); | |
472 | } else { | |
473 | #endif /* REV_ENDIAN_FS */ | |
474 | ip->i_din = *((struct dinode *)bp->b_data + | |
475 | ino_to_fsbo(fs, ip->i_number)); | |
476 | #if REV_ENDIAN_FS | |
477 | } | |
478 | #endif /* REV_ENDIAN_FS */ | |
479 | brelse(bp); | |
480 | vput(vp); | |
481 | simple_lock(&mntvnode_slock); | |
482 | } | |
483 | simple_unlock(&mntvnode_slock); | |
484 | return (0); | |
485 | } | |
486 | ||
487 | /* | |
488 | * Common code for mount and mountroot | |
489 | */ | |
490 | int | |
491 | ffs_mountfs(devvp, mp, p) | |
492 | register struct vnode *devvp; | |
493 | struct mount *mp; | |
494 | struct proc *p; | |
495 | { | |
496 | register struct ufsmount *ump; | |
497 | struct buf *bp; | |
498 | register struct fs *fs; | |
499 | dev_t dev; | |
500 | struct buf *cgbp; | |
501 | struct cg *cgp; | |
502 | int32_t clustersumoff; | |
9bccf70c | 503 | void *space; |
1c79356b A |
504 | int error, i, blks, size, ronly; |
505 | int32_t *lp; | |
506 | struct ucred *cred; | |
507 | extern struct vnode *rootvp; | |
508 | u_int64_t maxfilesize; /* XXX */ | |
509 | u_int dbsize = DEV_BSIZE; | |
510 | #if REV_ENDIAN_FS | |
511 | int rev_endian=0; | |
512 | #endif /* REV_ENDIAN_FS */ | |
513 | dev = devvp->v_rdev; | |
514 | cred = p ? p->p_ucred : NOCRED; | |
515 | /* | |
516 | * Disallow multiple mounts of the same device. | |
517 | * Disallow mounting of a device that is currently in use | |
518 | * (except for root, which might share swap device for miniroot). | |
519 | * Flush out any old buffers remaining from a previous use. | |
520 | */ | |
521 | if (error = vfs_mountedon(devvp)) | |
522 | return (error); | |
523 | if (vcount(devvp) > 1 && devvp != rootvp) | |
524 | return (EBUSY); | |
525 | if (error = vinvalbuf(devvp, V_SAVE, cred, p, 0, 0)) | |
526 | return (error); | |
527 | ||
528 | ronly = (mp->mnt_flag & MNT_RDONLY) != 0; | |
529 | if (error = VOP_OPEN(devvp, ronly ? FREAD : FREAD|FWRITE, FSCRED, p)) | |
530 | return (error); | |
531 | ||
532 | VOP_DEVBLOCKSIZE(devvp,&size); | |
533 | ||
534 | bp = NULL; | |
535 | ump = NULL; | |
536 | if (error = bread(devvp, (ufs_daddr_t)(SBOFF/size), SBSIZE, cred, &bp)) | |
537 | goto out; | |
538 | fs = (struct fs *)bp->b_data; | |
539 | #if REV_ENDIAN_FS | |
540 | if (fs->fs_magic != FS_MAGIC || fs->fs_bsize > MAXBSIZE || | |
541 | fs->fs_bsize < sizeof(struct fs)) { | |
542 | int magic = fs->fs_magic; | |
543 | ||
544 | byte_swap_ints(&magic, 1); | |
545 | if (magic != FS_MAGIC) { | |
546 | error = EINVAL; | |
547 | goto out; | |
548 | } | |
549 | byte_swap_sbin(fs); | |
550 | if (fs->fs_magic != FS_MAGIC || fs->fs_bsize > MAXBSIZE || | |
551 | fs->fs_bsize < sizeof(struct fs)) { | |
552 | byte_swap_sbout(fs); | |
553 | error = EINVAL; /* XXX needs translation */ | |
554 | goto out; | |
555 | } | |
556 | rev_endian=1; | |
557 | } | |
558 | #endif /* REV_ENDIAN_FS */ | |
559 | if (fs->fs_magic != FS_MAGIC || fs->fs_bsize > MAXBSIZE || | |
560 | fs->fs_bsize < sizeof(struct fs)) { | |
561 | #if REV_ENDIAN_FS | |
562 | if (rev_endian) | |
563 | byte_swap_sbout(fs); | |
564 | #endif /* REV_ENDIAN_FS */ | |
565 | error = EINVAL; /* XXX needs translation */ | |
566 | goto out; | |
567 | } | |
568 | ||
569 | ||
570 | /* | |
571 | * Buffer cache does not handle multiple pages in a buf when | |
572 | * invalidating incore buffer in pageout. There are no locks | |
573 | * in the pageout path. So there is a danger of loosing data when | |
574 | * block allocation happens at the same time a pageout of buddy | |
575 | * page occurs. incore() returns buf with both | |
576 | * pages, this leads vnode-pageout to incorrectly flush of entire. | |
577 | * buf. Till the low level ffs code is modified to deal with these | |
578 | * do not mount any FS more than 4K size. | |
579 | */ | |
580 | /* | |
581 | * Can't mount filesystems with a fragment size less than DIRBLKSIZ | |
582 | */ | |
583 | /* | |
584 | * Don't mount dirty filesystems, except for the root filesystem | |
585 | */ | |
586 | if ((fs->fs_bsize > PAGE_SIZE) || (fs->fs_fsize < DIRBLKSIZ) || | |
587 | ((!(mp->mnt_flag & MNT_ROOTFS)) && (!fs->fs_clean))) { | |
588 | #if REV_ENDIAN_FS | |
589 | if (rev_endian) | |
590 | byte_swap_sbout(fs); | |
591 | #endif /* REV_ENDIAN_FS */ | |
592 | error = ENOTSUP; | |
593 | goto out; | |
594 | } | |
595 | ||
596 | /* Let's figure out the devblock size the file system is with */ | |
597 | /* the device block size = fragment size / number of sectors per frag */ | |
598 | ||
599 | dbsize = fs->fs_fsize / NSPF(fs); | |
600 | if(dbsize <= 0 ) { | |
601 | kprintf("device blocksize computaion failed\n"); | |
602 | } else { | |
603 | if (VOP_IOCTL(devvp, DKIOCSETBLOCKSIZE, &dbsize, FWRITE, NOCRED, | |
604 | p) != 0) { | |
605 | kprintf("failed to set device blocksize\n"); | |
606 | } | |
607 | /* force the specfs to reread blocksize from size() */ | |
608 | set_fsblocksize(devvp); | |
609 | } | |
610 | ||
0b4e3aa0 A |
611 | /* cache the IO attributes */ |
612 | error = vfs_init_io_attributes(devvp, mp); | |
613 | if (error) { | |
614 | printf("ffs_mountfs: vfs_init_io_attributes returned %d\n", | |
615 | error); | |
616 | goto out; | |
617 | } | |
1c79356b A |
618 | |
619 | /* XXX updating 4.2 FFS superblocks trashes rotational layout tables */ | |
620 | if (fs->fs_postblformat == FS_42POSTBLFMT && !ronly) { | |
621 | #if REV_ENDIAN_FS | |
622 | if (rev_endian) | |
623 | byte_swap_sbout(fs); | |
624 | #endif /* REV_ENDIAN_FS */ | |
625 | error = EROFS; /* needs translation */ | |
626 | goto out; | |
627 | } | |
628 | ||
629 | /* If we are not mounting read only, then check for overlap | |
630 | * condition in cylinder group's free block map. | |
631 | * If overlap exists, then force this into a read only mount | |
632 | * to avoid further corruption. PR#2216969 | |
633 | */ | |
634 | if (ronly == 0){ | |
635 | if (error = bread (devvp, fsbtodb(fs, cgtod(fs, 0)), | |
636 | (int)fs->fs_cgsize, NOCRED, &cgbp)) { | |
637 | brelse(cgbp); | |
638 | goto out; | |
639 | } | |
640 | cgp = (struct cg *)cgbp->b_data; | |
641 | #if REV_ENDIAN_FS | |
642 | if (rev_endian) | |
643 | byte_swap_cgin(cgp,fs); | |
644 | #endif /* REV_ENDIAN_FS */ | |
645 | if (!cg_chkmagic(cgp)){ | |
646 | #if REV_ENDIAN_FS | |
647 | if (rev_endian) | |
648 | byte_swap_cgout(cgp,fs); | |
649 | #endif /* REV_ENDIAN_FS */ | |
650 | brelse(cgbp); | |
651 | goto out; | |
652 | } | |
653 | if (cgp->cg_clustersumoff != 0) { | |
654 | /* Check for overlap */ | |
655 | clustersumoff = cgp->cg_freeoff + | |
656 | howmany(fs->fs_cpg * fs->fs_spc / NSPF(fs), NBBY); | |
657 | clustersumoff = roundup(clustersumoff, sizeof(long)); | |
658 | if (cgp->cg_clustersumoff < clustersumoff) { | |
659 | /* Overlap exists */ | |
660 | mp->mnt_flag |= MNT_RDONLY; | |
661 | ronly = 1; | |
662 | } | |
663 | } | |
664 | #if REV_ENDIAN_FS | |
665 | if (rev_endian) | |
666 | byte_swap_cgout(cgp,fs); | |
667 | #endif /* REV_ENDIAN_FS */ | |
668 | brelse(cgbp); | |
669 | } | |
670 | ||
671 | ump = _MALLOC(sizeof *ump, M_UFSMNT, M_WAITOK); | |
672 | bzero((caddr_t)ump, sizeof *ump); | |
673 | ump->um_fs = _MALLOC((u_long)fs->fs_sbsize, M_UFSMNT, | |
674 | M_WAITOK); | |
675 | bcopy(bp->b_data, ump->um_fs, (u_int)fs->fs_sbsize); | |
676 | if (fs->fs_sbsize < SBSIZE) | |
677 | bp->b_flags |= B_INVAL; | |
678 | #if REV_ENDIAN_FS | |
679 | if (rev_endian) | |
680 | byte_swap_sbout(fs); | |
681 | #endif /* REV_ENDIAN_FS */ | |
682 | brelse(bp); | |
683 | bp = NULL; | |
684 | fs = ump->um_fs; | |
685 | fs->fs_ronly = ronly; | |
686 | size = fs->fs_cssize; | |
687 | blks = howmany(size, fs->fs_fsize); | |
688 | if (fs->fs_contigsumsize > 0) | |
689 | size += fs->fs_ncg * sizeof(int32_t); | |
9bccf70c A |
690 | space = _MALLOC((u_long)size, M_UFSMNT, M_WAITOK); |
691 | fs->fs_csp = space; | |
1c79356b A |
692 | for (i = 0; i < blks; i += fs->fs_frag) { |
693 | size = fs->fs_bsize; | |
694 | if (i + fs->fs_frag > blks) | |
695 | size = (blks - i) * fs->fs_fsize; | |
696 | if (error = bread(devvp, fsbtodb(fs, fs->fs_csaddr + i), size, | |
697 | cred, &bp)) { | |
9bccf70c | 698 | _FREE(fs->fs_csp, M_UFSMNT); |
1c79356b A |
699 | goto out; |
700 | } | |
701 | bcopy(bp->b_data, space, (u_int)size); | |
702 | #if REV_ENDIAN_FS | |
703 | if (rev_endian) | |
704 | byte_swap_ints((int *) space, size / sizeof(int)); | |
705 | #endif /* REV_ENDIAN_FS */ | |
9bccf70c | 706 | space = (char *)space + size; |
1c79356b A |
707 | brelse(bp); |
708 | bp = NULL; | |
709 | } | |
710 | if (fs->fs_contigsumsize > 0) { | |
9bccf70c | 711 | fs->fs_maxcluster = lp = space; |
1c79356b A |
712 | for (i = 0; i < fs->fs_ncg; i++) |
713 | *lp++ = fs->fs_contigsumsize; | |
714 | } | |
715 | mp->mnt_data = (qaddr_t)ump; | |
716 | mp->mnt_stat.f_fsid.val[0] = (long)dev; | |
717 | mp->mnt_stat.f_fsid.val[1] = mp->mnt_vfc->vfc_typenum; | |
718 | #warning hardcoded max symlen and not "mp->mnt_maxsymlinklen = fs->fs_maxsymlinklen;" | |
719 | mp->mnt_maxsymlinklen = 60; | |
720 | #if REV_ENDIAN_FS | |
721 | if (rev_endian) | |
722 | mp->mnt_flag |= MNT_REVEND; | |
723 | #endif /* REV_ENDIAN_FS */ | |
724 | ump->um_mountp = mp; | |
725 | ump->um_dev = dev; | |
726 | ump->um_devvp = devvp; | |
727 | ump->um_nindir = fs->fs_nindir; | |
728 | ump->um_bptrtodb = fs->fs_fsbtodb; | |
729 | ump->um_seqinc = fs->fs_frag; | |
730 | for (i = 0; i < MAXQUOTAS; i++) | |
9bccf70c | 731 | ump->um_qfiles[i].qf_vp = NULLVP; |
1c79356b A |
732 | devvp->v_specflags |= SI_MOUNTEDON; |
733 | ffs_oldfscompat(fs); | |
734 | ump->um_savedmaxfilesize = fs->fs_maxfilesize; /* XXX */ | |
735 | maxfilesize = (u_int64_t)0x100000000; /* 4GB */ | |
736 | #if 0 | |
737 | maxfilesize = (u_int64_t)0x40000000 * fs->fs_bsize - 1; /* XXX */ | |
738 | #endif /* 0 */ | |
739 | if (fs->fs_maxfilesize > maxfilesize) /* XXX */ | |
740 | fs->fs_maxfilesize = maxfilesize; /* XXX */ | |
741 | if (ronly == 0) { | |
742 | fs->fs_clean = 0; | |
743 | (void) ffs_sbupdate(ump, MNT_WAIT); | |
744 | } | |
745 | return (0); | |
746 | out: | |
747 | if (bp) | |
748 | brelse(bp); | |
749 | (void)VOP_CLOSE(devvp, ronly ? FREAD : FREAD|FWRITE, cred, p); | |
750 | if (ump) { | |
751 | _FREE(ump->um_fs, M_UFSMNT); | |
752 | _FREE(ump, M_UFSMNT); | |
753 | mp->mnt_data = (qaddr_t)0; | |
754 | } | |
755 | return (error); | |
756 | } | |
757 | ||
758 | /* | |
759 | * Sanity checks for old file systems. | |
760 | * | |
761 | * XXX - goes away some day. | |
762 | */ | |
763 | ffs_oldfscompat(fs) | |
764 | struct fs *fs; | |
765 | { | |
766 | int i; | |
767 | ||
768 | fs->fs_npsect = max(fs->fs_npsect, fs->fs_nsect); /* XXX */ | |
769 | fs->fs_interleave = max(fs->fs_interleave, 1); /* XXX */ | |
770 | if (fs->fs_postblformat == FS_42POSTBLFMT) /* XXX */ | |
771 | fs->fs_nrpos = 8; /* XXX */ | |
772 | if (fs->fs_inodefmt < FS_44INODEFMT) { /* XXX */ | |
773 | u_int64_t sizepb = fs->fs_bsize; /* XXX */ | |
774 | /* XXX */ | |
775 | fs->fs_maxfilesize = fs->fs_bsize * NDADDR - 1; /* XXX */ | |
776 | for (i = 0; i < NIADDR; i++) { /* XXX */ | |
777 | sizepb *= NINDIR(fs); /* XXX */ | |
778 | fs->fs_maxfilesize += sizepb; /* XXX */ | |
779 | } /* XXX */ | |
780 | fs->fs_qbmask = ~fs->fs_bmask; /* XXX */ | |
781 | fs->fs_qfmask = ~fs->fs_fmask; /* XXX */ | |
782 | } /* XXX */ | |
783 | return (0); | |
784 | } | |
785 | ||
786 | /* | |
787 | * unmount system call | |
788 | */ | |
789 | int | |
790 | ffs_unmount(mp, mntflags, p) | |
791 | struct mount *mp; | |
792 | int mntflags; | |
793 | struct proc *p; | |
794 | { | |
795 | register struct ufsmount *ump; | |
796 | register struct fs *fs; | |
797 | int error, flags; | |
9bccf70c A |
798 | int force; |
799 | ||
1c79356b | 800 | flags = 0; |
9bccf70c A |
801 | force = 0; |
802 | if (mntflags & MNT_FORCE) { | |
1c79356b | 803 | flags |= FORCECLOSE; |
9bccf70c A |
804 | force = 1; |
805 | } | |
806 | if ( (error = ffs_flushfiles(mp, flags, p)) && !force ) | |
1c79356b A |
807 | return (error); |
808 | ump = VFSTOUFS(mp); | |
809 | fs = ump->um_fs; | |
810 | if (fs->fs_ronly == 0) { | |
811 | fs->fs_clean = 1; | |
812 | if (error = ffs_sbupdate(ump, MNT_WAIT)) { | |
813 | fs->fs_clean = 0; | |
814 | #ifdef notyet | |
815 | /* we can atleast cleanup ; as the media could be WP */ | |
816 | /* & during mount, we do not check for write failures */ | |
817 | /* FIXME LATER : the Correct fix would be to have */ | |
818 | /* mount detect the WP media and downgrade to readonly mount */ | |
819 | /* For now, here it is */ | |
820 | return (error); | |
821 | #endif /* notyet */ | |
822 | } | |
823 | } | |
824 | ump->um_devvp->v_specflags &= ~SI_MOUNTEDON; | |
825 | error = VOP_CLOSE(ump->um_devvp, fs->fs_ronly ? FREAD : FREAD|FWRITE, | |
826 | NOCRED, p); | |
9bccf70c A |
827 | if (error && !force) |
828 | return (error); | |
1c79356b A |
829 | vrele(ump->um_devvp); |
830 | ||
9bccf70c | 831 | _FREE(fs->fs_csp, M_UFSMNT); |
1c79356b A |
832 | _FREE(fs, M_UFSMNT); |
833 | _FREE(ump, M_UFSMNT); | |
834 | mp->mnt_data = (qaddr_t)0; | |
835 | #if REV_ENDIAN_FS | |
836 | mp->mnt_flag &= ~MNT_REVEND; | |
837 | #endif /* REV_ENDIAN_FS */ | |
9bccf70c | 838 | return (0); |
1c79356b A |
839 | } |
840 | ||
841 | /* | |
842 | * Flush out all the files in a filesystem. | |
843 | */ | |
844 | ffs_flushfiles(mp, flags, p) | |
845 | register struct mount *mp; | |
846 | int flags; | |
847 | struct proc *p; | |
848 | { | |
849 | register struct ufsmount *ump; | |
850 | int i, error; | |
851 | ||
852 | ump = VFSTOUFS(mp); | |
853 | #if QUOTA | |
854 | if (mp->mnt_flag & MNT_QUOTA) { | |
855 | if (error = vflush(mp, NULLVP, SKIPSYSTEM|flags)) | |
856 | return (error); | |
857 | for (i = 0; i < MAXQUOTAS; i++) { | |
9bccf70c | 858 | if (ump->um_qfiles[i].qf_vp == NULLVP) |
1c79356b A |
859 | continue; |
860 | quotaoff(p, mp, i); | |
861 | } | |
862 | /* | |
863 | * Here we fall through to vflush again to ensure | |
864 | * that we have gotten rid of all the system vnodes. | |
865 | */ | |
866 | } | |
867 | #endif | |
868 | error = vflush(mp, NULLVP, SKIPSWAP|flags); | |
869 | error = vflush(mp, NULLVP, flags); | |
870 | return (error); | |
871 | } | |
872 | ||
873 | /* | |
874 | * Get file system statistics. | |
875 | */ | |
876 | int | |
877 | ffs_statfs(mp, sbp, p) | |
878 | struct mount *mp; | |
879 | register struct statfs *sbp; | |
880 | struct proc *p; | |
881 | { | |
882 | register struct ufsmount *ump; | |
883 | register struct fs *fs; | |
884 | ||
885 | ump = VFSTOUFS(mp); | |
886 | fs = ump->um_fs; | |
887 | if (fs->fs_magic != FS_MAGIC) | |
888 | panic("ffs_statfs"); | |
889 | sbp->f_bsize = fs->fs_fsize; | |
890 | sbp->f_iosize = fs->fs_bsize; | |
891 | sbp->f_blocks = fs->fs_dsize; | |
892 | sbp->f_bfree = fs->fs_cstotal.cs_nbfree * fs->fs_frag + | |
893 | fs->fs_cstotal.cs_nffree; | |
894 | sbp->f_bavail = freespace(fs, fs->fs_minfree); | |
895 | sbp->f_files = fs->fs_ncg * fs->fs_ipg - ROOTINO; | |
896 | sbp->f_ffree = fs->fs_cstotal.cs_nifree; | |
897 | if (sbp != &mp->mnt_stat) { | |
898 | sbp->f_type = mp->mnt_vfc->vfc_typenum; | |
899 | bcopy((caddr_t)mp->mnt_stat.f_mntonname, | |
900 | (caddr_t)&sbp->f_mntonname[0], MNAMELEN); | |
901 | bcopy((caddr_t)mp->mnt_stat.f_mntfromname, | |
902 | (caddr_t)&sbp->f_mntfromname[0], MNAMELEN); | |
903 | } | |
904 | return (0); | |
905 | } | |
906 | ||
907 | /* | |
908 | * Go through the disk queues to initiate sandbagged IO; | |
909 | * go through the inodes to write those that have been modified; | |
910 | * initiate the writing of the super block if it has been modified. | |
911 | * | |
912 | * Note: we are always called with the filesystem marked `MPBUSY'. | |
913 | */ | |
914 | int | |
915 | ffs_sync(mp, waitfor, cred, p) | |
916 | struct mount *mp; | |
917 | int waitfor; | |
918 | struct ucred *cred; | |
919 | struct proc *p; | |
920 | { | |
921 | struct vnode *nvp, *vp; | |
922 | struct inode *ip; | |
923 | struct ufsmount *ump = VFSTOUFS(mp); | |
924 | struct fs *fs; | |
925 | int error, allerror = 0; | |
926 | ||
927 | fs = ump->um_fs; | |
928 | if (fs->fs_fmod != 0 && fs->fs_ronly != 0) { /* XXX */ | |
929 | printf("fs = %s\n", fs->fs_fsmnt); | |
930 | panic("update: rofs mod"); | |
931 | } | |
932 | /* | |
933 | * Write back each (modified) inode. | |
934 | */ | |
935 | simple_lock(&mntvnode_slock); | |
936 | loop: | |
937 | for (vp = mp->mnt_vnodelist.lh_first; | |
938 | vp != NULL; | |
939 | vp = nvp) { | |
0b4e3aa0 A |
940 | int didhold = 0; |
941 | ||
1c79356b A |
942 | /* |
943 | * If the vnode that we are about to sync is no longer | |
944 | * associated with this mount point, start over. | |
945 | */ | |
946 | if (vp->v_mount != mp) | |
947 | goto loop; | |
948 | simple_lock(&vp->v_interlock); | |
949 | nvp = vp->v_mntvnodes.le_next; | |
950 | ip = VTOI(vp); | |
951 | if ((vp->v_type == VNON) || | |
952 | ((ip->i_flag & (IN_ACCESS | IN_CHANGE | IN_MODIFIED | IN_UPDATE)) == 0 && | |
953 | vp->v_dirtyblkhd.lh_first == NULL && !(vp->v_flag & VHASDIRTY))) { | |
954 | simple_unlock(&vp->v_interlock); | |
955 | continue; | |
956 | } | |
957 | simple_unlock(&mntvnode_slock); | |
958 | error = vget(vp, LK_EXCLUSIVE | LK_NOWAIT | LK_INTERLOCK, p); | |
959 | if (error) { | |
960 | simple_lock(&mntvnode_slock); | |
961 | if (error == ENOENT) | |
962 | goto loop; | |
963 | continue; | |
964 | } | |
0b4e3aa0 | 965 | didhold = ubc_hold(vp); |
1c79356b A |
966 | if (error = VOP_FSYNC(vp, cred, waitfor, p)) |
967 | allerror = error; | |
968 | VOP_UNLOCK(vp, 0, p); | |
0b4e3aa0 A |
969 | if (didhold) |
970 | ubc_rele(vp); | |
1c79356b A |
971 | vrele(vp); |
972 | simple_lock(&mntvnode_slock); | |
973 | } | |
974 | simple_unlock(&mntvnode_slock); | |
975 | /* | |
976 | * Force stale file system control information to be flushed. | |
977 | */ | |
978 | if (error = VOP_FSYNC(ump->um_devvp, cred, waitfor, p)) | |
979 | allerror = error; | |
980 | #if QUOTA | |
981 | qsync(mp); | |
982 | #endif | |
983 | /* | |
984 | * Write back modified superblock. | |
985 | */ | |
986 | if (fs->fs_fmod != 0) { | |
987 | fs->fs_fmod = 0; | |
988 | fs->fs_time = time.tv_sec; | |
989 | if (error = ffs_sbupdate(ump, waitfor)) | |
990 | allerror = error; | |
991 | } | |
992 | return (allerror); | |
993 | } | |
994 | ||
995 | /* | |
996 | * Look up a FFS dinode number to find its incore vnode, otherwise read it | |
997 | * in from disk. If it is in core, wait for the lock bit to clear, then | |
998 | * return the inode locked. Detection and handling of mount points must be | |
999 | * done by the calling routine. | |
1000 | */ | |
1001 | int | |
1002 | ffs_vget(mp, ino, vpp) | |
1003 | struct mount *mp; | |
1004 | ino_t ino; | |
1005 | struct vnode **vpp; | |
1006 | { | |
1007 | struct proc *p = current_proc(); /* XXX */ | |
1008 | struct fs *fs; | |
1009 | struct inode *ip; | |
1010 | struct ufsmount *ump; | |
1011 | struct buf *bp; | |
1012 | struct vnode *vp; | |
1013 | dev_t dev; | |
1014 | int i, type, error; | |
1015 | ||
1016 | ump = VFSTOUFS(mp); | |
1017 | dev = ump->um_dev; | |
1018 | ||
1019 | /* Check for unmount in progress */ | |
1020 | if (mp->mnt_kern_flag & MNTK_UNMOUNT) { | |
1021 | *vpp = NULL; | |
1022 | return (EPERM); | |
1023 | } | |
1024 | ||
1025 | if ((*vpp = ufs_ihashget(dev, ino)) != NULL) { | |
1026 | vp = *vpp; | |
1027 | UBCINFOCHECK("ffs_vget", vp); | |
1028 | return (0); | |
1029 | } | |
1030 | /* Allocate a new vnode/inode. */ | |
1031 | type = ump->um_devvp->v_tag == VT_MFS ? M_MFSNODE : M_FFSNODE; /* XXX */ | |
1032 | MALLOC_ZONE(ip, struct inode *, sizeof(struct inode), type, M_WAITOK); | |
1c79356b A |
1033 | bzero((caddr_t)ip, sizeof(struct inode)); |
1034 | lockinit(&ip->i_lock, PINOD, "inode", 0, 0); | |
7b1edb79 A |
1035 | /* lock the inode */ |
1036 | lockmgr(&ip->i_lock, LK_EXCLUSIVE, (struct slock *)0, p); | |
1037 | ||
1c79356b A |
1038 | ip->i_fs = fs = ump->um_fs; |
1039 | ip->i_dev = dev; | |
1040 | ip->i_number = ino; | |
7b1edb79 | 1041 | ip->i_flag |= IN_ALLOC; |
1c79356b A |
1042 | #if QUOTA |
1043 | for (i = 0; i < MAXQUOTAS; i++) | |
1044 | ip->i_dquot[i] = NODQUOT; | |
1045 | #endif | |
7b1edb79 | 1046 | |
1c79356b | 1047 | /* |
7b1edb79 A |
1048 | * MALLOC_ZONE is blocking call. Check for race. |
1049 | */ | |
1050 | if ((*vpp = ufs_ihashget(dev, ino)) != NULL) { | |
1051 | /* Clean up */ | |
1052 | FREE_ZONE(ip, sizeof(struct inode), type); | |
1053 | vp = *vpp; | |
1054 | UBCINFOCHECK("ffs_vget", vp); | |
1055 | return (0); | |
1056 | } | |
1057 | ||
1058 | /* | |
1059 | * Put it onto its hash chain locked so that other requests for | |
1c79356b A |
1060 | * this inode will block if they arrive while we are sleeping waiting |
1061 | * for old data structures to be purged or for the contents of the | |
1062 | * disk portion of this inode to be read. | |
1063 | */ | |
1064 | ufs_ihashins(ip); | |
1065 | ||
7b1edb79 A |
1066 | if (error = getnewvnode(VT_UFS, mp, ffs_vnodeop_p, &vp)) { |
1067 | ufs_ihashrem(ip); | |
1068 | if (ISSET(ip->i_flag, IN_WALLOC)) | |
1069 | wakeup(ip); | |
1070 | FREE_ZONE(ip, sizeof(struct inode), type); | |
1071 | *vpp = NULL; | |
1072 | return (error); | |
1073 | } | |
1074 | vp->v_data = ip; | |
1075 | ip->i_vnode = vp; | |
1076 | ||
1077 | /* | |
1078 | * A vnode is associated with the inode now, | |
1079 | * vget() can deal with the serialization. | |
1080 | */ | |
1081 | CLR(ip->i_flag, IN_ALLOC); | |
1082 | if (ISSET(ip->i_flag, IN_WALLOC)) | |
1083 | wakeup(ip); | |
1084 | ||
1c79356b A |
1085 | /* Read in the disk contents for the inode, copy into the inode. */ |
1086 | if (error = bread(ump->um_devvp, fsbtodb(fs, ino_to_fsba(fs, ino)), | |
1087 | (int)fs->fs_bsize, NOCRED, &bp)) { | |
1088 | /* | |
1089 | * The inode does not contain anything useful, so it would | |
1090 | * be misleading to leave it on its hash chain. With mode | |
1091 | * still zero, it will be unlinked and returned to the free | |
1092 | * list by vput(). | |
1093 | */ | |
1094 | vput(vp); | |
1095 | brelse(bp); | |
1096 | *vpp = NULL; | |
1097 | return (error); | |
1098 | } | |
1099 | #if REV_ENDIAN_FS | |
1100 | if (mp->mnt_flag & MNT_REVEND) { | |
1101 | byte_swap_inode_in(((struct dinode *)bp->b_data + ino_to_fsbo(fs, ino)),ip); | |
1102 | } else { | |
1103 | #endif /* REV_ENDIAN_FS */ | |
1104 | ip->i_din = *((struct dinode *)bp->b_data + ino_to_fsbo(fs, ino)); | |
1105 | #if REV_ENDIAN_FS | |
1106 | } | |
1107 | #endif /* REV_ENDIAN_FS */ | |
1108 | brelse(bp); | |
1109 | ||
1110 | /* | |
1111 | * Initialize the vnode from the inode, check for aliases. | |
1112 | * Note that the underlying vnode may have changed. | |
1113 | */ | |
1114 | if (error = ufs_vinit(mp, ffs_specop_p, FFS_FIFOOPS, &vp)) { | |
1115 | vput(vp); | |
1116 | *vpp = NULL; | |
1117 | return (error); | |
1118 | } | |
1119 | /* | |
1120 | * Finish inode initialization now that aliasing has been resolved. | |
1121 | */ | |
1122 | ip->i_devvp = ump->um_devvp; | |
1123 | VREF(ip->i_devvp); | |
1124 | /* | |
1125 | * Set up a generation number for this inode if it does not | |
1126 | * already have one. This should only happen on old filesystems. | |
1127 | */ | |
1128 | if (ip->i_gen == 0) { | |
1129 | if (++nextgennumber < (u_long)time.tv_sec) | |
1130 | nextgennumber = time.tv_sec; | |
1131 | ip->i_gen = nextgennumber; | |
1132 | if ((vp->v_mount->mnt_flag & MNT_RDONLY) == 0) | |
1133 | ip->i_flag |= IN_MODIFIED; | |
1134 | } | |
1135 | /* | |
1136 | * Ensure that uid and gid are correct. This is a temporary | |
1137 | * fix until fsck has been changed to do the update. | |
1138 | */ | |
1139 | if (fs->fs_inodefmt < FS_44INODEFMT) { /* XXX */ | |
1140 | ip->i_uid = ip->i_din.di_ouid; /* XXX */ | |
1141 | ip->i_gid = ip->i_din.di_ogid; /* XXX */ | |
1142 | } /* XXX */ | |
1143 | ||
1144 | *vpp = vp; | |
1145 | if (UBCINFOMISSING(vp) || UBCINFORECLAIMED(vp)) | |
1146 | ubc_info_init(vp); | |
1147 | return (0); | |
1148 | } | |
1149 | ||
1150 | /* | |
1151 | * File handle to vnode | |
1152 | * | |
1153 | * Have to be really careful about stale file handles: | |
1154 | * - check that the inode number is valid | |
1155 | * - call ffs_vget() to get the locked inode | |
1156 | * - check for an unallocated inode (i_mode == 0) | |
1157 | * - check that the given client host has export rights and return | |
1158 | * those rights via. exflagsp and credanonp | |
1159 | */ | |
1160 | int | |
1161 | ffs_fhtovp(mp, fhp, nam, vpp, exflagsp, credanonp) | |
1162 | register struct mount *mp; | |
1163 | struct fid *fhp; | |
1164 | struct mbuf *nam; | |
1165 | struct vnode **vpp; | |
1166 | int *exflagsp; | |
1167 | struct ucred **credanonp; | |
1168 | { | |
1169 | register struct ufid *ufhp; | |
1170 | struct fs *fs; | |
1171 | ||
1172 | ufhp = (struct ufid *)fhp; | |
1173 | fs = VFSTOUFS(mp)->um_fs; | |
1174 | if (ufhp->ufid_ino < ROOTINO || | |
1175 | ufhp->ufid_ino >= fs->fs_ncg * fs->fs_ipg) | |
1176 | return (ESTALE); | |
1177 | return (ufs_check_export(mp, ufhp, nam, vpp, exflagsp, credanonp)); | |
1178 | } | |
1179 | ||
1180 | /* | |
1181 | * Vnode pointer to File handle | |
1182 | */ | |
1183 | /* ARGSUSED */ | |
1184 | ffs_vptofh(vp, fhp) | |
1185 | struct vnode *vp; | |
1186 | struct fid *fhp; | |
1187 | { | |
1188 | register struct inode *ip; | |
1189 | register struct ufid *ufhp; | |
1190 | ||
1191 | ip = VTOI(vp); | |
1192 | ufhp = (struct ufid *)fhp; | |
1193 | ufhp->ufid_len = sizeof(struct ufid); | |
1194 | ufhp->ufid_ino = ip->i_number; | |
1195 | ufhp->ufid_gen = ip->i_gen; | |
1196 | return (0); | |
1197 | } | |
1198 | ||
1199 | /* | |
1200 | * Initialize the filesystem; just use ufs_init. | |
1201 | */ | |
1202 | int | |
1203 | ffs_init(vfsp) | |
1204 | struct vfsconf *vfsp; | |
1205 | { | |
1206 | ||
1207 | return (ufs_init(vfsp)); | |
1208 | } | |
1209 | ||
1210 | /* | |
1211 | * fast filesystem related variables. | |
1212 | */ | |
1213 | ffs_sysctl(name, namelen, oldp, oldlenp, newp, newlen, p) | |
1214 | int *name; | |
1215 | u_int namelen; | |
1216 | void *oldp; | |
1217 | size_t *oldlenp; | |
1218 | void *newp; | |
1219 | size_t newlen; | |
1220 | struct proc *p; | |
1221 | { | |
1222 | extern int doclusterread, doclusterwrite, doreallocblks, doasyncfree; | |
1223 | ||
1224 | /* all sysctl names at this level are terminal */ | |
1225 | if (namelen != 1) | |
1226 | return (ENOTDIR); /* overloaded */ | |
1227 | ||
1228 | switch (name[0]) { | |
1229 | case FFS_CLUSTERREAD: | |
1230 | return (sysctl_int(oldp, oldlenp, newp, newlen, | |
1231 | &doclusterread)); | |
1232 | case FFS_CLUSTERWRITE: | |
1233 | return (sysctl_int(oldp, oldlenp, newp, newlen, | |
1234 | &doclusterwrite)); | |
1235 | case FFS_REALLOCBLKS: | |
1236 | return (sysctl_int(oldp, oldlenp, newp, newlen, | |
1237 | &doreallocblks)); | |
1238 | case FFS_ASYNCFREE: | |
1239 | return (sysctl_int(oldp, oldlenp, newp, newlen, &doasyncfree)); | |
1240 | default: | |
1241 | return (EOPNOTSUPP); | |
1242 | } | |
1243 | /* NOTREACHED */ | |
1244 | } | |
1245 | ||
1246 | /* | |
1247 | * Write a superblock and associated information back to disk. | |
1248 | */ | |
1249 | int | |
1250 | ffs_sbupdate(mp, waitfor) | |
1251 | struct ufsmount *mp; | |
1252 | int waitfor; | |
1253 | { | |
1254 | register struct fs *dfs, *fs = mp->um_fs; | |
1255 | register struct buf *bp; | |
1256 | int blks; | |
9bccf70c | 1257 | void *space; |
1c79356b A |
1258 | int i, size, error, allerror = 0; |
1259 | int devBlockSize=0; | |
1260 | #if REV_ENDIAN_FS | |
1261 | int rev_endian=(mp->um_mountp->mnt_flag & MNT_REVEND); | |
1262 | #endif /* REV_ENDIAN_FS */ | |
1263 | ||
1264 | /* | |
1265 | * First write back the summary information. | |
1266 | */ | |
1267 | blks = howmany(fs->fs_cssize, fs->fs_fsize); | |
9bccf70c | 1268 | space = fs->fs_csp; |
1c79356b A |
1269 | for (i = 0; i < blks; i += fs->fs_frag) { |
1270 | size = fs->fs_bsize; | |
1271 | if (i + fs->fs_frag > blks) | |
1272 | size = (blks - i) * fs->fs_fsize; | |
1273 | bp = getblk(mp->um_devvp, fsbtodb(fs, fs->fs_csaddr + i), | |
1274 | size, 0, 0, BLK_META); | |
1275 | bcopy(space, bp->b_data, (u_int)size); | |
1276 | #if REV_ENDIAN_FS | |
1277 | if (rev_endian) { | |
1278 | byte_swap_ints((int *)bp->b_data, size / sizeof(int)); | |
1279 | } | |
1280 | #endif /* REV_ENDIAN_FS */ | |
9bccf70c | 1281 | space = (char *)space + size; |
1c79356b A |
1282 | if (waitfor != MNT_WAIT) |
1283 | bawrite(bp); | |
1284 | else if (error = bwrite(bp)) | |
1285 | allerror = error; | |
1286 | } | |
1287 | /* | |
1288 | * Now write back the superblock itself. If any errors occurred | |
1289 | * up to this point, then fail so that the superblock avoids | |
1290 | * being written out as clean. | |
1291 | */ | |
1292 | if (allerror) | |
1293 | return (allerror); | |
1294 | VOP_DEVBLOCKSIZE(mp->um_devvp,&devBlockSize); | |
1295 | bp = getblk(mp->um_devvp, (SBOFF/devBlockSize), (int)fs->fs_sbsize, 0, 0, BLK_META); | |
1296 | bcopy((caddr_t)fs, bp->b_data, (u_int)fs->fs_sbsize); | |
1297 | /* Restore compatibility to old file systems. XXX */ | |
1298 | dfs = (struct fs *)bp->b_data; /* XXX */ | |
1299 | if (fs->fs_postblformat == FS_42POSTBLFMT) /* XXX */ | |
1300 | dfs->fs_nrpos = -1; /* XXX */ | |
1301 | #if REV_ENDIAN_FS | |
1302 | /* | |
1303 | * Swapping bytes here ; so that in case | |
1304 | * of inode format < FS_44INODEFMT appropriate | |
1305 | * fields get moved | |
1306 | */ | |
1307 | if (rev_endian) { | |
1308 | byte_swap_sbout((struct fs *)bp->b_data); | |
1309 | } | |
1310 | #endif /* REV_ENDIAN_FS */ | |
1311 | if (fs->fs_inodefmt < FS_44INODEFMT) { /* XXX */ | |
1312 | int32_t *lp, tmp; /* XXX */ | |
1313 | /* XXX */ | |
1314 | lp = (int32_t *)&dfs->fs_qbmask; /* XXX */ | |
1315 | tmp = lp[4]; /* XXX */ | |
1316 | for (i = 4; i > 0; i--) /* XXX */ | |
1317 | lp[i] = lp[i-1]; /* XXX */ | |
1318 | lp[0] = tmp; /* XXX */ | |
1319 | } /* XXX */ | |
1320 | #if REV_ENDIAN_FS | |
1321 | /* Note that dfs is already swapped so swap the filesize | |
1322 | * before writing | |
1323 | */ | |
1324 | if (rev_endian) { | |
1325 | dfs->fs_maxfilesize = NXSwapLongLong(mp->um_savedmaxfilesize); /* XXX */ | |
1326 | } else { | |
1327 | #endif /* REV_ENDIAN_FS */ | |
1328 | dfs->fs_maxfilesize = mp->um_savedmaxfilesize; /* XXX */ | |
1329 | #if REV_ENDIAN_FS | |
1330 | } | |
1331 | #endif /* REV_ENDIAN_FS */ | |
1332 | if (waitfor != MNT_WAIT) | |
1333 | bawrite(bp); | |
1334 | else if (error = bwrite(bp)) | |
1335 | allerror = error; | |
1336 | ||
1337 | return (allerror); | |
1338 | } |