]> git.saurik.com Git - apple/xnu.git/blob - bsd/hfs/hfs_vfsops.c
xnu-1228.3.13.tar.gz
[apple/xnu.git] / bsd / hfs / hfs_vfsops.c
1 /*
2 * Copyright (c) 1999-2008 Apple Inc. All rights reserved.
3 *
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
5 *
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
14 *
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
17 *
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
25 *
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
27 */
28 /*
29 * Copyright (c) 1991, 1993, 1994
30 * The Regents of the University of California. All rights reserved.
31 * (c) UNIX System Laboratories, Inc.
32 * All or some portions of this file are derived from material licensed
33 * to the University of California by American Telephone and Telegraph
34 * Co. or Unix System Laboratories, Inc. and are reproduced herein with
35 * the permission of UNIX System Laboratories, Inc.
36 *
37 * Redistribution and use in source and binary forms, with or without
38 * modification, are permitted provided that the following conditions
39 * are met:
40 * 1. Redistributions of source code must retain the above copyright
41 * notice, this list of conditions and the following disclaimer.
42 * 2. Redistributions in binary form must reproduce the above copyright
43 * notice, this list of conditions and the following disclaimer in the
44 * documentation and/or other materials provided with the distribution.
45 * 3. All advertising materials mentioning features or use of this software
46 * must display the following acknowledgement:
47 * This product includes software developed by the University of
48 * California, Berkeley and its contributors.
49 * 4. Neither the name of the University nor the names of its contributors
50 * may be used to endorse or promote products derived from this software
51 * without specific prior written permission.
52 *
53 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
54 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
55 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
56 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
57 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
58 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
59 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
60 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
61 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
62 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
63 * SUCH DAMAGE.
64 *
65 * hfs_vfsops.c
66 * derived from @(#)ufs_vfsops.c 8.8 (Berkeley) 5/20/95
67 *
68 * (c) Copyright 1997-2002 Apple Computer, Inc. All rights reserved.
69 *
70 * hfs_vfsops.c -- VFS layer for loadable HFS file system.
71 *
72 */
73 #include <sys/param.h>
74 #include <sys/systm.h>
75 #include <sys/kauth.h>
76
77 #include <sys/ubc.h>
78 #include <sys/vnode_internal.h>
79 #include <sys/mount_internal.h>
80 #include <sys/sysctl.h>
81 #include <sys/malloc.h>
82 #include <sys/stat.h>
83 #include <sys/quota.h>
84 #include <sys/disk.h>
85 #include <sys/paths.h>
86 #include <sys/utfconv.h>
87 #include <sys/kdebug.h>
88 #include <sys/fslog.h>
89
90 #include <kern/locks.h>
91
92 #include <vfs/vfs_journal.h>
93
94 #include <miscfs/specfs/specdev.h>
95 #include <hfs/hfs_mount.h>
96
97 #include "hfs.h"
98 #include "hfs_catalog.h"
99 #include "hfs_cnode.h"
100 #include "hfs_dbg.h"
101 #include "hfs_endian.h"
102 #include "hfs_hotfiles.h"
103 #include "hfs_quota.h"
104
105 #include "hfscommon/headers/FileMgrInternal.h"
106 #include "hfscommon/headers/BTreesInternal.h"
107
108 #if HFS_DIAGNOSTIC
109 int hfs_dbg_all = 0;
110 int hfs_dbg_err = 0;
111 #endif
112
113
114 lck_grp_attr_t * hfs_group_attr;
115 lck_attr_t * hfs_lock_attr;
116 lck_grp_t * hfs_mutex_group;
117 lck_grp_t * hfs_rwlock_group;
118
119 extern struct vnodeopv_desc hfs_vnodeop_opv_desc;
120
121 static int hfs_changefs(struct mount *mp, struct hfs_mount_args *args);
122 static int hfs_fhtovp(struct mount *mp, int fhlen, unsigned char *fhp, struct vnode **vpp, vfs_context_t context);
123 static int hfs_flushfiles(struct mount *, int, struct proc *);
124 static int hfs_flushMDB(struct hfsmount *hfsmp, int waitfor, int altflush);
125 static int hfs_getmountpoint(struct vnode *vp, struct hfsmount **hfsmpp);
126 static int hfs_init(struct vfsconf *vfsp);
127 static int hfs_mount(struct mount *mp, vnode_t devvp, user_addr_t data, vfs_context_t context);
128 static int hfs_mountfs(struct vnode *devvp, struct mount *mp, struct hfs_mount_args *args, int journal_replay_only, vfs_context_t context);
129 static int hfs_reload(struct mount *mp);
130 static int hfs_vfs_root(struct mount *mp, struct vnode **vpp, vfs_context_t context);
131 static int hfs_quotactl(struct mount *, int, uid_t, caddr_t, vfs_context_t context);
132 static int hfs_start(struct mount *mp, int flags, vfs_context_t context);
133 static int hfs_statfs(struct mount *mp, register struct vfsstatfs *sbp, vfs_context_t context);
134 static int hfs_sync(struct mount *mp, int waitfor, vfs_context_t context);
135 static int hfs_sysctl(int *name, u_int namelen, user_addr_t oldp, size_t *oldlenp,
136 user_addr_t newp, size_t newlen, vfs_context_t context);
137 static int hfs_unmount(struct mount *mp, int mntflags, vfs_context_t context);
138 static int hfs_vfs_vget(struct mount *mp, ino64_t ino, struct vnode **vpp, vfs_context_t context);
139 static int hfs_vptofh(struct vnode *vp, int *fhlenp, unsigned char *fhp, vfs_context_t context);
140
141 static int hfs_reclaimspace(struct hfsmount *hfsmp, u_long startblk, u_long reclaimblks, vfs_context_t context);
142 static int hfs_overlapped_overflow_extents(struct hfsmount *hfsmp, u_int32_t startblk,
143 u_int32_t catblks, u_int32_t fileID, int rsrcfork);
144 static int hfs_journal_replay(const char *devnode, vfs_context_t context);
145
146
147 /*
148 * Called by vfs_mountroot when mounting HFS Plus as root.
149 */
150
151 __private_extern__
152 int
153 hfs_mountroot(mount_t mp, vnode_t rvp, vfs_context_t context)
154 {
155 struct hfsmount *hfsmp;
156 ExtendedVCB *vcb;
157 struct vfsstatfs *vfsp;
158 int error;
159
160 hfs_chashinit_finish();
161
162 if ((error = hfs_mountfs(rvp, mp, NULL, 0, context)))
163 return (error);
164
165 /* Init hfsmp */
166 hfsmp = VFSTOHFS(mp);
167
168 hfsmp->hfs_uid = UNKNOWNUID;
169 hfsmp->hfs_gid = UNKNOWNGID;
170 hfsmp->hfs_dir_mask = (S_IRWXU | S_IRGRP|S_IXGRP | S_IROTH|S_IXOTH); /* 0755 */
171 hfsmp->hfs_file_mask = (S_IRWXU | S_IRGRP|S_IXGRP | S_IROTH|S_IXOTH); /* 0755 */
172
173 /* Establish the free block reserve. */
174 vcb = HFSTOVCB(hfsmp);
175 vcb->reserveBlocks = ((u_int64_t)vcb->totalBlocks * HFS_MINFREE) / 100;
176 vcb->reserveBlocks = MIN(vcb->reserveBlocks, HFS_MAXRESERVE / vcb->blockSize);
177
178 vfsp = vfs_statfs(mp);
179 (void)hfs_statfs(mp, vfsp, NULL);
180
181 return (0);
182 }
183
184
185 /*
186 * VFS Operations.
187 *
188 * mount system call
189 */
190
191 static int
192 hfs_mount(struct mount *mp, vnode_t devvp, user_addr_t data, vfs_context_t context)
193 {
194 struct proc *p = vfs_context_proc(context);
195 struct hfsmount *hfsmp = NULL;
196 struct hfs_mount_args args;
197 int retval = E_NONE;
198 u_int32_t cmdflags;
199
200 if ((retval = copyin(data, (caddr_t)&args, sizeof(args)))) {
201 return (retval);
202 }
203 cmdflags = (u_int32_t)vfs_flags(mp) & MNT_CMDFLAGS;
204 if (cmdflags & MNT_UPDATE) {
205 hfsmp = VFSTOHFS(mp);
206
207 /* Reload incore data after an fsck. */
208 if (cmdflags & MNT_RELOAD) {
209 if (vfs_isrdonly(mp))
210 return hfs_reload(mp);
211 else
212 return (EINVAL);
213 }
214
215 /* Change to a read-only file system. */
216 if (((hfsmp->hfs_flags & HFS_READ_ONLY) == 0) &&
217 vfs_isrdonly(mp)) {
218 int flags;
219
220 /* use VFS_SYNC to push out System (btree) files */
221 retval = VFS_SYNC(mp, MNT_WAIT, context);
222 if (retval && ((cmdflags & MNT_FORCE) == 0))
223 goto out;
224
225 flags = WRITECLOSE;
226 if (cmdflags & MNT_FORCE)
227 flags |= FORCECLOSE;
228
229 if ((retval = hfs_flushfiles(mp, flags, p)))
230 goto out;
231 hfsmp->hfs_flags |= HFS_READ_ONLY;
232 retval = hfs_flushvolumeheader(hfsmp, MNT_WAIT, 0);
233
234 /* also get the volume bitmap blocks */
235 if (!retval) {
236 if (vnode_mount(hfsmp->hfs_devvp) == mp) {
237 retval = hfs_fsync(hfsmp->hfs_devvp, MNT_WAIT, 0, p);
238 } else {
239 vnode_get(hfsmp->hfs_devvp);
240 retval = VNOP_FSYNC(hfsmp->hfs_devvp, MNT_WAIT, context);
241 vnode_put(hfsmp->hfs_devvp);
242 }
243 }
244 if (retval) {
245 hfsmp->hfs_flags &= ~HFS_READ_ONLY;
246 goto out;
247 }
248 if (hfsmp->jnl) {
249 hfs_global_exclusive_lock_acquire(hfsmp);
250
251 journal_close(hfsmp->jnl);
252 hfsmp->jnl = NULL;
253
254 // Note: we explicitly don't want to shutdown
255 // access to the jvp because we may need
256 // it later if we go back to being read-write.
257
258 hfs_global_exclusive_lock_release(hfsmp);
259 }
260 }
261
262 /* Change to a writable file system. */
263 if (vfs_iswriteupgrade(mp)) {
264
265 /*
266 * On inconsistent disks, do not allow read-write mount
267 * unless it is the boot volume being mounted.
268 */
269 if (!(vfs_flags(mp) & MNT_ROOTFS) &&
270 (hfsmp->vcbAtrb & kHFSVolumeInconsistentMask)) {
271 retval = EINVAL;
272 goto out;
273 }
274
275
276 retval = hfs_flushvolumeheader(hfsmp, MNT_WAIT, 0);
277 if (retval != E_NONE)
278 goto out;
279
280 // If the journal was shut-down previously because we were
281 // asked to be read-only, let's start it back up again now
282
283 if ( (HFSTOVCB(hfsmp)->vcbAtrb & kHFSVolumeJournaledMask)
284 && hfsmp->jnl == NULL
285 && hfsmp->jvp != NULL) {
286 int jflags;
287
288 if (hfsmp->hfs_flags & HFS_NEED_JNL_RESET) {
289 jflags = JOURNAL_RESET;
290 } else {
291 jflags = 0;
292 }
293
294 hfs_global_exclusive_lock_acquire(hfsmp);
295
296 hfsmp->jnl = journal_open(hfsmp->jvp,
297 (hfsmp->jnl_start * HFSTOVCB(hfsmp)->blockSize) + (off_t)HFSTOVCB(hfsmp)->hfsPlusIOPosOffset,
298 hfsmp->jnl_size,
299 hfsmp->hfs_devvp,
300 hfsmp->hfs_phys_block_size,
301 jflags,
302 0,
303 hfs_sync_metadata, hfsmp->hfs_mp);
304
305 hfs_global_exclusive_lock_release(hfsmp);
306
307 if (hfsmp->jnl == NULL) {
308 retval = EINVAL;
309 goto out;
310 } else {
311 hfsmp->hfs_flags &= ~HFS_NEED_JNL_RESET;
312 }
313
314 }
315
316 /* Only clear HFS_READ_ONLY after a successfull write */
317 hfsmp->hfs_flags &= ~HFS_READ_ONLY;
318
319 if (!(hfsmp->hfs_flags & (HFS_READ_ONLY & HFS_STANDARD))) {
320 /* Setup private/hidden directories for hardlinks. */
321 hfs_privatedir_init(hfsmp, FILE_HARDLINKS);
322 hfs_privatedir_init(hfsmp, DIR_HARDLINKS);
323
324 hfs_remove_orphans(hfsmp);
325
326 /*
327 * Allow hot file clustering if conditions allow.
328 */
329 if (hfsmp->hfs_flags & HFS_METADATA_ZONE) {
330 (void) hfs_recording_init(hfsmp);
331 }
332 /* Force ACLs on HFS+ file systems. */
333 if (vfs_extendedsecurity(HFSTOVFS(hfsmp)) == 0) {
334 vfs_setextendedsecurity(HFSTOVFS(hfsmp));
335 }
336 }
337 }
338
339 /* Update file system parameters. */
340 retval = hfs_changefs(mp, &args);
341
342 } else /* not an update request */ {
343
344 /* Set the mount flag to indicate that we support volfs */
345 vfs_setflags(mp, (u_int64_t)((unsigned int)MNT_DOVOLFS));
346
347 hfs_chashinit_finish();
348
349 retval = hfs_mountfs(devvp, mp, &args, 0, context);
350 }
351 out:
352 if (retval == 0) {
353 (void)hfs_statfs(mp, vfs_statfs(mp), context);
354 }
355 return (retval);
356 }
357
358
359 struct hfs_changefs_cargs {
360 struct hfsmount *hfsmp;
361 int namefix;
362 int permfix;
363 int permswitch;
364 };
365
366 static int
367 hfs_changefs_callback(struct vnode *vp, void *cargs)
368 {
369 ExtendedVCB *vcb;
370 struct cnode *cp;
371 struct cat_desc cndesc;
372 struct cat_attr cnattr;
373 struct hfs_changefs_cargs *args;
374
375 args = (struct hfs_changefs_cargs *)cargs;
376
377 cp = VTOC(vp);
378 vcb = HFSTOVCB(args->hfsmp);
379
380 if (cat_lookup(args->hfsmp, &cp->c_desc, 0, &cndesc, &cnattr, NULL, NULL)) {
381 /*
382 * If we couldn't find this guy skip to the next one
383 */
384 if (args->namefix)
385 cache_purge(vp);
386
387 return (VNODE_RETURNED);
388 }
389 /*
390 * Get the real uid/gid and perm mask from disk.
391 */
392 if (args->permswitch || args->permfix) {
393 cp->c_uid = cnattr.ca_uid;
394 cp->c_gid = cnattr.ca_gid;
395 cp->c_mode = cnattr.ca_mode;
396 }
397 /*
398 * If we're switching name converters then...
399 * Remove the existing entry from the namei cache.
400 * Update name to one based on new encoder.
401 */
402 if (args->namefix) {
403 cache_purge(vp);
404 replace_desc(cp, &cndesc);
405
406 if (cndesc.cd_cnid == kHFSRootFolderID) {
407 strlcpy((char *)vcb->vcbVN, (const char *)cp->c_desc.cd_nameptr, NAME_MAX+1);
408 cp->c_desc.cd_encoding = args->hfsmp->hfs_encoding;
409 }
410 } else {
411 cat_releasedesc(&cndesc);
412 }
413 return (VNODE_RETURNED);
414 }
415
416 /* Change fs mount parameters */
417 static int
418 hfs_changefs(struct mount *mp, struct hfs_mount_args *args)
419 {
420 int retval = 0;
421 int namefix, permfix, permswitch;
422 struct hfsmount *hfsmp;
423 ExtendedVCB *vcb;
424 hfs_to_unicode_func_t get_unicode_func;
425 unicode_to_hfs_func_t get_hfsname_func;
426 u_long old_encoding = 0;
427 struct hfs_changefs_cargs cargs;
428 u_int32_t mount_flags;
429
430 hfsmp = VFSTOHFS(mp);
431 vcb = HFSTOVCB(hfsmp);
432 mount_flags = (unsigned int)vfs_flags(mp);
433
434 permswitch = (((hfsmp->hfs_flags & HFS_UNKNOWN_PERMS) &&
435 ((mount_flags & MNT_UNKNOWNPERMISSIONS) == 0)) ||
436 (((hfsmp->hfs_flags & HFS_UNKNOWN_PERMS) == 0) &&
437 (mount_flags & MNT_UNKNOWNPERMISSIONS)));
438
439 /* The root filesystem must operate with actual permissions: */
440 if (permswitch && (mount_flags & MNT_ROOTFS) && (mount_flags & MNT_UNKNOWNPERMISSIONS)) {
441 vfs_clearflags(mp, (u_int64_t)((unsigned int)MNT_UNKNOWNPERMISSIONS)); /* Just say "No". */
442 return EINVAL;
443 }
444 if (mount_flags & MNT_UNKNOWNPERMISSIONS)
445 hfsmp->hfs_flags |= HFS_UNKNOWN_PERMS;
446 else
447 hfsmp->hfs_flags &= ~HFS_UNKNOWN_PERMS;
448
449 namefix = permfix = 0;
450
451 /*
452 * Tracking of hot files requires up-to-date access times. So if
453 * access time updates are disabled, we must also disable hot files.
454 */
455 if (mount_flags & MNT_NOATIME) {
456 (void) hfs_recording_suspend(hfsmp);
457 }
458
459 /* Change the timezone (Note: this affects all hfs volumes and hfs+ volume create dates) */
460 if (args->hfs_timezone.tz_minuteswest != VNOVAL) {
461 gTimeZone = args->hfs_timezone;
462 }
463
464 /* Change the default uid, gid and/or mask */
465 if ((args->hfs_uid != (uid_t)VNOVAL) && (hfsmp->hfs_uid != args->hfs_uid)) {
466 hfsmp->hfs_uid = args->hfs_uid;
467 if (vcb->vcbSigWord == kHFSPlusSigWord)
468 ++permfix;
469 }
470 if ((args->hfs_gid != (gid_t)VNOVAL) && (hfsmp->hfs_gid != args->hfs_gid)) {
471 hfsmp->hfs_gid = args->hfs_gid;
472 if (vcb->vcbSigWord == kHFSPlusSigWord)
473 ++permfix;
474 }
475 if (args->hfs_mask != (mode_t)VNOVAL) {
476 if (hfsmp->hfs_dir_mask != (args->hfs_mask & ALLPERMS)) {
477 hfsmp->hfs_dir_mask = args->hfs_mask & ALLPERMS;
478 hfsmp->hfs_file_mask = args->hfs_mask & ALLPERMS;
479 if ((args->flags != VNOVAL) && (args->flags & HFSFSMNT_NOXONFILES))
480 hfsmp->hfs_file_mask = (args->hfs_mask & DEFFILEMODE);
481 if (vcb->vcbSigWord == kHFSPlusSigWord)
482 ++permfix;
483 }
484 }
485
486 /* Change the hfs encoding value (hfs only) */
487 if ((vcb->vcbSigWord == kHFSSigWord) &&
488 (args->hfs_encoding != (u_long)VNOVAL) &&
489 (hfsmp->hfs_encoding != args->hfs_encoding)) {
490
491 retval = hfs_getconverter(args->hfs_encoding, &get_unicode_func, &get_hfsname_func);
492 if (retval)
493 goto exit;
494
495 /*
496 * Connect the new hfs_get_unicode converter but leave
497 * the old hfs_get_hfsname converter in place so that
498 * we can lookup existing vnodes to get their correctly
499 * encoded names.
500 *
501 * When we're all finished, we can then connect the new
502 * hfs_get_hfsname converter and release our interest
503 * in the old converters.
504 */
505 hfsmp->hfs_get_unicode = get_unicode_func;
506 old_encoding = hfsmp->hfs_encoding;
507 hfsmp->hfs_encoding = args->hfs_encoding;
508 ++namefix;
509 }
510
511 if (!(namefix || permfix || permswitch))
512 goto exit;
513
514 /* XXX 3762912 hack to support HFS filesystem 'owner' */
515 if (permfix)
516 vfs_setowner(mp,
517 hfsmp->hfs_uid == UNKNOWNUID ? KAUTH_UID_NONE : hfsmp->hfs_uid,
518 hfsmp->hfs_gid == UNKNOWNGID ? KAUTH_GID_NONE : hfsmp->hfs_gid);
519
520 /*
521 * For each active vnode fix things that changed
522 *
523 * Note that we can visit a vnode more than once
524 * and we can race with fsync.
525 *
526 * hfs_changefs_callback will be called for each vnode
527 * hung off of this mount point
528 * the vnode will be
529 * properly referenced and unreferenced around the callback
530 */
531 cargs.hfsmp = hfsmp;
532 cargs.namefix = namefix;
533 cargs.permfix = permfix;
534 cargs.permswitch = permswitch;
535
536 vnode_iterate(mp, 0, hfs_changefs_callback, (void *)&cargs);
537
538 /*
539 * If we're switching name converters we can now
540 * connect the new hfs_get_hfsname converter and
541 * release our interest in the old converters.
542 */
543 if (namefix) {
544 hfsmp->hfs_get_hfsname = get_hfsname_func;
545 vcb->volumeNameEncodingHint = args->hfs_encoding;
546 (void) hfs_relconverter(old_encoding);
547 }
548 exit:
549 return (retval);
550 }
551
552
553 struct hfs_reload_cargs {
554 struct hfsmount *hfsmp;
555 int error;
556 };
557
558 static int
559 hfs_reload_callback(struct vnode *vp, void *cargs)
560 {
561 struct cnode *cp;
562 struct hfs_reload_cargs *args;
563
564 args = (struct hfs_reload_cargs *)cargs;
565 /*
566 * flush all the buffers associated with this node
567 */
568 (void) buf_invalidateblks(vp, 0, 0, 0);
569
570 cp = VTOC(vp);
571 /*
572 * Remove any directory hints
573 */
574 if (vnode_isdir(vp))
575 hfs_reldirhints(cp, 0);
576
577 /*
578 * Re-read cnode data for all active vnodes (non-metadata files).
579 */
580 if (!vnode_issystem(vp) && !VNODE_IS_RSRC(vp)) {
581 struct cat_fork *datafork;
582 struct cat_desc desc;
583
584 datafork = cp->c_datafork ? &cp->c_datafork->ff_data : NULL;
585
586 /* lookup by fileID since name could have changed */
587 if ((args->error = cat_idlookup(args->hfsmp, cp->c_fileid, 0, &desc, &cp->c_attr, datafork)))
588 return (VNODE_RETURNED_DONE);
589
590 /* update cnode's catalog descriptor */
591 (void) replace_desc(cp, &desc);
592 }
593 return (VNODE_RETURNED);
594 }
595
596 /*
597 * Reload all incore data for a filesystem (used after running fsck on
598 * the root filesystem and finding things to fix). The filesystem must
599 * be mounted read-only.
600 *
601 * Things to do to update the mount:
602 * invalidate all cached meta-data.
603 * invalidate all inactive vnodes.
604 * invalidate all cached file data.
605 * re-read volume header from disk.
606 * re-load meta-file info (extents, file size).
607 * re-load B-tree header data.
608 * re-read cnode data for all active vnodes.
609 */
610 static int
611 hfs_reload(struct mount *mountp)
612 {
613 register struct vnode *devvp;
614 struct buf *bp;
615 int sectorsize;
616 int error, i;
617 struct hfsmount *hfsmp;
618 struct HFSPlusVolumeHeader *vhp;
619 ExtendedVCB *vcb;
620 struct filefork *forkp;
621 struct cat_desc cndesc;
622 struct hfs_reload_cargs args;
623
624 hfsmp = VFSTOHFS(mountp);
625 vcb = HFSTOVCB(hfsmp);
626
627 if (vcb->vcbSigWord == kHFSSigWord)
628 return (EINVAL); /* rooting from HFS is not supported! */
629
630 /*
631 * Invalidate all cached meta-data.
632 */
633 devvp = hfsmp->hfs_devvp;
634 if (buf_invalidateblks(devvp, 0, 0, 0))
635 panic("hfs_reload: dirty1");
636
637 args.hfsmp = hfsmp;
638 args.error = 0;
639 /*
640 * hfs_reload_callback will be called for each vnode
641 * hung off of this mount point that can't be recycled...
642 * vnode_iterate will recycle those that it can (the VNODE_RELOAD option)
643 * the vnode will be in an 'unbusy' state (VNODE_WAIT) and
644 * properly referenced and unreferenced around the callback
645 */
646 vnode_iterate(mountp, VNODE_RELOAD | VNODE_WAIT, hfs_reload_callback, (void *)&args);
647
648 if (args.error)
649 return (args.error);
650
651 /*
652 * Re-read VolumeHeader from disk.
653 */
654 sectorsize = hfsmp->hfs_phys_block_size;
655
656 error = (int)buf_meta_bread(hfsmp->hfs_devvp,
657 (daddr64_t)((vcb->hfsPlusIOPosOffset / sectorsize) + HFS_PRI_SECTOR(sectorsize)),
658 sectorsize, NOCRED, &bp);
659 if (error) {
660 if (bp != NULL)
661 buf_brelse(bp);
662 return (error);
663 }
664
665 vhp = (HFSPlusVolumeHeader *) (buf_dataptr(bp) + HFS_PRI_OFFSET(sectorsize));
666
667 /* Do a quick sanity check */
668 if ((SWAP_BE16(vhp->signature) != kHFSPlusSigWord &&
669 SWAP_BE16(vhp->signature) != kHFSXSigWord) ||
670 (SWAP_BE16(vhp->version) != kHFSPlusVersion &&
671 SWAP_BE16(vhp->version) != kHFSXVersion) ||
672 SWAP_BE32(vhp->blockSize) != vcb->blockSize) {
673 buf_brelse(bp);
674 return (EIO);
675 }
676
677 vcb->vcbLsMod = to_bsd_time(SWAP_BE32(vhp->modifyDate));
678 vcb->vcbAtrb = SWAP_BE32 (vhp->attributes);
679 vcb->vcbJinfoBlock = SWAP_BE32(vhp->journalInfoBlock);
680 vcb->vcbClpSiz = SWAP_BE32 (vhp->rsrcClumpSize);
681 vcb->vcbNxtCNID = SWAP_BE32 (vhp->nextCatalogID);
682 vcb->vcbVolBkUp = to_bsd_time(SWAP_BE32(vhp->backupDate));
683 vcb->vcbWrCnt = SWAP_BE32 (vhp->writeCount);
684 vcb->vcbFilCnt = SWAP_BE32 (vhp->fileCount);
685 vcb->vcbDirCnt = SWAP_BE32 (vhp->folderCount);
686 HFS_UPDATE_NEXT_ALLOCATION(vcb, SWAP_BE32 (vhp->nextAllocation));
687 vcb->totalBlocks = SWAP_BE32 (vhp->totalBlocks);
688 vcb->freeBlocks = SWAP_BE32 (vhp->freeBlocks);
689 vcb->encodingsBitmap = SWAP_BE64 (vhp->encodingsBitmap);
690 bcopy(vhp->finderInfo, vcb->vcbFndrInfo, sizeof(vhp->finderInfo));
691 vcb->localCreateDate = SWAP_BE32 (vhp->createDate); /* hfs+ create date is in local time */
692
693 /*
694 * Re-load meta-file vnode data (extent info, file size, etc).
695 */
696 forkp = VTOF((struct vnode *)vcb->extentsRefNum);
697 for (i = 0; i < kHFSPlusExtentDensity; i++) {
698 forkp->ff_extents[i].startBlock =
699 SWAP_BE32 (vhp->extentsFile.extents[i].startBlock);
700 forkp->ff_extents[i].blockCount =
701 SWAP_BE32 (vhp->extentsFile.extents[i].blockCount);
702 }
703 forkp->ff_size = SWAP_BE64 (vhp->extentsFile.logicalSize);
704 forkp->ff_blocks = SWAP_BE32 (vhp->extentsFile.totalBlocks);
705 forkp->ff_clumpsize = SWAP_BE32 (vhp->extentsFile.clumpSize);
706
707
708 forkp = VTOF((struct vnode *)vcb->catalogRefNum);
709 for (i = 0; i < kHFSPlusExtentDensity; i++) {
710 forkp->ff_extents[i].startBlock =
711 SWAP_BE32 (vhp->catalogFile.extents[i].startBlock);
712 forkp->ff_extents[i].blockCount =
713 SWAP_BE32 (vhp->catalogFile.extents[i].blockCount);
714 }
715 forkp->ff_size = SWAP_BE64 (vhp->catalogFile.logicalSize);
716 forkp->ff_blocks = SWAP_BE32 (vhp->catalogFile.totalBlocks);
717 forkp->ff_clumpsize = SWAP_BE32 (vhp->catalogFile.clumpSize);
718
719 if (hfsmp->hfs_attribute_vp) {
720 forkp = VTOF(hfsmp->hfs_attribute_vp);
721 for (i = 0; i < kHFSPlusExtentDensity; i++) {
722 forkp->ff_extents[i].startBlock =
723 SWAP_BE32 (vhp->attributesFile.extents[i].startBlock);
724 forkp->ff_extents[i].blockCount =
725 SWAP_BE32 (vhp->attributesFile.extents[i].blockCount);
726 }
727 forkp->ff_size = SWAP_BE64 (vhp->attributesFile.logicalSize);
728 forkp->ff_blocks = SWAP_BE32 (vhp->attributesFile.totalBlocks);
729 forkp->ff_clumpsize = SWAP_BE32 (vhp->attributesFile.clumpSize);
730 }
731
732 forkp = VTOF((struct vnode *)vcb->allocationsRefNum);
733 for (i = 0; i < kHFSPlusExtentDensity; i++) {
734 forkp->ff_extents[i].startBlock =
735 SWAP_BE32 (vhp->allocationFile.extents[i].startBlock);
736 forkp->ff_extents[i].blockCount =
737 SWAP_BE32 (vhp->allocationFile.extents[i].blockCount);
738 }
739 forkp->ff_size = SWAP_BE64 (vhp->allocationFile.logicalSize);
740 forkp->ff_blocks = SWAP_BE32 (vhp->allocationFile.totalBlocks);
741 forkp->ff_clumpsize = SWAP_BE32 (vhp->allocationFile.clumpSize);
742
743 buf_brelse(bp);
744 vhp = NULL;
745
746 /*
747 * Re-load B-tree header data
748 */
749 forkp = VTOF((struct vnode *)vcb->extentsRefNum);
750 if ( (error = MacToVFSError( BTReloadData((FCB*)forkp) )) )
751 return (error);
752
753 forkp = VTOF((struct vnode *)vcb->catalogRefNum);
754 if ( (error = MacToVFSError( BTReloadData((FCB*)forkp) )) )
755 return (error);
756
757 if (hfsmp->hfs_attribute_vp) {
758 forkp = VTOF(hfsmp->hfs_attribute_vp);
759 if ( (error = MacToVFSError( BTReloadData((FCB*)forkp) )) )
760 return (error);
761 }
762
763 /* Reload the volume name */
764 if ((error = cat_idlookup(hfsmp, kHFSRootFolderID, 0, &cndesc, NULL, NULL)))
765 return (error);
766 vcb->volumeNameEncodingHint = cndesc.cd_encoding;
767 bcopy(cndesc.cd_nameptr, vcb->vcbVN, min(255, cndesc.cd_namelen));
768 cat_releasedesc(&cndesc);
769
770 /* Re-establish private/hidden directories. */
771 hfs_privatedir_init(hfsmp, FILE_HARDLINKS);
772 hfs_privatedir_init(hfsmp, DIR_HARDLINKS);
773
774 /* In case any volume information changed to trigger a notification */
775 hfs_generate_volume_notifications(hfsmp);
776
777 return (0);
778 }
779
780
781 /*
782 * Common code for mount and mountroot
783 */
784 static int
785 hfs_mountfs(struct vnode *devvp, struct mount *mp, struct hfs_mount_args *args,
786 int journal_replay_only, vfs_context_t context)
787 {
788 struct proc *p = vfs_context_proc(context);
789 int retval = E_NONE;
790 struct hfsmount *hfsmp;
791 struct buf *bp;
792 dev_t dev;
793 HFSMasterDirectoryBlock *mdbp;
794 int ronly;
795 #if QUOTA
796 int i;
797 #endif
798 int mntwrapper;
799 kauth_cred_t cred;
800 u_int64_t disksize;
801 daddr64_t blkcnt;
802 u_int32_t blksize;
803 u_int32_t minblksize;
804 u_int32_t iswritable;
805 daddr64_t mdb_offset;
806 int isvirtual = 0;
807
808 ronly = vfs_isrdonly(mp);
809 dev = vnode_specrdev(devvp);
810 cred = p ? vfs_context_ucred(context) : NOCRED;
811 mntwrapper = 0;
812
813 bp = NULL;
814 hfsmp = NULL;
815 mdbp = NULL;
816 minblksize = kHFSBlockSize;
817
818 /* Advisory locking should be handled at the VFS layer */
819 vfs_setlocklocal(mp);
820
821 /* Get the real physical block size. */
822 if (VNOP_IOCTL(devvp, DKIOCGETBLOCKSIZE, (caddr_t)&blksize, 0, context)) {
823 retval = ENXIO;
824 goto error_exit;
825 }
826 /* Switch to 512 byte sectors (temporarily) */
827 if (blksize > 512) {
828 u_int32_t size512 = 512;
829
830 if (VNOP_IOCTL(devvp, DKIOCSETBLOCKSIZE, (caddr_t)&size512, FWRITE, context)) {
831 retval = ENXIO;
832 goto error_exit;
833 }
834 }
835 /* Get the number of 512 byte physical blocks. */
836 if (VNOP_IOCTL(devvp, DKIOCGETBLOCKCOUNT, (caddr_t)&blkcnt, 0, context)) {
837 /* resetting block size may fail if getting block count did */
838 (void)VNOP_IOCTL(devvp, DKIOCSETBLOCKSIZE, (caddr_t)&blksize, FWRITE, context);
839
840 retval = ENXIO;
841 goto error_exit;
842 }
843 /* Compute an accurate disk size (i.e. within 512 bytes) */
844 disksize = (u_int64_t)blkcnt * (u_int64_t)512;
845
846 /*
847 * On Tiger it is not necessary to switch the device
848 * block size to be 4k if there are more than 31-bits
849 * worth of blocks but to insure compatibility with
850 * pre-Tiger systems we have to do it.
851 */
852 if (blkcnt > 0x000000007fffffff) {
853 minblksize = blksize = 4096;
854 }
855
856 /* Now switch to our preferred physical block size. */
857 if (blksize > 512) {
858 if (VNOP_IOCTL(devvp, DKIOCSETBLOCKSIZE, (caddr_t)&blksize, FWRITE, context)) {
859 retval = ENXIO;
860 goto error_exit;
861 }
862 /* Get the count of physical blocks. */
863 if (VNOP_IOCTL(devvp, DKIOCGETBLOCKCOUNT, (caddr_t)&blkcnt, 0, context)) {
864 retval = ENXIO;
865 goto error_exit;
866 }
867 }
868 /*
869 * At this point:
870 * minblksize is the minimum physical block size
871 * blksize has our preferred physical block size
872 * blkcnt has the total number of physical blocks
873 */
874
875 mdb_offset = (daddr64_t)HFS_PRI_SECTOR(blksize);
876 if ((retval = (int)buf_meta_bread(devvp, mdb_offset, blksize, cred, &bp))) {
877 goto error_exit;
878 }
879 MALLOC(mdbp, HFSMasterDirectoryBlock *, kMDBSize, M_TEMP, M_WAITOK);
880 bcopy((char *)buf_dataptr(bp) + HFS_PRI_OFFSET(blksize), mdbp, kMDBSize);
881 buf_brelse(bp);
882 bp = NULL;
883
884 MALLOC(hfsmp, struct hfsmount *, sizeof(struct hfsmount), M_HFSMNT, M_WAITOK);
885 bzero(hfsmp, sizeof(struct hfsmount));
886
887 /*
888 * Init the volume information structure
889 */
890
891 lck_mtx_init(&hfsmp->hfs_mutex, hfs_mutex_group, hfs_lock_attr);
892 lck_mtx_init(&hfsmp->hfc_mutex, hfs_mutex_group, hfs_lock_attr);
893 lck_rw_init(&hfsmp->hfs_global_lock, hfs_rwlock_group, hfs_lock_attr);
894 lck_rw_init(&hfsmp->hfs_insync, hfs_rwlock_group, hfs_lock_attr);
895
896 vfs_setfsprivate(mp, hfsmp);
897 hfsmp->hfs_mp = mp; /* Make VFSTOHFS work */
898 hfsmp->hfs_raw_dev = vnode_specrdev(devvp);
899 hfsmp->hfs_devvp = devvp;
900 vnode_ref(devvp); /* Hold a ref on the device, dropped when hfsmp is freed. */
901 hfsmp->hfs_phys_block_size = blksize;
902 hfsmp->hfs_phys_block_count = blkcnt;
903 hfsmp->hfs_flags |= HFS_WRITEABLE_MEDIA;
904 if (ronly)
905 hfsmp->hfs_flags |= HFS_READ_ONLY;
906 if (((unsigned int)vfs_flags(mp)) & MNT_UNKNOWNPERMISSIONS)
907 hfsmp->hfs_flags |= HFS_UNKNOWN_PERMS;
908
909 #if QUOTA
910 for (i = 0; i < MAXQUOTAS; i++)
911 dqfileinit(&hfsmp->hfs_qfiles[i]);
912 #endif
913
914 if (args) {
915 hfsmp->hfs_uid = (args->hfs_uid == (uid_t)VNOVAL) ? UNKNOWNUID : args->hfs_uid;
916 if (hfsmp->hfs_uid == 0xfffffffd) hfsmp->hfs_uid = UNKNOWNUID;
917 hfsmp->hfs_gid = (args->hfs_gid == (gid_t)VNOVAL) ? UNKNOWNGID : args->hfs_gid;
918 if (hfsmp->hfs_gid == 0xfffffffd) hfsmp->hfs_gid = UNKNOWNGID;
919 vfs_setowner(mp, hfsmp->hfs_uid, hfsmp->hfs_gid); /* tell the VFS */
920 if (args->hfs_mask != (mode_t)VNOVAL) {
921 hfsmp->hfs_dir_mask = args->hfs_mask & ALLPERMS;
922 if (args->flags & HFSFSMNT_NOXONFILES) {
923 hfsmp->hfs_file_mask = (args->hfs_mask & DEFFILEMODE);
924 } else {
925 hfsmp->hfs_file_mask = args->hfs_mask & ALLPERMS;
926 }
927 } else {
928 hfsmp->hfs_dir_mask = UNKNOWNPERMISSIONS & ALLPERMS; /* 0777: rwx---rwx */
929 hfsmp->hfs_file_mask = UNKNOWNPERMISSIONS & DEFFILEMODE; /* 0666: no --x by default? */
930 }
931 if ((args->flags != (int)VNOVAL) && (args->flags & HFSFSMNT_WRAPPER))
932 mntwrapper = 1;
933 } else {
934 /* Even w/o explicit mount arguments, MNT_UNKNOWNPERMISSIONS requires setting up uid, gid, and mask: */
935 if (((unsigned int)vfs_flags(mp)) & MNT_UNKNOWNPERMISSIONS) {
936 hfsmp->hfs_uid = UNKNOWNUID;
937 hfsmp->hfs_gid = UNKNOWNGID;
938 vfs_setowner(mp, hfsmp->hfs_uid, hfsmp->hfs_gid); /* tell the VFS */
939 hfsmp->hfs_dir_mask = UNKNOWNPERMISSIONS & ALLPERMS; /* 0777: rwx---rwx */
940 hfsmp->hfs_file_mask = UNKNOWNPERMISSIONS & DEFFILEMODE; /* 0666: no --x by default? */
941 }
942 }
943
944 /* Find out if disk media is writable. */
945 if (VNOP_IOCTL(devvp, DKIOCISWRITABLE, (caddr_t)&iswritable, 0, context) == 0) {
946 if (iswritable)
947 hfsmp->hfs_flags |= HFS_WRITEABLE_MEDIA;
948 else
949 hfsmp->hfs_flags &= ~HFS_WRITEABLE_MEDIA;
950 }
951
952 // record the current time at which we're mounting this volume
953 struct timeval tv;
954 microtime(&tv);
955 hfsmp->hfs_mount_time = tv.tv_sec;
956
957 /* Mount a standard HFS disk */
958 if ((SWAP_BE16(mdbp->drSigWord) == kHFSSigWord) &&
959 (mntwrapper || (SWAP_BE16(mdbp->drEmbedSigWord) != kHFSPlusSigWord))) {
960
961 /* If only journal replay is requested, exit immediately */
962 if (journal_replay_only) {
963 retval = 0;
964 goto error_exit;
965 }
966
967 if ((vfs_flags(mp) & MNT_ROOTFS)) {
968 retval = EINVAL; /* Cannot root from HFS standard disks */
969 goto error_exit;
970 }
971 /* HFS disks can only use 512 byte physical blocks */
972 if (blksize > kHFSBlockSize) {
973 blksize = kHFSBlockSize;
974 if (VNOP_IOCTL(devvp, DKIOCSETBLOCKSIZE, (caddr_t)&blksize, FWRITE, context)) {
975 retval = ENXIO;
976 goto error_exit;
977 }
978 if (VNOP_IOCTL(devvp, DKIOCGETBLOCKCOUNT, (caddr_t)&blkcnt, 0, context)) {
979 retval = ENXIO;
980 goto error_exit;
981 }
982 hfsmp->hfs_phys_block_size = blksize;
983 hfsmp->hfs_phys_block_count = blkcnt;
984 }
985 if (args) {
986 hfsmp->hfs_encoding = args->hfs_encoding;
987 HFSTOVCB(hfsmp)->volumeNameEncodingHint = args->hfs_encoding;
988
989 /* establish the timezone */
990 gTimeZone = args->hfs_timezone;
991 }
992
993 retval = hfs_getconverter(hfsmp->hfs_encoding, &hfsmp->hfs_get_unicode,
994 &hfsmp->hfs_get_hfsname);
995 if (retval)
996 goto error_exit;
997
998 retval = hfs_MountHFSVolume(hfsmp, mdbp, p);
999 if (retval)
1000 (void) hfs_relconverter(hfsmp->hfs_encoding);
1001
1002 } else /* Mount an HFS Plus disk */ {
1003 HFSPlusVolumeHeader *vhp;
1004 off_t embeddedOffset;
1005 int jnl_disable = 0;
1006
1007 /* Get the embedded Volume Header */
1008 if (SWAP_BE16(mdbp->drEmbedSigWord) == kHFSPlusSigWord) {
1009 embeddedOffset = SWAP_BE16(mdbp->drAlBlSt) * kHFSBlockSize;
1010 embeddedOffset += (u_int64_t)SWAP_BE16(mdbp->drEmbedExtent.startBlock) *
1011 (u_int64_t)SWAP_BE32(mdbp->drAlBlkSiz);
1012
1013 /*
1014 * If the embedded volume doesn't start on a block
1015 * boundary, then switch the device to a 512-byte
1016 * block size so everything will line up on a block
1017 * boundary.
1018 */
1019 if ((embeddedOffset % blksize) != 0) {
1020 printf("HFS Mount: embedded volume offset not"
1021 " a multiple of physical block size (%d);"
1022 " switching to 512\n", blksize);
1023 blksize = 512;
1024 if (VNOP_IOCTL(devvp, DKIOCSETBLOCKSIZE,
1025 (caddr_t)&blksize, FWRITE, context)) {
1026 retval = ENXIO;
1027 goto error_exit;
1028 }
1029 if (VNOP_IOCTL(devvp, DKIOCGETBLOCKCOUNT,
1030 (caddr_t)&blkcnt, 0, context)) {
1031 retval = ENXIO;
1032 goto error_exit;
1033 }
1034 /* Note: relative block count adjustment */
1035 hfsmp->hfs_phys_block_count *=
1036 hfsmp->hfs_phys_block_size / blksize;
1037 hfsmp->hfs_phys_block_size = blksize;
1038 }
1039
1040 disksize = (u_int64_t)SWAP_BE16(mdbp->drEmbedExtent.blockCount) *
1041 (u_int64_t)SWAP_BE32(mdbp->drAlBlkSiz);
1042
1043 hfsmp->hfs_phys_block_count = disksize / blksize;
1044
1045 mdb_offset = (daddr64_t)((embeddedOffset / blksize) + HFS_PRI_SECTOR(blksize));
1046 retval = (int)buf_meta_bread(devvp, mdb_offset, blksize, cred, &bp);
1047 if (retval)
1048 goto error_exit;
1049 bcopy((char *)buf_dataptr(bp) + HFS_PRI_OFFSET(blksize), mdbp, 512);
1050 buf_brelse(bp);
1051 bp = NULL;
1052 vhp = (HFSPlusVolumeHeader*) mdbp;
1053
1054 } else /* pure HFS+ */ {
1055 embeddedOffset = 0;
1056 vhp = (HFSPlusVolumeHeader*) mdbp;
1057 }
1058
1059 /*
1060 * On inconsistent disks, do not allow read-write mount
1061 * unless it is the boot volume being mounted.
1062 */
1063 if (!(vfs_flags(mp) & MNT_ROOTFS) &&
1064 (SWAP_BE32(vhp->attributes) & kHFSVolumeInconsistentMask) &&
1065 !(hfsmp->hfs_flags & HFS_READ_ONLY)) {
1066 retval = EINVAL;
1067 goto error_exit;
1068 }
1069
1070
1071 // XXXdbg
1072 //
1073 hfsmp->jnl = NULL;
1074 hfsmp->jvp = NULL;
1075 if (args != NULL && (args->flags & HFSFSMNT_EXTENDED_ARGS) &&
1076 args->journal_disable) {
1077 jnl_disable = 1;
1078 }
1079
1080 //
1081 // We only initialize the journal here if the last person
1082 // to mount this volume was journaling aware. Otherwise
1083 // we delay journal initialization until later at the end
1084 // of hfs_MountHFSPlusVolume() because the last person who
1085 // mounted it could have messed things up behind our back
1086 // (so we need to go find the .journal file, make sure it's
1087 // the right size, re-sync up if it was moved, etc).
1088 //
1089 if ( (SWAP_BE32(vhp->lastMountedVersion) == kHFSJMountVersion)
1090 && (SWAP_BE32(vhp->attributes) & kHFSVolumeJournaledMask)
1091 && !jnl_disable) {
1092
1093 // if we're able to init the journal, mark the mount
1094 // point as journaled.
1095 //
1096 if (hfs_early_journal_init(hfsmp, vhp, args, embeddedOffset, mdb_offset, mdbp, cred) == 0) {
1097 vfs_setflags(mp, (u_int64_t)((unsigned int)MNT_JOURNALED));
1098 } else {
1099 // if the journal failed to open, then set the lastMountedVersion
1100 // to be "FSK!" which fsck_hfs will see and force the fsck instead
1101 // of just bailing out because the volume is journaled.
1102 if (!ronly) {
1103 HFSPlusVolumeHeader *jvhp;
1104
1105 hfsmp->hfs_flags |= HFS_NEED_JNL_RESET;
1106
1107 if (mdb_offset == 0) {
1108 mdb_offset = (daddr64_t)((embeddedOffset / blksize) + HFS_PRI_SECTOR(blksize));
1109 }
1110
1111 bp = NULL;
1112 retval = (int)buf_meta_bread(devvp, mdb_offset, blksize, cred, &bp);
1113 if (retval == 0) {
1114 jvhp = (HFSPlusVolumeHeader *)(buf_dataptr(bp) + HFS_PRI_OFFSET(blksize));
1115
1116 if (SWAP_BE16(jvhp->signature) == kHFSPlusSigWord || SWAP_BE16(jvhp->signature) == kHFSXSigWord) {
1117 printf ("hfs(1): Journal replay fail. Writing lastMountVersion as FSK!\n");
1118 jvhp->lastMountedVersion = SWAP_BE32(kFSKMountVersion);
1119 buf_bwrite(bp);
1120 } else {
1121 buf_brelse(bp);
1122 }
1123 bp = NULL;
1124 } else if (bp) {
1125 buf_brelse(bp);
1126 // clear this so the error exit path won't try to use it
1127 bp = NULL;
1128 }
1129 }
1130
1131 // if this isn't the root device just bail out.
1132 // If it is the root device we just continue on
1133 // in the hopes that fsck_hfs will be able to
1134 // fix any damage that exists on the volume.
1135 if ( !(vfs_flags(mp) & MNT_ROOTFS)) {
1136 retval = EINVAL;
1137 goto error_exit;
1138 }
1139 }
1140 }
1141 // XXXdbg
1142
1143 /* Either the journal is replayed successfully, or there
1144 * was nothing to replay, or no journal exists. In any case,
1145 * return success.
1146 */
1147 if (journal_replay_only) {
1148 retval = 0;
1149 goto error_exit;
1150 }
1151
1152 (void) hfs_getconverter(0, &hfsmp->hfs_get_unicode, &hfsmp->hfs_get_hfsname);
1153
1154 retval = hfs_MountHFSPlusVolume(hfsmp, vhp, embeddedOffset, disksize, p, args, cred);
1155 /*
1156 * If the backend didn't like our physical blocksize
1157 * then retry with physical blocksize of 512.
1158 */
1159 if ((retval == ENXIO) && (blksize > 512) && (blksize != minblksize)) {
1160 printf("HFS Mount: could not use physical block size "
1161 "(%d) switching to 512\n", blksize);
1162 blksize = 512;
1163 if (VNOP_IOCTL(devvp, DKIOCSETBLOCKSIZE, (caddr_t)&blksize, FWRITE, context)) {
1164 retval = ENXIO;
1165 goto error_exit;
1166 }
1167 if (VNOP_IOCTL(devvp, DKIOCGETBLOCKCOUNT, (caddr_t)&blkcnt, 0, context)) {
1168 retval = ENXIO;
1169 goto error_exit;
1170 }
1171 devvp->v_specsize = blksize;
1172 /* Note: relative block count adjustment (in case this is an embedded volume). */
1173 hfsmp->hfs_phys_block_count *= hfsmp->hfs_phys_block_size / blksize;
1174 hfsmp->hfs_phys_block_size = blksize;
1175
1176 if (hfsmp->jnl) {
1177 // close and re-open this with the new block size
1178 journal_close(hfsmp->jnl);
1179 hfsmp->jnl = NULL;
1180 if (hfs_early_journal_init(hfsmp, vhp, args, embeddedOffset, mdb_offset, mdbp, cred) == 0) {
1181 vfs_setflags(mp, (u_int64_t)((unsigned int)MNT_JOURNALED));
1182 } else {
1183 // if the journal failed to open, then set the lastMountedVersion
1184 // to be "FSK!" which fsck_hfs will see and force the fsck instead
1185 // of just bailing out because the volume is journaled.
1186 if (!ronly) {
1187 HFSPlusVolumeHeader *jvhp;
1188
1189 hfsmp->hfs_flags |= HFS_NEED_JNL_RESET;
1190
1191 if (mdb_offset == 0) {
1192 mdb_offset = (daddr64_t)((embeddedOffset / blksize) + HFS_PRI_SECTOR(blksize));
1193 }
1194
1195 bp = NULL;
1196 retval = (int)buf_meta_bread(devvp, mdb_offset, blksize, cred, &bp);
1197 if (retval == 0) {
1198 jvhp = (HFSPlusVolumeHeader *)(buf_dataptr(bp) + HFS_PRI_OFFSET(blksize));
1199
1200 if (SWAP_BE16(jvhp->signature) == kHFSPlusSigWord || SWAP_BE16(jvhp->signature) == kHFSXSigWord) {
1201 printf ("hfs(2): Journal replay fail. Writing lastMountVersion as FSK!\n");
1202 jvhp->lastMountedVersion = SWAP_BE32(kFSKMountVersion);
1203 buf_bwrite(bp);
1204 } else {
1205 buf_brelse(bp);
1206 }
1207 bp = NULL;
1208 } else if (bp) {
1209 buf_brelse(bp);
1210 // clear this so the error exit path won't try to use it
1211 bp = NULL;
1212 }
1213 }
1214
1215 // if this isn't the root device just bail out.
1216 // If it is the root device we just continue on
1217 // in the hopes that fsck_hfs will be able to
1218 // fix any damage that exists on the volume.
1219 if ( !(vfs_flags(mp) & MNT_ROOTFS)) {
1220 retval = EINVAL;
1221 goto error_exit;
1222 }
1223 }
1224 }
1225
1226 /* Try again with a smaller block size... */
1227 retval = hfs_MountHFSPlusVolume(hfsmp, vhp, embeddedOffset, disksize, p, args, cred);
1228 }
1229 if (retval)
1230 (void) hfs_relconverter(0);
1231 }
1232
1233 // save off a snapshot of the mtime from the previous mount
1234 // (for matador).
1235 hfsmp->hfs_last_mounted_mtime = hfsmp->hfs_mtime;
1236
1237 if ( retval ) {
1238 goto error_exit;
1239 }
1240
1241 mp->mnt_vfsstat.f_fsid.val[0] = (long)dev;
1242 mp->mnt_vfsstat.f_fsid.val[1] = vfs_typenum(mp);
1243 vfs_setmaxsymlen(mp, 0);
1244 mp->mnt_vtable->vfc_threadsafe = TRUE;
1245 mp->mnt_vtable->vfc_vfsflags |= VFC_VFSNATIVEXATTR;
1246 #if NAMEDSTREAMS
1247 mp->mnt_kern_flag |= MNTK_NAMED_STREAMS;
1248 #endif
1249 if (!(hfsmp->hfs_flags & HFS_STANDARD)) {
1250 /* Tell VFS that we support directory hard links. */
1251 mp->mnt_vtable->vfc_vfsflags |= VFC_VFSDIRLINKS;
1252 } else {
1253 /* HFS standard doesn't support extended readdir! */
1254 mp->mnt_vtable->vfc_vfsflags &= ~VFC_VFSREADDIR_EXTENDED;
1255 }
1256
1257 if (args) {
1258 /*
1259 * Set the free space warning levels for a non-root volume:
1260 *
1261 * Set the lower freespace limit (the level that will trigger a warning)
1262 * to 5% of the volume size or 250MB, whichever is less, and the desired
1263 * level (which will cancel the alert request) to 1/2 above that limit.
1264 * Start looking for free space to drop below this level and generate a
1265 * warning immediately if needed:
1266 */
1267 hfsmp->hfs_freespace_notify_warninglimit =
1268 MIN(HFS_LOWDISKTRIGGERLEVEL / HFSTOVCB(hfsmp)->blockSize,
1269 (HFSTOVCB(hfsmp)->totalBlocks / 100) * HFS_LOWDISKTRIGGERFRACTION);
1270 hfsmp->hfs_freespace_notify_desiredlevel =
1271 MIN(HFS_LOWDISKSHUTOFFLEVEL / HFSTOVCB(hfsmp)->blockSize,
1272 (HFSTOVCB(hfsmp)->totalBlocks / 100) * HFS_LOWDISKSHUTOFFFRACTION);
1273 } else {
1274 /*
1275 * Set the free space warning levels for the root volume:
1276 *
1277 * Set the lower freespace limit (the level that will trigger a warning)
1278 * to 1% of the volume size or 50MB, whichever is less, and the desired
1279 * level (which will cancel the alert request) to 2% or 75MB, whichever is less.
1280 */
1281 hfsmp->hfs_freespace_notify_warninglimit =
1282 MIN(HFS_ROOTLOWDISKTRIGGERLEVEL / HFSTOVCB(hfsmp)->blockSize,
1283 (HFSTOVCB(hfsmp)->totalBlocks / 100) * HFS_ROOTLOWDISKTRIGGERFRACTION);
1284 hfsmp->hfs_freespace_notify_desiredlevel =
1285 MIN(HFS_ROOTLOWDISKSHUTOFFLEVEL / HFSTOVCB(hfsmp)->blockSize,
1286 (HFSTOVCB(hfsmp)->totalBlocks / 100) * HFS_ROOTLOWDISKSHUTOFFFRACTION);
1287 };
1288
1289 /* Check if the file system exists on virtual device, like disk image */
1290 if (VNOP_IOCTL(devvp, DKIOCISVIRTUAL, (caddr_t)&isvirtual, 0, context) == 0) {
1291 if (isvirtual) {
1292 hfsmp->hfs_flags |= HFS_VIRTUAL_DEVICE;
1293 }
1294 }
1295
1296 /*
1297 * Start looking for free space to drop below this level and generate a
1298 * warning immediately if needed:
1299 */
1300 hfsmp->hfs_notification_conditions = 0;
1301 hfs_generate_volume_notifications(hfsmp);
1302
1303 if (ronly == 0) {
1304 (void) hfs_flushvolumeheader(hfsmp, MNT_WAIT, 0);
1305 }
1306 FREE(mdbp, M_TEMP);
1307 return (0);
1308
1309 error_exit:
1310 if (bp)
1311 buf_brelse(bp);
1312 if (mdbp)
1313 FREE(mdbp, M_TEMP);
1314
1315 if (hfsmp && hfsmp->jvp && hfsmp->jvp != hfsmp->hfs_devvp) {
1316 (void)VNOP_CLOSE(hfsmp->jvp, ronly ? FREAD : FREAD|FWRITE, context);
1317 hfsmp->jvp = NULL;
1318 }
1319 if (hfsmp) {
1320 if (hfsmp->hfs_devvp) {
1321 vnode_rele(hfsmp->hfs_devvp);
1322 }
1323 FREE(hfsmp, M_HFSMNT);
1324 vfs_setfsprivate(mp, NULL);
1325 }
1326 return (retval);
1327 }
1328
1329
1330 /*
1331 * Make a filesystem operational.
1332 * Nothing to do at the moment.
1333 */
1334 /* ARGSUSED */
1335 static int
1336 hfs_start(__unused struct mount *mp, __unused int flags, __unused vfs_context_t context)
1337 {
1338 return (0);
1339 }
1340
1341
1342 /*
1343 * unmount system call
1344 */
1345 static int
1346 hfs_unmount(struct mount *mp, int mntflags, vfs_context_t context)
1347 {
1348 struct proc *p = vfs_context_proc(context);
1349 struct hfsmount *hfsmp = VFSTOHFS(mp);
1350 int retval = E_NONE;
1351 int flags;
1352 int force;
1353 int started_tr = 0;
1354
1355 flags = 0;
1356 force = 0;
1357 if (mntflags & MNT_FORCE) {
1358 flags |= FORCECLOSE;
1359 force = 1;
1360 }
1361
1362 if ((retval = hfs_flushfiles(mp, flags, p)) && !force)
1363 return (retval);
1364
1365 if (hfsmp->hfs_flags & HFS_METADATA_ZONE)
1366 (void) hfs_recording_suspend(hfsmp);
1367
1368 /*
1369 * Flush out the b-trees, volume bitmap and Volume Header
1370 */
1371 if ((hfsmp->hfs_flags & HFS_READ_ONLY) == 0) {
1372 retval = hfs_start_transaction(hfsmp);
1373 if (retval == 0) {
1374 started_tr = 1;
1375 } else if (!force) {
1376 goto err_exit;
1377 }
1378
1379 if (hfsmp->hfs_startup_vp) {
1380 (void) hfs_lock(VTOC(hfsmp->hfs_startup_vp), HFS_EXCLUSIVE_LOCK);
1381 retval = hfs_fsync(hfsmp->hfs_startup_vp, MNT_WAIT, 0, p);
1382 hfs_unlock(VTOC(hfsmp->hfs_startup_vp));
1383 if (retval && !force)
1384 goto err_exit;
1385 }
1386
1387 if (hfsmp->hfs_attribute_vp) {
1388 (void) hfs_lock(VTOC(hfsmp->hfs_attribute_vp), HFS_EXCLUSIVE_LOCK);
1389 retval = hfs_fsync(hfsmp->hfs_attribute_vp, MNT_WAIT, 0, p);
1390 hfs_unlock(VTOC(hfsmp->hfs_attribute_vp));
1391 if (retval && !force)
1392 goto err_exit;
1393 }
1394
1395 (void) hfs_lock(VTOC(hfsmp->hfs_catalog_vp), HFS_EXCLUSIVE_LOCK);
1396 retval = hfs_fsync(hfsmp->hfs_catalog_vp, MNT_WAIT, 0, p);
1397 hfs_unlock(VTOC(hfsmp->hfs_catalog_vp));
1398 if (retval && !force)
1399 goto err_exit;
1400
1401 (void) hfs_lock(VTOC(hfsmp->hfs_extents_vp), HFS_EXCLUSIVE_LOCK);
1402 retval = hfs_fsync(hfsmp->hfs_extents_vp, MNT_WAIT, 0, p);
1403 hfs_unlock(VTOC(hfsmp->hfs_extents_vp));
1404 if (retval && !force)
1405 goto err_exit;
1406
1407 if (hfsmp->hfs_allocation_vp) {
1408 (void) hfs_lock(VTOC(hfsmp->hfs_allocation_vp), HFS_EXCLUSIVE_LOCK);
1409 retval = hfs_fsync(hfsmp->hfs_allocation_vp, MNT_WAIT, 0, p);
1410 hfs_unlock(VTOC(hfsmp->hfs_allocation_vp));
1411 if (retval && !force)
1412 goto err_exit;
1413 }
1414
1415 if (hfsmp->hfc_filevp && vnode_issystem(hfsmp->hfc_filevp)) {
1416 retval = hfs_fsync(hfsmp->hfc_filevp, MNT_WAIT, 0, p);
1417 if (retval && !force)
1418 goto err_exit;
1419 }
1420
1421 /* If runtime corruption was detected, indicate that the volume
1422 * was not unmounted cleanly.
1423 */
1424 if (hfsmp->vcbAtrb & kHFSVolumeInconsistentMask) {
1425 HFSTOVCB(hfsmp)->vcbAtrb &= ~kHFSVolumeUnmountedMask;
1426 } else {
1427 HFSTOVCB(hfsmp)->vcbAtrb |= kHFSVolumeUnmountedMask;
1428 }
1429
1430 retval = hfs_flushvolumeheader(hfsmp, MNT_WAIT, 0);
1431 if (retval) {
1432 HFSTOVCB(hfsmp)->vcbAtrb &= ~kHFSVolumeUnmountedMask;
1433 if (!force)
1434 goto err_exit; /* could not flush everything */
1435 }
1436
1437 if (started_tr) {
1438 hfs_end_transaction(hfsmp);
1439 started_tr = 0;
1440 }
1441 }
1442
1443 if (hfsmp->jnl) {
1444 journal_flush(hfsmp->jnl);
1445 }
1446
1447 /*
1448 * Invalidate our caches and release metadata vnodes
1449 */
1450 (void) hfsUnmount(hfsmp, p);
1451
1452 /*
1453 * Last chance to dump unreferenced system files.
1454 */
1455 (void) vflush(mp, NULLVP, FORCECLOSE);
1456
1457 if (HFSTOVCB(hfsmp)->vcbSigWord == kHFSSigWord)
1458 (void) hfs_relconverter(hfsmp->hfs_encoding);
1459
1460 // XXXdbg
1461 if (hfsmp->jnl) {
1462 journal_close(hfsmp->jnl);
1463 hfsmp->jnl = NULL;
1464 }
1465
1466 VNOP_FSYNC(hfsmp->hfs_devvp, MNT_WAIT, context);
1467
1468 if (hfsmp->jvp && hfsmp->jvp != hfsmp->hfs_devvp) {
1469 retval = VNOP_CLOSE(hfsmp->jvp,
1470 hfsmp->hfs_flags & HFS_READ_ONLY ? FREAD : FREAD|FWRITE,
1471 context);
1472 vnode_put(hfsmp->jvp);
1473 hfsmp->jvp = NULL;
1474 }
1475 // XXXdbg
1476
1477 #ifdef HFS_SPARSE_DEV
1478 /* Drop our reference on the backing fs (if any). */
1479 if ((hfsmp->hfs_flags & HFS_HAS_SPARSE_DEVICE) && hfsmp->hfs_backingfs_rootvp) {
1480 struct vnode * tmpvp;
1481
1482 hfsmp->hfs_flags &= ~HFS_HAS_SPARSE_DEVICE;
1483 tmpvp = hfsmp->hfs_backingfs_rootvp;
1484 hfsmp->hfs_backingfs_rootvp = NULLVP;
1485 vnode_rele(tmpvp);
1486 }
1487 #endif /* HFS_SPARSE_DEV */
1488 lck_mtx_destroy(&hfsmp->hfc_mutex, hfs_mutex_group);
1489 vnode_rele(hfsmp->hfs_devvp);
1490 FREE(hfsmp, M_HFSMNT);
1491
1492 return (0);
1493
1494 err_exit:
1495 if (started_tr) {
1496 hfs_end_transaction(hfsmp);
1497 }
1498 return retval;
1499 }
1500
1501
1502 /*
1503 * Return the root of a filesystem.
1504 */
1505 static int
1506 hfs_vfs_root(struct mount *mp, struct vnode **vpp, __unused vfs_context_t context)
1507 {
1508 return hfs_vget(VFSTOHFS(mp), (cnid_t)kHFSRootFolderID, vpp, 1);
1509 }
1510
1511
1512 /*
1513 * Do operations associated with quotas
1514 */
1515 #if !QUOTA
1516 static int
1517 hfs_quotactl(__unused struct mount *mp, __unused int cmds, __unused uid_t uid, __unused caddr_t datap, __unused vfs_context_t context)
1518 {
1519 return (ENOTSUP);
1520 }
1521 #else
1522 static int
1523 hfs_quotactl(struct mount *mp, int cmds, uid_t uid, caddr_t datap, vfs_context_t context)
1524 {
1525 struct proc *p = vfs_context_proc(context);
1526 int cmd, type, error;
1527
1528 if (uid == ~0U)
1529 uid = vfs_context_ucred(context)->cr_ruid;
1530 cmd = cmds >> SUBCMDSHIFT;
1531
1532 switch (cmd) {
1533 case Q_SYNC:
1534 case Q_QUOTASTAT:
1535 break;
1536 case Q_GETQUOTA:
1537 if (uid == vfs_context_ucred(context)->cr_ruid)
1538 break;
1539 /* fall through */
1540 default:
1541 if ( (error = vfs_context_suser(context)) )
1542 return (error);
1543 }
1544
1545 type = cmds & SUBCMDMASK;
1546 if ((u_int)type >= MAXQUOTAS)
1547 return (EINVAL);
1548 if (vfs_busy(mp, LK_NOWAIT))
1549 return (0);
1550
1551 switch (cmd) {
1552
1553 case Q_QUOTAON:
1554 error = hfs_quotaon(p, mp, type, datap);
1555 break;
1556
1557 case Q_QUOTAOFF:
1558 error = hfs_quotaoff(p, mp, type);
1559 break;
1560
1561 case Q_SETQUOTA:
1562 error = hfs_setquota(mp, uid, type, datap);
1563 break;
1564
1565 case Q_SETUSE:
1566 error = hfs_setuse(mp, uid, type, datap);
1567 break;
1568
1569 case Q_GETQUOTA:
1570 error = hfs_getquota(mp, uid, type, datap);
1571 break;
1572
1573 case Q_SYNC:
1574 error = hfs_qsync(mp);
1575 break;
1576
1577 case Q_QUOTASTAT:
1578 error = hfs_quotastat(mp, type, datap);
1579 break;
1580
1581 default:
1582 error = EINVAL;
1583 break;
1584 }
1585 vfs_unbusy(mp);
1586
1587 return (error);
1588 }
1589 #endif /* QUOTA */
1590
1591 /* Subtype is composite of bits */
1592 #define HFS_SUBTYPE_JOURNALED 0x01
1593 #define HFS_SUBTYPE_CASESENSITIVE 0x02
1594 /* bits 2 - 6 reserved */
1595 #define HFS_SUBTYPE_STANDARDHFS 0x80
1596
1597 /*
1598 * Get file system statistics.
1599 */
1600 static int
1601 hfs_statfs(struct mount *mp, register struct vfsstatfs *sbp, __unused vfs_context_t context)
1602 {
1603 ExtendedVCB *vcb = VFSTOVCB(mp);
1604 struct hfsmount *hfsmp = VFSTOHFS(mp);
1605 u_long freeCNIDs;
1606 u_int16_t subtype = 0;
1607
1608 freeCNIDs = (u_long)0xFFFFFFFF - (u_long)vcb->vcbNxtCNID;
1609
1610 sbp->f_bsize = (u_int32_t)vcb->blockSize;
1611 sbp->f_iosize = (size_t)(MAX_UPL_TRANSFER * PAGE_SIZE);
1612 sbp->f_blocks = (u_int64_t)((unsigned long)vcb->totalBlocks);
1613 sbp->f_bfree = (u_int64_t)((unsigned long )hfs_freeblks(hfsmp, 0));
1614 sbp->f_bavail = (u_int64_t)((unsigned long )hfs_freeblks(hfsmp, 1));
1615 sbp->f_files = (u_int64_t)((unsigned long )(vcb->totalBlocks - 2)); /* max files is constrained by total blocks */
1616 sbp->f_ffree = (u_int64_t)((unsigned long )(MIN(freeCNIDs, sbp->f_bavail)));
1617
1618 /*
1619 * Subtypes (flavors) for HFS
1620 * 0: Mac OS Extended
1621 * 1: Mac OS Extended (Journaled)
1622 * 2: Mac OS Extended (Case Sensitive)
1623 * 3: Mac OS Extended (Case Sensitive, Journaled)
1624 * 4 - 127: Reserved
1625 * 128: Mac OS Standard
1626 *
1627 */
1628 if (hfsmp->hfs_flags & HFS_STANDARD) {
1629 subtype = HFS_SUBTYPE_STANDARDHFS;
1630 } else /* HFS Plus */ {
1631 if (hfsmp->jnl)
1632 subtype |= HFS_SUBTYPE_JOURNALED;
1633 if (hfsmp->hfs_flags & HFS_CASE_SENSITIVE)
1634 subtype |= HFS_SUBTYPE_CASESENSITIVE;
1635 }
1636 sbp->f_fssubtype = subtype;
1637
1638 return (0);
1639 }
1640
1641
1642 //
1643 // XXXdbg -- this is a callback to be used by the journal to
1644 // get meta data blocks flushed out to disk.
1645 //
1646 // XXXdbg -- be smarter and don't flush *every* block on each
1647 // call. try to only flush some so we don't wind up
1648 // being too synchronous.
1649 //
1650 __private_extern__
1651 void
1652 hfs_sync_metadata(void *arg)
1653 {
1654 struct mount *mp = (struct mount *)arg;
1655 struct hfsmount *hfsmp;
1656 ExtendedVCB *vcb;
1657 buf_t bp;
1658 int sectorsize, retval;
1659 daddr64_t priIDSector;
1660 hfsmp = VFSTOHFS(mp);
1661 vcb = HFSTOVCB(hfsmp);
1662
1663 // now make sure the super block is flushed
1664 sectorsize = hfsmp->hfs_phys_block_size;
1665 priIDSector = (daddr64_t)((vcb->hfsPlusIOPosOffset / sectorsize) +
1666 HFS_PRI_SECTOR(sectorsize));
1667 retval = (int)buf_meta_bread(hfsmp->hfs_devvp, priIDSector, sectorsize, NOCRED, &bp);
1668 if ((retval != 0 ) && (retval != ENXIO)) {
1669 printf("hfs_sync_metadata: can't read volume header at %d! (retval 0x%x)\n",
1670 (int)priIDSector, retval);
1671 }
1672
1673 if (retval == 0 && ((buf_flags(bp) & (B_DELWRI | B_LOCKED)) == B_DELWRI)) {
1674 buf_bwrite(bp);
1675 } else if (bp) {
1676 buf_brelse(bp);
1677 }
1678
1679 // the alternate super block...
1680 // XXXdbg - we probably don't need to do this each and every time.
1681 // hfs_btreeio.c:FlushAlternate() should flag when it was
1682 // written...
1683 if (hfsmp->hfs_alt_id_sector) {
1684 retval = (int)buf_meta_bread(hfsmp->hfs_devvp, hfsmp->hfs_alt_id_sector, sectorsize, NOCRED, &bp);
1685 if (retval == 0 && ((buf_flags(bp) & (B_DELWRI | B_LOCKED)) == B_DELWRI)) {
1686 buf_bwrite(bp);
1687 } else if (bp) {
1688 buf_brelse(bp);
1689 }
1690 }
1691 }
1692
1693
1694 struct hfs_sync_cargs {
1695 kauth_cred_t cred;
1696 struct proc *p;
1697 int waitfor;
1698 int error;
1699 };
1700
1701
1702 static int
1703 hfs_sync_callback(struct vnode *vp, void *cargs)
1704 {
1705 struct cnode *cp;
1706 struct hfs_sync_cargs *args;
1707 int error;
1708
1709 args = (struct hfs_sync_cargs *)cargs;
1710
1711 if (hfs_lock(VTOC(vp), HFS_EXCLUSIVE_LOCK) != 0) {
1712 return (VNODE_RETURNED);
1713 }
1714 cp = VTOC(vp);
1715
1716 if ((cp->c_flag & C_MODIFIED) ||
1717 (cp->c_touch_acctime | cp->c_touch_chgtime | cp->c_touch_modtime) ||
1718 vnode_hasdirtyblks(vp)) {
1719 error = hfs_fsync(vp, args->waitfor, 0, args->p);
1720
1721 if (error)
1722 args->error = error;
1723 }
1724 hfs_unlock(cp);
1725 return (VNODE_RETURNED);
1726 }
1727
1728
1729
1730 /*
1731 * Go through the disk queues to initiate sandbagged IO;
1732 * go through the inodes to write those that have been modified;
1733 * initiate the writing of the super block if it has been modified.
1734 *
1735 * Note: we are always called with the filesystem marked `MPBUSY'.
1736 */
1737 static int
1738 hfs_sync(struct mount *mp, int waitfor, vfs_context_t context)
1739 {
1740 struct proc *p = vfs_context_proc(context);
1741 struct cnode *cp;
1742 struct hfsmount *hfsmp;
1743 ExtendedVCB *vcb;
1744 struct vnode *meta_vp[4];
1745 int i;
1746 int error, allerror = 0;
1747 struct hfs_sync_cargs args;
1748
1749 /*
1750 * During MNT_UPDATE hfs_changefs might be manipulating
1751 * vnodes so back off
1752 */
1753 if (((u_int32_t)vfs_flags(mp)) & MNT_UPDATE) /* XXX MNT_UPDATE may not be visible here */
1754 return (0);
1755
1756 hfsmp = VFSTOHFS(mp);
1757 if (hfsmp->hfs_flags & HFS_READ_ONLY)
1758 return (EROFS);
1759
1760 /* skip over frozen volumes */
1761 if (!lck_rw_try_lock_shared(&hfsmp->hfs_insync))
1762 return 0;
1763
1764 args.cred = kauth_cred_get();
1765 args.waitfor = waitfor;
1766 args.p = p;
1767 args.error = 0;
1768 /*
1769 * hfs_sync_callback will be called for each vnode
1770 * hung off of this mount point... the vnode will be
1771 * properly referenced and unreferenced around the callback
1772 */
1773 vnode_iterate(mp, 0, hfs_sync_callback, (void *)&args);
1774
1775 if (args.error)
1776 allerror = args.error;
1777
1778 vcb = HFSTOVCB(hfsmp);
1779
1780 meta_vp[0] = vcb->extentsRefNum;
1781 meta_vp[1] = vcb->catalogRefNum;
1782 meta_vp[2] = vcb->allocationsRefNum; /* This is NULL for standard HFS */
1783 meta_vp[3] = hfsmp->hfs_attribute_vp; /* Optional file */
1784
1785 /* Now sync our three metadata files */
1786 for (i = 0; i < 4; ++i) {
1787 struct vnode *btvp;
1788
1789 btvp = meta_vp[i];;
1790 if ((btvp==0) || (vnode_mount(btvp) != mp))
1791 continue;
1792
1793 /* XXX use hfs_systemfile_lock instead ? */
1794 (void) hfs_lock(VTOC(btvp), HFS_EXCLUSIVE_LOCK);
1795 cp = VTOC(btvp);
1796
1797 if (((cp->c_flag & C_MODIFIED) == 0) &&
1798 (cp->c_touch_acctime == 0) &&
1799 (cp->c_touch_chgtime == 0) &&
1800 (cp->c_touch_modtime == 0) &&
1801 vnode_hasdirtyblks(btvp) == 0) {
1802 hfs_unlock(VTOC(btvp));
1803 continue;
1804 }
1805 error = vnode_get(btvp);
1806 if (error) {
1807 hfs_unlock(VTOC(btvp));
1808 continue;
1809 }
1810 if ((error = hfs_fsync(btvp, waitfor, 0, p)))
1811 allerror = error;
1812
1813 hfs_unlock(cp);
1814 vnode_put(btvp);
1815 };
1816
1817 /*
1818 * Force stale file system control information to be flushed.
1819 */
1820 if (vcb->vcbSigWord == kHFSSigWord) {
1821 if ((error = VNOP_FSYNC(hfsmp->hfs_devvp, waitfor, context))) {
1822 allerror = error;
1823 }
1824 }
1825 #if QUOTA
1826 hfs_qsync(mp);
1827 #endif /* QUOTA */
1828
1829 hfs_hotfilesync(hfsmp, vfs_context_kernel());
1830
1831 /*
1832 * Write back modified superblock.
1833 */
1834 if (IsVCBDirty(vcb)) {
1835 error = hfs_flushvolumeheader(hfsmp, waitfor, 0);
1836 if (error)
1837 allerror = error;
1838 }
1839
1840 if (hfsmp->jnl) {
1841 journal_flush(hfsmp->jnl);
1842 }
1843
1844 lck_rw_unlock_shared(&hfsmp->hfs_insync);
1845 return (allerror);
1846 }
1847
1848
1849 /*
1850 * File handle to vnode
1851 *
1852 * Have to be really careful about stale file handles:
1853 * - check that the cnode id is valid
1854 * - call hfs_vget() to get the locked cnode
1855 * - check for an unallocated cnode (i_mode == 0)
1856 * - check that the given client host has export rights and return
1857 * those rights via. exflagsp and credanonp
1858 */
1859 static int
1860 hfs_fhtovp(struct mount *mp, int fhlen, unsigned char *fhp, struct vnode **vpp, __unused vfs_context_t context)
1861 {
1862 struct hfsfid *hfsfhp;
1863 struct vnode *nvp;
1864 int result;
1865
1866 *vpp = NULL;
1867 hfsfhp = (struct hfsfid *)fhp;
1868
1869 if (fhlen < (int)sizeof(struct hfsfid))
1870 return (EINVAL);
1871
1872 result = hfs_vget(VFSTOHFS(mp), ntohl(hfsfhp->hfsfid_cnid), &nvp, 0);
1873 if (result) {
1874 if (result == ENOENT)
1875 result = ESTALE;
1876 return result;
1877 }
1878
1879 /* The createtime can be changed by hfs_setattr or hfs_setattrlist.
1880 * For NFS, we are assuming that only if the createtime was moved
1881 * forward would it mean the fileID got reused in that session by
1882 * wrapping. We don't have a volume ID or other unique identifier to
1883 * to use here for a generation ID across reboots, crashes where
1884 * metadata noting lastFileID didn't make it to disk but client has
1885 * it, or volume erasures where fileIDs start over again. Lastly,
1886 * with HFS allowing "wraps" of fileIDs now, this becomes more
1887 * error prone. Future, would be change the "wrap bit" to a unique
1888 * wrap number and use that for generation number. For now do this.
1889 */
1890 if (((time_t)(ntohl(hfsfhp->hfsfid_gen)) < VTOC(nvp)->c_itime)) {
1891 hfs_unlock(VTOC(nvp));
1892 vnode_put(nvp);
1893 return (ESTALE);
1894 }
1895 *vpp = nvp;
1896
1897 hfs_unlock(VTOC(nvp));
1898 return (0);
1899 }
1900
1901
1902 /*
1903 * Vnode pointer to File handle
1904 */
1905 /* ARGSUSED */
1906 static int
1907 hfs_vptofh(struct vnode *vp, int *fhlenp, unsigned char *fhp, __unused vfs_context_t context)
1908 {
1909 struct cnode *cp;
1910 struct hfsfid *hfsfhp;
1911
1912 if (ISHFS(VTOVCB(vp)))
1913 return (ENOTSUP); /* hfs standard is not exportable */
1914
1915 if (*fhlenp < (int)sizeof(struct hfsfid))
1916 return (EOVERFLOW);
1917
1918 cp = VTOC(vp);
1919 hfsfhp = (struct hfsfid *)fhp;
1920 hfsfhp->hfsfid_cnid = htonl(cp->c_fileid);
1921 hfsfhp->hfsfid_gen = htonl(cp->c_itime);
1922 *fhlenp = sizeof(struct hfsfid);
1923
1924 return (0);
1925 }
1926
1927
1928 /*
1929 * Initial HFS filesystems, done only once.
1930 */
1931 static int
1932 hfs_init(__unused struct vfsconf *vfsp)
1933 {
1934 static int done = 0;
1935
1936 if (done)
1937 return (0);
1938 done = 1;
1939 hfs_chashinit();
1940 hfs_converterinit();
1941
1942 BTReserveSetup();
1943
1944
1945 hfs_lock_attr = lck_attr_alloc_init();
1946 hfs_group_attr = lck_grp_attr_alloc_init();
1947 hfs_mutex_group = lck_grp_alloc_init("hfs-mutex", hfs_group_attr);
1948 hfs_rwlock_group = lck_grp_alloc_init("hfs-rwlock", hfs_group_attr);
1949
1950
1951 return (0);
1952 }
1953
1954 static int
1955 hfs_getmountpoint(struct vnode *vp, struct hfsmount **hfsmpp)
1956 {
1957 struct hfsmount * hfsmp;
1958 char fstypename[MFSNAMELEN];
1959
1960 if (vp == NULL)
1961 return (EINVAL);
1962
1963 if (!vnode_isvroot(vp))
1964 return (EINVAL);
1965
1966 vnode_vfsname(vp, fstypename);
1967 if (strncmp(fstypename, "hfs", sizeof(fstypename)) != 0)
1968 return (EINVAL);
1969
1970 hfsmp = VTOHFS(vp);
1971
1972 if (HFSTOVCB(hfsmp)->vcbSigWord == kHFSSigWord)
1973 return (EINVAL);
1974
1975 *hfsmpp = hfsmp;
1976
1977 return (0);
1978 }
1979
1980 // XXXdbg
1981 #include <sys/filedesc.h>
1982
1983 /*
1984 * HFS filesystem related variables.
1985 */
1986 static int
1987 hfs_sysctl(int *name, __unused u_int namelen, user_addr_t oldp, size_t *oldlenp,
1988 user_addr_t newp, size_t newlen, vfs_context_t context)
1989 {
1990 struct proc *p = vfs_context_proc(context);
1991 int error;
1992 struct hfsmount *hfsmp;
1993
1994 /* all sysctl names at this level are terminal */
1995
1996 if (name[0] == HFS_ENCODINGBIAS) {
1997 int bias;
1998
1999 bias = hfs_getencodingbias();
2000 error = sysctl_int(oldp, oldlenp, newp, newlen, &bias);
2001 if (error == 0 && newp)
2002 hfs_setencodingbias(bias);
2003 return (error);
2004
2005 } else if (name[0] == HFS_EXTEND_FS) {
2006 u_int64_t newsize;
2007 vnode_t vp = vfs_context_cwd(context);
2008
2009 if (newp == USER_ADDR_NULL || vp == NULLVP)
2010 return (EINVAL);
2011 if ((error = hfs_getmountpoint(vp, &hfsmp)))
2012 return (error);
2013 error = sysctl_quad(oldp, oldlenp, newp, newlen, (quad_t *)&newsize);
2014 if (error)
2015 return (error);
2016
2017 error = hfs_extendfs(hfsmp, newsize, context);
2018 return (error);
2019
2020 } else if (name[0] == HFS_ENCODINGHINT) {
2021 size_t bufsize;
2022 size_t bytes;
2023 u_int32_t hint;
2024 u_int16_t *unicode_name;
2025 char *filename;
2026
2027 if ((newlen <= 0) || (newlen > MAXPATHLEN))
2028 return (EINVAL);
2029
2030 bufsize = MAX(newlen * 3, MAXPATHLEN);
2031 MALLOC(filename, char *, newlen, M_TEMP, M_WAITOK);
2032 MALLOC(unicode_name, u_int16_t *, bufsize, M_TEMP, M_WAITOK);
2033
2034 error = copyin(newp, (caddr_t)filename, newlen);
2035 if (error == 0) {
2036 error = utf8_decodestr((u_int8_t *)filename, newlen - 1, unicode_name,
2037 &bytes, bufsize, 0, UTF_DECOMPOSED);
2038 if (error == 0) {
2039 hint = hfs_pickencoding(unicode_name, bytes / 2);
2040 error = sysctl_int(oldp, oldlenp, USER_ADDR_NULL, 0, (int32_t *)&hint);
2041 }
2042 }
2043 FREE(unicode_name, M_TEMP);
2044 FREE(filename, M_TEMP);
2045 return (error);
2046
2047 } else if (name[0] == HFS_ENABLE_JOURNALING) {
2048 // make the file system journaled...
2049 vnode_t vp = vfs_context_cwd(context);
2050 vnode_t jvp;
2051 ExtendedVCB *vcb;
2052 struct cat_attr jnl_attr, jinfo_attr;
2053 struct cat_fork jnl_fork, jinfo_fork;
2054 void *jnl = NULL;
2055 int lockflags;
2056
2057 /* Only root can enable journaling */
2058 if (!is_suser()) {
2059 return (EPERM);
2060 }
2061 if (vp == NULLVP)
2062 return EINVAL;
2063
2064 hfsmp = VTOHFS(vp);
2065 if (hfsmp->hfs_flags & HFS_READ_ONLY) {
2066 return EROFS;
2067 }
2068 if (HFSTOVCB(hfsmp)->vcbSigWord == kHFSSigWord) {
2069 printf("hfs: can't make a plain hfs volume journaled.\n");
2070 return EINVAL;
2071 }
2072
2073 if (hfsmp->jnl) {
2074 printf("hfs: volume @ mp %p is already journaled!\n", vnode_mount(vp));
2075 return EAGAIN;
2076 }
2077
2078 vcb = HFSTOVCB(hfsmp);
2079 lockflags = hfs_systemfile_lock(hfsmp, SFL_CATALOG | SFL_EXTENTS, HFS_EXCLUSIVE_LOCK);
2080 if (BTHasContiguousNodes(VTOF(vcb->catalogRefNum)) == 0 ||
2081 BTHasContiguousNodes(VTOF(vcb->extentsRefNum)) == 0) {
2082
2083 printf("hfs: volume has a btree w/non-contiguous nodes. can not enable journaling.\n");
2084 hfs_systemfile_unlock(hfsmp, lockflags);
2085 return EINVAL;
2086 }
2087 hfs_systemfile_unlock(hfsmp, lockflags);
2088
2089 // make sure these both exist!
2090 if ( GetFileInfo(vcb, kHFSRootFolderID, ".journal_info_block", &jinfo_attr, &jinfo_fork) == 0
2091 || GetFileInfo(vcb, kHFSRootFolderID, ".journal", &jnl_attr, &jnl_fork) == 0) {
2092
2093 return EINVAL;
2094 }
2095
2096 hfs_sync(hfsmp->hfs_mp, MNT_WAIT, context);
2097
2098 printf("hfs: Initializing the journal (joffset 0x%llx sz 0x%llx)...\n",
2099 (off_t)name[2], (off_t)name[3]);
2100
2101 jvp = hfsmp->hfs_devvp;
2102 jnl = journal_create(jvp,
2103 (off_t)name[2] * (off_t)HFSTOVCB(hfsmp)->blockSize
2104 + HFSTOVCB(hfsmp)->hfsPlusIOPosOffset,
2105 (off_t)((unsigned)name[3]),
2106 hfsmp->hfs_devvp,
2107 hfsmp->hfs_phys_block_size,
2108 0,
2109 0,
2110 hfs_sync_metadata, hfsmp->hfs_mp);
2111
2112 if (jnl == NULL) {
2113 printf("hfs: FAILED to create the journal!\n");
2114 if (jvp && jvp != hfsmp->hfs_devvp) {
2115 VNOP_CLOSE(jvp, hfsmp->hfs_flags & HFS_READ_ONLY ? FREAD : FREAD|FWRITE, context);
2116 }
2117 jvp = NULL;
2118
2119 return EINVAL;
2120 }
2121
2122 hfs_global_exclusive_lock_acquire(hfsmp);
2123
2124 /*
2125 * Flush all dirty metadata buffers.
2126 */
2127 buf_flushdirtyblks(hfsmp->hfs_devvp, MNT_WAIT, 0, "hfs_sysctl");
2128 buf_flushdirtyblks(hfsmp->hfs_extents_vp, MNT_WAIT, 0, "hfs_sysctl");
2129 buf_flushdirtyblks(hfsmp->hfs_catalog_vp, MNT_WAIT, 0, "hfs_sysctl");
2130 buf_flushdirtyblks(hfsmp->hfs_allocation_vp, MNT_WAIT, 0, "hfs_sysctl");
2131 if (hfsmp->hfs_attribute_vp)
2132 buf_flushdirtyblks(hfsmp->hfs_attribute_vp, MNT_WAIT, 0, "hfs_sysctl");
2133
2134 HFSTOVCB(hfsmp)->vcbJinfoBlock = name[1];
2135 HFSTOVCB(hfsmp)->vcbAtrb |= kHFSVolumeJournaledMask;
2136 hfsmp->jvp = jvp;
2137 hfsmp->jnl = jnl;
2138
2139 // save this off for the hack-y check in hfs_remove()
2140 hfsmp->jnl_start = (u_int32_t)name[2];
2141 hfsmp->jnl_size = (off_t)((unsigned)name[3]);
2142 hfsmp->hfs_jnlinfoblkid = jinfo_attr.ca_fileid;
2143 hfsmp->hfs_jnlfileid = jnl_attr.ca_fileid;
2144
2145 vfs_setflags(hfsmp->hfs_mp, (u_int64_t)((unsigned int)MNT_JOURNALED));
2146
2147 hfs_global_exclusive_lock_release(hfsmp);
2148 hfs_flushvolumeheader(hfsmp, MNT_WAIT, 1);
2149
2150 return 0;
2151 } else if (name[0] == HFS_DISABLE_JOURNALING) {
2152 // clear the journaling bit
2153 vnode_t vp = vfs_context_cwd(context);
2154
2155 /* Only root can disable journaling */
2156 if (!is_suser()) {
2157 return (EPERM);
2158 }
2159 if (vp == NULLVP)
2160 return EINVAL;
2161
2162 hfsmp = VTOHFS(vp);
2163
2164 /*
2165 * Disabling journaling is disallowed on volumes with directory hard links
2166 * because we have not tested the relevant code path.
2167 */
2168 if (hfsmp->hfs_private_attr[DIR_HARDLINKS].ca_entries != 0){
2169 printf("hfs: cannot disable journaling on volumes with directory hardlinks\n");
2170 return EPERM;
2171 }
2172
2173 printf("hfs: disabling journaling for mount @ %p\n", vnode_mount(vp));
2174
2175 hfs_global_exclusive_lock_acquire(hfsmp);
2176
2177 // Lights out for you buddy!
2178 journal_close(hfsmp->jnl);
2179 hfsmp->jnl = NULL;
2180
2181 if (hfsmp->jvp && hfsmp->jvp != hfsmp->hfs_devvp) {
2182 VNOP_CLOSE(hfsmp->jvp, hfsmp->hfs_flags & HFS_READ_ONLY ? FREAD : FREAD|FWRITE, context);
2183 }
2184 hfsmp->jvp = NULL;
2185 vfs_clearflags(hfsmp->hfs_mp, (u_int64_t)((unsigned int)MNT_JOURNALED));
2186 hfsmp->jnl_start = 0;
2187 hfsmp->hfs_jnlinfoblkid = 0;
2188 hfsmp->hfs_jnlfileid = 0;
2189
2190 HFSTOVCB(hfsmp)->vcbAtrb &= ~kHFSVolumeJournaledMask;
2191
2192 hfs_global_exclusive_lock_release(hfsmp);
2193 hfs_flushvolumeheader(hfsmp, MNT_WAIT, 1);
2194
2195 return 0;
2196 } else if (name[0] == HFS_GET_JOURNAL_INFO) {
2197 vnode_t vp = vfs_context_cwd(context);
2198 off_t jnl_start, jnl_size;
2199
2200 if (vp == NULLVP)
2201 return EINVAL;
2202
2203 hfsmp = VTOHFS(vp);
2204 if (hfsmp->jnl == NULL) {
2205 jnl_start = 0;
2206 jnl_size = 0;
2207 } else {
2208 jnl_start = (off_t)(hfsmp->jnl_start * HFSTOVCB(hfsmp)->blockSize) + (off_t)HFSTOVCB(hfsmp)->hfsPlusIOPosOffset;
2209 jnl_size = (off_t)hfsmp->jnl_size;
2210 }
2211
2212 if ((error = copyout((caddr_t)&jnl_start, CAST_USER_ADDR_T(name[1]), sizeof(off_t))) != 0) {
2213 return error;
2214 }
2215 if ((error = copyout((caddr_t)&jnl_size, CAST_USER_ADDR_T(name[2]), sizeof(off_t))) != 0) {
2216 return error;
2217 }
2218
2219 return 0;
2220 } else if (name[0] == HFS_SET_PKG_EXTENSIONS) {
2221
2222 return set_package_extensions_table((void *)name[1], name[2], name[3]);
2223
2224 } else if (name[0] == VFS_CTL_QUERY) {
2225 struct sysctl_req *req;
2226 struct vfsidctl vc;
2227 struct user_vfsidctl user_vc;
2228 struct mount *mp;
2229 struct vfsquery vq;
2230 boolean_t is_64_bit;
2231
2232 is_64_bit = proc_is64bit(p);
2233 req = CAST_DOWN(struct sysctl_req *, oldp); /* we're new style vfs sysctl. */
2234
2235 if (is_64_bit) {
2236 error = SYSCTL_IN(req, &user_vc, sizeof(user_vc));
2237 if (error) return (error);
2238
2239 mp = vfs_getvfs(&user_vc.vc_fsid);
2240 }
2241 else {
2242 error = SYSCTL_IN(req, &vc, sizeof(vc));
2243 if (error) return (error);
2244
2245 mp = vfs_getvfs(&vc.vc_fsid);
2246 }
2247 if (mp == NULL) return (ENOENT);
2248
2249 hfsmp = VFSTOHFS(mp);
2250 bzero(&vq, sizeof(vq));
2251 vq.vq_flags = hfsmp->hfs_notification_conditions;
2252 return SYSCTL_OUT(req, &vq, sizeof(vq));;
2253 } else if (name[0] == HFS_REPLAY_JOURNAL) {
2254 char *devnode = NULL;
2255 size_t devnode_len;
2256
2257 devnode_len = *oldlenp;
2258 MALLOC(devnode, char *, devnode_len + 1, M_TEMP, M_WAITOK);
2259 if (devnode == NULL) {
2260 return ENOMEM;
2261 }
2262
2263 error = copyin(oldp, (caddr_t)devnode, devnode_len);
2264 if (error) {
2265 FREE(devnode, M_TEMP);
2266 return error;
2267 }
2268 devnode[devnode_len] = 0;
2269
2270 error = hfs_journal_replay(devnode, context);
2271 FREE(devnode, M_TEMP);
2272 return error;
2273 }
2274
2275 return (ENOTSUP);
2276 }
2277
2278
2279 static int
2280 hfs_vfs_vget(struct mount *mp, ino64_t ino, struct vnode **vpp, __unused vfs_context_t context)
2281 {
2282 int error;
2283
2284 error = hfs_vget(VFSTOHFS(mp), (cnid_t)ino, vpp, 1);
2285 if (error)
2286 return (error);
2287
2288 /*
2289 * ADLs may need to have their origin state updated
2290 * since build_path needs a valid parent.
2291 */
2292 if (vnode_isdir(*vpp) &&
2293 (VTOC(*vpp)->c_flag & C_HARDLINK) &&
2294 (hfs_lock(VTOC(*vpp), HFS_EXCLUSIVE_LOCK) == 0)) {
2295 cnode_t *cp = VTOC(*vpp);
2296 struct cat_desc cdesc;
2297
2298 if (!hfs_haslinkorigin(cp) &&
2299 (cat_findname(VFSTOHFS(mp), (cnid_t)ino, &cdesc) == 0)) {
2300 if (cdesc.cd_parentcnid !=
2301 VFSTOHFS(mp)->hfs_private_desc[DIR_HARDLINKS].cd_cnid) {
2302 hfs_savelinkorigin(cp, cdesc.cd_parentcnid);
2303 }
2304 cat_releasedesc(&cdesc);
2305 }
2306 hfs_unlock(cp);
2307 }
2308 return (0);
2309 }
2310
2311
2312 /*
2313 * Look up an HFS object by ID.
2314 *
2315 * The object is returned with an iocount reference and the cnode locked.
2316 *
2317 * If the object is a file then it will represent the data fork.
2318 */
2319 __private_extern__
2320 int
2321 hfs_vget(struct hfsmount *hfsmp, cnid_t cnid, struct vnode **vpp, int skiplock)
2322 {
2323 struct vnode *vp = NULLVP;
2324 struct cat_desc cndesc;
2325 struct cat_attr cnattr;
2326 struct cat_fork cnfork;
2327 u_int32_t linkref = 0;
2328 int error;
2329
2330 /* Check for cnids that should't be exported. */
2331 if ((cnid < kHFSFirstUserCatalogNodeID) &&
2332 (cnid != kHFSRootFolderID && cnid != kHFSRootParentID)) {
2333 return (ENOENT);
2334 }
2335 /* Don't export our private directories. */
2336 if (cnid == hfsmp->hfs_private_desc[FILE_HARDLINKS].cd_cnid ||
2337 cnid == hfsmp->hfs_private_desc[DIR_HARDLINKS].cd_cnid) {
2338 return (ENOENT);
2339 }
2340 /*
2341 * Check the hash first
2342 */
2343 vp = hfs_chash_getvnode(hfsmp->hfs_raw_dev, cnid, 0, skiplock);
2344 if (vp) {
2345 *vpp = vp;
2346 return(0);
2347 }
2348
2349 bzero(&cndesc, sizeof(cndesc));
2350 bzero(&cnattr, sizeof(cnattr));
2351 bzero(&cnfork, sizeof(cnfork));
2352
2353 /*
2354 * Not in hash, lookup in catalog
2355 */
2356 if (cnid == kHFSRootParentID) {
2357 static char hfs_rootname[] = "/";
2358
2359 cndesc.cd_nameptr = (const u_int8_t *)&hfs_rootname[0];
2360 cndesc.cd_namelen = 1;
2361 cndesc.cd_parentcnid = kHFSRootParentID;
2362 cndesc.cd_cnid = kHFSRootFolderID;
2363 cndesc.cd_flags = CD_ISDIR;
2364
2365 cnattr.ca_fileid = kHFSRootFolderID;
2366 cnattr.ca_linkcount = 1;
2367 cnattr.ca_entries = 1;
2368 cnattr.ca_dircount = 1;
2369 cnattr.ca_mode = (S_IFDIR | S_IRWXU | S_IRWXG | S_IRWXO);
2370 } else {
2371 int lockflags;
2372 cnid_t pid;
2373 const char *nameptr;
2374
2375 lockflags = hfs_systemfile_lock(hfsmp, SFL_CATALOG, HFS_SHARED_LOCK);
2376 error = cat_idlookup(hfsmp, cnid, 0, &cndesc, &cnattr, &cnfork);
2377 hfs_systemfile_unlock(hfsmp, lockflags);
2378
2379 if (error) {
2380 *vpp = NULL;
2381 return (error);
2382 }
2383
2384 /*
2385 * Check for a raw hardlink inode and save its linkref.
2386 */
2387 pid = cndesc.cd_parentcnid;
2388 nameptr = (const char *)cndesc.cd_nameptr;
2389
2390 if ((pid == hfsmp->hfs_private_desc[FILE_HARDLINKS].cd_cnid) &&
2391 (bcmp(nameptr, HFS_INODE_PREFIX, HFS_INODE_PREFIX_LEN) == 0)) {
2392 linkref = strtoul(&nameptr[HFS_INODE_PREFIX_LEN], NULL, 10);
2393
2394 } else if ((pid == hfsmp->hfs_private_desc[DIR_HARDLINKS].cd_cnid) &&
2395 (bcmp(nameptr, HFS_DIRINODE_PREFIX, HFS_DIRINODE_PREFIX_LEN) == 0)) {
2396 linkref = strtoul(&nameptr[HFS_DIRINODE_PREFIX_LEN], NULL, 10);
2397
2398 } else if ((pid == hfsmp->hfs_private_desc[FILE_HARDLINKS].cd_cnid) &&
2399 (bcmp(nameptr, HFS_DELETE_PREFIX, HFS_DELETE_PREFIX_LEN) == 0)) {
2400 *vpp = NULL;
2401 cat_releasedesc(&cndesc);
2402 return (ENOENT); /* open unlinked file */
2403 }
2404 }
2405
2406 /*
2407 * Finish initializing cnode descriptor for hardlinks.
2408 *
2409 * We need a valid name and parent for reverse lookups.
2410 */
2411 if (linkref) {
2412 cnid_t nextlinkid;
2413 cnid_t prevlinkid;
2414 struct cat_desc linkdesc;
2415
2416 cnattr.ca_linkref = linkref;
2417
2418 /*
2419 * Pick up the first link in the chain and get a descriptor for it.
2420 * This allows blind volfs paths to work for hardlinks.
2421 */
2422 if ((hfs_lookuplink(hfsmp, linkref, &prevlinkid, &nextlinkid) == 0) &&
2423 (nextlinkid != 0)) {
2424 if (cat_findname(hfsmp, nextlinkid, &linkdesc) == 0) {
2425 cat_releasedesc(&cndesc);
2426 bcopy(&linkdesc, &cndesc, sizeof(linkdesc));
2427 }
2428 }
2429 }
2430
2431 if (linkref) {
2432 error = hfs_getnewvnode(hfsmp, NULL, NULL, &cndesc, 0, &cnattr, &cnfork, &vp);
2433 if (error == 0) {
2434 VTOC(vp)->c_flag |= C_HARDLINK;
2435 vnode_setmultipath(vp);
2436 }
2437 } else {
2438 struct componentname cn;
2439
2440 /* Supply hfs_getnewvnode with a component name. */
2441 MALLOC_ZONE(cn.cn_pnbuf, caddr_t, MAXPATHLEN, M_NAMEI, M_WAITOK);
2442 cn.cn_nameiop = LOOKUP;
2443 cn.cn_flags = ISLASTCN | HASBUF;
2444 cn.cn_context = NULL;
2445 cn.cn_pnlen = MAXPATHLEN;
2446 cn.cn_nameptr = cn.cn_pnbuf;
2447 cn.cn_namelen = cndesc.cd_namelen;
2448 cn.cn_hash = 0;
2449 cn.cn_consume = 0;
2450 bcopy(cndesc.cd_nameptr, cn.cn_nameptr, cndesc.cd_namelen + 1);
2451
2452 error = hfs_getnewvnode(hfsmp, NULLVP, &cn, &cndesc, 0, &cnattr, &cnfork, &vp);
2453
2454 if (error == 0 && (VTOC(vp)->c_flag & C_HARDLINK) && vnode_isdir(vp)) {
2455 hfs_savelinkorigin(VTOC(vp), cndesc.cd_parentcnid);
2456 }
2457 FREE_ZONE(cn.cn_pnbuf, cn.cn_pnlen, M_NAMEI);
2458 }
2459 cat_releasedesc(&cndesc);
2460
2461 *vpp = vp;
2462 if (vp && skiplock) {
2463 hfs_unlock(VTOC(vp));
2464 }
2465 return (error);
2466 }
2467
2468
2469 /*
2470 * Flush out all the files in a filesystem.
2471 */
2472 static int
2473 #if QUOTA
2474 hfs_flushfiles(struct mount *mp, int flags, struct proc *p)
2475 #else
2476 hfs_flushfiles(struct mount *mp, int flags, __unused struct proc *p)
2477 #endif /* QUOTA */
2478 {
2479 struct hfsmount *hfsmp;
2480 struct vnode *skipvp = NULLVP;
2481 int error;
2482 #if QUOTA
2483 int quotafilecnt;
2484 int i;
2485 #endif
2486
2487 hfsmp = VFSTOHFS(mp);
2488
2489 #if QUOTA
2490 /*
2491 * The open quota files have an indirect reference on
2492 * the root directory vnode. We must account for this
2493 * extra reference when doing the intial vflush.
2494 */
2495 quotafilecnt = 0;
2496 if (((unsigned int)vfs_flags(mp)) & MNT_QUOTA) {
2497
2498 /* Find out how many quota files we have open. */
2499 for (i = 0; i < MAXQUOTAS; i++) {
2500 if (hfsmp->hfs_qfiles[i].qf_vp != NULLVP)
2501 ++quotafilecnt;
2502 }
2503
2504 /* Obtain the root vnode so we can skip over it. */
2505 skipvp = hfs_chash_getvnode(hfsmp->hfs_raw_dev, kHFSRootFolderID, 0, 0);
2506 }
2507 #endif /* QUOTA */
2508
2509 error = vflush(mp, skipvp, SKIPSYSTEM | SKIPSWAP | flags);
2510 if (error != 0)
2511 return(error);
2512
2513 error = vflush(mp, skipvp, SKIPSYSTEM | flags);
2514
2515 #if QUOTA
2516 if (((unsigned int)vfs_flags(mp)) & MNT_QUOTA) {
2517 if (skipvp) {
2518 /*
2519 * See if there are additional references on the
2520 * root vp besides the ones obtained from the open
2521 * quota files and the hfs_chash_getvnode call above.
2522 */
2523 if ((error == 0) &&
2524 (vnode_isinuse(skipvp, quotafilecnt))) {
2525 error = EBUSY; /* root directory is still open */
2526 }
2527 hfs_unlock(VTOC(skipvp));
2528 vnode_put(skipvp);
2529 }
2530 if (error && (flags & FORCECLOSE) == 0)
2531 return (error);
2532
2533 for (i = 0; i < MAXQUOTAS; i++) {
2534 if (hfsmp->hfs_qfiles[i].qf_vp == NULLVP)
2535 continue;
2536 hfs_quotaoff(p, mp, i);
2537 }
2538 error = vflush(mp, NULLVP, SKIPSYSTEM | flags);
2539 }
2540 #endif /* QUOTA */
2541
2542 return (error);
2543 }
2544
2545 /*
2546 * Update volume encoding bitmap (HFS Plus only)
2547 */
2548 __private_extern__
2549 void
2550 hfs_setencodingbits(struct hfsmount *hfsmp, u_int32_t encoding)
2551 {
2552 #define kIndexMacUkrainian 48 /* MacUkrainian encoding is 152 */
2553 #define kIndexMacFarsi 49 /* MacFarsi encoding is 140 */
2554
2555 u_int32_t index;
2556
2557 switch (encoding) {
2558 case kTextEncodingMacUkrainian:
2559 index = kIndexMacUkrainian;
2560 break;
2561 case kTextEncodingMacFarsi:
2562 index = kIndexMacFarsi;
2563 break;
2564 default:
2565 index = encoding;
2566 break;
2567 }
2568
2569 if (index < 64 && (hfsmp->encodingsBitmap & (u_int64_t)(1ULL << index)) == 0) {
2570 HFS_MOUNT_LOCK(hfsmp, TRUE)
2571 hfsmp->encodingsBitmap |= (u_int64_t)(1ULL << index);
2572 MarkVCBDirty(hfsmp);
2573 HFS_MOUNT_UNLOCK(hfsmp, TRUE);
2574 }
2575 }
2576
2577 /*
2578 * Update volume stats
2579 *
2580 * On journal volumes this will cause a volume header flush
2581 */
2582 __private_extern__
2583 int
2584 hfs_volupdate(struct hfsmount *hfsmp, enum volop op, int inroot)
2585 {
2586 struct timeval tv;
2587
2588 microtime(&tv);
2589
2590 lck_mtx_lock(&hfsmp->hfs_mutex);
2591
2592 MarkVCBDirty(hfsmp);
2593 hfsmp->hfs_mtime = tv.tv_sec;
2594
2595 switch (op) {
2596 case VOL_UPDATE:
2597 break;
2598 case VOL_MKDIR:
2599 if (hfsmp->hfs_dircount != 0xFFFFFFFF)
2600 ++hfsmp->hfs_dircount;
2601 if (inroot && hfsmp->vcbNmRtDirs != 0xFFFF)
2602 ++hfsmp->vcbNmRtDirs;
2603 break;
2604 case VOL_RMDIR:
2605 if (hfsmp->hfs_dircount != 0)
2606 --hfsmp->hfs_dircount;
2607 if (inroot && hfsmp->vcbNmRtDirs != 0xFFFF)
2608 --hfsmp->vcbNmRtDirs;
2609 break;
2610 case VOL_MKFILE:
2611 if (hfsmp->hfs_filecount != 0xFFFFFFFF)
2612 ++hfsmp->hfs_filecount;
2613 if (inroot && hfsmp->vcbNmFls != 0xFFFF)
2614 ++hfsmp->vcbNmFls;
2615 break;
2616 case VOL_RMFILE:
2617 if (hfsmp->hfs_filecount != 0)
2618 --hfsmp->hfs_filecount;
2619 if (inroot && hfsmp->vcbNmFls != 0xFFFF)
2620 --hfsmp->vcbNmFls;
2621 break;
2622 }
2623
2624 lck_mtx_unlock(&hfsmp->hfs_mutex);
2625
2626 if (hfsmp->jnl) {
2627 hfs_flushvolumeheader(hfsmp, 0, 0);
2628 }
2629
2630 return (0);
2631 }
2632
2633
2634 static int
2635 hfs_flushMDB(struct hfsmount *hfsmp, int waitfor, int altflush)
2636 {
2637 ExtendedVCB *vcb = HFSTOVCB(hfsmp);
2638 struct filefork *fp;
2639 HFSMasterDirectoryBlock *mdb;
2640 struct buf *bp = NULL;
2641 int retval;
2642 int sectorsize;
2643 ByteCount namelen;
2644
2645 sectorsize = hfsmp->hfs_phys_block_size;
2646 retval = (int)buf_bread(hfsmp->hfs_devvp, (daddr64_t)HFS_PRI_SECTOR(sectorsize), sectorsize, NOCRED, &bp);
2647 if (retval) {
2648 if (bp)
2649 buf_brelse(bp);
2650 return retval;
2651 }
2652
2653 lck_mtx_lock(&hfsmp->hfs_mutex);
2654
2655 mdb = (HFSMasterDirectoryBlock *)(buf_dataptr(bp) + HFS_PRI_OFFSET(sectorsize));
2656
2657 mdb->drCrDate = SWAP_BE32 (UTCToLocal(to_hfs_time(vcb->vcbCrDate)));
2658 mdb->drLsMod = SWAP_BE32 (UTCToLocal(to_hfs_time(vcb->vcbLsMod)));
2659 mdb->drAtrb = SWAP_BE16 (vcb->vcbAtrb);
2660 mdb->drNmFls = SWAP_BE16 (vcb->vcbNmFls);
2661 mdb->drAllocPtr = SWAP_BE16 (vcb->nextAllocation);
2662 mdb->drClpSiz = SWAP_BE32 (vcb->vcbClpSiz);
2663 mdb->drNxtCNID = SWAP_BE32 (vcb->vcbNxtCNID);
2664 mdb->drFreeBks = SWAP_BE16 (vcb->freeBlocks);
2665
2666 namelen = strlen((char *)vcb->vcbVN);
2667 retval = utf8_to_hfs(vcb, namelen, vcb->vcbVN, mdb->drVN);
2668 /* Retry with MacRoman in case that's how it was exported. */
2669 if (retval)
2670 retval = utf8_to_mac_roman(namelen, vcb->vcbVN, mdb->drVN);
2671
2672 mdb->drVolBkUp = SWAP_BE32 (UTCToLocal(to_hfs_time(vcb->vcbVolBkUp)));
2673 mdb->drWrCnt = SWAP_BE32 (vcb->vcbWrCnt);
2674 mdb->drNmRtDirs = SWAP_BE16 (vcb->vcbNmRtDirs);
2675 mdb->drFilCnt = SWAP_BE32 (vcb->vcbFilCnt);
2676 mdb->drDirCnt = SWAP_BE32 (vcb->vcbDirCnt);
2677
2678 bcopy(vcb->vcbFndrInfo, mdb->drFndrInfo, sizeof(mdb->drFndrInfo));
2679
2680 fp = VTOF(vcb->extentsRefNum);
2681 mdb->drXTExtRec[0].startBlock = SWAP_BE16 (fp->ff_extents[0].startBlock);
2682 mdb->drXTExtRec[0].blockCount = SWAP_BE16 (fp->ff_extents[0].blockCount);
2683 mdb->drXTExtRec[1].startBlock = SWAP_BE16 (fp->ff_extents[1].startBlock);
2684 mdb->drXTExtRec[1].blockCount = SWAP_BE16 (fp->ff_extents[1].blockCount);
2685 mdb->drXTExtRec[2].startBlock = SWAP_BE16 (fp->ff_extents[2].startBlock);
2686 mdb->drXTExtRec[2].blockCount = SWAP_BE16 (fp->ff_extents[2].blockCount);
2687 mdb->drXTFlSize = SWAP_BE32 (fp->ff_blocks * vcb->blockSize);
2688 mdb->drXTClpSiz = SWAP_BE32 (fp->ff_clumpsize);
2689 FTOC(fp)->c_flag &= ~C_MODIFIED;
2690
2691 fp = VTOF(vcb->catalogRefNum);
2692 mdb->drCTExtRec[0].startBlock = SWAP_BE16 (fp->ff_extents[0].startBlock);
2693 mdb->drCTExtRec[0].blockCount = SWAP_BE16 (fp->ff_extents[0].blockCount);
2694 mdb->drCTExtRec[1].startBlock = SWAP_BE16 (fp->ff_extents[1].startBlock);
2695 mdb->drCTExtRec[1].blockCount = SWAP_BE16 (fp->ff_extents[1].blockCount);
2696 mdb->drCTExtRec[2].startBlock = SWAP_BE16 (fp->ff_extents[2].startBlock);
2697 mdb->drCTExtRec[2].blockCount = SWAP_BE16 (fp->ff_extents[2].blockCount);
2698 mdb->drCTFlSize = SWAP_BE32 (fp->ff_blocks * vcb->blockSize);
2699 mdb->drCTClpSiz = SWAP_BE32 (fp->ff_clumpsize);
2700 FTOC(fp)->c_flag &= ~C_MODIFIED;
2701
2702 MarkVCBClean( vcb );
2703
2704 lck_mtx_unlock(&hfsmp->hfs_mutex);
2705
2706 /* If requested, flush out the alternate MDB */
2707 if (altflush) {
2708 struct buf *alt_bp = NULL;
2709
2710 if (buf_meta_bread(hfsmp->hfs_devvp, hfsmp->hfs_alt_id_sector, sectorsize, NOCRED, &alt_bp) == 0) {
2711 bcopy(mdb, (char *)buf_dataptr(alt_bp) + HFS_ALT_OFFSET(sectorsize), kMDBSize);
2712
2713 (void) VNOP_BWRITE(alt_bp);
2714 } else if (alt_bp)
2715 buf_brelse(alt_bp);
2716 }
2717
2718 if (waitfor != MNT_WAIT)
2719 buf_bawrite(bp);
2720 else
2721 retval = VNOP_BWRITE(bp);
2722
2723 return (retval);
2724 }
2725
2726 /*
2727 * Flush any dirty in-memory mount data to the on-disk
2728 * volume header.
2729 *
2730 * Note: the on-disk volume signature is intentionally
2731 * not flushed since the on-disk "H+" and "HX" signatures
2732 * are always stored in-memory as "H+".
2733 */
2734 __private_extern__
2735 int
2736 hfs_flushvolumeheader(struct hfsmount *hfsmp, int waitfor, int altflush)
2737 {
2738 ExtendedVCB *vcb = HFSTOVCB(hfsmp);
2739 struct filefork *fp;
2740 HFSPlusVolumeHeader *volumeHeader;
2741 int retval;
2742 struct buf *bp;
2743 int i;
2744 int sectorsize;
2745 daddr64_t priIDSector;
2746 int critical;
2747 u_int16_t signature;
2748 u_int16_t hfsversion;
2749
2750 if (hfsmp->hfs_flags & HFS_READ_ONLY) {
2751 return(0);
2752 }
2753 if (hfsmp->hfs_flags & HFS_STANDARD) {
2754 return hfs_flushMDB(hfsmp, waitfor, altflush);
2755 }
2756 critical = altflush;
2757 sectorsize = hfsmp->hfs_phys_block_size;
2758 priIDSector = (daddr64_t)((vcb->hfsPlusIOPosOffset / sectorsize) +
2759 HFS_PRI_SECTOR(sectorsize));
2760
2761 if (hfs_start_transaction(hfsmp) != 0) {
2762 return EINVAL;
2763 }
2764
2765 retval = (int)buf_meta_bread(hfsmp->hfs_devvp, priIDSector, sectorsize, NOCRED, &bp);
2766 if (retval) {
2767 if (bp)
2768 buf_brelse(bp);
2769
2770 hfs_end_transaction(hfsmp);
2771
2772 printf("HFS: err %d reading VH blk (%s)\n", retval, vcb->vcbVN);
2773 return (retval);
2774 }
2775
2776 if (hfsmp->jnl) {
2777 journal_modify_block_start(hfsmp->jnl, bp);
2778 }
2779
2780 volumeHeader = (HFSPlusVolumeHeader *)((char *)buf_dataptr(bp) + HFS_PRI_OFFSET(sectorsize));
2781
2782 /*
2783 * Sanity check what we just read.
2784 */
2785 signature = SWAP_BE16 (volumeHeader->signature);
2786 hfsversion = SWAP_BE16 (volumeHeader->version);
2787 if ((signature != kHFSPlusSigWord && signature != kHFSXSigWord) ||
2788 (hfsversion < kHFSPlusVersion) || (hfsversion > 100) ||
2789 (SWAP_BE32 (volumeHeader->blockSize) != vcb->blockSize)) {
2790 #if 1
2791 panic("HFS: corrupt VH on %s, sig 0x%04x, ver %d, blksize %d",
2792 vcb->vcbVN, signature, hfsversion,
2793 SWAP_BE32 (volumeHeader->blockSize));
2794 #endif
2795 printf("HFS: corrupt VH blk (%s)\n", vcb->vcbVN);
2796 buf_brelse(bp);
2797 return (EIO);
2798 }
2799
2800 /*
2801 * For embedded HFS+ volumes, update create date if it changed
2802 * (ie from a setattrlist call)
2803 */
2804 if ((vcb->hfsPlusIOPosOffset != 0) &&
2805 (SWAP_BE32 (volumeHeader->createDate) != vcb->localCreateDate)) {
2806 struct buf *bp2;
2807 HFSMasterDirectoryBlock *mdb;
2808
2809 retval = (int)buf_meta_bread(hfsmp->hfs_devvp, (daddr64_t)HFS_PRI_SECTOR(sectorsize),
2810 sectorsize, NOCRED, &bp2);
2811 if (retval) {
2812 if (bp2)
2813 buf_brelse(bp2);
2814 retval = 0;
2815 } else {
2816 mdb = (HFSMasterDirectoryBlock *)(buf_dataptr(bp2) +
2817 HFS_PRI_OFFSET(sectorsize));
2818
2819 if ( SWAP_BE32 (mdb->drCrDate) != vcb->localCreateDate )
2820 {
2821 if (hfsmp->jnl) {
2822 journal_modify_block_start(hfsmp->jnl, bp2);
2823 }
2824
2825 mdb->drCrDate = SWAP_BE32 (vcb->localCreateDate); /* pick up the new create date */
2826
2827 if (hfsmp->jnl) {
2828 journal_modify_block_end(hfsmp->jnl, bp2, NULL, NULL);
2829 } else {
2830 (void) VNOP_BWRITE(bp2); /* write out the changes */
2831 }
2832 }
2833 else
2834 {
2835 buf_brelse(bp2); /* just release it */
2836 }
2837 }
2838 }
2839
2840 lck_mtx_lock(&hfsmp->hfs_mutex);
2841
2842 /* Note: only update the lower 16 bits worth of attributes */
2843 volumeHeader->attributes = SWAP_BE32 (vcb->vcbAtrb);
2844 volumeHeader->journalInfoBlock = SWAP_BE32 (vcb->vcbJinfoBlock);
2845 if (hfsmp->jnl) {
2846 volumeHeader->lastMountedVersion = SWAP_BE32 (kHFSJMountVersion);
2847 } else {
2848 volumeHeader->lastMountedVersion = SWAP_BE32 (kHFSPlusMountVersion);
2849 }
2850 volumeHeader->createDate = SWAP_BE32 (vcb->localCreateDate); /* volume create date is in local time */
2851 volumeHeader->modifyDate = SWAP_BE32 (to_hfs_time(vcb->vcbLsMod));
2852 volumeHeader->backupDate = SWAP_BE32 (to_hfs_time(vcb->vcbVolBkUp));
2853 volumeHeader->fileCount = SWAP_BE32 (vcb->vcbFilCnt);
2854 volumeHeader->folderCount = SWAP_BE32 (vcb->vcbDirCnt);
2855 volumeHeader->totalBlocks = SWAP_BE32 (vcb->totalBlocks);
2856 volumeHeader->freeBlocks = SWAP_BE32 (vcb->freeBlocks);
2857 volumeHeader->nextAllocation = SWAP_BE32 (vcb->nextAllocation);
2858 volumeHeader->rsrcClumpSize = SWAP_BE32 (vcb->vcbClpSiz);
2859 volumeHeader->dataClumpSize = SWAP_BE32 (vcb->vcbClpSiz);
2860 volumeHeader->nextCatalogID = SWAP_BE32 (vcb->vcbNxtCNID);
2861 volumeHeader->writeCount = SWAP_BE32 (vcb->vcbWrCnt);
2862 volumeHeader->encodingsBitmap = SWAP_BE64 (vcb->encodingsBitmap);
2863
2864 if (bcmp(vcb->vcbFndrInfo, volumeHeader->finderInfo, sizeof(volumeHeader->finderInfo)) != 0) {
2865 bcopy(vcb->vcbFndrInfo, volumeHeader->finderInfo, sizeof(volumeHeader->finderInfo));
2866 critical = 1;
2867 }
2868
2869 /*
2870 * System files are only dirty when altflush is set.
2871 */
2872 if (altflush == 0) {
2873 goto done;
2874 }
2875
2876 /* Sync Extents over-flow file meta data */
2877 fp = VTOF(vcb->extentsRefNum);
2878 if (FTOC(fp)->c_flag & C_MODIFIED) {
2879 for (i = 0; i < kHFSPlusExtentDensity; i++) {
2880 volumeHeader->extentsFile.extents[i].startBlock =
2881 SWAP_BE32 (fp->ff_extents[i].startBlock);
2882 volumeHeader->extentsFile.extents[i].blockCount =
2883 SWAP_BE32 (fp->ff_extents[i].blockCount);
2884 }
2885 volumeHeader->extentsFile.logicalSize = SWAP_BE64 (fp->ff_size);
2886 volumeHeader->extentsFile.totalBlocks = SWAP_BE32 (fp->ff_blocks);
2887 volumeHeader->extentsFile.clumpSize = SWAP_BE32 (fp->ff_clumpsize);
2888 FTOC(fp)->c_flag &= ~C_MODIFIED;
2889 }
2890
2891 /* Sync Catalog file meta data */
2892 fp = VTOF(vcb->catalogRefNum);
2893 if (FTOC(fp)->c_flag & C_MODIFIED) {
2894 for (i = 0; i < kHFSPlusExtentDensity; i++) {
2895 volumeHeader->catalogFile.extents[i].startBlock =
2896 SWAP_BE32 (fp->ff_extents[i].startBlock);
2897 volumeHeader->catalogFile.extents[i].blockCount =
2898 SWAP_BE32 (fp->ff_extents[i].blockCount);
2899 }
2900 volumeHeader->catalogFile.logicalSize = SWAP_BE64 (fp->ff_size);
2901 volumeHeader->catalogFile.totalBlocks = SWAP_BE32 (fp->ff_blocks);
2902 volumeHeader->catalogFile.clumpSize = SWAP_BE32 (fp->ff_clumpsize);
2903 FTOC(fp)->c_flag &= ~C_MODIFIED;
2904 }
2905
2906 /* Sync Allocation file meta data */
2907 fp = VTOF(vcb->allocationsRefNum);
2908 if (FTOC(fp)->c_flag & C_MODIFIED) {
2909 for (i = 0; i < kHFSPlusExtentDensity; i++) {
2910 volumeHeader->allocationFile.extents[i].startBlock =
2911 SWAP_BE32 (fp->ff_extents[i].startBlock);
2912 volumeHeader->allocationFile.extents[i].blockCount =
2913 SWAP_BE32 (fp->ff_extents[i].blockCount);
2914 }
2915 volumeHeader->allocationFile.logicalSize = SWAP_BE64 (fp->ff_size);
2916 volumeHeader->allocationFile.totalBlocks = SWAP_BE32 (fp->ff_blocks);
2917 volumeHeader->allocationFile.clumpSize = SWAP_BE32 (fp->ff_clumpsize);
2918 FTOC(fp)->c_flag &= ~C_MODIFIED;
2919 }
2920
2921 /* Sync Attribute file meta data */
2922 if (hfsmp->hfs_attribute_vp) {
2923 fp = VTOF(hfsmp->hfs_attribute_vp);
2924 for (i = 0; i < kHFSPlusExtentDensity; i++) {
2925 volumeHeader->attributesFile.extents[i].startBlock =
2926 SWAP_BE32 (fp->ff_extents[i].startBlock);
2927 volumeHeader->attributesFile.extents[i].blockCount =
2928 SWAP_BE32 (fp->ff_extents[i].blockCount);
2929 }
2930 FTOC(fp)->c_flag &= ~C_MODIFIED;
2931 volumeHeader->attributesFile.logicalSize = SWAP_BE64 (fp->ff_size);
2932 volumeHeader->attributesFile.totalBlocks = SWAP_BE32 (fp->ff_blocks);
2933 volumeHeader->attributesFile.clumpSize = SWAP_BE32 (fp->ff_clumpsize);
2934 }
2935
2936 /* Sync Startup file meta data */
2937 if (hfsmp->hfs_startup_vp) {
2938 fp = VTOF(hfsmp->hfs_startup_vp);
2939 if (FTOC(fp)->c_flag & C_MODIFIED) {
2940 for (i = 0; i < kHFSPlusExtentDensity; i++) {
2941 volumeHeader->startupFile.extents[i].startBlock =
2942 SWAP_BE32 (fp->ff_extents[i].startBlock);
2943 volumeHeader->startupFile.extents[i].blockCount =
2944 SWAP_BE32 (fp->ff_extents[i].blockCount);
2945 }
2946 volumeHeader->startupFile.logicalSize = SWAP_BE64 (fp->ff_size);
2947 volumeHeader->startupFile.totalBlocks = SWAP_BE32 (fp->ff_blocks);
2948 volumeHeader->startupFile.clumpSize = SWAP_BE32 (fp->ff_clumpsize);
2949 FTOC(fp)->c_flag &= ~C_MODIFIED;
2950 }
2951 }
2952
2953 done:
2954 MarkVCBClean(hfsmp);
2955 lck_mtx_unlock(&hfsmp->hfs_mutex);
2956
2957 /* If requested, flush out the alternate volume header */
2958 if (altflush && hfsmp->hfs_alt_id_sector) {
2959 struct buf *alt_bp = NULL;
2960
2961 if (buf_meta_bread(hfsmp->hfs_devvp, hfsmp->hfs_alt_id_sector, sectorsize, NOCRED, &alt_bp) == 0) {
2962 if (hfsmp->jnl) {
2963 journal_modify_block_start(hfsmp->jnl, alt_bp);
2964 }
2965
2966 bcopy(volumeHeader, (char *)buf_dataptr(alt_bp) + HFS_ALT_OFFSET(sectorsize), kMDBSize);
2967
2968 if (hfsmp->jnl) {
2969 journal_modify_block_end(hfsmp->jnl, alt_bp, NULL, NULL);
2970 } else {
2971 (void) VNOP_BWRITE(alt_bp);
2972 }
2973 } else if (alt_bp)
2974 buf_brelse(alt_bp);
2975 }
2976
2977 if (hfsmp->jnl) {
2978 journal_modify_block_end(hfsmp->jnl, bp, NULL, NULL);
2979 } else {
2980 if (waitfor != MNT_WAIT)
2981 buf_bawrite(bp);
2982 else {
2983 retval = VNOP_BWRITE(bp);
2984 /* When critical data changes, flush the device cache */
2985 if (critical && (retval == 0)) {
2986 (void) VNOP_IOCTL(hfsmp->hfs_devvp, DKIOCSYNCHRONIZECACHE,
2987 NULL, FWRITE, NULL);
2988 }
2989 }
2990 }
2991 hfs_end_transaction(hfsmp);
2992
2993 return (retval);
2994 }
2995
2996
2997 /*
2998 * Extend a file system.
2999 */
3000 __private_extern__
3001 int
3002 hfs_extendfs(struct hfsmount *hfsmp, u_int64_t newsize, vfs_context_t context)
3003 {
3004 struct proc *p = vfs_context_proc(context);
3005 kauth_cred_t cred = vfs_context_ucred(context);
3006 struct vnode *vp;
3007 struct vnode *devvp;
3008 struct buf *bp;
3009 struct filefork *fp = NULL;
3010 ExtendedVCB *vcb;
3011 struct cat_fork forkdata;
3012 u_int64_t oldsize;
3013 u_int64_t newblkcnt;
3014 u_int64_t prev_phys_block_count;
3015 u_int32_t addblks;
3016 u_int64_t sectorcnt;
3017 u_int32_t sectorsize;
3018 daddr64_t prev_alt_sector;
3019 daddr_t bitmapblks;
3020 int lockflags;
3021 int error;
3022 int64_t oldBitmapSize;
3023 Boolean usedExtendFileC = false;
3024
3025 devvp = hfsmp->hfs_devvp;
3026 vcb = HFSTOVCB(hfsmp);
3027
3028 /*
3029 * - HFS Plus file systems only.
3030 * - Journaling must be enabled.
3031 * - No embedded volumes.
3032 */
3033 if ((vcb->vcbSigWord == kHFSSigWord) ||
3034 (hfsmp->jnl == NULL) ||
3035 (vcb->hfsPlusIOPosOffset != 0)) {
3036 return (EPERM);
3037 }
3038 /*
3039 * If extending file system by non-root, then verify
3040 * ownership and check permissions.
3041 */
3042 if (suser(cred, NULL)) {
3043 error = hfs_vget(hfsmp, kHFSRootFolderID, &vp, 0);
3044
3045 if (error)
3046 return (error);
3047 error = hfs_owner_rights(hfsmp, VTOC(vp)->c_uid, cred, p, 0);
3048 if (error == 0) {
3049 error = hfs_write_access(vp, cred, p, false);
3050 }
3051 hfs_unlock(VTOC(vp));
3052 vnode_put(vp);
3053 if (error)
3054 return (error);
3055
3056 error = vnode_authorize(devvp, NULL, KAUTH_VNODE_READ_DATA | KAUTH_VNODE_WRITE_DATA, context);
3057 if (error)
3058 return (error);
3059 }
3060 if (VNOP_IOCTL(devvp, DKIOCGETBLOCKSIZE, (caddr_t)&sectorsize, 0, context)) {
3061 return (ENXIO);
3062 }
3063 if (sectorsize != hfsmp->hfs_phys_block_size) {
3064 return (ENXIO);
3065 }
3066 if (VNOP_IOCTL(devvp, DKIOCGETBLOCKCOUNT, (caddr_t)&sectorcnt, 0, context)) {
3067 return (ENXIO);
3068 }
3069 if ((sectorsize * sectorcnt) < newsize) {
3070 printf("hfs_extendfs: not enough space on device\n");
3071 return (ENOSPC);
3072 }
3073 oldsize = (u_int64_t)hfsmp->totalBlocks * (u_int64_t)hfsmp->blockSize;
3074
3075 /*
3076 * Validate new size.
3077 */
3078 if ((newsize <= oldsize) || (newsize % sectorsize)) {
3079 printf("hfs_extendfs: invalid size\n");
3080 return (EINVAL);
3081 }
3082 newblkcnt = newsize / vcb->blockSize;
3083 if (newblkcnt > (u_int64_t)0xFFFFFFFF)
3084 return (EOVERFLOW);
3085
3086 addblks = newblkcnt - vcb->totalBlocks;
3087
3088 printf("hfs_extendfs: growing %s by %d blocks\n", vcb->vcbVN, addblks);
3089 /*
3090 * Enclose changes inside a transaction.
3091 */
3092 if (hfs_start_transaction(hfsmp) != 0) {
3093 return (EINVAL);
3094 }
3095
3096 /*
3097 * Note: we take the attributes lock in case we have an attribute data vnode
3098 * which needs to change size.
3099 */
3100 lockflags = hfs_systemfile_lock(hfsmp, SFL_ATTRIBUTE | SFL_EXTENTS | SFL_BITMAP, HFS_EXCLUSIVE_LOCK);
3101 vp = vcb->allocationsRefNum;
3102 fp = VTOF(vp);
3103 bcopy(&fp->ff_data, &forkdata, sizeof(forkdata));
3104
3105 /*
3106 * Calculate additional space required (if any) by allocation bitmap.
3107 */
3108 oldBitmapSize = fp->ff_size;
3109 bitmapblks = roundup((newblkcnt+7) / 8, vcb->vcbVBMIOSize) / vcb->blockSize;
3110 if (bitmapblks > (daddr_t)fp->ff_blocks)
3111 bitmapblks -= fp->ff_blocks;
3112 else
3113 bitmapblks = 0;
3114
3115 if (bitmapblks > 0) {
3116 daddr64_t blkno;
3117 daddr_t blkcnt;
3118 off_t bytesAdded;
3119
3120 /*
3121 * Get the bitmap's current size (in allocation blocks) so we know
3122 * where to start zero filling once the new space is added. We've
3123 * got to do this before the bitmap is grown.
3124 */
3125 blkno = (daddr64_t)fp->ff_blocks;
3126
3127 /*
3128 * Try to grow the allocation file in the normal way, using allocation
3129 * blocks already existing in the file system. This way, we might be
3130 * able to grow the bitmap contiguously, or at least in the metadata
3131 * zone.
3132 */
3133 error = ExtendFileC(vcb, fp, bitmapblks * vcb->blockSize, 0,
3134 kEFAllMask | kEFNoClumpMask | kEFReserveMask | kEFMetadataMask,
3135 &bytesAdded);
3136
3137 if (error == 0) {
3138 usedExtendFileC = true;
3139 } else {
3140 /*
3141 * If the above allocation failed, fall back to allocating the new
3142 * extent of the bitmap from the space we're going to add. Since those
3143 * blocks don't yet belong to the file system, we have to update the
3144 * extent list directly, and manually adjust the file size.
3145 */
3146 bytesAdded = 0;
3147 error = AddFileExtent(vcb, fp, vcb->totalBlocks, bitmapblks);
3148 if (error) {
3149 printf("hfs_extendfs: error %d adding extents\n", error);
3150 goto out;
3151 }
3152 fp->ff_blocks += bitmapblks;
3153 VTOC(vp)->c_blocks = fp->ff_blocks;
3154 VTOC(vp)->c_flag |= C_MODIFIED;
3155 }
3156
3157 /*
3158 * Update the allocation file's size to include the newly allocated
3159 * blocks. Note that ExtendFileC doesn't do this, which is why this
3160 * statement is outside the above "if" statement.
3161 */
3162 fp->ff_size += (u_int64_t)bitmapblks * (u_int64_t)vcb->blockSize;
3163
3164 /*
3165 * Zero out the new bitmap blocks.
3166 */
3167 {
3168
3169 bp = NULL;
3170 blkcnt = bitmapblks;
3171 while (blkcnt > 0) {
3172 error = (int)buf_meta_bread(vp, blkno, vcb->blockSize, NOCRED, &bp);
3173 if (error) {
3174 if (bp) {
3175 buf_brelse(bp);
3176 }
3177 break;
3178 }
3179 bzero((char *)buf_dataptr(bp), vcb->blockSize);
3180 buf_markaged(bp);
3181 error = (int)buf_bwrite(bp);
3182 if (error)
3183 break;
3184 --blkcnt;
3185 ++blkno;
3186 }
3187 }
3188 if (error) {
3189 printf("hfs_extendfs: error %d clearing blocks\n", error);
3190 goto out;
3191 }
3192 /*
3193 * Mark the new bitmap space as allocated.
3194 *
3195 * Note that ExtendFileC will have marked any blocks it allocated, so
3196 * this is only needed if we used AddFileExtent. Also note that this
3197 * has to come *after* the zero filling of new blocks in the case where
3198 * we used AddFileExtent (since the part of the bitmap we're touching
3199 * is in those newly allocated blocks).
3200 */
3201 if (!usedExtendFileC) {
3202 error = BlockMarkAllocated(vcb, vcb->totalBlocks, bitmapblks);
3203 if (error) {
3204 printf("hfs_extendfs: error %d setting bitmap\n", error);
3205 goto out;
3206 }
3207 vcb->freeBlocks -= bitmapblks;
3208 }
3209 }
3210 /*
3211 * Mark the new alternate VH as allocated.
3212 */
3213 if (vcb->blockSize == 512)
3214 error = BlockMarkAllocated(vcb, vcb->totalBlocks + addblks - 2, 2);
3215 else
3216 error = BlockMarkAllocated(vcb, vcb->totalBlocks + addblks - 1, 1);
3217 if (error) {
3218 printf("hfs_extendfs: error %d setting bitmap (VH)\n", error);
3219 goto out;
3220 }
3221 /*
3222 * Mark the old alternate VH as free.
3223 */
3224 if (vcb->blockSize == 512)
3225 (void) BlockMarkFree(vcb, vcb->totalBlocks - 2, 2);
3226 else
3227 (void) BlockMarkFree(vcb, vcb->totalBlocks - 1, 1);
3228 /*
3229 * Adjust file system variables for new space.
3230 */
3231 prev_phys_block_count = hfsmp->hfs_phys_block_count;
3232 prev_alt_sector = hfsmp->hfs_alt_id_sector;
3233
3234 vcb->totalBlocks += addblks;
3235 vcb->freeBlocks += addblks;
3236 hfsmp->hfs_phys_block_count = newsize / sectorsize;
3237 hfsmp->hfs_alt_id_sector = (hfsmp->hfsPlusIOPosOffset / sectorsize) +
3238 HFS_ALT_SECTOR(sectorsize, hfsmp->hfs_phys_block_count);
3239 MarkVCBDirty(vcb);
3240 error = hfs_flushvolumeheader(hfsmp, MNT_WAIT, HFS_ALTFLUSH);
3241 if (error) {
3242 printf("hfs_extendfs: couldn't flush volume headers (%d)", error);
3243 /*
3244 * Restore to old state.
3245 */
3246 if (usedExtendFileC) {
3247 (void) TruncateFileC(vcb, fp, oldBitmapSize, false);
3248 } else {
3249 fp->ff_blocks -= bitmapblks;
3250 fp->ff_size -= (u_int64_t)bitmapblks * (u_int64_t)vcb->blockSize;
3251 /*
3252 * No need to mark the excess blocks free since those bitmap blocks
3253 * are no longer part of the bitmap. But we do need to undo the
3254 * effect of the "vcb->freeBlocks -= bitmapblks" above.
3255 */
3256 vcb->freeBlocks += bitmapblks;
3257 }
3258 vcb->totalBlocks -= addblks;
3259 vcb->freeBlocks -= addblks;
3260 hfsmp->hfs_phys_block_count = prev_phys_block_count;
3261 hfsmp->hfs_alt_id_sector = prev_alt_sector;
3262 MarkVCBDirty(vcb);
3263 if (vcb->blockSize == 512)
3264 (void) BlockMarkAllocated(vcb, vcb->totalBlocks - 2, 2);
3265 else
3266 (void) BlockMarkAllocated(vcb, vcb->totalBlocks - 1, 1);
3267 goto out;
3268 }
3269 /*
3270 * Invalidate the old alternate volume header.
3271 */
3272 bp = NULL;
3273 if (prev_alt_sector) {
3274 if (buf_meta_bread(hfsmp->hfs_devvp, prev_alt_sector, sectorsize,
3275 NOCRED, &bp) == 0) {
3276 journal_modify_block_start(hfsmp->jnl, bp);
3277
3278 bzero((char *)buf_dataptr(bp) + HFS_ALT_OFFSET(sectorsize), kMDBSize);
3279
3280 journal_modify_block_end(hfsmp->jnl, bp, NULL, NULL);
3281 } else if (bp) {
3282 buf_brelse(bp);
3283 }
3284 }
3285
3286 /*
3287 * TODO: Adjust the size of the metadata zone based on new volume size?
3288 */
3289
3290 /*
3291 * Adjust the size of hfsmp->hfs_attrdata_vp
3292 */
3293 if (hfsmp->hfs_attrdata_vp) {
3294 struct cnode *attr_cp;
3295 struct filefork *attr_fp;
3296
3297 if (vnode_get(hfsmp->hfs_attrdata_vp) == 0) {
3298 attr_cp = VTOC(hfsmp->hfs_attrdata_vp);
3299 attr_fp = VTOF(hfsmp->hfs_attrdata_vp);
3300
3301 attr_cp->c_blocks = newblkcnt;
3302 attr_fp->ff_blocks = newblkcnt;
3303 attr_fp->ff_extents[0].blockCount = newblkcnt;
3304 attr_fp->ff_size = (off_t) newblkcnt * hfsmp->blockSize;
3305 ubc_setsize(hfsmp->hfs_attrdata_vp, attr_fp->ff_size);
3306 vnode_put(hfsmp->hfs_attrdata_vp);
3307 }
3308 }
3309
3310 out:
3311 if (error && fp) {
3312 /* Restore allocation fork. */
3313 bcopy(&forkdata, &fp->ff_data, sizeof(forkdata));
3314 VTOC(vp)->c_blocks = fp->ff_blocks;
3315
3316 }
3317 /*
3318 Regardless of whether or not the totalblocks actually increased,
3319 we should reset the allocLimit field. If it changed, it will
3320 get updated; if not, it will remain the same.
3321 */
3322 hfsmp->allocLimit = vcb->totalBlocks;
3323 hfs_systemfile_unlock(hfsmp, lockflags);
3324 hfs_end_transaction(hfsmp);
3325
3326 return (error);
3327 }
3328
3329 #define HFS_MIN_SIZE (32LL * 1024LL * 1024LL)
3330
3331 /*
3332 * Truncate a file system (while still mounted).
3333 */
3334 __private_extern__
3335 int
3336 hfs_truncatefs(struct hfsmount *hfsmp, u_int64_t newsize, vfs_context_t context)
3337 {
3338 struct buf *bp = NULL;
3339 u_int64_t oldsize;
3340 u_int32_t newblkcnt;
3341 u_int32_t reclaimblks = 0;
3342 int lockflags = 0;
3343 int transaction_begun = 0;
3344 int error;
3345
3346 lck_mtx_lock(&hfsmp->hfs_mutex);
3347 if (hfsmp->hfs_flags & HFS_RESIZE_IN_PROGRESS) {
3348 lck_mtx_unlock(&hfsmp->hfs_mutex);
3349 return (EALREADY);
3350 }
3351 hfsmp->hfs_flags |= HFS_RESIZE_IN_PROGRESS;
3352 hfsmp->hfs_resize_filesmoved = 0;
3353 hfsmp->hfs_resize_totalfiles = 0;
3354 lck_mtx_unlock(&hfsmp->hfs_mutex);
3355
3356 /*
3357 * - Journaled HFS Plus volumes only.
3358 * - No embedded volumes.
3359 */
3360 if ((hfsmp->jnl == NULL) ||
3361 (hfsmp->hfsPlusIOPosOffset != 0)) {
3362 error = EPERM;
3363 goto out;
3364 }
3365 oldsize = (u_int64_t)hfsmp->totalBlocks * (u_int64_t)hfsmp->blockSize;
3366 newblkcnt = newsize / hfsmp->blockSize;
3367 reclaimblks = hfsmp->totalBlocks - newblkcnt;
3368
3369 /* Make sure new size is valid. */
3370 if ((newsize < HFS_MIN_SIZE) ||
3371 (newsize >= oldsize) ||
3372 (newsize % hfsmp->hfs_phys_block_size)) {
3373 error = EINVAL;
3374 goto out;
3375 }
3376 /* Make sure there's enough space to work with. */
3377 if (reclaimblks >= hfs_freeblks(hfsmp, 1)) {
3378 printf("hfs_truncatefs: insufficient space (need %u blocks; have %u blocks)\n", reclaimblks, hfs_freeblks(hfsmp, 1));
3379 error = ENOSPC;
3380 goto out;
3381 }
3382
3383 /* Start with a clean journal. */
3384 journal_flush(hfsmp->jnl);
3385
3386 if (hfs_start_transaction(hfsmp) != 0) {
3387 error = EINVAL;
3388 goto out;
3389 }
3390 transaction_begun = 1;
3391
3392 /*
3393 * Prevent new allocations from using the part we're trying to truncate.
3394 *
3395 * NOTE: allocLimit is set to the allocation block number where the new
3396 * alternate volume header will be. That way there will be no files to
3397 * interfere with allocating the new alternate volume header, and no files
3398 * in the allocation blocks beyond (i.e. the blocks we're trying to
3399 * truncate away.
3400 */
3401 lck_mtx_lock(&hfsmp->hfs_mutex);
3402 if (hfsmp->blockSize == 512)
3403 hfsmp->allocLimit = newblkcnt - 2;
3404 else
3405 hfsmp->allocLimit = newblkcnt - 1;
3406 hfsmp->freeBlocks -= reclaimblks;
3407 lck_mtx_unlock(&hfsmp->hfs_mutex);
3408
3409 /*
3410 * Look for files that have blocks at or beyond the location of the
3411 * new alternate volume header.
3412 */
3413 if (hfs_isallocated(hfsmp, hfsmp->allocLimit, reclaimblks)) {
3414 /*
3415 * hfs_reclaimspace will use separate transactions when
3416 * relocating files (so we don't overwhelm the journal).
3417 */
3418 hfs_end_transaction(hfsmp);
3419 transaction_begun = 0;
3420
3421 /* Attempt to reclaim some space. */
3422 if (hfs_reclaimspace(hfsmp, hfsmp->allocLimit, reclaimblks, context) != 0) {
3423 printf("hfs_truncatefs: couldn't reclaim space on %s\n", hfsmp->vcbVN);
3424 error = ENOSPC;
3425 goto out;
3426 }
3427 if (hfs_start_transaction(hfsmp) != 0) {
3428 error = EINVAL;
3429 goto out;
3430 }
3431 transaction_begun = 1;
3432
3433 /* Check if we're clear now. */
3434 if (hfs_isallocated(hfsmp, hfsmp->allocLimit, reclaimblks)) {
3435 printf("hfs_truncatefs: didn't reclaim enough space on %s\n", hfsmp->vcbVN);
3436 error = EAGAIN; /* tell client to try again */
3437 goto out;
3438 }
3439 }
3440
3441 /*
3442 * Note: we take the attributes lock in case we have an attribute data vnode
3443 * which needs to change size.
3444 */
3445 lockflags = hfs_systemfile_lock(hfsmp, SFL_ATTRIBUTE | SFL_EXTENTS | SFL_BITMAP, HFS_EXCLUSIVE_LOCK);
3446
3447 /*
3448 * Mark the old alternate volume header as free.
3449 * We don't bother shrinking allocation bitmap file.
3450 */
3451 if (hfsmp->blockSize == 512)
3452 (void) BlockMarkFree(hfsmp, hfsmp->totalBlocks - 2, 2);
3453 else
3454 (void) BlockMarkFree(hfsmp, hfsmp->totalBlocks - 1, 1);
3455
3456 /*
3457 * Allocate last 1KB for alternate volume header.
3458 */
3459 error = BlockMarkAllocated(hfsmp, hfsmp->allocLimit, (hfsmp->blockSize == 512) ? 2 : 1);
3460 if (error) {
3461 printf("hfs_truncatefs: Error %d allocating new alternate volume header\n", error);
3462 goto out;
3463 }
3464
3465 /*
3466 * Invalidate the existing alternate volume header.
3467 *
3468 * Don't include this in a transaction (don't call journal_modify_block)
3469 * since this block will be outside of the truncated file system!
3470 */
3471 if (hfsmp->hfs_alt_id_sector) {
3472 if (buf_meta_bread(hfsmp->hfs_devvp, hfsmp->hfs_alt_id_sector,
3473 hfsmp->hfs_phys_block_size, NOCRED, &bp) == 0) {
3474
3475 bzero((void*)((char *)buf_dataptr(bp) + HFS_ALT_OFFSET(hfsmp->hfs_phys_block_size)), kMDBSize);
3476 (void) VNOP_BWRITE(bp);
3477 } else if (bp) {
3478 buf_brelse(bp);
3479 }
3480 bp = NULL;
3481 }
3482
3483 /* Log successful shrinking. */
3484 printf("hfs_truncatefs: shrank \"%s\" to %d blocks (was %d blocks)\n",
3485 hfsmp->vcbVN, newblkcnt, hfsmp->totalBlocks);
3486
3487 /*
3488 * Adjust file system variables and flush them to disk.
3489 */
3490 hfsmp->totalBlocks = newblkcnt;
3491 hfsmp->hfs_phys_block_count = newsize / hfsmp->hfs_phys_block_size;
3492 hfsmp->hfs_alt_id_sector = HFS_ALT_SECTOR(hfsmp->hfs_phys_block_size, hfsmp->hfs_phys_block_count);
3493 MarkVCBDirty(hfsmp);
3494 error = hfs_flushvolumeheader(hfsmp, MNT_WAIT, HFS_ALTFLUSH);
3495 if (error)
3496 panic("hfs_truncatefs: unexpected error flushing volume header (%d)\n", error);
3497
3498 /*
3499 * TODO: Adjust the size of the metadata zone based on new volume size?
3500 */
3501
3502 /*
3503 * Adjust the size of hfsmp->hfs_attrdata_vp
3504 */
3505 if (hfsmp->hfs_attrdata_vp) {
3506 struct cnode *cp;
3507 struct filefork *fp;
3508
3509 if (vnode_get(hfsmp->hfs_attrdata_vp) == 0) {
3510 cp = VTOC(hfsmp->hfs_attrdata_vp);
3511 fp = VTOF(hfsmp->hfs_attrdata_vp);
3512
3513 cp->c_blocks = newblkcnt;
3514 fp->ff_blocks = newblkcnt;
3515 fp->ff_extents[0].blockCount = newblkcnt;
3516 fp->ff_size = (off_t) newblkcnt * hfsmp->blockSize;
3517 ubc_setsize(hfsmp->hfs_attrdata_vp, fp->ff_size);
3518 vnode_put(hfsmp->hfs_attrdata_vp);
3519 }
3520 }
3521
3522 out:
3523 if (error)
3524 hfsmp->freeBlocks += reclaimblks;
3525
3526 lck_mtx_lock(&hfsmp->hfs_mutex);
3527 hfsmp->allocLimit = hfsmp->totalBlocks;
3528 if (hfsmp->nextAllocation >= hfsmp->allocLimit)
3529 hfsmp->nextAllocation = hfsmp->hfs_metazone_end + 1;
3530 hfsmp->hfs_flags &= ~HFS_RESIZE_IN_PROGRESS;
3531 lck_mtx_unlock(&hfsmp->hfs_mutex);
3532
3533 if (lockflags) {
3534 hfs_systemfile_unlock(hfsmp, lockflags);
3535 }
3536 if (transaction_begun) {
3537 hfs_end_transaction(hfsmp);
3538 journal_flush(hfsmp->jnl);
3539 }
3540
3541 return (error);
3542 }
3543
3544
3545 /*
3546 * Invalidate the physical block numbers associated with buffer cache blocks
3547 * in the given extent of the given vnode.
3548 */
3549 struct hfs_inval_blk_no {
3550 daddr64_t sectorStart;
3551 daddr64_t sectorCount;
3552 };
3553 static int
3554 hfs_invalidate_block_numbers_callback(buf_t bp, void *args_in)
3555 {
3556 daddr64_t blkno;
3557 struct hfs_inval_blk_no *args;
3558
3559 blkno = buf_blkno(bp);
3560 args = args_in;
3561
3562 if (blkno >= args->sectorStart && blkno < args->sectorStart+args->sectorCount)
3563 buf_setblkno(bp, buf_lblkno(bp));
3564
3565 return BUF_RETURNED;
3566 }
3567 static void
3568 hfs_invalidate_sectors(struct vnode *vp, daddr64_t sectorStart, daddr64_t sectorCount)
3569 {
3570 struct hfs_inval_blk_no args;
3571 args.sectorStart = sectorStart;
3572 args.sectorCount = sectorCount;
3573
3574 buf_iterate(vp, hfs_invalidate_block_numbers_callback, BUF_SCAN_DIRTY|BUF_SCAN_CLEAN, &args);
3575 }
3576
3577
3578 /*
3579 * Copy the contents of an extent to a new location. Also invalidates the
3580 * physical block number of any buffer cache block in the copied extent
3581 * (so that if the block is written, it will go through VNOP_BLOCKMAP to
3582 * determine the new physical block number).
3583 */
3584 static int
3585 hfs_copy_extent(
3586 struct hfsmount *hfsmp,
3587 struct vnode *vp, /* The file whose extent is being copied. */
3588 u_int32_t oldStart, /* The start of the source extent. */
3589 u_int32_t newStart, /* The start of the destination extent. */
3590 u_int32_t blockCount, /* The number of allocation blocks to copy. */
3591 vfs_context_t context)
3592 {
3593 int err = 0;
3594 size_t bufferSize;
3595 void *buffer = NULL;
3596 struct vfsioattr ioattr;
3597 buf_t bp = NULL;
3598 off_t resid;
3599 size_t ioSize;
3600 u_int32_t ioSizeSectors; /* Device sectors in this I/O */
3601 daddr64_t srcSector, destSector;
3602 u_int32_t sectorsPerBlock = hfsmp->blockSize / hfsmp->hfs_phys_block_size;
3603
3604 /*
3605 * Sanity check that we have locked the vnode of the file we're copying.
3606 *
3607 * But since hfs_systemfile_lock() doesn't actually take the lock on
3608 * the allocation file if a journal is active, ignore the check if the
3609 * file being copied is the allocation file.
3610 */
3611 struct cnode *cp = VTOC(vp);
3612 if (cp != hfsmp->hfs_allocation_cp && cp->c_lockowner != current_thread())
3613 panic("hfs_copy_extent: vp=%p (cp=%p) not owned?\n", vp, cp);
3614
3615 /*
3616 * Wait for any in-progress writes to this vnode to complete, so that we'll
3617 * be copying consistent bits. (Otherwise, it's possible that an async
3618 * write will complete to the old extent after we read from it. That
3619 * could lead to corruption.)
3620 */
3621 err = vnode_waitforwrites(vp, 0, 0, 0, "hfs_copy_extent");
3622 if (err) {
3623 printf("hfs_copy_extent: Error %d from vnode_waitforwrites\n", err);
3624 return err;
3625 }
3626
3627 /*
3628 * Determine the I/O size to use
3629 *
3630 * NOTE: Many external drives will result in an ioSize of 128KB.
3631 * TODO: Should we use a larger buffer, doing several consecutive
3632 * reads, then several consecutive writes?
3633 */
3634 vfs_ioattr(hfsmp->hfs_mp, &ioattr);
3635 bufferSize = MIN(ioattr.io_maxreadcnt, ioattr.io_maxwritecnt);
3636 if (kmem_alloc(kernel_map, (vm_offset_t*) &buffer, bufferSize))
3637 return ENOMEM;
3638
3639 /* Get a buffer for doing the I/O */
3640 bp = buf_alloc(hfsmp->hfs_devvp);
3641 buf_setdataptr(bp, (uintptr_t)buffer);
3642
3643 resid = (off_t) blockCount * (off_t) hfsmp->blockSize;
3644 srcSector = (daddr64_t) oldStart * hfsmp->blockSize / hfsmp->hfs_phys_block_size;
3645 destSector = (daddr64_t) newStart * hfsmp->blockSize / hfsmp->hfs_phys_block_size;
3646 while (resid > 0) {
3647 ioSize = MIN(bufferSize, resid);
3648 ioSizeSectors = ioSize / hfsmp->hfs_phys_block_size;
3649
3650 /* Prepare the buffer for reading */
3651 buf_reset(bp, B_READ);
3652 buf_setsize(bp, ioSize);
3653 buf_setcount(bp, ioSize);
3654 buf_setblkno(bp, srcSector);
3655 buf_setlblkno(bp, srcSector);
3656
3657 /* Do the read */
3658 err = VNOP_STRATEGY(bp);
3659 if (!err)
3660 err = buf_biowait(bp);
3661 if (err) {
3662 printf("hfs_copy_extent: Error %d from VNOP_STRATEGY (read)\n", err);
3663 break;
3664 }
3665
3666 /* Prepare the buffer for writing */
3667 buf_reset(bp, B_WRITE);
3668 buf_setsize(bp, ioSize);
3669 buf_setcount(bp, ioSize);
3670 buf_setblkno(bp, destSector);
3671 buf_setlblkno(bp, destSector);
3672 if (journal_uses_fua(hfsmp->jnl))
3673 buf_markfua(bp);
3674
3675 /* Do the write */
3676 vnode_startwrite(hfsmp->hfs_devvp);
3677 err = VNOP_STRATEGY(bp);
3678 if (!err)
3679 err = buf_biowait(bp);
3680 if (err) {
3681 printf("hfs_copy_extent: Error %d from VNOP_STRATEGY (write)\n", err);
3682 break;
3683 }
3684
3685 resid -= ioSize;
3686 srcSector += ioSizeSectors;
3687 destSector += ioSizeSectors;
3688 }
3689 if (bp)
3690 buf_free(bp);
3691 if (buffer)
3692 kmem_free(kernel_map, (vm_offset_t)buffer, bufferSize);
3693
3694 /* Make sure all writes have been flushed to disk. */
3695 if (!journal_uses_fua(hfsmp->jnl)) {
3696 err = VNOP_IOCTL(hfsmp->hfs_devvp, DKIOCSYNCHRONIZECACHE, NULL, FWRITE, context);
3697 if (err) {
3698 printf("hfs_copy_extent: DKIOCSYNCHRONIZECACHE failed (%d)\n", err);
3699 err = 0; /* Don't fail the copy. */
3700 }
3701 }
3702
3703 if (!err)
3704 hfs_invalidate_sectors(vp, (daddr64_t)oldStart*sectorsPerBlock, (daddr64_t)blockCount*sectorsPerBlock);
3705
3706 return err;
3707 }
3708
3709
3710 /*
3711 * Reclaim space at the end of a volume, used by a given system file.
3712 *
3713 * This routine attempts to move any extent which contains allocation blocks
3714 * at or after "startblk." A separate transaction is used to do the move.
3715 * The contents of any moved extents are read and written via the volume's
3716 * device vnode -- NOT via "vp." During the move, moved blocks which are part
3717 * of a transaction have their physical block numbers invalidated so they will
3718 * eventually be written to their new locations.
3719 *
3720 * This routine can be used to move overflow extents for the allocation file.
3721 *
3722 * Inputs:
3723 * hfsmp The volume being resized.
3724 * startblk Blocks >= this allocation block need to be moved.
3725 * locks Which locks need to be taken for the given system file.
3726 * vp The vnode for the system file.
3727 *
3728 * Outputs:
3729 * moved Set to true if any extents were moved.
3730 */
3731 static int
3732 hfs_relocate_callback(__unused HFSPlusExtentKey *key, HFSPlusExtentRecord *record, HFSPlusExtentRecord *state)
3733 {
3734 bcopy(state, record, sizeof(HFSPlusExtentRecord));
3735 return 0;
3736 }
3737 static int
3738 hfs_reclaim_sys_file(struct hfsmount *hfsmp, struct vnode *vp, u_long startblk, int locks, Boolean *moved, vfs_context_t context)
3739 {
3740 int error;
3741 int lockflags;
3742 int i;
3743 u_long datablks;
3744 u_long block;
3745 u_int32_t oldStartBlock;
3746 u_int32_t newStartBlock;
3747 u_int32_t blockCount;
3748 struct filefork *fp;
3749
3750 /* If there is no vnode for this file, then there's nothing to do. */
3751 if (vp == NULL)
3752 return 0;
3753
3754 /* printf("hfs_reclaim_sys_file: %.*s\n", VTOC(vp)->c_desc.cd_namelen, VTOC(vp)->c_desc.cd_nameptr); */
3755
3756 /* We always need the allocation bitmap and extents B-tree */
3757 locks |= SFL_BITMAP | SFL_EXTENTS;
3758
3759 error = hfs_start_transaction(hfsmp);
3760 if (error) {
3761 printf("hfs_reclaim_sys_file: hfs_start_transaction returned %d\n", error);
3762 return error;
3763 }
3764 lockflags = hfs_systemfile_lock(hfsmp, locks, HFS_EXCLUSIVE_LOCK);
3765 fp = VTOF(vp);
3766 datablks = 0;
3767
3768 /* Relocate non-overflow extents */
3769 for (i = 0; i < kHFSPlusExtentDensity; ++i) {
3770 if (fp->ff_extents[i].blockCount == 0)
3771 break;
3772 oldStartBlock = fp->ff_extents[i].startBlock;
3773 blockCount = fp->ff_extents[i].blockCount;
3774 datablks += blockCount;
3775 block = oldStartBlock + blockCount;
3776 if (block > startblk) {
3777 error = BlockAllocate(hfsmp, 1, blockCount, blockCount, true, true, &newStartBlock, &blockCount);
3778 if (error) {
3779 printf("hfs_reclaim_sys_file: BlockAllocate returned %d\n", error);
3780 goto fail;
3781 }
3782 if (blockCount != fp->ff_extents[i].blockCount) {
3783 printf("hfs_reclaim_sys_file: new blockCount=%u, original blockCount=%u", blockCount, fp->ff_extents[i].blockCount);
3784 goto free_fail;
3785 }
3786 error = hfs_copy_extent(hfsmp, vp, oldStartBlock, newStartBlock, blockCount, context);
3787 if (error) {
3788 printf("hfs_reclaim_sys_file: hfs_copy_extent returned %d\n", error);
3789 goto free_fail;
3790 }
3791 fp->ff_extents[i].startBlock = newStartBlock;
3792 VTOC(vp)->c_flag |= C_MODIFIED;
3793 *moved = true;
3794 error = BlockDeallocate(hfsmp, oldStartBlock, blockCount);
3795 if (error) {
3796 /* TODO: Mark volume inconsistent? */
3797 printf("hfs_reclaim_sys_file: BlockDeallocate returned %d\n", error);
3798 goto fail;
3799 }
3800 error = hfs_flushvolumeheader(hfsmp, MNT_WAIT, HFS_ALTFLUSH);
3801 if (error) {
3802 /* TODO: Mark volume inconsistent? */
3803 printf("hfs_reclaim_sys_file: hfs_flushvolumeheader returned %d\n", error);
3804 goto fail;
3805 }
3806 }
3807 }
3808
3809 /* Relocate overflow extents (if any) */
3810 if (i == kHFSPlusExtentDensity && fp->ff_blocks > datablks) {
3811 struct BTreeIterator *iterator = NULL;
3812 struct FSBufferDescriptor btdata;
3813 HFSPlusExtentRecord record;
3814 HFSPlusExtentKey *key;
3815 FCB *fcb;
3816 u_int32_t fileID;
3817 u_int8_t forktype;
3818
3819 forktype = VNODE_IS_RSRC(vp) ? 0xFF : 0;
3820 fileID = VTOC(vp)->c_cnid;
3821 if (kmem_alloc(kernel_map, (vm_offset_t*) &iterator, sizeof(*iterator))) {
3822 printf("hfs_reclaim_sys_file: kmem_alloc failed!\n");
3823 error = ENOMEM;
3824 goto fail;
3825 }
3826
3827 bzero(iterator, sizeof(*iterator));
3828 key = (HFSPlusExtentKey *) &iterator->key;
3829 key->keyLength = kHFSPlusExtentKeyMaximumLength;
3830 key->forkType = forktype;
3831 key->fileID = fileID;
3832 key->startBlock = datablks;
3833
3834 btdata.bufferAddress = &record;
3835 btdata.itemSize = sizeof(record);
3836 btdata.itemCount = 1;
3837
3838 fcb = VTOF(hfsmp->hfs_extents_vp);
3839
3840 error = BTSearchRecord(fcb, iterator, &btdata, NULL, iterator);
3841 while (error == 0) {
3842 /* Stop when we encounter a different file or fork. */
3843 if ((key->fileID != fileID) ||
3844 (key->forkType != forktype)) {
3845 break;
3846 }
3847 /*
3848 * Check if the file overlaps target space.
3849 */
3850 for (i = 0; i < kHFSPlusExtentDensity; ++i) {
3851 if (record[i].blockCount == 0) {
3852 goto overflow_done;
3853 }
3854 oldStartBlock = record[i].startBlock;
3855 blockCount = record[i].blockCount;
3856 block = oldStartBlock + blockCount;
3857 if (block > startblk) {
3858 error = BlockAllocate(hfsmp, 1, blockCount, blockCount, true, true, &newStartBlock, &blockCount);
3859 if (error) {
3860 printf("hfs_reclaim_sys_file: BlockAllocate returned %d\n", error);
3861 goto overflow_done;
3862 }
3863 if (blockCount != record[i].blockCount) {
3864 printf("hfs_reclaim_sys_file: new blockCount=%u, original blockCount=%u", blockCount, fp->ff_extents[i].blockCount);
3865 kmem_free(kernel_map, (vm_offset_t)iterator, sizeof(*iterator));
3866 goto free_fail;
3867 }
3868 error = hfs_copy_extent(hfsmp, vp, oldStartBlock, newStartBlock, blockCount, context);
3869 if (error) {
3870 printf("hfs_reclaim_sys_file: hfs_copy_extent returned %d\n", error);
3871 kmem_free(kernel_map, (vm_offset_t)iterator, sizeof(*iterator));
3872 goto free_fail;
3873 }
3874 record[i].startBlock = newStartBlock;
3875 VTOC(vp)->c_flag |= C_MODIFIED;
3876 *moved = true;
3877 /*
3878 * NOTE: To support relocating overflow extents of the
3879 * allocation file, we must update the BTree record BEFORE
3880 * deallocating the old extent so that BlockDeallocate will
3881 * use the extent's new location to calculate physical block
3882 * numbers. (This is for the case where the old extent's
3883 * bitmap bits actually reside in the extent being moved.)
3884 */
3885 error = BTUpdateRecord(fcb, iterator, (IterateCallBackProcPtr) hfs_relocate_callback, &record);
3886 if (error) {
3887 /* TODO: Mark volume inconsistent? */
3888 printf("hfs_reclaim_sys_file: BTUpdateRecord returned %d\n", error);
3889 goto overflow_done;
3890 }
3891 error = BlockDeallocate(hfsmp, oldStartBlock, blockCount);
3892 if (error) {
3893 /* TODO: Mark volume inconsistent? */
3894 printf("hfs_reclaim_sys_file: BlockDeallocate returned %d\n", error);
3895 goto overflow_done;
3896 }
3897 }
3898 }
3899 /* Look for more records. */
3900 error = BTIterateRecord(fcb, kBTreeNextRecord, iterator, &btdata, NULL);
3901 if (error == btNotFound) {
3902 error = 0;
3903 break;
3904 }
3905 }
3906 overflow_done:
3907 kmem_free(kernel_map, (vm_offset_t)iterator, sizeof(*iterator));
3908 if (error) {
3909 goto fail;
3910 }
3911 }
3912
3913 hfs_systemfile_unlock(hfsmp, lockflags);
3914 error = hfs_end_transaction(hfsmp);
3915 if (error) {
3916 printf("hfs_reclaim_sys_file: hfs_end_transaction returned %d\n", error);
3917 }
3918
3919 return error;
3920
3921 free_fail:
3922 (void) BlockDeallocate(hfsmp, newStartBlock, blockCount);
3923 fail:
3924 (void) hfs_systemfile_unlock(hfsmp, lockflags);
3925 (void) hfs_end_transaction(hfsmp);
3926 return error;
3927 }
3928
3929
3930 /*
3931 * This journal_relocate callback updates the journal info block to point
3932 * at the new journal location. This write must NOT be done using the
3933 * transaction. We must write the block immediately. We must also force
3934 * it to get to the media so that the new journal location will be seen by
3935 * the replay code before we can safely let journaled blocks be written
3936 * to their normal locations.
3937 *
3938 * The tests for journal_uses_fua below are mildly hacky. Since the journal
3939 * and the file system are both on the same device, I'm leveraging what
3940 * the journal has decided about FUA.
3941 */
3942 struct hfs_journal_relocate_args {
3943 struct hfsmount *hfsmp;
3944 vfs_context_t context;
3945 u_int32_t newStartBlock;
3946 };
3947
3948 static errno_t
3949 hfs_journal_relocate_callback(void *_args)
3950 {
3951 int error;
3952 struct hfs_journal_relocate_args *args = _args;
3953 struct hfsmount *hfsmp = args->hfsmp;
3954 buf_t bp;
3955 JournalInfoBlock *jibp;
3956
3957 error = buf_meta_bread(hfsmp->hfs_devvp,
3958 hfsmp->vcbJinfoBlock * (hfsmp->blockSize/hfsmp->hfs_phys_block_size),
3959 hfsmp->blockSize, vfs_context_ucred(args->context), &bp);
3960 if (error) {
3961 printf("hfs_reclaim_journal_file: failed to read JIB (%d)\n", error);
3962 return error;
3963 }
3964 jibp = (JournalInfoBlock*) buf_dataptr(bp);
3965 jibp->offset = SWAP_BE64((u_int64_t)args->newStartBlock * hfsmp->blockSize);
3966 jibp->size = SWAP_BE64(hfsmp->jnl_size);
3967 if (journal_uses_fua(hfsmp->jnl))
3968 buf_markfua(bp);
3969 error = buf_bwrite(bp);
3970 if (error) {
3971 printf("hfs_reclaim_journal_file: failed to write JIB (%d)\n", error);
3972 return error;
3973 }
3974 if (!journal_uses_fua(hfsmp->jnl)) {
3975 error = VNOP_IOCTL(hfsmp->hfs_devvp, DKIOCSYNCHRONIZECACHE, NULL, FWRITE, args->context);
3976 if (error) {
3977 printf("hfs_reclaim_journal_file: DKIOCSYNCHRONIZECACHE failed (%d)\n", error);
3978 error = 0; /* Don't fail the operation. */
3979 }
3980 }
3981
3982 return error;
3983 }
3984
3985
3986 static int
3987 hfs_reclaim_journal_file(struct hfsmount *hfsmp, vfs_context_t context)
3988 {
3989 int error;
3990 int lockflags;
3991 u_int32_t newStartBlock;
3992 u_int32_t oldBlockCount;
3993 u_int32_t newBlockCount;
3994 struct cat_desc journal_desc;
3995 struct cat_attr journal_attr;
3996 struct cat_fork journal_fork;
3997 struct hfs_journal_relocate_args callback_args;
3998
3999 error = hfs_start_transaction(hfsmp);
4000 if (error) {
4001 printf("hfs_reclaim_journal_file: hfs_start_transaction returned %d\n", error);
4002 return error;
4003 }
4004 lockflags = hfs_systemfile_lock(hfsmp, SFL_CATALOG | SFL_BITMAP, HFS_EXCLUSIVE_LOCK);
4005
4006 oldBlockCount = hfsmp->jnl_size / hfsmp->blockSize;
4007
4008 /* TODO: Allow the journal to change size based on the new volume size. */
4009 error = BlockAllocate(hfsmp, 1, oldBlockCount, oldBlockCount, true, true, &newStartBlock, &newBlockCount);
4010 if (error) {
4011 printf("hfs_reclaim_journal_file: BlockAllocate returned %d\n", error);
4012 goto fail;
4013 }
4014 if (newBlockCount != oldBlockCount) {
4015 printf("hfs_reclaim_journal_file: newBlockCount != oldBlockCount (%u, %u)\n", newBlockCount, oldBlockCount);
4016 goto free_fail;
4017 }
4018
4019 error = BlockDeallocate(hfsmp, hfsmp->jnl_start, oldBlockCount);
4020 if (error) {
4021 printf("hfs_reclaim_journal_file: BlockDeallocate returned %d\n", error);
4022 goto free_fail;
4023 }
4024
4025 /* Update the catalog record for .journal */
4026 error = cat_idlookup(hfsmp, hfsmp->hfs_jnlfileid, 1, &journal_desc, &journal_attr, &journal_fork);
4027 if (error) {
4028 printf("hfs_reclaim_journal_file: cat_idlookup returned %d\n", error);
4029 goto free_fail;
4030 }
4031 journal_fork.cf_size = newBlockCount * hfsmp->blockSize;
4032 journal_fork.cf_extents[0].startBlock = newStartBlock;
4033 journal_fork.cf_extents[0].blockCount = newBlockCount;
4034 journal_fork.cf_blocks = newBlockCount;
4035 error = cat_update(hfsmp, &journal_desc, &journal_attr, &journal_fork, NULL);
4036 cat_releasedesc(&journal_desc); /* all done with cat descriptor */
4037 if (error) {
4038 printf("hfs_reclaim_journal_file: cat_update returned %d\n", error);
4039 goto free_fail;
4040 }
4041 callback_args.hfsmp = hfsmp;
4042 callback_args.context = context;
4043 callback_args.newStartBlock = newStartBlock;
4044
4045 error = journal_relocate(hfsmp->jnl, (off_t)newStartBlock*hfsmp->blockSize,
4046 (off_t)newBlockCount*hfsmp->blockSize, 0,
4047 hfs_journal_relocate_callback, &callback_args);
4048 if (error) {
4049 /* NOTE: journal_relocate will mark the journal invalid. */
4050 printf("hfs_reclaim_journal_file: journal_relocate returned %d\n", error);
4051 goto fail;
4052 }
4053 hfsmp->jnl_start = newStartBlock;
4054 hfsmp->jnl_size = (off_t)newBlockCount * hfsmp->blockSize;
4055
4056 hfs_systemfile_unlock(hfsmp, lockflags);
4057 error = hfs_end_transaction(hfsmp);
4058 if (error) {
4059 printf("hfs_reclaim_journal_file: hfs_end_transaction returned %d\n", error);
4060 }
4061
4062 return error;
4063
4064 free_fail:
4065 (void) BlockDeallocate(hfsmp, newStartBlock, newBlockCount);
4066 fail:
4067 hfs_systemfile_unlock(hfsmp, lockflags);
4068 (void) hfs_end_transaction(hfsmp);
4069 return error;
4070 }
4071
4072
4073 /*
4074 * Move the journal info block to a new location. We have to make sure the
4075 * new copy of the journal info block gets to the media first, then change
4076 * the field in the volume header and the catalog record.
4077 */
4078 static int
4079 hfs_reclaim_journal_info_block(struct hfsmount *hfsmp, vfs_context_t context)
4080 {
4081 int error;
4082 int lockflags;
4083 u_int32_t newBlock;
4084 u_int32_t blockCount;
4085 struct cat_desc jib_desc;
4086 struct cat_attr jib_attr;
4087 struct cat_fork jib_fork;
4088 buf_t old_bp, new_bp;
4089
4090 error = hfs_start_transaction(hfsmp);
4091 if (error) {
4092 printf("hfs_reclaim_journal_info_block: hfs_start_transaction returned %d\n", error);
4093 return error;
4094 }
4095 lockflags = hfs_systemfile_lock(hfsmp, SFL_CATALOG | SFL_BITMAP, HFS_EXCLUSIVE_LOCK);
4096
4097 error = BlockAllocate(hfsmp, 1, 1, 1, true, true, &newBlock, &blockCount);
4098 if (error) {
4099 printf("hfs_reclaim_journal_info_block: BlockAllocate returned %d\n", error);
4100 goto fail;
4101 }
4102 if (blockCount != 1) {
4103 printf("hfs_reclaim_journal_info_block: blockCount != 1 (%u)\n", blockCount);
4104 goto free_fail;
4105 }
4106 error = BlockDeallocate(hfsmp, hfsmp->vcbJinfoBlock, 1);
4107 if (error) {
4108 printf("hfs_reclaim_journal_info_block: BlockDeallocate returned %d\n", error);
4109 goto free_fail;
4110 }
4111
4112 /* Copy the old journal info block content to the new location */
4113 error = buf_meta_bread(hfsmp->hfs_devvp,
4114 hfsmp->vcbJinfoBlock * (hfsmp->blockSize/hfsmp->hfs_phys_block_size),
4115 hfsmp->blockSize, vfs_context_ucred(context), &old_bp);
4116 if (error) {
4117 printf("hfs_reclaim_journal_info_block: failed to read JIB (%d)\n", error);
4118 goto free_fail;
4119 }
4120 new_bp = buf_getblk(hfsmp->hfs_devvp,
4121 newBlock * (hfsmp->blockSize/hfsmp->hfs_phys_block_size),
4122 hfsmp->blockSize, 0, 0, BLK_META);
4123 bcopy((char*)buf_dataptr(old_bp), (char*)buf_dataptr(new_bp), hfsmp->blockSize);
4124 buf_brelse(old_bp);
4125 if (journal_uses_fua(hfsmp->jnl))
4126 buf_markfua(new_bp);
4127 error = buf_bwrite(new_bp);
4128 if (error) {
4129 printf("hfs_reclaim_journal_info_block: failed to write new JIB (%d)\n", error);
4130 goto free_fail;
4131 }
4132 if (!journal_uses_fua(hfsmp->jnl)) {
4133 error = VNOP_IOCTL(hfsmp->hfs_devvp, DKIOCSYNCHRONIZECACHE, NULL, FWRITE, context);
4134 if (error) {
4135 printf("hfs_reclaim_journal_info_block: DKIOCSYNCHRONIZECACHE failed (%d)\n", error);
4136 /* Don't fail the operation. */
4137 }
4138 }
4139
4140 /* Update the catalog record for .journal_info_block */
4141 error = cat_idlookup(hfsmp, hfsmp->hfs_jnlinfoblkid, 1, &jib_desc, &jib_attr, &jib_fork);
4142 if (error) {
4143 printf("hfs_reclaim_journal_file: cat_idlookup returned %d\n", error);
4144 goto fail;
4145 }
4146 jib_fork.cf_size = hfsmp->blockSize;
4147 jib_fork.cf_extents[0].startBlock = newBlock;
4148 jib_fork.cf_extents[0].blockCount = 1;
4149 jib_fork.cf_blocks = 1;
4150 error = cat_update(hfsmp, &jib_desc, &jib_attr, &jib_fork, NULL);
4151 cat_releasedesc(&jib_desc); /* all done with cat descriptor */
4152 if (error) {
4153 printf("hfs_reclaim_journal_info_block: cat_update returned %d\n", error);
4154 goto fail;
4155 }
4156
4157 /* Update the pointer to the journal info block in the volume header. */
4158 hfsmp->vcbJinfoBlock = newBlock;
4159 error = hfs_flushvolumeheader(hfsmp, MNT_WAIT, HFS_ALTFLUSH);
4160 if (error) {
4161 printf("hfs_reclaim_journal_info_block: hfs_flushvolumeheader returned %d\n", error);
4162 goto fail;
4163 }
4164 hfs_systemfile_unlock(hfsmp, lockflags);
4165 error = hfs_end_transaction(hfsmp);
4166 if (error) {
4167 printf("hfs_reclaim_journal_info_block: hfs_end_transaction returned %d\n", error);
4168 }
4169 error = journal_flush(hfsmp->jnl);
4170 if (error) {
4171 printf("hfs_reclaim_journal_info_block: journal_flush returned %d\n", error);
4172 }
4173 return error;
4174
4175 free_fail:
4176 (void) BlockDeallocate(hfsmp, newBlock, blockCount);
4177 fail:
4178 hfs_systemfile_unlock(hfsmp, lockflags);
4179 (void) hfs_end_transaction(hfsmp);
4180 return error;
4181 }
4182
4183
4184 /*
4185 * Reclaim space at the end of a file system.
4186 */
4187 static int
4188 hfs_reclaimspace(struct hfsmount *hfsmp, u_long startblk, u_long reclaimblks, vfs_context_t context)
4189 {
4190 struct vnode *vp = NULL;
4191 FCB *fcb;
4192 struct BTreeIterator * iterator = NULL;
4193 struct FSBufferDescriptor btdata;
4194 struct HFSPlusCatalogFile filerec;
4195 u_int32_t saved_next_allocation;
4196 cnid_t * cnidbufp;
4197 size_t cnidbufsize;
4198 int filecnt = 0;
4199 int maxfilecnt;
4200 u_long block;
4201 u_long datablks;
4202 u_long rsrcblks;
4203 u_long blkstomove = 0;
4204 int lockflags;
4205 int i;
4206 int error;
4207 int lastprogress = 0;
4208 Boolean system_file_moved = false;
4209
4210 /* Relocate extents of the Allocation file if they're in the way. */
4211 error = hfs_reclaim_sys_file(hfsmp, hfsmp->hfs_allocation_vp, startblk, SFL_BITMAP, &system_file_moved, context);
4212 if (error) {
4213 printf("hfs_reclaimspace: reclaim allocation file returned %d\n", error);
4214 return error;
4215 }
4216 /* Relocate extents of the Extents B-tree if they're in the way. */
4217 error = hfs_reclaim_sys_file(hfsmp, hfsmp->hfs_extents_vp, startblk, SFL_EXTENTS, &system_file_moved, context);
4218 if (error) {
4219 printf("hfs_reclaimspace: reclaim extents b-tree returned %d\n", error);
4220 return error;
4221 }
4222 /* Relocate extents of the Catalog B-tree if they're in the way. */
4223 error = hfs_reclaim_sys_file(hfsmp, hfsmp->hfs_catalog_vp, startblk, SFL_CATALOG, &system_file_moved, context);
4224 if (error) {
4225 printf("hfs_reclaimspace: reclaim catalog b-tree returned %d\n", error);
4226 return error;
4227 }
4228 /* Relocate extents of the Attributes B-tree if they're in the way. */
4229 error = hfs_reclaim_sys_file(hfsmp, hfsmp->hfs_attribute_vp, startblk, SFL_ATTRIBUTE, &system_file_moved, context);
4230 if (error) {
4231 printf("hfs_reclaimspace: reclaim attribute b-tree returned %d\n", error);
4232 return error;
4233 }
4234 /* Relocate extents of the Startup File if there is one and they're in the way. */
4235 error = hfs_reclaim_sys_file(hfsmp, hfsmp->hfs_startup_vp, startblk, SFL_STARTUP, &system_file_moved, context);
4236 if (error) {
4237 printf("hfs_reclaimspace: reclaim startup file returned %d\n", error);
4238 return error;
4239 }
4240
4241 /*
4242 * We need to make sure the alternate volume header gets flushed if we moved
4243 * any extents in the volume header. But we need to do that before
4244 * shrinking the size of the volume, or else the journal code will panic
4245 * with an invalid (too large) block number.
4246 *
4247 * Note that system_file_moved will be set if ANY extent was moved, even
4248 * if it was just an overflow extent. In this case, the journal_flush isn't
4249 * strictly required, but shouldn't hurt.
4250 */
4251 if (system_file_moved)
4252 journal_flush(hfsmp->jnl);
4253
4254 if (hfsmp->jnl_start + (hfsmp->jnl_size / hfsmp->blockSize) > startblk) {
4255 error = hfs_reclaim_journal_file(hfsmp, context);
4256 if (error) {
4257 printf("hfs_reclaimspace: hfs_reclaim_journal_file failed (%d)\n", error);
4258 return error;
4259 }
4260 }
4261
4262 if (hfsmp->vcbJinfoBlock >= startblk) {
4263 error = hfs_reclaim_journal_info_block(hfsmp, context);
4264 if (error) {
4265 printf("hfs_reclaimspace: hfs_reclaim_journal_info_block failed (%d)\n", error);
4266 return error;
4267 }
4268 }
4269
4270 /* For now move a maximum of 250,000 files. */
4271 maxfilecnt = MIN(hfsmp->hfs_filecount, 250000);
4272 maxfilecnt = MIN((u_long)maxfilecnt, reclaimblks);
4273 cnidbufsize = maxfilecnt * sizeof(cnid_t);
4274 if (kmem_alloc(kernel_map, (vm_offset_t *)&cnidbufp, cnidbufsize)) {
4275 return (ENOMEM);
4276 }
4277 if (kmem_alloc(kernel_map, (vm_offset_t *)&iterator, sizeof(*iterator))) {
4278 kmem_free(kernel_map, (vm_offset_t)cnidbufp, cnidbufsize);
4279 return (ENOMEM);
4280 }
4281
4282 saved_next_allocation = hfsmp->nextAllocation;
4283 HFS_UPDATE_NEXT_ALLOCATION(hfsmp, hfsmp->hfs_metazone_start);
4284
4285 fcb = VTOF(hfsmp->hfs_catalog_vp);
4286 bzero(iterator, sizeof(*iterator));
4287
4288 btdata.bufferAddress = &filerec;
4289 btdata.itemSize = sizeof(filerec);
4290 btdata.itemCount = 1;
4291
4292 /* Keep the Catalog and extents files locked during iteration. */
4293 lockflags = hfs_systemfile_lock(hfsmp, SFL_CATALOG | SFL_EXTENTS, HFS_SHARED_LOCK);
4294
4295 error = BTIterateRecord(fcb, kBTreeFirstRecord, iterator, NULL, NULL);
4296 if (error) {
4297 goto end_iteration;
4298 }
4299 /*
4300 * Iterate over all the catalog records looking for files
4301 * that overlap into the space we're trying to free up.
4302 */
4303 for (filecnt = 0; filecnt < maxfilecnt; ) {
4304 error = BTIterateRecord(fcb, kBTreeNextRecord, iterator, &btdata, NULL);
4305 if (error) {
4306 if (error == fsBTRecordNotFoundErr || error == fsBTEndOfIterationErr) {
4307 error = 0;
4308 }
4309 break;
4310 }
4311 if (filerec.recordType != kHFSPlusFileRecord) {
4312 continue;
4313 }
4314 datablks = rsrcblks = 0;
4315 /*
4316 * Check if either fork overlaps target space.
4317 */
4318 for (i = 0; i < kHFSPlusExtentDensity; ++i) {
4319 if (filerec.dataFork.extents[i].blockCount != 0) {
4320 datablks += filerec.dataFork.extents[i].blockCount;
4321 block = filerec.dataFork.extents[i].startBlock +
4322 filerec.dataFork.extents[i].blockCount;
4323 if (block >= startblk) {
4324 if ((filerec.fileID == hfsmp->hfs_jnlfileid) ||
4325 (filerec.fileID == hfsmp->hfs_jnlinfoblkid)) {
4326 printf("hfs_reclaimspace: cannot move active journal\n");
4327 error = EPERM;
4328 goto end_iteration;
4329 }
4330 cnidbufp[filecnt++] = filerec.fileID;
4331 blkstomove += filerec.dataFork.totalBlocks;
4332 break;
4333 }
4334 }
4335 if (filerec.resourceFork.extents[i].blockCount != 0) {
4336 rsrcblks += filerec.resourceFork.extents[i].blockCount;
4337 block = filerec.resourceFork.extents[i].startBlock +
4338 filerec.resourceFork.extents[i].blockCount;
4339 if (block >= startblk) {
4340 cnidbufp[filecnt++] = filerec.fileID;
4341 blkstomove += filerec.resourceFork.totalBlocks;
4342 break;
4343 }
4344 }
4345 }
4346 /*
4347 * Check for any overflow extents that overlap.
4348 */
4349 if (i == kHFSPlusExtentDensity) {
4350 if (filerec.dataFork.totalBlocks > datablks) {
4351 if (hfs_overlapped_overflow_extents(hfsmp, startblk, datablks, filerec.fileID, 0)) {
4352 cnidbufp[filecnt++] = filerec.fileID;
4353 blkstomove += filerec.dataFork.totalBlocks;
4354 }
4355 } else if (filerec.resourceFork.totalBlocks > rsrcblks) {
4356 if (hfs_overlapped_overflow_extents(hfsmp, startblk, rsrcblks, filerec.fileID, 1)) {
4357 cnidbufp[filecnt++] = filerec.fileID;
4358 blkstomove += filerec.resourceFork.totalBlocks;
4359 }
4360 }
4361 }
4362 }
4363
4364 end_iteration:
4365 if (filecnt == 0 && !system_file_moved) {
4366 printf("hfs_reclaimspace: no files moved\n");
4367 error = ENOSPC;
4368 }
4369 /* All done with catalog. */
4370 hfs_systemfile_unlock(hfsmp, lockflags);
4371 if (error || filecnt == 0)
4372 goto out;
4373
4374 /*
4375 * Double check space requirements to make sure
4376 * there is enough space to relocate any files
4377 * that reside in the reclaim area.
4378 *
4379 * Blocks To Move --------------
4380 * | | |
4381 * V V V
4382 * ------------------------------------------------------------------------
4383 * | | / /// // |
4384 * | | / /// // |
4385 * | | / /// // |
4386 * ------------------------------------------------------------------------
4387 *
4388 * <------------------- New Total Blocks ------------------><-- Reclaim -->
4389 *
4390 * <------------------------ Original Total Blocks ----------------------->
4391 *
4392 */
4393 if (blkstomove >= hfs_freeblks(hfsmp, 1)) {
4394 printf("hfs_truncatefs: insufficient space (need %lu blocks; have %u blocks)\n", blkstomove, hfs_freeblks(hfsmp, 1));
4395 error = ENOSPC;
4396 goto out;
4397 }
4398 hfsmp->hfs_resize_filesmoved = 0;
4399 hfsmp->hfs_resize_totalfiles = filecnt;
4400
4401 /* Now move any files that are in the way. */
4402 for (i = 0; i < filecnt; ++i) {
4403 struct vnode * rvp;
4404
4405 if (hfs_vget(hfsmp, cnidbufp[i], &vp, 0) != 0)
4406 continue;
4407
4408 /* Relocate any data fork blocks. */
4409 if (VTOF(vp)->ff_blocks > 0) {
4410 error = hfs_relocate(vp, hfsmp->hfs_metazone_end + 1, kauth_cred_get(), current_proc());
4411 }
4412 if (error)
4413 break;
4414
4415 /* Relocate any resource fork blocks. */
4416 if ((VTOC((vp))->c_blocks - VTOF((vp))->ff_blocks) > 0) {
4417 error = hfs_vgetrsrc(hfsmp, vp, &rvp, TRUE);
4418 if (error)
4419 break;
4420 error = hfs_relocate(rvp, hfsmp->hfs_metazone_end + 1, kauth_cred_get(), current_proc());
4421 vnode_put(rvp);
4422 if (error)
4423 break;
4424 }
4425 hfs_unlock(VTOC(vp));
4426 vnode_put(vp);
4427 vp = NULL;
4428
4429 ++hfsmp->hfs_resize_filesmoved;
4430
4431 /* Report intermediate progress. */
4432 if (filecnt > 100) {
4433 int progress;
4434
4435 progress = (i * 100) / filecnt;
4436 if (progress > (lastprogress + 9)) {
4437 printf("hfs_reclaimspace: %d%% done...\n", progress);
4438 lastprogress = progress;
4439 }
4440 }
4441 }
4442 if (vp) {
4443 hfs_unlock(VTOC(vp));
4444 vnode_put(vp);
4445 vp = NULL;
4446 }
4447 if (hfsmp->hfs_resize_filesmoved != 0) {
4448 printf("hfs_reclaimspace: relocated %d files on \"%s\"\n",
4449 (int)hfsmp->hfs_resize_filesmoved, hfsmp->vcbVN);
4450 }
4451 out:
4452 kmem_free(kernel_map, (vm_offset_t)iterator, sizeof(*iterator));
4453 kmem_free(kernel_map, (vm_offset_t)cnidbufp, cnidbufsize);
4454
4455 /*
4456 * Restore the roving allocation pointer on errors.
4457 * (but only if we didn't move any files)
4458 */
4459 if (error && hfsmp->hfs_resize_filesmoved == 0) {
4460 HFS_UPDATE_NEXT_ALLOCATION(hfsmp, saved_next_allocation);
4461 }
4462 return (error);
4463 }
4464
4465
4466 /*
4467 * Check if there are any overflow extents that overlap.
4468 */
4469 static int
4470 hfs_overlapped_overflow_extents(struct hfsmount *hfsmp, u_int32_t startblk, u_int32_t catblks, u_int32_t fileID, int rsrcfork)
4471 {
4472 struct BTreeIterator * iterator = NULL;
4473 struct FSBufferDescriptor btdata;
4474 HFSPlusExtentRecord extrec;
4475 HFSPlusExtentKey *extkeyptr;
4476 FCB *fcb;
4477 u_int32_t block;
4478 u_int8_t forktype;
4479 int overlapped = 0;
4480 int i;
4481 int error;
4482
4483 forktype = rsrcfork ? 0xFF : 0;
4484 if (kmem_alloc(kernel_map, (vm_offset_t *)&iterator, sizeof(*iterator))) {
4485 return (0);
4486 }
4487 bzero(iterator, sizeof(*iterator));
4488 extkeyptr = (HFSPlusExtentKey *)&iterator->key;
4489 extkeyptr->keyLength = kHFSPlusExtentKeyMaximumLength;
4490 extkeyptr->forkType = forktype;
4491 extkeyptr->fileID = fileID;
4492 extkeyptr->startBlock = catblks;
4493
4494 btdata.bufferAddress = &extrec;
4495 btdata.itemSize = sizeof(extrec);
4496 btdata.itemCount = 1;
4497
4498 fcb = VTOF(hfsmp->hfs_extents_vp);
4499
4500 error = BTSearchRecord(fcb, iterator, &btdata, NULL, iterator);
4501 while (error == 0) {
4502 /* Stop when we encounter a different file. */
4503 if ((extkeyptr->fileID != fileID) ||
4504 (extkeyptr->forkType != forktype)) {
4505 break;
4506 }
4507 /*
4508 * Check if the file overlaps target space.
4509 */
4510 for (i = 0; i < kHFSPlusExtentDensity; ++i) {
4511 if (extrec[i].blockCount == 0) {
4512 break;
4513 }
4514 block = extrec[i].startBlock + extrec[i].blockCount;
4515 if (block >= startblk) {
4516 overlapped = 1;
4517 break;
4518 }
4519 }
4520 /* Look for more records. */
4521 error = BTIterateRecord(fcb, kBTreeNextRecord, iterator, &btdata, NULL);
4522 }
4523
4524 kmem_free(kernel_map, (vm_offset_t)iterator, sizeof(*iterator));
4525 return (overlapped);
4526 }
4527
4528
4529 /*
4530 * Calculate the progress of a file system resize operation.
4531 */
4532 __private_extern__
4533 int
4534 hfs_resize_progress(struct hfsmount *hfsmp, u_int32_t *progress)
4535 {
4536 if ((hfsmp->hfs_flags & HFS_RESIZE_IN_PROGRESS) == 0) {
4537 return (ENXIO);
4538 }
4539
4540 if (hfsmp->hfs_resize_totalfiles > 0)
4541 *progress = (hfsmp->hfs_resize_filesmoved * 100) / hfsmp->hfs_resize_totalfiles;
4542 else
4543 *progress = 0;
4544
4545 return (0);
4546 }
4547
4548
4549 /*
4550 * Get file system attributes.
4551 */
4552 static int
4553 hfs_vfs_getattr(struct mount *mp, struct vfs_attr *fsap, __unused vfs_context_t context)
4554 {
4555 #define HFS_ATTR_CMN_VALIDMASK (ATTR_CMN_VALIDMASK & ~(ATTR_CMN_NAMEDATTRCOUNT | ATTR_CMN_NAMEDATTRLIST))
4556 #define HFS_ATTR_FILE_VALIDMASK (ATTR_FILE_VALIDMASK & ~(ATTR_FILE_FILETYPE | ATTR_FILE_FORKCOUNT | ATTR_FILE_FORKLIST))
4557
4558 ExtendedVCB *vcb = VFSTOVCB(mp);
4559 struct hfsmount *hfsmp = VFSTOHFS(mp);
4560 u_long freeCNIDs;
4561
4562 freeCNIDs = (u_long)0xFFFFFFFF - (u_long)hfsmp->vcbNxtCNID;
4563
4564 VFSATTR_RETURN(fsap, f_objcount, (u_int64_t)hfsmp->vcbFilCnt + (u_int64_t)hfsmp->vcbDirCnt);
4565 VFSATTR_RETURN(fsap, f_filecount, (u_int64_t)hfsmp->vcbFilCnt);
4566 VFSATTR_RETURN(fsap, f_dircount, (u_int64_t)hfsmp->vcbDirCnt);
4567 VFSATTR_RETURN(fsap, f_maxobjcount, (u_int64_t)0xFFFFFFFF);
4568 VFSATTR_RETURN(fsap, f_iosize, (size_t)(MAX_UPL_TRANSFER * PAGE_SIZE));
4569 VFSATTR_RETURN(fsap, f_blocks, (u_int64_t)hfsmp->totalBlocks);
4570 VFSATTR_RETURN(fsap, f_bfree, (u_int64_t)hfs_freeblks(hfsmp, 0));
4571 VFSATTR_RETURN(fsap, f_bavail, (u_int64_t)hfs_freeblks(hfsmp, 1));
4572 VFSATTR_RETURN(fsap, f_bsize, (u_int32_t)vcb->blockSize);
4573 /* XXX needs clarification */
4574 VFSATTR_RETURN(fsap, f_bused, hfsmp->totalBlocks - hfs_freeblks(hfsmp, 1));
4575 /* Maximum files is constrained by total blocks. */
4576 VFSATTR_RETURN(fsap, f_files, (u_int64_t)(hfsmp->totalBlocks - 2));
4577 VFSATTR_RETURN(fsap, f_ffree, MIN((u_int64_t)freeCNIDs, (u_int64_t)hfs_freeblks(hfsmp, 1)));
4578
4579 fsap->f_fsid.val[0] = hfsmp->hfs_raw_dev;
4580 fsap->f_fsid.val[1] = vfs_typenum(mp);
4581 VFSATTR_SET_SUPPORTED(fsap, f_fsid);
4582
4583 VFSATTR_RETURN(fsap, f_signature, vcb->vcbSigWord);
4584 VFSATTR_RETURN(fsap, f_carbon_fsid, 0);
4585
4586 if (VFSATTR_IS_ACTIVE(fsap, f_capabilities)) {
4587 vol_capabilities_attr_t *cap;
4588
4589 cap = &fsap->f_capabilities;
4590
4591 if (hfsmp->hfs_flags & HFS_STANDARD) {
4592 cap->capabilities[VOL_CAPABILITIES_FORMAT] =
4593 VOL_CAP_FMT_PERSISTENTOBJECTIDS |
4594 VOL_CAP_FMT_CASE_PRESERVING |
4595 VOL_CAP_FMT_FAST_STATFS |
4596 VOL_CAP_FMT_HIDDEN_FILES |
4597 VOL_CAP_FMT_PATH_FROM_ID;
4598 } else {
4599 cap->capabilities[VOL_CAPABILITIES_FORMAT] =
4600 VOL_CAP_FMT_PERSISTENTOBJECTIDS |
4601 VOL_CAP_FMT_SYMBOLICLINKS |
4602 VOL_CAP_FMT_HARDLINKS |
4603 VOL_CAP_FMT_JOURNAL |
4604 VOL_CAP_FMT_ZERO_RUNS |
4605 (hfsmp->jnl ? VOL_CAP_FMT_JOURNAL_ACTIVE : 0) |
4606 (hfsmp->hfs_flags & HFS_CASE_SENSITIVE ? VOL_CAP_FMT_CASE_SENSITIVE : 0) |
4607 VOL_CAP_FMT_CASE_PRESERVING |
4608 VOL_CAP_FMT_FAST_STATFS |
4609 VOL_CAP_FMT_2TB_FILESIZE |
4610 VOL_CAP_FMT_HIDDEN_FILES |
4611 VOL_CAP_FMT_PATH_FROM_ID;
4612 }
4613 cap->capabilities[VOL_CAPABILITIES_INTERFACES] =
4614 VOL_CAP_INT_SEARCHFS |
4615 VOL_CAP_INT_ATTRLIST |
4616 VOL_CAP_INT_NFSEXPORT |
4617 VOL_CAP_INT_READDIRATTR |
4618 VOL_CAP_INT_EXCHANGEDATA |
4619 VOL_CAP_INT_ALLOCATE |
4620 VOL_CAP_INT_VOL_RENAME |
4621 VOL_CAP_INT_ADVLOCK |
4622 VOL_CAP_INT_FLOCK |
4623 #if NAMEDSTREAMS
4624 VOL_CAP_INT_EXTENDED_ATTR |
4625 VOL_CAP_INT_NAMEDSTREAMS;
4626 #else
4627 VOL_CAP_INT_EXTENDED_ATTR;
4628 #endif
4629 cap->capabilities[VOL_CAPABILITIES_RESERVED1] = 0;
4630 cap->capabilities[VOL_CAPABILITIES_RESERVED2] = 0;
4631
4632 cap->valid[VOL_CAPABILITIES_FORMAT] =
4633 VOL_CAP_FMT_PERSISTENTOBJECTIDS |
4634 VOL_CAP_FMT_SYMBOLICLINKS |
4635 VOL_CAP_FMT_HARDLINKS |
4636 VOL_CAP_FMT_JOURNAL |
4637 VOL_CAP_FMT_JOURNAL_ACTIVE |
4638 VOL_CAP_FMT_NO_ROOT_TIMES |
4639 VOL_CAP_FMT_SPARSE_FILES |
4640 VOL_CAP_FMT_ZERO_RUNS |
4641 VOL_CAP_FMT_CASE_SENSITIVE |
4642 VOL_CAP_FMT_CASE_PRESERVING |
4643 VOL_CAP_FMT_FAST_STATFS |
4644 VOL_CAP_FMT_2TB_FILESIZE |
4645 VOL_CAP_FMT_OPENDENYMODES |
4646 VOL_CAP_FMT_HIDDEN_FILES |
4647 VOL_CAP_FMT_PATH_FROM_ID;
4648 cap->valid[VOL_CAPABILITIES_INTERFACES] =
4649 VOL_CAP_INT_SEARCHFS |
4650 VOL_CAP_INT_ATTRLIST |
4651 VOL_CAP_INT_NFSEXPORT |
4652 VOL_CAP_INT_READDIRATTR |
4653 VOL_CAP_INT_EXCHANGEDATA |
4654 VOL_CAP_INT_COPYFILE |
4655 VOL_CAP_INT_ALLOCATE |
4656 VOL_CAP_INT_VOL_RENAME |
4657 VOL_CAP_INT_ADVLOCK |
4658 VOL_CAP_INT_FLOCK |
4659 VOL_CAP_INT_MANLOCK |
4660 #if NAMEDSTREAMS
4661 VOL_CAP_INT_EXTENDED_ATTR |
4662 VOL_CAP_INT_NAMEDSTREAMS;
4663 #else
4664 VOL_CAP_INT_EXTENDED_ATTR;
4665 #endif
4666 cap->valid[VOL_CAPABILITIES_RESERVED1] = 0;
4667 cap->valid[VOL_CAPABILITIES_RESERVED2] = 0;
4668 VFSATTR_SET_SUPPORTED(fsap, f_capabilities);
4669 }
4670 if (VFSATTR_IS_ACTIVE(fsap, f_attributes)) {
4671 vol_attributes_attr_t *attrp = &fsap->f_attributes;
4672
4673 attrp->validattr.commonattr = HFS_ATTR_CMN_VALIDMASK;
4674 attrp->validattr.volattr = ATTR_VOL_VALIDMASK & ~ATTR_VOL_INFO;
4675 attrp->validattr.dirattr = ATTR_DIR_VALIDMASK;
4676 attrp->validattr.fileattr = HFS_ATTR_FILE_VALIDMASK;
4677 attrp->validattr.forkattr = 0;
4678
4679 attrp->nativeattr.commonattr = HFS_ATTR_CMN_VALIDMASK;
4680 attrp->nativeattr.volattr = ATTR_VOL_VALIDMASK & ~ATTR_VOL_INFO;
4681 attrp->nativeattr.dirattr = ATTR_DIR_VALIDMASK;
4682 attrp->nativeattr.fileattr = HFS_ATTR_FILE_VALIDMASK;
4683 attrp->nativeattr.forkattr = 0;
4684 VFSATTR_SET_SUPPORTED(fsap, f_attributes);
4685 }
4686 fsap->f_create_time.tv_sec = hfsmp->vcbCrDate;
4687 fsap->f_create_time.tv_nsec = 0;
4688 VFSATTR_SET_SUPPORTED(fsap, f_create_time);
4689 fsap->f_modify_time.tv_sec = hfsmp->vcbLsMod;
4690 fsap->f_modify_time.tv_nsec = 0;
4691 VFSATTR_SET_SUPPORTED(fsap, f_modify_time);
4692
4693 fsap->f_backup_time.tv_sec = hfsmp->vcbVolBkUp;
4694 fsap->f_backup_time.tv_nsec = 0;
4695 VFSATTR_SET_SUPPORTED(fsap, f_backup_time);
4696 if (VFSATTR_IS_ACTIVE(fsap, f_fssubtype)) {
4697 u_int16_t subtype = 0;
4698
4699 /*
4700 * Subtypes (flavors) for HFS
4701 * 0: Mac OS Extended
4702 * 1: Mac OS Extended (Journaled)
4703 * 2: Mac OS Extended (Case Sensitive)
4704 * 3: Mac OS Extended (Case Sensitive, Journaled)
4705 * 4 - 127: Reserved
4706 * 128: Mac OS Standard
4707 *
4708 */
4709 if (hfsmp->hfs_flags & HFS_STANDARD) {
4710 subtype = HFS_SUBTYPE_STANDARDHFS;
4711 } else /* HFS Plus */ {
4712 if (hfsmp->jnl)
4713 subtype |= HFS_SUBTYPE_JOURNALED;
4714 if (hfsmp->hfs_flags & HFS_CASE_SENSITIVE)
4715 subtype |= HFS_SUBTYPE_CASESENSITIVE;
4716 }
4717 fsap->f_fssubtype = subtype;
4718 VFSATTR_SET_SUPPORTED(fsap, f_fssubtype);
4719 }
4720
4721 if (VFSATTR_IS_ACTIVE(fsap, f_vol_name)) {
4722 strlcpy(fsap->f_vol_name, (char *) hfsmp->vcbVN, MAXPATHLEN);
4723 VFSATTR_SET_SUPPORTED(fsap, f_vol_name);
4724 }
4725 return (0);
4726 }
4727
4728 /*
4729 * Perform a volume rename. Requires the FS' root vp.
4730 */
4731 static int
4732 hfs_rename_volume(struct vnode *vp, const char *name, proc_t p)
4733 {
4734 ExtendedVCB *vcb = VTOVCB(vp);
4735 struct cnode *cp = VTOC(vp);
4736 struct hfsmount *hfsmp = VTOHFS(vp);
4737 struct cat_desc to_desc;
4738 struct cat_desc todir_desc;
4739 struct cat_desc new_desc;
4740 cat_cookie_t cookie;
4741 int lockflags;
4742 int error = 0;
4743
4744 /*
4745 * Ignore attempts to rename a volume to a zero-length name.
4746 */
4747 if (name[0] == 0)
4748 return(0);
4749
4750 bzero(&to_desc, sizeof(to_desc));
4751 bzero(&todir_desc, sizeof(todir_desc));
4752 bzero(&new_desc, sizeof(new_desc));
4753 bzero(&cookie, sizeof(cookie));
4754
4755 todir_desc.cd_parentcnid = kHFSRootParentID;
4756 todir_desc.cd_cnid = kHFSRootFolderID;
4757 todir_desc.cd_flags = CD_ISDIR;
4758
4759 to_desc.cd_nameptr = (const u_int8_t *)name;
4760 to_desc.cd_namelen = strlen(name);
4761 to_desc.cd_parentcnid = kHFSRootParentID;
4762 to_desc.cd_cnid = cp->c_cnid;
4763 to_desc.cd_flags = CD_ISDIR;
4764
4765 if ((error = hfs_lock(cp, HFS_EXCLUSIVE_LOCK)) == 0) {
4766 if ((error = hfs_start_transaction(hfsmp)) == 0) {
4767 if ((error = cat_preflight(hfsmp, CAT_RENAME, &cookie, p)) == 0) {
4768 lockflags = hfs_systemfile_lock(hfsmp, SFL_CATALOG, HFS_EXCLUSIVE_LOCK);
4769
4770 error = cat_rename(hfsmp, &cp->c_desc, &todir_desc, &to_desc, &new_desc);
4771
4772 /*
4773 * If successful, update the name in the VCB, ensure it's terminated.
4774 */
4775 if (!error) {
4776 strlcpy((char *)vcb->vcbVN, name, sizeof(vcb->vcbVN));
4777 }
4778
4779 hfs_systemfile_unlock(hfsmp, lockflags);
4780 cat_postflight(hfsmp, &cookie, p);
4781
4782 if (error)
4783 MarkVCBDirty(vcb);
4784 (void) hfs_flushvolumeheader(hfsmp, MNT_WAIT, 0);
4785 }
4786 hfs_end_transaction(hfsmp);
4787 }
4788 if (!error) {
4789 /* Release old allocated name buffer */
4790 if (cp->c_desc.cd_flags & CD_HASBUF) {
4791 const char *tmp_name = (const char *)cp->c_desc.cd_nameptr;
4792
4793 cp->c_desc.cd_nameptr = 0;
4794 cp->c_desc.cd_namelen = 0;
4795 cp->c_desc.cd_flags &= ~CD_HASBUF;
4796 vfs_removename(tmp_name);
4797 }
4798 /* Update cnode's catalog descriptor */
4799 replace_desc(cp, &new_desc);
4800 vcb->volumeNameEncodingHint = new_desc.cd_encoding;
4801 cp->c_touch_chgtime = TRUE;
4802 }
4803
4804 hfs_unlock(cp);
4805 }
4806
4807 return(error);
4808 }
4809
4810 /*
4811 * Get file system attributes.
4812 */
4813 static int
4814 hfs_vfs_setattr(struct mount *mp, struct vfs_attr *fsap, __unused vfs_context_t context)
4815 {
4816 kauth_cred_t cred = vfs_context_ucred(context);
4817 int error = 0;
4818
4819 /*
4820 * Must be superuser or owner of filesystem to change volume attributes
4821 */
4822 if (!kauth_cred_issuser(cred) && (kauth_cred_getuid(cred) != vfs_statfs(mp)->f_owner))
4823 return(EACCES);
4824
4825 if (VFSATTR_IS_ACTIVE(fsap, f_vol_name)) {
4826 vnode_t root_vp;
4827
4828 error = hfs_vfs_root(mp, &root_vp, context);
4829 if (error)
4830 goto out;
4831
4832 error = hfs_rename_volume(root_vp, fsap->f_vol_name, vfs_context_proc(context));
4833 (void) vnode_put(root_vp);
4834 if (error)
4835 goto out;
4836
4837 VFSATTR_SET_SUPPORTED(fsap, f_vol_name);
4838 }
4839
4840 out:
4841 return error;
4842 }
4843
4844 /* If a runtime corruption is detected, set the volume inconsistent
4845 * bit in the volume attributes. The volume inconsistent bit is a persistent
4846 * bit which represents that the volume is corrupt and needs repair.
4847 * The volume inconsistent bit can be set from the kernel when it detects
4848 * runtime corruption or from file system repair utilities like fsck_hfs when
4849 * a repair operation fails. The bit should be cleared only from file system
4850 * verify/repair utility like fsck_hfs when a verify/repair succeeds.
4851 */
4852 void hfs_mark_volume_inconsistent(struct hfsmount *hfsmp)
4853 {
4854 HFS_MOUNT_LOCK(hfsmp, TRUE);
4855 if ((hfsmp->vcbAtrb & kHFSVolumeInconsistentMask) == 0) {
4856 hfsmp->vcbAtrb |= kHFSVolumeInconsistentMask;
4857 MarkVCBDirty(hfsmp);
4858 }
4859 /* Log information to ASL log */
4860 fslog_fs_corrupt(hfsmp->hfs_mp);
4861 printf("HFS: Runtime corruption detected on %s, fsck will be forced on next mount.\n", hfsmp->vcbVN);
4862 HFS_MOUNT_UNLOCK(hfsmp, TRUE);
4863 }
4864
4865 /* Replay the journal on the device node provided. Returns zero if
4866 * journal replay succeeded or no journal was supposed to be replayed.
4867 */
4868 static int hfs_journal_replay(const char *devnode, vfs_context_t context)
4869 {
4870 int retval = 0;
4871 struct vnode *devvp = NULL;
4872 struct mount *mp = NULL;
4873 struct hfs_mount_args *args = NULL;
4874
4875 /* Lookup vnode for given raw device path */
4876 retval = vnode_open(devnode, FREAD|FWRITE, 0, 0, &devvp, NULL);
4877 if (retval) {
4878 goto out;
4879 }
4880
4881 /* Replay allowed only on raw devices */
4882 if (!vnode_ischr(devvp)) {
4883 retval = EINVAL;
4884 goto out;
4885 }
4886
4887 /* Create dummy mount structures */
4888 MALLOC(mp, struct mount *, sizeof(struct mount), M_TEMP, M_WAITOK);
4889 bzero(mp, sizeof(struct mount));
4890 mount_lock_init(mp);
4891
4892 MALLOC(args, struct hfs_mount_args *, sizeof(struct hfs_mount_args), M_TEMP, M_WAITOK);
4893 bzero(args, sizeof(struct hfs_mount_args));
4894
4895 retval = hfs_mountfs(devvp, mp, args, 1, context);
4896 buf_flushdirtyblks(devvp, MNT_WAIT, 0, "hfs_journal_replay");
4897
4898 out:
4899 if (mp) {
4900 mount_lock_destroy(mp);
4901 FREE(mp, M_TEMP);
4902 }
4903 if (args) {
4904 FREE(args, M_TEMP);
4905 }
4906 if (devvp) {
4907 vnode_close(devvp, FREAD|FWRITE, NULL);
4908 }
4909 return retval;
4910 }
4911
4912 /*
4913 * hfs vfs operations.
4914 */
4915 struct vfsops hfs_vfsops = {
4916 hfs_mount,
4917 hfs_start,
4918 hfs_unmount,
4919 hfs_vfs_root,
4920 hfs_quotactl,
4921 hfs_vfs_getattr, /* was hfs_statfs */
4922 hfs_sync,
4923 hfs_vfs_vget,
4924 hfs_fhtovp,
4925 hfs_vptofh,
4926 hfs_init,
4927 hfs_sysctl,
4928 hfs_vfs_setattr,
4929 {NULL}
4930 };