2 * Copyright (c) 1999-2009 Apple Inc. All rights reserved.
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
29 * Copyright (c) 1991, 1993, 1994
30 * The Regents of the University of California. All rights reserved.
31 * (c) UNIX System Laboratories, Inc.
32 * All or some portions of this file are derived from material licensed
33 * to the University of California by American Telephone and Telegraph
34 * Co. or Unix System Laboratories, Inc. and are reproduced herein with
35 * the permission of UNIX System Laboratories, Inc.
37 * Redistribution and use in source and binary forms, with or without
38 * modification, are permitted provided that the following conditions
40 * 1. Redistributions of source code must retain the above copyright
41 * notice, this list of conditions and the following disclaimer.
42 * 2. Redistributions in binary form must reproduce the above copyright
43 * notice, this list of conditions and the following disclaimer in the
44 * documentation and/or other materials provided with the distribution.
45 * 3. All advertising materials mentioning features or use of this software
46 * must display the following acknowledgement:
47 * This product includes software developed by the University of
48 * California, Berkeley and its contributors.
49 * 4. Neither the name of the University nor the names of its contributors
50 * may be used to endorse or promote products derived from this software
51 * without specific prior written permission.
53 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
54 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
55 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
56 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
57 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
58 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
59 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
60 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
61 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
62 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
66 * derived from @(#)ufs_vfsops.c 8.8 (Berkeley) 5/20/95
68 * (c) Copyright 1997-2002 Apple Computer, Inc. All rights reserved.
70 * hfs_vfsops.c -- VFS layer for loadable HFS file system.
73 #include <sys/param.h>
74 #include <sys/systm.h>
75 #include <sys/kauth.h>
78 #include <sys/ubc_internal.h>
79 #include <sys/vnode_internal.h>
80 #include <sys/mount_internal.h>
81 #include <sys/sysctl.h>
82 #include <sys/malloc.h>
84 #include <sys/quota.h>
86 #include <sys/paths.h>
87 #include <sys/utfconv.h>
88 #include <sys/kdebug.h>
89 #include <sys/fslog.h>
91 #include <kern/locks.h>
93 #include <vfs/vfs_journal.h>
95 #include <miscfs/specfs/specdev.h>
96 #include <hfs/hfs_mount.h>
98 #include <libkern/crypto/md5.h>
99 #include <uuid/uuid.h>
102 #include "hfs_catalog.h"
103 #include "hfs_cnode.h"
105 #include "hfs_endian.h"
106 #include "hfs_hotfiles.h"
107 #include "hfs_quota.h"
109 #include "hfscommon/headers/FileMgrInternal.h"
110 #include "hfscommon/headers/BTreesInternal.h"
118 lck_grp_attr_t
* hfs_group_attr
;
119 lck_attr_t
* hfs_lock_attr
;
120 lck_grp_t
* hfs_mutex_group
;
121 lck_grp_t
* hfs_rwlock_group
;
123 extern struct vnodeopv_desc hfs_vnodeop_opv_desc
;
124 extern struct vnodeopv_desc hfs_std_vnodeop_opv_desc
;
126 /* not static so we can re-use in hfs_readwrite.c for build_path calls */
127 int hfs_vfs_vget(struct mount
*mp
, ino64_t ino
, struct vnode
**vpp
, vfs_context_t context
);
129 static int hfs_changefs(struct mount
*mp
, struct hfs_mount_args
*args
);
130 static int hfs_fhtovp(struct mount
*mp
, int fhlen
, unsigned char *fhp
, struct vnode
**vpp
, vfs_context_t context
);
131 static int hfs_flushfiles(struct mount
*, int, struct proc
*);
132 static int hfs_flushMDB(struct hfsmount
*hfsmp
, int waitfor
, int altflush
);
133 static int hfs_getmountpoint(struct vnode
*vp
, struct hfsmount
**hfsmpp
);
134 static int hfs_init(struct vfsconf
*vfsp
);
135 static int hfs_mount(struct mount
*mp
, vnode_t devvp
, user_addr_t data
, vfs_context_t context
);
136 static int hfs_mountfs(struct vnode
*devvp
, struct mount
*mp
, struct hfs_mount_args
*args
, int journal_replay_only
, vfs_context_t context
);
137 static int hfs_reload(struct mount
*mp
);
138 static int hfs_vfs_root(struct mount
*mp
, struct vnode
**vpp
, vfs_context_t context
);
139 static int hfs_quotactl(struct mount
*, int, uid_t
, caddr_t
, vfs_context_t context
);
140 static int hfs_start(struct mount
*mp
, int flags
, vfs_context_t context
);
141 static int hfs_statfs(struct mount
*mp
, register struct vfsstatfs
*sbp
, vfs_context_t context
);
142 static int hfs_sync(struct mount
*mp
, int waitfor
, vfs_context_t context
);
143 static int hfs_sysctl(int *name
, u_int namelen
, user_addr_t oldp
, size_t *oldlenp
,
144 user_addr_t newp
, size_t newlen
, vfs_context_t context
);
145 static int hfs_unmount(struct mount
*mp
, int mntflags
, vfs_context_t context
);
146 static int hfs_vptofh(struct vnode
*vp
, int *fhlenp
, unsigned char *fhp
, vfs_context_t context
);
148 static int hfs_reclaimspace(struct hfsmount
*hfsmp
, u_int32_t startblk
, u_int32_t reclaimblks
, vfs_context_t context
);
149 static int hfs_overlapped_overflow_extents(struct hfsmount
*hfsmp
, u_int32_t startblk
,
150 u_int32_t catblks
, u_int32_t fileID
, int rsrcfork
);
151 static int hfs_journal_replay(vnode_t devvp
, vfs_context_t context
);
155 * Called by vfs_mountroot when mounting HFS Plus as root.
160 hfs_mountroot(mount_t mp
, vnode_t rvp
, vfs_context_t context
)
162 struct hfsmount
*hfsmp
;
164 struct vfsstatfs
*vfsp
;
167 if ((error
= hfs_mountfs(rvp
, mp
, NULL
, 0, context
)))
171 hfsmp
= VFSTOHFS(mp
);
173 hfsmp
->hfs_uid
= UNKNOWNUID
;
174 hfsmp
->hfs_gid
= UNKNOWNGID
;
175 hfsmp
->hfs_dir_mask
= (S_IRWXU
| S_IRGRP
|S_IXGRP
| S_IROTH
|S_IXOTH
); /* 0755 */
176 hfsmp
->hfs_file_mask
= (S_IRWXU
| S_IRGRP
|S_IXGRP
| S_IROTH
|S_IXOTH
); /* 0755 */
178 /* Establish the free block reserve. */
179 vcb
= HFSTOVCB(hfsmp
);
180 vcb
->reserveBlocks
= ((u_int64_t
)vcb
->totalBlocks
* HFS_MINFREE
) / 100;
181 vcb
->reserveBlocks
= MIN(vcb
->reserveBlocks
, HFS_MAXRESERVE
/ vcb
->blockSize
);
183 vfsp
= vfs_statfs(mp
);
184 (void)hfs_statfs(mp
, vfsp
, NULL
);
197 hfs_mount(struct mount
*mp
, vnode_t devvp
, user_addr_t data
, vfs_context_t context
)
199 struct proc
*p
= vfs_context_proc(context
);
200 struct hfsmount
*hfsmp
= NULL
;
201 struct hfs_mount_args args
;
205 if ((retval
= copyin(data
, (caddr_t
)&args
, sizeof(args
)))) {
208 cmdflags
= (u_int32_t
)vfs_flags(mp
) & MNT_CMDFLAGS
;
209 if (cmdflags
& MNT_UPDATE
) {
210 hfsmp
= VFSTOHFS(mp
);
212 /* Reload incore data after an fsck. */
213 if (cmdflags
& MNT_RELOAD
) {
214 if (vfs_isrdonly(mp
))
215 return hfs_reload(mp
);
220 /* Change to a read-only file system. */
221 if (((hfsmp
->hfs_flags
& HFS_READ_ONLY
) == 0) &&
225 /* Set flag to indicate that a downgrade to read-only
226 * is in progress and therefore block any further
227 * modifications to the file system.
229 hfs_global_exclusive_lock_acquire(hfsmp
);
230 hfsmp
->hfs_flags
|= HFS_RDONLY_DOWNGRADE
;
231 hfsmp
->hfs_downgrading_proc
= current_thread();
232 hfs_global_exclusive_lock_release(hfsmp
);
234 /* use VFS_SYNC to push out System (btree) files */
235 retval
= VFS_SYNC(mp
, MNT_WAIT
, context
);
236 if (retval
&& ((cmdflags
& MNT_FORCE
) == 0)) {
237 hfsmp
->hfs_flags
&= ~HFS_RDONLY_DOWNGRADE
;
238 hfsmp
->hfs_downgrading_proc
= NULL
;
243 if (cmdflags
& MNT_FORCE
)
246 if ((retval
= hfs_flushfiles(mp
, flags
, p
))) {
247 hfsmp
->hfs_flags
&= ~HFS_RDONLY_DOWNGRADE
;
248 hfsmp
->hfs_downgrading_proc
= NULL
;
252 /* mark the volume cleanly unmounted */
253 hfsmp
->vcbAtrb
|= kHFSVolumeUnmountedMask
;
254 retval
= hfs_flushvolumeheader(hfsmp
, MNT_WAIT
, 0);
255 hfsmp
->hfs_flags
|= HFS_READ_ONLY
;
257 /* also get the volume bitmap blocks */
259 if (vnode_mount(hfsmp
->hfs_devvp
) == mp
) {
260 retval
= hfs_fsync(hfsmp
->hfs_devvp
, MNT_WAIT
, 0, p
);
262 vnode_get(hfsmp
->hfs_devvp
);
263 retval
= VNOP_FSYNC(hfsmp
->hfs_devvp
, MNT_WAIT
, context
);
264 vnode_put(hfsmp
->hfs_devvp
);
268 hfsmp
->hfs_flags
&= ~HFS_RDONLY_DOWNGRADE
;
269 hfsmp
->hfs_downgrading_proc
= NULL
;
270 hfsmp
->hfs_flags
&= ~HFS_READ_ONLY
;
274 hfs_global_exclusive_lock_acquire(hfsmp
);
276 journal_close(hfsmp
->jnl
);
279 // Note: we explicitly don't want to shutdown
280 // access to the jvp because we may need
281 // it later if we go back to being read-write.
283 hfs_global_exclusive_lock_release(hfsmp
);
286 hfsmp
->hfs_downgrading_proc
= NULL
;
289 /* Change to a writable file system. */
290 if (vfs_iswriteupgrade(mp
)) {
293 * On inconsistent disks, do not allow read-write mount
294 * unless it is the boot volume being mounted.
296 if (!(vfs_flags(mp
) & MNT_ROOTFS
) &&
297 (hfsmp
->vcbAtrb
& kHFSVolumeInconsistentMask
)) {
302 // If the journal was shut-down previously because we were
303 // asked to be read-only, let's start it back up again now
305 if ( (HFSTOVCB(hfsmp
)->vcbAtrb
& kHFSVolumeJournaledMask
)
306 && hfsmp
->jnl
== NULL
307 && hfsmp
->jvp
!= NULL
) {
310 if (hfsmp
->hfs_flags
& HFS_NEED_JNL_RESET
) {
311 jflags
= JOURNAL_RESET
;
316 hfs_global_exclusive_lock_acquire(hfsmp
);
318 hfsmp
->jnl
= journal_open(hfsmp
->jvp
,
319 (hfsmp
->jnl_start
* HFSTOVCB(hfsmp
)->blockSize
) + (off_t
)HFSTOVCB(hfsmp
)->hfsPlusIOPosOffset
,
322 hfsmp
->hfs_logical_block_size
,
325 hfs_sync_metadata
, hfsmp
->hfs_mp
);
327 hfs_global_exclusive_lock_release(hfsmp
);
329 if (hfsmp
->jnl
== NULL
) {
333 hfsmp
->hfs_flags
&= ~HFS_NEED_JNL_RESET
;
338 /* See if we need to erase unused Catalog nodes due to <rdar://problem/6947811>. */
339 retval
= hfs_erase_unused_nodes(hfsmp
);
340 if (retval
!= E_NONE
)
343 /* Only clear HFS_READ_ONLY after a successful write */
344 hfsmp
->hfs_flags
&= ~HFS_READ_ONLY
;
346 /* If this mount point was downgraded from read-write
347 * to read-only, clear that information as we are now
348 * moving back to read-write.
350 hfsmp
->hfs_flags
&= ~HFS_RDONLY_DOWNGRADE
;
351 hfsmp
->hfs_downgrading_proc
= NULL
;
353 /* mark the volume dirty (clear clean unmount bit) */
354 hfsmp
->vcbAtrb
&= ~kHFSVolumeUnmountedMask
;
356 retval
= hfs_flushvolumeheader(hfsmp
, MNT_WAIT
, 0);
357 if (retval
!= E_NONE
)
360 if (!(hfsmp
->hfs_flags
& (HFS_READ_ONLY
| HFS_STANDARD
))) {
361 /* Setup private/hidden directories for hardlinks. */
362 hfs_privatedir_init(hfsmp
, FILE_HARDLINKS
);
363 hfs_privatedir_init(hfsmp
, DIR_HARDLINKS
);
365 hfs_remove_orphans(hfsmp
);
368 * Allow hot file clustering if conditions allow.
370 if (hfsmp
->hfs_flags
& HFS_METADATA_ZONE
) {
371 (void) hfs_recording_init(hfsmp
);
373 /* Force ACLs on HFS+ file systems. */
374 if (vfs_extendedsecurity(HFSTOVFS(hfsmp
)) == 0) {
375 vfs_setextendedsecurity(HFSTOVFS(hfsmp
));
380 /* Update file system parameters. */
381 retval
= hfs_changefs(mp
, &args
);
383 } else /* not an update request */ {
385 /* Set the mount flag to indicate that we support volfs */
386 vfs_setflags(mp
, (u_int64_t
)((unsigned int)MNT_DOVOLFS
));
388 retval
= hfs_mountfs(devvp
, mp
, &args
, 0, context
);
392 (void)hfs_statfs(mp
, vfs_statfs(mp
), context
);
398 struct hfs_changefs_cargs
{
399 struct hfsmount
*hfsmp
;
406 hfs_changefs_callback(struct vnode
*vp
, void *cargs
)
410 struct cat_desc cndesc
;
411 struct cat_attr cnattr
;
412 struct hfs_changefs_cargs
*args
;
416 args
= (struct hfs_changefs_cargs
*)cargs
;
419 vcb
= HFSTOVCB(args
->hfsmp
);
421 lockflags
= hfs_systemfile_lock(args
->hfsmp
, SFL_CATALOG
, HFS_SHARED_LOCK
);
422 error
= cat_lookup(args
->hfsmp
, &cp
->c_desc
, 0, &cndesc
, &cnattr
, NULL
, NULL
);
423 hfs_systemfile_unlock(args
->hfsmp
, lockflags
);
426 * If we couldn't find this guy skip to the next one
431 return (VNODE_RETURNED
);
434 * Get the real uid/gid and perm mask from disk.
436 if (args
->permswitch
|| args
->permfix
) {
437 cp
->c_uid
= cnattr
.ca_uid
;
438 cp
->c_gid
= cnattr
.ca_gid
;
439 cp
->c_mode
= cnattr
.ca_mode
;
442 * If we're switching name converters then...
443 * Remove the existing entry from the namei cache.
444 * Update name to one based on new encoder.
448 replace_desc(cp
, &cndesc
);
450 if (cndesc
.cd_cnid
== kHFSRootFolderID
) {
451 strlcpy((char *)vcb
->vcbVN
, (const char *)cp
->c_desc
.cd_nameptr
, NAME_MAX
+1);
452 cp
->c_desc
.cd_encoding
= args
->hfsmp
->hfs_encoding
;
455 cat_releasedesc(&cndesc
);
457 return (VNODE_RETURNED
);
460 /* Change fs mount parameters */
462 hfs_changefs(struct mount
*mp
, struct hfs_mount_args
*args
)
465 int namefix
, permfix
, permswitch
;
466 struct hfsmount
*hfsmp
;
468 hfs_to_unicode_func_t get_unicode_func
;
469 unicode_to_hfs_func_t get_hfsname_func
;
470 u_int32_t old_encoding
= 0;
471 struct hfs_changefs_cargs cargs
;
472 u_int32_t mount_flags
;
474 hfsmp
= VFSTOHFS(mp
);
475 vcb
= HFSTOVCB(hfsmp
);
476 mount_flags
= (unsigned int)vfs_flags(mp
);
478 hfsmp
->hfs_flags
|= HFS_IN_CHANGEFS
;
480 permswitch
= (((hfsmp
->hfs_flags
& HFS_UNKNOWN_PERMS
) &&
481 ((mount_flags
& MNT_UNKNOWNPERMISSIONS
) == 0)) ||
482 (((hfsmp
->hfs_flags
& HFS_UNKNOWN_PERMS
) == 0) &&
483 (mount_flags
& MNT_UNKNOWNPERMISSIONS
)));
485 /* The root filesystem must operate with actual permissions: */
486 if (permswitch
&& (mount_flags
& MNT_ROOTFS
) && (mount_flags
& MNT_UNKNOWNPERMISSIONS
)) {
487 vfs_clearflags(mp
, (u_int64_t
)((unsigned int)MNT_UNKNOWNPERMISSIONS
)); /* Just say "No". */
491 if (mount_flags
& MNT_UNKNOWNPERMISSIONS
)
492 hfsmp
->hfs_flags
|= HFS_UNKNOWN_PERMS
;
494 hfsmp
->hfs_flags
&= ~HFS_UNKNOWN_PERMS
;
496 namefix
= permfix
= 0;
499 * Tracking of hot files requires up-to-date access times. So if
500 * access time updates are disabled, we must also disable hot files.
502 if (mount_flags
& MNT_NOATIME
) {
503 (void) hfs_recording_suspend(hfsmp
);
506 /* Change the timezone (Note: this affects all hfs volumes and hfs+ volume create dates) */
507 if (args
->hfs_timezone
.tz_minuteswest
!= VNOVAL
) {
508 gTimeZone
= args
->hfs_timezone
;
511 /* Change the default uid, gid and/or mask */
512 if ((args
->hfs_uid
!= (uid_t
)VNOVAL
) && (hfsmp
->hfs_uid
!= args
->hfs_uid
)) {
513 hfsmp
->hfs_uid
= args
->hfs_uid
;
514 if (vcb
->vcbSigWord
== kHFSPlusSigWord
)
517 if ((args
->hfs_gid
!= (gid_t
)VNOVAL
) && (hfsmp
->hfs_gid
!= args
->hfs_gid
)) {
518 hfsmp
->hfs_gid
= args
->hfs_gid
;
519 if (vcb
->vcbSigWord
== kHFSPlusSigWord
)
522 if (args
->hfs_mask
!= (mode_t
)VNOVAL
) {
523 if (hfsmp
->hfs_dir_mask
!= (args
->hfs_mask
& ALLPERMS
)) {
524 hfsmp
->hfs_dir_mask
= args
->hfs_mask
& ALLPERMS
;
525 hfsmp
->hfs_file_mask
= args
->hfs_mask
& ALLPERMS
;
526 if ((args
->flags
!= VNOVAL
) && (args
->flags
& HFSFSMNT_NOXONFILES
))
527 hfsmp
->hfs_file_mask
= (args
->hfs_mask
& DEFFILEMODE
);
528 if (vcb
->vcbSigWord
== kHFSPlusSigWord
)
533 /* Change the hfs encoding value (hfs only) */
534 if ((vcb
->vcbSigWord
== kHFSSigWord
) &&
535 (args
->hfs_encoding
!= (u_int32_t
)VNOVAL
) &&
536 (hfsmp
->hfs_encoding
!= args
->hfs_encoding
)) {
538 retval
= hfs_getconverter(args
->hfs_encoding
, &get_unicode_func
, &get_hfsname_func
);
543 * Connect the new hfs_get_unicode converter but leave
544 * the old hfs_get_hfsname converter in place so that
545 * we can lookup existing vnodes to get their correctly
548 * When we're all finished, we can then connect the new
549 * hfs_get_hfsname converter and release our interest
550 * in the old converters.
552 hfsmp
->hfs_get_unicode
= get_unicode_func
;
553 old_encoding
= hfsmp
->hfs_encoding
;
554 hfsmp
->hfs_encoding
= args
->hfs_encoding
;
558 if (!(namefix
|| permfix
|| permswitch
))
561 /* XXX 3762912 hack to support HFS filesystem 'owner' */
564 hfsmp
->hfs_uid
== UNKNOWNUID
? KAUTH_UID_NONE
: hfsmp
->hfs_uid
,
565 hfsmp
->hfs_gid
== UNKNOWNGID
? KAUTH_GID_NONE
: hfsmp
->hfs_gid
);
568 * For each active vnode fix things that changed
570 * Note that we can visit a vnode more than once
571 * and we can race with fsync.
573 * hfs_changefs_callback will be called for each vnode
574 * hung off of this mount point
576 * The vnode will be properly referenced and unreferenced
577 * around the callback
580 cargs
.namefix
= namefix
;
581 cargs
.permfix
= permfix
;
582 cargs
.permswitch
= permswitch
;
584 vnode_iterate(mp
, 0, hfs_changefs_callback
, (void *)&cargs
);
587 * If we're switching name converters we can now
588 * connect the new hfs_get_hfsname converter and
589 * release our interest in the old converters.
592 hfsmp
->hfs_get_hfsname
= get_hfsname_func
;
593 vcb
->volumeNameEncodingHint
= args
->hfs_encoding
;
594 (void) hfs_relconverter(old_encoding
);
597 hfsmp
->hfs_flags
&= ~HFS_IN_CHANGEFS
;
602 struct hfs_reload_cargs
{
603 struct hfsmount
*hfsmp
;
608 hfs_reload_callback(struct vnode
*vp
, void *cargs
)
611 struct hfs_reload_cargs
*args
;
614 args
= (struct hfs_reload_cargs
*)cargs
;
616 * flush all the buffers associated with this node
618 (void) buf_invalidateblks(vp
, 0, 0, 0);
622 * Remove any directory hints
625 hfs_reldirhints(cp
, 0);
628 * Re-read cnode data for all active vnodes (non-metadata files).
630 if (!vnode_issystem(vp
) && !VNODE_IS_RSRC(vp
)) {
631 struct cat_fork
*datafork
;
632 struct cat_desc desc
;
634 datafork
= cp
->c_datafork
? &cp
->c_datafork
->ff_data
: NULL
;
636 /* lookup by fileID since name could have changed */
637 lockflags
= hfs_systemfile_lock(args
->hfsmp
, SFL_CATALOG
, HFS_SHARED_LOCK
);
638 args
->error
= cat_idlookup(args
->hfsmp
, cp
->c_fileid
, 0, &desc
, &cp
->c_attr
, datafork
);
639 hfs_systemfile_unlock(args
->hfsmp
, lockflags
);
641 return (VNODE_RETURNED_DONE
);
644 /* update cnode's catalog descriptor */
645 (void) replace_desc(cp
, &desc
);
647 return (VNODE_RETURNED
);
651 * Reload all incore data for a filesystem (used after running fsck on
652 * the root filesystem and finding things to fix). The filesystem must
653 * be mounted read-only.
655 * Things to do to update the mount:
656 * invalidate all cached meta-data.
657 * invalidate all inactive vnodes.
658 * invalidate all cached file data.
659 * re-read volume header from disk.
660 * re-load meta-file info (extents, file size).
661 * re-load B-tree header data.
662 * re-read cnode data for all active vnodes.
665 hfs_reload(struct mount
*mountp
)
667 register struct vnode
*devvp
;
670 struct hfsmount
*hfsmp
;
671 struct HFSPlusVolumeHeader
*vhp
;
673 struct filefork
*forkp
;
674 struct cat_desc cndesc
;
675 struct hfs_reload_cargs args
;
676 daddr64_t priIDSector
;
678 hfsmp
= VFSTOHFS(mountp
);
679 vcb
= HFSTOVCB(hfsmp
);
681 if (vcb
->vcbSigWord
== kHFSSigWord
)
682 return (EINVAL
); /* rooting from HFS is not supported! */
685 * Invalidate all cached meta-data.
687 devvp
= hfsmp
->hfs_devvp
;
688 if (buf_invalidateblks(devvp
, 0, 0, 0))
689 panic("hfs_reload: dirty1");
694 * hfs_reload_callback will be called for each vnode
695 * hung off of this mount point that can't be recycled...
696 * vnode_iterate will recycle those that it can (the VNODE_RELOAD option)
697 * the vnode will be in an 'unbusy' state (VNODE_WAIT) and
698 * properly referenced and unreferenced around the callback
700 vnode_iterate(mountp
, VNODE_RELOAD
| VNODE_WAIT
, hfs_reload_callback
, (void *)&args
);
706 * Re-read VolumeHeader from disk.
708 priIDSector
= (daddr64_t
)((vcb
->hfsPlusIOPosOffset
/ hfsmp
->hfs_logical_block_size
) +
709 HFS_PRI_SECTOR(hfsmp
->hfs_logical_block_size
));
711 error
= (int)buf_meta_bread(hfsmp
->hfs_devvp
,
712 HFS_PHYSBLK_ROUNDDOWN(priIDSector
, hfsmp
->hfs_log_per_phys
),
713 hfsmp
->hfs_physical_block_size
, NOCRED
, &bp
);
720 vhp
= (HFSPlusVolumeHeader
*) (buf_dataptr(bp
) + HFS_PRI_OFFSET(hfsmp
->hfs_physical_block_size
));
722 /* Do a quick sanity check */
723 if ((SWAP_BE16(vhp
->signature
) != kHFSPlusSigWord
&&
724 SWAP_BE16(vhp
->signature
) != kHFSXSigWord
) ||
725 (SWAP_BE16(vhp
->version
) != kHFSPlusVersion
&&
726 SWAP_BE16(vhp
->version
) != kHFSXVersion
) ||
727 SWAP_BE32(vhp
->blockSize
) != vcb
->blockSize
) {
732 vcb
->vcbLsMod
= to_bsd_time(SWAP_BE32(vhp
->modifyDate
));
733 vcb
->vcbAtrb
= SWAP_BE32 (vhp
->attributes
);
734 vcb
->vcbJinfoBlock
= SWAP_BE32(vhp
->journalInfoBlock
);
735 vcb
->vcbClpSiz
= SWAP_BE32 (vhp
->rsrcClumpSize
);
736 vcb
->vcbNxtCNID
= SWAP_BE32 (vhp
->nextCatalogID
);
737 vcb
->vcbVolBkUp
= to_bsd_time(SWAP_BE32(vhp
->backupDate
));
738 vcb
->vcbWrCnt
= SWAP_BE32 (vhp
->writeCount
);
739 vcb
->vcbFilCnt
= SWAP_BE32 (vhp
->fileCount
);
740 vcb
->vcbDirCnt
= SWAP_BE32 (vhp
->folderCount
);
741 HFS_UPDATE_NEXT_ALLOCATION(vcb
, SWAP_BE32 (vhp
->nextAllocation
));
742 vcb
->totalBlocks
= SWAP_BE32 (vhp
->totalBlocks
);
743 vcb
->freeBlocks
= SWAP_BE32 (vhp
->freeBlocks
);
744 vcb
->encodingsBitmap
= SWAP_BE64 (vhp
->encodingsBitmap
);
745 bcopy(vhp
->finderInfo
, vcb
->vcbFndrInfo
, sizeof(vhp
->finderInfo
));
746 vcb
->localCreateDate
= SWAP_BE32 (vhp
->createDate
); /* hfs+ create date is in local time */
749 * Re-load meta-file vnode data (extent info, file size, etc).
751 forkp
= VTOF((struct vnode
*)vcb
->extentsRefNum
);
752 for (i
= 0; i
< kHFSPlusExtentDensity
; i
++) {
753 forkp
->ff_extents
[i
].startBlock
=
754 SWAP_BE32 (vhp
->extentsFile
.extents
[i
].startBlock
);
755 forkp
->ff_extents
[i
].blockCount
=
756 SWAP_BE32 (vhp
->extentsFile
.extents
[i
].blockCount
);
758 forkp
->ff_size
= SWAP_BE64 (vhp
->extentsFile
.logicalSize
);
759 forkp
->ff_blocks
= SWAP_BE32 (vhp
->extentsFile
.totalBlocks
);
760 forkp
->ff_clumpsize
= SWAP_BE32 (vhp
->extentsFile
.clumpSize
);
763 forkp
= VTOF((struct vnode
*)vcb
->catalogRefNum
);
764 for (i
= 0; i
< kHFSPlusExtentDensity
; i
++) {
765 forkp
->ff_extents
[i
].startBlock
=
766 SWAP_BE32 (vhp
->catalogFile
.extents
[i
].startBlock
);
767 forkp
->ff_extents
[i
].blockCount
=
768 SWAP_BE32 (vhp
->catalogFile
.extents
[i
].blockCount
);
770 forkp
->ff_size
= SWAP_BE64 (vhp
->catalogFile
.logicalSize
);
771 forkp
->ff_blocks
= SWAP_BE32 (vhp
->catalogFile
.totalBlocks
);
772 forkp
->ff_clumpsize
= SWAP_BE32 (vhp
->catalogFile
.clumpSize
);
774 if (hfsmp
->hfs_attribute_vp
) {
775 forkp
= VTOF(hfsmp
->hfs_attribute_vp
);
776 for (i
= 0; i
< kHFSPlusExtentDensity
; i
++) {
777 forkp
->ff_extents
[i
].startBlock
=
778 SWAP_BE32 (vhp
->attributesFile
.extents
[i
].startBlock
);
779 forkp
->ff_extents
[i
].blockCount
=
780 SWAP_BE32 (vhp
->attributesFile
.extents
[i
].blockCount
);
782 forkp
->ff_size
= SWAP_BE64 (vhp
->attributesFile
.logicalSize
);
783 forkp
->ff_blocks
= SWAP_BE32 (vhp
->attributesFile
.totalBlocks
);
784 forkp
->ff_clumpsize
= SWAP_BE32 (vhp
->attributesFile
.clumpSize
);
787 forkp
= VTOF((struct vnode
*)vcb
->allocationsRefNum
);
788 for (i
= 0; i
< kHFSPlusExtentDensity
; i
++) {
789 forkp
->ff_extents
[i
].startBlock
=
790 SWAP_BE32 (vhp
->allocationFile
.extents
[i
].startBlock
);
791 forkp
->ff_extents
[i
].blockCount
=
792 SWAP_BE32 (vhp
->allocationFile
.extents
[i
].blockCount
);
794 forkp
->ff_size
= SWAP_BE64 (vhp
->allocationFile
.logicalSize
);
795 forkp
->ff_blocks
= SWAP_BE32 (vhp
->allocationFile
.totalBlocks
);
796 forkp
->ff_clumpsize
= SWAP_BE32 (vhp
->allocationFile
.clumpSize
);
802 * Re-load B-tree header data
804 forkp
= VTOF((struct vnode
*)vcb
->extentsRefNum
);
805 if ( (error
= MacToVFSError( BTReloadData((FCB
*)forkp
) )) )
808 forkp
= VTOF((struct vnode
*)vcb
->catalogRefNum
);
809 if ( (error
= MacToVFSError( BTReloadData((FCB
*)forkp
) )) )
812 if (hfsmp
->hfs_attribute_vp
) {
813 forkp
= VTOF(hfsmp
->hfs_attribute_vp
);
814 if ( (error
= MacToVFSError( BTReloadData((FCB
*)forkp
) )) )
818 /* Reload the volume name */
819 if ((error
= cat_idlookup(hfsmp
, kHFSRootFolderID
, 0, &cndesc
, NULL
, NULL
)))
821 vcb
->volumeNameEncodingHint
= cndesc
.cd_encoding
;
822 bcopy(cndesc
.cd_nameptr
, vcb
->vcbVN
, min(255, cndesc
.cd_namelen
));
823 cat_releasedesc(&cndesc
);
825 /* Re-establish private/hidden directories. */
826 hfs_privatedir_init(hfsmp
, FILE_HARDLINKS
);
827 hfs_privatedir_init(hfsmp
, DIR_HARDLINKS
);
829 /* In case any volume information changed to trigger a notification */
830 hfs_generate_volume_notifications(hfsmp
);
838 hfs_syncer(void *arg0
, void *unused
)
840 #pragma unused(unused)
842 struct hfsmount
*hfsmp
= arg0
;
845 uint32_t delay
= HFS_META_DELAY
;
849 clock_get_calendar_microtime(&secs
, &usecs
);
850 now
= ((uint64_t)secs
* 1000000ULL) + (uint64_t)usecs
;
853 // If the amount of pending writes is more than our limit, wait
854 // for 2/3 of it to drain and then flush the journal.
856 if (hfsmp
->hfs_mp
->mnt_pending_write_size
> hfsmp
->hfs_max_pending_io
) {
858 uint64_t pending_io
, start
, rate
;
862 hfs_start_transaction(hfsmp
); // so we hold off any new i/o's
864 pending_io
= hfsmp
->hfs_mp
->mnt_pending_write_size
;
866 clock_get_calendar_microtime(&secs
, &usecs
);
867 start
= ((uint64_t)secs
* 1000000ULL) + (uint64_t)usecs
;
869 while(hfsmp
->hfs_mp
->mnt_pending_write_size
> (pending_io
/3) && counter
++ < 500) {
870 tsleep((caddr_t
)hfsmp
, PRIBIO
, "hfs-wait-for-io-to-drain", 10);
873 if (counter
>= 500) {
874 printf("hfs: timed out waiting for io to drain (%lld)\n", (int64_t)hfsmp
->hfs_mp
->mnt_pending_write_size
);
878 journal_flush(hfsmp
->jnl
);
880 hfs_sync(hfsmp
->hfs_mp
, MNT_WAIT
, vfs_context_kernel());
883 clock_get_calendar_microtime(&secs
, &usecs
);
884 now
= ((uint64_t)secs
* 1000000ULL) + (uint64_t)usecs
;
885 hfsmp
->hfs_last_sync_time
= now
;
886 rate
= ((pending_io
* 1000000ULL) / (now
- start
)); // yields bytes per second
888 hfs_end_transaction(hfsmp
);
891 // If a reasonable amount of time elapsed then check the
892 // i/o rate. If it's taking less than 1 second or more
893 // than 2 seconds, adjust hfs_max_pending_io so that we
894 // will allow about 1.5 seconds of i/o to queue up.
896 if ((now
- start
) >= 300000) {
897 uint64_t scale
= (pending_io
* 100) / rate
;
899 if (scale
< 100 || scale
> 200) {
900 // set it so that it should take about 1.5 seconds to drain
901 hfsmp
->hfs_max_pending_io
= (rate
* 150ULL) / 100ULL;
905 } else if ( ((now
- hfsmp
->hfs_last_sync_time
) >= 5000000ULL)
906 || (((now
- hfsmp
->hfs_last_sync_time
) >= 100000LL)
907 && ((now
- hfsmp
->hfs_last_sync_request_time
) >= 100000LL)
908 && (hfsmp
->hfs_active_threads
== 0)
909 && (hfsmp
->hfs_global_lock_nesting
== 0))) {
912 // Flush the journal if more than 5 seconds elapsed since
913 // the last sync OR we have not sync'ed recently and the
914 // last sync request time was more than 100 milliseconds
915 // ago and no one is in the middle of a transaction right
916 // now. Else we defer the sync and reschedule it.
919 lck_rw_lock_shared(&hfsmp
->hfs_global_lock
);
921 journal_flush(hfsmp
->jnl
);
923 lck_rw_unlock_shared(&hfsmp
->hfs_global_lock
);
925 hfs_sync(hfsmp
->hfs_mp
, MNT_WAIT
, vfs_context_kernel());
928 clock_get_calendar_microtime(&secs
, &usecs
);
929 now
= ((uint64_t)secs
* 1000000ULL) + (uint64_t)usecs
;
930 hfsmp
->hfs_last_sync_time
= now
;
932 } else if (hfsmp
->hfs_active_threads
== 0) {
935 clock_interval_to_deadline(delay
, HFS_MILLISEC_SCALE
, &deadline
);
936 thread_call_enter_delayed(hfsmp
->hfs_syncer
, deadline
);
938 // note: we intentionally return early here and do not
939 // decrement the sync_scheduled and sync_incomplete
940 // variables because we rescheduled the timer.
946 // NOTE: we decrement these *after* we're done the journal_flush() since
947 // it can take a significant amount of time and so we don't want more
948 // callbacks scheduled until we're done this one.
950 OSDecrementAtomic((volatile SInt32
*)&hfsmp
->hfs_sync_scheduled
);
951 OSDecrementAtomic((volatile SInt32
*)&hfsmp
->hfs_sync_incomplete
);
952 wakeup((caddr_t
)&hfsmp
->hfs_sync_incomplete
);
956 extern int IOBSDIsMediaEjectable( const char *cdev_name
);
959 * Common code for mount and mountroot
962 hfs_mountfs(struct vnode
*devvp
, struct mount
*mp
, struct hfs_mount_args
*args
,
963 int journal_replay_only
, vfs_context_t context
)
965 struct proc
*p
= vfs_context_proc(context
);
967 struct hfsmount
*hfsmp
= NULL
;
970 HFSMasterDirectoryBlock
*mdbp
= NULL
;
978 daddr64_t log_blkcnt
;
979 u_int32_t log_blksize
;
980 u_int32_t phys_blksize
;
981 u_int32_t minblksize
;
982 u_int32_t iswritable
;
983 daddr64_t mdb_offset
;
988 /* only hfs_mountroot passes us NULL as the 'args' argument */
992 ronly
= vfs_isrdonly(mp
);
993 dev
= vnode_specrdev(devvp
);
994 cred
= p
? vfs_context_ucred(context
) : NOCRED
;
1000 minblksize
= kHFSBlockSize
;
1002 /* Advisory locking should be handled at the VFS layer */
1003 vfs_setlocklocal(mp
);
1005 /* Get the logical block size (treated as physical block size everywhere) */
1006 if (VNOP_IOCTL(devvp
, DKIOCGETBLOCKSIZE
, (caddr_t
)&log_blksize
, 0, context
)) {
1010 if (log_blksize
== 0 || log_blksize
> 1024*1024*1024) {
1011 printf("hfs: logical block size 0x%x looks bad. Not mounting.\n", log_blksize
);
1016 /* Get the physical block size. */
1017 retval
= VNOP_IOCTL(devvp
, DKIOCGETPHYSICALBLOCKSIZE
, (caddr_t
)&phys_blksize
, 0, context
);
1019 if ((retval
!= ENOTSUP
) && (retval
!= ENOTTY
)) {
1023 /* If device does not support this ioctl, assume that physical
1024 * block size is same as logical block size
1026 phys_blksize
= log_blksize
;
1028 if (phys_blksize
== 0 || phys_blksize
> 1024*1024*1024) {
1029 printf("hfs: physical block size 0x%x looks bad. Not mounting.\n", phys_blksize
);
1034 /* Switch to 512 byte sectors (temporarily) */
1035 if (log_blksize
> 512) {
1036 u_int32_t size512
= 512;
1038 if (VNOP_IOCTL(devvp
, DKIOCSETBLOCKSIZE
, (caddr_t
)&size512
, FWRITE
, context
)) {
1043 /* Get the number of 512 byte physical blocks. */
1044 if (VNOP_IOCTL(devvp
, DKIOCGETBLOCKCOUNT
, (caddr_t
)&log_blkcnt
, 0, context
)) {
1045 /* resetting block size may fail if getting block count did */
1046 (void)VNOP_IOCTL(devvp
, DKIOCSETBLOCKSIZE
, (caddr_t
)&log_blksize
, FWRITE
, context
);
1051 /* Compute an accurate disk size (i.e. within 512 bytes) */
1052 disksize
= (u_int64_t
)log_blkcnt
* (u_int64_t
)512;
1055 * On Tiger it is not necessary to switch the device
1056 * block size to be 4k if there are more than 31-bits
1057 * worth of blocks but to insure compatibility with
1058 * pre-Tiger systems we have to do it.
1060 * If the device size is not a multiple of 4K (8 * 512), then
1061 * switching the logical block size isn't going to help because
1062 * we will be unable to write the alternate volume header.
1063 * In this case, just leave the logical block size unchanged.
1065 if (log_blkcnt
> 0x000000007fffffff && (log_blkcnt
& 7) == 0) {
1066 minblksize
= log_blksize
= 4096;
1067 if (phys_blksize
< log_blksize
)
1068 phys_blksize
= log_blksize
;
1072 * The cluster layer is not currently prepared to deal with a logical
1073 * block size larger than the system's page size. (It can handle
1074 * blocks per page, but not multiple pages per block.) So limit the
1075 * logical block size to the page size.
1077 if (log_blksize
> PAGE_SIZE
)
1078 log_blksize
= PAGE_SIZE
;
1080 /* Now switch to our preferred physical block size. */
1081 if (log_blksize
> 512) {
1082 if (VNOP_IOCTL(devvp
, DKIOCSETBLOCKSIZE
, (caddr_t
)&log_blksize
, FWRITE
, context
)) {
1086 /* Get the count of physical blocks. */
1087 if (VNOP_IOCTL(devvp
, DKIOCGETBLOCKCOUNT
, (caddr_t
)&log_blkcnt
, 0, context
)) {
1094 * minblksize is the minimum physical block size
1095 * log_blksize has our preferred physical block size
1096 * log_blkcnt has the total number of physical blocks
1099 mdb_offset
= (daddr64_t
)HFS_PRI_SECTOR(log_blksize
);
1100 if ((retval
= (int)buf_meta_bread(devvp
,
1101 HFS_PHYSBLK_ROUNDDOWN(mdb_offset
, (phys_blksize
/log_blksize
)),
1102 phys_blksize
, cred
, &bp
))) {
1105 MALLOC(mdbp
, HFSMasterDirectoryBlock
*, kMDBSize
, M_TEMP
, M_WAITOK
);
1110 bcopy((char *)buf_dataptr(bp
) + HFS_PRI_OFFSET(phys_blksize
), mdbp
, kMDBSize
);
1114 MALLOC(hfsmp
, struct hfsmount
*, sizeof(struct hfsmount
), M_HFSMNT
, M_WAITOK
);
1115 if (hfsmp
== NULL
) {
1119 bzero(hfsmp
, sizeof(struct hfsmount
));
1121 hfs_chashinit_finish(hfsmp
);
1124 * Init the volume information structure
1127 lck_mtx_init(&hfsmp
->hfs_mutex
, hfs_mutex_group
, hfs_lock_attr
);
1128 lck_mtx_init(&hfsmp
->hfc_mutex
, hfs_mutex_group
, hfs_lock_attr
);
1129 lck_rw_init(&hfsmp
->hfs_global_lock
, hfs_rwlock_group
, hfs_lock_attr
);
1130 lck_rw_init(&hfsmp
->hfs_insync
, hfs_rwlock_group
, hfs_lock_attr
);
1132 vfs_setfsprivate(mp
, hfsmp
);
1133 hfsmp
->hfs_mp
= mp
; /* Make VFSTOHFS work */
1134 hfsmp
->hfs_raw_dev
= vnode_specrdev(devvp
);
1135 hfsmp
->hfs_devvp
= devvp
;
1136 vnode_ref(devvp
); /* Hold a ref on the device, dropped when hfsmp is freed. */
1137 hfsmp
->hfs_logical_block_size
= log_blksize
;
1138 hfsmp
->hfs_logical_block_count
= log_blkcnt
;
1139 hfsmp
->hfs_physical_block_size
= phys_blksize
;
1140 hfsmp
->hfs_log_per_phys
= (phys_blksize
/ log_blksize
);
1141 hfsmp
->hfs_flags
|= HFS_WRITEABLE_MEDIA
;
1143 hfsmp
->hfs_flags
|= HFS_READ_ONLY
;
1144 if (((unsigned int)vfs_flags(mp
)) & MNT_UNKNOWNPERMISSIONS
)
1145 hfsmp
->hfs_flags
|= HFS_UNKNOWN_PERMS
;
1148 for (i
= 0; i
< MAXQUOTAS
; i
++)
1149 dqfileinit(&hfsmp
->hfs_qfiles
[i
]);
1153 hfsmp
->hfs_uid
= (args
->hfs_uid
== (uid_t
)VNOVAL
) ? UNKNOWNUID
: args
->hfs_uid
;
1154 if (hfsmp
->hfs_uid
== 0xfffffffd) hfsmp
->hfs_uid
= UNKNOWNUID
;
1155 hfsmp
->hfs_gid
= (args
->hfs_gid
== (gid_t
)VNOVAL
) ? UNKNOWNGID
: args
->hfs_gid
;
1156 if (hfsmp
->hfs_gid
== 0xfffffffd) hfsmp
->hfs_gid
= UNKNOWNGID
;
1157 vfs_setowner(mp
, hfsmp
->hfs_uid
, hfsmp
->hfs_gid
); /* tell the VFS */
1158 if (args
->hfs_mask
!= (mode_t
)VNOVAL
) {
1159 hfsmp
->hfs_dir_mask
= args
->hfs_mask
& ALLPERMS
;
1160 if (args
->flags
& HFSFSMNT_NOXONFILES
) {
1161 hfsmp
->hfs_file_mask
= (args
->hfs_mask
& DEFFILEMODE
);
1163 hfsmp
->hfs_file_mask
= args
->hfs_mask
& ALLPERMS
;
1166 hfsmp
->hfs_dir_mask
= UNKNOWNPERMISSIONS
& ALLPERMS
; /* 0777: rwx---rwx */
1167 hfsmp
->hfs_file_mask
= UNKNOWNPERMISSIONS
& DEFFILEMODE
; /* 0666: no --x by default? */
1169 if ((args
->flags
!= (int)VNOVAL
) && (args
->flags
& HFSFSMNT_WRAPPER
))
1172 /* Even w/o explicit mount arguments, MNT_UNKNOWNPERMISSIONS requires setting up uid, gid, and mask: */
1173 if (((unsigned int)vfs_flags(mp
)) & MNT_UNKNOWNPERMISSIONS
) {
1174 hfsmp
->hfs_uid
= UNKNOWNUID
;
1175 hfsmp
->hfs_gid
= UNKNOWNGID
;
1176 vfs_setowner(mp
, hfsmp
->hfs_uid
, hfsmp
->hfs_gid
); /* tell the VFS */
1177 hfsmp
->hfs_dir_mask
= UNKNOWNPERMISSIONS
& ALLPERMS
; /* 0777: rwx---rwx */
1178 hfsmp
->hfs_file_mask
= UNKNOWNPERMISSIONS
& DEFFILEMODE
; /* 0666: no --x by default? */
1182 /* Find out if disk media is writable. */
1183 if (VNOP_IOCTL(devvp
, DKIOCISWRITABLE
, (caddr_t
)&iswritable
, 0, context
) == 0) {
1185 hfsmp
->hfs_flags
|= HFS_WRITEABLE_MEDIA
;
1187 hfsmp
->hfs_flags
&= ~HFS_WRITEABLE_MEDIA
;
1190 // record the current time at which we're mounting this volume
1193 hfsmp
->hfs_mount_time
= tv
.tv_sec
;
1195 /* Mount a standard HFS disk */
1196 if ((SWAP_BE16(mdbp
->drSigWord
) == kHFSSigWord
) &&
1197 (mntwrapper
|| (SWAP_BE16(mdbp
->drEmbedSigWord
) != kHFSPlusSigWord
))) {
1199 /* On 10.6 and beyond, non read-only mounts for HFS standard vols get rejected */
1200 if (vfs_isrdwr(mp
)) {
1204 /* Treat it as if it's read-only and not writeable */
1205 hfsmp
->hfs_flags
|= HFS_READ_ONLY
;
1206 hfsmp
->hfs_flags
&= ~HFS_WRITEABLE_MEDIA
;
1208 /* If only journal replay is requested, exit immediately */
1209 if (journal_replay_only
) {
1214 if ((vfs_flags(mp
) & MNT_ROOTFS
)) {
1215 retval
= EINVAL
; /* Cannot root from HFS standard disks */
1218 /* HFS disks can only use 512 byte physical blocks */
1219 if (log_blksize
> kHFSBlockSize
) {
1220 log_blksize
= kHFSBlockSize
;
1221 if (VNOP_IOCTL(devvp
, DKIOCSETBLOCKSIZE
, (caddr_t
)&log_blksize
, FWRITE
, context
)) {
1225 if (VNOP_IOCTL(devvp
, DKIOCGETBLOCKCOUNT
, (caddr_t
)&log_blkcnt
, 0, context
)) {
1229 hfsmp
->hfs_logical_block_size
= log_blksize
;
1230 hfsmp
->hfs_logical_block_count
= log_blkcnt
;
1231 hfsmp
->hfs_physical_block_size
= log_blksize
;
1232 hfsmp
->hfs_log_per_phys
= 1;
1235 hfsmp
->hfs_encoding
= args
->hfs_encoding
;
1236 HFSTOVCB(hfsmp
)->volumeNameEncodingHint
= args
->hfs_encoding
;
1238 /* establish the timezone */
1239 gTimeZone
= args
->hfs_timezone
;
1242 retval
= hfs_getconverter(hfsmp
->hfs_encoding
, &hfsmp
->hfs_get_unicode
,
1243 &hfsmp
->hfs_get_hfsname
);
1247 retval
= hfs_MountHFSVolume(hfsmp
, mdbp
, p
);
1249 (void) hfs_relconverter(hfsmp
->hfs_encoding
);
1251 } else /* Mount an HFS Plus disk */ {
1252 HFSPlusVolumeHeader
*vhp
;
1253 off_t embeddedOffset
;
1254 int jnl_disable
= 0;
1256 /* Get the embedded Volume Header */
1257 if (SWAP_BE16(mdbp
->drEmbedSigWord
) == kHFSPlusSigWord
) {
1258 embeddedOffset
= SWAP_BE16(mdbp
->drAlBlSt
) * kHFSBlockSize
;
1259 embeddedOffset
+= (u_int64_t
)SWAP_BE16(mdbp
->drEmbedExtent
.startBlock
) *
1260 (u_int64_t
)SWAP_BE32(mdbp
->drAlBlkSiz
);
1263 * If the embedded volume doesn't start on a block
1264 * boundary, then switch the device to a 512-byte
1265 * block size so everything will line up on a block
1268 if ((embeddedOffset
% log_blksize
) != 0) {
1269 printf("hfs_mountfs: embedded volume offset not"
1270 " a multiple of physical block size (%d);"
1271 " switching to 512\n", log_blksize
);
1273 if (VNOP_IOCTL(devvp
, DKIOCSETBLOCKSIZE
,
1274 (caddr_t
)&log_blksize
, FWRITE
, context
)) {
1278 if (VNOP_IOCTL(devvp
, DKIOCGETBLOCKCOUNT
,
1279 (caddr_t
)&log_blkcnt
, 0, context
)) {
1283 /* Note: relative block count adjustment */
1284 hfsmp
->hfs_logical_block_count
*=
1285 hfsmp
->hfs_logical_block_size
/ log_blksize
;
1287 /* Update logical /physical block size */
1288 hfsmp
->hfs_logical_block_size
= log_blksize
;
1289 hfsmp
->hfs_physical_block_size
= log_blksize
;
1290 phys_blksize
= log_blksize
;
1291 hfsmp
->hfs_log_per_phys
= 1;
1294 disksize
= (u_int64_t
)SWAP_BE16(mdbp
->drEmbedExtent
.blockCount
) *
1295 (u_int64_t
)SWAP_BE32(mdbp
->drAlBlkSiz
);
1297 hfsmp
->hfs_logical_block_count
= disksize
/ log_blksize
;
1299 mdb_offset
= (daddr64_t
)((embeddedOffset
/ log_blksize
) + HFS_PRI_SECTOR(log_blksize
));
1300 retval
= (int)buf_meta_bread(devvp
, HFS_PHYSBLK_ROUNDDOWN(mdb_offset
, hfsmp
->hfs_log_per_phys
),
1301 phys_blksize
, cred
, &bp
);
1304 bcopy((char *)buf_dataptr(bp
) + HFS_PRI_OFFSET(phys_blksize
), mdbp
, 512);
1307 vhp
= (HFSPlusVolumeHeader
*) mdbp
;
1309 } else /* pure HFS+ */ {
1311 vhp
= (HFSPlusVolumeHeader
*) mdbp
;
1315 * On inconsistent disks, do not allow read-write mount
1316 * unless it is the boot volume being mounted. We also
1317 * always want to replay the journal if the journal_replay_only
1318 * flag is set because that will (most likely) get the
1319 * disk into a consistent state before fsck_hfs starts
1322 if ( !(vfs_flags(mp
) & MNT_ROOTFS
)
1323 && (SWAP_BE32(vhp
->attributes
) & kHFSVolumeInconsistentMask
)
1324 && !journal_replay_only
1325 && !(hfsmp
->hfs_flags
& HFS_READ_ONLY
)) {
1335 if (args
!= NULL
&& (args
->flags
& HFSFSMNT_EXTENDED_ARGS
) &&
1336 args
->journal_disable
) {
1341 // We only initialize the journal here if the last person
1342 // to mount this volume was journaling aware. Otherwise
1343 // we delay journal initialization until later at the end
1344 // of hfs_MountHFSPlusVolume() because the last person who
1345 // mounted it could have messed things up behind our back
1346 // (so we need to go find the .journal file, make sure it's
1347 // the right size, re-sync up if it was moved, etc).
1349 if ( (SWAP_BE32(vhp
->lastMountedVersion
) == kHFSJMountVersion
)
1350 && (SWAP_BE32(vhp
->attributes
) & kHFSVolumeJournaledMask
)
1353 // if we're able to init the journal, mark the mount
1354 // point as journaled.
1356 if ((retval
= hfs_early_journal_init(hfsmp
, vhp
, args
, embeddedOffset
, mdb_offset
, mdbp
, cred
)) == 0) {
1357 vfs_setflags(mp
, (u_int64_t
)((unsigned int)MNT_JOURNALED
));
1359 if (retval
== EROFS
) {
1360 // EROFS is a special error code that means the volume has an external
1361 // journal which we couldn't find. in that case we do not want to
1362 // rewrite the volume header - we'll just refuse to mount the volume.
1367 // if the journal failed to open, then set the lastMountedVersion
1368 // to be "FSK!" which fsck_hfs will see and force the fsck instead
1369 // of just bailing out because the volume is journaled.
1371 HFSPlusVolumeHeader
*jvhp
;
1373 hfsmp
->hfs_flags
|= HFS_NEED_JNL_RESET
;
1375 if (mdb_offset
== 0) {
1376 mdb_offset
= (daddr64_t
)((embeddedOffset
/ log_blksize
) + HFS_PRI_SECTOR(log_blksize
));
1380 retval
= (int)buf_meta_bread(devvp
,
1381 HFS_PHYSBLK_ROUNDDOWN(mdb_offset
, hfsmp
->hfs_log_per_phys
),
1382 phys_blksize
, cred
, &bp
);
1384 jvhp
= (HFSPlusVolumeHeader
*)(buf_dataptr(bp
) + HFS_PRI_OFFSET(phys_blksize
));
1386 if (SWAP_BE16(jvhp
->signature
) == kHFSPlusSigWord
|| SWAP_BE16(jvhp
->signature
) == kHFSXSigWord
) {
1387 printf ("hfs(1): Journal replay fail. Writing lastMountVersion as FSK!\n");
1388 jvhp
->lastMountedVersion
= SWAP_BE32(kFSKMountVersion
);
1396 // clear this so the error exit path won't try to use it
1401 // if this isn't the root device just bail out.
1402 // If it is the root device we just continue on
1403 // in the hopes that fsck_hfs will be able to
1404 // fix any damage that exists on the volume.
1405 if ( !(vfs_flags(mp
) & MNT_ROOTFS
)) {
1413 /* Either the journal is replayed successfully, or there
1414 * was nothing to replay, or no journal exists. In any case,
1417 if (journal_replay_only
) {
1422 (void) hfs_getconverter(0, &hfsmp
->hfs_get_unicode
, &hfsmp
->hfs_get_hfsname
);
1424 retval
= hfs_MountHFSPlusVolume(hfsmp
, vhp
, embeddedOffset
, disksize
, p
, args
, cred
);
1426 * If the backend didn't like our physical blocksize
1427 * then retry with physical blocksize of 512.
1429 if ((retval
== ENXIO
) && (log_blksize
> 512) && (log_blksize
!= minblksize
)) {
1430 printf("hfs_mountfs: could not use physical block size "
1431 "(%d) switching to 512\n", log_blksize
);
1433 if (VNOP_IOCTL(devvp
, DKIOCSETBLOCKSIZE
, (caddr_t
)&log_blksize
, FWRITE
, context
)) {
1437 if (VNOP_IOCTL(devvp
, DKIOCGETBLOCKCOUNT
, (caddr_t
)&log_blkcnt
, 0, context
)) {
1441 devvp
->v_specsize
= log_blksize
;
1442 /* Note: relative block count adjustment (in case this is an embedded volume). */
1443 hfsmp
->hfs_logical_block_count
*= hfsmp
->hfs_logical_block_size
/ log_blksize
;
1444 hfsmp
->hfs_logical_block_size
= log_blksize
;
1445 hfsmp
->hfs_log_per_phys
= hfsmp
->hfs_physical_block_size
/ log_blksize
;
1447 if (hfsmp
->jnl
&& hfsmp
->jvp
== devvp
) {
1448 // close and re-open this with the new block size
1449 journal_close(hfsmp
->jnl
);
1451 if (hfs_early_journal_init(hfsmp
, vhp
, args
, embeddedOffset
, mdb_offset
, mdbp
, cred
) == 0) {
1452 vfs_setflags(mp
, (u_int64_t
)((unsigned int)MNT_JOURNALED
));
1454 // if the journal failed to open, then set the lastMountedVersion
1455 // to be "FSK!" which fsck_hfs will see and force the fsck instead
1456 // of just bailing out because the volume is journaled.
1458 HFSPlusVolumeHeader
*jvhp
;
1460 hfsmp
->hfs_flags
|= HFS_NEED_JNL_RESET
;
1462 if (mdb_offset
== 0) {
1463 mdb_offset
= (daddr64_t
)((embeddedOffset
/ log_blksize
) + HFS_PRI_SECTOR(log_blksize
));
1467 retval
= (int)buf_meta_bread(devvp
, HFS_PHYSBLK_ROUNDDOWN(mdb_offset
, hfsmp
->hfs_log_per_phys
),
1468 phys_blksize
, cred
, &bp
);
1470 jvhp
= (HFSPlusVolumeHeader
*)(buf_dataptr(bp
) + HFS_PRI_OFFSET(phys_blksize
));
1472 if (SWAP_BE16(jvhp
->signature
) == kHFSPlusSigWord
|| SWAP_BE16(jvhp
->signature
) == kHFSXSigWord
) {
1473 printf ("hfs(2): Journal replay fail. Writing lastMountVersion as FSK!\n");
1474 jvhp
->lastMountedVersion
= SWAP_BE32(kFSKMountVersion
);
1482 // clear this so the error exit path won't try to use it
1487 // if this isn't the root device just bail out.
1488 // If it is the root device we just continue on
1489 // in the hopes that fsck_hfs will be able to
1490 // fix any damage that exists on the volume.
1491 if ( !(vfs_flags(mp
) & MNT_ROOTFS
)) {
1498 /* Try again with a smaller block size... */
1499 retval
= hfs_MountHFSPlusVolume(hfsmp
, vhp
, embeddedOffset
, disksize
, p
, args
, cred
);
1502 (void) hfs_relconverter(0);
1505 // save off a snapshot of the mtime from the previous mount
1507 hfsmp
->hfs_last_mounted_mtime
= hfsmp
->hfs_mtime
;
1513 mp
->mnt_vfsstat
.f_fsid
.val
[0] = (long)dev
;
1514 mp
->mnt_vfsstat
.f_fsid
.val
[1] = vfs_typenum(mp
);
1515 vfs_setmaxsymlen(mp
, 0);
1517 mp
->mnt_vtable
->vfc_vfsflags
|= VFC_VFSNATIVEXATTR
;
1519 mp
->mnt_kern_flag
|= MNTK_NAMED_STREAMS
;
1521 if (!(hfsmp
->hfs_flags
& HFS_STANDARD
)) {
1522 /* Tell VFS that we support directory hard links. */
1523 mp
->mnt_vtable
->vfc_vfsflags
|= VFC_VFSDIRLINKS
;
1525 /* HFS standard doesn't support extended readdir! */
1526 mp
->mnt_vtable
->vfc_vfsflags
&= ~VFC_VFSREADDIR_EXTENDED
;
1531 * Set the free space warning levels for a non-root volume:
1533 * Set the "danger" limit to 1% of the volume size or 100MB, whichever
1534 * is less. Set the "warning" limit to 2% of the volume size or 150MB,
1535 * whichever is less. And last, set the "desired" freespace level to
1536 * to 3% of the volume size or 200MB, whichever is less.
1538 hfsmp
->hfs_freespace_notify_dangerlimit
=
1539 MIN(HFS_VERYLOWDISKTRIGGERLEVEL
/ HFSTOVCB(hfsmp
)->blockSize
,
1540 (HFSTOVCB(hfsmp
)->totalBlocks
/ 100) * HFS_VERYLOWDISKTRIGGERFRACTION
);
1541 hfsmp
->hfs_freespace_notify_warninglimit
=
1542 MIN(HFS_LOWDISKTRIGGERLEVEL
/ HFSTOVCB(hfsmp
)->blockSize
,
1543 (HFSTOVCB(hfsmp
)->totalBlocks
/ 100) * HFS_LOWDISKTRIGGERFRACTION
);
1544 hfsmp
->hfs_freespace_notify_desiredlevel
=
1545 MIN(HFS_LOWDISKSHUTOFFLEVEL
/ HFSTOVCB(hfsmp
)->blockSize
,
1546 (HFSTOVCB(hfsmp
)->totalBlocks
/ 100) * HFS_LOWDISKSHUTOFFFRACTION
);
1549 * Set the free space warning levels for the root volume:
1551 * Set the "danger" limit to 5% of the volume size or 125MB, whichever
1552 * is less. Set the "warning" limit to 10% of the volume size or 250MB,
1553 * whichever is less. And last, set the "desired" freespace level to
1554 * to 11% of the volume size or 375MB, whichever is less.
1556 hfsmp
->hfs_freespace_notify_dangerlimit
=
1557 MIN(HFS_ROOTVERYLOWDISKTRIGGERLEVEL
/ HFSTOVCB(hfsmp
)->blockSize
,
1558 (HFSTOVCB(hfsmp
)->totalBlocks
/ 100) * HFS_ROOTVERYLOWDISKTRIGGERFRACTION
);
1559 hfsmp
->hfs_freespace_notify_warninglimit
=
1560 MIN(HFS_ROOTLOWDISKTRIGGERLEVEL
/ HFSTOVCB(hfsmp
)->blockSize
,
1561 (HFSTOVCB(hfsmp
)->totalBlocks
/ 100) * HFS_ROOTLOWDISKTRIGGERFRACTION
);
1562 hfsmp
->hfs_freespace_notify_desiredlevel
=
1563 MIN(HFS_ROOTLOWDISKSHUTOFFLEVEL
/ HFSTOVCB(hfsmp
)->blockSize
,
1564 (HFSTOVCB(hfsmp
)->totalBlocks
/ 100) * HFS_ROOTLOWDISKSHUTOFFFRACTION
);
1567 /* Check if the file system exists on virtual device, like disk image */
1568 if (VNOP_IOCTL(devvp
, DKIOCISVIRTUAL
, (caddr_t
)&isvirtual
, 0, context
) == 0) {
1570 hfsmp
->hfs_flags
|= HFS_VIRTUAL_DEVICE
;
1574 /* do not allow ejectability checks on the root device */
1576 if ((hfsmp
->hfs_flags
& HFS_VIRTUAL_DEVICE
) == 0 &&
1577 IOBSDIsMediaEjectable(mp
->mnt_vfsstat
.f_mntfromname
)) {
1578 hfsmp
->hfs_max_pending_io
= 4096*1024; // a reasonable value to start with.
1579 hfsmp
->hfs_syncer
= thread_call_allocate(hfs_syncer
, hfsmp
);
1580 if (hfsmp
->hfs_syncer
== NULL
) {
1581 printf("hfs: failed to allocate syncer thread callback for %s (%s)\n",
1582 mp
->mnt_vfsstat
.f_mntfromname
, mp
->mnt_vfsstat
.f_mntonname
);
1588 * Start looking for free space to drop below this level and generate a
1589 * warning immediately if needed:
1591 hfsmp
->hfs_notification_conditions
= 0;
1592 hfs_generate_volume_notifications(hfsmp
);
1595 (void) hfs_flushvolumeheader(hfsmp
, MNT_WAIT
, 0);
1606 if (hfsmp
&& hfsmp
->jvp
&& hfsmp
->jvp
!= hfsmp
->hfs_devvp
) {
1607 vnode_clearmountedon(hfsmp
->jvp
);
1608 (void)VNOP_CLOSE(hfsmp
->jvp
, ronly
? FREAD
: FREAD
|FWRITE
, vfs_context_kernel());
1612 if (hfsmp
->hfs_devvp
) {
1613 vnode_rele(hfsmp
->hfs_devvp
);
1615 hfs_delete_chash(hfsmp
);
1617 FREE(hfsmp
, M_HFSMNT
);
1618 vfs_setfsprivate(mp
, NULL
);
1625 * Make a filesystem operational.
1626 * Nothing to do at the moment.
1630 hfs_start(__unused
struct mount
*mp
, __unused
int flags
, __unused vfs_context_t context
)
1637 * unmount system call
1640 hfs_unmount(struct mount
*mp
, int mntflags
, vfs_context_t context
)
1642 struct proc
*p
= vfs_context_proc(context
);
1643 struct hfsmount
*hfsmp
= VFSTOHFS(mp
);
1644 int retval
= E_NONE
;
1651 if (mntflags
& MNT_FORCE
) {
1652 flags
|= FORCECLOSE
;
1656 if ((retval
= hfs_flushfiles(mp
, flags
, p
)) && !force
)
1659 if (hfsmp
->hfs_flags
& HFS_METADATA_ZONE
)
1660 (void) hfs_recording_suspend(hfsmp
);
1663 * Cancel any pending timers for this volume. Then wait for any timers
1664 * which have fired, but whose callbacks have not yet completed.
1666 if (hfsmp
->hfs_syncer
)
1668 struct timespec ts
= {0, 100000000}; /* 0.1 seconds */
1671 * Cancel any timers that have been scheduled, but have not
1672 * fired yet. NOTE: The kernel considers a timer complete as
1673 * soon as it starts your callback, so the kernel does not
1674 * keep track of the number of callbacks in progress.
1676 if (thread_call_cancel(hfsmp
->hfs_syncer
))
1677 OSDecrementAtomic((volatile SInt32
*)&hfsmp
->hfs_sync_incomplete
);
1678 thread_call_free(hfsmp
->hfs_syncer
);
1679 hfsmp
->hfs_syncer
= NULL
;
1682 * This waits for all of the callbacks that were entered before
1683 * we did thread_call_cancel above, but have not completed yet.
1685 while(hfsmp
->hfs_sync_incomplete
> 0)
1687 msleep((caddr_t
)&hfsmp
->hfs_sync_incomplete
, NULL
, PWAIT
, "hfs_unmount", &ts
);
1690 if (hfsmp
->hfs_sync_incomplete
< 0)
1691 panic("hfs_unmount: pm_sync_incomplete underflow!\n");
1695 * Flush out the b-trees, volume bitmap and Volume Header
1697 if ((hfsmp
->hfs_flags
& HFS_READ_ONLY
) == 0) {
1698 retval
= hfs_start_transaction(hfsmp
);
1701 } else if (!force
) {
1705 if (hfsmp
->hfs_startup_vp
) {
1706 (void) hfs_lock(VTOC(hfsmp
->hfs_startup_vp
), HFS_EXCLUSIVE_LOCK
);
1707 retval
= hfs_fsync(hfsmp
->hfs_startup_vp
, MNT_WAIT
, 0, p
);
1708 hfs_unlock(VTOC(hfsmp
->hfs_startup_vp
));
1709 if (retval
&& !force
)
1713 if (hfsmp
->hfs_attribute_vp
) {
1714 (void) hfs_lock(VTOC(hfsmp
->hfs_attribute_vp
), HFS_EXCLUSIVE_LOCK
);
1715 retval
= hfs_fsync(hfsmp
->hfs_attribute_vp
, MNT_WAIT
, 0, p
);
1716 hfs_unlock(VTOC(hfsmp
->hfs_attribute_vp
));
1717 if (retval
&& !force
)
1721 (void) hfs_lock(VTOC(hfsmp
->hfs_catalog_vp
), HFS_EXCLUSIVE_LOCK
);
1722 retval
= hfs_fsync(hfsmp
->hfs_catalog_vp
, MNT_WAIT
, 0, p
);
1723 hfs_unlock(VTOC(hfsmp
->hfs_catalog_vp
));
1724 if (retval
&& !force
)
1727 (void) hfs_lock(VTOC(hfsmp
->hfs_extents_vp
), HFS_EXCLUSIVE_LOCK
);
1728 retval
= hfs_fsync(hfsmp
->hfs_extents_vp
, MNT_WAIT
, 0, p
);
1729 hfs_unlock(VTOC(hfsmp
->hfs_extents_vp
));
1730 if (retval
&& !force
)
1733 if (hfsmp
->hfs_allocation_vp
) {
1734 (void) hfs_lock(VTOC(hfsmp
->hfs_allocation_vp
), HFS_EXCLUSIVE_LOCK
);
1735 retval
= hfs_fsync(hfsmp
->hfs_allocation_vp
, MNT_WAIT
, 0, p
);
1736 hfs_unlock(VTOC(hfsmp
->hfs_allocation_vp
));
1737 if (retval
&& !force
)
1741 if (hfsmp
->hfc_filevp
&& vnode_issystem(hfsmp
->hfc_filevp
)) {
1742 retval
= hfs_fsync(hfsmp
->hfc_filevp
, MNT_WAIT
, 0, p
);
1743 if (retval
&& !force
)
1747 /* If runtime corruption was detected, indicate that the volume
1748 * was not unmounted cleanly.
1750 if (hfsmp
->vcbAtrb
& kHFSVolumeInconsistentMask
) {
1751 HFSTOVCB(hfsmp
)->vcbAtrb
&= ~kHFSVolumeUnmountedMask
;
1753 HFSTOVCB(hfsmp
)->vcbAtrb
|= kHFSVolumeUnmountedMask
;
1756 if (hfsmp
->hfs_flags
& HFS_HAS_SPARSE_DEVICE
) {
1758 u_int32_t min_start
= hfsmp
->totalBlocks
;
1760 // set the nextAllocation pointer to the smallest free block number
1761 // we've seen so on the next mount we won't rescan unnecessarily
1762 for(i
=0; i
< (int)hfsmp
->vcbFreeExtCnt
; i
++) {
1763 if (hfsmp
->vcbFreeExt
[i
].startBlock
< min_start
) {
1764 min_start
= hfsmp
->vcbFreeExt
[i
].startBlock
;
1767 if (min_start
< hfsmp
->nextAllocation
) {
1768 hfsmp
->nextAllocation
= min_start
;
1773 retval
= hfs_flushvolumeheader(hfsmp
, MNT_WAIT
, 0);
1775 HFSTOVCB(hfsmp
)->vcbAtrb
&= ~kHFSVolumeUnmountedMask
;
1777 goto err_exit
; /* could not flush everything */
1781 hfs_end_transaction(hfsmp
);
1787 hfs_journal_flush(hfsmp
);
1791 * Invalidate our caches and release metadata vnodes
1793 (void) hfsUnmount(hfsmp
, p
);
1796 * Last chance to dump unreferenced system files.
1798 (void) vflush(mp
, NULLVP
, FORCECLOSE
);
1800 if (HFSTOVCB(hfsmp
)->vcbSigWord
== kHFSSigWord
)
1801 (void) hfs_relconverter(hfsmp
->hfs_encoding
);
1805 journal_close(hfsmp
->jnl
);
1809 VNOP_FSYNC(hfsmp
->hfs_devvp
, MNT_WAIT
, context
);
1811 if (hfsmp
->jvp
&& hfsmp
->jvp
!= hfsmp
->hfs_devvp
) {
1812 vnode_clearmountedon(hfsmp
->jvp
);
1813 retval
= VNOP_CLOSE(hfsmp
->jvp
,
1814 hfsmp
->hfs_flags
& HFS_READ_ONLY
? FREAD
: FREAD
|FWRITE
,
1815 vfs_context_kernel());
1816 vnode_put(hfsmp
->jvp
);
1821 #ifdef HFS_SPARSE_DEV
1822 /* Drop our reference on the backing fs (if any). */
1823 if ((hfsmp
->hfs_flags
& HFS_HAS_SPARSE_DEVICE
) && hfsmp
->hfs_backingfs_rootvp
) {
1824 struct vnode
* tmpvp
;
1826 hfsmp
->hfs_flags
&= ~HFS_HAS_SPARSE_DEVICE
;
1827 tmpvp
= hfsmp
->hfs_backingfs_rootvp
;
1828 hfsmp
->hfs_backingfs_rootvp
= NULLVP
;
1831 #endif /* HFS_SPARSE_DEV */
1832 lck_mtx_destroy(&hfsmp
->hfc_mutex
, hfs_mutex_group
);
1833 vnode_rele(hfsmp
->hfs_devvp
);
1835 hfs_delete_chash(hfsmp
);
1836 FREE(hfsmp
, M_HFSMNT
);
1842 hfs_end_transaction(hfsmp
);
1849 * Return the root of a filesystem.
1852 hfs_vfs_root(struct mount
*mp
, struct vnode
**vpp
, __unused vfs_context_t context
)
1854 return hfs_vget(VFSTOHFS(mp
), (cnid_t
)kHFSRootFolderID
, vpp
, 1);
1859 * Do operations associated with quotas
1863 hfs_quotactl(__unused
struct mount
*mp
, __unused
int cmds
, __unused uid_t uid
, __unused caddr_t datap
, __unused vfs_context_t context
)
1869 hfs_quotactl(struct mount
*mp
, int cmds
, uid_t uid
, caddr_t datap
, vfs_context_t context
)
1871 struct proc
*p
= vfs_context_proc(context
);
1872 int cmd
, type
, error
;
1875 uid
= vfs_context_ucred(context
)->cr_ruid
;
1876 cmd
= cmds
>> SUBCMDSHIFT
;
1883 if (uid
== vfs_context_ucred(context
)->cr_ruid
)
1887 if ( (error
= vfs_context_suser(context
)) )
1891 type
= cmds
& SUBCMDMASK
;
1892 if ((u_int
)type
>= MAXQUOTAS
)
1894 if (vfs_busy(mp
, LK_NOWAIT
))
1900 error
= hfs_quotaon(p
, mp
, type
, datap
);
1904 error
= hfs_quotaoff(p
, mp
, type
);
1908 error
= hfs_setquota(mp
, uid
, type
, datap
);
1912 error
= hfs_setuse(mp
, uid
, type
, datap
);
1916 error
= hfs_getquota(mp
, uid
, type
, datap
);
1920 error
= hfs_qsync(mp
);
1924 error
= hfs_quotastat(mp
, type
, datap
);
1937 /* Subtype is composite of bits */
1938 #define HFS_SUBTYPE_JOURNALED 0x01
1939 #define HFS_SUBTYPE_CASESENSITIVE 0x02
1940 /* bits 2 - 6 reserved */
1941 #define HFS_SUBTYPE_STANDARDHFS 0x80
1944 * Get file system statistics.
1947 hfs_statfs(struct mount
*mp
, register struct vfsstatfs
*sbp
, __unused vfs_context_t context
)
1949 ExtendedVCB
*vcb
= VFSTOVCB(mp
);
1950 struct hfsmount
*hfsmp
= VFSTOHFS(mp
);
1951 u_int32_t freeCNIDs
;
1952 u_int16_t subtype
= 0;
1954 freeCNIDs
= (u_int32_t
)0xFFFFFFFF - (u_int32_t
)vcb
->vcbNxtCNID
;
1956 sbp
->f_bsize
= (u_int32_t
)vcb
->blockSize
;
1957 sbp
->f_iosize
= (size_t)cluster_max_io_size(mp
, 0);
1958 sbp
->f_blocks
= (u_int64_t
)((u_int32_t
)vcb
->totalBlocks
);
1959 sbp
->f_bfree
= (u_int64_t
)((u_int32_t
)hfs_freeblks(hfsmp
, 0));
1960 sbp
->f_bavail
= (u_int64_t
)((u_int32_t
)hfs_freeblks(hfsmp
, 1));
1961 sbp
->f_files
= (u_int64_t
)((u_int32_t
)(vcb
->totalBlocks
- 2)); /* max files is constrained by total blocks */
1962 sbp
->f_ffree
= (u_int64_t
)((u_int32_t
)(MIN(freeCNIDs
, sbp
->f_bavail
)));
1965 * Subtypes (flavors) for HFS
1966 * 0: Mac OS Extended
1967 * 1: Mac OS Extended (Journaled)
1968 * 2: Mac OS Extended (Case Sensitive)
1969 * 3: Mac OS Extended (Case Sensitive, Journaled)
1971 * 128: Mac OS Standard
1974 if (hfsmp
->hfs_flags
& HFS_STANDARD
) {
1975 subtype
= HFS_SUBTYPE_STANDARDHFS
;
1976 } else /* HFS Plus */ {
1978 subtype
|= HFS_SUBTYPE_JOURNALED
;
1979 if (hfsmp
->hfs_flags
& HFS_CASE_SENSITIVE
)
1980 subtype
|= HFS_SUBTYPE_CASESENSITIVE
;
1982 sbp
->f_fssubtype
= subtype
;
1989 // XXXdbg -- this is a callback to be used by the journal to
1990 // get meta data blocks flushed out to disk.
1992 // XXXdbg -- be smarter and don't flush *every* block on each
1993 // call. try to only flush some so we don't wind up
1994 // being too synchronous.
1998 hfs_sync_metadata(void *arg
)
2000 struct mount
*mp
= (struct mount
*)arg
;
2001 struct hfsmount
*hfsmp
;
2005 daddr64_t priIDSector
;
2006 hfsmp
= VFSTOHFS(mp
);
2007 vcb
= HFSTOVCB(hfsmp
);
2009 // now make sure the super block is flushed
2010 priIDSector
= (daddr64_t
)((vcb
->hfsPlusIOPosOffset
/ hfsmp
->hfs_logical_block_size
) +
2011 HFS_PRI_SECTOR(hfsmp
->hfs_logical_block_size
));
2013 retval
= (int)buf_meta_bread(hfsmp
->hfs_devvp
,
2014 HFS_PHYSBLK_ROUNDDOWN(priIDSector
, hfsmp
->hfs_log_per_phys
),
2015 hfsmp
->hfs_physical_block_size
, NOCRED
, &bp
);
2016 if ((retval
!= 0 ) && (retval
!= ENXIO
)) {
2017 printf("hfs_sync_metadata: can't read volume header at %d! (retval 0x%x)\n",
2018 (int)priIDSector
, retval
);
2021 if (retval
== 0 && ((buf_flags(bp
) & (B_DELWRI
| B_LOCKED
)) == B_DELWRI
)) {
2027 // the alternate super block...
2028 // XXXdbg - we probably don't need to do this each and every time.
2029 // hfs_btreeio.c:FlushAlternate() should flag when it was
2031 if (hfsmp
->hfs_alt_id_sector
) {
2032 retval
= (int)buf_meta_bread(hfsmp
->hfs_devvp
,
2033 HFS_PHYSBLK_ROUNDDOWN(hfsmp
->hfs_alt_id_sector
, hfsmp
->hfs_log_per_phys
),
2034 hfsmp
->hfs_physical_block_size
, NOCRED
, &bp
);
2035 if (retval
== 0 && ((buf_flags(bp
) & (B_DELWRI
| B_LOCKED
)) == B_DELWRI
)) {
2044 struct hfs_sync_cargs
{
2053 hfs_sync_callback(struct vnode
*vp
, void *cargs
)
2056 struct hfs_sync_cargs
*args
;
2059 args
= (struct hfs_sync_cargs
*)cargs
;
2061 if (hfs_lock(VTOC(vp
), HFS_EXCLUSIVE_LOCK
) != 0) {
2062 return (VNODE_RETURNED
);
2066 if ((cp
->c_flag
& C_MODIFIED
) ||
2067 (cp
->c_touch_acctime
| cp
->c_touch_chgtime
| cp
->c_touch_modtime
) ||
2068 vnode_hasdirtyblks(vp
)) {
2069 error
= hfs_fsync(vp
, args
->waitfor
, 0, args
->p
);
2072 args
->error
= error
;
2075 return (VNODE_RETURNED
);
2081 * Go through the disk queues to initiate sandbagged IO;
2082 * go through the inodes to write those that have been modified;
2083 * initiate the writing of the super block if it has been modified.
2085 * Note: we are always called with the filesystem marked `MPBUSY'.
2088 hfs_sync(struct mount
*mp
, int waitfor
, vfs_context_t context
)
2090 struct proc
*p
= vfs_context_proc(context
);
2092 struct hfsmount
*hfsmp
;
2094 struct vnode
*meta_vp
[4];
2096 int error
, allerror
= 0;
2097 struct hfs_sync_cargs args
;
2099 hfsmp
= VFSTOHFS(mp
);
2102 * hfs_changefs might be manipulating vnodes so back off
2104 if (hfsmp
->hfs_flags
& HFS_IN_CHANGEFS
)
2107 if (hfsmp
->hfs_flags
& HFS_READ_ONLY
)
2110 /* skip over frozen volumes */
2111 if (!lck_rw_try_lock_shared(&hfsmp
->hfs_insync
))
2114 args
.cred
= kauth_cred_get();
2115 args
.waitfor
= waitfor
;
2119 * hfs_sync_callback will be called for each vnode
2120 * hung off of this mount point... the vnode will be
2121 * properly referenced and unreferenced around the callback
2123 vnode_iterate(mp
, 0, hfs_sync_callback
, (void *)&args
);
2126 allerror
= args
.error
;
2128 vcb
= HFSTOVCB(hfsmp
);
2130 meta_vp
[0] = vcb
->extentsRefNum
;
2131 meta_vp
[1] = vcb
->catalogRefNum
;
2132 meta_vp
[2] = vcb
->allocationsRefNum
; /* This is NULL for standard HFS */
2133 meta_vp
[3] = hfsmp
->hfs_attribute_vp
; /* Optional file */
2135 /* Now sync our three metadata files */
2136 for (i
= 0; i
< 4; ++i
) {
2140 if ((btvp
==0) || (vnode_mount(btvp
) != mp
))
2143 /* XXX use hfs_systemfile_lock instead ? */
2144 (void) hfs_lock(VTOC(btvp
), HFS_EXCLUSIVE_LOCK
);
2147 if (((cp
->c_flag
& C_MODIFIED
) == 0) &&
2148 (cp
->c_touch_acctime
== 0) &&
2149 (cp
->c_touch_chgtime
== 0) &&
2150 (cp
->c_touch_modtime
== 0) &&
2151 vnode_hasdirtyblks(btvp
) == 0) {
2152 hfs_unlock(VTOC(btvp
));
2155 error
= vnode_get(btvp
);
2157 hfs_unlock(VTOC(btvp
));
2160 if ((error
= hfs_fsync(btvp
, waitfor
, 0, p
)))
2168 * Force stale file system control information to be flushed.
2170 if (vcb
->vcbSigWord
== kHFSSigWord
) {
2171 if ((error
= VNOP_FSYNC(hfsmp
->hfs_devvp
, waitfor
, context
))) {
2179 hfs_hotfilesync(hfsmp
, vfs_context_kernel());
2182 * Write back modified superblock.
2184 if (IsVCBDirty(vcb
)) {
2185 error
= hfs_flushvolumeheader(hfsmp
, waitfor
, 0);
2191 hfs_journal_flush(hfsmp
);
2199 clock_get_calendar_microtime(&secs
, &usecs
);
2200 now
= ((uint64_t)secs
* 1000000ULL) + (uint64_t)usecs
;
2201 hfsmp
->hfs_last_sync_time
= now
;
2204 lck_rw_unlock_shared(&hfsmp
->hfs_insync
);
2210 * File handle to vnode
2212 * Have to be really careful about stale file handles:
2213 * - check that the cnode id is valid
2214 * - call hfs_vget() to get the locked cnode
2215 * - check for an unallocated cnode (i_mode == 0)
2216 * - check that the given client host has export rights and return
2217 * those rights via. exflagsp and credanonp
2220 hfs_fhtovp(struct mount
*mp
, int fhlen
, unsigned char *fhp
, struct vnode
**vpp
, __unused vfs_context_t context
)
2222 struct hfsfid
*hfsfhp
;
2227 hfsfhp
= (struct hfsfid
*)fhp
;
2229 if (fhlen
< (int)sizeof(struct hfsfid
))
2232 result
= hfs_vget(VFSTOHFS(mp
), ntohl(hfsfhp
->hfsfid_cnid
), &nvp
, 0);
2234 if (result
== ENOENT
)
2240 * We used to use the create time as the gen id of the file handle,
2241 * but it is not static enough because it can change at any point
2242 * via system calls. We still don't have another volume ID or other
2243 * unique identifier to use for a generation ID across reboots that
2244 * persists until the file is removed. Using only the CNID exposes
2245 * us to the potential wrap-around case, but as of 2/2008, it would take
2246 * over 2 months to wrap around if the machine did nothing but allocate
2247 * CNIDs. Using some kind of wrap counter would only be effective if
2248 * each file had the wrap counter associated with it. For now,
2249 * we use only the CNID to identify the file as it's good enough.
2254 hfs_unlock(VTOC(nvp
));
2260 * Vnode pointer to File handle
2264 hfs_vptofh(struct vnode
*vp
, int *fhlenp
, unsigned char *fhp
, __unused vfs_context_t context
)
2267 struct hfsfid
*hfsfhp
;
2269 if (ISHFS(VTOVCB(vp
)))
2270 return (ENOTSUP
); /* hfs standard is not exportable */
2272 if (*fhlenp
< (int)sizeof(struct hfsfid
))
2276 hfsfhp
= (struct hfsfid
*)fhp
;
2277 /* only the CNID is used to identify the file now */
2278 hfsfhp
->hfsfid_cnid
= htonl(cp
->c_fileid
);
2279 hfsfhp
->hfsfid_gen
= htonl(cp
->c_fileid
);
2280 *fhlenp
= sizeof(struct hfsfid
);
2287 * Initial HFS filesystems, done only once.
2290 hfs_init(__unused
struct vfsconf
*vfsp
)
2292 static int done
= 0;
2298 hfs_converterinit();
2303 hfs_lock_attr
= lck_attr_alloc_init();
2304 hfs_group_attr
= lck_grp_attr_alloc_init();
2305 hfs_mutex_group
= lck_grp_alloc_init("hfs-mutex", hfs_group_attr
);
2306 hfs_rwlock_group
= lck_grp_alloc_init("hfs-rwlock", hfs_group_attr
);
2316 hfs_getmountpoint(struct vnode
*vp
, struct hfsmount
**hfsmpp
)
2318 struct hfsmount
* hfsmp
;
2319 char fstypename
[MFSNAMELEN
];
2324 if (!vnode_isvroot(vp
))
2327 vnode_vfsname(vp
, fstypename
);
2328 if (strncmp(fstypename
, "hfs", sizeof(fstypename
)) != 0)
2333 if (HFSTOVCB(hfsmp
)->vcbSigWord
== kHFSSigWord
)
2342 #include <sys/filedesc.h>
2345 * HFS filesystem related variables.
2348 hfs_sysctl(int *name
, __unused u_int namelen
, user_addr_t oldp
, size_t *oldlenp
,
2349 user_addr_t newp
, size_t newlen
, vfs_context_t context
)
2351 struct proc
*p
= vfs_context_proc(context
);
2353 struct hfsmount
*hfsmp
;
2355 /* all sysctl names at this level are terminal */
2357 if (name
[0] == HFS_ENCODINGBIAS
) {
2360 bias
= hfs_getencodingbias();
2361 error
= sysctl_int(oldp
, oldlenp
, newp
, newlen
, &bias
);
2362 if (error
== 0 && newp
)
2363 hfs_setencodingbias(bias
);
2366 } else if (name
[0] == HFS_EXTEND_FS
) {
2368 vnode_t vp
= vfs_context_cwd(context
);
2370 if (newp
== USER_ADDR_NULL
|| vp
== NULLVP
)
2372 if ((error
= hfs_getmountpoint(vp
, &hfsmp
)))
2374 error
= sysctl_quad(oldp
, oldlenp
, newp
, newlen
, (quad_t
*)&newsize
);
2378 error
= hfs_extendfs(hfsmp
, newsize
, context
);
2381 } else if (name
[0] == HFS_ENCODINGHINT
) {
2385 u_int16_t
*unicode_name
= NULL
;
2386 char *filename
= NULL
;
2388 if ((newlen
<= 0) || (newlen
> MAXPATHLEN
))
2391 bufsize
= MAX(newlen
* 3, MAXPATHLEN
);
2392 MALLOC(filename
, char *, newlen
, M_TEMP
, M_WAITOK
);
2393 if (filename
== NULL
) {
2395 goto encodinghint_exit
;
2397 MALLOC(unicode_name
, u_int16_t
*, bufsize
, M_TEMP
, M_WAITOK
);
2398 if (filename
== NULL
) {
2400 goto encodinghint_exit
;
2403 error
= copyin(newp
, (caddr_t
)filename
, newlen
);
2405 error
= utf8_decodestr((u_int8_t
*)filename
, newlen
- 1, unicode_name
,
2406 &bytes
, bufsize
, 0, UTF_DECOMPOSED
);
2408 hint
= hfs_pickencoding(unicode_name
, bytes
/ 2);
2409 error
= sysctl_int(oldp
, oldlenp
, USER_ADDR_NULL
, 0, (int32_t *)&hint
);
2415 FREE(unicode_name
, M_TEMP
);
2417 FREE(filename
, M_TEMP
);
2420 } else if (name
[0] == HFS_ENABLE_JOURNALING
) {
2421 // make the file system journaled...
2422 vnode_t vp
= vfs_context_cwd(context
);
2425 struct cat_attr jnl_attr
, jinfo_attr
;
2426 struct cat_fork jnl_fork
, jinfo_fork
;
2430 /* Only root can enable journaling */
2438 if (hfsmp
->hfs_flags
& HFS_READ_ONLY
) {
2441 if (HFSTOVCB(hfsmp
)->vcbSigWord
== kHFSSigWord
) {
2442 printf("hfs: can't make a plain hfs volume journaled.\n");
2447 printf("hfs: volume @ mp %p is already journaled!\n", vnode_mount(vp
));
2451 vcb
= HFSTOVCB(hfsmp
);
2452 lockflags
= hfs_systemfile_lock(hfsmp
, SFL_CATALOG
| SFL_EXTENTS
, HFS_EXCLUSIVE_LOCK
);
2453 if (BTHasContiguousNodes(VTOF(vcb
->catalogRefNum
)) == 0 ||
2454 BTHasContiguousNodes(VTOF(vcb
->extentsRefNum
)) == 0) {
2456 printf("hfs: volume has a btree w/non-contiguous nodes. can not enable journaling.\n");
2457 hfs_systemfile_unlock(hfsmp
, lockflags
);
2460 hfs_systemfile_unlock(hfsmp
, lockflags
);
2462 // make sure these both exist!
2463 if ( GetFileInfo(vcb
, kHFSRootFolderID
, ".journal_info_block", &jinfo_attr
, &jinfo_fork
) == 0
2464 || GetFileInfo(vcb
, kHFSRootFolderID
, ".journal", &jnl_attr
, &jnl_fork
) == 0) {
2469 hfs_sync(hfsmp
->hfs_mp
, MNT_WAIT
, context
);
2471 printf("hfs: Initializing the journal (joffset 0x%llx sz 0x%llx)...\n",
2472 (off_t
)name
[2], (off_t
)name
[3]);
2475 // XXXdbg - note that currently (Sept, 08) hfs_util does not support
2476 // enabling the journal on a separate device so it is safe
2477 // to just copy hfs_devvp here. If hfs_util gets the ability
2478 // to dynamically enable the journal on a separate device then
2479 // we will have to do the same thing as hfs_early_journal_init()
2480 // to locate and open the journal device.
2482 jvp
= hfsmp
->hfs_devvp
;
2483 jnl
= journal_create(jvp
,
2484 (off_t
)name
[2] * (off_t
)HFSTOVCB(hfsmp
)->blockSize
2485 + HFSTOVCB(hfsmp
)->hfsPlusIOPosOffset
,
2486 (off_t
)((unsigned)name
[3]),
2488 hfsmp
->hfs_logical_block_size
,
2491 hfs_sync_metadata
, hfsmp
->hfs_mp
);
2494 printf("hfs: FAILED to create the journal!\n");
2495 if (jvp
&& jvp
!= hfsmp
->hfs_devvp
) {
2496 vnode_clearmountedon(jvp
);
2497 VNOP_CLOSE(jvp
, hfsmp
->hfs_flags
& HFS_READ_ONLY
? FREAD
: FREAD
|FWRITE
, vfs_context_kernel());
2504 hfs_global_exclusive_lock_acquire(hfsmp
);
2507 * Flush all dirty metadata buffers.
2509 buf_flushdirtyblks(hfsmp
->hfs_devvp
, MNT_WAIT
, 0, "hfs_sysctl");
2510 buf_flushdirtyblks(hfsmp
->hfs_extents_vp
, MNT_WAIT
, 0, "hfs_sysctl");
2511 buf_flushdirtyblks(hfsmp
->hfs_catalog_vp
, MNT_WAIT
, 0, "hfs_sysctl");
2512 buf_flushdirtyblks(hfsmp
->hfs_allocation_vp
, MNT_WAIT
, 0, "hfs_sysctl");
2513 if (hfsmp
->hfs_attribute_vp
)
2514 buf_flushdirtyblks(hfsmp
->hfs_attribute_vp
, MNT_WAIT
, 0, "hfs_sysctl");
2516 HFSTOVCB(hfsmp
)->vcbJinfoBlock
= name
[1];
2517 HFSTOVCB(hfsmp
)->vcbAtrb
|= kHFSVolumeJournaledMask
;
2521 // save this off for the hack-y check in hfs_remove()
2522 hfsmp
->jnl_start
= (u_int32_t
)name
[2];
2523 hfsmp
->jnl_size
= (off_t
)((unsigned)name
[3]);
2524 hfsmp
->hfs_jnlinfoblkid
= jinfo_attr
.ca_fileid
;
2525 hfsmp
->hfs_jnlfileid
= jnl_attr
.ca_fileid
;
2527 vfs_setflags(hfsmp
->hfs_mp
, (u_int64_t
)((unsigned int)MNT_JOURNALED
));
2529 hfs_global_exclusive_lock_release(hfsmp
);
2530 hfs_flushvolumeheader(hfsmp
, MNT_WAIT
, 1);
2535 fsid
.val
[0] = (int32_t)hfsmp
->hfs_raw_dev
;
2536 fsid
.val
[1] = (int32_t)vfs_typenum(HFSTOVFS(hfsmp
));
2537 vfs_event_signal(&fsid
, VQ_UPDATE
, (intptr_t)NULL
);
2540 } else if (name
[0] == HFS_DISABLE_JOURNALING
) {
2541 // clear the journaling bit
2542 vnode_t vp
= vfs_context_cwd(context
);
2544 /* Only root can disable journaling */
2554 * Disabling journaling is disallowed on volumes with directory hard links
2555 * because we have not tested the relevant code path.
2557 if (hfsmp
->hfs_private_attr
[DIR_HARDLINKS
].ca_entries
!= 0){
2558 printf("hfs: cannot disable journaling on volumes with directory hardlinks\n");
2562 printf("hfs: disabling journaling for mount @ %p\n", vnode_mount(vp
));
2564 hfs_global_exclusive_lock_acquire(hfsmp
);
2566 // Lights out for you buddy!
2567 journal_close(hfsmp
->jnl
);
2570 if (hfsmp
->jvp
&& hfsmp
->jvp
!= hfsmp
->hfs_devvp
) {
2571 vnode_clearmountedon(hfsmp
->jvp
);
2572 VNOP_CLOSE(hfsmp
->jvp
, hfsmp
->hfs_flags
& HFS_READ_ONLY
? FREAD
: FREAD
|FWRITE
, vfs_context_kernel());
2573 vnode_put(hfsmp
->jvp
);
2576 vfs_clearflags(hfsmp
->hfs_mp
, (u_int64_t
)((unsigned int)MNT_JOURNALED
));
2577 hfsmp
->jnl_start
= 0;
2578 hfsmp
->hfs_jnlinfoblkid
= 0;
2579 hfsmp
->hfs_jnlfileid
= 0;
2581 HFSTOVCB(hfsmp
)->vcbAtrb
&= ~kHFSVolumeJournaledMask
;
2583 hfs_global_exclusive_lock_release(hfsmp
);
2584 hfs_flushvolumeheader(hfsmp
, MNT_WAIT
, 1);
2589 fsid
.val
[0] = (int32_t)hfsmp
->hfs_raw_dev
;
2590 fsid
.val
[1] = (int32_t)vfs_typenum(HFSTOVFS(hfsmp
));
2591 vfs_event_signal(&fsid
, VQ_UPDATE
, (intptr_t)NULL
);
2594 } else if (name
[0] == HFS_GET_JOURNAL_INFO
) {
2595 vnode_t vp
= vfs_context_cwd(context
);
2596 off_t jnl_start
, jnl_size
;
2601 /* 64-bit processes won't work with this sysctl -- can't fit a pointer into an int! */
2602 if (proc_is64bit(current_proc()))
2606 if (hfsmp
->jnl
== NULL
) {
2610 jnl_start
= (off_t
)(hfsmp
->jnl_start
* HFSTOVCB(hfsmp
)->blockSize
) + (off_t
)HFSTOVCB(hfsmp
)->hfsPlusIOPosOffset
;
2611 jnl_size
= (off_t
)hfsmp
->jnl_size
;
2614 if ((error
= copyout((caddr_t
)&jnl_start
, CAST_USER_ADDR_T(name
[1]), sizeof(off_t
))) != 0) {
2617 if ((error
= copyout((caddr_t
)&jnl_size
, CAST_USER_ADDR_T(name
[2]), sizeof(off_t
))) != 0) {
2622 } else if (name
[0] == HFS_SET_PKG_EXTENSIONS
) {
2624 return set_package_extensions_table((user_addr_t
)((unsigned)name
[1]), name
[2], name
[3]);
2626 } else if (name
[0] == VFS_CTL_QUERY
) {
2627 struct sysctl_req
*req
;
2628 union union_vfsidctl vc
;
2632 req
= CAST_DOWN(struct sysctl_req
*, oldp
); /* we're new style vfs sysctl. */
2634 error
= SYSCTL_IN(req
, &vc
, proc_is64bit(p
)? sizeof(vc
.vc64
):sizeof(vc
.vc32
));
2635 if (error
) return (error
);
2637 mp
= vfs_getvfs(&vc
.vc32
.vc_fsid
); /* works for 32 and 64 */
2638 if (mp
== NULL
) return (ENOENT
);
2640 hfsmp
= VFSTOHFS(mp
);
2641 bzero(&vq
, sizeof(vq
));
2642 vq
.vq_flags
= hfsmp
->hfs_notification_conditions
;
2643 return SYSCTL_OUT(req
, &vq
, sizeof(vq
));;
2644 } else if (name
[0] == HFS_REPLAY_JOURNAL
) {
2645 vnode_t devvp
= NULL
;
2650 device_fd
= name
[1];
2651 error
= file_vnode(device_fd
, &devvp
);
2655 error
= vnode_getwithref(devvp
);
2657 file_drop(device_fd
);
2660 error
= hfs_journal_replay(devvp
, context
);
2661 file_drop(device_fd
);
2670 * hfs_vfs_vget is not static since it is used in hfs_readwrite.c to support
2671 * the build_path ioctl. We use it to leverage the code below that updates
2672 * the origin list cache if necessary
2676 hfs_vfs_vget(struct mount
*mp
, ino64_t ino
, struct vnode
**vpp
, __unused vfs_context_t context
)
2680 struct hfsmount
*hfsmp
;
2682 hfsmp
= VFSTOHFS(mp
);
2684 error
= hfs_vget(hfsmp
, (cnid_t
)ino
, vpp
, 1);
2689 * ADLs may need to have their origin state updated
2690 * since build_path needs a valid parent. The same is true
2691 * for hardlinked files as well. There isn't a race window here
2692 * in re-acquiring the cnode lock since we aren't pulling any data
2693 * out of the cnode; instead, we're going to the catalog.
2695 if ((VTOC(*vpp
)->c_flag
& C_HARDLINK
) &&
2696 (hfs_lock(VTOC(*vpp
), HFS_EXCLUSIVE_LOCK
) == 0)) {
2697 cnode_t
*cp
= VTOC(*vpp
);
2698 struct cat_desc cdesc
;
2700 if (!hfs_haslinkorigin(cp
)) {
2701 lockflags
= hfs_systemfile_lock(hfsmp
, SFL_CATALOG
, HFS_SHARED_LOCK
);
2702 error
= cat_findname(hfsmp
, (cnid_t
)ino
, &cdesc
);
2703 hfs_systemfile_unlock(hfsmp
, lockflags
);
2705 if ((cdesc
.cd_parentcnid
!= hfsmp
->hfs_private_desc
[DIR_HARDLINKS
].cd_cnid
) &&
2706 (cdesc
.cd_parentcnid
!= hfsmp
->hfs_private_desc
[FILE_HARDLINKS
].cd_cnid
)) {
2707 hfs_savelinkorigin(cp
, cdesc
.cd_parentcnid
);
2709 cat_releasedesc(&cdesc
);
2719 * Look up an HFS object by ID.
2721 * The object is returned with an iocount reference and the cnode locked.
2723 * If the object is a file then it will represent the data fork.
2727 hfs_vget(struct hfsmount
*hfsmp
, cnid_t cnid
, struct vnode
**vpp
, int skiplock
)
2729 struct vnode
*vp
= NULLVP
;
2730 struct cat_desc cndesc
;
2731 struct cat_attr cnattr
;
2732 struct cat_fork cnfork
;
2733 u_int32_t linkref
= 0;
2736 /* Check for cnids that should't be exported. */
2737 if ((cnid
< kHFSFirstUserCatalogNodeID
) &&
2738 (cnid
!= kHFSRootFolderID
&& cnid
!= kHFSRootParentID
)) {
2741 /* Don't export our private directories. */
2742 if (cnid
== hfsmp
->hfs_private_desc
[FILE_HARDLINKS
].cd_cnid
||
2743 cnid
== hfsmp
->hfs_private_desc
[DIR_HARDLINKS
].cd_cnid
) {
2747 * Check the hash first
2749 vp
= hfs_chash_getvnode(hfsmp
, cnid
, 0, skiplock
);
2755 bzero(&cndesc
, sizeof(cndesc
));
2756 bzero(&cnattr
, sizeof(cnattr
));
2757 bzero(&cnfork
, sizeof(cnfork
));
2760 * Not in hash, lookup in catalog
2762 if (cnid
== kHFSRootParentID
) {
2763 static char hfs_rootname
[] = "/";
2765 cndesc
.cd_nameptr
= (const u_int8_t
*)&hfs_rootname
[0];
2766 cndesc
.cd_namelen
= 1;
2767 cndesc
.cd_parentcnid
= kHFSRootParentID
;
2768 cndesc
.cd_cnid
= kHFSRootFolderID
;
2769 cndesc
.cd_flags
= CD_ISDIR
;
2771 cnattr
.ca_fileid
= kHFSRootFolderID
;
2772 cnattr
.ca_linkcount
= 1;
2773 cnattr
.ca_entries
= 1;
2774 cnattr
.ca_dircount
= 1;
2775 cnattr
.ca_mode
= (S_IFDIR
| S_IRWXU
| S_IRWXG
| S_IRWXO
);
2779 const char *nameptr
;
2781 lockflags
= hfs_systemfile_lock(hfsmp
, SFL_CATALOG
, HFS_SHARED_LOCK
);
2782 error
= cat_idlookup(hfsmp
, cnid
, 0, &cndesc
, &cnattr
, &cnfork
);
2783 hfs_systemfile_unlock(hfsmp
, lockflags
);
2791 * Check for a raw hardlink inode and save its linkref.
2793 pid
= cndesc
.cd_parentcnid
;
2794 nameptr
= (const char *)cndesc
.cd_nameptr
;
2796 if ((pid
== hfsmp
->hfs_private_desc
[FILE_HARDLINKS
].cd_cnid
) &&
2797 (bcmp(nameptr
, HFS_INODE_PREFIX
, HFS_INODE_PREFIX_LEN
) == 0)) {
2798 linkref
= strtoul(&nameptr
[HFS_INODE_PREFIX_LEN
], NULL
, 10);
2800 } else if ((pid
== hfsmp
->hfs_private_desc
[DIR_HARDLINKS
].cd_cnid
) &&
2801 (bcmp(nameptr
, HFS_DIRINODE_PREFIX
, HFS_DIRINODE_PREFIX_LEN
) == 0)) {
2802 linkref
= strtoul(&nameptr
[HFS_DIRINODE_PREFIX_LEN
], NULL
, 10);
2804 } else if ((pid
== hfsmp
->hfs_private_desc
[FILE_HARDLINKS
].cd_cnid
) &&
2805 (bcmp(nameptr
, HFS_DELETE_PREFIX
, HFS_DELETE_PREFIX_LEN
) == 0)) {
2807 cat_releasedesc(&cndesc
);
2808 return (ENOENT
); /* open unlinked file */
2813 * Finish initializing cnode descriptor for hardlinks.
2815 * We need a valid name and parent for reverse lookups.
2820 struct cat_desc linkdesc
;
2823 cnattr
.ca_linkref
= linkref
;
2826 * Pick up the first link in the chain and get a descriptor for it.
2827 * This allows blind volfs paths to work for hardlinks.
2829 if ((hfs_lookuplink(hfsmp
, linkref
, &prevlinkid
, &nextlinkid
) == 0) &&
2830 (nextlinkid
!= 0)) {
2831 lockflags
= hfs_systemfile_lock(hfsmp
, SFL_CATALOG
, HFS_SHARED_LOCK
);
2832 error
= cat_findname(hfsmp
, nextlinkid
, &linkdesc
);
2833 hfs_systemfile_unlock(hfsmp
, lockflags
);
2835 cat_releasedesc(&cndesc
);
2836 bcopy(&linkdesc
, &cndesc
, sizeof(linkdesc
));
2842 error
= hfs_getnewvnode(hfsmp
, NULL
, NULL
, &cndesc
, 0, &cnattr
, &cnfork
, &vp
);
2844 VTOC(vp
)->c_flag
|= C_HARDLINK
;
2845 vnode_setmultipath(vp
);
2848 struct componentname cn
;
2850 /* Supply hfs_getnewvnode with a component name. */
2851 MALLOC_ZONE(cn
.cn_pnbuf
, caddr_t
, MAXPATHLEN
, M_NAMEI
, M_WAITOK
);
2852 cn
.cn_nameiop
= LOOKUP
;
2853 cn
.cn_flags
= ISLASTCN
| HASBUF
;
2854 cn
.cn_context
= NULL
;
2855 cn
.cn_pnlen
= MAXPATHLEN
;
2856 cn
.cn_nameptr
= cn
.cn_pnbuf
;
2857 cn
.cn_namelen
= cndesc
.cd_namelen
;
2860 bcopy(cndesc
.cd_nameptr
, cn
.cn_nameptr
, cndesc
.cd_namelen
+ 1);
2862 error
= hfs_getnewvnode(hfsmp
, NULLVP
, &cn
, &cndesc
, 0, &cnattr
, &cnfork
, &vp
);
2864 if (error
== 0 && (VTOC(vp
)->c_flag
& C_HARDLINK
)) {
2865 hfs_savelinkorigin(VTOC(vp
), cndesc
.cd_parentcnid
);
2867 FREE_ZONE(cn
.cn_pnbuf
, cn
.cn_pnlen
, M_NAMEI
);
2869 cat_releasedesc(&cndesc
);
2872 if (vp
&& skiplock
) {
2873 hfs_unlock(VTOC(vp
));
2880 * Flush out all the files in a filesystem.
2884 hfs_flushfiles(struct mount
*mp
, int flags
, struct proc
*p
)
2886 hfs_flushfiles(struct mount
*mp
, int flags
, __unused
struct proc
*p
)
2889 struct hfsmount
*hfsmp
;
2890 struct vnode
*skipvp
= NULLVP
;
2897 hfsmp
= VFSTOHFS(mp
);
2901 * The open quota files have an indirect reference on
2902 * the root directory vnode. We must account for this
2903 * extra reference when doing the intial vflush.
2906 if (((unsigned int)vfs_flags(mp
)) & MNT_QUOTA
) {
2908 /* Find out how many quota files we have open. */
2909 for (i
= 0; i
< MAXQUOTAS
; i
++) {
2910 if (hfsmp
->hfs_qfiles
[i
].qf_vp
!= NULLVP
)
2914 /* Obtain the root vnode so we can skip over it. */
2915 skipvp
= hfs_chash_getvnode(hfsmp
, kHFSRootFolderID
, 0, 0);
2919 error
= vflush(mp
, skipvp
, SKIPSYSTEM
| SKIPSWAP
| flags
);
2923 error
= vflush(mp
, skipvp
, SKIPSYSTEM
| flags
);
2926 if (((unsigned int)vfs_flags(mp
)) & MNT_QUOTA
) {
2929 * See if there are additional references on the
2930 * root vp besides the ones obtained from the open
2931 * quota files and the hfs_chash_getvnode call above.
2934 (vnode_isinuse(skipvp
, quotafilecnt
))) {
2935 error
= EBUSY
; /* root directory is still open */
2937 hfs_unlock(VTOC(skipvp
));
2940 if (error
&& (flags
& FORCECLOSE
) == 0)
2943 for (i
= 0; i
< MAXQUOTAS
; i
++) {
2944 if (hfsmp
->hfs_qfiles
[i
].qf_vp
== NULLVP
)
2946 hfs_quotaoff(p
, mp
, i
);
2948 error
= vflush(mp
, NULLVP
, SKIPSYSTEM
| flags
);
2956 * Update volume encoding bitmap (HFS Plus only)
2960 hfs_setencodingbits(struct hfsmount
*hfsmp
, u_int32_t encoding
)
2962 #define kIndexMacUkrainian 48 /* MacUkrainian encoding is 152 */
2963 #define kIndexMacFarsi 49 /* MacFarsi encoding is 140 */
2968 case kTextEncodingMacUkrainian
:
2969 index
= kIndexMacUkrainian
;
2971 case kTextEncodingMacFarsi
:
2972 index
= kIndexMacFarsi
;
2979 if (index
< 64 && (hfsmp
->encodingsBitmap
& (u_int64_t
)(1ULL << index
)) == 0) {
2980 HFS_MOUNT_LOCK(hfsmp
, TRUE
)
2981 hfsmp
->encodingsBitmap
|= (u_int64_t
)(1ULL << index
);
2982 MarkVCBDirty(hfsmp
);
2983 HFS_MOUNT_UNLOCK(hfsmp
, TRUE
);
2988 * Update volume stats
2990 * On journal volumes this will cause a volume header flush
2994 hfs_volupdate(struct hfsmount
*hfsmp
, enum volop op
, int inroot
)
3000 lck_mtx_lock(&hfsmp
->hfs_mutex
);
3002 MarkVCBDirty(hfsmp
);
3003 hfsmp
->hfs_mtime
= tv
.tv_sec
;
3009 if (hfsmp
->hfs_dircount
!= 0xFFFFFFFF)
3010 ++hfsmp
->hfs_dircount
;
3011 if (inroot
&& hfsmp
->vcbNmRtDirs
!= 0xFFFF)
3012 ++hfsmp
->vcbNmRtDirs
;
3015 if (hfsmp
->hfs_dircount
!= 0)
3016 --hfsmp
->hfs_dircount
;
3017 if (inroot
&& hfsmp
->vcbNmRtDirs
!= 0xFFFF)
3018 --hfsmp
->vcbNmRtDirs
;
3021 if (hfsmp
->hfs_filecount
!= 0xFFFFFFFF)
3022 ++hfsmp
->hfs_filecount
;
3023 if (inroot
&& hfsmp
->vcbNmFls
!= 0xFFFF)
3027 if (hfsmp
->hfs_filecount
!= 0)
3028 --hfsmp
->hfs_filecount
;
3029 if (inroot
&& hfsmp
->vcbNmFls
!= 0xFFFF)
3034 lck_mtx_unlock(&hfsmp
->hfs_mutex
);
3037 hfs_flushvolumeheader(hfsmp
, 0, 0);
3045 hfs_flushMDB(struct hfsmount
*hfsmp
, int waitfor
, int altflush
)
3047 ExtendedVCB
*vcb
= HFSTOVCB(hfsmp
);
3048 struct filefork
*fp
;
3049 HFSMasterDirectoryBlock
*mdb
;
3050 struct buf
*bp
= NULL
;
3055 sectorsize
= hfsmp
->hfs_logical_block_size
;
3056 retval
= (int)buf_bread(hfsmp
->hfs_devvp
, (daddr64_t
)HFS_PRI_SECTOR(sectorsize
), sectorsize
, NOCRED
, &bp
);
3063 lck_mtx_lock(&hfsmp
->hfs_mutex
);
3065 mdb
= (HFSMasterDirectoryBlock
*)(buf_dataptr(bp
) + HFS_PRI_OFFSET(sectorsize
));
3067 mdb
->drCrDate
= SWAP_BE32 (UTCToLocal(to_hfs_time(vcb
->vcbCrDate
)));
3068 mdb
->drLsMod
= SWAP_BE32 (UTCToLocal(to_hfs_time(vcb
->vcbLsMod
)));
3069 mdb
->drAtrb
= SWAP_BE16 (vcb
->vcbAtrb
);
3070 mdb
->drNmFls
= SWAP_BE16 (vcb
->vcbNmFls
);
3071 mdb
->drAllocPtr
= SWAP_BE16 (vcb
->nextAllocation
);
3072 mdb
->drClpSiz
= SWAP_BE32 (vcb
->vcbClpSiz
);
3073 mdb
->drNxtCNID
= SWAP_BE32 (vcb
->vcbNxtCNID
);
3074 mdb
->drFreeBks
= SWAP_BE16 (vcb
->freeBlocks
);
3076 namelen
= strlen((char *)vcb
->vcbVN
);
3077 retval
= utf8_to_hfs(vcb
, namelen
, vcb
->vcbVN
, mdb
->drVN
);
3078 /* Retry with MacRoman in case that's how it was exported. */
3080 retval
= utf8_to_mac_roman(namelen
, vcb
->vcbVN
, mdb
->drVN
);
3082 mdb
->drVolBkUp
= SWAP_BE32 (UTCToLocal(to_hfs_time(vcb
->vcbVolBkUp
)));
3083 mdb
->drWrCnt
= SWAP_BE32 (vcb
->vcbWrCnt
);
3084 mdb
->drNmRtDirs
= SWAP_BE16 (vcb
->vcbNmRtDirs
);
3085 mdb
->drFilCnt
= SWAP_BE32 (vcb
->vcbFilCnt
);
3086 mdb
->drDirCnt
= SWAP_BE32 (vcb
->vcbDirCnt
);
3088 bcopy(vcb
->vcbFndrInfo
, mdb
->drFndrInfo
, sizeof(mdb
->drFndrInfo
));
3090 fp
= VTOF(vcb
->extentsRefNum
);
3091 mdb
->drXTExtRec
[0].startBlock
= SWAP_BE16 (fp
->ff_extents
[0].startBlock
);
3092 mdb
->drXTExtRec
[0].blockCount
= SWAP_BE16 (fp
->ff_extents
[0].blockCount
);
3093 mdb
->drXTExtRec
[1].startBlock
= SWAP_BE16 (fp
->ff_extents
[1].startBlock
);
3094 mdb
->drXTExtRec
[1].blockCount
= SWAP_BE16 (fp
->ff_extents
[1].blockCount
);
3095 mdb
->drXTExtRec
[2].startBlock
= SWAP_BE16 (fp
->ff_extents
[2].startBlock
);
3096 mdb
->drXTExtRec
[2].blockCount
= SWAP_BE16 (fp
->ff_extents
[2].blockCount
);
3097 mdb
->drXTFlSize
= SWAP_BE32 (fp
->ff_blocks
* vcb
->blockSize
);
3098 mdb
->drXTClpSiz
= SWAP_BE32 (fp
->ff_clumpsize
);
3099 FTOC(fp
)->c_flag
&= ~C_MODIFIED
;
3101 fp
= VTOF(vcb
->catalogRefNum
);
3102 mdb
->drCTExtRec
[0].startBlock
= SWAP_BE16 (fp
->ff_extents
[0].startBlock
);
3103 mdb
->drCTExtRec
[0].blockCount
= SWAP_BE16 (fp
->ff_extents
[0].blockCount
);
3104 mdb
->drCTExtRec
[1].startBlock
= SWAP_BE16 (fp
->ff_extents
[1].startBlock
);
3105 mdb
->drCTExtRec
[1].blockCount
= SWAP_BE16 (fp
->ff_extents
[1].blockCount
);
3106 mdb
->drCTExtRec
[2].startBlock
= SWAP_BE16 (fp
->ff_extents
[2].startBlock
);
3107 mdb
->drCTExtRec
[2].blockCount
= SWAP_BE16 (fp
->ff_extents
[2].blockCount
);
3108 mdb
->drCTFlSize
= SWAP_BE32 (fp
->ff_blocks
* vcb
->blockSize
);
3109 mdb
->drCTClpSiz
= SWAP_BE32 (fp
->ff_clumpsize
);
3110 FTOC(fp
)->c_flag
&= ~C_MODIFIED
;
3112 MarkVCBClean( vcb
);
3114 lck_mtx_unlock(&hfsmp
->hfs_mutex
);
3116 /* If requested, flush out the alternate MDB */
3118 struct buf
*alt_bp
= NULL
;
3120 if (buf_meta_bread(hfsmp
->hfs_devvp
, hfsmp
->hfs_alt_id_sector
, sectorsize
, NOCRED
, &alt_bp
) == 0) {
3121 bcopy(mdb
, (char *)buf_dataptr(alt_bp
) + HFS_ALT_OFFSET(sectorsize
), kMDBSize
);
3123 (void) VNOP_BWRITE(alt_bp
);
3128 if (waitfor
!= MNT_WAIT
)
3131 retval
= VNOP_BWRITE(bp
);
3137 * Flush any dirty in-memory mount data to the on-disk
3140 * Note: the on-disk volume signature is intentionally
3141 * not flushed since the on-disk "H+" and "HX" signatures
3142 * are always stored in-memory as "H+".
3146 hfs_flushvolumeheader(struct hfsmount
*hfsmp
, int waitfor
, int altflush
)
3148 ExtendedVCB
*vcb
= HFSTOVCB(hfsmp
);
3149 struct filefork
*fp
;
3150 HFSPlusVolumeHeader
*volumeHeader
, *altVH
;
3152 struct buf
*bp
, *alt_bp
;
3154 daddr64_t priIDSector
;
3156 u_int16_t signature
;
3157 u_int16_t hfsversion
;
3159 if (hfsmp
->hfs_flags
& HFS_READ_ONLY
) {
3162 if (hfsmp
->hfs_flags
& HFS_STANDARD
) {
3163 return hfs_flushMDB(hfsmp
, waitfor
, altflush
);
3165 critical
= altflush
;
3166 priIDSector
= (daddr64_t
)((vcb
->hfsPlusIOPosOffset
/ hfsmp
->hfs_logical_block_size
) +
3167 HFS_PRI_SECTOR(hfsmp
->hfs_logical_block_size
));
3169 if (hfs_start_transaction(hfsmp
) != 0) {
3176 retval
= (int)buf_meta_bread(hfsmp
->hfs_devvp
,
3177 HFS_PHYSBLK_ROUNDDOWN(priIDSector
, hfsmp
->hfs_log_per_phys
),
3178 hfsmp
->hfs_physical_block_size
, NOCRED
, &bp
);
3180 printf("hfs: err %d reading VH blk (%s)\n", retval
, vcb
->vcbVN
);
3184 volumeHeader
= (HFSPlusVolumeHeader
*)((char *)buf_dataptr(bp
) +
3185 HFS_PRI_OFFSET(hfsmp
->hfs_physical_block_size
));
3188 * Sanity check what we just read. If it's bad, try the alternate
3191 signature
= SWAP_BE16 (volumeHeader
->signature
);
3192 hfsversion
= SWAP_BE16 (volumeHeader
->version
);
3193 if ((signature
!= kHFSPlusSigWord
&& signature
!= kHFSXSigWord
) ||
3194 (hfsversion
< kHFSPlusVersion
) || (hfsversion
> 100) ||
3195 (SWAP_BE32 (volumeHeader
->blockSize
) != vcb
->blockSize
)) {
3196 printf("hfs: corrupt VH on %s, sig 0x%04x, ver %d, blksize %d%s\n",
3197 vcb
->vcbVN
, signature
, hfsversion
,
3198 SWAP_BE32 (volumeHeader
->blockSize
),
3199 hfsmp
->hfs_alt_id_sector
? "; trying alternate" : "");
3200 hfs_mark_volume_inconsistent(hfsmp
);
3202 if (hfsmp
->hfs_alt_id_sector
) {
3203 retval
= buf_meta_bread(hfsmp
->hfs_devvp
,
3204 HFS_PHYSBLK_ROUNDDOWN(hfsmp
->hfs_alt_id_sector
, hfsmp
->hfs_log_per_phys
),
3205 hfsmp
->hfs_physical_block_size
, NOCRED
, &alt_bp
);
3207 printf("hfs: err %d reading alternate VH (%s)\n", retval
, vcb
->vcbVN
);
3211 altVH
= (HFSPlusVolumeHeader
*)((char *)buf_dataptr(alt_bp
) +
3212 HFS_ALT_OFFSET(hfsmp
->hfs_physical_block_size
));
3213 signature
= SWAP_BE16(altVH
->signature
);
3214 hfsversion
= SWAP_BE16(altVH
->version
);
3216 if ((signature
!= kHFSPlusSigWord
&& signature
!= kHFSXSigWord
) ||
3217 (hfsversion
< kHFSPlusVersion
) || (kHFSPlusVersion
> 100) ||
3218 (SWAP_BE32(altVH
->blockSize
) != vcb
->blockSize
)) {
3219 printf("hfs: corrupt alternate VH on %s, sig 0x%04x, ver %d, blksize %d\n",
3220 vcb
->vcbVN
, signature
, hfsversion
,
3221 SWAP_BE32(altVH
->blockSize
));
3226 /* The alternate is plausible, so use it. */
3227 bcopy(altVH
, volumeHeader
, kMDBSize
);
3231 /* No alternate VH, nothing more we can do. */
3238 journal_modify_block_start(hfsmp
->jnl
, bp
);
3242 * For embedded HFS+ volumes, update create date if it changed
3243 * (ie from a setattrlist call)
3245 if ((vcb
->hfsPlusIOPosOffset
!= 0) &&
3246 (SWAP_BE32 (volumeHeader
->createDate
) != vcb
->localCreateDate
)) {
3248 HFSMasterDirectoryBlock
*mdb
;
3250 retval
= (int)buf_meta_bread(hfsmp
->hfs_devvp
,
3251 HFS_PHYSBLK_ROUNDDOWN(HFS_PRI_SECTOR(hfsmp
->hfs_logical_block_size
), hfsmp
->hfs_log_per_phys
),
3252 hfsmp
->hfs_physical_block_size
, NOCRED
, &bp2
);
3258 mdb
= (HFSMasterDirectoryBlock
*)(buf_dataptr(bp2
) +
3259 HFS_PRI_OFFSET(hfsmp
->hfs_physical_block_size
));
3261 if ( SWAP_BE32 (mdb
->drCrDate
) != vcb
->localCreateDate
)
3264 journal_modify_block_start(hfsmp
->jnl
, bp2
);
3267 mdb
->drCrDate
= SWAP_BE32 (vcb
->localCreateDate
); /* pick up the new create date */
3270 journal_modify_block_end(hfsmp
->jnl
, bp2
, NULL
, NULL
);
3272 (void) VNOP_BWRITE(bp2
); /* write out the changes */
3277 buf_brelse(bp2
); /* just release it */
3282 lck_mtx_lock(&hfsmp
->hfs_mutex
);
3284 /* Note: only update the lower 16 bits worth of attributes */
3285 volumeHeader
->attributes
= SWAP_BE32 (vcb
->vcbAtrb
);
3286 volumeHeader
->journalInfoBlock
= SWAP_BE32 (vcb
->vcbJinfoBlock
);
3288 volumeHeader
->lastMountedVersion
= SWAP_BE32 (kHFSJMountVersion
);
3290 volumeHeader
->lastMountedVersion
= SWAP_BE32 (kHFSPlusMountVersion
);
3292 volumeHeader
->createDate
= SWAP_BE32 (vcb
->localCreateDate
); /* volume create date is in local time */
3293 volumeHeader
->modifyDate
= SWAP_BE32 (to_hfs_time(vcb
->vcbLsMod
));
3294 volumeHeader
->backupDate
= SWAP_BE32 (to_hfs_time(vcb
->vcbVolBkUp
));
3295 volumeHeader
->fileCount
= SWAP_BE32 (vcb
->vcbFilCnt
);
3296 volumeHeader
->folderCount
= SWAP_BE32 (vcb
->vcbDirCnt
);
3297 volumeHeader
->totalBlocks
= SWAP_BE32 (vcb
->totalBlocks
);
3298 volumeHeader
->freeBlocks
= SWAP_BE32 (vcb
->freeBlocks
);
3299 volumeHeader
->nextAllocation
= SWAP_BE32 (vcb
->nextAllocation
);
3300 volumeHeader
->rsrcClumpSize
= SWAP_BE32 (vcb
->vcbClpSiz
);
3301 volumeHeader
->dataClumpSize
= SWAP_BE32 (vcb
->vcbClpSiz
);
3302 volumeHeader
->nextCatalogID
= SWAP_BE32 (vcb
->vcbNxtCNID
);
3303 volumeHeader
->writeCount
= SWAP_BE32 (vcb
->vcbWrCnt
);
3304 volumeHeader
->encodingsBitmap
= SWAP_BE64 (vcb
->encodingsBitmap
);
3306 if (bcmp(vcb
->vcbFndrInfo
, volumeHeader
->finderInfo
, sizeof(volumeHeader
->finderInfo
)) != 0) {
3307 bcopy(vcb
->vcbFndrInfo
, volumeHeader
->finderInfo
, sizeof(volumeHeader
->finderInfo
));
3312 * System files are only dirty when altflush is set.
3314 if (altflush
== 0) {
3318 /* Sync Extents over-flow file meta data */
3319 fp
= VTOF(vcb
->extentsRefNum
);
3320 if (FTOC(fp
)->c_flag
& C_MODIFIED
) {
3321 for (i
= 0; i
< kHFSPlusExtentDensity
; i
++) {
3322 volumeHeader
->extentsFile
.extents
[i
].startBlock
=
3323 SWAP_BE32 (fp
->ff_extents
[i
].startBlock
);
3324 volumeHeader
->extentsFile
.extents
[i
].blockCount
=
3325 SWAP_BE32 (fp
->ff_extents
[i
].blockCount
);
3327 volumeHeader
->extentsFile
.logicalSize
= SWAP_BE64 (fp
->ff_size
);
3328 volumeHeader
->extentsFile
.totalBlocks
= SWAP_BE32 (fp
->ff_blocks
);
3329 volumeHeader
->extentsFile
.clumpSize
= SWAP_BE32 (fp
->ff_clumpsize
);
3330 FTOC(fp
)->c_flag
&= ~C_MODIFIED
;
3333 /* Sync Catalog file meta data */
3334 fp
= VTOF(vcb
->catalogRefNum
);
3335 if (FTOC(fp
)->c_flag
& C_MODIFIED
) {
3336 for (i
= 0; i
< kHFSPlusExtentDensity
; i
++) {
3337 volumeHeader
->catalogFile
.extents
[i
].startBlock
=
3338 SWAP_BE32 (fp
->ff_extents
[i
].startBlock
);
3339 volumeHeader
->catalogFile
.extents
[i
].blockCount
=
3340 SWAP_BE32 (fp
->ff_extents
[i
].blockCount
);
3342 volumeHeader
->catalogFile
.logicalSize
= SWAP_BE64 (fp
->ff_size
);
3343 volumeHeader
->catalogFile
.totalBlocks
= SWAP_BE32 (fp
->ff_blocks
);
3344 volumeHeader
->catalogFile
.clumpSize
= SWAP_BE32 (fp
->ff_clumpsize
);
3345 FTOC(fp
)->c_flag
&= ~C_MODIFIED
;
3348 /* Sync Allocation file meta data */
3349 fp
= VTOF(vcb
->allocationsRefNum
);
3350 if (FTOC(fp
)->c_flag
& C_MODIFIED
) {
3351 for (i
= 0; i
< kHFSPlusExtentDensity
; i
++) {
3352 volumeHeader
->allocationFile
.extents
[i
].startBlock
=
3353 SWAP_BE32 (fp
->ff_extents
[i
].startBlock
);
3354 volumeHeader
->allocationFile
.extents
[i
].blockCount
=
3355 SWAP_BE32 (fp
->ff_extents
[i
].blockCount
);
3357 volumeHeader
->allocationFile
.logicalSize
= SWAP_BE64 (fp
->ff_size
);
3358 volumeHeader
->allocationFile
.totalBlocks
= SWAP_BE32 (fp
->ff_blocks
);
3359 volumeHeader
->allocationFile
.clumpSize
= SWAP_BE32 (fp
->ff_clumpsize
);
3360 FTOC(fp
)->c_flag
&= ~C_MODIFIED
;
3363 /* Sync Attribute file meta data */
3364 if (hfsmp
->hfs_attribute_vp
) {
3365 fp
= VTOF(hfsmp
->hfs_attribute_vp
);
3366 for (i
= 0; i
< kHFSPlusExtentDensity
; i
++) {
3367 volumeHeader
->attributesFile
.extents
[i
].startBlock
=
3368 SWAP_BE32 (fp
->ff_extents
[i
].startBlock
);
3369 volumeHeader
->attributesFile
.extents
[i
].blockCount
=
3370 SWAP_BE32 (fp
->ff_extents
[i
].blockCount
);
3372 FTOC(fp
)->c_flag
&= ~C_MODIFIED
;
3373 volumeHeader
->attributesFile
.logicalSize
= SWAP_BE64 (fp
->ff_size
);
3374 volumeHeader
->attributesFile
.totalBlocks
= SWAP_BE32 (fp
->ff_blocks
);
3375 volumeHeader
->attributesFile
.clumpSize
= SWAP_BE32 (fp
->ff_clumpsize
);
3378 /* Sync Startup file meta data */
3379 if (hfsmp
->hfs_startup_vp
) {
3380 fp
= VTOF(hfsmp
->hfs_startup_vp
);
3381 if (FTOC(fp
)->c_flag
& C_MODIFIED
) {
3382 for (i
= 0; i
< kHFSPlusExtentDensity
; i
++) {
3383 volumeHeader
->startupFile
.extents
[i
].startBlock
=
3384 SWAP_BE32 (fp
->ff_extents
[i
].startBlock
);
3385 volumeHeader
->startupFile
.extents
[i
].blockCount
=
3386 SWAP_BE32 (fp
->ff_extents
[i
].blockCount
);
3388 volumeHeader
->startupFile
.logicalSize
= SWAP_BE64 (fp
->ff_size
);
3389 volumeHeader
->startupFile
.totalBlocks
= SWAP_BE32 (fp
->ff_blocks
);
3390 volumeHeader
->startupFile
.clumpSize
= SWAP_BE32 (fp
->ff_clumpsize
);
3391 FTOC(fp
)->c_flag
&= ~C_MODIFIED
;
3396 MarkVCBClean(hfsmp
);
3397 lck_mtx_unlock(&hfsmp
->hfs_mutex
);
3399 /* If requested, flush out the alternate volume header */
3400 if (altflush
&& hfsmp
->hfs_alt_id_sector
) {
3401 if (buf_meta_bread(hfsmp
->hfs_devvp
,
3402 HFS_PHYSBLK_ROUNDDOWN(hfsmp
->hfs_alt_id_sector
, hfsmp
->hfs_log_per_phys
),
3403 hfsmp
->hfs_physical_block_size
, NOCRED
, &alt_bp
) == 0) {
3405 journal_modify_block_start(hfsmp
->jnl
, alt_bp
);
3408 bcopy(volumeHeader
, (char *)buf_dataptr(alt_bp
) +
3409 HFS_ALT_OFFSET(hfsmp
->hfs_physical_block_size
),
3413 journal_modify_block_end(hfsmp
->jnl
, alt_bp
, NULL
, NULL
);
3415 (void) VNOP_BWRITE(alt_bp
);
3422 journal_modify_block_end(hfsmp
->jnl
, bp
, NULL
, NULL
);
3424 if (waitfor
!= MNT_WAIT
)
3427 retval
= VNOP_BWRITE(bp
);
3428 /* When critical data changes, flush the device cache */
3429 if (critical
&& (retval
== 0)) {
3430 (void) VNOP_IOCTL(hfsmp
->hfs_devvp
, DKIOCSYNCHRONIZECACHE
,
3431 NULL
, FWRITE
, NULL
);
3435 hfs_end_transaction(hfsmp
);
3444 hfs_end_transaction(hfsmp
);
3450 * Extend a file system.
3454 hfs_extendfs(struct hfsmount
*hfsmp
, u_int64_t newsize
, vfs_context_t context
)
3456 struct proc
*p
= vfs_context_proc(context
);
3457 kauth_cred_t cred
= vfs_context_ucred(context
);
3459 struct vnode
*devvp
;
3461 struct filefork
*fp
= NULL
;
3463 struct cat_fork forkdata
;
3465 u_int64_t newblkcnt
;
3466 u_int64_t prev_phys_block_count
;
3468 u_int64_t sectorcnt
;
3469 u_int32_t sectorsize
;
3470 u_int32_t phys_sectorsize
;
3471 daddr64_t prev_alt_sector
;
3475 int64_t oldBitmapSize
;
3476 Boolean usedExtendFileC
= false;
3478 devvp
= hfsmp
->hfs_devvp
;
3479 vcb
= HFSTOVCB(hfsmp
);
3482 * - HFS Plus file systems only.
3483 * - Journaling must be enabled.
3484 * - No embedded volumes.
3486 if ((vcb
->vcbSigWord
== kHFSSigWord
) ||
3487 (hfsmp
->jnl
== NULL
) ||
3488 (vcb
->hfsPlusIOPosOffset
!= 0)) {
3492 * If extending file system by non-root, then verify
3493 * ownership and check permissions.
3495 if (suser(cred
, NULL
)) {
3496 error
= hfs_vget(hfsmp
, kHFSRootFolderID
, &vp
, 0);
3500 error
= hfs_owner_rights(hfsmp
, VTOC(vp
)->c_uid
, cred
, p
, 0);
3502 error
= hfs_write_access(vp
, cred
, p
, false);
3504 hfs_unlock(VTOC(vp
));
3509 error
= vnode_authorize(devvp
, NULL
, KAUTH_VNODE_READ_DATA
| KAUTH_VNODE_WRITE_DATA
, context
);
3513 if (VNOP_IOCTL(devvp
, DKIOCGETBLOCKSIZE
, (caddr_t
)§orsize
, 0, context
)) {
3516 if (sectorsize
!= hfsmp
->hfs_logical_block_size
) {
3519 if (VNOP_IOCTL(devvp
, DKIOCGETBLOCKCOUNT
, (caddr_t
)§orcnt
, 0, context
)) {
3522 if ((sectorsize
* sectorcnt
) < newsize
) {
3523 printf("hfs_extendfs: not enough space on device\n");
3526 error
= VNOP_IOCTL(devvp
, DKIOCGETPHYSICALBLOCKSIZE
, (caddr_t
)&phys_sectorsize
, 0, context
);
3528 if ((error
!= ENOTSUP
) && (error
!= ENOTTY
)) {
3531 /* If ioctl is not supported, force physical and logical sector size to be same */
3532 phys_sectorsize
= sectorsize
;
3534 oldsize
= (u_int64_t
)hfsmp
->totalBlocks
* (u_int64_t
)hfsmp
->blockSize
;
3537 * Validate new size.
3539 if ((newsize
<= oldsize
) || (newsize
% sectorsize
) || (newsize
% phys_sectorsize
)) {
3540 printf("hfs_extendfs: invalid size\n");
3543 newblkcnt
= newsize
/ vcb
->blockSize
;
3544 if (newblkcnt
> (u_int64_t
)0xFFFFFFFF)
3547 addblks
= newblkcnt
- vcb
->totalBlocks
;
3549 printf("hfs_extendfs: growing %s by %d blocks\n", vcb
->vcbVN
, addblks
);
3551 * Enclose changes inside a transaction.
3553 if (hfs_start_transaction(hfsmp
) != 0) {
3558 * Note: we take the attributes lock in case we have an attribute data vnode
3559 * which needs to change size.
3561 lockflags
= hfs_systemfile_lock(hfsmp
, SFL_ATTRIBUTE
| SFL_EXTENTS
| SFL_BITMAP
, HFS_EXCLUSIVE_LOCK
);
3562 vp
= vcb
->allocationsRefNum
;
3564 bcopy(&fp
->ff_data
, &forkdata
, sizeof(forkdata
));
3567 * Calculate additional space required (if any) by allocation bitmap.
3569 oldBitmapSize
= fp
->ff_size
;
3570 bitmapblks
= roundup((newblkcnt
+7) / 8, vcb
->vcbVBMIOSize
) / vcb
->blockSize
;
3571 if (bitmapblks
> (daddr_t
)fp
->ff_blocks
)
3572 bitmapblks
-= fp
->ff_blocks
;
3576 if (bitmapblks
> 0) {
3582 * Get the bitmap's current size (in allocation blocks) so we know
3583 * where to start zero filling once the new space is added. We've
3584 * got to do this before the bitmap is grown.
3586 blkno
= (daddr64_t
)fp
->ff_blocks
;
3589 * Try to grow the allocation file in the normal way, using allocation
3590 * blocks already existing in the file system. This way, we might be
3591 * able to grow the bitmap contiguously, or at least in the metadata
3594 error
= ExtendFileC(vcb
, fp
, bitmapblks
* vcb
->blockSize
, 0,
3595 kEFAllMask
| kEFNoClumpMask
| kEFReserveMask
| kEFMetadataMask
,
3599 usedExtendFileC
= true;
3602 * If the above allocation failed, fall back to allocating the new
3603 * extent of the bitmap from the space we're going to add. Since those
3604 * blocks don't yet belong to the file system, we have to update the
3605 * extent list directly, and manually adjust the file size.
3608 error
= AddFileExtent(vcb
, fp
, vcb
->totalBlocks
, bitmapblks
);
3610 printf("hfs_extendfs: error %d adding extents\n", error
);
3613 fp
->ff_blocks
+= bitmapblks
;
3614 VTOC(vp
)->c_blocks
= fp
->ff_blocks
;
3615 VTOC(vp
)->c_flag
|= C_MODIFIED
;
3619 * Update the allocation file's size to include the newly allocated
3620 * blocks. Note that ExtendFileC doesn't do this, which is why this
3621 * statement is outside the above "if" statement.
3623 fp
->ff_size
+= (u_int64_t
)bitmapblks
* (u_int64_t
)vcb
->blockSize
;
3626 * Zero out the new bitmap blocks.
3631 blkcnt
= bitmapblks
;
3632 while (blkcnt
> 0) {
3633 error
= (int)buf_meta_bread(vp
, blkno
, vcb
->blockSize
, NOCRED
, &bp
);
3640 bzero((char *)buf_dataptr(bp
), vcb
->blockSize
);
3642 error
= (int)buf_bwrite(bp
);
3650 printf("hfs_extendfs: error %d clearing blocks\n", error
);
3654 * Mark the new bitmap space as allocated.
3656 * Note that ExtendFileC will have marked any blocks it allocated, so
3657 * this is only needed if we used AddFileExtent. Also note that this
3658 * has to come *after* the zero filling of new blocks in the case where
3659 * we used AddFileExtent (since the part of the bitmap we're touching
3660 * is in those newly allocated blocks).
3662 if (!usedExtendFileC
) {
3663 error
= BlockMarkAllocated(vcb
, vcb
->totalBlocks
, bitmapblks
);
3665 printf("hfs_extendfs: error %d setting bitmap\n", error
);
3668 vcb
->freeBlocks
-= bitmapblks
;
3672 * Mark the new alternate VH as allocated.
3674 if (vcb
->blockSize
== 512)
3675 error
= BlockMarkAllocated(vcb
, vcb
->totalBlocks
+ addblks
- 2, 2);
3677 error
= BlockMarkAllocated(vcb
, vcb
->totalBlocks
+ addblks
- 1, 1);
3679 printf("hfs_extendfs: error %d setting bitmap (VH)\n", error
);
3683 * Mark the old alternate VH as free.
3685 if (vcb
->blockSize
== 512)
3686 (void) BlockMarkFree(vcb
, vcb
->totalBlocks
- 2, 2);
3688 (void) BlockMarkFree(vcb
, vcb
->totalBlocks
- 1, 1);
3690 * Adjust file system variables for new space.
3692 prev_phys_block_count
= hfsmp
->hfs_logical_block_count
;
3693 prev_alt_sector
= hfsmp
->hfs_alt_id_sector
;
3695 vcb
->totalBlocks
+= addblks
;
3696 vcb
->freeBlocks
+= addblks
;
3697 hfsmp
->hfs_logical_block_count
= newsize
/ sectorsize
;
3698 hfsmp
->hfs_alt_id_sector
= (hfsmp
->hfsPlusIOPosOffset
/ sectorsize
) +
3699 HFS_ALT_SECTOR(sectorsize
, hfsmp
->hfs_logical_block_count
);
3701 error
= hfs_flushvolumeheader(hfsmp
, MNT_WAIT
, HFS_ALTFLUSH
);
3703 printf("hfs_extendfs: couldn't flush volume headers (%d)", error
);
3705 * Restore to old state.
3707 if (usedExtendFileC
) {
3708 (void) TruncateFileC(vcb
, fp
, oldBitmapSize
, false);
3710 fp
->ff_blocks
-= bitmapblks
;
3711 fp
->ff_size
-= (u_int64_t
)bitmapblks
* (u_int64_t
)vcb
->blockSize
;
3713 * No need to mark the excess blocks free since those bitmap blocks
3714 * are no longer part of the bitmap. But we do need to undo the
3715 * effect of the "vcb->freeBlocks -= bitmapblks" above.
3717 vcb
->freeBlocks
+= bitmapblks
;
3719 vcb
->totalBlocks
-= addblks
;
3720 vcb
->freeBlocks
-= addblks
;
3721 hfsmp
->hfs_logical_block_count
= prev_phys_block_count
;
3722 hfsmp
->hfs_alt_id_sector
= prev_alt_sector
;
3724 if (vcb
->blockSize
== 512)
3725 (void) BlockMarkAllocated(vcb
, vcb
->totalBlocks
- 2, 2);
3727 (void) BlockMarkAllocated(vcb
, vcb
->totalBlocks
- 1, 1);
3731 * Invalidate the old alternate volume header.
3734 if (prev_alt_sector
) {
3735 if (buf_meta_bread(hfsmp
->hfs_devvp
,
3736 HFS_PHYSBLK_ROUNDDOWN(prev_alt_sector
, hfsmp
->hfs_log_per_phys
),
3737 hfsmp
->hfs_physical_block_size
, NOCRED
, &bp
) == 0) {
3738 journal_modify_block_start(hfsmp
->jnl
, bp
);
3740 bzero((char *)buf_dataptr(bp
) + HFS_ALT_OFFSET(hfsmp
->hfs_physical_block_size
), kMDBSize
);
3742 journal_modify_block_end(hfsmp
->jnl
, bp
, NULL
, NULL
);
3749 * TODO: Adjust the size of the metadata zone based on new volume size?
3753 * Adjust the size of hfsmp->hfs_attrdata_vp
3755 if (hfsmp
->hfs_attrdata_vp
) {
3756 struct cnode
*attr_cp
;
3757 struct filefork
*attr_fp
;
3759 if (vnode_get(hfsmp
->hfs_attrdata_vp
) == 0) {
3760 attr_cp
= VTOC(hfsmp
->hfs_attrdata_vp
);
3761 attr_fp
= VTOF(hfsmp
->hfs_attrdata_vp
);
3763 attr_cp
->c_blocks
= newblkcnt
;
3764 attr_fp
->ff_blocks
= newblkcnt
;
3765 attr_fp
->ff_extents
[0].blockCount
= newblkcnt
;
3766 attr_fp
->ff_size
= (off_t
) newblkcnt
* hfsmp
->blockSize
;
3767 ubc_setsize(hfsmp
->hfs_attrdata_vp
, attr_fp
->ff_size
);
3768 vnode_put(hfsmp
->hfs_attrdata_vp
);
3774 /* Restore allocation fork. */
3775 bcopy(&forkdata
, &fp
->ff_data
, sizeof(forkdata
));
3776 VTOC(vp
)->c_blocks
= fp
->ff_blocks
;
3780 Regardless of whether or not the totalblocks actually increased,
3781 we should reset the allocLimit field. If it changed, it will
3782 get updated; if not, it will remain the same.
3784 hfsmp
->allocLimit
= vcb
->totalBlocks
;
3785 hfs_systemfile_unlock(hfsmp
, lockflags
);
3786 hfs_end_transaction(hfsmp
);
3791 #define HFS_MIN_SIZE (32LL * 1024LL * 1024LL)
3794 * Truncate a file system (while still mounted).
3798 hfs_truncatefs(struct hfsmount
*hfsmp
, u_int64_t newsize
, vfs_context_t context
)
3800 struct buf
*bp
= NULL
;
3802 u_int32_t newblkcnt
;
3803 u_int32_t reclaimblks
= 0;
3805 int transaction_begun
= 0;
3808 lck_mtx_lock(&hfsmp
->hfs_mutex
);
3809 if (hfsmp
->hfs_flags
& HFS_RESIZE_IN_PROGRESS
) {
3810 lck_mtx_unlock(&hfsmp
->hfs_mutex
);
3813 hfsmp
->hfs_flags
|= HFS_RESIZE_IN_PROGRESS
;
3814 hfsmp
->hfs_resize_filesmoved
= 0;
3815 hfsmp
->hfs_resize_totalfiles
= 0;
3816 lck_mtx_unlock(&hfsmp
->hfs_mutex
);
3819 * - Journaled HFS Plus volumes only.
3820 * - No embedded volumes.
3822 if ((hfsmp
->jnl
== NULL
) ||
3823 (hfsmp
->hfsPlusIOPosOffset
!= 0)) {
3827 oldsize
= (u_int64_t
)hfsmp
->totalBlocks
* (u_int64_t
)hfsmp
->blockSize
;
3828 newblkcnt
= newsize
/ hfsmp
->blockSize
;
3829 reclaimblks
= hfsmp
->totalBlocks
- newblkcnt
;
3831 /* Make sure new size is valid. */
3832 if ((newsize
< HFS_MIN_SIZE
) ||
3833 (newsize
>= oldsize
) ||
3834 (newsize
% hfsmp
->hfs_logical_block_size
) ||
3835 (newsize
% hfsmp
->hfs_physical_block_size
)) {
3836 printf ("hfs_truncatefs: invalid size\n");
3840 /* Make sure there's enough space to work with. */
3841 if (reclaimblks
>= hfs_freeblks(hfsmp
, 1)) {
3842 printf("hfs_truncatefs: insufficient space (need %u blocks; have %u blocks)\n", reclaimblks
, hfs_freeblks(hfsmp
, 1));
3847 /* Start with a clean journal. */
3848 hfs_journal_flush(hfsmp
);
3850 if (hfs_start_transaction(hfsmp
) != 0) {
3854 transaction_begun
= 1;
3857 * Prevent new allocations from using the part we're trying to truncate.
3859 * NOTE: allocLimit is set to the allocation block number where the new
3860 * alternate volume header will be. That way there will be no files to
3861 * interfere with allocating the new alternate volume header, and no files
3862 * in the allocation blocks beyond (i.e. the blocks we're trying to
3865 lck_mtx_lock(&hfsmp
->hfs_mutex
);
3866 if (hfsmp
->blockSize
== 512)
3867 hfsmp
->allocLimit
= newblkcnt
- 2;
3869 hfsmp
->allocLimit
= newblkcnt
- 1;
3870 hfsmp
->freeBlocks
-= reclaimblks
;
3871 lck_mtx_unlock(&hfsmp
->hfs_mutex
);
3874 * Look for files that have blocks at or beyond the location of the
3875 * new alternate volume header.
3877 if (hfs_isallocated(hfsmp
, hfsmp
->allocLimit
, reclaimblks
)) {
3879 * hfs_reclaimspace will use separate transactions when
3880 * relocating files (so we don't overwhelm the journal).
3882 hfs_end_transaction(hfsmp
);
3883 transaction_begun
= 0;
3885 /* Attempt to reclaim some space. */
3886 if (hfs_reclaimspace(hfsmp
, hfsmp
->allocLimit
, reclaimblks
, context
) != 0) {
3887 printf("hfs_truncatefs: couldn't reclaim space on %s\n", hfsmp
->vcbVN
);
3891 if (hfs_start_transaction(hfsmp
) != 0) {
3895 transaction_begun
= 1;
3897 /* Check if we're clear now. */
3898 if (hfs_isallocated(hfsmp
, hfsmp
->allocLimit
, reclaimblks
)) {
3899 printf("hfs_truncatefs: didn't reclaim enough space on %s\n", hfsmp
->vcbVN
);
3900 error
= EAGAIN
; /* tell client to try again */
3906 * Note: we take the attributes lock in case we have an attribute data vnode
3907 * which needs to change size.
3909 lockflags
= hfs_systemfile_lock(hfsmp
, SFL_ATTRIBUTE
| SFL_EXTENTS
| SFL_BITMAP
, HFS_EXCLUSIVE_LOCK
);
3912 * Mark the old alternate volume header as free.
3913 * We don't bother shrinking allocation bitmap file.
3915 if (hfsmp
->blockSize
== 512)
3916 (void) BlockMarkFree(hfsmp
, hfsmp
->totalBlocks
- 2, 2);
3918 (void) BlockMarkFree(hfsmp
, hfsmp
->totalBlocks
- 1, 1);
3921 * Allocate last 1KB for alternate volume header.
3923 error
= BlockMarkAllocated(hfsmp
, hfsmp
->allocLimit
, (hfsmp
->blockSize
== 512) ? 2 : 1);
3925 printf("hfs_truncatefs: Error %d allocating new alternate volume header\n", error
);
3930 * Invalidate the existing alternate volume header.
3932 * Don't include this in a transaction (don't call journal_modify_block)
3933 * since this block will be outside of the truncated file system!
3935 if (hfsmp
->hfs_alt_id_sector
) {
3936 if (buf_meta_bread(hfsmp
->hfs_devvp
,
3937 HFS_PHYSBLK_ROUNDDOWN(hfsmp
->hfs_alt_id_sector
, hfsmp
->hfs_log_per_phys
),
3938 hfsmp
->hfs_physical_block_size
, NOCRED
, &bp
) == 0) {
3940 bzero((void*)((char *)buf_dataptr(bp
) + HFS_ALT_OFFSET(hfsmp
->hfs_physical_block_size
)), kMDBSize
);
3941 (void) VNOP_BWRITE(bp
);
3948 /* Log successful shrinking. */
3949 printf("hfs_truncatefs: shrank \"%s\" to %d blocks (was %d blocks)\n",
3950 hfsmp
->vcbVN
, newblkcnt
, hfsmp
->totalBlocks
);
3953 * Adjust file system variables and flush them to disk.
3955 hfsmp
->totalBlocks
= newblkcnt
;
3956 hfsmp
->hfs_logical_block_count
= newsize
/ hfsmp
->hfs_logical_block_size
;
3957 hfsmp
->hfs_alt_id_sector
= HFS_ALT_SECTOR(hfsmp
->hfs_logical_block_size
, hfsmp
->hfs_logical_block_count
);
3958 MarkVCBDirty(hfsmp
);
3959 error
= hfs_flushvolumeheader(hfsmp
, MNT_WAIT
, HFS_ALTFLUSH
);
3961 panic("hfs_truncatefs: unexpected error flushing volume header (%d)\n", error
);
3964 * TODO: Adjust the size of the metadata zone based on new volume size?
3968 * Adjust the size of hfsmp->hfs_attrdata_vp
3970 if (hfsmp
->hfs_attrdata_vp
) {
3972 struct filefork
*fp
;
3974 if (vnode_get(hfsmp
->hfs_attrdata_vp
) == 0) {
3975 cp
= VTOC(hfsmp
->hfs_attrdata_vp
);
3976 fp
= VTOF(hfsmp
->hfs_attrdata_vp
);
3978 cp
->c_blocks
= newblkcnt
;
3979 fp
->ff_blocks
= newblkcnt
;
3980 fp
->ff_extents
[0].blockCount
= newblkcnt
;
3981 fp
->ff_size
= (off_t
) newblkcnt
* hfsmp
->blockSize
;
3982 ubc_setsize(hfsmp
->hfs_attrdata_vp
, fp
->ff_size
);
3983 vnode_put(hfsmp
->hfs_attrdata_vp
);
3989 hfsmp
->freeBlocks
+= reclaimblks
;
3991 lck_mtx_lock(&hfsmp
->hfs_mutex
);
3992 hfsmp
->allocLimit
= hfsmp
->totalBlocks
;
3993 if (hfsmp
->nextAllocation
>= hfsmp
->allocLimit
)
3994 hfsmp
->nextAllocation
= hfsmp
->hfs_metazone_end
+ 1;
3995 hfsmp
->hfs_flags
&= ~HFS_RESIZE_IN_PROGRESS
;
3996 lck_mtx_unlock(&hfsmp
->hfs_mutex
);
3999 hfs_systemfile_unlock(hfsmp
, lockflags
);
4001 if (transaction_begun
) {
4002 hfs_end_transaction(hfsmp
);
4003 hfs_journal_flush(hfsmp
);
4011 * Invalidate the physical block numbers associated with buffer cache blocks
4012 * in the given extent of the given vnode.
4014 struct hfs_inval_blk_no
{
4015 daddr64_t sectorStart
;
4016 daddr64_t sectorCount
;
4019 hfs_invalidate_block_numbers_callback(buf_t bp
, void *args_in
)
4022 struct hfs_inval_blk_no
*args
;
4024 blkno
= buf_blkno(bp
);
4027 if (blkno
>= args
->sectorStart
&& blkno
< args
->sectorStart
+args
->sectorCount
)
4028 buf_setblkno(bp
, buf_lblkno(bp
));
4030 return BUF_RETURNED
;
4033 hfs_invalidate_sectors(struct vnode
*vp
, daddr64_t sectorStart
, daddr64_t sectorCount
)
4035 struct hfs_inval_blk_no args
;
4036 args
.sectorStart
= sectorStart
;
4037 args
.sectorCount
= sectorCount
;
4039 buf_iterate(vp
, hfs_invalidate_block_numbers_callback
, BUF_SCAN_DIRTY
|BUF_SCAN_CLEAN
, &args
);
4044 * Copy the contents of an extent to a new location. Also invalidates the
4045 * physical block number of any buffer cache block in the copied extent
4046 * (so that if the block is written, it will go through VNOP_BLOCKMAP to
4047 * determine the new physical block number).
4051 struct hfsmount
*hfsmp
,
4052 struct vnode
*vp
, /* The file whose extent is being copied. */
4053 u_int32_t oldStart
, /* The start of the source extent. */
4054 u_int32_t newStart
, /* The start of the destination extent. */
4055 u_int32_t blockCount
, /* The number of allocation blocks to copy. */
4056 vfs_context_t context
)
4060 void *buffer
= NULL
;
4061 struct vfsioattr ioattr
;
4065 u_int32_t ioSizeSectors
; /* Device sectors in this I/O */
4066 daddr64_t srcSector
, destSector
;
4067 u_int32_t sectorsPerBlock
= hfsmp
->blockSize
/ hfsmp
->hfs_logical_block_size
;
4070 * Sanity check that we have locked the vnode of the file we're copying.
4072 * But since hfs_systemfile_lock() doesn't actually take the lock on
4073 * the allocation file if a journal is active, ignore the check if the
4074 * file being copied is the allocation file.
4076 struct cnode
*cp
= VTOC(vp
);
4077 if (cp
!= hfsmp
->hfs_allocation_cp
&& cp
->c_lockowner
!= current_thread())
4078 panic("hfs_copy_extent: vp=%p (cp=%p) not owned?\n", vp
, cp
);
4081 * Wait for any in-progress writes to this vnode to complete, so that we'll
4082 * be copying consistent bits. (Otherwise, it's possible that an async
4083 * write will complete to the old extent after we read from it. That
4084 * could lead to corruption.)
4086 err
= vnode_waitforwrites(vp
, 0, 0, 0, "hfs_copy_extent");
4088 printf("hfs_copy_extent: Error %d from vnode_waitforwrites\n", err
);
4093 * Determine the I/O size to use
4095 * NOTE: Many external drives will result in an ioSize of 128KB.
4096 * TODO: Should we use a larger buffer, doing several consecutive
4097 * reads, then several consecutive writes?
4099 vfs_ioattr(hfsmp
->hfs_mp
, &ioattr
);
4100 bufferSize
= MIN(ioattr
.io_maxreadcnt
, ioattr
.io_maxwritecnt
);
4101 if (kmem_alloc(kernel_map
, (vm_offset_t
*) &buffer
, bufferSize
))
4104 /* Get a buffer for doing the I/O */
4105 bp
= buf_alloc(hfsmp
->hfs_devvp
);
4106 buf_setdataptr(bp
, (uintptr_t)buffer
);
4108 resid
= (off_t
) blockCount
* (off_t
) hfsmp
->blockSize
;
4109 srcSector
= (daddr64_t
) oldStart
* hfsmp
->blockSize
/ hfsmp
->hfs_logical_block_size
;
4110 destSector
= (daddr64_t
) newStart
* hfsmp
->blockSize
/ hfsmp
->hfs_logical_block_size
;
4112 ioSize
= MIN(bufferSize
, (size_t) resid
);
4113 ioSizeSectors
= ioSize
/ hfsmp
->hfs_logical_block_size
;
4115 /* Prepare the buffer for reading */
4116 buf_reset(bp
, B_READ
);
4117 buf_setsize(bp
, ioSize
);
4118 buf_setcount(bp
, ioSize
);
4119 buf_setblkno(bp
, srcSector
);
4120 buf_setlblkno(bp
, srcSector
);
4123 err
= VNOP_STRATEGY(bp
);
4125 err
= buf_biowait(bp
);
4127 printf("hfs_copy_extent: Error %d from VNOP_STRATEGY (read)\n", err
);
4131 /* Prepare the buffer for writing */
4132 buf_reset(bp
, B_WRITE
);
4133 buf_setsize(bp
, ioSize
);
4134 buf_setcount(bp
, ioSize
);
4135 buf_setblkno(bp
, destSector
);
4136 buf_setlblkno(bp
, destSector
);
4137 if (journal_uses_fua(hfsmp
->jnl
))
4141 vnode_startwrite(hfsmp
->hfs_devvp
);
4142 err
= VNOP_STRATEGY(bp
);
4144 err
= buf_biowait(bp
);
4146 printf("hfs_copy_extent: Error %d from VNOP_STRATEGY (write)\n", err
);
4151 srcSector
+= ioSizeSectors
;
4152 destSector
+= ioSizeSectors
;
4157 kmem_free(kernel_map
, (vm_offset_t
)buffer
, bufferSize
);
4159 /* Make sure all writes have been flushed to disk. */
4160 if (!journal_uses_fua(hfsmp
->jnl
)) {
4161 err
= VNOP_IOCTL(hfsmp
->hfs_devvp
, DKIOCSYNCHRONIZECACHE
, NULL
, FWRITE
, context
);
4163 printf("hfs_copy_extent: DKIOCSYNCHRONIZECACHE failed (%d)\n", err
);
4164 err
= 0; /* Don't fail the copy. */
4169 hfs_invalidate_sectors(vp
, (daddr64_t
)oldStart
*sectorsPerBlock
, (daddr64_t
)blockCount
*sectorsPerBlock
);
4176 * Reclaim space at the end of a volume, used by a given system file.
4178 * This routine attempts to move any extent which contains allocation blocks
4179 * at or after "startblk." A separate transaction is used to do the move.
4180 * The contents of any moved extents are read and written via the volume's
4181 * device vnode -- NOT via "vp." During the move, moved blocks which are part
4182 * of a transaction have their physical block numbers invalidated so they will
4183 * eventually be written to their new locations.
4185 * This routine can be used to move overflow extents for the allocation file.
4188 * hfsmp The volume being resized.
4189 * startblk Blocks >= this allocation block need to be moved.
4190 * locks Which locks need to be taken for the given system file.
4191 * vp The vnode for the system file.
4194 * moved Set to true if any extents were moved.
4197 hfs_relocate_callback(__unused HFSPlusExtentKey
*key
, HFSPlusExtentRecord
*record
, HFSPlusExtentRecord
*state
)
4199 bcopy(state
, record
, sizeof(HFSPlusExtentRecord
));
4203 hfs_reclaim_sys_file(struct hfsmount
*hfsmp
, struct vnode
*vp
, u_long startblk
, int locks
, Boolean
*moved
, vfs_context_t context
)
4210 u_int32_t oldStartBlock
;
4211 u_int32_t newStartBlock
;
4212 u_int32_t blockCount
;
4213 struct filefork
*fp
;
4215 /* If there is no vnode for this file, then there's nothing to do. */
4219 /* printf("hfs_reclaim_sys_file: %.*s\n", VTOC(vp)->c_desc.cd_namelen, VTOC(vp)->c_desc.cd_nameptr); */
4221 /* We always need the allocation bitmap and extents B-tree */
4222 locks
|= SFL_BITMAP
| SFL_EXTENTS
;
4224 error
= hfs_start_transaction(hfsmp
);
4226 printf("hfs_reclaim_sys_file: hfs_start_transaction returned %d\n", error
);
4229 lockflags
= hfs_systemfile_lock(hfsmp
, locks
, HFS_EXCLUSIVE_LOCK
);
4233 /* Relocate non-overflow extents */
4234 for (i
= 0; i
< kHFSPlusExtentDensity
; ++i
) {
4235 if (fp
->ff_extents
[i
].blockCount
== 0)
4237 oldStartBlock
= fp
->ff_extents
[i
].startBlock
;
4238 blockCount
= fp
->ff_extents
[i
].blockCount
;
4239 datablks
+= blockCount
;
4240 block
= oldStartBlock
+ blockCount
;
4241 if (block
> startblk
) {
4242 error
= BlockAllocate(hfsmp
, 1, blockCount
, blockCount
, true, true, &newStartBlock
, &blockCount
);
4244 printf("hfs_reclaim_sys_file: BlockAllocate returned %d\n", error
);
4247 if (blockCount
!= fp
->ff_extents
[i
].blockCount
) {
4248 printf("hfs_reclaim_sys_file: new blockCount=%u, original blockCount=%u", blockCount
, fp
->ff_extents
[i
].blockCount
);
4251 error
= hfs_copy_extent(hfsmp
, vp
, oldStartBlock
, newStartBlock
, blockCount
, context
);
4253 printf("hfs_reclaim_sys_file: hfs_copy_extent returned %d\n", error
);
4256 fp
->ff_extents
[i
].startBlock
= newStartBlock
;
4257 VTOC(vp
)->c_flag
|= C_MODIFIED
;
4259 error
= BlockDeallocate(hfsmp
, oldStartBlock
, blockCount
);
4261 /* TODO: Mark volume inconsistent? */
4262 printf("hfs_reclaim_sys_file: BlockDeallocate returned %d\n", error
);
4265 error
= hfs_flushvolumeheader(hfsmp
, MNT_WAIT
, HFS_ALTFLUSH
);
4267 /* TODO: Mark volume inconsistent? */
4268 printf("hfs_reclaim_sys_file: hfs_flushvolumeheader returned %d\n", error
);
4274 /* Relocate overflow extents (if any) */
4275 if (i
== kHFSPlusExtentDensity
&& fp
->ff_blocks
> datablks
) {
4276 struct BTreeIterator
*iterator
= NULL
;
4277 struct FSBufferDescriptor btdata
;
4278 HFSPlusExtentRecord record
;
4279 HFSPlusExtentKey
*key
;
4284 forktype
= VNODE_IS_RSRC(vp
) ? 0xFF : 0;
4285 fileID
= VTOC(vp
)->c_cnid
;
4286 if (kmem_alloc(kernel_map
, (vm_offset_t
*) &iterator
, sizeof(*iterator
))) {
4287 printf("hfs_reclaim_sys_file: kmem_alloc failed!\n");
4292 bzero(iterator
, sizeof(*iterator
));
4293 key
= (HFSPlusExtentKey
*) &iterator
->key
;
4294 key
->keyLength
= kHFSPlusExtentKeyMaximumLength
;
4295 key
->forkType
= forktype
;
4296 key
->fileID
= fileID
;
4297 key
->startBlock
= datablks
;
4299 btdata
.bufferAddress
= &record
;
4300 btdata
.itemSize
= sizeof(record
);
4301 btdata
.itemCount
= 1;
4303 fcb
= VTOF(hfsmp
->hfs_extents_vp
);
4305 error
= BTSearchRecord(fcb
, iterator
, &btdata
, NULL
, iterator
);
4306 while (error
== 0) {
4307 /* Stop when we encounter a different file or fork. */
4308 if ((key
->fileID
!= fileID
) ||
4309 (key
->forkType
!= forktype
)) {
4313 * Check if the file overlaps target space.
4315 for (i
= 0; i
< kHFSPlusExtentDensity
; ++i
) {
4316 if (record
[i
].blockCount
== 0) {
4319 oldStartBlock
= record
[i
].startBlock
;
4320 blockCount
= record
[i
].blockCount
;
4321 block
= oldStartBlock
+ blockCount
;
4322 if (block
> startblk
) {
4323 error
= BlockAllocate(hfsmp
, 1, blockCount
, blockCount
, true, true, &newStartBlock
, &blockCount
);
4325 printf("hfs_reclaim_sys_file: BlockAllocate returned %d\n", error
);
4328 if (blockCount
!= record
[i
].blockCount
) {
4329 printf("hfs_reclaim_sys_file: new blockCount=%u, original blockCount=%u", blockCount
, fp
->ff_extents
[i
].blockCount
);
4330 kmem_free(kernel_map
, (vm_offset_t
)iterator
, sizeof(*iterator
));
4333 error
= hfs_copy_extent(hfsmp
, vp
, oldStartBlock
, newStartBlock
, blockCount
, context
);
4335 printf("hfs_reclaim_sys_file: hfs_copy_extent returned %d\n", error
);
4336 kmem_free(kernel_map
, (vm_offset_t
)iterator
, sizeof(*iterator
));
4339 record
[i
].startBlock
= newStartBlock
;
4340 VTOC(vp
)->c_flag
|= C_MODIFIED
;
4343 * NOTE: To support relocating overflow extents of the
4344 * allocation file, we must update the BTree record BEFORE
4345 * deallocating the old extent so that BlockDeallocate will
4346 * use the extent's new location to calculate physical block
4347 * numbers. (This is for the case where the old extent's
4348 * bitmap bits actually reside in the extent being moved.)
4350 error
= BTUpdateRecord(fcb
, iterator
, (IterateCallBackProcPtr
) hfs_relocate_callback
, &record
);
4352 /* TODO: Mark volume inconsistent? */
4353 printf("hfs_reclaim_sys_file: BTUpdateRecord returned %d\n", error
);
4356 error
= BlockDeallocate(hfsmp
, oldStartBlock
, blockCount
);
4358 /* TODO: Mark volume inconsistent? */
4359 printf("hfs_reclaim_sys_file: BlockDeallocate returned %d\n", error
);
4364 /* Look for more records. */
4365 error
= BTIterateRecord(fcb
, kBTreeNextRecord
, iterator
, &btdata
, NULL
);
4366 if (error
== btNotFound
) {
4372 kmem_free(kernel_map
, (vm_offset_t
)iterator
, sizeof(*iterator
));
4378 hfs_systemfile_unlock(hfsmp
, lockflags
);
4379 error
= hfs_end_transaction(hfsmp
);
4381 printf("hfs_reclaim_sys_file: hfs_end_transaction returned %d\n", error
);
4387 (void) BlockDeallocate(hfsmp
, newStartBlock
, blockCount
);
4389 (void) hfs_systemfile_unlock(hfsmp
, lockflags
);
4390 (void) hfs_end_transaction(hfsmp
);
4396 * This journal_relocate callback updates the journal info block to point
4397 * at the new journal location. This write must NOT be done using the
4398 * transaction. We must write the block immediately. We must also force
4399 * it to get to the media so that the new journal location will be seen by
4400 * the replay code before we can safely let journaled blocks be written
4401 * to their normal locations.
4403 * The tests for journal_uses_fua below are mildly hacky. Since the journal
4404 * and the file system are both on the same device, I'm leveraging what
4405 * the journal has decided about FUA.
4407 struct hfs_journal_relocate_args
{
4408 struct hfsmount
*hfsmp
;
4409 vfs_context_t context
;
4410 u_int32_t newStartBlock
;
4414 hfs_journal_relocate_callback(void *_args
)
4417 struct hfs_journal_relocate_args
*args
= _args
;
4418 struct hfsmount
*hfsmp
= args
->hfsmp
;
4420 JournalInfoBlock
*jibp
;
4422 error
= buf_meta_bread(hfsmp
->hfs_devvp
,
4423 hfsmp
->vcbJinfoBlock
* (hfsmp
->blockSize
/hfsmp
->hfs_logical_block_size
),
4424 hfsmp
->blockSize
, vfs_context_ucred(args
->context
), &bp
);
4426 printf("hfs_reclaim_journal_file: failed to read JIB (%d)\n", error
);
4429 jibp
= (JournalInfoBlock
*) buf_dataptr(bp
);
4430 jibp
->offset
= SWAP_BE64((u_int64_t
)args
->newStartBlock
* hfsmp
->blockSize
);
4431 jibp
->size
= SWAP_BE64(hfsmp
->jnl_size
);
4432 if (journal_uses_fua(hfsmp
->jnl
))
4434 error
= buf_bwrite(bp
);
4436 printf("hfs_reclaim_journal_file: failed to write JIB (%d)\n", error
);
4439 if (!journal_uses_fua(hfsmp
->jnl
)) {
4440 error
= VNOP_IOCTL(hfsmp
->hfs_devvp
, DKIOCSYNCHRONIZECACHE
, NULL
, FWRITE
, args
->context
);
4442 printf("hfs_reclaim_journal_file: DKIOCSYNCHRONIZECACHE failed (%d)\n", error
);
4443 error
= 0; /* Don't fail the operation. */
4452 hfs_reclaim_journal_file(struct hfsmount
*hfsmp
, vfs_context_t context
)
4456 u_int32_t newStartBlock
;
4457 u_int32_t oldBlockCount
;
4458 u_int32_t newBlockCount
;
4459 struct cat_desc journal_desc
;
4460 struct cat_attr journal_attr
;
4461 struct cat_fork journal_fork
;
4462 struct hfs_journal_relocate_args callback_args
;
4464 error
= hfs_start_transaction(hfsmp
);
4466 printf("hfs_reclaim_journal_file: hfs_start_transaction returned %d\n", error
);
4469 lockflags
= hfs_systemfile_lock(hfsmp
, SFL_CATALOG
| SFL_BITMAP
, HFS_EXCLUSIVE_LOCK
);
4471 oldBlockCount
= hfsmp
->jnl_size
/ hfsmp
->blockSize
;
4473 /* TODO: Allow the journal to change size based on the new volume size. */
4474 error
= BlockAllocate(hfsmp
, 1, oldBlockCount
, oldBlockCount
, true, true, &newStartBlock
, &newBlockCount
);
4476 printf("hfs_reclaim_journal_file: BlockAllocate returned %d\n", error
);
4479 if (newBlockCount
!= oldBlockCount
) {
4480 printf("hfs_reclaim_journal_file: newBlockCount != oldBlockCount (%u, %u)\n", newBlockCount
, oldBlockCount
);
4484 error
= BlockDeallocate(hfsmp
, hfsmp
->jnl_start
, oldBlockCount
);
4486 printf("hfs_reclaim_journal_file: BlockDeallocate returned %d\n", error
);
4490 /* Update the catalog record for .journal */
4491 error
= cat_idlookup(hfsmp
, hfsmp
->hfs_jnlfileid
, 1, &journal_desc
, &journal_attr
, &journal_fork
);
4493 printf("hfs_reclaim_journal_file: cat_idlookup returned %d\n", error
);
4496 journal_fork
.cf_size
= newBlockCount
* hfsmp
->blockSize
;
4497 journal_fork
.cf_extents
[0].startBlock
= newStartBlock
;
4498 journal_fork
.cf_extents
[0].blockCount
= newBlockCount
;
4499 journal_fork
.cf_blocks
= newBlockCount
;
4500 error
= cat_update(hfsmp
, &journal_desc
, &journal_attr
, &journal_fork
, NULL
);
4501 cat_releasedesc(&journal_desc
); /* all done with cat descriptor */
4503 printf("hfs_reclaim_journal_file: cat_update returned %d\n", error
);
4506 callback_args
.hfsmp
= hfsmp
;
4507 callback_args
.context
= context
;
4508 callback_args
.newStartBlock
= newStartBlock
;
4510 error
= journal_relocate(hfsmp
->jnl
, (off_t
)newStartBlock
*hfsmp
->blockSize
,
4511 (off_t
)newBlockCount
*hfsmp
->blockSize
, 0,
4512 hfs_journal_relocate_callback
, &callback_args
);
4514 /* NOTE: journal_relocate will mark the journal invalid. */
4515 printf("hfs_reclaim_journal_file: journal_relocate returned %d\n", error
);
4518 hfsmp
->jnl_start
= newStartBlock
;
4519 hfsmp
->jnl_size
= (off_t
)newBlockCount
* hfsmp
->blockSize
;
4521 hfs_systemfile_unlock(hfsmp
, lockflags
);
4522 error
= hfs_end_transaction(hfsmp
);
4524 printf("hfs_reclaim_journal_file: hfs_end_transaction returned %d\n", error
);
4530 (void) BlockDeallocate(hfsmp
, newStartBlock
, newBlockCount
);
4532 hfs_systemfile_unlock(hfsmp
, lockflags
);
4533 (void) hfs_end_transaction(hfsmp
);
4539 * Move the journal info block to a new location. We have to make sure the
4540 * new copy of the journal info block gets to the media first, then change
4541 * the field in the volume header and the catalog record.
4544 hfs_reclaim_journal_info_block(struct hfsmount
*hfsmp
, vfs_context_t context
)
4549 u_int32_t blockCount
;
4550 struct cat_desc jib_desc
;
4551 struct cat_attr jib_attr
;
4552 struct cat_fork jib_fork
;
4553 buf_t old_bp
, new_bp
;
4555 error
= hfs_start_transaction(hfsmp
);
4557 printf("hfs_reclaim_journal_info_block: hfs_start_transaction returned %d\n", error
);
4560 lockflags
= hfs_systemfile_lock(hfsmp
, SFL_CATALOG
| SFL_BITMAP
, HFS_EXCLUSIVE_LOCK
);
4562 error
= BlockAllocate(hfsmp
, 1, 1, 1, true, true, &newBlock
, &blockCount
);
4564 printf("hfs_reclaim_journal_info_block: BlockAllocate returned %d\n", error
);
4567 if (blockCount
!= 1) {
4568 printf("hfs_reclaim_journal_info_block: blockCount != 1 (%u)\n", blockCount
);
4571 error
= BlockDeallocate(hfsmp
, hfsmp
->vcbJinfoBlock
, 1);
4573 printf("hfs_reclaim_journal_info_block: BlockDeallocate returned %d\n", error
);
4577 /* Copy the old journal info block content to the new location */
4578 error
= buf_meta_bread(hfsmp
->hfs_devvp
,
4579 hfsmp
->vcbJinfoBlock
* (hfsmp
->blockSize
/hfsmp
->hfs_logical_block_size
),
4580 hfsmp
->blockSize
, vfs_context_ucred(context
), &old_bp
);
4582 printf("hfs_reclaim_journal_info_block: failed to read JIB (%d)\n", error
);
4585 new_bp
= buf_getblk(hfsmp
->hfs_devvp
,
4586 newBlock
* (hfsmp
->blockSize
/hfsmp
->hfs_logical_block_size
),
4587 hfsmp
->blockSize
, 0, 0, BLK_META
);
4588 bcopy((char*)buf_dataptr(old_bp
), (char*)buf_dataptr(new_bp
), hfsmp
->blockSize
);
4590 if (journal_uses_fua(hfsmp
->jnl
))
4591 buf_markfua(new_bp
);
4592 error
= buf_bwrite(new_bp
);
4594 printf("hfs_reclaim_journal_info_block: failed to write new JIB (%d)\n", error
);
4597 if (!journal_uses_fua(hfsmp
->jnl
)) {
4598 error
= VNOP_IOCTL(hfsmp
->hfs_devvp
, DKIOCSYNCHRONIZECACHE
, NULL
, FWRITE
, context
);
4600 printf("hfs_reclaim_journal_info_block: DKIOCSYNCHRONIZECACHE failed (%d)\n", error
);
4601 /* Don't fail the operation. */
4605 /* Update the catalog record for .journal_info_block */
4606 error
= cat_idlookup(hfsmp
, hfsmp
->hfs_jnlinfoblkid
, 1, &jib_desc
, &jib_attr
, &jib_fork
);
4608 printf("hfs_reclaim_journal_file: cat_idlookup returned %d\n", error
);
4611 jib_fork
.cf_size
= hfsmp
->blockSize
;
4612 jib_fork
.cf_extents
[0].startBlock
= newBlock
;
4613 jib_fork
.cf_extents
[0].blockCount
= 1;
4614 jib_fork
.cf_blocks
= 1;
4615 error
= cat_update(hfsmp
, &jib_desc
, &jib_attr
, &jib_fork
, NULL
);
4616 cat_releasedesc(&jib_desc
); /* all done with cat descriptor */
4618 printf("hfs_reclaim_journal_info_block: cat_update returned %d\n", error
);
4622 /* Update the pointer to the journal info block in the volume header. */
4623 hfsmp
->vcbJinfoBlock
= newBlock
;
4624 error
= hfs_flushvolumeheader(hfsmp
, MNT_WAIT
, HFS_ALTFLUSH
);
4626 printf("hfs_reclaim_journal_info_block: hfs_flushvolumeheader returned %d\n", error
);
4629 hfs_systemfile_unlock(hfsmp
, lockflags
);
4630 error
= hfs_end_transaction(hfsmp
);
4632 printf("hfs_reclaim_journal_info_block: hfs_end_transaction returned %d\n", error
);
4634 error
= hfs_journal_flush(hfsmp
);
4636 printf("hfs_reclaim_journal_info_block: journal_flush returned %d\n", error
);
4641 (void) BlockDeallocate(hfsmp
, newBlock
, blockCount
);
4643 hfs_systemfile_unlock(hfsmp
, lockflags
);
4644 (void) hfs_end_transaction(hfsmp
);
4650 * Reclaim space at the end of a file system.
4653 hfs_reclaimspace(struct hfsmount
*hfsmp
, u_int32_t startblk
, u_int32_t reclaimblks
, vfs_context_t context
)
4655 struct vnode
*vp
= NULL
;
4657 struct BTreeIterator
* iterator
= NULL
;
4658 struct FSBufferDescriptor btdata
;
4659 struct HFSPlusCatalogFile filerec
;
4660 u_int32_t saved_next_allocation
;
4668 u_int32_t blkstomove
= 0;
4672 int lastprogress
= 0;
4673 Boolean system_file_moved
= false;
4675 /* Relocate extents of the Allocation file if they're in the way. */
4676 error
= hfs_reclaim_sys_file(hfsmp
, hfsmp
->hfs_allocation_vp
, startblk
, SFL_BITMAP
, &system_file_moved
, context
);
4678 printf("hfs_reclaimspace: reclaim allocation file returned %d\n", error
);
4681 /* Relocate extents of the Extents B-tree if they're in the way. */
4682 error
= hfs_reclaim_sys_file(hfsmp
, hfsmp
->hfs_extents_vp
, startblk
, SFL_EXTENTS
, &system_file_moved
, context
);
4684 printf("hfs_reclaimspace: reclaim extents b-tree returned %d\n", error
);
4687 /* Relocate extents of the Catalog B-tree if they're in the way. */
4688 error
= hfs_reclaim_sys_file(hfsmp
, hfsmp
->hfs_catalog_vp
, startblk
, SFL_CATALOG
, &system_file_moved
, context
);
4690 printf("hfs_reclaimspace: reclaim catalog b-tree returned %d\n", error
);
4693 /* Relocate extents of the Attributes B-tree if they're in the way. */
4694 error
= hfs_reclaim_sys_file(hfsmp
, hfsmp
->hfs_attribute_vp
, startblk
, SFL_ATTRIBUTE
, &system_file_moved
, context
);
4696 printf("hfs_reclaimspace: reclaim attribute b-tree returned %d\n", error
);
4699 /* Relocate extents of the Startup File if there is one and they're in the way. */
4700 error
= hfs_reclaim_sys_file(hfsmp
, hfsmp
->hfs_startup_vp
, startblk
, SFL_STARTUP
, &system_file_moved
, context
);
4702 printf("hfs_reclaimspace: reclaim startup file returned %d\n", error
);
4707 * We need to make sure the alternate volume header gets flushed if we moved
4708 * any extents in the volume header. But we need to do that before
4709 * shrinking the size of the volume, or else the journal code will panic
4710 * with an invalid (too large) block number.
4712 * Note that system_file_moved will be set if ANY extent was moved, even
4713 * if it was just an overflow extent. In this case, the journal_flush isn't
4714 * strictly required, but shouldn't hurt.
4716 if (system_file_moved
)
4717 hfs_journal_flush(hfsmp
);
4719 if (hfsmp
->jnl_start
+ (hfsmp
->jnl_size
/ hfsmp
->blockSize
) > startblk
) {
4720 error
= hfs_reclaim_journal_file(hfsmp
, context
);
4722 printf("hfs_reclaimspace: hfs_reclaim_journal_file failed (%d)\n", error
);
4727 if (hfsmp
->vcbJinfoBlock
>= startblk
) {
4728 error
= hfs_reclaim_journal_info_block(hfsmp
, context
);
4730 printf("hfs_reclaimspace: hfs_reclaim_journal_info_block failed (%d)\n", error
);
4735 /* For now move a maximum of 250,000 files. */
4736 maxfilecnt
= MIN(hfsmp
->hfs_filecount
, 250000);
4737 maxfilecnt
= MIN((u_int32_t
)maxfilecnt
, reclaimblks
);
4738 cnidbufsize
= maxfilecnt
* sizeof(cnid_t
);
4739 if (kmem_alloc(kernel_map
, (vm_offset_t
*)&cnidbufp
, cnidbufsize
)) {
4742 if (kmem_alloc(kernel_map
, (vm_offset_t
*)&iterator
, sizeof(*iterator
))) {
4743 kmem_free(kernel_map
, (vm_offset_t
)cnidbufp
, cnidbufsize
);
4747 saved_next_allocation
= hfsmp
->nextAllocation
;
4748 HFS_UPDATE_NEXT_ALLOCATION(hfsmp
, hfsmp
->hfs_metazone_start
);
4750 fcb
= VTOF(hfsmp
->hfs_catalog_vp
);
4751 bzero(iterator
, sizeof(*iterator
));
4753 btdata
.bufferAddress
= &filerec
;
4754 btdata
.itemSize
= sizeof(filerec
);
4755 btdata
.itemCount
= 1;
4757 /* Keep the Catalog and extents files locked during iteration. */
4758 lockflags
= hfs_systemfile_lock(hfsmp
, SFL_CATALOG
| SFL_EXTENTS
, HFS_SHARED_LOCK
);
4760 error
= BTIterateRecord(fcb
, kBTreeFirstRecord
, iterator
, NULL
, NULL
);
4765 * Iterate over all the catalog records looking for files
4766 * that overlap into the space we're trying to free up.
4768 for (filecnt
= 0; filecnt
< maxfilecnt
; ) {
4769 error
= BTIterateRecord(fcb
, kBTreeNextRecord
, iterator
, &btdata
, NULL
);
4771 if (error
== fsBTRecordNotFoundErr
|| error
== fsBTEndOfIterationErr
) {
4776 if (filerec
.recordType
!= kHFSPlusFileRecord
) {
4779 datablks
= rsrcblks
= 0;
4781 * Check if either fork overlaps target space.
4783 for (i
= 0; i
< kHFSPlusExtentDensity
; ++i
) {
4784 if (filerec
.dataFork
.extents
[i
].blockCount
!= 0) {
4785 datablks
+= filerec
.dataFork
.extents
[i
].blockCount
;
4786 block
= filerec
.dataFork
.extents
[i
].startBlock
+
4787 filerec
.dataFork
.extents
[i
].blockCount
;
4788 if (block
>= startblk
) {
4789 if ((filerec
.fileID
== hfsmp
->hfs_jnlfileid
) ||
4790 (filerec
.fileID
== hfsmp
->hfs_jnlinfoblkid
)) {
4791 printf("hfs_reclaimspace: cannot move active journal\n");
4795 cnidbufp
[filecnt
++] = filerec
.fileID
;
4796 blkstomove
+= filerec
.dataFork
.totalBlocks
;
4800 if (filerec
.resourceFork
.extents
[i
].blockCount
!= 0) {
4801 rsrcblks
+= filerec
.resourceFork
.extents
[i
].blockCount
;
4802 block
= filerec
.resourceFork
.extents
[i
].startBlock
+
4803 filerec
.resourceFork
.extents
[i
].blockCount
;
4804 if (block
>= startblk
) {
4805 cnidbufp
[filecnt
++] = filerec
.fileID
;
4806 blkstomove
+= filerec
.resourceFork
.totalBlocks
;
4812 * Check for any overflow extents that overlap.
4814 if (i
== kHFSPlusExtentDensity
) {
4815 if (filerec
.dataFork
.totalBlocks
> datablks
) {
4816 if (hfs_overlapped_overflow_extents(hfsmp
, startblk
, datablks
, filerec
.fileID
, 0)) {
4817 cnidbufp
[filecnt
++] = filerec
.fileID
;
4818 blkstomove
+= filerec
.dataFork
.totalBlocks
;
4820 } else if (filerec
.resourceFork
.totalBlocks
> rsrcblks
) {
4821 if (hfs_overlapped_overflow_extents(hfsmp
, startblk
, rsrcblks
, filerec
.fileID
, 1)) {
4822 cnidbufp
[filecnt
++] = filerec
.fileID
;
4823 blkstomove
+= filerec
.resourceFork
.totalBlocks
;
4830 if (filecnt
== 0 && !system_file_moved
) {
4831 printf("hfs_reclaimspace: no files moved\n");
4834 /* All done with catalog. */
4835 hfs_systemfile_unlock(hfsmp
, lockflags
);
4836 if (error
|| filecnt
== 0)
4840 * Double check space requirements to make sure
4841 * there is enough space to relocate any files
4842 * that reside in the reclaim area.
4844 * Blocks To Move --------------
4847 * ------------------------------------------------------------------------
4851 * ------------------------------------------------------------------------
4853 * <------------------- New Total Blocks ------------------><-- Reclaim -->
4855 * <------------------------ Original Total Blocks ----------------------->
4858 if (blkstomove
>= hfs_freeblks(hfsmp
, 1)) {
4859 printf("hfs_truncatefs: insufficient space (need %u blocks; have %u blocks)\n", blkstomove
, hfs_freeblks(hfsmp
, 1));
4863 hfsmp
->hfs_resize_filesmoved
= 0;
4864 hfsmp
->hfs_resize_totalfiles
= filecnt
;
4866 /* Now move any files that are in the way. */
4867 for (i
= 0; i
< filecnt
; ++i
) {
4871 if (hfs_vget(hfsmp
, cnidbufp
[i
], &vp
, 0) != 0)
4874 /* Relocating directory hard links is not supported, so we
4875 * punt (see radar 6217026). */
4877 if ((cp
->c_flag
& C_HARDLINK
) && vnode_isdir(vp
)) {
4878 printf("hfs_reclaimspace: unable to relocate directory hard link %d\n", cp
->c_cnid
);
4883 /* Relocate any data fork blocks. */
4884 if (VTOF(vp
) && VTOF(vp
)->ff_blocks
> 0) {
4885 error
= hfs_relocate(vp
, hfsmp
->hfs_metazone_end
+ 1, kauth_cred_get(), current_proc());
4890 /* Relocate any resource fork blocks. */
4891 if ((cp
->c_blocks
- (VTOF(vp
) ? VTOF((vp
))->ff_blocks
: 0)) > 0) {
4892 error
= hfs_vgetrsrc(hfsmp
, vp
, &rvp
, TRUE
);
4895 error
= hfs_relocate(rvp
, hfsmp
->hfs_metazone_end
+ 1, kauth_cred_get(), current_proc());
4896 VTOC(rvp
)->c_flag
|= C_NEED_RVNODE_PUT
;
4904 ++hfsmp
->hfs_resize_filesmoved
;
4906 /* Report intermediate progress. */
4907 if (filecnt
> 100) {
4910 progress
= (i
* 100) / filecnt
;
4911 if (progress
> (lastprogress
+ 9)) {
4912 printf("hfs_reclaimspace: %d%% done...\n", progress
);
4913 lastprogress
= progress
;
4918 hfs_unlock(VTOC(vp
));
4922 if (hfsmp
->hfs_resize_filesmoved
!= 0) {
4923 printf("hfs_reclaimspace: relocated %d files on \"%s\"\n",
4924 (int)hfsmp
->hfs_resize_filesmoved
, hfsmp
->vcbVN
);
4927 kmem_free(kernel_map
, (vm_offset_t
)iterator
, sizeof(*iterator
));
4928 kmem_free(kernel_map
, (vm_offset_t
)cnidbufp
, cnidbufsize
);
4931 * Restore the roving allocation pointer on errors.
4932 * (but only if we didn't move any files)
4934 if (error
&& hfsmp
->hfs_resize_filesmoved
== 0) {
4935 HFS_UPDATE_NEXT_ALLOCATION(hfsmp
, saved_next_allocation
);
4942 * Check if there are any overflow extents that overlap.
4945 hfs_overlapped_overflow_extents(struct hfsmount
*hfsmp
, u_int32_t startblk
, u_int32_t catblks
, u_int32_t fileID
, int rsrcfork
)
4947 struct BTreeIterator
* iterator
= NULL
;
4948 struct FSBufferDescriptor btdata
;
4949 HFSPlusExtentRecord extrec
;
4950 HFSPlusExtentKey
*extkeyptr
;
4958 forktype
= rsrcfork
? 0xFF : 0;
4959 if (kmem_alloc(kernel_map
, (vm_offset_t
*)&iterator
, sizeof(*iterator
))) {
4962 bzero(iterator
, sizeof(*iterator
));
4963 extkeyptr
= (HFSPlusExtentKey
*)&iterator
->key
;
4964 extkeyptr
->keyLength
= kHFSPlusExtentKeyMaximumLength
;
4965 extkeyptr
->forkType
= forktype
;
4966 extkeyptr
->fileID
= fileID
;
4967 extkeyptr
->startBlock
= catblks
;
4969 btdata
.bufferAddress
= &extrec
;
4970 btdata
.itemSize
= sizeof(extrec
);
4971 btdata
.itemCount
= 1;
4973 fcb
= VTOF(hfsmp
->hfs_extents_vp
);
4975 error
= BTSearchRecord(fcb
, iterator
, &btdata
, NULL
, iterator
);
4976 while (error
== 0) {
4977 /* Stop when we encounter a different file. */
4978 if ((extkeyptr
->fileID
!= fileID
) ||
4979 (extkeyptr
->forkType
!= forktype
)) {
4983 * Check if the file overlaps target space.
4985 for (i
= 0; i
< kHFSPlusExtentDensity
; ++i
) {
4986 if (extrec
[i
].blockCount
== 0) {
4989 block
= extrec
[i
].startBlock
+ extrec
[i
].blockCount
;
4990 if (block
>= startblk
) {
4995 /* Look for more records. */
4996 error
= BTIterateRecord(fcb
, kBTreeNextRecord
, iterator
, &btdata
, NULL
);
4999 kmem_free(kernel_map
, (vm_offset_t
)iterator
, sizeof(*iterator
));
5000 return (overlapped
);
5005 * Calculate the progress of a file system resize operation.
5009 hfs_resize_progress(struct hfsmount
*hfsmp
, u_int32_t
*progress
)
5011 if ((hfsmp
->hfs_flags
& HFS_RESIZE_IN_PROGRESS
) == 0) {
5015 if (hfsmp
->hfs_resize_totalfiles
> 0)
5016 *progress
= (hfsmp
->hfs_resize_filesmoved
* 100) / hfsmp
->hfs_resize_totalfiles
;
5025 * Creates a UUID from a unique "name" in the HFS UUID Name space.
5026 * See version 3 UUID.
5029 hfs_getvoluuid(struct hfsmount
*hfsmp
, uuid_t result
)
5034 ((uint32_t *)rawUUID
)[0] = hfsmp
->vcbFndrInfo
[6];
5035 ((uint32_t *)rawUUID
)[1] = hfsmp
->vcbFndrInfo
[7];
5038 MD5Update( &md5c
, HFS_UUID_NAMESPACE_ID
, sizeof( uuid_t
) );
5039 MD5Update( &md5c
, rawUUID
, sizeof (rawUUID
) );
5040 MD5Final( result
, &md5c
);
5042 result
[6] = 0x30 | ( result
[6] & 0x0F );
5043 result
[8] = 0x80 | ( result
[8] & 0x3F );
5047 * Get file system attributes.
5050 hfs_vfs_getattr(struct mount
*mp
, struct vfs_attr
*fsap
, __unused vfs_context_t context
)
5052 #define HFS_ATTR_CMN_VALIDMASK (ATTR_CMN_VALIDMASK & ~(ATTR_CMN_NAMEDATTRCOUNT | ATTR_CMN_NAMEDATTRLIST))
5053 #define HFS_ATTR_FILE_VALIDMASK (ATTR_FILE_VALIDMASK & ~(ATTR_FILE_FILETYPE | ATTR_FILE_FORKCOUNT | ATTR_FILE_FORKLIST))
5055 ExtendedVCB
*vcb
= VFSTOVCB(mp
);
5056 struct hfsmount
*hfsmp
= VFSTOHFS(mp
);
5057 u_int32_t freeCNIDs
;
5059 freeCNIDs
= (u_int32_t
)0xFFFFFFFF - (u_int32_t
)hfsmp
->vcbNxtCNID
;
5061 VFSATTR_RETURN(fsap
, f_objcount
, (u_int64_t
)hfsmp
->vcbFilCnt
+ (u_int64_t
)hfsmp
->vcbDirCnt
);
5062 VFSATTR_RETURN(fsap
, f_filecount
, (u_int64_t
)hfsmp
->vcbFilCnt
);
5063 VFSATTR_RETURN(fsap
, f_dircount
, (u_int64_t
)hfsmp
->vcbDirCnt
);
5064 VFSATTR_RETURN(fsap
, f_maxobjcount
, (u_int64_t
)0xFFFFFFFF);
5065 VFSATTR_RETURN(fsap
, f_iosize
, (size_t)cluster_max_io_size(mp
, 0));
5066 VFSATTR_RETURN(fsap
, f_blocks
, (u_int64_t
)hfsmp
->totalBlocks
);
5067 VFSATTR_RETURN(fsap
, f_bfree
, (u_int64_t
)hfs_freeblks(hfsmp
, 0));
5068 VFSATTR_RETURN(fsap
, f_bavail
, (u_int64_t
)hfs_freeblks(hfsmp
, 1));
5069 VFSATTR_RETURN(fsap
, f_bsize
, (u_int32_t
)vcb
->blockSize
);
5070 /* XXX needs clarification */
5071 VFSATTR_RETURN(fsap
, f_bused
, hfsmp
->totalBlocks
- hfs_freeblks(hfsmp
, 1));
5072 /* Maximum files is constrained by total blocks. */
5073 VFSATTR_RETURN(fsap
, f_files
, (u_int64_t
)(hfsmp
->totalBlocks
- 2));
5074 VFSATTR_RETURN(fsap
, f_ffree
, MIN((u_int64_t
)freeCNIDs
, (u_int64_t
)hfs_freeblks(hfsmp
, 1)));
5076 fsap
->f_fsid
.val
[0] = hfsmp
->hfs_raw_dev
;
5077 fsap
->f_fsid
.val
[1] = vfs_typenum(mp
);
5078 VFSATTR_SET_SUPPORTED(fsap
, f_fsid
);
5080 VFSATTR_RETURN(fsap
, f_signature
, vcb
->vcbSigWord
);
5081 VFSATTR_RETURN(fsap
, f_carbon_fsid
, 0);
5083 if (VFSATTR_IS_ACTIVE(fsap
, f_capabilities
)) {
5084 vol_capabilities_attr_t
*cap
;
5086 cap
= &fsap
->f_capabilities
;
5088 if (hfsmp
->hfs_flags
& HFS_STANDARD
) {
5089 cap
->capabilities
[VOL_CAPABILITIES_FORMAT
] =
5090 VOL_CAP_FMT_PERSISTENTOBJECTIDS
|
5091 VOL_CAP_FMT_CASE_PRESERVING
|
5092 VOL_CAP_FMT_FAST_STATFS
|
5093 VOL_CAP_FMT_HIDDEN_FILES
|
5094 VOL_CAP_FMT_PATH_FROM_ID
;
5096 cap
->capabilities
[VOL_CAPABILITIES_FORMAT
] =
5097 VOL_CAP_FMT_PERSISTENTOBJECTIDS
|
5098 VOL_CAP_FMT_SYMBOLICLINKS
|
5099 VOL_CAP_FMT_HARDLINKS
|
5100 VOL_CAP_FMT_JOURNAL
|
5101 VOL_CAP_FMT_ZERO_RUNS
|
5102 (hfsmp
->jnl
? VOL_CAP_FMT_JOURNAL_ACTIVE
: 0) |
5103 (hfsmp
->hfs_flags
& HFS_CASE_SENSITIVE
? VOL_CAP_FMT_CASE_SENSITIVE
: 0) |
5104 VOL_CAP_FMT_CASE_PRESERVING
|
5105 VOL_CAP_FMT_FAST_STATFS
|
5106 VOL_CAP_FMT_2TB_FILESIZE
|
5107 VOL_CAP_FMT_HIDDEN_FILES
|
5109 VOL_CAP_FMT_PATH_FROM_ID
|
5110 VOL_CAP_FMT_DECMPFS_COMPRESSION
;
5112 VOL_CAP_FMT_PATH_FROM_ID
;
5115 cap
->capabilities
[VOL_CAPABILITIES_INTERFACES
] =
5116 VOL_CAP_INT_SEARCHFS
|
5117 VOL_CAP_INT_ATTRLIST
|
5118 VOL_CAP_INT_NFSEXPORT
|
5119 VOL_CAP_INT_READDIRATTR
|
5120 VOL_CAP_INT_EXCHANGEDATA
|
5121 VOL_CAP_INT_ALLOCATE
|
5122 VOL_CAP_INT_VOL_RENAME
|
5123 VOL_CAP_INT_ADVLOCK
|
5126 VOL_CAP_INT_EXTENDED_ATTR
|
5127 VOL_CAP_INT_NAMEDSTREAMS
;
5129 VOL_CAP_INT_EXTENDED_ATTR
;
5131 cap
->capabilities
[VOL_CAPABILITIES_RESERVED1
] = 0;
5132 cap
->capabilities
[VOL_CAPABILITIES_RESERVED2
] = 0;
5134 cap
->valid
[VOL_CAPABILITIES_FORMAT
] =
5135 VOL_CAP_FMT_PERSISTENTOBJECTIDS
|
5136 VOL_CAP_FMT_SYMBOLICLINKS
|
5137 VOL_CAP_FMT_HARDLINKS
|
5138 VOL_CAP_FMT_JOURNAL
|
5139 VOL_CAP_FMT_JOURNAL_ACTIVE
|
5140 VOL_CAP_FMT_NO_ROOT_TIMES
|
5141 VOL_CAP_FMT_SPARSE_FILES
|
5142 VOL_CAP_FMT_ZERO_RUNS
|
5143 VOL_CAP_FMT_CASE_SENSITIVE
|
5144 VOL_CAP_FMT_CASE_PRESERVING
|
5145 VOL_CAP_FMT_FAST_STATFS
|
5146 VOL_CAP_FMT_2TB_FILESIZE
|
5147 VOL_CAP_FMT_OPENDENYMODES
|
5148 VOL_CAP_FMT_HIDDEN_FILES
|
5150 VOL_CAP_FMT_PATH_FROM_ID
|
5151 VOL_CAP_FMT_DECMPFS_COMPRESSION
;
5153 VOL_CAP_FMT_PATH_FROM_ID
;
5155 cap
->valid
[VOL_CAPABILITIES_INTERFACES
] =
5156 VOL_CAP_INT_SEARCHFS
|
5157 VOL_CAP_INT_ATTRLIST
|
5158 VOL_CAP_INT_NFSEXPORT
|
5159 VOL_CAP_INT_READDIRATTR
|
5160 VOL_CAP_INT_EXCHANGEDATA
|
5161 VOL_CAP_INT_COPYFILE
|
5162 VOL_CAP_INT_ALLOCATE
|
5163 VOL_CAP_INT_VOL_RENAME
|
5164 VOL_CAP_INT_ADVLOCK
|
5166 VOL_CAP_INT_MANLOCK
|
5168 VOL_CAP_INT_EXTENDED_ATTR
|
5169 VOL_CAP_INT_NAMEDSTREAMS
;
5171 VOL_CAP_INT_EXTENDED_ATTR
;
5173 cap
->valid
[VOL_CAPABILITIES_RESERVED1
] = 0;
5174 cap
->valid
[VOL_CAPABILITIES_RESERVED2
] = 0;
5175 VFSATTR_SET_SUPPORTED(fsap
, f_capabilities
);
5177 if (VFSATTR_IS_ACTIVE(fsap
, f_attributes
)) {
5178 vol_attributes_attr_t
*attrp
= &fsap
->f_attributes
;
5180 attrp
->validattr
.commonattr
= HFS_ATTR_CMN_VALIDMASK
;
5181 attrp
->validattr
.volattr
= ATTR_VOL_VALIDMASK
& ~ATTR_VOL_INFO
;
5182 attrp
->validattr
.dirattr
= ATTR_DIR_VALIDMASK
;
5183 attrp
->validattr
.fileattr
= HFS_ATTR_FILE_VALIDMASK
;
5184 attrp
->validattr
.forkattr
= 0;
5186 attrp
->nativeattr
.commonattr
= HFS_ATTR_CMN_VALIDMASK
;
5187 attrp
->nativeattr
.volattr
= ATTR_VOL_VALIDMASK
& ~ATTR_VOL_INFO
;
5188 attrp
->nativeattr
.dirattr
= ATTR_DIR_VALIDMASK
;
5189 attrp
->nativeattr
.fileattr
= HFS_ATTR_FILE_VALIDMASK
;
5190 attrp
->nativeattr
.forkattr
= 0;
5191 VFSATTR_SET_SUPPORTED(fsap
, f_attributes
);
5193 fsap
->f_create_time
.tv_sec
= hfsmp
->vcbCrDate
;
5194 fsap
->f_create_time
.tv_nsec
= 0;
5195 VFSATTR_SET_SUPPORTED(fsap
, f_create_time
);
5196 fsap
->f_modify_time
.tv_sec
= hfsmp
->vcbLsMod
;
5197 fsap
->f_modify_time
.tv_nsec
= 0;
5198 VFSATTR_SET_SUPPORTED(fsap
, f_modify_time
);
5200 fsap
->f_backup_time
.tv_sec
= hfsmp
->vcbVolBkUp
;
5201 fsap
->f_backup_time
.tv_nsec
= 0;
5202 VFSATTR_SET_SUPPORTED(fsap
, f_backup_time
);
5203 if (VFSATTR_IS_ACTIVE(fsap
, f_fssubtype
)) {
5204 u_int16_t subtype
= 0;
5207 * Subtypes (flavors) for HFS
5208 * 0: Mac OS Extended
5209 * 1: Mac OS Extended (Journaled)
5210 * 2: Mac OS Extended (Case Sensitive)
5211 * 3: Mac OS Extended (Case Sensitive, Journaled)
5213 * 128: Mac OS Standard
5216 if (hfsmp
->hfs_flags
& HFS_STANDARD
) {
5217 subtype
= HFS_SUBTYPE_STANDARDHFS
;
5218 } else /* HFS Plus */ {
5220 subtype
|= HFS_SUBTYPE_JOURNALED
;
5221 if (hfsmp
->hfs_flags
& HFS_CASE_SENSITIVE
)
5222 subtype
|= HFS_SUBTYPE_CASESENSITIVE
;
5224 fsap
->f_fssubtype
= subtype
;
5225 VFSATTR_SET_SUPPORTED(fsap
, f_fssubtype
);
5228 if (VFSATTR_IS_ACTIVE(fsap
, f_vol_name
)) {
5229 strlcpy(fsap
->f_vol_name
, (char *) hfsmp
->vcbVN
, MAXPATHLEN
);
5230 VFSATTR_SET_SUPPORTED(fsap
, f_vol_name
);
5232 if (VFSATTR_IS_ACTIVE(fsap
, f_uuid
)) {
5233 hfs_getvoluuid(hfsmp
, fsap
->f_uuid
);
5234 VFSATTR_SET_SUPPORTED(fsap
, f_uuid
);
5240 * Perform a volume rename. Requires the FS' root vp.
5243 hfs_rename_volume(struct vnode
*vp
, const char *name
, proc_t p
)
5245 ExtendedVCB
*vcb
= VTOVCB(vp
);
5246 struct cnode
*cp
= VTOC(vp
);
5247 struct hfsmount
*hfsmp
= VTOHFS(vp
);
5248 struct cat_desc to_desc
;
5249 struct cat_desc todir_desc
;
5250 struct cat_desc new_desc
;
5251 cat_cookie_t cookie
;
5256 * Ignore attempts to rename a volume to a zero-length name.
5261 bzero(&to_desc
, sizeof(to_desc
));
5262 bzero(&todir_desc
, sizeof(todir_desc
));
5263 bzero(&new_desc
, sizeof(new_desc
));
5264 bzero(&cookie
, sizeof(cookie
));
5266 todir_desc
.cd_parentcnid
= kHFSRootParentID
;
5267 todir_desc
.cd_cnid
= kHFSRootFolderID
;
5268 todir_desc
.cd_flags
= CD_ISDIR
;
5270 to_desc
.cd_nameptr
= (const u_int8_t
*)name
;
5271 to_desc
.cd_namelen
= strlen(name
);
5272 to_desc
.cd_parentcnid
= kHFSRootParentID
;
5273 to_desc
.cd_cnid
= cp
->c_cnid
;
5274 to_desc
.cd_flags
= CD_ISDIR
;
5276 if ((error
= hfs_lock(cp
, HFS_EXCLUSIVE_LOCK
)) == 0) {
5277 if ((error
= hfs_start_transaction(hfsmp
)) == 0) {
5278 if ((error
= cat_preflight(hfsmp
, CAT_RENAME
, &cookie
, p
)) == 0) {
5279 lockflags
= hfs_systemfile_lock(hfsmp
, SFL_CATALOG
, HFS_EXCLUSIVE_LOCK
);
5281 error
= cat_rename(hfsmp
, &cp
->c_desc
, &todir_desc
, &to_desc
, &new_desc
);
5284 * If successful, update the name in the VCB, ensure it's terminated.
5287 strlcpy((char *)vcb
->vcbVN
, name
, sizeof(vcb
->vcbVN
));
5290 hfs_systemfile_unlock(hfsmp
, lockflags
);
5291 cat_postflight(hfsmp
, &cookie
, p
);
5295 (void) hfs_flushvolumeheader(hfsmp
, MNT_WAIT
, 0);
5297 hfs_end_transaction(hfsmp
);
5300 /* Release old allocated name buffer */
5301 if (cp
->c_desc
.cd_flags
& CD_HASBUF
) {
5302 const char *tmp_name
= (const char *)cp
->c_desc
.cd_nameptr
;
5304 cp
->c_desc
.cd_nameptr
= 0;
5305 cp
->c_desc
.cd_namelen
= 0;
5306 cp
->c_desc
.cd_flags
&= ~CD_HASBUF
;
5307 vfs_removename(tmp_name
);
5309 /* Update cnode's catalog descriptor */
5310 replace_desc(cp
, &new_desc
);
5311 vcb
->volumeNameEncodingHint
= new_desc
.cd_encoding
;
5312 cp
->c_touch_chgtime
= TRUE
;
5322 * Get file system attributes.
5325 hfs_vfs_setattr(struct mount
*mp
, struct vfs_attr
*fsap
, __unused vfs_context_t context
)
5327 kauth_cred_t cred
= vfs_context_ucred(context
);
5331 * Must be superuser or owner of filesystem to change volume attributes
5333 if (!kauth_cred_issuser(cred
) && (kauth_cred_getuid(cred
) != vfs_statfs(mp
)->f_owner
))
5336 if (VFSATTR_IS_ACTIVE(fsap
, f_vol_name
)) {
5339 error
= hfs_vfs_root(mp
, &root_vp
, context
);
5343 error
= hfs_rename_volume(root_vp
, fsap
->f_vol_name
, vfs_context_proc(context
));
5344 (void) vnode_put(root_vp
);
5348 VFSATTR_SET_SUPPORTED(fsap
, f_vol_name
);
5355 /* If a runtime corruption is detected, set the volume inconsistent
5356 * bit in the volume attributes. The volume inconsistent bit is a persistent
5357 * bit which represents that the volume is corrupt and needs repair.
5358 * The volume inconsistent bit can be set from the kernel when it detects
5359 * runtime corruption or from file system repair utilities like fsck_hfs when
5360 * a repair operation fails. The bit should be cleared only from file system
5361 * verify/repair utility like fsck_hfs when a verify/repair succeeds.
5363 void hfs_mark_volume_inconsistent(struct hfsmount
*hfsmp
)
5365 HFS_MOUNT_LOCK(hfsmp
, TRUE
);
5366 if ((hfsmp
->vcbAtrb
& kHFSVolumeInconsistentMask
) == 0) {
5367 hfsmp
->vcbAtrb
|= kHFSVolumeInconsistentMask
;
5368 MarkVCBDirty(hfsmp
);
5370 if ((hfsmp
->hfs_flags
& HFS_READ_ONLY
)==0) {
5371 /* Log information to ASL log */
5372 fslog_fs_corrupt(hfsmp
->hfs_mp
);
5373 printf("hfs: Runtime corruption detected on %s, fsck will be forced on next mount.\n", hfsmp
->vcbVN
);
5375 HFS_MOUNT_UNLOCK(hfsmp
, TRUE
);
5378 /* Replay the journal on the device node provided. Returns zero if
5379 * journal replay succeeded or no journal was supposed to be replayed.
5381 static int hfs_journal_replay(vnode_t devvp
, vfs_context_t context
)
5384 struct mount
*mp
= NULL
;
5385 struct hfs_mount_args
*args
= NULL
;
5387 /* Replay allowed only on raw devices */
5388 if (!vnode_ischr(devvp
)) {
5393 /* Create dummy mount structures */
5394 MALLOC(mp
, struct mount
*, sizeof(struct mount
), M_TEMP
, M_WAITOK
);
5399 bzero(mp
, sizeof(struct mount
));
5400 mount_lock_init(mp
);
5402 MALLOC(args
, struct hfs_mount_args
*, sizeof(struct hfs_mount_args
), M_TEMP
, M_WAITOK
);
5407 bzero(args
, sizeof(struct hfs_mount_args
));
5409 retval
= hfs_mountfs(devvp
, mp
, args
, 1, context
);
5410 buf_flushdirtyblks(devvp
, MNT_WAIT
, 0, "hfs_journal_replay");
5414 mount_lock_destroy(mp
);
5424 * hfs vfs operations.
5426 struct vfsops hfs_vfsops
= {
5432 hfs_vfs_getattr
, /* was hfs_statfs */