bsd/hfs/hfs_vfsops.c

   1 /*
   2  * Copyright (c) 1999-2008 Apple Inc. All rights reserved.
   3  *
   4  * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
   5  *
   6  * This file contains Original Code and/or Modifications of Original Code
   7  * as defined in and that are subject to the Apple Public Source License
   8  * Version 2.0 (the 'License'). You may not use this file except in
   9  * compliance with the License. The rights granted to you under the License
  10  * may not be used to create, or enable the creation or redistribution of,
  11  * unlawful or unlicensed copies of an Apple operating system, or to
  12  * circumvent, violate, or enable the circumvention or violation of, any
  13  * terms of an Apple operating system software license agreement.
  14  *
  15  * Please obtain a copy of the License at
  16  * http://www.opensource.apple.com/apsl/ and read it before using this file.
  17  *
  18  * The Original Code and all software distributed under the License are
  19  * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
  20  * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
  21  * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
  22  * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
  23  * Please see the License for the specific language governing rights and
  24  * limitations under the License.
  25  *
  26  * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
  27  */
  28 /*
  29  * Copyright (c) 1991, 1993, 1994
  30  *      The Regents of the University of California.  All rights reserved.
  31  * (c) UNIX System Laboratories, Inc.
  32  * All or some portions of this file are derived from material licensed
  33  * to the University of California by American Telephone and Telegraph
  34  * Co. or Unix System Laboratories, Inc. and are reproduced herein with
  35  * the permission of UNIX System Laboratories, Inc.
  36  *
  37  * Redistribution and use in source and binary forms, with or without
  38  * modification, are permitted provided that the following conditions
  39  * are met:
  40  * 1. Redistributions of source code must retain the above copyright
  41  *    notice, this list of conditions and the following disclaimer.
  42  * 2. Redistributions in binary form must reproduce the above copyright
  43  *    notice, this list of conditions and the following disclaimer in the
  44  *    documentation and/or other materials provided with the distribution.
  45  * 3. All advertising materials mentioning features or use of this software
  46  *    must display the following acknowledgement:
  47  *      This product includes software developed by the University of
  48  *      California, Berkeley and its contributors.
  49  * 4. Neither the name of the University nor the names of its contributors
  50  *    may be used to endorse or promote products derived from this software
  51  *    without specific prior written permission.
  52  *
  53  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
  54  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  55  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  56  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
  57  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  58  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  59  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  60  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  61  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  62  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  63  * SUCH DAMAGE.
  64  *
  65  *      hfs_vfsops.c
  66  *  derived from        @(#)ufs_vfsops.c        8.8 (Berkeley) 5/20/95
  67  *
  68  *      (c) Copyright 1997-2002 Apple Computer, Inc. All rights reserved.
  69  *
  70  *      hfs_vfsops.c -- VFS layer for loadable HFS file system.
  71  *
  72  */
  73 #include <sys/param.h>
  74 #include <sys/systm.h>
  75 #include <sys/kauth.h>
  76
  77 #include <sys/ubc.h>
  78 #include <sys/vnode_internal.h>
  79 #include <sys/mount_internal.h>
  80 #include <sys/sysctl.h>
  81 #include <sys/malloc.h>
  82 #include <sys/stat.h>
  83 #include <sys/quota.h>
  84 #include <sys/disk.h>
  85 #include <sys/paths.h>
  86 #include <sys/utfconv.h>
  87 #include <sys/kdebug.h>
  88 #include <sys/fslog.h>
  89
  90 #include <kern/locks.h>
  91
  92 #include <vfs/vfs_journal.h>
  93
  94 #include <miscfs/specfs/specdev.h>
  95 #include <hfs/hfs_mount.h>
  96
  97 #include "hfs.h"
  98 #include "hfs_catalog.h"
  99 #include "hfs_cnode.h"
 100 #include "hfs_dbg.h"
 101 #include "hfs_endian.h"
 102 #include "hfs_hotfiles.h"
 103 #include "hfs_quota.h"
 104
 105 #include "hfscommon/headers/FileMgrInternal.h"
 106 #include "hfscommon/headers/BTreesInternal.h"
 107
 108 #if     HFS_DIAGNOSTIC
 109 int hfs_dbg_all = 0;
 110 int hfs_dbg_err = 0;
 111 #endif
 112
 113
 114 lck_grp_attr_t *  hfs_group_attr;
 115 lck_attr_t *  hfs_lock_attr;
 116 lck_grp_t *  hfs_mutex_group;
 117 lck_grp_t *  hfs_rwlock_group;
 118
 119 extern struct vnodeopv_desc hfs_vnodeop_opv_desc;
 120
 121 static int hfs_changefs(struct mount *mp, struct hfs_mount_args *args);
 122 static int hfs_fhtovp(struct mount *mp, int fhlen, unsigned char *fhp, struct vnode **vpp, vfs_context_t context);
 123 static int hfs_flushfiles(struct mount *, int, struct proc *);
 124 static int hfs_flushMDB(struct hfsmount *hfsmp, int waitfor, int altflush);
 125 static int hfs_getmountpoint(struct vnode *vp, struct hfsmount **hfsmpp);
 126 static int hfs_init(struct vfsconf *vfsp);
 127 static int hfs_mount(struct mount *mp, vnode_t  devvp, user_addr_t data, vfs_context_t context);
 128 static int hfs_mountfs(struct vnode *devvp, struct mount *mp, struct hfs_mount_args *args, int journal_replay_only, vfs_context_t context);
 129 static int hfs_reload(struct mount *mp);
 130 static int hfs_vfs_root(struct mount *mp, struct vnode **vpp, vfs_context_t context);
 131 static int hfs_quotactl(struct mount *, int, uid_t, caddr_t, vfs_context_t context);
 132 static int hfs_start(struct mount *mp, int flags, vfs_context_t context);
 133 static int hfs_statfs(struct mount *mp, register struct vfsstatfs *sbp, vfs_context_t context);
 134 static int hfs_sync(struct mount *mp, int waitfor, vfs_context_t context);
 135 static int hfs_sysctl(int *name, u_int namelen, user_addr_t oldp, size_t *oldlenp,
 136                       user_addr_t newp, size_t newlen, vfs_context_t context);
 137 static int hfs_unmount(struct mount *mp, int mntflags, vfs_context_t context);
 138 static int hfs_vfs_vget(struct mount *mp, ino64_t ino, struct vnode **vpp, vfs_context_t context);
 139 static int hfs_vptofh(struct vnode *vp, int *fhlenp, unsigned char *fhp, vfs_context_t context);
 140
 141 static int hfs_reclaimspace(struct hfsmount *hfsmp, u_long startblk, u_long reclaimblks, vfs_context_t context);
 142 static int hfs_overlapped_overflow_extents(struct hfsmount *hfsmp, u_int32_t startblk,
 143                                            u_int32_t catblks, u_int32_t fileID, int rsrcfork);
 144 static int hfs_journal_replay(const char *devnode, vfs_context_t context);
 145
 146
 147 /*
 148  * Called by vfs_mountroot when mounting HFS Plus as root.
 149  */
 150
 151 __private_extern__
 152 int
 153 hfs_mountroot(mount_t mp, vnode_t rvp, vfs_context_t context)
 154 {
 155         struct hfsmount *hfsmp;
 156         ExtendedVCB *vcb;
 157         struct vfsstatfs *vfsp;
 158         int error;
 159
 160         hfs_chashinit_finish();
 161
 162         if ((error = hfs_mountfs(rvp, mp, NULL, 0, context)))
 163                 return (error);
 164
 165         /* Init hfsmp */
 166         hfsmp = VFSTOHFS(mp);
 167
 168         hfsmp->hfs_uid = UNKNOWNUID;
 169         hfsmp->hfs_gid = UNKNOWNGID;
 170         hfsmp->hfs_dir_mask = (S_IRWXU | S_IRGRP|S_IXGRP | S_IROTH|S_IXOTH); /* 0755 */
 171         hfsmp->hfs_file_mask = (S_IRWXU | S_IRGRP|S_IXGRP | S_IROTH|S_IXOTH); /* 0755 */
 172
 173         /* Establish the free block reserve. */
 174         vcb = HFSTOVCB(hfsmp);
 175         vcb->reserveBlocks = ((u_int64_t)vcb->totalBlocks * HFS_MINFREE) / 100;
 176         vcb->reserveBlocks = MIN(vcb->reserveBlocks, HFS_MAXRESERVE / vcb->blockSize);
 177
 178         vfsp = vfs_statfs(mp);
 179         (void)hfs_statfs(mp, vfsp, NULL);
 180
 181         return (0);
 182 }
 183
 184
 185 /*
 186  * VFS Operations.
 187  *
 188  * mount system call
 189  */
 190
 191 static int
 192 hfs_mount(struct mount *mp, vnode_t devvp, user_addr_t data, vfs_context_t context)
 193 {
 194         struct proc *p = vfs_context_proc(context);
 195         struct hfsmount *hfsmp = NULL;
 196         struct hfs_mount_args args;
 197         int retval = E_NONE;
 198         u_int32_t cmdflags;
 199
 200         if ((retval = copyin(data, (caddr_t)&args, sizeof(args)))) {
 201                 return (retval);
 202         }
 203         cmdflags = (u_int32_t)vfs_flags(mp) & MNT_CMDFLAGS;
 204         if (cmdflags & MNT_UPDATE) {
 205                 hfsmp = VFSTOHFS(mp);
 206
 207                 /* Reload incore data after an fsck. */
 208                 if (cmdflags & MNT_RELOAD) {
 209                         if (vfs_isrdonly(mp))
 210                                 return hfs_reload(mp);
 211                         else
 212                                 return (EINVAL);
 213                 }
 214
 215                 /* Change to a read-only file system. */
 216                 if (((hfsmp->hfs_flags & HFS_READ_ONLY) == 0) &&
 217                     vfs_isrdonly(mp)) {
 218                         int flags;
 219
 220                         /* use VFS_SYNC to push out System (btree) files */
 221                         retval = VFS_SYNC(mp, MNT_WAIT, context);
 222                         if (retval && ((cmdflags & MNT_FORCE) == 0))
 223                                 goto out;
 224
 225                         flags = WRITECLOSE;
 226                         if (cmdflags & MNT_FORCE)
 227                                 flags |= FORCECLOSE;
 228
 229                         if ((retval = hfs_flushfiles(mp, flags, p)))
 230                                 goto out;
 231                         hfsmp->hfs_flags |= HFS_READ_ONLY;
 232                         retval = hfs_flushvolumeheader(hfsmp, MNT_WAIT, 0);
 233
 234                         /* also get the volume bitmap blocks */
 235                         if (!retval) {
 236                                 if (vnode_mount(hfsmp->hfs_devvp) == mp) {
 237                                         retval = hfs_fsync(hfsmp->hfs_devvp, MNT_WAIT, 0, p);
 238                                 } else {
 239                                         vnode_get(hfsmp->hfs_devvp);
 240                                         retval = VNOP_FSYNC(hfsmp->hfs_devvp, MNT_WAIT, context);
 241                                         vnode_put(hfsmp->hfs_devvp);
 242                                 }
 243                         }
 244                         if (retval) {
 245                                 hfsmp->hfs_flags &= ~HFS_READ_ONLY;
 246                                 goto out;
 247                         }
 248                         if (hfsmp->jnl) {
 249                             hfs_global_exclusive_lock_acquire(hfsmp);
 250
 251                             journal_close(hfsmp->jnl);
 252                             hfsmp->jnl = NULL;
 253
 254                             // Note: we explicitly don't want to shutdown
 255                             //       access to the jvp because we may need
 256                             //       it later if we go back to being read-write.
 257
 258                             hfs_global_exclusive_lock_release(hfsmp);
 259                         }
 260                 }
 261
 262                 /* Change to a writable file system. */
 263                 if (vfs_iswriteupgrade(mp)) {
 264
 265                         /*
 266                          * On inconsistent disks, do not allow read-write mount
 267                          * unless it is the boot volume being mounted.
 268                          */
 269                         if (!(vfs_flags(mp) & MNT_ROOTFS) &&
 270                                         (hfsmp->vcbAtrb & kHFSVolumeInconsistentMask)) {
 271                                 retval = EINVAL;
 272                                 goto out;
 273                         }
 274
 275
 276                         retval = hfs_flushvolumeheader(hfsmp, MNT_WAIT, 0);
 277                         if (retval != E_NONE)
 278                                 goto out;
 279
 280                         // If the journal was shut-down previously because we were
 281                         // asked to be read-only, let's start it back up again now
 282
 283                         if (   (HFSTOVCB(hfsmp)->vcbAtrb & kHFSVolumeJournaledMask)
 284                             && hfsmp->jnl == NULL
 285                             && hfsmp->jvp != NULL) {
 286                             int jflags;
 287
 288                             if (hfsmp->hfs_flags & HFS_NEED_JNL_RESET) {
 289                                         jflags = JOURNAL_RESET;
 290                             } else {
 291                                         jflags = 0;
 292                             }
 293
 294                             hfs_global_exclusive_lock_acquire(hfsmp);
 295
 296                             hfsmp->jnl = journal_open(hfsmp->jvp,
 297                                                       (hfsmp->jnl_start * HFSTOVCB(hfsmp)->blockSize) + (off_t)HFSTOVCB(hfsmp)->hfsPlusIOPosOffset,
 298                                                       hfsmp->jnl_size,
 299                                                       hfsmp->hfs_devvp,
 300                                                       hfsmp->hfs_phys_block_size,
 301                                                       jflags,
 302                                                       0,
 303                                                       hfs_sync_metadata, hfsmp->hfs_mp);
 304
 305                             hfs_global_exclusive_lock_release(hfsmp);
 306
 307                             if (hfsmp->jnl == NULL) {
 308                                 retval = EINVAL;
 309                                 goto out;
 310                             } else {
 311                                 hfsmp->hfs_flags &= ~HFS_NEED_JNL_RESET;
 312                             }
 313
 314                         }
 315
 316                         /* Only clear HFS_READ_ONLY after a successfull write */
 317                         hfsmp->hfs_flags &= ~HFS_READ_ONLY;
 318
 319                         if (!(hfsmp->hfs_flags & (HFS_READ_ONLY & HFS_STANDARD))) {
 320                                 /* Setup private/hidden directories for hardlinks. */
 321                                 hfs_privatedir_init(hfsmp, FILE_HARDLINKS);
 322                                 hfs_privatedir_init(hfsmp, DIR_HARDLINKS);
 323
 324                                 hfs_remove_orphans(hfsmp);
 325
 326                                 /*
 327                                  * Allow hot file clustering if conditions allow.
 328                                  */
 329                                 if (hfsmp->hfs_flags & HFS_METADATA_ZONE) {
 330                                         (void) hfs_recording_init(hfsmp);
 331                                 }
 332                                 /* Force ACLs on HFS+ file systems. */
 333                                 if (vfs_extendedsecurity(HFSTOVFS(hfsmp)) == 0) {
 334                                         vfs_setextendedsecurity(HFSTOVFS(hfsmp));
 335                                 }
 336                         }
 337                 }
 338
 339                 /* Update file system parameters. */
 340                 retval = hfs_changefs(mp, &args);
 341
 342         } else /* not an update request */ {
 343
 344                 /* Set the mount flag to indicate that we support volfs  */
 345                 vfs_setflags(mp, (u_int64_t)((unsigned int)MNT_DOVOLFS));
 346
 347                 hfs_chashinit_finish();
 348
 349                 retval = hfs_mountfs(devvp, mp, &args, 0, context);
 350         }
 351 out:
 352         if (retval == 0) {
 353                 (void)hfs_statfs(mp, vfs_statfs(mp), context);
 354         }
 355         return (retval);
 356 }
 357
 358
 359 struct hfs_changefs_cargs {
 360         struct hfsmount *hfsmp;
 361         int             namefix;
 362         int             permfix;
 363         int             permswitch;
 364 };
 365
 366 static int
 367 hfs_changefs_callback(struct vnode *vp, void *cargs)
 368 {
 369         ExtendedVCB *vcb;
 370         struct cnode *cp;
 371         struct cat_desc cndesc;
 372         struct cat_attr cnattr;
 373         struct hfs_changefs_cargs *args;
 374
 375         args = (struct hfs_changefs_cargs *)cargs;
 376
 377         cp = VTOC(vp);
 378         vcb = HFSTOVCB(args->hfsmp);
 379
 380         if (cat_lookup(args->hfsmp, &cp->c_desc, 0, &cndesc, &cnattr, NULL, NULL)) {
 381                 /*
 382                  * If we couldn't find this guy skip to the next one
 383                  */
 384                 if (args->namefix)
 385                         cache_purge(vp);
 386
 387                 return (VNODE_RETURNED);
 388         }
 389         /*
 390          * Get the real uid/gid and perm mask from disk.
 391          */
 392         if (args->permswitch || args->permfix) {
 393                 cp->c_uid = cnattr.ca_uid;
 394                 cp->c_gid = cnattr.ca_gid;
 395                 cp->c_mode = cnattr.ca_mode;
 396         }
 397         /*
 398          * If we're switching name converters then...
 399          *   Remove the existing entry from the namei cache.
 400          *   Update name to one based on new encoder.
 401          */
 402         if (args->namefix) {
 403                 cache_purge(vp);
 404                 replace_desc(cp, &cndesc);
 405
 406                 if (cndesc.cd_cnid == kHFSRootFolderID) {
 407                         strlcpy((char *)vcb->vcbVN, (const char *)cp->c_desc.cd_nameptr, NAME_MAX+1);
 408                         cp->c_desc.cd_encoding = args->hfsmp->hfs_encoding;
 409                 }
 410         } else {
 411                 cat_releasedesc(&cndesc);
 412         }
 413         return (VNODE_RETURNED);
 414 }
 415
 416 /* Change fs mount parameters */
 417 static int
 418 hfs_changefs(struct mount *mp, struct hfs_mount_args *args)
 419 {
 420         int retval = 0;
 421         int namefix, permfix, permswitch;
 422         struct hfsmount *hfsmp;
 423         ExtendedVCB *vcb;
 424         hfs_to_unicode_func_t   get_unicode_func;
 425         unicode_to_hfs_func_t   get_hfsname_func;
 426         u_long old_encoding = 0;
 427         struct hfs_changefs_cargs cargs;
 428         u_int32_t mount_flags;
 429
 430         hfsmp = VFSTOHFS(mp);
 431         vcb = HFSTOVCB(hfsmp);
 432         mount_flags = (unsigned int)vfs_flags(mp);
 433
 434         permswitch = (((hfsmp->hfs_flags & HFS_UNKNOWN_PERMS) &&
 435                        ((mount_flags & MNT_UNKNOWNPERMISSIONS) == 0)) ||
 436                       (((hfsmp->hfs_flags & HFS_UNKNOWN_PERMS) == 0) &&
 437                        (mount_flags & MNT_UNKNOWNPERMISSIONS)));
 438
 439         /* The root filesystem must operate with actual permissions: */
 440         if (permswitch && (mount_flags & MNT_ROOTFS) && (mount_flags & MNT_UNKNOWNPERMISSIONS)) {
 441                 vfs_clearflags(mp, (u_int64_t)((unsigned int)MNT_UNKNOWNPERMISSIONS));  /* Just say "No". */
 442                 return EINVAL;
 443         }
 444         if (mount_flags & MNT_UNKNOWNPERMISSIONS)
 445                 hfsmp->hfs_flags |= HFS_UNKNOWN_PERMS;
 446         else
 447                 hfsmp->hfs_flags &= ~HFS_UNKNOWN_PERMS;
 448
 449         namefix = permfix = 0;
 450
 451         /*
 452          * Tracking of hot files requires up-to-date access times.  So if
 453          * access time updates are disabled, we must also disable hot files.
 454          */
 455         if (mount_flags & MNT_NOATIME) {
 456                 (void) hfs_recording_suspend(hfsmp);
 457         }
 458
 459         /* Change the timezone (Note: this affects all hfs volumes and hfs+ volume create dates) */
 460         if (args->hfs_timezone.tz_minuteswest != VNOVAL) {
 461                 gTimeZone = args->hfs_timezone;
 462         }
 463
 464         /* Change the default uid, gid and/or mask */
 465         if ((args->hfs_uid != (uid_t)VNOVAL) && (hfsmp->hfs_uid != args->hfs_uid)) {
 466                 hfsmp->hfs_uid = args->hfs_uid;
 467                 if (vcb->vcbSigWord == kHFSPlusSigWord)
 468                         ++permfix;
 469         }
 470         if ((args->hfs_gid != (gid_t)VNOVAL) && (hfsmp->hfs_gid != args->hfs_gid)) {
 471                 hfsmp->hfs_gid = args->hfs_gid;
 472                 if (vcb->vcbSigWord == kHFSPlusSigWord)
 473                         ++permfix;
 474         }
 475         if (args->hfs_mask != (mode_t)VNOVAL) {
 476                 if (hfsmp->hfs_dir_mask != (args->hfs_mask & ALLPERMS)) {
 477                         hfsmp->hfs_dir_mask = args->hfs_mask & ALLPERMS;
 478                         hfsmp->hfs_file_mask = args->hfs_mask & ALLPERMS;
 479                         if ((args->flags != VNOVAL) && (args->flags & HFSFSMNT_NOXONFILES))
 480                                 hfsmp->hfs_file_mask = (args->hfs_mask & DEFFILEMODE);
 481                         if (vcb->vcbSigWord == kHFSPlusSigWord)
 482                                 ++permfix;
 483                 }
 484         }
 485
 486         /* Change the hfs encoding value (hfs only) */
 487         if ((vcb->vcbSigWord == kHFSSigWord)    &&
 488             (args->hfs_encoding != (u_long)VNOVAL)              &&
 489             (hfsmp->hfs_encoding != args->hfs_encoding)) {
 490
 491                 retval = hfs_getconverter(args->hfs_encoding, &get_unicode_func, &get_hfsname_func);
 492                 if (retval)
 493                         goto exit;
 494
 495                 /*
 496                  * Connect the new hfs_get_unicode converter but leave
 497                  * the old hfs_get_hfsname converter in place so that
 498                  * we can lookup existing vnodes to get their correctly
 499                  * encoded names.
 500                  *
 501                  * When we're all finished, we can then connect the new
 502                  * hfs_get_hfsname converter and release our interest
 503                  * in the old converters.
 504                  */
 505                 hfsmp->hfs_get_unicode = get_unicode_func;
 506                 old_encoding = hfsmp->hfs_encoding;
 507                 hfsmp->hfs_encoding = args->hfs_encoding;
 508                 ++namefix;
 509         }
 510
 511         if (!(namefix || permfix || permswitch))
 512                 goto exit;
 513
 514         /* XXX 3762912 hack to support HFS filesystem 'owner' */
 515         if (permfix)
 516                 vfs_setowner(mp,
 517                     hfsmp->hfs_uid == UNKNOWNUID ? KAUTH_UID_NONE : hfsmp->hfs_uid,
 518                     hfsmp->hfs_gid == UNKNOWNGID ? KAUTH_GID_NONE : hfsmp->hfs_gid);
 519
 520         /*
 521          * For each active vnode fix things that changed
 522          *
 523          * Note that we can visit a vnode more than once
 524          * and we can race with fsync.
 525          *
 526          * hfs_changefs_callback will be called for each vnode
 527          * hung off of this mount point
 528          * the vnode will be
 529          * properly referenced and unreferenced around the callback
 530          */
 531         cargs.hfsmp = hfsmp;
 532         cargs.namefix = namefix;
 533         cargs.permfix = permfix;
 534         cargs.permswitch = permswitch;
 535
 536         vnode_iterate(mp, 0, hfs_changefs_callback, (void *)&cargs);
 537
 538         /*
 539          * If we're switching name converters we can now
 540          * connect the new hfs_get_hfsname converter and
 541          * release our interest in the old converters.
 542          */
 543         if (namefix) {
 544                 hfsmp->hfs_get_hfsname = get_hfsname_func;
 545                 vcb->volumeNameEncodingHint = args->hfs_encoding;
 546                 (void) hfs_relconverter(old_encoding);
 547         }
 548 exit:
 549         return (retval);
 550 }
 551
 552
 553 struct hfs_reload_cargs {
 554         struct hfsmount *hfsmp;
 555         int             error;
 556 };
 557
 558 static int
 559 hfs_reload_callback(struct vnode *vp, void *cargs)
 560 {
 561         struct cnode *cp;
 562         struct hfs_reload_cargs *args;
 563
 564         args = (struct hfs_reload_cargs *)cargs;
 565         /*
 566          * flush all the buffers associated with this node
 567          */
 568         (void) buf_invalidateblks(vp, 0, 0, 0);
 569
 570         cp = VTOC(vp);
 571         /*
 572          * Remove any directory hints
 573          */
 574         if (vnode_isdir(vp))
 575                 hfs_reldirhints(cp, 0);
 576
 577         /*
 578          * Re-read cnode data for all active vnodes (non-metadata files).
 579          */
 580         if (!vnode_issystem(vp) && !VNODE_IS_RSRC(vp)) {
 581                 struct cat_fork *datafork;
 582                 struct cat_desc desc;
 583
 584                 datafork = cp->c_datafork ? &cp->c_datafork->ff_data : NULL;
 585
 586                 /* lookup by fileID since name could have changed */
 587                 if ((args->error = cat_idlookup(args->hfsmp, cp->c_fileid, 0, &desc, &cp->c_attr, datafork)))
 588                         return (VNODE_RETURNED_DONE);
 589
 590                 /* update cnode's catalog descriptor */
 591                 (void) replace_desc(cp, &desc);
 592         }
 593         return (VNODE_RETURNED);
 594 }
 595
 596 /*
 597  * Reload all incore data for a filesystem (used after running fsck on
 598  * the root filesystem and finding things to fix). The filesystem must
 599  * be mounted read-only.
 600  *
 601  * Things to do to update the mount:
 602  *      invalidate all cached meta-data.
 603  *      invalidate all inactive vnodes.
 604  *      invalidate all cached file data.
 605  *      re-read volume header from disk.
 606  *      re-load meta-file info (extents, file size).
 607  *      re-load B-tree header data.
 608  *      re-read cnode data for all active vnodes.
 609  */
 610 static int
 611 hfs_reload(struct mount *mountp)
 612 {
 613         register struct vnode *devvp;
 614         struct buf *bp;
 615         int sectorsize;
 616         int error, i;
 617         struct hfsmount *hfsmp;
 618         struct HFSPlusVolumeHeader *vhp;
 619         ExtendedVCB *vcb;
 620         struct filefork *forkp;
 621         struct cat_desc cndesc;
 622         struct hfs_reload_cargs args;
 623
 624         hfsmp = VFSTOHFS(mountp);
 625         vcb = HFSTOVCB(hfsmp);
 626
 627         if (vcb->vcbSigWord == kHFSSigWord)
 628                 return (EINVAL);        /* rooting from HFS is not supported! */
 629
 630         /*
 631          * Invalidate all cached meta-data.
 632          */
 633         devvp = hfsmp->hfs_devvp;
 634         if (buf_invalidateblks(devvp, 0, 0, 0))
 635                 panic("hfs_reload: dirty1");
 636
 637         args.hfsmp = hfsmp;
 638         args.error = 0;
 639         /*
 640          * hfs_reload_callback will be called for each vnode
 641          * hung off of this mount point that can't be recycled...
 642          * vnode_iterate will recycle those that it can (the VNODE_RELOAD option)
 643          * the vnode will be in an 'unbusy' state (VNODE_WAIT) and
 644          * properly referenced and unreferenced around the callback
 645          */
 646         vnode_iterate(mountp, VNODE_RELOAD | VNODE_WAIT, hfs_reload_callback, (void *)&args);
 647
 648         if (args.error)
 649                 return (args.error);
 650
 651         /*
 652          * Re-read VolumeHeader from disk.
 653          */
 654         sectorsize = hfsmp->hfs_phys_block_size;
 655
 656         error = (int)buf_meta_bread(hfsmp->hfs_devvp,
 657                         (daddr64_t)((vcb->hfsPlusIOPosOffset / sectorsize) + HFS_PRI_SECTOR(sectorsize)),
 658                         sectorsize, NOCRED, &bp);
 659         if (error) {
 660                 if (bp != NULL)
 661                         buf_brelse(bp);
 662                 return (error);
 663         }
 664
 665         vhp = (HFSPlusVolumeHeader *) (buf_dataptr(bp) + HFS_PRI_OFFSET(sectorsize));
 666
 667         /* Do a quick sanity check */
 668         if ((SWAP_BE16(vhp->signature) != kHFSPlusSigWord &&
 669              SWAP_BE16(vhp->signature) != kHFSXSigWord) ||
 670             (SWAP_BE16(vhp->version) != kHFSPlusVersion &&
 671              SWAP_BE16(vhp->version) != kHFSXVersion) ||
 672             SWAP_BE32(vhp->blockSize) != vcb->blockSize) {
 673                 buf_brelse(bp);
 674                 return (EIO);
 675         }
 676
 677         vcb->vcbLsMod           = to_bsd_time(SWAP_BE32(vhp->modifyDate));
 678         vcb->vcbAtrb            = SWAP_BE32 (vhp->attributes);
 679         vcb->vcbJinfoBlock  = SWAP_BE32(vhp->journalInfoBlock);
 680         vcb->vcbClpSiz          = SWAP_BE32 (vhp->rsrcClumpSize);
 681         vcb->vcbNxtCNID         = SWAP_BE32 (vhp->nextCatalogID);
 682         vcb->vcbVolBkUp         = to_bsd_time(SWAP_BE32(vhp->backupDate));
 683         vcb->vcbWrCnt           = SWAP_BE32 (vhp->writeCount);
 684         vcb->vcbFilCnt          = SWAP_BE32 (vhp->fileCount);
 685         vcb->vcbDirCnt          = SWAP_BE32 (vhp->folderCount);
 686         HFS_UPDATE_NEXT_ALLOCATION(vcb, SWAP_BE32 (vhp->nextAllocation));
 687         vcb->totalBlocks        = SWAP_BE32 (vhp->totalBlocks);
 688         vcb->freeBlocks         = SWAP_BE32 (vhp->freeBlocks);
 689         vcb->encodingsBitmap    = SWAP_BE64 (vhp->encodingsBitmap);
 690         bcopy(vhp->finderInfo, vcb->vcbFndrInfo, sizeof(vhp->finderInfo));
 691         vcb->localCreateDate    = SWAP_BE32 (vhp->createDate); /* hfs+ create date is in local time */
 692
 693         /*
 694          * Re-load meta-file vnode data (extent info, file size, etc).
 695          */
 696         forkp = VTOF((struct vnode *)vcb->extentsRefNum);
 697         for (i = 0; i < kHFSPlusExtentDensity; i++) {
 698                 forkp->ff_extents[i].startBlock =
 699                         SWAP_BE32 (vhp->extentsFile.extents[i].startBlock);
 700                 forkp->ff_extents[i].blockCount =
 701                         SWAP_BE32 (vhp->extentsFile.extents[i].blockCount);
 702         }
 703         forkp->ff_size      = SWAP_BE64 (vhp->extentsFile.logicalSize);
 704         forkp->ff_blocks    = SWAP_BE32 (vhp->extentsFile.totalBlocks);
 705         forkp->ff_clumpsize = SWAP_BE32 (vhp->extentsFile.clumpSize);
 706
 707
 708         forkp = VTOF((struct vnode *)vcb->catalogRefNum);
 709         for (i = 0; i < kHFSPlusExtentDensity; i++) {
 710                 forkp->ff_extents[i].startBlock =
 711                         SWAP_BE32 (vhp->catalogFile.extents[i].startBlock);
 712                 forkp->ff_extents[i].blockCount =
 713                         SWAP_BE32 (vhp->catalogFile.extents[i].blockCount);
 714         }
 715         forkp->ff_size      = SWAP_BE64 (vhp->catalogFile.logicalSize);
 716         forkp->ff_blocks    = SWAP_BE32 (vhp->catalogFile.totalBlocks);
 717         forkp->ff_clumpsize = SWAP_BE32 (vhp->catalogFile.clumpSize);
 718
 719         if (hfsmp->hfs_attribute_vp) {
 720                 forkp = VTOF(hfsmp->hfs_attribute_vp);
 721                 for (i = 0; i < kHFSPlusExtentDensity; i++) {
 722                         forkp->ff_extents[i].startBlock =
 723                                 SWAP_BE32 (vhp->attributesFile.extents[i].startBlock);
 724                         forkp->ff_extents[i].blockCount =
 725                                 SWAP_BE32 (vhp->attributesFile.extents[i].blockCount);
 726                 }
 727                 forkp->ff_size      = SWAP_BE64 (vhp->attributesFile.logicalSize);
 728                 forkp->ff_blocks    = SWAP_BE32 (vhp->attributesFile.totalBlocks);
 729                 forkp->ff_clumpsize = SWAP_BE32 (vhp->attributesFile.clumpSize);
 730         }
 731
 732         forkp = VTOF((struct vnode *)vcb->allocationsRefNum);
 733         for (i = 0; i < kHFSPlusExtentDensity; i++) {
 734                 forkp->ff_extents[i].startBlock =
 735                         SWAP_BE32 (vhp->allocationFile.extents[i].startBlock);
 736                 forkp->ff_extents[i].blockCount =
 737                         SWAP_BE32 (vhp->allocationFile.extents[i].blockCount);
 738         }
 739         forkp->ff_size      = SWAP_BE64 (vhp->allocationFile.logicalSize);
 740         forkp->ff_blocks    = SWAP_BE32 (vhp->allocationFile.totalBlocks);
 741         forkp->ff_clumpsize = SWAP_BE32 (vhp->allocationFile.clumpSize);
 742
 743         buf_brelse(bp);
 744         vhp = NULL;
 745
 746         /*
 747          * Re-load B-tree header data
 748          */
 749         forkp = VTOF((struct vnode *)vcb->extentsRefNum);
 750         if ( (error = MacToVFSError( BTReloadData((FCB*)forkp) )) )
 751                 return (error);
 752
 753         forkp = VTOF((struct vnode *)vcb->catalogRefNum);
 754         if ( (error = MacToVFSError( BTReloadData((FCB*)forkp) )) )
 755                 return (error);
 756
 757         if (hfsmp->hfs_attribute_vp) {
 758                 forkp = VTOF(hfsmp->hfs_attribute_vp);
 759                 if ( (error = MacToVFSError( BTReloadData((FCB*)forkp) )) )
 760                         return (error);
 761         }
 762
 763         /* Reload the volume name */
 764         if ((error = cat_idlookup(hfsmp, kHFSRootFolderID, 0, &cndesc, NULL, NULL)))
 765                 return (error);
 766         vcb->volumeNameEncodingHint = cndesc.cd_encoding;
 767         bcopy(cndesc.cd_nameptr, vcb->vcbVN, min(255, cndesc.cd_namelen));
 768         cat_releasedesc(&cndesc);
 769
 770         /* Re-establish private/hidden directories. */
 771         hfs_privatedir_init(hfsmp, FILE_HARDLINKS);
 772         hfs_privatedir_init(hfsmp, DIR_HARDLINKS);
 773
 774         /* In case any volume information changed to trigger a notification */
 775         hfs_generate_volume_notifications(hfsmp);
 776
 777         return (0);
 778 }
 779
 780
 781 /*
 782  * Common code for mount and mountroot
 783  */
 784 static int
 785 hfs_mountfs(struct vnode *devvp, struct mount *mp, struct hfs_mount_args *args,
 786             int journal_replay_only, vfs_context_t context)
 787 {
 788         struct proc *p = vfs_context_proc(context);
 789         int retval = E_NONE;
 790         struct hfsmount *hfsmp;
 791         struct buf *bp;
 792         dev_t dev;
 793         HFSMasterDirectoryBlock *mdbp;
 794         int ronly;
 795 #if QUOTA
 796         int i;
 797 #endif
 798         int mntwrapper;
 799         kauth_cred_t cred;
 800         u_int64_t disksize;
 801         daddr64_t blkcnt;
 802         u_int32_t blksize;
 803         u_int32_t minblksize;
 804         u_int32_t iswritable;
 805         daddr64_t mdb_offset;
 806         int isvirtual = 0;
 807
 808         ronly = vfs_isrdonly(mp);
 809         dev = vnode_specrdev(devvp);
 810         cred = p ? vfs_context_ucred(context) : NOCRED;
 811         mntwrapper = 0;
 812
 813         bp = NULL;
 814         hfsmp = NULL;
 815         mdbp = NULL;
 816         minblksize = kHFSBlockSize;
 817
 818         /* Advisory locking should be handled at the VFS layer */
 819         vfs_setlocklocal(mp);
 820
 821         /* Get the real physical block size. */
 822         if (VNOP_IOCTL(devvp, DKIOCGETBLOCKSIZE, (caddr_t)&blksize, 0, context)) {
 823                 retval = ENXIO;
 824                 goto error_exit;
 825         }
 826         /* Switch to 512 byte sectors (temporarily) */
 827         if (blksize > 512) {
 828                 u_int32_t size512 = 512;
 829
 830                 if (VNOP_IOCTL(devvp, DKIOCSETBLOCKSIZE, (caddr_t)&size512, FWRITE, context)) {
 831                         retval = ENXIO;
 832                         goto error_exit;
 833                 }
 834         }
 835         /* Get the number of 512 byte physical blocks. */
 836         if (VNOP_IOCTL(devvp, DKIOCGETBLOCKCOUNT, (caddr_t)&blkcnt, 0, context)) {
 837                 /* resetting block size may fail if getting block count did */
 838                 (void)VNOP_IOCTL(devvp, DKIOCSETBLOCKSIZE, (caddr_t)&blksize, FWRITE, context);
 839
 840                 retval = ENXIO;
 841                 goto error_exit;
 842         }
 843         /* Compute an accurate disk size (i.e. within 512 bytes) */
 844         disksize = (u_int64_t)blkcnt * (u_int64_t)512;
 845
 846         /*
 847          * On Tiger it is not necessary to switch the device
 848          * block size to be 4k if there are more than 31-bits
 849          * worth of blocks but to insure compatibility with
 850          * pre-Tiger systems we have to do it.
 851          */
 852         if (blkcnt > 0x000000007fffffff) {
 853                 minblksize = blksize = 4096;
 854         }
 855
 856         /* Now switch to our preferred physical block size. */
 857         if (blksize > 512) {
 858                 if (VNOP_IOCTL(devvp, DKIOCSETBLOCKSIZE, (caddr_t)&blksize, FWRITE, context)) {
 859                         retval = ENXIO;
 860                         goto error_exit;
 861                 }
 862                 /* Get the count of physical blocks. */
 863                 if (VNOP_IOCTL(devvp, DKIOCGETBLOCKCOUNT, (caddr_t)&blkcnt, 0, context)) {
 864                         retval = ENXIO;
 865                         goto error_exit;
 866                 }
 867         }
 868         /*
 869          * At this point:
 870          *   minblksize is the minimum physical block size
 871          *   blksize has our preferred physical block size
 872          *   blkcnt has the total number of physical blocks
 873          */
 874
 875         mdb_offset = (daddr64_t)HFS_PRI_SECTOR(blksize);
 876         if ((retval = (int)buf_meta_bread(devvp, mdb_offset, blksize, cred, &bp))) {
 877                 goto error_exit;
 878         }
 879         MALLOC(mdbp, HFSMasterDirectoryBlock *, kMDBSize, M_TEMP, M_WAITOK);
 880         bcopy((char *)buf_dataptr(bp) + HFS_PRI_OFFSET(blksize), mdbp, kMDBSize);
 881         buf_brelse(bp);
 882         bp = NULL;
 883
 884         MALLOC(hfsmp, struct hfsmount *, sizeof(struct hfsmount), M_HFSMNT, M_WAITOK);
 885         bzero(hfsmp, sizeof(struct hfsmount));
 886
 887         /*
 888          *  Init the volume information structure
 889          */
 890
 891         lck_mtx_init(&hfsmp->hfs_mutex, hfs_mutex_group, hfs_lock_attr);
 892         lck_mtx_init(&hfsmp->hfc_mutex, hfs_mutex_group, hfs_lock_attr);
 893         lck_rw_init(&hfsmp->hfs_global_lock, hfs_rwlock_group, hfs_lock_attr);
 894         lck_rw_init(&hfsmp->hfs_insync, hfs_rwlock_group, hfs_lock_attr);
 895
 896         vfs_setfsprivate(mp, hfsmp);
 897         hfsmp->hfs_mp = mp;                     /* Make VFSTOHFS work */
 898         hfsmp->hfs_raw_dev = vnode_specrdev(devvp);
 899         hfsmp->hfs_devvp = devvp;
 900         vnode_ref(devvp);  /* Hold a ref on the device, dropped when hfsmp is freed. */
 901         hfsmp->hfs_phys_block_size = blksize;
 902         hfsmp->hfs_phys_block_count = blkcnt;
 903         hfsmp->hfs_flags |= HFS_WRITEABLE_MEDIA;
 904         if (ronly)
 905                 hfsmp->hfs_flags |= HFS_READ_ONLY;
 906         if (((unsigned int)vfs_flags(mp)) & MNT_UNKNOWNPERMISSIONS)
 907                 hfsmp->hfs_flags |= HFS_UNKNOWN_PERMS;
 908
 909 #if QUOTA
 910         for (i = 0; i < MAXQUOTAS; i++)
 911                 dqfileinit(&hfsmp->hfs_qfiles[i]);
 912 #endif
 913
 914         if (args) {
 915                 hfsmp->hfs_uid = (args->hfs_uid == (uid_t)VNOVAL) ? UNKNOWNUID : args->hfs_uid;
 916                 if (hfsmp->hfs_uid == 0xfffffffd) hfsmp->hfs_uid = UNKNOWNUID;
 917                 hfsmp->hfs_gid = (args->hfs_gid == (gid_t)VNOVAL) ? UNKNOWNGID : args->hfs_gid;
 918                 if (hfsmp->hfs_gid == 0xfffffffd) hfsmp->hfs_gid = UNKNOWNGID;
 919                 vfs_setowner(mp, hfsmp->hfs_uid, hfsmp->hfs_gid);                               /* tell the VFS */
 920                 if (args->hfs_mask != (mode_t)VNOVAL) {
 921                         hfsmp->hfs_dir_mask = args->hfs_mask & ALLPERMS;
 922                         if (args->flags & HFSFSMNT_NOXONFILES) {
 923                                 hfsmp->hfs_file_mask = (args->hfs_mask & DEFFILEMODE);
 924                         } else {
 925                                 hfsmp->hfs_file_mask = args->hfs_mask & ALLPERMS;
 926                         }
 927                 } else {
 928                         hfsmp->hfs_dir_mask = UNKNOWNPERMISSIONS & ALLPERMS;            /* 0777: rwx---rwx */
 929                         hfsmp->hfs_file_mask = UNKNOWNPERMISSIONS & DEFFILEMODE;        /* 0666: no --x by default? */
 930                 }
 931                 if ((args->flags != (int)VNOVAL) && (args->flags & HFSFSMNT_WRAPPER))
 932                         mntwrapper = 1;
 933         } else {
 934                 /* Even w/o explicit mount arguments, MNT_UNKNOWNPERMISSIONS requires setting up uid, gid, and mask: */
 935                 if (((unsigned int)vfs_flags(mp)) & MNT_UNKNOWNPERMISSIONS) {
 936                         hfsmp->hfs_uid = UNKNOWNUID;
 937                         hfsmp->hfs_gid = UNKNOWNGID;
 938                         vfs_setowner(mp, hfsmp->hfs_uid, hfsmp->hfs_gid);                       /* tell the VFS */
 939                         hfsmp->hfs_dir_mask = UNKNOWNPERMISSIONS & ALLPERMS;            /* 0777: rwx---rwx */
 940                         hfsmp->hfs_file_mask = UNKNOWNPERMISSIONS & DEFFILEMODE;        /* 0666: no --x by default? */
 941                 }
 942         }
 943
 944         /* Find out if disk media is writable. */
 945         if (VNOP_IOCTL(devvp, DKIOCISWRITABLE, (caddr_t)&iswritable, 0, context) == 0) {
 946                 if (iswritable)
 947                         hfsmp->hfs_flags |= HFS_WRITEABLE_MEDIA;
 948                 else
 949                         hfsmp->hfs_flags &= ~HFS_WRITEABLE_MEDIA;
 950         }
 951
 952         // record the current time at which we're mounting this volume
 953         struct timeval tv;
 954         microtime(&tv);
 955         hfsmp->hfs_mount_time = tv.tv_sec;
 956
 957         /* Mount a standard HFS disk */
 958         if ((SWAP_BE16(mdbp->drSigWord) == kHFSSigWord) &&
 959             (mntwrapper || (SWAP_BE16(mdbp->drEmbedSigWord) != kHFSPlusSigWord))) {
 960
 961                 /* If only journal replay is requested, exit immediately */
 962                 if (journal_replay_only) {
 963                         retval = 0;
 964                         goto error_exit;
 965                 }
 966
 967                 if ((vfs_flags(mp) & MNT_ROOTFS)) {
 968                         retval = EINVAL;  /* Cannot root from HFS standard disks */
 969                         goto error_exit;
 970                 }
 971                 /* HFS disks can only use 512 byte physical blocks */
 972                 if (blksize > kHFSBlockSize) {
 973                         blksize = kHFSBlockSize;
 974                         if (VNOP_IOCTL(devvp, DKIOCSETBLOCKSIZE, (caddr_t)&blksize, FWRITE, context)) {
 975                                 retval = ENXIO;
 976                                 goto error_exit;
 977                         }
 978                         if (VNOP_IOCTL(devvp, DKIOCGETBLOCKCOUNT, (caddr_t)&blkcnt, 0, context)) {
 979                                 retval = ENXIO;
 980                                 goto error_exit;
 981                         }
 982                         hfsmp->hfs_phys_block_size = blksize;
 983                         hfsmp->hfs_phys_block_count = blkcnt;
 984                 }
 985                 if (args) {
 986                         hfsmp->hfs_encoding = args->hfs_encoding;
 987                         HFSTOVCB(hfsmp)->volumeNameEncodingHint = args->hfs_encoding;
 988
 989                         /* establish the timezone */
 990                         gTimeZone = args->hfs_timezone;
 991                 }
 992
 993                 retval = hfs_getconverter(hfsmp->hfs_encoding, &hfsmp->hfs_get_unicode,
 994                                         &hfsmp->hfs_get_hfsname);
 995                 if (retval)
 996                         goto error_exit;
 997
 998                 retval = hfs_MountHFSVolume(hfsmp, mdbp, p);
 999                 if (retval)
1000                         (void) hfs_relconverter(hfsmp->hfs_encoding);
1001
1002         } else /* Mount an HFS Plus disk */ {
1003                 HFSPlusVolumeHeader *vhp;
1004                 off_t embeddedOffset;
1005                 int   jnl_disable = 0;
1006
1007                 /* Get the embedded Volume Header */
1008                 if (SWAP_BE16(mdbp->drEmbedSigWord) == kHFSPlusSigWord) {
1009                         embeddedOffset = SWAP_BE16(mdbp->drAlBlSt) * kHFSBlockSize;
1010                         embeddedOffset += (u_int64_t)SWAP_BE16(mdbp->drEmbedExtent.startBlock) *
1011                                           (u_int64_t)SWAP_BE32(mdbp->drAlBlkSiz);
1012
1013                         /*
1014                          * If the embedded volume doesn't start on a block
1015                          * boundary, then switch the device to a 512-byte
1016                          * block size so everything will line up on a block
1017                          * boundary.
1018                          */
1019                         if ((embeddedOffset % blksize) != 0) {
1020                                 printf("HFS Mount: embedded volume offset not"
1021                                     " a multiple of physical block size (%d);"
1022                                     " switching to 512\n", blksize);
1023                                 blksize = 512;
1024                                 if (VNOP_IOCTL(devvp, DKIOCSETBLOCKSIZE,
1025                                     (caddr_t)&blksize, FWRITE, context)) {
1026                                         retval = ENXIO;
1027                                         goto error_exit;
1028                                 }
1029                                 if (VNOP_IOCTL(devvp, DKIOCGETBLOCKCOUNT,
1030                                     (caddr_t)&blkcnt, 0, context)) {
1031                                         retval = ENXIO;
1032                                         goto error_exit;
1033                                 }
1034                                 /* Note: relative block count adjustment */
1035                                 hfsmp->hfs_phys_block_count *=
1036                                     hfsmp->hfs_phys_block_size / blksize;
1037                                 hfsmp->hfs_phys_block_size = blksize;
1038                         }
1039
1040                         disksize = (u_int64_t)SWAP_BE16(mdbp->drEmbedExtent.blockCount) *
1041                                    (u_int64_t)SWAP_BE32(mdbp->drAlBlkSiz);
1042
1043                         hfsmp->hfs_phys_block_count = disksize / blksize;
1044
1045                         mdb_offset = (daddr64_t)((embeddedOffset / blksize) + HFS_PRI_SECTOR(blksize));
1046                         retval = (int)buf_meta_bread(devvp, mdb_offset, blksize, cred, &bp);
1047                         if (retval)
1048                                 goto error_exit;
1049                         bcopy((char *)buf_dataptr(bp) + HFS_PRI_OFFSET(blksize), mdbp, 512);
1050                         buf_brelse(bp);
1051                         bp = NULL;
1052                         vhp = (HFSPlusVolumeHeader*) mdbp;
1053
1054                 } else /* pure HFS+ */ {
1055                         embeddedOffset = 0;
1056                         vhp = (HFSPlusVolumeHeader*) mdbp;
1057                 }
1058
1059                 /*
1060                  * On inconsistent disks, do not allow read-write mount
1061                  * unless it is the boot volume being mounted.
1062                  */
1063                 if (!(vfs_flags(mp) & MNT_ROOTFS) &&
1064                                 (SWAP_BE32(vhp->attributes) & kHFSVolumeInconsistentMask) &&
1065                                 !(hfsmp->hfs_flags & HFS_READ_ONLY)) {
1066                         retval = EINVAL;
1067                         goto error_exit;
1068                 }
1069
1070
1071                 // XXXdbg
1072                 //
1073                 hfsmp->jnl = NULL;
1074                 hfsmp->jvp = NULL;
1075                 if (args != NULL && (args->flags & HFSFSMNT_EXTENDED_ARGS) &&
1076                     args->journal_disable) {
1077                     jnl_disable = 1;
1078                 }
1079
1080                 //
1081                 // We only initialize the journal here if the last person
1082                 // to mount this volume was journaling aware.  Otherwise
1083                 // we delay journal initialization until later at the end
1084                 // of hfs_MountHFSPlusVolume() because the last person who
1085                 // mounted it could have messed things up behind our back
1086                 // (so we need to go find the .journal file, make sure it's
1087                 // the right size, re-sync up if it was moved, etc).
1088                 //
1089                 if (   (SWAP_BE32(vhp->lastMountedVersion) == kHFSJMountVersion)
1090                         && (SWAP_BE32(vhp->attributes) & kHFSVolumeJournaledMask)
1091                         && !jnl_disable) {
1092
1093                         // if we're able to init the journal, mark the mount
1094                         // point as journaled.
1095                         //
1096                         if (hfs_early_journal_init(hfsmp, vhp, args, embeddedOffset, mdb_offset, mdbp, cred) == 0) {
1097                                 vfs_setflags(mp, (u_int64_t)((unsigned int)MNT_JOURNALED));
1098                         } else {
1099                                 // if the journal failed to open, then set the lastMountedVersion
1100                                 // to be "FSK!" which fsck_hfs will see and force the fsck instead
1101                                 // of just bailing out because the volume is journaled.
1102                                 if (!ronly) {
1103                                     HFSPlusVolumeHeader *jvhp;
1104
1105                                     hfsmp->hfs_flags |= HFS_NEED_JNL_RESET;
1106
1107                                     if (mdb_offset == 0) {
1108                                         mdb_offset = (daddr64_t)((embeddedOffset / blksize) + HFS_PRI_SECTOR(blksize));
1109                                     }
1110
1111                                     bp = NULL;
1112                                     retval = (int)buf_meta_bread(devvp, mdb_offset, blksize, cred, &bp);
1113                                     if (retval == 0) {
1114                                         jvhp = (HFSPlusVolumeHeader *)(buf_dataptr(bp) + HFS_PRI_OFFSET(blksize));
1115
1116                                         if (SWAP_BE16(jvhp->signature) == kHFSPlusSigWord || SWAP_BE16(jvhp->signature) == kHFSXSigWord) {
1117                                                 printf ("hfs(1): Journal replay fail.  Writing lastMountVersion as FSK!\n");
1118                                             jvhp->lastMountedVersion = SWAP_BE32(kFSKMountVersion);
1119                                             buf_bwrite(bp);
1120                                         } else {
1121                                             buf_brelse(bp);
1122                                         }
1123                                         bp = NULL;
1124                                     } else if (bp) {
1125                                         buf_brelse(bp);
1126                                         // clear this so the error exit path won't try to use it
1127                                         bp = NULL;
1128                                     }
1129                                 }
1130
1131                                 // if this isn't the root device just bail out.
1132                                 // If it is the root device we just continue on
1133                                 // in the hopes that fsck_hfs will be able to
1134                                 // fix any damage that exists on the volume.
1135                                 if ( !(vfs_flags(mp) & MNT_ROOTFS)) {
1136                                     retval = EINVAL;
1137                                     goto error_exit;
1138                                 }
1139                         }
1140                 }
1141                 // XXXdbg
1142
1143                 /* Either the journal is replayed successfully, or there
1144                  * was nothing to replay, or no journal exists.  In any case,
1145                  * return success.
1146                  */
1147                 if (journal_replay_only) {
1148                         retval = 0;
1149                         goto error_exit;
1150                 }
1151
1152                 (void) hfs_getconverter(0, &hfsmp->hfs_get_unicode, &hfsmp->hfs_get_hfsname);
1153
1154                 retval = hfs_MountHFSPlusVolume(hfsmp, vhp, embeddedOffset, disksize, p, args, cred);
1155                 /*
1156                  * If the backend didn't like our physical blocksize
1157                  * then retry with physical blocksize of 512.
1158                  */
1159                 if ((retval == ENXIO) && (blksize > 512) && (blksize != minblksize)) {
1160                         printf("HFS Mount: could not use physical block size "
1161                                 "(%d) switching to 512\n", blksize);
1162                         blksize = 512;
1163                         if (VNOP_IOCTL(devvp, DKIOCSETBLOCKSIZE, (caddr_t)&blksize, FWRITE, context)) {
1164                                 retval = ENXIO;
1165                                 goto error_exit;
1166                         }
1167                         if (VNOP_IOCTL(devvp, DKIOCGETBLOCKCOUNT, (caddr_t)&blkcnt, 0, context)) {
1168                                 retval = ENXIO;
1169                                 goto error_exit;
1170                         }
1171                         devvp->v_specsize = blksize;
1172                         /* Note: relative block count adjustment (in case this is an embedded volume). */
1173                         hfsmp->hfs_phys_block_count *= hfsmp->hfs_phys_block_size / blksize;
1174                         hfsmp->hfs_phys_block_size = blksize;
1175
1176                         if (hfsmp->jnl) {
1177                             // close and re-open this with the new block size
1178                             journal_close(hfsmp->jnl);
1179                             hfsmp->jnl = NULL;
1180                             if (hfs_early_journal_init(hfsmp, vhp, args, embeddedOffset, mdb_offset, mdbp, cred) == 0) {
1181                                         vfs_setflags(mp, (u_int64_t)((unsigned int)MNT_JOURNALED));
1182                                 } else {
1183                                         // if the journal failed to open, then set the lastMountedVersion
1184                                         // to be "FSK!" which fsck_hfs will see and force the fsck instead
1185                                         // of just bailing out because the volume is journaled.
1186                                         if (!ronly) {
1187                                         HFSPlusVolumeHeader *jvhp;
1188
1189                                         hfsmp->hfs_flags |= HFS_NEED_JNL_RESET;
1190
1191                                         if (mdb_offset == 0) {
1192                                                         mdb_offset = (daddr64_t)((embeddedOffset / blksize) + HFS_PRI_SECTOR(blksize));
1193                                         }
1194
1195                                                 bp = NULL;
1196                                         retval = (int)buf_meta_bread(devvp, mdb_offset, blksize, cred, &bp);
1197                                         if (retval == 0) {
1198                                                         jvhp = (HFSPlusVolumeHeader *)(buf_dataptr(bp) + HFS_PRI_OFFSET(blksize));
1199
1200                                                         if (SWAP_BE16(jvhp->signature) == kHFSPlusSigWord || SWAP_BE16(jvhp->signature) == kHFSXSigWord) {
1201                                                                 printf ("hfs(2): Journal replay fail.  Writing lastMountVersion as FSK!\n");
1202                                                         jvhp->lastMountedVersion = SWAP_BE32(kFSKMountVersion);
1203                                                         buf_bwrite(bp);
1204                                                         } else {
1205                                                         buf_brelse(bp);
1206                                                         }
1207                                                         bp = NULL;
1208                                         } else if (bp) {
1209                                                         buf_brelse(bp);
1210                                                         // clear this so the error exit path won't try to use it
1211                                                         bp = NULL;
1212                                         }
1213                                         }
1214
1215                                         // if this isn't the root device just bail out.
1216                                         // If it is the root device we just continue on
1217                                         // in the hopes that fsck_hfs will be able to
1218                                         // fix any damage that exists on the volume.
1219                                         if ( !(vfs_flags(mp) & MNT_ROOTFS)) {
1220                                         retval = EINVAL;
1221                                         goto error_exit;
1222                                         }
1223                                 }
1224                         }
1225
1226                         /* Try again with a smaller block size... */
1227                         retval = hfs_MountHFSPlusVolume(hfsmp, vhp, embeddedOffset, disksize, p, args, cred);
1228                 }
1229                 if (retval)
1230                         (void) hfs_relconverter(0);
1231         }
1232
1233         // save off a snapshot of the mtime from the previous mount
1234         // (for matador).
1235         hfsmp->hfs_last_mounted_mtime = hfsmp->hfs_mtime;
1236
1237         if ( retval ) {
1238                 goto error_exit;
1239         }
1240
1241         mp->mnt_vfsstat.f_fsid.val[0] = (long)dev;
1242         mp->mnt_vfsstat.f_fsid.val[1] = vfs_typenum(mp);
1243         vfs_setmaxsymlen(mp, 0);
1244         mp->mnt_vtable->vfc_threadsafe = TRUE;
1245         mp->mnt_vtable->vfc_vfsflags |= VFC_VFSNATIVEXATTR;
1246 #if NAMEDSTREAMS
1247         mp->mnt_kern_flag |= MNTK_NAMED_STREAMS;
1248 #endif
1249         if (!(hfsmp->hfs_flags & HFS_STANDARD)) {
1250                 /* Tell VFS that we support directory hard links. */
1251                 mp->mnt_vtable->vfc_vfsflags |= VFC_VFSDIRLINKS;
1252         } else {
1253                 /* HFS standard doesn't support extended readdir! */
1254                 mp->mnt_vtable->vfc_vfsflags &= ~VFC_VFSREADDIR_EXTENDED;
1255         }
1256
1257         if (args) {
1258                 /*
1259                  * Set the free space warning levels for a non-root volume:
1260                  *
1261                  * Set the lower freespace limit (the level that will trigger a warning)
1262                  * to 5% of the volume size or 250MB, whichever is less, and the desired
1263                  * level (which will cancel the alert request) to 1/2 above that limit.
1264                  * Start looking for free space to drop below this level and generate a
1265                  * warning immediately if needed:
1266                  */
1267                 hfsmp->hfs_freespace_notify_warninglimit =
1268                         MIN(HFS_LOWDISKTRIGGERLEVEL / HFSTOVCB(hfsmp)->blockSize,
1269                                 (HFSTOVCB(hfsmp)->totalBlocks / 100) * HFS_LOWDISKTRIGGERFRACTION);
1270                 hfsmp->hfs_freespace_notify_desiredlevel =
1271                         MIN(HFS_LOWDISKSHUTOFFLEVEL / HFSTOVCB(hfsmp)->blockSize,
1272                                 (HFSTOVCB(hfsmp)->totalBlocks / 100) * HFS_LOWDISKSHUTOFFFRACTION);
1273         } else {
1274                 /*
1275                  * Set the free space warning levels for the root volume:
1276                  *
1277                  * Set the lower freespace limit (the level that will trigger a warning)
1278                  * to 1% of the volume size or 50MB, whichever is less, and the desired
1279                  * level (which will cancel the alert request) to 2% or 75MB, whichever is less.
1280                  */
1281                 hfsmp->hfs_freespace_notify_warninglimit =
1282                         MIN(HFS_ROOTLOWDISKTRIGGERLEVEL / HFSTOVCB(hfsmp)->blockSize,
1283                                 (HFSTOVCB(hfsmp)->totalBlocks / 100) * HFS_ROOTLOWDISKTRIGGERFRACTION);
1284                 hfsmp->hfs_freespace_notify_desiredlevel =
1285                         MIN(HFS_ROOTLOWDISKSHUTOFFLEVEL / HFSTOVCB(hfsmp)->blockSize,
1286                                 (HFSTOVCB(hfsmp)->totalBlocks / 100) * HFS_ROOTLOWDISKSHUTOFFFRACTION);
1287         };
1288
1289         /* Check if the file system exists on virtual device, like disk image */
1290         if (VNOP_IOCTL(devvp, DKIOCISVIRTUAL, (caddr_t)&isvirtual, 0, context) == 0) {
1291                 if (isvirtual) {
1292                         hfsmp->hfs_flags |= HFS_VIRTUAL_DEVICE;
1293                 }
1294         }
1295
1296         /*
1297          * Start looking for free space to drop below this level and generate a
1298          * warning immediately if needed:
1299          */
1300         hfsmp->hfs_notification_conditions = 0;
1301         hfs_generate_volume_notifications(hfsmp);
1302
1303         if (ronly == 0) {
1304                 (void) hfs_flushvolumeheader(hfsmp, MNT_WAIT, 0);
1305         }
1306         FREE(mdbp, M_TEMP);
1307         return (0);
1308
1309 error_exit:
1310         if (bp)
1311                 buf_brelse(bp);
1312         if (mdbp)
1313                 FREE(mdbp, M_TEMP);
1314
1315         if (hfsmp && hfsmp->jvp && hfsmp->jvp != hfsmp->hfs_devvp) {
1316             (void)VNOP_CLOSE(hfsmp->jvp, ronly ? FREAD : FREAD|FWRITE, context);
1317                 hfsmp->jvp = NULL;
1318         }
1319         if (hfsmp) {
1320                 if (hfsmp->hfs_devvp) {
1321                         vnode_rele(hfsmp->hfs_devvp);
1322                 }
1323                 FREE(hfsmp, M_HFSMNT);
1324                 vfs_setfsprivate(mp, NULL);
1325         }
1326         return (retval);
1327 }
1328
1329
1330 /*
1331  * Make a filesystem operational.
1332  * Nothing to do at the moment.
1333  */
1334 /* ARGSUSED */
1335 static int
1336 hfs_start(__unused struct mount *mp, __unused int flags, __unused vfs_context_t context)
1337 {
1338         return (0);
1339 }
1340
1341
1342 /*
1343  * unmount system call
1344  */
1345 static int
1346 hfs_unmount(struct mount *mp, int mntflags, vfs_context_t context)
1347 {
1348         struct proc *p = vfs_context_proc(context);
1349         struct hfsmount *hfsmp = VFSTOHFS(mp);
1350         int retval = E_NONE;
1351         int flags;
1352         int force;
1353         int started_tr = 0;
1354
1355         flags = 0;
1356         force = 0;
1357         if (mntflags & MNT_FORCE) {
1358                 flags |= FORCECLOSE;
1359                 force = 1;
1360         }
1361
1362         if ((retval = hfs_flushfiles(mp, flags, p)) && !force)
1363                 return (retval);
1364
1365         if (hfsmp->hfs_flags & HFS_METADATA_ZONE)
1366                 (void) hfs_recording_suspend(hfsmp);
1367
1368         /*
1369          * Flush out the b-trees, volume bitmap and Volume Header
1370          */
1371         if ((hfsmp->hfs_flags & HFS_READ_ONLY) == 0) {
1372                 retval = hfs_start_transaction(hfsmp);
1373                 if (retval == 0) {
1374                     started_tr = 1;
1375                 } else if (!force) {
1376                     goto err_exit;
1377                 }
1378
1379                 if (hfsmp->hfs_startup_vp) {
1380                         (void) hfs_lock(VTOC(hfsmp->hfs_startup_vp), HFS_EXCLUSIVE_LOCK);
1381                         retval = hfs_fsync(hfsmp->hfs_startup_vp, MNT_WAIT, 0, p);
1382                         hfs_unlock(VTOC(hfsmp->hfs_startup_vp));
1383                         if (retval && !force)
1384                                 goto err_exit;
1385                 }
1386
1387                 if (hfsmp->hfs_attribute_vp) {
1388                         (void) hfs_lock(VTOC(hfsmp->hfs_attribute_vp), HFS_EXCLUSIVE_LOCK);
1389                         retval = hfs_fsync(hfsmp->hfs_attribute_vp, MNT_WAIT, 0, p);
1390                         hfs_unlock(VTOC(hfsmp->hfs_attribute_vp));
1391                         if (retval && !force)
1392                                 goto err_exit;
1393                 }
1394
1395                 (void) hfs_lock(VTOC(hfsmp->hfs_catalog_vp), HFS_EXCLUSIVE_LOCK);
1396                 retval = hfs_fsync(hfsmp->hfs_catalog_vp, MNT_WAIT, 0, p);
1397                 hfs_unlock(VTOC(hfsmp->hfs_catalog_vp));
1398                 if (retval && !force)
1399                         goto err_exit;
1400
1401                 (void) hfs_lock(VTOC(hfsmp->hfs_extents_vp), HFS_EXCLUSIVE_LOCK);
1402                 retval = hfs_fsync(hfsmp->hfs_extents_vp, MNT_WAIT, 0, p);
1403                 hfs_unlock(VTOC(hfsmp->hfs_extents_vp));
1404                 if (retval && !force)
1405                         goto err_exit;
1406
1407                 if (hfsmp->hfs_allocation_vp) {
1408                         (void) hfs_lock(VTOC(hfsmp->hfs_allocation_vp), HFS_EXCLUSIVE_LOCK);
1409                         retval = hfs_fsync(hfsmp->hfs_allocation_vp, MNT_WAIT, 0, p);
1410                         hfs_unlock(VTOC(hfsmp->hfs_allocation_vp));
1411                         if (retval && !force)
1412                                 goto err_exit;
1413                 }
1414
1415                 if (hfsmp->hfc_filevp && vnode_issystem(hfsmp->hfc_filevp)) {
1416                         retval = hfs_fsync(hfsmp->hfc_filevp, MNT_WAIT, 0, p);
1417                         if (retval && !force)
1418                                 goto err_exit;
1419                 }
1420
1421                 /* If runtime corruption was detected, indicate that the volume
1422                  * was not unmounted cleanly.
1423                  */
1424                 if (hfsmp->vcbAtrb & kHFSVolumeInconsistentMask) {
1425                         HFSTOVCB(hfsmp)->vcbAtrb &= ~kHFSVolumeUnmountedMask;
1426                 } else {
1427                         HFSTOVCB(hfsmp)->vcbAtrb |= kHFSVolumeUnmountedMask;
1428                 }
1429
1430                 retval = hfs_flushvolumeheader(hfsmp, MNT_WAIT, 0);
1431                 if (retval) {
1432                         HFSTOVCB(hfsmp)->vcbAtrb &= ~kHFSVolumeUnmountedMask;
1433                         if (!force)
1434                                 goto err_exit;  /* could not flush everything */
1435                 }
1436
1437                 if (started_tr) {
1438                     hfs_end_transaction(hfsmp);
1439                     started_tr = 0;
1440                 }
1441         }
1442
1443         if (hfsmp->jnl) {
1444                 journal_flush(hfsmp->jnl);
1445         }
1446
1447         /*
1448          *      Invalidate our caches and release metadata vnodes
1449          */
1450         (void) hfsUnmount(hfsmp, p);
1451
1452         /*
1453          * Last chance to dump unreferenced system files.
1454          */
1455         (void) vflush(mp, NULLVP, FORCECLOSE);
1456
1457         if (HFSTOVCB(hfsmp)->vcbSigWord == kHFSSigWord)
1458                 (void) hfs_relconverter(hfsmp->hfs_encoding);
1459
1460         // XXXdbg
1461         if (hfsmp->jnl) {
1462             journal_close(hfsmp->jnl);
1463             hfsmp->jnl = NULL;
1464         }
1465
1466         VNOP_FSYNC(hfsmp->hfs_devvp, MNT_WAIT, context);
1467
1468         if (hfsmp->jvp && hfsmp->jvp != hfsmp->hfs_devvp) {
1469             retval = VNOP_CLOSE(hfsmp->jvp,
1470                                hfsmp->hfs_flags & HFS_READ_ONLY ? FREAD : FREAD|FWRITE,
1471                                context);
1472             vnode_put(hfsmp->jvp);
1473             hfsmp->jvp = NULL;
1474         }
1475         // XXXdbg
1476
1477 #ifdef HFS_SPARSE_DEV
1478         /* Drop our reference on the backing fs (if any). */
1479         if ((hfsmp->hfs_flags & HFS_HAS_SPARSE_DEVICE) && hfsmp->hfs_backingfs_rootvp) {
1480                 struct vnode * tmpvp;
1481
1482                 hfsmp->hfs_flags &= ~HFS_HAS_SPARSE_DEVICE;
1483                 tmpvp = hfsmp->hfs_backingfs_rootvp;
1484                 hfsmp->hfs_backingfs_rootvp = NULLVP;
1485                 vnode_rele(tmpvp);
1486         }
1487 #endif /* HFS_SPARSE_DEV */
1488         lck_mtx_destroy(&hfsmp->hfc_mutex, hfs_mutex_group);
1489         vnode_rele(hfsmp->hfs_devvp);
1490         FREE(hfsmp, M_HFSMNT);
1491
1492         return (0);
1493
1494   err_exit:
1495         if (started_tr) {
1496                 hfs_end_transaction(hfsmp);
1497         }
1498         return retval;
1499 }
1500
1501
1502 /*
1503  * Return the root of a filesystem.
1504  */
1505 static int
1506 hfs_vfs_root(struct mount *mp, struct vnode **vpp, __unused vfs_context_t context)
1507 {
1508         return hfs_vget(VFSTOHFS(mp), (cnid_t)kHFSRootFolderID, vpp, 1);
1509 }
1510
1511
1512 /*
1513  * Do operations associated with quotas
1514  */
1515 #if !QUOTA
1516 static int
1517 hfs_quotactl(__unused struct mount *mp, __unused int cmds, __unused uid_t uid, __unused caddr_t datap, __unused vfs_context_t context)
1518 {
1519         return (ENOTSUP);
1520 }
1521 #else
1522 static int
1523 hfs_quotactl(struct mount *mp, int cmds, uid_t uid, caddr_t datap, vfs_context_t context)
1524 {
1525         struct proc *p = vfs_context_proc(context);
1526         int cmd, type, error;
1527
1528         if (uid == ~0U)
1529                 uid = vfs_context_ucred(context)->cr_ruid;
1530         cmd = cmds >> SUBCMDSHIFT;
1531
1532         switch (cmd) {
1533         case Q_SYNC:
1534         case Q_QUOTASTAT:
1535                 break;
1536         case Q_GETQUOTA:
1537                 if (uid == vfs_context_ucred(context)->cr_ruid)
1538                         break;
1539                 /* fall through */
1540         default:
1541                 if ( (error = vfs_context_suser(context)) )
1542                         return (error);
1543         }
1544
1545         type = cmds & SUBCMDMASK;
1546         if ((u_int)type >= MAXQUOTAS)
1547                 return (EINVAL);
1548         if (vfs_busy(mp, LK_NOWAIT))
1549                 return (0);
1550
1551         switch (cmd) {
1552
1553         case Q_QUOTAON:
1554                 error = hfs_quotaon(p, mp, type, datap);
1555                 break;
1556
1557         case Q_QUOTAOFF:
1558                 error = hfs_quotaoff(p, mp, type);
1559                 break;
1560
1561         case Q_SETQUOTA:
1562                 error = hfs_setquota(mp, uid, type, datap);
1563                 break;
1564
1565         case Q_SETUSE:
1566                 error = hfs_setuse(mp, uid, type, datap);
1567                 break;
1568
1569         case Q_GETQUOTA:
1570                 error = hfs_getquota(mp, uid, type, datap);
1571                 break;
1572
1573         case Q_SYNC:
1574                 error = hfs_qsync(mp);
1575                 break;
1576
1577         case Q_QUOTASTAT:
1578                 error = hfs_quotastat(mp, type, datap);
1579                 break;
1580
1581         default:
1582                 error = EINVAL;
1583                 break;
1584         }
1585         vfs_unbusy(mp);
1586
1587         return (error);
1588 }
1589 #endif /* QUOTA */
1590
1591 /* Subtype is composite of bits */
1592 #define HFS_SUBTYPE_JOURNALED      0x01
1593 #define HFS_SUBTYPE_CASESENSITIVE  0x02
1594 /* bits 2 - 6 reserved */
1595 #define HFS_SUBTYPE_STANDARDHFS    0x80
1596
1597 /*
1598  * Get file system statistics.
1599  */
1600 static int
1601 hfs_statfs(struct mount *mp, register struct vfsstatfs *sbp, __unused vfs_context_t context)
1602 {
1603         ExtendedVCB *vcb = VFSTOVCB(mp);
1604         struct hfsmount *hfsmp = VFSTOHFS(mp);
1605         u_long freeCNIDs;
1606         u_int16_t subtype = 0;
1607
1608         freeCNIDs = (u_long)0xFFFFFFFF - (u_long)vcb->vcbNxtCNID;
1609
1610         sbp->f_bsize = (u_int32_t)vcb->blockSize;
1611         sbp->f_iosize = (size_t)(MAX_UPL_TRANSFER * PAGE_SIZE);
1612         sbp->f_blocks = (u_int64_t)((unsigned long)vcb->totalBlocks);
1613         sbp->f_bfree = (u_int64_t)((unsigned long )hfs_freeblks(hfsmp, 0));
1614         sbp->f_bavail = (u_int64_t)((unsigned long )hfs_freeblks(hfsmp, 1));
1615         sbp->f_files = (u_int64_t)((unsigned long )(vcb->totalBlocks - 2));  /* max files is constrained by total blocks */
1616         sbp->f_ffree = (u_int64_t)((unsigned long )(MIN(freeCNIDs, sbp->f_bavail)));
1617
1618         /*
1619          * Subtypes (flavors) for HFS
1620          *   0:   Mac OS Extended
1621          *   1:   Mac OS Extended (Journaled)
1622          *   2:   Mac OS Extended (Case Sensitive)
1623          *   3:   Mac OS Extended (Case Sensitive, Journaled)
1624          *   4 - 127:   Reserved
1625          * 128:   Mac OS Standard
1626          *
1627          */
1628         if (hfsmp->hfs_flags & HFS_STANDARD) {
1629                 subtype = HFS_SUBTYPE_STANDARDHFS;
1630         } else /* HFS Plus */ {
1631                 if (hfsmp->jnl)
1632                         subtype |= HFS_SUBTYPE_JOURNALED;
1633                 if (hfsmp->hfs_flags & HFS_CASE_SENSITIVE)
1634                         subtype |= HFS_SUBTYPE_CASESENSITIVE;
1635         }
1636         sbp->f_fssubtype = subtype;
1637
1638         return (0);
1639 }
1640
1641
1642 //
1643 // XXXdbg -- this is a callback to be used by the journal to
1644 //           get meta data blocks flushed out to disk.
1645 //
1646 // XXXdbg -- be smarter and don't flush *every* block on each
1647 //           call.  try to only flush some so we don't wind up
1648 //           being too synchronous.
1649 //
1650 __private_extern__
1651 void
1652 hfs_sync_metadata(void *arg)
1653 {
1654         struct mount *mp = (struct mount *)arg;
1655         struct hfsmount *hfsmp;
1656         ExtendedVCB *vcb;
1657         buf_t   bp;
1658         int  sectorsize, retval;
1659         daddr64_t priIDSector;
1660         hfsmp = VFSTOHFS(mp);
1661         vcb = HFSTOVCB(hfsmp);
1662
1663         // now make sure the super block is flushed
1664         sectorsize = hfsmp->hfs_phys_block_size;
1665         priIDSector = (daddr64_t)((vcb->hfsPlusIOPosOffset / sectorsize) +
1666                                   HFS_PRI_SECTOR(sectorsize));
1667         retval = (int)buf_meta_bread(hfsmp->hfs_devvp, priIDSector, sectorsize, NOCRED, &bp);
1668         if ((retval != 0 ) && (retval != ENXIO)) {
1669                 printf("hfs_sync_metadata: can't read volume header at %d! (retval 0x%x)\n",
1670                        (int)priIDSector, retval);
1671         }
1672
1673         if (retval == 0 && ((buf_flags(bp) & (B_DELWRI | B_LOCKED)) == B_DELWRI)) {
1674             buf_bwrite(bp);
1675         } else if (bp) {
1676             buf_brelse(bp);
1677         }
1678
1679         // the alternate super block...
1680         // XXXdbg - we probably don't need to do this each and every time.
1681         //          hfs_btreeio.c:FlushAlternate() should flag when it was
1682         //          written...
1683         if (hfsmp->hfs_alt_id_sector) {
1684                 retval = (int)buf_meta_bread(hfsmp->hfs_devvp, hfsmp->hfs_alt_id_sector, sectorsize, NOCRED, &bp);
1685                 if (retval == 0 && ((buf_flags(bp) & (B_DELWRI | B_LOCKED)) == B_DELWRI)) {
1686                     buf_bwrite(bp);
1687                 } else if (bp) {
1688                     buf_brelse(bp);
1689                 }
1690         }
1691 }
1692
1693
1694 struct hfs_sync_cargs {
1695         kauth_cred_t cred;
1696         struct proc  *p;
1697         int    waitfor;
1698         int    error;
1699 };
1700
1701
1702 static int
1703 hfs_sync_callback(struct vnode *vp, void *cargs)
1704 {
1705         struct cnode *cp;
1706         struct hfs_sync_cargs *args;
1707         int error;
1708
1709         args = (struct hfs_sync_cargs *)cargs;
1710
1711         if (hfs_lock(VTOC(vp), HFS_EXCLUSIVE_LOCK) != 0) {
1712                 return (VNODE_RETURNED);
1713         }
1714         cp = VTOC(vp);
1715
1716         if ((cp->c_flag & C_MODIFIED) ||
1717             (cp->c_touch_acctime | cp->c_touch_chgtime | cp->c_touch_modtime) ||
1718             vnode_hasdirtyblks(vp)) {
1719                 error = hfs_fsync(vp, args->waitfor, 0, args->p);
1720
1721                 if (error)
1722                         args->error = error;
1723         }
1724         hfs_unlock(cp);
1725         return (VNODE_RETURNED);
1726 }
1727
1728
1729
1730 /*
1731  * Go through the disk queues to initiate sandbagged IO;
1732  * go through the inodes to write those that have been modified;
1733  * initiate the writing of the super block if it has been modified.
1734  *
1735  * Note: we are always called with the filesystem marked `MPBUSY'.
1736  */
1737 static int
1738 hfs_sync(struct mount *mp, int waitfor, vfs_context_t context)
1739 {
1740         struct proc *p = vfs_context_proc(context);
1741         struct cnode *cp;
1742         struct hfsmount *hfsmp;
1743         ExtendedVCB *vcb;
1744         struct vnode *meta_vp[4];
1745         int i;
1746         int error, allerror = 0;
1747         struct hfs_sync_cargs args;
1748
1749         /*
1750          * During MNT_UPDATE hfs_changefs might be manipulating
1751          * vnodes so back off
1752          */
1753         if (((u_int32_t)vfs_flags(mp)) & MNT_UPDATE)    /* XXX MNT_UPDATE may not be visible here */
1754                 return (0);
1755
1756         hfsmp = VFSTOHFS(mp);
1757         if (hfsmp->hfs_flags & HFS_READ_ONLY)
1758                 return (EROFS);
1759
1760         /* skip over frozen volumes */
1761         if (!lck_rw_try_lock_shared(&hfsmp->hfs_insync))
1762                 return 0;
1763
1764         args.cred = kauth_cred_get();
1765         args.waitfor = waitfor;
1766         args.p = p;
1767         args.error = 0;
1768         /*
1769          * hfs_sync_callback will be called for each vnode
1770          * hung off of this mount point... the vnode will be
1771          * properly referenced and unreferenced around the callback
1772          */
1773         vnode_iterate(mp, 0, hfs_sync_callback, (void *)&args);
1774
1775         if (args.error)
1776                 allerror = args.error;
1777
1778         vcb = HFSTOVCB(hfsmp);
1779
1780         meta_vp[0] = vcb->extentsRefNum;
1781         meta_vp[1] = vcb->catalogRefNum;
1782         meta_vp[2] = vcb->allocationsRefNum;  /* This is NULL for standard HFS */
1783         meta_vp[3] = hfsmp->hfs_attribute_vp; /* Optional file */
1784
1785         /* Now sync our three metadata files */
1786         for (i = 0; i < 4; ++i) {
1787                 struct vnode *btvp;
1788
1789                 btvp = meta_vp[i];;
1790                 if ((btvp==0) || (vnode_mount(btvp) != mp))
1791                         continue;
1792
1793                 /* XXX use hfs_systemfile_lock instead ? */
1794                 (void) hfs_lock(VTOC(btvp), HFS_EXCLUSIVE_LOCK);
1795                 cp = VTOC(btvp);
1796
1797                 if (((cp->c_flag &  C_MODIFIED) == 0) &&
1798                     (cp->c_touch_acctime == 0) &&
1799                     (cp->c_touch_chgtime == 0) &&
1800                     (cp->c_touch_modtime == 0) &&
1801                     vnode_hasdirtyblks(btvp) == 0) {
1802                         hfs_unlock(VTOC(btvp));
1803                         continue;
1804                 }
1805                 error = vnode_get(btvp);
1806                 if (error) {
1807                         hfs_unlock(VTOC(btvp));
1808                         continue;
1809                 }
1810                 if ((error = hfs_fsync(btvp, waitfor, 0, p)))
1811                         allerror = error;
1812
1813                 hfs_unlock(cp);
1814                 vnode_put(btvp);
1815         };
1816
1817         /*
1818          * Force stale file system control information to be flushed.
1819          */
1820         if (vcb->vcbSigWord == kHFSSigWord) {
1821                 if ((error = VNOP_FSYNC(hfsmp->hfs_devvp, waitfor, context))) {
1822                         allerror = error;
1823                 }
1824         }
1825 #if QUOTA
1826         hfs_qsync(mp);
1827 #endif /* QUOTA */
1828
1829         hfs_hotfilesync(hfsmp, vfs_context_kernel());
1830
1831         /*
1832          * Write back modified superblock.
1833          */
1834         if (IsVCBDirty(vcb)) {
1835                 error = hfs_flushvolumeheader(hfsmp, waitfor, 0);
1836                 if (error)
1837                         allerror = error;
1838         }
1839
1840         if (hfsmp->jnl) {
1841             journal_flush(hfsmp->jnl);
1842         }
1843
1844         lck_rw_unlock_shared(&hfsmp->hfs_insync);
1845         return (allerror);
1846 }
1847
1848
1849 /*
1850  * File handle to vnode
1851  *
1852  * Have to be really careful about stale file handles:
1853  * - check that the cnode id is valid
1854  * - call hfs_vget() to get the locked cnode
1855  * - check for an unallocated cnode (i_mode == 0)
1856  * - check that the given client host has export rights and return
1857  *   those rights via. exflagsp and credanonp
1858  */
1859 static int
1860 hfs_fhtovp(struct mount *mp, int fhlen, unsigned char *fhp, struct vnode **vpp, __unused vfs_context_t context)
1861 {
1862         struct hfsfid *hfsfhp;
1863         struct vnode *nvp;
1864         int result;
1865
1866         *vpp = NULL;
1867         hfsfhp = (struct hfsfid *)fhp;
1868
1869         if (fhlen < (int)sizeof(struct hfsfid))
1870                 return (EINVAL);
1871
1872         result = hfs_vget(VFSTOHFS(mp), ntohl(hfsfhp->hfsfid_cnid), &nvp, 0);
1873         if (result) {
1874                 if (result == ENOENT)
1875                         result = ESTALE;
1876                 return result;
1877         }
1878
1879         /* The createtime can be changed by hfs_setattr or hfs_setattrlist.
1880          * For NFS, we are assuming that only if the createtime was moved
1881          * forward would it mean the fileID got reused in that session by
1882          * wrapping. We don't have a volume ID or other unique identifier to
1883          * to use here for a generation ID across reboots, crashes where
1884          * metadata noting lastFileID didn't make it to disk but client has
1885          * it, or volume erasures where fileIDs start over again. Lastly,
1886          * with HFS allowing "wraps" of fileIDs now, this becomes more
1887          * error prone. Future, would be change the "wrap bit" to a unique
1888          * wrap number and use that for generation number. For now do this.
1889          */
1890         if (((time_t)(ntohl(hfsfhp->hfsfid_gen)) < VTOC(nvp)->c_itime)) {
1891                 hfs_unlock(VTOC(nvp));
1892                 vnode_put(nvp);
1893                 return (ESTALE);
1894         }
1895         *vpp = nvp;
1896
1897         hfs_unlock(VTOC(nvp));
1898         return (0);
1899 }
1900
1901
1902 /*
1903  * Vnode pointer to File handle
1904  */
1905 /* ARGSUSED */
1906 static int
1907 hfs_vptofh(struct vnode *vp, int *fhlenp, unsigned char *fhp, __unused vfs_context_t context)
1908 {
1909         struct cnode *cp;
1910         struct hfsfid *hfsfhp;
1911
1912         if (ISHFS(VTOVCB(vp)))
1913                 return (ENOTSUP);       /* hfs standard is not exportable */
1914
1915         if (*fhlenp < (int)sizeof(struct hfsfid))
1916                 return (EOVERFLOW);
1917
1918         cp = VTOC(vp);
1919         hfsfhp = (struct hfsfid *)fhp;
1920         hfsfhp->hfsfid_cnid = htonl(cp->c_fileid);
1921         hfsfhp->hfsfid_gen = htonl(cp->c_itime);
1922         *fhlenp = sizeof(struct hfsfid);
1923
1924         return (0);
1925 }
1926
1927
1928 /*
1929  * Initial HFS filesystems, done only once.
1930  */
1931 static int
1932 hfs_init(__unused struct vfsconf *vfsp)
1933 {
1934         static int done = 0;
1935
1936         if (done)
1937                 return (0);
1938         done = 1;
1939         hfs_chashinit();
1940         hfs_converterinit();
1941
1942         BTReserveSetup();
1943
1944
1945         hfs_lock_attr    = lck_attr_alloc_init();
1946         hfs_group_attr   = lck_grp_attr_alloc_init();
1947         hfs_mutex_group  = lck_grp_alloc_init("hfs-mutex", hfs_group_attr);
1948         hfs_rwlock_group = lck_grp_alloc_init("hfs-rwlock", hfs_group_attr);
1949
1950
1951         return (0);
1952 }
1953
1954 static int
1955 hfs_getmountpoint(struct vnode *vp, struct hfsmount **hfsmpp)
1956 {
1957         struct hfsmount * hfsmp;
1958         char fstypename[MFSNAMELEN];
1959
1960         if (vp == NULL)
1961                 return (EINVAL);
1962
1963         if (!vnode_isvroot(vp))
1964                 return (EINVAL);
1965
1966         vnode_vfsname(vp, fstypename);
1967         if (strncmp(fstypename, "hfs", sizeof(fstypename)) != 0)
1968                 return (EINVAL);
1969
1970         hfsmp = VTOHFS(vp);
1971
1972         if (HFSTOVCB(hfsmp)->vcbSigWord == kHFSSigWord)
1973                 return (EINVAL);
1974
1975         *hfsmpp = hfsmp;
1976
1977         return (0);
1978 }
1979
1980 // XXXdbg
1981 #include <sys/filedesc.h>
1982
1983 /*
1984  * HFS filesystem related variables.
1985  */
1986 static int
1987 hfs_sysctl(int *name, __unused u_int namelen, user_addr_t oldp, size_t *oldlenp,
1988                         user_addr_t newp, size_t newlen, vfs_context_t context)
1989 {
1990         struct proc *p = vfs_context_proc(context);
1991         int error;
1992         struct hfsmount *hfsmp;
1993
1994         /* all sysctl names at this level are terminal */
1995
1996         if (name[0] == HFS_ENCODINGBIAS) {
1997                 int bias;
1998
1999                 bias = hfs_getencodingbias();
2000                 error = sysctl_int(oldp, oldlenp, newp, newlen, &bias);
2001                 if (error == 0 && newp)
2002                         hfs_setencodingbias(bias);
2003                 return (error);
2004
2005         } else if (name[0] == HFS_EXTEND_FS) {
2006         u_int64_t  newsize;
2007                 vnode_t vp = vfs_context_cwd(context);
2008
2009                 if (newp == USER_ADDR_NULL || vp == NULLVP)
2010                         return (EINVAL);
2011                 if ((error = hfs_getmountpoint(vp, &hfsmp)))
2012                         return (error);
2013                 error = sysctl_quad(oldp, oldlenp, newp, newlen, (quad_t *)&newsize);
2014                 if (error)
2015                         return (error);
2016
2017                 error = hfs_extendfs(hfsmp, newsize, context);
2018                 return (error);
2019
2020         } else if (name[0] == HFS_ENCODINGHINT) {
2021                 size_t bufsize;
2022                 size_t bytes;
2023                 u_int32_t hint;
2024                 u_int16_t *unicode_name;
2025                 char *filename;
2026
2027                 if ((newlen <= 0) || (newlen > MAXPATHLEN))
2028                         return (EINVAL);
2029
2030                 bufsize = MAX(newlen * 3, MAXPATHLEN);
2031                 MALLOC(filename, char *, newlen, M_TEMP, M_WAITOK);
2032                 MALLOC(unicode_name, u_int16_t *, bufsize, M_TEMP, M_WAITOK);
2033
2034                 error = copyin(newp, (caddr_t)filename, newlen);
2035                 if (error == 0) {
2036                         error = utf8_decodestr((u_int8_t *)filename, newlen - 1, unicode_name,
2037                                                &bytes, bufsize, 0, UTF_DECOMPOSED);
2038                         if (error == 0) {
2039                                 hint = hfs_pickencoding(unicode_name, bytes / 2);
2040                                 error = sysctl_int(oldp, oldlenp, USER_ADDR_NULL, 0, (int32_t *)&hint);
2041                         }
2042                 }
2043                 FREE(unicode_name, M_TEMP);
2044                 FREE(filename, M_TEMP);
2045                 return (error);
2046
2047         } else if (name[0] == HFS_ENABLE_JOURNALING) {
2048                 // make the file system journaled...
2049                 vnode_t vp = vfs_context_cwd(context);
2050                 vnode_t jvp;
2051                 ExtendedVCB *vcb;
2052                 struct cat_attr jnl_attr, jinfo_attr;
2053                 struct cat_fork jnl_fork, jinfo_fork;
2054                 void *jnl = NULL;
2055                 int lockflags;
2056
2057                 /* Only root can enable journaling */
2058                 if (!is_suser()) {
2059                         return (EPERM);
2060                 }
2061                 if (vp == NULLVP)
2062                         return EINVAL;
2063
2064                 hfsmp = VTOHFS(vp);
2065                 if (hfsmp->hfs_flags & HFS_READ_ONLY) {
2066                         return EROFS;
2067                 }
2068                 if (HFSTOVCB(hfsmp)->vcbSigWord == kHFSSigWord) {
2069                         printf("hfs: can't make a plain hfs volume journaled.\n");
2070                         return EINVAL;
2071                 }
2072
2073                 if (hfsmp->jnl) {
2074                     printf("hfs: volume @ mp %p is already journaled!\n", vnode_mount(vp));
2075                     return EAGAIN;
2076                 }
2077
2078                 vcb = HFSTOVCB(hfsmp);
2079                 lockflags = hfs_systemfile_lock(hfsmp, SFL_CATALOG | SFL_EXTENTS, HFS_EXCLUSIVE_LOCK);
2080                 if (BTHasContiguousNodes(VTOF(vcb->catalogRefNum)) == 0 ||
2081                         BTHasContiguousNodes(VTOF(vcb->extentsRefNum)) == 0) {
2082
2083                         printf("hfs: volume has a btree w/non-contiguous nodes.  can not enable journaling.\n");
2084                         hfs_systemfile_unlock(hfsmp, lockflags);
2085                         return EINVAL;
2086                 }
2087                 hfs_systemfile_unlock(hfsmp, lockflags);
2088
2089                 // make sure these both exist!
2090                 if (   GetFileInfo(vcb, kHFSRootFolderID, ".journal_info_block", &jinfo_attr, &jinfo_fork) == 0
2091                         || GetFileInfo(vcb, kHFSRootFolderID, ".journal", &jnl_attr, &jnl_fork) == 0) {
2092
2093                         return EINVAL;
2094                 }
2095
2096                 hfs_sync(hfsmp->hfs_mp, MNT_WAIT, context);
2097
2098                 printf("hfs: Initializing the journal (joffset 0x%llx sz 0x%llx)...\n",
2099                            (off_t)name[2], (off_t)name[3]);
2100
2101                 jvp = hfsmp->hfs_devvp;
2102                 jnl = journal_create(jvp,
2103                                                          (off_t)name[2] * (off_t)HFSTOVCB(hfsmp)->blockSize
2104                                                          + HFSTOVCB(hfsmp)->hfsPlusIOPosOffset,
2105                                                          (off_t)((unsigned)name[3]),
2106                                                          hfsmp->hfs_devvp,
2107                                                          hfsmp->hfs_phys_block_size,
2108                                                          0,
2109                                                          0,
2110                                                          hfs_sync_metadata, hfsmp->hfs_mp);
2111
2112                 if (jnl == NULL) {
2113                         printf("hfs: FAILED to create the journal!\n");
2114                         if (jvp && jvp != hfsmp->hfs_devvp) {
2115                                 VNOP_CLOSE(jvp, hfsmp->hfs_flags & HFS_READ_ONLY ? FREAD : FREAD|FWRITE, context);
2116                         }
2117                         jvp = NULL;
2118
2119                         return EINVAL;
2120                 }
2121
2122                 hfs_global_exclusive_lock_acquire(hfsmp);
2123
2124                 /*
2125                  * Flush all dirty metadata buffers.
2126                  */
2127                 buf_flushdirtyblks(hfsmp->hfs_devvp, MNT_WAIT, 0, "hfs_sysctl");
2128                 buf_flushdirtyblks(hfsmp->hfs_extents_vp, MNT_WAIT, 0, "hfs_sysctl");
2129                 buf_flushdirtyblks(hfsmp->hfs_catalog_vp, MNT_WAIT, 0, "hfs_sysctl");
2130                 buf_flushdirtyblks(hfsmp->hfs_allocation_vp, MNT_WAIT, 0, "hfs_sysctl");
2131                 if (hfsmp->hfs_attribute_vp)
2132                         buf_flushdirtyblks(hfsmp->hfs_attribute_vp, MNT_WAIT, 0, "hfs_sysctl");
2133
2134                 HFSTOVCB(hfsmp)->vcbJinfoBlock = name[1];
2135                 HFSTOVCB(hfsmp)->vcbAtrb |= kHFSVolumeJournaledMask;
2136                 hfsmp->jvp = jvp;
2137                 hfsmp->jnl = jnl;
2138
2139                 // save this off for the hack-y check in hfs_remove()
2140                 hfsmp->jnl_start        = (u_int32_t)name[2];
2141                 hfsmp->jnl_size         = (off_t)((unsigned)name[3]);
2142                 hfsmp->hfs_jnlinfoblkid = jinfo_attr.ca_fileid;
2143                 hfsmp->hfs_jnlfileid    = jnl_attr.ca_fileid;
2144
2145                 vfs_setflags(hfsmp->hfs_mp, (u_int64_t)((unsigned int)MNT_JOURNALED));
2146
2147                 hfs_global_exclusive_lock_release(hfsmp);
2148                 hfs_flushvolumeheader(hfsmp, MNT_WAIT, 1);
2149
2150                 return 0;
2151         } else if (name[0] == HFS_DISABLE_JOURNALING) {
2152                 // clear the journaling bit
2153                 vnode_t vp = vfs_context_cwd(context);
2154
2155                 /* Only root can disable journaling */
2156                 if (!is_suser()) {
2157                         return (EPERM);
2158                 }
2159                 if (vp == NULLVP)
2160                         return EINVAL;
2161
2162                 hfsmp = VTOHFS(vp);
2163
2164                 /*
2165                  * Disabling journaling is disallowed on volumes with directory hard links
2166                  * because we have not tested the relevant code path.
2167                  */
2168                 if (hfsmp->hfs_private_attr[DIR_HARDLINKS].ca_entries != 0){
2169                         printf("hfs: cannot disable journaling on volumes with directory hardlinks\n");
2170                         return EPERM;
2171                 }
2172
2173                 printf("hfs: disabling journaling for mount @ %p\n", vnode_mount(vp));
2174
2175                 hfs_global_exclusive_lock_acquire(hfsmp);
2176
2177                 // Lights out for you buddy!
2178                 journal_close(hfsmp->jnl);
2179                 hfsmp->jnl = NULL;
2180
2181                 if (hfsmp->jvp && hfsmp->jvp != hfsmp->hfs_devvp) {
2182                         VNOP_CLOSE(hfsmp->jvp, hfsmp->hfs_flags & HFS_READ_ONLY ? FREAD : FREAD|FWRITE, context);
2183                 }
2184                 hfsmp->jvp = NULL;
2185                 vfs_clearflags(hfsmp->hfs_mp, (u_int64_t)((unsigned int)MNT_JOURNALED));
2186                 hfsmp->jnl_start        = 0;
2187                 hfsmp->hfs_jnlinfoblkid = 0;
2188                 hfsmp->hfs_jnlfileid    = 0;
2189
2190                 HFSTOVCB(hfsmp)->vcbAtrb &= ~kHFSVolumeJournaledMask;
2191
2192                 hfs_global_exclusive_lock_release(hfsmp);
2193                 hfs_flushvolumeheader(hfsmp, MNT_WAIT, 1);
2194
2195                 return 0;
2196         } else if (name[0] == HFS_GET_JOURNAL_INFO) {
2197                 vnode_t vp = vfs_context_cwd(context);
2198                 off_t jnl_start, jnl_size;
2199
2200                 if (vp == NULLVP)
2201                         return EINVAL;
2202
2203                 hfsmp = VTOHFS(vp);
2204             if (hfsmp->jnl == NULL) {
2205                         jnl_start = 0;
2206                         jnl_size  = 0;
2207             } else {
2208                         jnl_start = (off_t)(hfsmp->jnl_start * HFSTOVCB(hfsmp)->blockSize) + (off_t)HFSTOVCB(hfsmp)->hfsPlusIOPosOffset;
2209                         jnl_size  = (off_t)hfsmp->jnl_size;
2210             }
2211
2212             if ((error = copyout((caddr_t)&jnl_start, CAST_USER_ADDR_T(name[1]), sizeof(off_t))) != 0) {
2213                         return error;
2214                 }
2215             if ((error = copyout((caddr_t)&jnl_size, CAST_USER_ADDR_T(name[2]), sizeof(off_t))) != 0) {
2216                         return error;
2217                 }
2218
2219                 return 0;
2220         } else if (name[0] == HFS_SET_PKG_EXTENSIONS) {
2221
2222             return set_package_extensions_table((void *)name[1], name[2], name[3]);
2223
2224         } else if (name[0] == VFS_CTL_QUERY) {
2225         struct sysctl_req *req;
2226         struct vfsidctl vc;
2227             struct user_vfsidctl user_vc;
2228         struct mount *mp;
2229             struct vfsquery vq;
2230             boolean_t is_64_bit;
2231
2232         is_64_bit = proc_is64bit(p);
2233                 req = CAST_DOWN(struct sysctl_req *, oldp);     /* we're new style vfs sysctl. */
2234
2235         if (is_64_bit) {
2236             error = SYSCTL_IN(req, &user_vc, sizeof(user_vc));
2237             if (error) return (error);
2238
2239             mp = vfs_getvfs(&user_vc.vc_fsid);
2240         }
2241         else {
2242             error = SYSCTL_IN(req, &vc, sizeof(vc));
2243             if (error) return (error);
2244
2245             mp = vfs_getvfs(&vc.vc_fsid);
2246         }
2247         if (mp == NULL) return (ENOENT);
2248
2249                 hfsmp = VFSTOHFS(mp);
2250                 bzero(&vq, sizeof(vq));
2251                 vq.vq_flags = hfsmp->hfs_notification_conditions;
2252                 return SYSCTL_OUT(req, &vq, sizeof(vq));;
2253         } else if (name[0] == HFS_REPLAY_JOURNAL) {
2254                 char *devnode = NULL;
2255                 size_t devnode_len;
2256
2257                 devnode_len = *oldlenp;
2258                 MALLOC(devnode, char *, devnode_len + 1, M_TEMP, M_WAITOK);
2259                 if (devnode == NULL) {
2260                         return ENOMEM;
2261                 }
2262
2263                 error = copyin(oldp, (caddr_t)devnode, devnode_len);
2264                 if (error) {
2265                         FREE(devnode, M_TEMP);
2266                         return error;
2267                 }
2268                 devnode[devnode_len] = 0;
2269
2270                 error = hfs_journal_replay(devnode, context);
2271                 FREE(devnode, M_TEMP);
2272                 return error;
2273         }
2274
2275         return (ENOTSUP);
2276 }
2277
2278
2279 static int
2280 hfs_vfs_vget(struct mount *mp, ino64_t ino, struct vnode **vpp, __unused vfs_context_t context)
2281 {
2282         int error;
2283
2284         error = hfs_vget(VFSTOHFS(mp), (cnid_t)ino, vpp, 1);
2285         if (error)
2286                 return (error);
2287
2288         /*
2289          * ADLs may need to have their origin state updated
2290          * since build_path needs a valid parent.
2291          */
2292         if (vnode_isdir(*vpp) &&
2293             (VTOC(*vpp)->c_flag & C_HARDLINK) &&
2294             (hfs_lock(VTOC(*vpp), HFS_EXCLUSIVE_LOCK) == 0)) {
2295                 cnode_t *cp = VTOC(*vpp);
2296                 struct cat_desc cdesc;
2297
2298                 if (!hfs_haslinkorigin(cp) &&
2299                     (cat_findname(VFSTOHFS(mp), (cnid_t)ino, &cdesc) == 0)) {
2300                         if (cdesc.cd_parentcnid !=
2301                             VFSTOHFS(mp)->hfs_private_desc[DIR_HARDLINKS].cd_cnid) {
2302                                 hfs_savelinkorigin(cp, cdesc.cd_parentcnid);
2303                         }
2304                         cat_releasedesc(&cdesc);
2305                 }
2306                 hfs_unlock(cp);
2307         }
2308         return (0);
2309 }
2310
2311
2312 /*
2313  * Look up an HFS object by ID.
2314  *
2315  * The object is returned with an iocount reference and the cnode locked.
2316  *
2317  * If the object is a file then it will represent the data fork.
2318  */
2319 __private_extern__
2320 int
2321 hfs_vget(struct hfsmount *hfsmp, cnid_t cnid, struct vnode **vpp, int skiplock)
2322 {
2323         struct vnode *vp = NULLVP;
2324         struct cat_desc cndesc;
2325         struct cat_attr cnattr;
2326         struct cat_fork cnfork;
2327         u_int32_t linkref = 0;
2328         int error;
2329
2330         /* Check for cnids that should't be exported. */
2331         if ((cnid < kHFSFirstUserCatalogNodeID) &&
2332             (cnid != kHFSRootFolderID && cnid != kHFSRootParentID)) {
2333                 return (ENOENT);
2334         }
2335         /* Don't export our private directories. */
2336         if (cnid == hfsmp->hfs_private_desc[FILE_HARDLINKS].cd_cnid ||
2337             cnid == hfsmp->hfs_private_desc[DIR_HARDLINKS].cd_cnid) {
2338                 return (ENOENT);
2339         }
2340         /*
2341          * Check the hash first
2342          */
2343         vp = hfs_chash_getvnode(hfsmp->hfs_raw_dev, cnid, 0, skiplock);
2344         if (vp) {
2345                 *vpp = vp;
2346                 return(0);
2347         }
2348
2349         bzero(&cndesc, sizeof(cndesc));
2350         bzero(&cnattr, sizeof(cnattr));
2351         bzero(&cnfork, sizeof(cnfork));
2352
2353         /*
2354          * Not in hash, lookup in catalog
2355          */
2356         if (cnid == kHFSRootParentID) {
2357                 static char hfs_rootname[] = "/";
2358
2359                 cndesc.cd_nameptr = (const u_int8_t *)&hfs_rootname[0];
2360                 cndesc.cd_namelen = 1;
2361                 cndesc.cd_parentcnid = kHFSRootParentID;
2362                 cndesc.cd_cnid = kHFSRootFolderID;
2363                 cndesc.cd_flags = CD_ISDIR;
2364
2365                 cnattr.ca_fileid = kHFSRootFolderID;
2366                 cnattr.ca_linkcount = 1;
2367                 cnattr.ca_entries = 1;
2368                 cnattr.ca_dircount = 1;
2369                 cnattr.ca_mode = (S_IFDIR | S_IRWXU | S_IRWXG | S_IRWXO);
2370         } else {
2371                 int lockflags;
2372                 cnid_t pid;
2373                 const char *nameptr;
2374
2375                 lockflags = hfs_systemfile_lock(hfsmp, SFL_CATALOG, HFS_SHARED_LOCK);
2376                 error = cat_idlookup(hfsmp, cnid, 0, &cndesc, &cnattr, &cnfork);
2377                 hfs_systemfile_unlock(hfsmp, lockflags);
2378
2379                 if (error) {
2380                         *vpp = NULL;
2381                         return (error);
2382                 }
2383
2384                 /*
2385                  * Check for a raw hardlink inode and save its linkref.
2386                  */
2387                 pid = cndesc.cd_parentcnid;
2388                 nameptr = (const char *)cndesc.cd_nameptr;
2389
2390                 if ((pid == hfsmp->hfs_private_desc[FILE_HARDLINKS].cd_cnid) &&
2391                     (bcmp(nameptr, HFS_INODE_PREFIX, HFS_INODE_PREFIX_LEN) == 0)) {
2392                         linkref = strtoul(&nameptr[HFS_INODE_PREFIX_LEN], NULL, 10);
2393
2394                 } else if ((pid == hfsmp->hfs_private_desc[DIR_HARDLINKS].cd_cnid) &&
2395                            (bcmp(nameptr, HFS_DIRINODE_PREFIX, HFS_DIRINODE_PREFIX_LEN) == 0)) {
2396                         linkref = strtoul(&nameptr[HFS_DIRINODE_PREFIX_LEN], NULL, 10);
2397
2398                 } else if ((pid == hfsmp->hfs_private_desc[FILE_HARDLINKS].cd_cnid) &&
2399                            (bcmp(nameptr, HFS_DELETE_PREFIX, HFS_DELETE_PREFIX_LEN) == 0)) {
2400                         *vpp = NULL;
2401                         cat_releasedesc(&cndesc);
2402                         return (ENOENT);  /* open unlinked file */
2403                 }
2404         }
2405
2406         /*
2407          * Finish initializing cnode descriptor for hardlinks.
2408          *
2409          * We need a valid name and parent for reverse lookups.
2410          */
2411         if (linkref) {
2412                 cnid_t nextlinkid;
2413                 cnid_t prevlinkid;
2414                 struct cat_desc linkdesc;
2415
2416                 cnattr.ca_linkref = linkref;
2417
2418                 /*
2419                  * Pick up the first link in the chain and get a descriptor for it.
2420                  * This allows blind volfs paths to work for hardlinks.
2421                  */
2422                 if ((hfs_lookuplink(hfsmp, linkref, &prevlinkid,  &nextlinkid) == 0) &&
2423                     (nextlinkid != 0)) {
2424                         if (cat_findname(hfsmp, nextlinkid, &linkdesc) == 0) {
2425                                 cat_releasedesc(&cndesc);
2426                                 bcopy(&linkdesc, &cndesc, sizeof(linkdesc));
2427                         }
2428                 }
2429         }
2430
2431         if (linkref) {
2432                 error = hfs_getnewvnode(hfsmp, NULL, NULL, &cndesc, 0, &cnattr, &cnfork, &vp);
2433                 if (error == 0) {
2434                         VTOC(vp)->c_flag |= C_HARDLINK;
2435                         vnode_setmultipath(vp);
2436                 }
2437         } else {
2438                 struct componentname cn;
2439
2440                 /* Supply hfs_getnewvnode with a component name. */
2441                 MALLOC_ZONE(cn.cn_pnbuf, caddr_t, MAXPATHLEN, M_NAMEI, M_WAITOK);
2442                 cn.cn_nameiop = LOOKUP;
2443                 cn.cn_flags = ISLASTCN | HASBUF;
2444                 cn.cn_context = NULL;
2445                 cn.cn_pnlen = MAXPATHLEN;
2446                 cn.cn_nameptr = cn.cn_pnbuf;
2447                 cn.cn_namelen = cndesc.cd_namelen;
2448                 cn.cn_hash = 0;
2449                 cn.cn_consume = 0;
2450                 bcopy(cndesc.cd_nameptr, cn.cn_nameptr, cndesc.cd_namelen + 1);
2451
2452                 error = hfs_getnewvnode(hfsmp, NULLVP, &cn, &cndesc, 0, &cnattr, &cnfork, &vp);
2453
2454                 if (error == 0 && (VTOC(vp)->c_flag & C_HARDLINK) && vnode_isdir(vp)) {
2455                         hfs_savelinkorigin(VTOC(vp), cndesc.cd_parentcnid);
2456                 }
2457                 FREE_ZONE(cn.cn_pnbuf, cn.cn_pnlen, M_NAMEI);
2458         }
2459         cat_releasedesc(&cndesc);
2460
2461         *vpp = vp;
2462         if (vp && skiplock) {
2463                 hfs_unlock(VTOC(vp));
2464         }
2465         return (error);
2466 }
2467
2468
2469 /*
2470  * Flush out all the files in a filesystem.
2471  */
2472 static int
2473 #if QUOTA
2474 hfs_flushfiles(struct mount *mp, int flags, struct proc *p)
2475 #else
2476 hfs_flushfiles(struct mount *mp, int flags, __unused struct proc *p)
2477 #endif /* QUOTA */
2478 {
2479         struct hfsmount *hfsmp;
2480         struct vnode *skipvp = NULLVP;
2481         int error;
2482 #if QUOTA
2483         int quotafilecnt;
2484         int i;
2485 #endif
2486
2487         hfsmp = VFSTOHFS(mp);
2488
2489 #if QUOTA
2490         /*
2491          * The open quota files have an indirect reference on
2492          * the root directory vnode.  We must account for this
2493          * extra reference when doing the intial vflush.
2494          */
2495         quotafilecnt = 0;
2496         if (((unsigned int)vfs_flags(mp)) & MNT_QUOTA) {
2497
2498                 /* Find out how many quota files we have open. */
2499                 for (i = 0; i < MAXQUOTAS; i++) {
2500                         if (hfsmp->hfs_qfiles[i].qf_vp != NULLVP)
2501                                 ++quotafilecnt;
2502                 }
2503
2504                 /* Obtain the root vnode so we can skip over it. */
2505                 skipvp = hfs_chash_getvnode(hfsmp->hfs_raw_dev, kHFSRootFolderID, 0, 0);
2506         }
2507 #endif /* QUOTA */
2508
2509         error = vflush(mp, skipvp, SKIPSYSTEM | SKIPSWAP | flags);
2510         if (error != 0)
2511                 return(error);
2512
2513         error = vflush(mp, skipvp, SKIPSYSTEM | flags);
2514
2515 #if QUOTA
2516         if (((unsigned int)vfs_flags(mp)) & MNT_QUOTA) {
2517                 if (skipvp) {
2518                         /*
2519                          * See if there are additional references on the
2520                          * root vp besides the ones obtained from the open
2521                          * quota files and the hfs_chash_getvnode call above.
2522                          */
2523                         if ((error == 0) &&
2524                             (vnode_isinuse(skipvp,  quotafilecnt))) {
2525                                 error = EBUSY;  /* root directory is still open */
2526                         }
2527                         hfs_unlock(VTOC(skipvp));
2528                         vnode_put(skipvp);
2529                 }
2530                 if (error && (flags & FORCECLOSE) == 0)
2531                         return (error);
2532
2533                 for (i = 0; i < MAXQUOTAS; i++) {
2534                         if (hfsmp->hfs_qfiles[i].qf_vp == NULLVP)
2535                                 continue;
2536                         hfs_quotaoff(p, mp, i);
2537                 }
2538                 error = vflush(mp, NULLVP, SKIPSYSTEM | flags);
2539         }
2540 #endif /* QUOTA */
2541
2542         return (error);
2543 }
2544
2545 /*
2546  * Update volume encoding bitmap (HFS Plus only)
2547  */
2548 __private_extern__
2549 void
2550 hfs_setencodingbits(struct hfsmount *hfsmp, u_int32_t encoding)
2551 {
2552 #define  kIndexMacUkrainian     48  /* MacUkrainian encoding is 152 */
2553 #define  kIndexMacFarsi         49  /* MacFarsi encoding is 140 */
2554
2555         u_int32_t       index;
2556
2557         switch (encoding) {
2558         case kTextEncodingMacUkrainian:
2559                 index = kIndexMacUkrainian;
2560                 break;
2561         case kTextEncodingMacFarsi:
2562                 index = kIndexMacFarsi;
2563                 break;
2564         default:
2565                 index = encoding;
2566                 break;
2567         }
2568
2569         if (index < 64 && (hfsmp->encodingsBitmap & (u_int64_t)(1ULL << index)) == 0) {
2570                 HFS_MOUNT_LOCK(hfsmp, TRUE)
2571                 hfsmp->encodingsBitmap |= (u_int64_t)(1ULL << index);
2572                 MarkVCBDirty(hfsmp);
2573                 HFS_MOUNT_UNLOCK(hfsmp, TRUE);
2574         }
2575 }
2576
2577 /*
2578  * Update volume stats
2579  *
2580  * On journal volumes this will cause a volume header flush
2581  */
2582 __private_extern__
2583 int
2584 hfs_volupdate(struct hfsmount *hfsmp, enum volop op, int inroot)
2585 {
2586         struct timeval tv;
2587
2588         microtime(&tv);
2589
2590         lck_mtx_lock(&hfsmp->hfs_mutex);
2591
2592         MarkVCBDirty(hfsmp);
2593         hfsmp->hfs_mtime = tv.tv_sec;
2594
2595         switch (op) {
2596         case VOL_UPDATE:
2597                 break;
2598         case VOL_MKDIR:
2599                 if (hfsmp->hfs_dircount != 0xFFFFFFFF)
2600                         ++hfsmp->hfs_dircount;
2601                 if (inroot && hfsmp->vcbNmRtDirs != 0xFFFF)
2602                         ++hfsmp->vcbNmRtDirs;
2603                 break;
2604         case VOL_RMDIR:
2605                 if (hfsmp->hfs_dircount != 0)
2606                         --hfsmp->hfs_dircount;
2607                 if (inroot && hfsmp->vcbNmRtDirs != 0xFFFF)
2608                         --hfsmp->vcbNmRtDirs;
2609                 break;
2610         case VOL_MKFILE:
2611                 if (hfsmp->hfs_filecount != 0xFFFFFFFF)
2612                         ++hfsmp->hfs_filecount;
2613                 if (inroot && hfsmp->vcbNmFls != 0xFFFF)
2614                         ++hfsmp->vcbNmFls;
2615                 break;
2616         case VOL_RMFILE:
2617                 if (hfsmp->hfs_filecount != 0)
2618                         --hfsmp->hfs_filecount;
2619                 if (inroot && hfsmp->vcbNmFls != 0xFFFF)
2620                         --hfsmp->vcbNmFls;
2621                 break;
2622         }
2623
2624         lck_mtx_unlock(&hfsmp->hfs_mutex);
2625
2626         if (hfsmp->jnl) {
2627                 hfs_flushvolumeheader(hfsmp, 0, 0);
2628         }
2629
2630         return (0);
2631 }
2632
2633
2634 static int
2635 hfs_flushMDB(struct hfsmount *hfsmp, int waitfor, int altflush)
2636 {
2637         ExtendedVCB *vcb = HFSTOVCB(hfsmp);
2638         struct filefork *fp;
2639         HFSMasterDirectoryBlock *mdb;
2640         struct buf *bp = NULL;
2641         int retval;
2642         int sectorsize;
2643         ByteCount namelen;
2644
2645         sectorsize = hfsmp->hfs_phys_block_size;
2646         retval = (int)buf_bread(hfsmp->hfs_devvp, (daddr64_t)HFS_PRI_SECTOR(sectorsize), sectorsize, NOCRED, &bp);
2647         if (retval) {
2648                 if (bp)
2649                         buf_brelse(bp);
2650                 return retval;
2651         }
2652
2653         lck_mtx_lock(&hfsmp->hfs_mutex);
2654
2655         mdb = (HFSMasterDirectoryBlock *)(buf_dataptr(bp) + HFS_PRI_OFFSET(sectorsize));
2656
2657         mdb->drCrDate   = SWAP_BE32 (UTCToLocal(to_hfs_time(vcb->vcbCrDate)));
2658         mdb->drLsMod    = SWAP_BE32 (UTCToLocal(to_hfs_time(vcb->vcbLsMod)));
2659         mdb->drAtrb     = SWAP_BE16 (vcb->vcbAtrb);
2660         mdb->drNmFls    = SWAP_BE16 (vcb->vcbNmFls);
2661         mdb->drAllocPtr = SWAP_BE16 (vcb->nextAllocation);
2662         mdb->drClpSiz   = SWAP_BE32 (vcb->vcbClpSiz);
2663         mdb->drNxtCNID  = SWAP_BE32 (vcb->vcbNxtCNID);
2664         mdb->drFreeBks  = SWAP_BE16 (vcb->freeBlocks);
2665
2666         namelen = strlen((char *)vcb->vcbVN);
2667         retval = utf8_to_hfs(vcb, namelen, vcb->vcbVN, mdb->drVN);
2668         /* Retry with MacRoman in case that's how it was exported. */
2669         if (retval)
2670                 retval = utf8_to_mac_roman(namelen, vcb->vcbVN, mdb->drVN);
2671
2672         mdb->drVolBkUp  = SWAP_BE32 (UTCToLocal(to_hfs_time(vcb->vcbVolBkUp)));
2673         mdb->drWrCnt    = SWAP_BE32 (vcb->vcbWrCnt);
2674         mdb->drNmRtDirs = SWAP_BE16 (vcb->vcbNmRtDirs);
2675         mdb->drFilCnt   = SWAP_BE32 (vcb->vcbFilCnt);
2676         mdb->drDirCnt   = SWAP_BE32 (vcb->vcbDirCnt);
2677
2678         bcopy(vcb->vcbFndrInfo, mdb->drFndrInfo, sizeof(mdb->drFndrInfo));
2679
2680         fp = VTOF(vcb->extentsRefNum);
2681         mdb->drXTExtRec[0].startBlock = SWAP_BE16 (fp->ff_extents[0].startBlock);
2682         mdb->drXTExtRec[0].blockCount = SWAP_BE16 (fp->ff_extents[0].blockCount);
2683         mdb->drXTExtRec[1].startBlock = SWAP_BE16 (fp->ff_extents[1].startBlock);
2684         mdb->drXTExtRec[1].blockCount = SWAP_BE16 (fp->ff_extents[1].blockCount);
2685         mdb->drXTExtRec[2].startBlock = SWAP_BE16 (fp->ff_extents[2].startBlock);
2686         mdb->drXTExtRec[2].blockCount = SWAP_BE16 (fp->ff_extents[2].blockCount);
2687         mdb->drXTFlSize = SWAP_BE32 (fp->ff_blocks * vcb->blockSize);
2688         mdb->drXTClpSiz = SWAP_BE32 (fp->ff_clumpsize);
2689         FTOC(fp)->c_flag &= ~C_MODIFIED;
2690
2691         fp = VTOF(vcb->catalogRefNum);
2692         mdb->drCTExtRec[0].startBlock = SWAP_BE16 (fp->ff_extents[0].startBlock);
2693         mdb->drCTExtRec[0].blockCount = SWAP_BE16 (fp->ff_extents[0].blockCount);
2694         mdb->drCTExtRec[1].startBlock = SWAP_BE16 (fp->ff_extents[1].startBlock);
2695         mdb->drCTExtRec[1].blockCount = SWAP_BE16 (fp->ff_extents[1].blockCount);
2696         mdb->drCTExtRec[2].startBlock = SWAP_BE16 (fp->ff_extents[2].startBlock);
2697         mdb->drCTExtRec[2].blockCount = SWAP_BE16 (fp->ff_extents[2].blockCount);
2698         mdb->drCTFlSize = SWAP_BE32 (fp->ff_blocks * vcb->blockSize);
2699         mdb->drCTClpSiz = SWAP_BE32 (fp->ff_clumpsize);
2700         FTOC(fp)->c_flag &= ~C_MODIFIED;
2701
2702         MarkVCBClean( vcb );
2703
2704         lck_mtx_unlock(&hfsmp->hfs_mutex);
2705
2706         /* If requested, flush out the alternate MDB */
2707         if (altflush) {
2708                 struct buf *alt_bp = NULL;
2709
2710                 if (buf_meta_bread(hfsmp->hfs_devvp, hfsmp->hfs_alt_id_sector, sectorsize, NOCRED, &alt_bp) == 0) {
2711                         bcopy(mdb, (char *)buf_dataptr(alt_bp) + HFS_ALT_OFFSET(sectorsize), kMDBSize);
2712
2713                         (void) VNOP_BWRITE(alt_bp);
2714                 } else if (alt_bp)
2715                         buf_brelse(alt_bp);
2716         }
2717
2718         if (waitfor != MNT_WAIT)
2719                 buf_bawrite(bp);
2720         else
2721                 retval = VNOP_BWRITE(bp);
2722
2723         return (retval);
2724 }
2725
2726 /*
2727  *  Flush any dirty in-memory mount data to the on-disk
2728  *  volume header.
2729  *
2730  *  Note: the on-disk volume signature is intentionally
2731  *  not flushed since the on-disk "H+" and "HX" signatures
2732  *  are always stored in-memory as "H+".
2733  */
2734 __private_extern__
2735 int
2736 hfs_flushvolumeheader(struct hfsmount *hfsmp, int waitfor, int altflush)
2737 {
2738         ExtendedVCB *vcb = HFSTOVCB(hfsmp);
2739         struct filefork *fp;
2740         HFSPlusVolumeHeader *volumeHeader;
2741         int retval;
2742         struct buf *bp;
2743         int i;
2744         int sectorsize;
2745         daddr64_t priIDSector;
2746         int critical;
2747         u_int16_t  signature;
2748         u_int16_t  hfsversion;
2749
2750         if (hfsmp->hfs_flags & HFS_READ_ONLY) {
2751                 return(0);
2752         }
2753         if (hfsmp->hfs_flags & HFS_STANDARD) {
2754                 return hfs_flushMDB(hfsmp, waitfor, altflush);
2755         }
2756         critical = altflush;
2757         sectorsize = hfsmp->hfs_phys_block_size;
2758         priIDSector = (daddr64_t)((vcb->hfsPlusIOPosOffset / sectorsize) +
2759                                   HFS_PRI_SECTOR(sectorsize));
2760
2761         if (hfs_start_transaction(hfsmp) != 0) {
2762             return EINVAL;
2763         }
2764
2765         retval = (int)buf_meta_bread(hfsmp->hfs_devvp, priIDSector, sectorsize, NOCRED, &bp);
2766         if (retval) {
2767                 if (bp)
2768                         buf_brelse(bp);
2769
2770                 hfs_end_transaction(hfsmp);
2771
2772                 printf("HFS: err %d reading VH blk (%s)\n", retval, vcb->vcbVN);
2773                 return (retval);
2774         }
2775
2776         if (hfsmp->jnl) {
2777                 journal_modify_block_start(hfsmp->jnl, bp);
2778         }
2779
2780         volumeHeader = (HFSPlusVolumeHeader *)((char *)buf_dataptr(bp) + HFS_PRI_OFFSET(sectorsize));
2781
2782         /*
2783          * Sanity check what we just read.
2784          */
2785         signature = SWAP_BE16 (volumeHeader->signature);
2786         hfsversion   = SWAP_BE16 (volumeHeader->version);
2787         if ((signature != kHFSPlusSigWord && signature != kHFSXSigWord) ||
2788             (hfsversion < kHFSPlusVersion) || (hfsversion > 100) ||
2789             (SWAP_BE32 (volumeHeader->blockSize) != vcb->blockSize)) {
2790 #if 1
2791                 panic("HFS: corrupt VH on %s, sig 0x%04x, ver %d, blksize %d",
2792                       vcb->vcbVN, signature, hfsversion,
2793                       SWAP_BE32 (volumeHeader->blockSize));
2794 #endif
2795                 printf("HFS: corrupt VH blk (%s)\n", vcb->vcbVN);
2796                 buf_brelse(bp);
2797                 return (EIO);
2798         }
2799
2800         /*
2801          * For embedded HFS+ volumes, update create date if it changed
2802          * (ie from a setattrlist call)
2803          */
2804         if ((vcb->hfsPlusIOPosOffset != 0) &&
2805             (SWAP_BE32 (volumeHeader->createDate) != vcb->localCreateDate)) {
2806                 struct buf *bp2;
2807                 HFSMasterDirectoryBlock *mdb;
2808
2809                 retval = (int)buf_meta_bread(hfsmp->hfs_devvp, (daddr64_t)HFS_PRI_SECTOR(sectorsize),
2810                                 sectorsize, NOCRED, &bp2);
2811                 if (retval) {
2812                         if (bp2)
2813                                 buf_brelse(bp2);
2814                         retval = 0;
2815                 } else {
2816                         mdb = (HFSMasterDirectoryBlock *)(buf_dataptr(bp2) +
2817                                 HFS_PRI_OFFSET(sectorsize));
2818
2819                         if ( SWAP_BE32 (mdb->drCrDate) != vcb->localCreateDate )
2820                           {
2821                                 if (hfsmp->jnl) {
2822                                     journal_modify_block_start(hfsmp->jnl, bp2);
2823                                 }
2824
2825                                 mdb->drCrDate = SWAP_BE32 (vcb->localCreateDate);       /* pick up the new create date */
2826
2827                                 if (hfsmp->jnl) {
2828                                         journal_modify_block_end(hfsmp->jnl, bp2, NULL, NULL);
2829                                 } else {
2830                                         (void) VNOP_BWRITE(bp2);                /* write out the changes */
2831                                 }
2832                           }
2833                         else
2834                           {
2835                                 buf_brelse(bp2);                                                /* just release it */
2836                           }
2837                   }
2838         }
2839
2840         lck_mtx_lock(&hfsmp->hfs_mutex);
2841
2842         /* Note: only update the lower 16 bits worth of attributes */
2843         volumeHeader->attributes       = SWAP_BE32 (vcb->vcbAtrb);
2844         volumeHeader->journalInfoBlock = SWAP_BE32 (vcb->vcbJinfoBlock);
2845         if (hfsmp->jnl) {
2846                 volumeHeader->lastMountedVersion = SWAP_BE32 (kHFSJMountVersion);
2847         } else {
2848                 volumeHeader->lastMountedVersion = SWAP_BE32 (kHFSPlusMountVersion);
2849         }
2850         volumeHeader->createDate        = SWAP_BE32 (vcb->localCreateDate);  /* volume create date is in local time */
2851         volumeHeader->modifyDate        = SWAP_BE32 (to_hfs_time(vcb->vcbLsMod));
2852         volumeHeader->backupDate        = SWAP_BE32 (to_hfs_time(vcb->vcbVolBkUp));
2853         volumeHeader->fileCount         = SWAP_BE32 (vcb->vcbFilCnt);
2854         volumeHeader->folderCount       = SWAP_BE32 (vcb->vcbDirCnt);
2855         volumeHeader->totalBlocks       = SWAP_BE32 (vcb->totalBlocks);
2856         volumeHeader->freeBlocks        = SWAP_BE32 (vcb->freeBlocks);
2857         volumeHeader->nextAllocation    = SWAP_BE32 (vcb->nextAllocation);
2858         volumeHeader->rsrcClumpSize     = SWAP_BE32 (vcb->vcbClpSiz);
2859         volumeHeader->dataClumpSize     = SWAP_BE32 (vcb->vcbClpSiz);
2860         volumeHeader->nextCatalogID     = SWAP_BE32 (vcb->vcbNxtCNID);
2861         volumeHeader->writeCount        = SWAP_BE32 (vcb->vcbWrCnt);
2862         volumeHeader->encodingsBitmap   = SWAP_BE64 (vcb->encodingsBitmap);
2863
2864         if (bcmp(vcb->vcbFndrInfo, volumeHeader->finderInfo, sizeof(volumeHeader->finderInfo)) != 0) {
2865                 bcopy(vcb->vcbFndrInfo, volumeHeader->finderInfo, sizeof(volumeHeader->finderInfo));
2866                 critical = 1;
2867         }
2868
2869         /*
2870          * System files are only dirty when altflush is set.
2871          */
2872         if (altflush == 0) {
2873                 goto done;
2874         }
2875
2876         /* Sync Extents over-flow file meta data */
2877         fp = VTOF(vcb->extentsRefNum);
2878         if (FTOC(fp)->c_flag & C_MODIFIED) {
2879                 for (i = 0; i < kHFSPlusExtentDensity; i++) {
2880                         volumeHeader->extentsFile.extents[i].startBlock =
2881                                 SWAP_BE32 (fp->ff_extents[i].startBlock);
2882                         volumeHeader->extentsFile.extents[i].blockCount =
2883                                 SWAP_BE32 (fp->ff_extents[i].blockCount);
2884                 }
2885                 volumeHeader->extentsFile.logicalSize = SWAP_BE64 (fp->ff_size);
2886                 volumeHeader->extentsFile.totalBlocks = SWAP_BE32 (fp->ff_blocks);
2887                 volumeHeader->extentsFile.clumpSize   = SWAP_BE32 (fp->ff_clumpsize);
2888                 FTOC(fp)->c_flag &= ~C_MODIFIED;
2889         }
2890
2891         /* Sync Catalog file meta data */
2892         fp = VTOF(vcb->catalogRefNum);
2893         if (FTOC(fp)->c_flag & C_MODIFIED) {
2894                 for (i = 0; i < kHFSPlusExtentDensity; i++) {
2895                         volumeHeader->catalogFile.extents[i].startBlock =
2896                                 SWAP_BE32 (fp->ff_extents[i].startBlock);
2897                         volumeHeader->catalogFile.extents[i].blockCount =
2898                                 SWAP_BE32 (fp->ff_extents[i].blockCount);
2899                 }
2900                 volumeHeader->catalogFile.logicalSize = SWAP_BE64 (fp->ff_size);
2901                 volumeHeader->catalogFile.totalBlocks = SWAP_BE32 (fp->ff_blocks);
2902                 volumeHeader->catalogFile.clumpSize   = SWAP_BE32 (fp->ff_clumpsize);
2903                 FTOC(fp)->c_flag &= ~C_MODIFIED;
2904         }
2905
2906         /* Sync Allocation file meta data */
2907         fp = VTOF(vcb->allocationsRefNum);
2908         if (FTOC(fp)->c_flag & C_MODIFIED) {
2909                 for (i = 0; i < kHFSPlusExtentDensity; i++) {
2910                         volumeHeader->allocationFile.extents[i].startBlock =
2911                                 SWAP_BE32 (fp->ff_extents[i].startBlock);
2912                         volumeHeader->allocationFile.extents[i].blockCount =
2913                                 SWAP_BE32 (fp->ff_extents[i].blockCount);
2914                 }
2915                 volumeHeader->allocationFile.logicalSize = SWAP_BE64 (fp->ff_size);
2916                 volumeHeader->allocationFile.totalBlocks = SWAP_BE32 (fp->ff_blocks);
2917                 volumeHeader->allocationFile.clumpSize   = SWAP_BE32 (fp->ff_clumpsize);
2918                 FTOC(fp)->c_flag &= ~C_MODIFIED;
2919         }
2920
2921         /* Sync Attribute file meta data */
2922         if (hfsmp->hfs_attribute_vp) {
2923                 fp = VTOF(hfsmp->hfs_attribute_vp);
2924                 for (i = 0; i < kHFSPlusExtentDensity; i++) {
2925                         volumeHeader->attributesFile.extents[i].startBlock =
2926                                 SWAP_BE32 (fp->ff_extents[i].startBlock);
2927                         volumeHeader->attributesFile.extents[i].blockCount =
2928                                 SWAP_BE32 (fp->ff_extents[i].blockCount);
2929                 }
2930                 FTOC(fp)->c_flag &= ~C_MODIFIED;
2931                 volumeHeader->attributesFile.logicalSize = SWAP_BE64 (fp->ff_size);
2932                 volumeHeader->attributesFile.totalBlocks = SWAP_BE32 (fp->ff_blocks);
2933                 volumeHeader->attributesFile.clumpSize   = SWAP_BE32 (fp->ff_clumpsize);
2934         }
2935
2936         /* Sync Startup file meta data */
2937         if (hfsmp->hfs_startup_vp) {
2938                 fp = VTOF(hfsmp->hfs_startup_vp);
2939                 if (FTOC(fp)->c_flag & C_MODIFIED) {
2940                         for (i = 0; i < kHFSPlusExtentDensity; i++) {
2941                                 volumeHeader->startupFile.extents[i].startBlock =
2942                                         SWAP_BE32 (fp->ff_extents[i].startBlock);
2943                                 volumeHeader->startupFile.extents[i].blockCount =
2944                                         SWAP_BE32 (fp->ff_extents[i].blockCount);
2945                         }
2946                         volumeHeader->startupFile.logicalSize = SWAP_BE64 (fp->ff_size);
2947                         volumeHeader->startupFile.totalBlocks = SWAP_BE32 (fp->ff_blocks);
2948                         volumeHeader->startupFile.clumpSize   = SWAP_BE32 (fp->ff_clumpsize);
2949                         FTOC(fp)->c_flag &= ~C_MODIFIED;
2950                 }
2951         }
2952
2953 done:
2954         MarkVCBClean(hfsmp);
2955         lck_mtx_unlock(&hfsmp->hfs_mutex);
2956
2957         /* If requested, flush out the alternate volume header */
2958         if (altflush && hfsmp->hfs_alt_id_sector) {
2959                 struct buf *alt_bp = NULL;
2960
2961                 if (buf_meta_bread(hfsmp->hfs_devvp, hfsmp->hfs_alt_id_sector, sectorsize, NOCRED, &alt_bp) == 0) {
2962                         if (hfsmp->jnl) {
2963                                 journal_modify_block_start(hfsmp->jnl, alt_bp);
2964                         }
2965
2966                         bcopy(volumeHeader, (char *)buf_dataptr(alt_bp) + HFS_ALT_OFFSET(sectorsize), kMDBSize);
2967
2968                         if (hfsmp->jnl) {
2969                                 journal_modify_block_end(hfsmp->jnl, alt_bp, NULL, NULL);
2970                         } else {
2971                                 (void) VNOP_BWRITE(alt_bp);
2972                         }
2973                 } else if (alt_bp)
2974                         buf_brelse(alt_bp);
2975         }
2976
2977         if (hfsmp->jnl) {
2978                 journal_modify_block_end(hfsmp->jnl, bp, NULL, NULL);
2979         } else {
2980                 if (waitfor != MNT_WAIT)
2981                         buf_bawrite(bp);
2982                 else {
2983                     retval = VNOP_BWRITE(bp);
2984                     /* When critical data changes, flush the device cache */
2985                     if (critical && (retval == 0)) {
2986                         (void) VNOP_IOCTL(hfsmp->hfs_devvp, DKIOCSYNCHRONIZECACHE,
2987                                          NULL, FWRITE, NULL);
2988                     }
2989                 }
2990         }
2991         hfs_end_transaction(hfsmp);
2992
2993         return (retval);
2994 }
2995
2996
2997 /*
2998  * Extend a file system.
2999  */
3000 __private_extern__
3001 int
3002 hfs_extendfs(struct hfsmount *hfsmp, u_int64_t newsize, vfs_context_t context)
3003 {
3004         struct proc *p = vfs_context_proc(context);
3005         kauth_cred_t cred = vfs_context_ucred(context);
3006         struct  vnode *vp;
3007         struct  vnode *devvp;
3008         struct  buf *bp;
3009         struct  filefork *fp = NULL;
3010         ExtendedVCB  *vcb;
3011         struct  cat_fork forkdata;
3012         u_int64_t  oldsize;
3013         u_int64_t  newblkcnt;
3014         u_int64_t  prev_phys_block_count;
3015         u_int32_t  addblks;
3016         u_int64_t  sectorcnt;
3017         u_int32_t  sectorsize;
3018         daddr64_t  prev_alt_sector;
3019         daddr_t    bitmapblks;
3020         int  lockflags;
3021         int  error;
3022         int64_t oldBitmapSize;
3023         Boolean  usedExtendFileC = false;
3024
3025         devvp = hfsmp->hfs_devvp;
3026         vcb = HFSTOVCB(hfsmp);
3027
3028         /*
3029          * - HFS Plus file systems only.
3030          * - Journaling must be enabled.
3031          * - No embedded volumes.
3032          */
3033         if ((vcb->vcbSigWord == kHFSSigWord) ||
3034              (hfsmp->jnl == NULL) ||
3035              (vcb->hfsPlusIOPosOffset != 0)) {
3036                 return (EPERM);
3037         }
3038         /*
3039          * If extending file system by non-root, then verify
3040          * ownership and check permissions.
3041          */
3042         if (suser(cred, NULL)) {
3043                 error = hfs_vget(hfsmp, kHFSRootFolderID, &vp, 0);
3044
3045                 if (error)
3046                         return (error);
3047                 error = hfs_owner_rights(hfsmp, VTOC(vp)->c_uid, cred, p, 0);
3048                 if (error == 0) {
3049                         error = hfs_write_access(vp, cred, p, false);
3050                 }
3051                 hfs_unlock(VTOC(vp));
3052                 vnode_put(vp);
3053                 if (error)
3054                         return (error);
3055
3056                 error = vnode_authorize(devvp, NULL, KAUTH_VNODE_READ_DATA | KAUTH_VNODE_WRITE_DATA, context);
3057                 if (error)
3058                         return (error);
3059         }
3060         if (VNOP_IOCTL(devvp, DKIOCGETBLOCKSIZE, (caddr_t)&sectorsize, 0, context)) {
3061                 return (ENXIO);
3062         }
3063         if (sectorsize != hfsmp->hfs_phys_block_size) {
3064                 return (ENXIO);
3065         }
3066         if (VNOP_IOCTL(devvp, DKIOCGETBLOCKCOUNT, (caddr_t)&sectorcnt, 0, context)) {
3067                 return (ENXIO);
3068         }
3069         if ((sectorsize * sectorcnt) < newsize) {
3070                 printf("hfs_extendfs: not enough space on device\n");
3071                 return (ENOSPC);
3072         }
3073         oldsize = (u_int64_t)hfsmp->totalBlocks * (u_int64_t)hfsmp->blockSize;
3074
3075         /*
3076          * Validate new size.
3077          */
3078         if ((newsize <= oldsize) || (newsize % sectorsize)) {
3079                 printf("hfs_extendfs: invalid size\n");
3080                 return (EINVAL);
3081         }
3082         newblkcnt = newsize / vcb->blockSize;
3083         if (newblkcnt > (u_int64_t)0xFFFFFFFF)
3084                 return (EOVERFLOW);
3085
3086         addblks = newblkcnt - vcb->totalBlocks;
3087
3088         printf("hfs_extendfs: growing %s by %d blocks\n", vcb->vcbVN, addblks);
3089         /*
3090          * Enclose changes inside a transaction.
3091          */
3092         if (hfs_start_transaction(hfsmp) != 0) {
3093                 return (EINVAL);
3094         }
3095
3096         /*
3097          * Note: we take the attributes lock in case we have an attribute data vnode
3098          * which needs to change size.
3099          */
3100         lockflags = hfs_systemfile_lock(hfsmp, SFL_ATTRIBUTE | SFL_EXTENTS | SFL_BITMAP, HFS_EXCLUSIVE_LOCK);
3101         vp = vcb->allocationsRefNum;
3102         fp = VTOF(vp);
3103         bcopy(&fp->ff_data, &forkdata, sizeof(forkdata));
3104
3105         /*
3106          * Calculate additional space required (if any) by allocation bitmap.
3107          */
3108         oldBitmapSize = fp->ff_size;
3109         bitmapblks = roundup((newblkcnt+7) / 8, vcb->vcbVBMIOSize) / vcb->blockSize;
3110         if (bitmapblks > (daddr_t)fp->ff_blocks)
3111                 bitmapblks -= fp->ff_blocks;
3112         else
3113                 bitmapblks = 0;
3114
3115         if (bitmapblks > 0) {
3116                 daddr64_t blkno;
3117                 daddr_t blkcnt;
3118                 off_t bytesAdded;
3119
3120                 /*
3121                  * Get the bitmap's current size (in allocation blocks) so we know
3122                  * where to start zero filling once the new space is added.  We've
3123                  * got to do this before the bitmap is grown.
3124                  */
3125                 blkno  = (daddr64_t)fp->ff_blocks;
3126
3127                 /*
3128                  * Try to grow the allocation file in the normal way, using allocation
3129                  * blocks already existing in the file system.  This way, we might be
3130                  * able to grow the bitmap contiguously, or at least in the metadata
3131                  * zone.
3132                  */
3133                 error = ExtendFileC(vcb, fp, bitmapblks * vcb->blockSize, 0,
3134                                 kEFAllMask | kEFNoClumpMask | kEFReserveMask | kEFMetadataMask,
3135                                 &bytesAdded);
3136
3137                 if (error == 0) {
3138                         usedExtendFileC = true;
3139                 } else {
3140                         /*
3141                          * If the above allocation failed, fall back to allocating the new
3142                          * extent of the bitmap from the space we're going to add.  Since those
3143                          * blocks don't yet belong to the file system, we have to update the
3144                          * extent list directly, and manually adjust the file size.
3145                          */
3146                         bytesAdded = 0;
3147                         error = AddFileExtent(vcb, fp, vcb->totalBlocks, bitmapblks);
3148                         if (error) {
3149                                 printf("hfs_extendfs: error %d adding extents\n", error);
3150                                 goto out;
3151                         }
3152                         fp->ff_blocks += bitmapblks;
3153                         VTOC(vp)->c_blocks = fp->ff_blocks;
3154                         VTOC(vp)->c_flag |= C_MODIFIED;
3155                 }
3156
3157                 /*
3158                  * Update the allocation file's size to include the newly allocated
3159                  * blocks.  Note that ExtendFileC doesn't do this, which is why this
3160                  * statement is outside the above "if" statement.
3161                  */
3162                 fp->ff_size += (u_int64_t)bitmapblks * (u_int64_t)vcb->blockSize;
3163
3164                 /*
3165                  * Zero out the new bitmap blocks.
3166                  */
3167                 {
3168
3169                         bp = NULL;
3170                         blkcnt = bitmapblks;
3171                         while (blkcnt > 0) {
3172                                 error = (int)buf_meta_bread(vp, blkno, vcb->blockSize, NOCRED, &bp);
3173                                 if (error) {
3174                                         if (bp) {
3175                                                 buf_brelse(bp);
3176                                         }
3177                                         break;
3178                                 }
3179                                 bzero((char *)buf_dataptr(bp), vcb->blockSize);
3180                                 buf_markaged(bp);
3181                                 error = (int)buf_bwrite(bp);
3182                                 if (error)
3183                                         break;
3184                                 --blkcnt;
3185                                 ++blkno;
3186                         }
3187                 }
3188                 if (error) {
3189                         printf("hfs_extendfs: error %d  clearing blocks\n", error);
3190                         goto out;
3191                 }
3192                 /*
3193                  * Mark the new bitmap space as allocated.
3194                  *
3195                  * Note that ExtendFileC will have marked any blocks it allocated, so
3196                  * this is only needed if we used AddFileExtent.  Also note that this
3197                  * has to come *after* the zero filling of new blocks in the case where
3198                  * we used AddFileExtent (since the part of the bitmap we're touching
3199                  * is in those newly allocated blocks).
3200                  */
3201                 if (!usedExtendFileC) {
3202                         error = BlockMarkAllocated(vcb, vcb->totalBlocks, bitmapblks);
3203                         if (error) {
3204                                 printf("hfs_extendfs: error %d setting bitmap\n", error);
3205                                 goto out;
3206                         }
3207                         vcb->freeBlocks -= bitmapblks;
3208                 }
3209         }
3210         /*
3211          * Mark the new alternate VH as allocated.
3212          */
3213         if (vcb->blockSize == 512)
3214                 error = BlockMarkAllocated(vcb, vcb->totalBlocks + addblks - 2, 2);
3215         else
3216                 error = BlockMarkAllocated(vcb, vcb->totalBlocks + addblks - 1, 1);
3217         if (error) {
3218                 printf("hfs_extendfs: error %d setting bitmap (VH)\n", error);
3219                 goto out;
3220         }
3221         /*
3222          * Mark the old alternate VH as free.
3223          */
3224         if (vcb->blockSize == 512)
3225                 (void) BlockMarkFree(vcb, vcb->totalBlocks - 2, 2);
3226         else
3227                 (void) BlockMarkFree(vcb, vcb->totalBlocks - 1, 1);
3228         /*
3229          * Adjust file system variables for new space.
3230          */
3231         prev_phys_block_count = hfsmp->hfs_phys_block_count;
3232         prev_alt_sector = hfsmp->hfs_alt_id_sector;
3233
3234         vcb->totalBlocks += addblks;
3235         vcb->freeBlocks += addblks;
3236         hfsmp->hfs_phys_block_count = newsize / sectorsize;
3237         hfsmp->hfs_alt_id_sector = (hfsmp->hfsPlusIOPosOffset / sectorsize) +
3238                                   HFS_ALT_SECTOR(sectorsize, hfsmp->hfs_phys_block_count);
3239         MarkVCBDirty(vcb);
3240         error = hfs_flushvolumeheader(hfsmp, MNT_WAIT, HFS_ALTFLUSH);
3241         if (error) {
3242                 printf("hfs_extendfs: couldn't flush volume headers (%d)", error);
3243                 /*
3244                  * Restore to old state.
3245                  */
3246                 if (usedExtendFileC) {
3247                         (void) TruncateFileC(vcb, fp, oldBitmapSize, false);
3248                 } else {
3249                         fp->ff_blocks -= bitmapblks;
3250                         fp->ff_size -= (u_int64_t)bitmapblks * (u_int64_t)vcb->blockSize;
3251                         /*
3252                          * No need to mark the excess blocks free since those bitmap blocks
3253                          * are no longer part of the bitmap.  But we do need to undo the
3254                          * effect of the "vcb->freeBlocks -= bitmapblks" above.
3255                          */
3256                         vcb->freeBlocks += bitmapblks;
3257                 }
3258                 vcb->totalBlocks -= addblks;
3259                 vcb->freeBlocks -= addblks;
3260                 hfsmp->hfs_phys_block_count = prev_phys_block_count;
3261                 hfsmp->hfs_alt_id_sector = prev_alt_sector;
3262                 MarkVCBDirty(vcb);
3263                 if (vcb->blockSize == 512)
3264                         (void) BlockMarkAllocated(vcb, vcb->totalBlocks - 2, 2);
3265                 else
3266                         (void) BlockMarkAllocated(vcb, vcb->totalBlocks - 1, 1);
3267                 goto out;
3268         }
3269         /*
3270          * Invalidate the old alternate volume header.
3271          */
3272         bp = NULL;
3273         if (prev_alt_sector) {
3274                 if (buf_meta_bread(hfsmp->hfs_devvp, prev_alt_sector, sectorsize,
3275                                    NOCRED, &bp) == 0) {
3276                         journal_modify_block_start(hfsmp->jnl, bp);
3277
3278                         bzero((char *)buf_dataptr(bp) + HFS_ALT_OFFSET(sectorsize), kMDBSize);
3279
3280                         journal_modify_block_end(hfsmp->jnl, bp, NULL, NULL);
3281                 } else if (bp) {
3282                         buf_brelse(bp);
3283                 }
3284         }
3285
3286         /*
3287          * TODO: Adjust the size of the metadata zone based on new volume size?
3288          */
3289
3290         /*
3291          * Adjust the size of hfsmp->hfs_attrdata_vp
3292          */
3293         if (hfsmp->hfs_attrdata_vp) {
3294                 struct cnode *attr_cp;
3295                 struct filefork *attr_fp;
3296
3297                 if (vnode_get(hfsmp->hfs_attrdata_vp) == 0) {
3298                         attr_cp = VTOC(hfsmp->hfs_attrdata_vp);
3299                         attr_fp = VTOF(hfsmp->hfs_attrdata_vp);
3300
3301                         attr_cp->c_blocks = newblkcnt;
3302                         attr_fp->ff_blocks = newblkcnt;
3303                         attr_fp->ff_extents[0].blockCount = newblkcnt;
3304                         attr_fp->ff_size = (off_t) newblkcnt * hfsmp->blockSize;
3305                         ubc_setsize(hfsmp->hfs_attrdata_vp, attr_fp->ff_size);
3306                         vnode_put(hfsmp->hfs_attrdata_vp);
3307                 }
3308         }
3309
3310 out:
3311         if (error && fp) {
3312                 /* Restore allocation fork. */
3313                 bcopy(&forkdata, &fp->ff_data, sizeof(forkdata));
3314                 VTOC(vp)->c_blocks = fp->ff_blocks;
3315
3316         }
3317         /*
3318            Regardless of whether or not the totalblocks actually increased,
3319            we should reset the allocLimit field. If it changed, it will
3320            get updated; if not, it will remain the same.
3321         */
3322         hfsmp->allocLimit = vcb->totalBlocks;
3323         hfs_systemfile_unlock(hfsmp, lockflags);
3324         hfs_end_transaction(hfsmp);
3325
3326         return (error);
3327 }
3328
3329 #define HFS_MIN_SIZE  (32LL * 1024LL * 1024LL)
3330
3331 /*
3332  * Truncate a file system (while still mounted).
3333  */
3334 __private_extern__
3335 int
3336 hfs_truncatefs(struct hfsmount *hfsmp, u_int64_t newsize, vfs_context_t context)
3337 {
3338         struct  buf *bp = NULL;
3339         u_int64_t oldsize;
3340         u_int32_t newblkcnt;
3341         u_int32_t reclaimblks = 0;
3342         int lockflags = 0;
3343         int transaction_begun = 0;
3344         int error;
3345
3346         lck_mtx_lock(&hfsmp->hfs_mutex);
3347         if (hfsmp->hfs_flags & HFS_RESIZE_IN_PROGRESS) {
3348                 lck_mtx_unlock(&hfsmp->hfs_mutex);
3349                 return (EALREADY);
3350         }
3351         hfsmp->hfs_flags |= HFS_RESIZE_IN_PROGRESS;
3352         hfsmp->hfs_resize_filesmoved = 0;
3353         hfsmp->hfs_resize_totalfiles = 0;
3354         lck_mtx_unlock(&hfsmp->hfs_mutex);
3355
3356         /*
3357          * - Journaled HFS Plus volumes only.
3358          * - No embedded volumes.
3359          */
3360         if ((hfsmp->jnl == NULL) ||
3361             (hfsmp->hfsPlusIOPosOffset != 0)) {
3362                 error = EPERM;
3363                 goto out;
3364         }
3365         oldsize = (u_int64_t)hfsmp->totalBlocks * (u_int64_t)hfsmp->blockSize;
3366         newblkcnt = newsize / hfsmp->blockSize;
3367         reclaimblks = hfsmp->totalBlocks - newblkcnt;
3368
3369         /* Make sure new size is valid. */
3370         if ((newsize < HFS_MIN_SIZE) ||
3371             (newsize >= oldsize) ||
3372             (newsize % hfsmp->hfs_phys_block_size)) {
3373                 error = EINVAL;
3374                 goto out;
3375         }
3376         /* Make sure there's enough space to work with. */
3377         if (reclaimblks >= hfs_freeblks(hfsmp, 1)) {
3378                 printf("hfs_truncatefs: insufficient space (need %u blocks; have %u blocks)\n", reclaimblks, hfs_freeblks(hfsmp, 1));
3379                 error = ENOSPC;
3380                 goto out;
3381         }
3382
3383         /* Start with a clean journal. */
3384         journal_flush(hfsmp->jnl);
3385
3386         if (hfs_start_transaction(hfsmp) != 0) {
3387                 error = EINVAL;
3388                 goto out;
3389         }
3390         transaction_begun = 1;
3391
3392         /*
3393          * Prevent new allocations from using the part we're trying to truncate.
3394          *
3395          * NOTE: allocLimit is set to the allocation block number where the new
3396          * alternate volume header will be.  That way there will be no files to
3397          * interfere with allocating the new alternate volume header, and no files
3398          * in the allocation blocks beyond (i.e. the blocks we're trying to
3399          * truncate away.
3400          */
3401         lck_mtx_lock(&hfsmp->hfs_mutex);
3402         if (hfsmp->blockSize == 512)
3403                 hfsmp->allocLimit = newblkcnt - 2;
3404         else
3405                 hfsmp->allocLimit = newblkcnt - 1;
3406         hfsmp->freeBlocks -= reclaimblks;
3407         lck_mtx_unlock(&hfsmp->hfs_mutex);
3408
3409         /*
3410          * Look for files that have blocks at or beyond the location of the
3411          * new alternate volume header.
3412          */
3413         if (hfs_isallocated(hfsmp, hfsmp->allocLimit, reclaimblks)) {
3414                 /*
3415                  * hfs_reclaimspace will use separate transactions when
3416                  * relocating files (so we don't overwhelm the journal).
3417                  */
3418                 hfs_end_transaction(hfsmp);
3419                 transaction_begun = 0;
3420
3421                 /* Attempt to reclaim some space. */
3422                 if (hfs_reclaimspace(hfsmp, hfsmp->allocLimit, reclaimblks, context) != 0) {
3423                         printf("hfs_truncatefs: couldn't reclaim space on %s\n", hfsmp->vcbVN);
3424                         error = ENOSPC;
3425                         goto out;
3426                 }
3427                 if (hfs_start_transaction(hfsmp) != 0) {
3428                         error = EINVAL;
3429                         goto out;
3430                 }
3431                 transaction_begun = 1;
3432
3433                 /* Check if we're clear now. */
3434                 if (hfs_isallocated(hfsmp, hfsmp->allocLimit, reclaimblks)) {
3435                         printf("hfs_truncatefs: didn't reclaim enough space on %s\n", hfsmp->vcbVN);
3436                         error = EAGAIN;  /* tell client to try again */
3437                         goto out;
3438                 }
3439         }
3440
3441         /*
3442          * Note: we take the attributes lock in case we have an attribute data vnode
3443          * which needs to change size.
3444          */
3445         lockflags = hfs_systemfile_lock(hfsmp, SFL_ATTRIBUTE | SFL_EXTENTS | SFL_BITMAP, HFS_EXCLUSIVE_LOCK);
3446
3447         /*
3448          * Mark the old alternate volume header as free.
3449          * We don't bother shrinking allocation bitmap file.
3450          */
3451         if (hfsmp->blockSize == 512)
3452                 (void) BlockMarkFree(hfsmp, hfsmp->totalBlocks - 2, 2);
3453         else
3454                 (void) BlockMarkFree(hfsmp, hfsmp->totalBlocks - 1, 1);
3455
3456         /*
3457          * Allocate last 1KB for alternate volume header.
3458          */
3459         error = BlockMarkAllocated(hfsmp, hfsmp->allocLimit, (hfsmp->blockSize == 512) ? 2 : 1);
3460         if (error) {
3461                 printf("hfs_truncatefs: Error %d allocating new alternate volume header\n", error);
3462                 goto out;
3463         }
3464
3465         /*
3466          * Invalidate the existing alternate volume header.
3467          *
3468          * Don't include this in a transaction (don't call journal_modify_block)
3469          * since this block will be outside of the truncated file system!
3470          */
3471         if (hfsmp->hfs_alt_id_sector) {
3472                 if (buf_meta_bread(hfsmp->hfs_devvp, hfsmp->hfs_alt_id_sector,
3473                                    hfsmp->hfs_phys_block_size, NOCRED, &bp) == 0) {
3474
3475                         bzero((void*)((char *)buf_dataptr(bp) + HFS_ALT_OFFSET(hfsmp->hfs_phys_block_size)), kMDBSize);
3476                         (void) VNOP_BWRITE(bp);
3477                 } else if (bp) {
3478                         buf_brelse(bp);
3479                 }
3480                 bp = NULL;
3481         }
3482
3483         /* Log successful shrinking. */
3484         printf("hfs_truncatefs: shrank \"%s\" to %d blocks (was %d blocks)\n",
3485                hfsmp->vcbVN, newblkcnt, hfsmp->totalBlocks);
3486
3487         /*
3488          * Adjust file system variables and flush them to disk.
3489          */
3490         hfsmp->totalBlocks = newblkcnt;
3491         hfsmp->hfs_phys_block_count = newsize / hfsmp->hfs_phys_block_size;
3492         hfsmp->hfs_alt_id_sector = HFS_ALT_SECTOR(hfsmp->hfs_phys_block_size, hfsmp->hfs_phys_block_count);
3493         MarkVCBDirty(hfsmp);
3494         error = hfs_flushvolumeheader(hfsmp, MNT_WAIT, HFS_ALTFLUSH);
3495         if (error)
3496                 panic("hfs_truncatefs: unexpected error flushing volume header (%d)\n", error);
3497
3498         /*
3499          * TODO: Adjust the size of the metadata zone based on new volume size?
3500          */
3501
3502         /*
3503          * Adjust the size of hfsmp->hfs_attrdata_vp
3504          */
3505         if (hfsmp->hfs_attrdata_vp) {
3506                 struct cnode *cp;
3507                 struct filefork *fp;
3508
3509                 if (vnode_get(hfsmp->hfs_attrdata_vp) == 0) {
3510                         cp = VTOC(hfsmp->hfs_attrdata_vp);
3511                         fp = VTOF(hfsmp->hfs_attrdata_vp);
3512
3513                         cp->c_blocks = newblkcnt;
3514                         fp->ff_blocks = newblkcnt;
3515                         fp->ff_extents[0].blockCount = newblkcnt;
3516                         fp->ff_size = (off_t) newblkcnt * hfsmp->blockSize;
3517                         ubc_setsize(hfsmp->hfs_attrdata_vp, fp->ff_size);
3518                         vnode_put(hfsmp->hfs_attrdata_vp);
3519                 }
3520         }
3521
3522 out:
3523         if (error)
3524                 hfsmp->freeBlocks += reclaimblks;
3525
3526         lck_mtx_lock(&hfsmp->hfs_mutex);
3527         hfsmp->allocLimit = hfsmp->totalBlocks;
3528         if (hfsmp->nextAllocation >= hfsmp->allocLimit)
3529                 hfsmp->nextAllocation = hfsmp->hfs_metazone_end + 1;
3530         hfsmp->hfs_flags &= ~HFS_RESIZE_IN_PROGRESS;
3531         lck_mtx_unlock(&hfsmp->hfs_mutex);
3532
3533         if (lockflags) {
3534                 hfs_systemfile_unlock(hfsmp, lockflags);
3535         }
3536         if (transaction_begun) {
3537                 hfs_end_transaction(hfsmp);
3538                 journal_flush(hfsmp->jnl);
3539         }
3540
3541         return (error);
3542 }
3543
3544
3545 /*
3546  * Invalidate the physical block numbers associated with buffer cache blocks
3547  * in the given extent of the given vnode.
3548  */
3549 struct hfs_inval_blk_no {
3550         daddr64_t sectorStart;
3551         daddr64_t sectorCount;
3552 };
3553 static int
3554 hfs_invalidate_block_numbers_callback(buf_t bp, void *args_in)
3555 {
3556         daddr64_t blkno;
3557         struct hfs_inval_blk_no *args;
3558
3559         blkno = buf_blkno(bp);
3560         args = args_in;
3561
3562         if (blkno >= args->sectorStart && blkno < args->sectorStart+args->sectorCount)
3563                 buf_setblkno(bp, buf_lblkno(bp));
3564
3565         return BUF_RETURNED;
3566 }
3567 static void
3568 hfs_invalidate_sectors(struct vnode *vp, daddr64_t sectorStart, daddr64_t sectorCount)
3569 {
3570         struct hfs_inval_blk_no args;
3571         args.sectorStart = sectorStart;
3572         args.sectorCount = sectorCount;
3573
3574         buf_iterate(vp, hfs_invalidate_block_numbers_callback, BUF_SCAN_DIRTY|BUF_SCAN_CLEAN, &args);
3575 }
3576
3577
3578 /*
3579  * Copy the contents of an extent to a new location.  Also invalidates the
3580  * physical block number of any buffer cache block in the copied extent
3581  * (so that if the block is written, it will go through VNOP_BLOCKMAP to
3582  * determine the new physical block number).
3583  */
3584 static int
3585 hfs_copy_extent(
3586         struct hfsmount *hfsmp,
3587         struct vnode *vp,               /* The file whose extent is being copied. */
3588         u_int32_t oldStart,             /* The start of the source extent. */
3589         u_int32_t newStart,             /* The start of the destination extent. */
3590         u_int32_t blockCount,   /* The number of allocation blocks to copy. */
3591         vfs_context_t context)
3592 {
3593         int err = 0;
3594         size_t bufferSize;
3595         void *buffer = NULL;
3596         struct vfsioattr ioattr;
3597         buf_t bp = NULL;
3598         off_t resid;
3599         size_t ioSize;
3600         u_int32_t ioSizeSectors;        /* Device sectors in this I/O */
3601         daddr64_t srcSector, destSector;
3602         u_int32_t sectorsPerBlock = hfsmp->blockSize / hfsmp->hfs_phys_block_size;
3603
3604         /*
3605          * Sanity check that we have locked the vnode of the file we're copying.
3606          *
3607          * But since hfs_systemfile_lock() doesn't actually take the lock on
3608          * the allocation file if a journal is active, ignore the check if the
3609          * file being copied is the allocation file.
3610          */
3611         struct cnode *cp = VTOC(vp);
3612         if (cp != hfsmp->hfs_allocation_cp && cp->c_lockowner != current_thread())
3613                 panic("hfs_copy_extent: vp=%p (cp=%p) not owned?\n", vp, cp);
3614
3615         /*
3616          * Wait for any in-progress writes to this vnode to complete, so that we'll
3617          * be copying consistent bits.  (Otherwise, it's possible that an async
3618          * write will complete to the old extent after we read from it.  That
3619          * could lead to corruption.)
3620          */
3621         err = vnode_waitforwrites(vp, 0, 0, 0, "hfs_copy_extent");
3622         if (err) {
3623                 printf("hfs_copy_extent: Error %d from vnode_waitforwrites\n", err);
3624                 return err;
3625         }
3626
3627         /*
3628          * Determine the I/O size to use
3629          *
3630          * NOTE: Many external drives will result in an ioSize of 128KB.
3631          * TODO: Should we use a larger buffer, doing several consecutive
3632          * reads, then several consecutive writes?
3633          */
3634         vfs_ioattr(hfsmp->hfs_mp, &ioattr);
3635         bufferSize = MIN(ioattr.io_maxreadcnt, ioattr.io_maxwritecnt);
3636         if (kmem_alloc(kernel_map, (vm_offset_t*) &buffer, bufferSize))
3637                 return ENOMEM;
3638
3639         /* Get a buffer for doing the I/O */
3640         bp = buf_alloc(hfsmp->hfs_devvp);
3641         buf_setdataptr(bp, (uintptr_t)buffer);
3642
3643         resid = (off_t) blockCount * (off_t) hfsmp->blockSize;
3644         srcSector = (daddr64_t) oldStart * hfsmp->blockSize / hfsmp->hfs_phys_block_size;
3645         destSector = (daddr64_t) newStart * hfsmp->blockSize / hfsmp->hfs_phys_block_size;
3646         while (resid > 0) {
3647                 ioSize = MIN(bufferSize, resid);
3648                 ioSizeSectors = ioSize / hfsmp->hfs_phys_block_size;
3649
3650                 /* Prepare the buffer for reading */
3651                 buf_reset(bp, B_READ);
3652                 buf_setsize(bp, ioSize);
3653                 buf_setcount(bp, ioSize);
3654                 buf_setblkno(bp, srcSector);
3655                 buf_setlblkno(bp, srcSector);
3656
3657                 /* Do the read */
3658                 err = VNOP_STRATEGY(bp);
3659                 if (!err)
3660                         err = buf_biowait(bp);
3661                 if (err) {
3662                         printf("hfs_copy_extent: Error %d from VNOP_STRATEGY (read)\n", err);
3663                         break;
3664                 }
3665
3666                 /* Prepare the buffer for writing */
3667                 buf_reset(bp, B_WRITE);
3668                 buf_setsize(bp, ioSize);
3669                 buf_setcount(bp, ioSize);
3670                 buf_setblkno(bp, destSector);
3671                 buf_setlblkno(bp, destSector);
3672                 if (journal_uses_fua(hfsmp->jnl))
3673                         buf_markfua(bp);
3674
3675                 /* Do the write */
3676                 vnode_startwrite(hfsmp->hfs_devvp);
3677                 err = VNOP_STRATEGY(bp);
3678                 if (!err)
3679                         err = buf_biowait(bp);
3680                 if (err) {
3681                         printf("hfs_copy_extent: Error %d from VNOP_STRATEGY (write)\n", err);
3682                         break;
3683                 }
3684
3685                 resid -= ioSize;
3686                 srcSector += ioSizeSectors;
3687                 destSector += ioSizeSectors;
3688         }
3689         if (bp)
3690                 buf_free(bp);
3691         if (buffer)
3692                 kmem_free(kernel_map, (vm_offset_t)buffer, bufferSize);
3693
3694         /* Make sure all writes have been flushed to disk. */
3695         if (!journal_uses_fua(hfsmp->jnl)) {
3696                 err = VNOP_IOCTL(hfsmp->hfs_devvp, DKIOCSYNCHRONIZECACHE, NULL, FWRITE, context);
3697                 if (err) {
3698                         printf("hfs_copy_extent: DKIOCSYNCHRONIZECACHE failed (%d)\n", err);
3699                         err = 0;        /* Don't fail the copy. */
3700                 }
3701         }
3702
3703         if (!err)
3704                 hfs_invalidate_sectors(vp, (daddr64_t)oldStart*sectorsPerBlock, (daddr64_t)blockCount*sectorsPerBlock);
3705
3706         return err;
3707 }
3708
3709
3710 /*
3711  * Reclaim space at the end of a volume, used by a given system file.
3712  *
3713  * This routine attempts to move any extent which contains allocation blocks
3714  * at or after "startblk."  A separate transaction is used to do the move.
3715  * The contents of any moved extents are read and written via the volume's
3716  * device vnode -- NOT via "vp."  During the move, moved blocks which are part
3717  * of a transaction have their physical block numbers invalidated so they will
3718  * eventually be written to their new locations.
3719  *
3720  * This routine can be used to move overflow extents for the allocation file.
3721  *
3722  * Inputs:
3723  *    hfsmp       The volume being resized.
3724  *    startblk    Blocks >= this allocation block need to be moved.
3725  *    locks       Which locks need to be taken for the given system file.
3726  *    vp          The vnode for the system file.
3727  *
3728  * Outputs:
3729  *    moved       Set to true if any extents were moved.
3730  */
3731 static int
3732 hfs_relocate_callback(__unused HFSPlusExtentKey *key, HFSPlusExtentRecord *record, HFSPlusExtentRecord *state)
3733 {
3734         bcopy(state, record, sizeof(HFSPlusExtentRecord));
3735         return 0;
3736 }
3737 static int
3738 hfs_reclaim_sys_file(struct hfsmount *hfsmp, struct vnode *vp, u_long startblk, int locks, Boolean *moved, vfs_context_t context)
3739 {
3740         int error;
3741         int lockflags;
3742         int i;
3743         u_long datablks;
3744         u_long block;
3745         u_int32_t oldStartBlock;
3746         u_int32_t newStartBlock;
3747         u_int32_t blockCount;
3748         struct filefork *fp;
3749
3750         /* If there is no vnode for this file, then there's nothing to do. */
3751         if (vp == NULL)
3752                 return 0;
3753
3754         /* printf("hfs_reclaim_sys_file: %.*s\n", VTOC(vp)->c_desc.cd_namelen, VTOC(vp)->c_desc.cd_nameptr); */
3755
3756         /* We always need the allocation bitmap and extents B-tree */
3757         locks |= SFL_BITMAP | SFL_EXTENTS;
3758
3759         error = hfs_start_transaction(hfsmp);
3760         if (error) {
3761                 printf("hfs_reclaim_sys_file: hfs_start_transaction returned %d\n", error);
3762                 return error;
3763         }
3764         lockflags = hfs_systemfile_lock(hfsmp, locks, HFS_EXCLUSIVE_LOCK);
3765         fp = VTOF(vp);
3766         datablks = 0;
3767
3768         /* Relocate non-overflow extents */
3769         for (i = 0; i < kHFSPlusExtentDensity; ++i) {
3770                 if (fp->ff_extents[i].blockCount == 0)
3771                         break;
3772                 oldStartBlock = fp->ff_extents[i].startBlock;
3773                 blockCount = fp->ff_extents[i].blockCount;
3774                 datablks += blockCount;
3775                 block = oldStartBlock + blockCount;
3776                 if (block > startblk) {
3777                         error = BlockAllocate(hfsmp, 1, blockCount, blockCount, true, true, &newStartBlock, &blockCount);
3778                         if (error) {
3779                                 printf("hfs_reclaim_sys_file: BlockAllocate returned %d\n", error);
3780                                 goto fail;
3781                         }
3782                         if (blockCount != fp->ff_extents[i].blockCount) {
3783                                 printf("hfs_reclaim_sys_file: new blockCount=%u, original blockCount=%u", blockCount, fp->ff_extents[i].blockCount);
3784                                 goto free_fail;
3785                         }
3786                         error = hfs_copy_extent(hfsmp, vp, oldStartBlock, newStartBlock, blockCount, context);
3787                         if (error) {
3788                                 printf("hfs_reclaim_sys_file: hfs_copy_extent returned %d\n", error);
3789                                 goto free_fail;
3790                         }
3791                         fp->ff_extents[i].startBlock = newStartBlock;
3792                         VTOC(vp)->c_flag |= C_MODIFIED;
3793                         *moved = true;
3794                         error = BlockDeallocate(hfsmp, oldStartBlock, blockCount);
3795                         if (error) {
3796                                 /* TODO: Mark volume inconsistent? */
3797                                 printf("hfs_reclaim_sys_file: BlockDeallocate returned %d\n", error);
3798                                 goto fail;
3799                         }
3800                         error = hfs_flushvolumeheader(hfsmp, MNT_WAIT, HFS_ALTFLUSH);
3801                         if (error) {
3802                                 /* TODO: Mark volume inconsistent? */
3803                                 printf("hfs_reclaim_sys_file: hfs_flushvolumeheader returned %d\n", error);
3804                                 goto fail;
3805                         }
3806                 }
3807         }
3808
3809         /* Relocate overflow extents (if any) */
3810         if (i == kHFSPlusExtentDensity && fp->ff_blocks > datablks) {
3811                 struct BTreeIterator *iterator = NULL;
3812                 struct FSBufferDescriptor btdata;
3813                 HFSPlusExtentRecord record;
3814                 HFSPlusExtentKey *key;
3815                 FCB *fcb;
3816                 u_int32_t fileID;
3817                 u_int8_t forktype;
3818
3819                 forktype = VNODE_IS_RSRC(vp) ? 0xFF : 0;
3820                 fileID = VTOC(vp)->c_cnid;
3821                 if (kmem_alloc(kernel_map, (vm_offset_t*) &iterator, sizeof(*iterator))) {
3822                         printf("hfs_reclaim_sys_file: kmem_alloc failed!\n");
3823                         error = ENOMEM;
3824                         goto fail;
3825                 }
3826
3827                 bzero(iterator, sizeof(*iterator));
3828                 key = (HFSPlusExtentKey *) &iterator->key;
3829                 key->keyLength = kHFSPlusExtentKeyMaximumLength;
3830                 key->forkType = forktype;
3831                 key->fileID = fileID;
3832                 key->startBlock = datablks;
3833
3834                 btdata.bufferAddress = &record;
3835                 btdata.itemSize = sizeof(record);
3836                 btdata.itemCount = 1;
3837
3838                 fcb = VTOF(hfsmp->hfs_extents_vp);
3839
3840                 error = BTSearchRecord(fcb, iterator, &btdata, NULL, iterator);
3841                 while (error == 0) {
3842                         /* Stop when we encounter a different file or fork. */
3843                         if ((key->fileID != fileID) ||
3844                                 (key->forkType != forktype)) {
3845                                 break;
3846                         }
3847                         /*
3848                          * Check if the file overlaps target space.
3849                          */
3850                         for (i = 0; i < kHFSPlusExtentDensity; ++i) {
3851                                 if (record[i].blockCount == 0) {
3852                                         goto overflow_done;
3853                                 }
3854                                 oldStartBlock = record[i].startBlock;
3855                                 blockCount = record[i].blockCount;
3856                                 block = oldStartBlock + blockCount;
3857                                 if (block > startblk) {
3858                                         error = BlockAllocate(hfsmp, 1, blockCount, blockCount, true, true, &newStartBlock, &blockCount);
3859                                         if (error) {
3860                                                 printf("hfs_reclaim_sys_file: BlockAllocate returned %d\n", error);
3861                                                 goto overflow_done;
3862                                         }
3863                                         if (blockCount != record[i].blockCount) {
3864                                                 printf("hfs_reclaim_sys_file: new blockCount=%u, original blockCount=%u", blockCount, fp->ff_extents[i].blockCount);
3865                                                 kmem_free(kernel_map, (vm_offset_t)iterator, sizeof(*iterator));
3866                                                 goto free_fail;
3867                                         }
3868                                         error = hfs_copy_extent(hfsmp, vp, oldStartBlock, newStartBlock, blockCount, context);
3869                                         if (error) {
3870                                                 printf("hfs_reclaim_sys_file: hfs_copy_extent returned %d\n", error);
3871                                                 kmem_free(kernel_map, (vm_offset_t)iterator, sizeof(*iterator));
3872                                                 goto free_fail;
3873                                         }
3874                                         record[i].startBlock = newStartBlock;
3875                                         VTOC(vp)->c_flag |= C_MODIFIED;
3876                                         *moved = true;
3877                                         /*
3878                                          * NOTE: To support relocating overflow extents of the
3879                                          * allocation file, we must update the BTree record BEFORE
3880                                          * deallocating the old extent so that BlockDeallocate will
3881                                          * use the extent's new location to calculate physical block
3882                                          * numbers.  (This is for the case where the old extent's
3883                                          * bitmap bits actually reside in the extent being moved.)
3884                                          */
3885                                         error = BTUpdateRecord(fcb, iterator, (IterateCallBackProcPtr) hfs_relocate_callback, &record);
3886                                         if (error) {
3887                                                 /* TODO: Mark volume inconsistent? */
3888                                                 printf("hfs_reclaim_sys_file: BTUpdateRecord returned %d\n", error);
3889                                                 goto overflow_done;
3890                                         }
3891                                         error = BlockDeallocate(hfsmp, oldStartBlock, blockCount);
3892                                         if (error) {
3893                                                 /* TODO: Mark volume inconsistent? */
3894                                                 printf("hfs_reclaim_sys_file: BlockDeallocate returned %d\n", error);
3895                                                 goto overflow_done;
3896                                         }
3897                                 }
3898                         }
3899                         /* Look for more records. */
3900                         error = BTIterateRecord(fcb, kBTreeNextRecord, iterator, &btdata, NULL);
3901                         if (error == btNotFound) {
3902                                 error = 0;
3903                                 break;
3904                         }
3905                 }
3906 overflow_done:
3907                 kmem_free(kernel_map, (vm_offset_t)iterator, sizeof(*iterator));
3908                 if (error) {
3909                         goto fail;
3910                 }
3911         }
3912
3913         hfs_systemfile_unlock(hfsmp, lockflags);
3914         error = hfs_end_transaction(hfsmp);
3915         if (error) {
3916                 printf("hfs_reclaim_sys_file: hfs_end_transaction returned %d\n", error);
3917         }
3918
3919         return error;
3920
3921 free_fail:
3922         (void) BlockDeallocate(hfsmp, newStartBlock, blockCount);
3923 fail:
3924         (void) hfs_systemfile_unlock(hfsmp, lockflags);
3925         (void) hfs_end_transaction(hfsmp);
3926         return error;
3927 }
3928
3929
3930 /*
3931  * This journal_relocate callback updates the journal info block to point
3932  * at the new journal location.  This write must NOT be done using the
3933  * transaction.  We must write the block immediately.  We must also force
3934  * it to get to the media so that the new journal location will be seen by
3935  * the replay code before we can safely let journaled blocks be written
3936  * to their normal locations.
3937  *
3938  * The tests for journal_uses_fua below are mildly hacky.  Since the journal
3939  * and the file system are both on the same device, I'm leveraging what
3940  * the journal has decided about FUA.
3941  */
3942 struct hfs_journal_relocate_args {
3943         struct hfsmount *hfsmp;
3944         vfs_context_t context;
3945         u_int32_t newStartBlock;
3946 };
3947
3948 static errno_t
3949 hfs_journal_relocate_callback(void *_args)
3950 {
3951         int error;
3952         struct hfs_journal_relocate_args *args = _args;
3953         struct hfsmount *hfsmp = args->hfsmp;
3954         buf_t bp;
3955         JournalInfoBlock *jibp;
3956
3957         error = buf_meta_bread(hfsmp->hfs_devvp,
3958                 hfsmp->vcbJinfoBlock * (hfsmp->blockSize/hfsmp->hfs_phys_block_size),
3959                 hfsmp->blockSize, vfs_context_ucred(args->context), &bp);
3960         if (error) {
3961                 printf("hfs_reclaim_journal_file: failed to read JIB (%d)\n", error);
3962                 return error;
3963         }
3964         jibp = (JournalInfoBlock*) buf_dataptr(bp);
3965         jibp->offset = SWAP_BE64((u_int64_t)args->newStartBlock * hfsmp->blockSize);
3966         jibp->size = SWAP_BE64(hfsmp->jnl_size);
3967         if (journal_uses_fua(hfsmp->jnl))
3968                 buf_markfua(bp);
3969         error = buf_bwrite(bp);
3970         if (error) {
3971                 printf("hfs_reclaim_journal_file: failed to write JIB (%d)\n", error);
3972                 return error;
3973         }
3974         if (!journal_uses_fua(hfsmp->jnl)) {
3975                 error = VNOP_IOCTL(hfsmp->hfs_devvp, DKIOCSYNCHRONIZECACHE, NULL, FWRITE, args->context);
3976                 if (error) {
3977                         printf("hfs_reclaim_journal_file: DKIOCSYNCHRONIZECACHE failed (%d)\n", error);
3978                         error = 0;              /* Don't fail the operation. */
3979                 }
3980         }
3981
3982         return error;
3983 }
3984
3985
3986 static int
3987 hfs_reclaim_journal_file(struct hfsmount *hfsmp, vfs_context_t context)
3988 {
3989         int error;
3990         int lockflags;
3991         u_int32_t newStartBlock;
3992         u_int32_t oldBlockCount;
3993         u_int32_t newBlockCount;
3994         struct cat_desc journal_desc;
3995         struct cat_attr journal_attr;
3996         struct cat_fork journal_fork;
3997         struct hfs_journal_relocate_args callback_args;
3998
3999         error = hfs_start_transaction(hfsmp);
4000         if (error) {
4001                 printf("hfs_reclaim_journal_file: hfs_start_transaction returned %d\n", error);
4002                 return error;
4003         }
4004         lockflags = hfs_systemfile_lock(hfsmp, SFL_CATALOG | SFL_BITMAP, HFS_EXCLUSIVE_LOCK);
4005
4006         oldBlockCount = hfsmp->jnl_size / hfsmp->blockSize;
4007
4008         /* TODO: Allow the journal to change size based on the new volume size. */
4009         error = BlockAllocate(hfsmp, 1, oldBlockCount, oldBlockCount, true, true, &newStartBlock, &newBlockCount);
4010         if (error) {
4011                 printf("hfs_reclaim_journal_file: BlockAllocate returned %d\n", error);
4012                 goto fail;
4013         }
4014         if (newBlockCount != oldBlockCount) {
4015                 printf("hfs_reclaim_journal_file: newBlockCount != oldBlockCount (%u, %u)\n", newBlockCount, oldBlockCount);
4016                 goto free_fail;
4017         }
4018
4019         error = BlockDeallocate(hfsmp, hfsmp->jnl_start, oldBlockCount);
4020         if (error) {
4021                 printf("hfs_reclaim_journal_file: BlockDeallocate returned %d\n", error);
4022                 goto free_fail;
4023         }
4024
4025         /* Update the catalog record for .journal */
4026         error = cat_idlookup(hfsmp, hfsmp->hfs_jnlfileid, 1, &journal_desc, &journal_attr, &journal_fork);
4027         if (error) {
4028                 printf("hfs_reclaim_journal_file: cat_idlookup returned %d\n", error);
4029                 goto free_fail;
4030         }
4031         journal_fork.cf_size = newBlockCount * hfsmp->blockSize;
4032         journal_fork.cf_extents[0].startBlock = newStartBlock;
4033         journal_fork.cf_extents[0].blockCount = newBlockCount;
4034         journal_fork.cf_blocks = newBlockCount;
4035         error = cat_update(hfsmp, &journal_desc, &journal_attr, &journal_fork, NULL);
4036         cat_releasedesc(&journal_desc);  /* all done with cat descriptor */
4037         if (error) {
4038                 printf("hfs_reclaim_journal_file: cat_update returned %d\n", error);
4039                 goto free_fail;
4040         }
4041         callback_args.hfsmp = hfsmp;
4042         callback_args.context = context;
4043         callback_args.newStartBlock = newStartBlock;
4044
4045         error = journal_relocate(hfsmp->jnl, (off_t)newStartBlock*hfsmp->blockSize,
4046                 (off_t)newBlockCount*hfsmp->blockSize, 0,
4047                 hfs_journal_relocate_callback, &callback_args);
4048         if (error) {
4049                 /* NOTE: journal_relocate will mark the journal invalid. */
4050                 printf("hfs_reclaim_journal_file: journal_relocate returned %d\n", error);
4051                 goto fail;
4052         }
4053         hfsmp->jnl_start = newStartBlock;
4054         hfsmp->jnl_size = (off_t)newBlockCount * hfsmp->blockSize;
4055
4056         hfs_systemfile_unlock(hfsmp, lockflags);
4057         error = hfs_end_transaction(hfsmp);
4058         if (error) {
4059                 printf("hfs_reclaim_journal_file: hfs_end_transaction returned %d\n", error);
4060         }
4061
4062         return error;
4063
4064 free_fail:
4065         (void) BlockDeallocate(hfsmp, newStartBlock, newBlockCount);
4066 fail:
4067         hfs_systemfile_unlock(hfsmp, lockflags);
4068         (void) hfs_end_transaction(hfsmp);
4069         return error;
4070 }
4071
4072
4073 /*
4074  * Move the journal info block to a new location.  We have to make sure the
4075  * new copy of the journal info block gets to the media first, then change
4076  * the field in the volume header and the catalog record.
4077  */
4078 static int
4079 hfs_reclaim_journal_info_block(struct hfsmount *hfsmp, vfs_context_t context)
4080 {
4081         int error;
4082         int lockflags;
4083         u_int32_t newBlock;
4084         u_int32_t blockCount;
4085         struct cat_desc jib_desc;
4086         struct cat_attr jib_attr;
4087         struct cat_fork jib_fork;
4088         buf_t old_bp, new_bp;
4089
4090         error = hfs_start_transaction(hfsmp);
4091         if (error) {
4092                 printf("hfs_reclaim_journal_info_block: hfs_start_transaction returned %d\n", error);
4093                 return error;
4094         }
4095         lockflags = hfs_systemfile_lock(hfsmp, SFL_CATALOG | SFL_BITMAP, HFS_EXCLUSIVE_LOCK);
4096
4097         error = BlockAllocate(hfsmp, 1, 1, 1, true, true, &newBlock, &blockCount);
4098         if (error) {
4099                 printf("hfs_reclaim_journal_info_block: BlockAllocate returned %d\n", error);
4100                 goto fail;
4101         }
4102         if (blockCount != 1) {
4103                 printf("hfs_reclaim_journal_info_block: blockCount != 1 (%u)\n", blockCount);
4104                 goto free_fail;
4105         }
4106         error = BlockDeallocate(hfsmp, hfsmp->vcbJinfoBlock, 1);
4107         if (error) {
4108                 printf("hfs_reclaim_journal_info_block: BlockDeallocate returned %d\n", error);
4109                 goto free_fail;
4110         }
4111
4112         /* Copy the old journal info block content to the new location */
4113         error = buf_meta_bread(hfsmp->hfs_devvp,
4114                 hfsmp->vcbJinfoBlock * (hfsmp->blockSize/hfsmp->hfs_phys_block_size),
4115                 hfsmp->blockSize, vfs_context_ucred(context), &old_bp);
4116         if (error) {
4117                 printf("hfs_reclaim_journal_info_block: failed to read JIB (%d)\n", error);
4118                 goto free_fail;
4119         }
4120         new_bp = buf_getblk(hfsmp->hfs_devvp,
4121                 newBlock * (hfsmp->blockSize/hfsmp->hfs_phys_block_size),
4122                 hfsmp->blockSize, 0, 0, BLK_META);
4123         bcopy((char*)buf_dataptr(old_bp), (char*)buf_dataptr(new_bp), hfsmp->blockSize);
4124         buf_brelse(old_bp);
4125         if (journal_uses_fua(hfsmp->jnl))
4126                 buf_markfua(new_bp);
4127         error = buf_bwrite(new_bp);
4128         if (error) {
4129                 printf("hfs_reclaim_journal_info_block: failed to write new JIB (%d)\n", error);
4130                 goto free_fail;
4131         }
4132         if (!journal_uses_fua(hfsmp->jnl)) {
4133                 error = VNOP_IOCTL(hfsmp->hfs_devvp, DKIOCSYNCHRONIZECACHE, NULL, FWRITE, context);
4134                 if (error) {
4135                         printf("hfs_reclaim_journal_info_block: DKIOCSYNCHRONIZECACHE failed (%d)\n", error);
4136                         /* Don't fail the operation. */
4137                 }
4138         }
4139
4140         /* Update the catalog record for .journal_info_block */
4141         error = cat_idlookup(hfsmp, hfsmp->hfs_jnlinfoblkid, 1, &jib_desc, &jib_attr, &jib_fork);
4142         if (error) {
4143                 printf("hfs_reclaim_journal_file: cat_idlookup returned %d\n", error);
4144                 goto fail;
4145         }
4146         jib_fork.cf_size = hfsmp->blockSize;
4147         jib_fork.cf_extents[0].startBlock = newBlock;
4148         jib_fork.cf_extents[0].blockCount = 1;
4149         jib_fork.cf_blocks = 1;
4150         error = cat_update(hfsmp, &jib_desc, &jib_attr, &jib_fork, NULL);
4151         cat_releasedesc(&jib_desc);  /* all done with cat descriptor */
4152         if (error) {
4153                 printf("hfs_reclaim_journal_info_block: cat_update returned %d\n", error);
4154                 goto fail;
4155         }
4156
4157         /* Update the pointer to the journal info block in the volume header. */
4158         hfsmp->vcbJinfoBlock = newBlock;
4159         error = hfs_flushvolumeheader(hfsmp, MNT_WAIT, HFS_ALTFLUSH);
4160         if (error) {
4161                 printf("hfs_reclaim_journal_info_block: hfs_flushvolumeheader returned %d\n", error);
4162                 goto fail;
4163         }
4164         hfs_systemfile_unlock(hfsmp, lockflags);
4165         error = hfs_end_transaction(hfsmp);
4166         if (error) {
4167                 printf("hfs_reclaim_journal_info_block: hfs_end_transaction returned %d\n", error);
4168         }
4169         error = journal_flush(hfsmp->jnl);
4170         if (error) {
4171                 printf("hfs_reclaim_journal_info_block: journal_flush returned %d\n", error);
4172         }
4173         return error;
4174
4175 free_fail:
4176         (void) BlockDeallocate(hfsmp, newBlock, blockCount);
4177 fail:
4178         hfs_systemfile_unlock(hfsmp, lockflags);
4179         (void) hfs_end_transaction(hfsmp);
4180         return error;
4181 }
4182
4183
4184 /*
4185  * Reclaim space at the end of a file system.
4186  */
4187 static int
4188 hfs_reclaimspace(struct hfsmount *hfsmp, u_long startblk, u_long reclaimblks, vfs_context_t context)
4189 {
4190         struct vnode *vp = NULL;
4191         FCB *fcb;
4192         struct BTreeIterator * iterator = NULL;
4193         struct FSBufferDescriptor btdata;
4194         struct HFSPlusCatalogFile filerec;
4195         u_int32_t  saved_next_allocation;
4196         cnid_t * cnidbufp;
4197         size_t cnidbufsize;
4198         int filecnt = 0;
4199         int maxfilecnt;
4200         u_long block;
4201         u_long datablks;
4202         u_long rsrcblks;
4203         u_long blkstomove = 0;
4204         int lockflags;
4205         int i;
4206         int error;
4207         int lastprogress = 0;
4208         Boolean system_file_moved = false;
4209
4210         /* Relocate extents of the Allocation file if they're in the way. */
4211         error = hfs_reclaim_sys_file(hfsmp, hfsmp->hfs_allocation_vp, startblk, SFL_BITMAP, &system_file_moved, context);
4212         if (error) {
4213                 printf("hfs_reclaimspace: reclaim allocation file returned %d\n", error);
4214                 return error;
4215         }
4216         /* Relocate extents of the Extents B-tree if they're in the way. */
4217         error = hfs_reclaim_sys_file(hfsmp, hfsmp->hfs_extents_vp, startblk, SFL_EXTENTS, &system_file_moved, context);
4218         if (error) {
4219                 printf("hfs_reclaimspace: reclaim extents b-tree returned %d\n", error);
4220                 return error;
4221         }
4222         /* Relocate extents of the Catalog B-tree if they're in the way. */
4223         error = hfs_reclaim_sys_file(hfsmp, hfsmp->hfs_catalog_vp, startblk, SFL_CATALOG, &system_file_moved, context);
4224         if (error) {
4225                 printf("hfs_reclaimspace: reclaim catalog b-tree returned %d\n", error);
4226                 return error;
4227         }
4228         /* Relocate extents of the Attributes B-tree if they're in the way. */
4229         error = hfs_reclaim_sys_file(hfsmp, hfsmp->hfs_attribute_vp, startblk, SFL_ATTRIBUTE, &system_file_moved, context);
4230         if (error) {
4231                 printf("hfs_reclaimspace: reclaim attribute b-tree returned %d\n", error);
4232                 return error;
4233         }
4234         /* Relocate extents of the Startup File if there is one and they're in the way. */
4235         error = hfs_reclaim_sys_file(hfsmp, hfsmp->hfs_startup_vp, startblk, SFL_STARTUP, &system_file_moved, context);
4236         if (error) {
4237                 printf("hfs_reclaimspace: reclaim startup file returned %d\n", error);
4238                 return error;
4239         }
4240
4241         /*
4242          * We need to make sure the alternate volume header gets flushed if we moved
4243          * any extents in the volume header.  But we need to do that before
4244          * shrinking the size of the volume, or else the journal code will panic
4245          * with an invalid (too large) block number.
4246          *
4247          * Note that system_file_moved will be set if ANY extent was moved, even
4248          * if it was just an overflow extent.  In this case, the journal_flush isn't
4249          * strictly required, but shouldn't hurt.
4250          */
4251         if (system_file_moved)
4252                 journal_flush(hfsmp->jnl);
4253
4254         if (hfsmp->jnl_start + (hfsmp->jnl_size / hfsmp->blockSize) > startblk) {
4255                 error = hfs_reclaim_journal_file(hfsmp, context);
4256                 if (error) {
4257                         printf("hfs_reclaimspace: hfs_reclaim_journal_file failed (%d)\n", error);
4258                         return error;
4259                 }
4260         }
4261
4262         if (hfsmp->vcbJinfoBlock >= startblk) {
4263                 error = hfs_reclaim_journal_info_block(hfsmp, context);
4264                 if (error) {
4265                         printf("hfs_reclaimspace: hfs_reclaim_journal_info_block failed (%d)\n", error);
4266                         return error;
4267                 }
4268         }
4269
4270         /* For now move a maximum of 250,000 files. */
4271         maxfilecnt = MIN(hfsmp->hfs_filecount, 250000);
4272         maxfilecnt = MIN((u_long)maxfilecnt, reclaimblks);
4273         cnidbufsize = maxfilecnt * sizeof(cnid_t);
4274         if (kmem_alloc(kernel_map, (vm_offset_t *)&cnidbufp, cnidbufsize)) {
4275                 return (ENOMEM);
4276         }
4277         if (kmem_alloc(kernel_map, (vm_offset_t *)&iterator, sizeof(*iterator))) {
4278                 kmem_free(kernel_map, (vm_offset_t)cnidbufp, cnidbufsize);
4279                 return (ENOMEM);
4280         }
4281
4282         saved_next_allocation = hfsmp->nextAllocation;
4283         HFS_UPDATE_NEXT_ALLOCATION(hfsmp, hfsmp->hfs_metazone_start);
4284
4285         fcb = VTOF(hfsmp->hfs_catalog_vp);
4286         bzero(iterator, sizeof(*iterator));
4287
4288         btdata.bufferAddress = &filerec;
4289         btdata.itemSize = sizeof(filerec);
4290         btdata.itemCount = 1;
4291
4292         /* Keep the Catalog and extents files locked during iteration. */
4293         lockflags = hfs_systemfile_lock(hfsmp, SFL_CATALOG | SFL_EXTENTS, HFS_SHARED_LOCK);
4294
4295         error = BTIterateRecord(fcb, kBTreeFirstRecord, iterator, NULL, NULL);
4296         if (error) {
4297                 goto end_iteration;
4298         }
4299         /*
4300          * Iterate over all the catalog records looking for files
4301          * that overlap into the space we're trying to free up.
4302          */
4303         for (filecnt = 0; filecnt < maxfilecnt; ) {
4304                 error = BTIterateRecord(fcb, kBTreeNextRecord, iterator, &btdata, NULL);
4305                 if (error) {
4306                         if (error == fsBTRecordNotFoundErr || error == fsBTEndOfIterationErr) {
4307                                 error = 0;
4308                         }
4309                         break;
4310                 }
4311                 if (filerec.recordType != kHFSPlusFileRecord) {
4312                         continue;
4313                 }
4314                 datablks = rsrcblks = 0;
4315                 /*
4316                  * Check if either fork overlaps target space.
4317                  */
4318                 for (i = 0; i < kHFSPlusExtentDensity; ++i) {
4319                         if (filerec.dataFork.extents[i].blockCount != 0) {
4320                                 datablks += filerec.dataFork.extents[i].blockCount;
4321                                 block = filerec.dataFork.extents[i].startBlock +
4322                                                 filerec.dataFork.extents[i].blockCount;
4323                                 if (block >= startblk) {
4324                                         if ((filerec.fileID == hfsmp->hfs_jnlfileid) ||
4325                                                 (filerec.fileID == hfsmp->hfs_jnlinfoblkid)) {
4326                                                 printf("hfs_reclaimspace: cannot move active journal\n");
4327                                                 error = EPERM;
4328                                                 goto end_iteration;
4329                                         }
4330                                         cnidbufp[filecnt++] = filerec.fileID;
4331                                         blkstomove += filerec.dataFork.totalBlocks;
4332                                         break;
4333                                 }
4334                         }
4335                         if (filerec.resourceFork.extents[i].blockCount != 0) {
4336                                 rsrcblks += filerec.resourceFork.extents[i].blockCount;
4337                                 block = filerec.resourceFork.extents[i].startBlock +
4338                                                 filerec.resourceFork.extents[i].blockCount;
4339                                 if (block >= startblk) {
4340                                         cnidbufp[filecnt++] = filerec.fileID;
4341                                         blkstomove += filerec.resourceFork.totalBlocks;
4342                                         break;
4343                                 }
4344                         }
4345                 }
4346                 /*
4347                  * Check for any overflow extents that overlap.
4348                  */
4349                 if (i == kHFSPlusExtentDensity) {
4350                         if (filerec.dataFork.totalBlocks > datablks) {
4351                                 if (hfs_overlapped_overflow_extents(hfsmp, startblk, datablks, filerec.fileID, 0)) {
4352                                         cnidbufp[filecnt++] = filerec.fileID;
4353                                         blkstomove += filerec.dataFork.totalBlocks;
4354                                 }
4355                         } else if (filerec.resourceFork.totalBlocks > rsrcblks) {
4356                                 if (hfs_overlapped_overflow_extents(hfsmp, startblk, rsrcblks, filerec.fileID, 1)) {
4357                                         cnidbufp[filecnt++] = filerec.fileID;
4358                                         blkstomove += filerec.resourceFork.totalBlocks;
4359                                 }
4360                         }
4361                 }
4362         }
4363
4364 end_iteration:
4365         if (filecnt == 0 && !system_file_moved) {
4366                 printf("hfs_reclaimspace: no files moved\n");
4367                 error = ENOSPC;
4368         }
4369         /* All done with catalog. */
4370         hfs_systemfile_unlock(hfsmp, lockflags);
4371         if (error || filecnt == 0)
4372                 goto out;
4373
4374         /*
4375          * Double check space requirements to make sure
4376          * there is enough space to relocate any files
4377          * that reside in the reclaim area.
4378          *
4379          *                                          Blocks To Move --------------
4380          *                                                            |    |    |
4381          *                                                            V    V    V
4382          * ------------------------------------------------------------------------
4383          * |                                                        | /   ///  // |
4384          * |                                                        | /   ///  // |
4385          * |                                                        | /   ///  // |
4386          * ------------------------------------------------------------------------
4387          *
4388          * <------------------- New Total Blocks ------------------><-- Reclaim -->
4389          *
4390          * <------------------------ Original Total Blocks ----------------------->
4391          *
4392          */
4393         if (blkstomove >= hfs_freeblks(hfsmp, 1)) {
4394                 printf("hfs_truncatefs: insufficient space (need %lu blocks; have %u blocks)\n", blkstomove, hfs_freeblks(hfsmp, 1));
4395                 error = ENOSPC;
4396                 goto out;
4397         }
4398         hfsmp->hfs_resize_filesmoved = 0;
4399         hfsmp->hfs_resize_totalfiles = filecnt;
4400
4401         /* Now move any files that are in the way. */
4402         for (i = 0; i < filecnt; ++i) {
4403                 struct vnode * rvp;
4404
4405                 if (hfs_vget(hfsmp, cnidbufp[i], &vp, 0) != 0)
4406                         continue;
4407
4408                 /* Relocate any data fork blocks. */
4409                 if (VTOF(vp)->ff_blocks > 0) {
4410                         error = hfs_relocate(vp, hfsmp->hfs_metazone_end + 1, kauth_cred_get(), current_proc());
4411                 }
4412                 if (error)
4413                         break;
4414
4415                 /* Relocate any resource fork blocks. */
4416                 if ((VTOC((vp))->c_blocks - VTOF((vp))->ff_blocks) > 0) {
4417                         error = hfs_vgetrsrc(hfsmp, vp, &rvp, TRUE);
4418                         if (error)
4419                                 break;
4420                         error = hfs_relocate(rvp, hfsmp->hfs_metazone_end + 1, kauth_cred_get(), current_proc());
4421                         vnode_put(rvp);
4422                         if (error)
4423                                 break;
4424                 }
4425                 hfs_unlock(VTOC(vp));
4426                 vnode_put(vp);
4427                 vp = NULL;
4428
4429                 ++hfsmp->hfs_resize_filesmoved;
4430
4431                 /* Report intermediate progress. */
4432                 if (filecnt > 100) {
4433                         int progress;
4434
4435                         progress = (i * 100) / filecnt;
4436                         if (progress > (lastprogress + 9)) {
4437                                 printf("hfs_reclaimspace: %d%% done...\n", progress);
4438                                 lastprogress = progress;
4439                         }
4440                 }
4441         }
4442         if (vp) {
4443                 hfs_unlock(VTOC(vp));
4444                 vnode_put(vp);
4445                 vp = NULL;
4446         }
4447         if (hfsmp->hfs_resize_filesmoved != 0) {
4448                 printf("hfs_reclaimspace: relocated %d files on \"%s\"\n",
4449                        (int)hfsmp->hfs_resize_filesmoved, hfsmp->vcbVN);
4450         }
4451 out:
4452         kmem_free(kernel_map, (vm_offset_t)iterator, sizeof(*iterator));
4453         kmem_free(kernel_map, (vm_offset_t)cnidbufp, cnidbufsize);
4454
4455         /*
4456          * Restore the roving allocation pointer on errors.
4457          * (but only if we didn't move any files)
4458          */
4459         if (error && hfsmp->hfs_resize_filesmoved == 0) {
4460                 HFS_UPDATE_NEXT_ALLOCATION(hfsmp, saved_next_allocation);
4461         }
4462         return (error);
4463 }
4464
4465
4466 /*
4467  * Check if there are any overflow extents that overlap.
4468  */
4469 static int
4470 hfs_overlapped_overflow_extents(struct hfsmount *hfsmp, u_int32_t startblk, u_int32_t catblks, u_int32_t fileID, int rsrcfork)
4471 {
4472         struct BTreeIterator * iterator = NULL;
4473         struct FSBufferDescriptor btdata;
4474         HFSPlusExtentRecord extrec;
4475         HFSPlusExtentKey *extkeyptr;
4476         FCB *fcb;
4477         u_int32_t block;
4478         u_int8_t forktype;
4479         int overlapped = 0;
4480         int i;
4481         int error;
4482
4483         forktype = rsrcfork ? 0xFF : 0;
4484         if (kmem_alloc(kernel_map, (vm_offset_t *)&iterator, sizeof(*iterator))) {
4485                 return (0);
4486         }
4487         bzero(iterator, sizeof(*iterator));
4488         extkeyptr = (HFSPlusExtentKey *)&iterator->key;
4489         extkeyptr->keyLength = kHFSPlusExtentKeyMaximumLength;
4490         extkeyptr->forkType = forktype;
4491         extkeyptr->fileID = fileID;
4492         extkeyptr->startBlock = catblks;
4493
4494         btdata.bufferAddress = &extrec;
4495         btdata.itemSize = sizeof(extrec);
4496         btdata.itemCount = 1;
4497
4498         fcb = VTOF(hfsmp->hfs_extents_vp);
4499
4500         error = BTSearchRecord(fcb, iterator, &btdata, NULL, iterator);
4501         while (error == 0) {
4502                 /* Stop when we encounter a different file. */
4503                 if ((extkeyptr->fileID != fileID) ||
4504                     (extkeyptr->forkType != forktype)) {
4505                         break;
4506                 }
4507                 /*
4508                  * Check if the file overlaps target space.
4509                  */
4510                 for (i = 0; i < kHFSPlusExtentDensity; ++i) {
4511                         if (extrec[i].blockCount == 0) {
4512                                 break;
4513                         }
4514                         block = extrec[i].startBlock + extrec[i].blockCount;
4515                         if (block >= startblk) {
4516                                 overlapped = 1;
4517                                 break;
4518                         }
4519                 }
4520                 /* Look for more records. */
4521                 error = BTIterateRecord(fcb, kBTreeNextRecord, iterator, &btdata, NULL);
4522         }
4523
4524         kmem_free(kernel_map, (vm_offset_t)iterator, sizeof(*iterator));
4525         return (overlapped);
4526 }
4527
4528
4529 /*
4530  * Calculate the progress of a file system resize operation.
4531  */
4532 __private_extern__
4533 int
4534 hfs_resize_progress(struct hfsmount *hfsmp, u_int32_t *progress)
4535 {
4536         if ((hfsmp->hfs_flags & HFS_RESIZE_IN_PROGRESS) == 0) {
4537                 return (ENXIO);
4538         }
4539
4540         if (hfsmp->hfs_resize_totalfiles > 0)
4541                 *progress = (hfsmp->hfs_resize_filesmoved * 100) / hfsmp->hfs_resize_totalfiles;
4542         else
4543                 *progress = 0;
4544
4545         return (0);
4546 }
4547
4548
4549 /*
4550  * Get file system attributes.
4551  */
4552 static int
4553 hfs_vfs_getattr(struct mount *mp, struct vfs_attr *fsap, __unused vfs_context_t context)
4554 {
4555 #define HFS_ATTR_CMN_VALIDMASK (ATTR_CMN_VALIDMASK & ~(ATTR_CMN_NAMEDATTRCOUNT | ATTR_CMN_NAMEDATTRLIST))
4556 #define HFS_ATTR_FILE_VALIDMASK (ATTR_FILE_VALIDMASK & ~(ATTR_FILE_FILETYPE | ATTR_FILE_FORKCOUNT | ATTR_FILE_FORKLIST))
4557
4558         ExtendedVCB *vcb = VFSTOVCB(mp);
4559         struct hfsmount *hfsmp = VFSTOHFS(mp);
4560         u_long freeCNIDs;
4561
4562         freeCNIDs = (u_long)0xFFFFFFFF - (u_long)hfsmp->vcbNxtCNID;
4563
4564         VFSATTR_RETURN(fsap, f_objcount, (u_int64_t)hfsmp->vcbFilCnt + (u_int64_t)hfsmp->vcbDirCnt);
4565         VFSATTR_RETURN(fsap, f_filecount, (u_int64_t)hfsmp->vcbFilCnt);
4566         VFSATTR_RETURN(fsap, f_dircount, (u_int64_t)hfsmp->vcbDirCnt);
4567         VFSATTR_RETURN(fsap, f_maxobjcount, (u_int64_t)0xFFFFFFFF);
4568         VFSATTR_RETURN(fsap, f_iosize, (size_t)(MAX_UPL_TRANSFER * PAGE_SIZE));
4569         VFSATTR_RETURN(fsap, f_blocks, (u_int64_t)hfsmp->totalBlocks);
4570         VFSATTR_RETURN(fsap, f_bfree, (u_int64_t)hfs_freeblks(hfsmp, 0));
4571         VFSATTR_RETURN(fsap, f_bavail, (u_int64_t)hfs_freeblks(hfsmp, 1));
4572         VFSATTR_RETURN(fsap, f_bsize, (u_int32_t)vcb->blockSize);
4573         /* XXX needs clarification */
4574         VFSATTR_RETURN(fsap, f_bused, hfsmp->totalBlocks - hfs_freeblks(hfsmp, 1));
4575         /* Maximum files is constrained by total blocks. */
4576         VFSATTR_RETURN(fsap, f_files, (u_int64_t)(hfsmp->totalBlocks - 2));
4577         VFSATTR_RETURN(fsap, f_ffree, MIN((u_int64_t)freeCNIDs, (u_int64_t)hfs_freeblks(hfsmp, 1)));
4578
4579         fsap->f_fsid.val[0] = hfsmp->hfs_raw_dev;
4580         fsap->f_fsid.val[1] = vfs_typenum(mp);
4581         VFSATTR_SET_SUPPORTED(fsap, f_fsid);
4582
4583         VFSATTR_RETURN(fsap, f_signature, vcb->vcbSigWord);
4584         VFSATTR_RETURN(fsap, f_carbon_fsid, 0);
4585
4586         if (VFSATTR_IS_ACTIVE(fsap, f_capabilities)) {
4587                 vol_capabilities_attr_t *cap;
4588
4589                 cap = &fsap->f_capabilities;
4590
4591                 if (hfsmp->hfs_flags & HFS_STANDARD) {
4592                         cap->capabilities[VOL_CAPABILITIES_FORMAT] =
4593                                 VOL_CAP_FMT_PERSISTENTOBJECTIDS |
4594                                 VOL_CAP_FMT_CASE_PRESERVING |
4595                                 VOL_CAP_FMT_FAST_STATFS |
4596                                 VOL_CAP_FMT_HIDDEN_FILES |
4597                                 VOL_CAP_FMT_PATH_FROM_ID;
4598                 } else {
4599                         cap->capabilities[VOL_CAPABILITIES_FORMAT] =
4600                                 VOL_CAP_FMT_PERSISTENTOBJECTIDS |
4601                                 VOL_CAP_FMT_SYMBOLICLINKS |
4602                                 VOL_CAP_FMT_HARDLINKS |
4603                                 VOL_CAP_FMT_JOURNAL |
4604                                 VOL_CAP_FMT_ZERO_RUNS |
4605                                 (hfsmp->jnl ? VOL_CAP_FMT_JOURNAL_ACTIVE : 0) |
4606                                 (hfsmp->hfs_flags & HFS_CASE_SENSITIVE ? VOL_CAP_FMT_CASE_SENSITIVE : 0) |
4607                                 VOL_CAP_FMT_CASE_PRESERVING |
4608                                 VOL_CAP_FMT_FAST_STATFS |
4609                                 VOL_CAP_FMT_2TB_FILESIZE |
4610                                 VOL_CAP_FMT_HIDDEN_FILES |
4611                                 VOL_CAP_FMT_PATH_FROM_ID;
4612                 }
4613                 cap->capabilities[VOL_CAPABILITIES_INTERFACES] =
4614                         VOL_CAP_INT_SEARCHFS |
4615                         VOL_CAP_INT_ATTRLIST |
4616                         VOL_CAP_INT_NFSEXPORT |
4617                         VOL_CAP_INT_READDIRATTR |
4618                         VOL_CAP_INT_EXCHANGEDATA |
4619                         VOL_CAP_INT_ALLOCATE |
4620                         VOL_CAP_INT_VOL_RENAME |
4621                         VOL_CAP_INT_ADVLOCK |
4622                         VOL_CAP_INT_FLOCK |
4623 #if NAMEDSTREAMS
4624                         VOL_CAP_INT_EXTENDED_ATTR |
4625                         VOL_CAP_INT_NAMEDSTREAMS;
4626 #else
4627                         VOL_CAP_INT_EXTENDED_ATTR;
4628 #endif
4629                 cap->capabilities[VOL_CAPABILITIES_RESERVED1] = 0;
4630                 cap->capabilities[VOL_CAPABILITIES_RESERVED2] = 0;
4631
4632                 cap->valid[VOL_CAPABILITIES_FORMAT] =
4633                         VOL_CAP_FMT_PERSISTENTOBJECTIDS |
4634                         VOL_CAP_FMT_SYMBOLICLINKS |
4635                         VOL_CAP_FMT_HARDLINKS |
4636                         VOL_CAP_FMT_JOURNAL |
4637                         VOL_CAP_FMT_JOURNAL_ACTIVE |
4638                         VOL_CAP_FMT_NO_ROOT_TIMES |
4639                         VOL_CAP_FMT_SPARSE_FILES |
4640                         VOL_CAP_FMT_ZERO_RUNS |
4641                         VOL_CAP_FMT_CASE_SENSITIVE |
4642                         VOL_CAP_FMT_CASE_PRESERVING |
4643                         VOL_CAP_FMT_FAST_STATFS |
4644                         VOL_CAP_FMT_2TB_FILESIZE |
4645                         VOL_CAP_FMT_OPENDENYMODES |
4646                         VOL_CAP_FMT_HIDDEN_FILES |
4647                         VOL_CAP_FMT_PATH_FROM_ID;
4648                 cap->valid[VOL_CAPABILITIES_INTERFACES] =
4649                         VOL_CAP_INT_SEARCHFS |
4650                         VOL_CAP_INT_ATTRLIST |
4651                         VOL_CAP_INT_NFSEXPORT |
4652                         VOL_CAP_INT_READDIRATTR |
4653                         VOL_CAP_INT_EXCHANGEDATA |
4654                         VOL_CAP_INT_COPYFILE |
4655                         VOL_CAP_INT_ALLOCATE |
4656                         VOL_CAP_INT_VOL_RENAME |
4657                         VOL_CAP_INT_ADVLOCK |
4658                         VOL_CAP_INT_FLOCK |
4659                         VOL_CAP_INT_MANLOCK |
4660 #if NAMEDSTREAMS
4661                         VOL_CAP_INT_EXTENDED_ATTR |
4662                         VOL_CAP_INT_NAMEDSTREAMS;
4663 #else
4664                         VOL_CAP_INT_EXTENDED_ATTR;
4665 #endif
4666                 cap->valid[VOL_CAPABILITIES_RESERVED1] = 0;
4667                 cap->valid[VOL_CAPABILITIES_RESERVED2] = 0;
4668                 VFSATTR_SET_SUPPORTED(fsap, f_capabilities);
4669         }
4670         if (VFSATTR_IS_ACTIVE(fsap, f_attributes)) {
4671                 vol_attributes_attr_t *attrp = &fsap->f_attributes;
4672
4673                 attrp->validattr.commonattr = HFS_ATTR_CMN_VALIDMASK;
4674                 attrp->validattr.volattr = ATTR_VOL_VALIDMASK & ~ATTR_VOL_INFO;
4675                 attrp->validattr.dirattr = ATTR_DIR_VALIDMASK;
4676                 attrp->validattr.fileattr = HFS_ATTR_FILE_VALIDMASK;
4677                 attrp->validattr.forkattr = 0;
4678
4679                 attrp->nativeattr.commonattr = HFS_ATTR_CMN_VALIDMASK;
4680                 attrp->nativeattr.volattr = ATTR_VOL_VALIDMASK & ~ATTR_VOL_INFO;
4681                 attrp->nativeattr.dirattr = ATTR_DIR_VALIDMASK;
4682                 attrp->nativeattr.fileattr = HFS_ATTR_FILE_VALIDMASK;
4683                 attrp->nativeattr.forkattr = 0;
4684                 VFSATTR_SET_SUPPORTED(fsap, f_attributes);
4685         }
4686         fsap->f_create_time.tv_sec = hfsmp->vcbCrDate;
4687         fsap->f_create_time.tv_nsec = 0;
4688         VFSATTR_SET_SUPPORTED(fsap, f_create_time);
4689         fsap->f_modify_time.tv_sec = hfsmp->vcbLsMod;
4690         fsap->f_modify_time.tv_nsec = 0;
4691         VFSATTR_SET_SUPPORTED(fsap, f_modify_time);
4692
4693         fsap->f_backup_time.tv_sec = hfsmp->vcbVolBkUp;
4694         fsap->f_backup_time.tv_nsec = 0;
4695         VFSATTR_SET_SUPPORTED(fsap, f_backup_time);
4696         if (VFSATTR_IS_ACTIVE(fsap, f_fssubtype)) {
4697                 u_int16_t subtype = 0;
4698
4699                 /*
4700                  * Subtypes (flavors) for HFS
4701                  *   0:   Mac OS Extended
4702                  *   1:   Mac OS Extended (Journaled)
4703                  *   2:   Mac OS Extended (Case Sensitive)
4704                  *   3:   Mac OS Extended (Case Sensitive, Journaled)
4705                  *   4 - 127:   Reserved
4706                  * 128:   Mac OS Standard
4707                  *
4708                  */
4709                 if (hfsmp->hfs_flags & HFS_STANDARD) {
4710                         subtype = HFS_SUBTYPE_STANDARDHFS;
4711                 } else /* HFS Plus */ {
4712                         if (hfsmp->jnl)
4713                                 subtype |= HFS_SUBTYPE_JOURNALED;
4714                         if (hfsmp->hfs_flags & HFS_CASE_SENSITIVE)
4715                                 subtype |= HFS_SUBTYPE_CASESENSITIVE;
4716                 }
4717                 fsap->f_fssubtype = subtype;
4718                 VFSATTR_SET_SUPPORTED(fsap, f_fssubtype);
4719         }
4720
4721         if (VFSATTR_IS_ACTIVE(fsap, f_vol_name)) {
4722                 strlcpy(fsap->f_vol_name, (char *) hfsmp->vcbVN, MAXPATHLEN);
4723                 VFSATTR_SET_SUPPORTED(fsap, f_vol_name);
4724         }
4725         return (0);
4726 }
4727
4728 /*
4729  * Perform a volume rename.  Requires the FS' root vp.
4730  */
4731 static int
4732 hfs_rename_volume(struct vnode *vp, const char *name, proc_t p)
4733 {
4734         ExtendedVCB *vcb = VTOVCB(vp);
4735         struct cnode *cp = VTOC(vp);
4736         struct hfsmount *hfsmp = VTOHFS(vp);
4737         struct cat_desc to_desc;
4738         struct cat_desc todir_desc;
4739         struct cat_desc new_desc;
4740         cat_cookie_t cookie;
4741         int lockflags;
4742         int error = 0;
4743
4744         /*
4745          * Ignore attempts to rename a volume to a zero-length name.
4746          */
4747         if (name[0] == 0)
4748                 return(0);
4749
4750         bzero(&to_desc, sizeof(to_desc));
4751         bzero(&todir_desc, sizeof(todir_desc));
4752         bzero(&new_desc, sizeof(new_desc));
4753         bzero(&cookie, sizeof(cookie));
4754
4755         todir_desc.cd_parentcnid = kHFSRootParentID;
4756         todir_desc.cd_cnid = kHFSRootFolderID;
4757         todir_desc.cd_flags = CD_ISDIR;
4758
4759         to_desc.cd_nameptr = (const u_int8_t *)name;
4760         to_desc.cd_namelen = strlen(name);
4761         to_desc.cd_parentcnid = kHFSRootParentID;
4762         to_desc.cd_cnid = cp->c_cnid;
4763         to_desc.cd_flags = CD_ISDIR;
4764
4765         if ((error = hfs_lock(cp, HFS_EXCLUSIVE_LOCK)) == 0) {
4766                 if ((error = hfs_start_transaction(hfsmp)) == 0) {
4767                         if ((error = cat_preflight(hfsmp, CAT_RENAME, &cookie, p)) == 0) {
4768                                 lockflags = hfs_systemfile_lock(hfsmp, SFL_CATALOG, HFS_EXCLUSIVE_LOCK);
4769
4770                                 error = cat_rename(hfsmp, &cp->c_desc, &todir_desc, &to_desc, &new_desc);
4771
4772                                 /*
4773                                  * If successful, update the name in the VCB, ensure it's terminated.
4774                                  */
4775                                 if (!error) {
4776                                         strlcpy((char *)vcb->vcbVN, name, sizeof(vcb->vcbVN));
4777                                 }
4778
4779                                 hfs_systemfile_unlock(hfsmp, lockflags);
4780                                 cat_postflight(hfsmp, &cookie, p);
4781
4782                                 if (error)
4783                                         MarkVCBDirty(vcb);
4784                                 (void) hfs_flushvolumeheader(hfsmp, MNT_WAIT, 0);
4785                         }
4786                         hfs_end_transaction(hfsmp);
4787                 }
4788                 if (!error) {
4789                         /* Release old allocated name buffer */
4790                         if (cp->c_desc.cd_flags & CD_HASBUF) {
4791                                 const char *tmp_name = (const char *)cp->c_desc.cd_nameptr;
4792
4793                                 cp->c_desc.cd_nameptr = 0;
4794                                 cp->c_desc.cd_namelen = 0;
4795                                 cp->c_desc.cd_flags &= ~CD_HASBUF;
4796                                 vfs_removename(tmp_name);
4797                         }
4798                         /* Update cnode's catalog descriptor */
4799                         replace_desc(cp, &new_desc);
4800                         vcb->volumeNameEncodingHint = new_desc.cd_encoding;
4801                         cp->c_touch_chgtime = TRUE;
4802                 }
4803
4804                 hfs_unlock(cp);
4805         }
4806
4807         return(error);
4808 }
4809
4810 /*
4811  * Get file system attributes.
4812  */
4813 static int
4814 hfs_vfs_setattr(struct mount *mp, struct vfs_attr *fsap, __unused vfs_context_t context)
4815 {
4816         kauth_cred_t cred = vfs_context_ucred(context);
4817         int error = 0;
4818
4819         /*
4820          * Must be superuser or owner of filesystem to change volume attributes
4821          */
4822         if (!kauth_cred_issuser(cred) && (kauth_cred_getuid(cred) != vfs_statfs(mp)->f_owner))
4823                 return(EACCES);
4824
4825         if (VFSATTR_IS_ACTIVE(fsap, f_vol_name)) {
4826                 vnode_t root_vp;
4827
4828                 error = hfs_vfs_root(mp, &root_vp, context);
4829                 if (error)
4830                         goto out;
4831
4832                 error = hfs_rename_volume(root_vp, fsap->f_vol_name, vfs_context_proc(context));
4833                 (void) vnode_put(root_vp);
4834                 if (error)
4835                         goto out;
4836
4837                 VFSATTR_SET_SUPPORTED(fsap, f_vol_name);
4838         }
4839
4840 out:
4841         return error;
4842 }
4843
4844 /* If a runtime corruption is detected, set the volume inconsistent
4845  * bit in the volume attributes.  The volume inconsistent bit is a persistent
4846  * bit which represents that the volume is corrupt and needs repair.
4847  * The volume inconsistent bit can be set from the kernel when it detects
4848  * runtime corruption or from file system repair utilities like fsck_hfs when
4849  * a repair operation fails.  The bit should be cleared only from file system
4850  * verify/repair utility like fsck_hfs when a verify/repair succeeds.
4851  */
4852 void hfs_mark_volume_inconsistent(struct hfsmount *hfsmp)
4853 {
4854         HFS_MOUNT_LOCK(hfsmp, TRUE);
4855         if ((hfsmp->vcbAtrb & kHFSVolumeInconsistentMask) == 0) {
4856                 hfsmp->vcbAtrb |= kHFSVolumeInconsistentMask;
4857                 MarkVCBDirty(hfsmp);
4858         }
4859         /* Log information to ASL log */
4860         fslog_fs_corrupt(hfsmp->hfs_mp);
4861         printf("HFS: Runtime corruption detected on %s, fsck will be forced on next mount.\n", hfsmp->vcbVN);
4862         HFS_MOUNT_UNLOCK(hfsmp, TRUE);
4863 }
4864
4865 /* Replay the journal on the device node provided.  Returns zero if
4866  * journal replay succeeded or no journal was supposed to be replayed.
4867  */
4868 static int hfs_journal_replay(const char *devnode, vfs_context_t context)
4869 {
4870         int retval = 0;
4871         struct vnode *devvp = NULL;
4872         struct mount *mp = NULL;
4873         struct hfs_mount_args *args = NULL;
4874
4875         /* Lookup vnode for given raw device path */
4876         retval = vnode_open(devnode, FREAD|FWRITE, 0, 0, &devvp, NULL);
4877         if (retval) {
4878                 goto out;
4879         }
4880
4881         /* Replay allowed only on raw devices */
4882         if (!vnode_ischr(devvp)) {
4883                 retval = EINVAL;
4884                 goto out;
4885         }
4886
4887         /* Create dummy mount structures */
4888         MALLOC(mp, struct mount *, sizeof(struct mount), M_TEMP, M_WAITOK);
4889         bzero(mp, sizeof(struct mount));
4890         mount_lock_init(mp);
4891
4892         MALLOC(args, struct hfs_mount_args *, sizeof(struct hfs_mount_args), M_TEMP, M_WAITOK);
4893         bzero(args, sizeof(struct hfs_mount_args));
4894
4895         retval = hfs_mountfs(devvp, mp, args, 1, context);
4896         buf_flushdirtyblks(devvp, MNT_WAIT, 0, "hfs_journal_replay");
4897
4898 out:
4899         if (mp) {
4900                 mount_lock_destroy(mp);
4901                 FREE(mp, M_TEMP);
4902         }
4903         if (args) {
4904                 FREE(args, M_TEMP);
4905         }
4906         if (devvp) {
4907                 vnode_close(devvp, FREAD|FWRITE, NULL);
4908         }
4909         return retval;
4910 }
4911
4912 /*
4913  * hfs vfs operations.
4914  */
4915 struct vfsops hfs_vfsops = {
4916         hfs_mount,
4917         hfs_start,
4918         hfs_unmount,
4919         hfs_vfs_root,
4920         hfs_quotactl,
4921         hfs_vfs_getattr,        /* was hfs_statfs */
4922         hfs_sync,
4923         hfs_vfs_vget,
4924         hfs_fhtovp,
4925         hfs_vptofh,
4926         hfs_init,
4927         hfs_sysctl,
4928         hfs_vfs_setattr,
4929         {NULL}
4930 };