]> git.saurik.com Git - apple/xnu.git/blob - bsd/hfs/hfs_hotfiles.c
xnu-3248.30.4.tar.gz
[apple/xnu.git] / bsd / hfs / hfs_hotfiles.c
1 /*
2 * Copyright (c) 2003-2013 Apple Inc. All rights reserved.
3 *
4 * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
5 *
6 * This file contains Original Code and/or Modifications of Original Code
7 * as defined in and that are subject to the Apple Public Source License
8 * Version 2.0 (the 'License'). You may not use this file except in
9 * compliance with the License. The rights granted to you under the License
10 * may not be used to create, or enable the creation or redistribution of,
11 * unlawful or unlicensed copies of an Apple operating system, or to
12 * circumvent, violate, or enable the circumvention or violation of, any
13 * terms of an Apple operating system software license agreement.
14 *
15 * Please obtain a copy of the License at
16 * http://www.opensource.apple.com/apsl/ and read it before using this file.
17 *
18 * The Original Code and all software distributed under the License are
19 * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
20 * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
21 * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
23 * Please see the License for the specific language governing rights and
24 * limitations under the License.
25 *
26 * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
27 */
28
29 #include <sys/param.h>
30 #include <sys/systm.h>
31 #include <sys/fcntl.h>
32 #include <sys/kernel.h>
33 #include <sys/malloc.h>
34 #include <sys/ubc.h>
35 #include <sys/ubc_internal.h>
36 #include <sys/vnode.h>
37 #include <sys/vnode_internal.h>
38 #include <sys/kauth.h>
39
40 #include <hfs/hfs.h>
41 #include <hfs/hfs_endian.h>
42 #include <hfs/hfs_format.h>
43 #include <hfs/hfs_mount.h>
44 #include <hfs/hfs_hotfiles.h>
45
46 #include "hfscommon/headers/BTreeScanner.h"
47
48
49 #define HFC_DEBUG 0
50 #define HFC_VERBOSE 0
51
52
53 /*
54 * Minimum post Tiger base time.
55 * Thu Mar 31 17:00:00 2005
56 */
57 #define HFC_MIN_BASE_TIME 0x424c8f00L
58
59 /*
60 * Hot File List (runtime).
61 */
62 typedef struct hotfileinfo {
63 u_int32_t hf_fileid;
64 u_int32_t hf_temperature;
65 u_int32_t hf_blocks;
66 } hotfileinfo_t;
67
68 typedef struct hotfilelist {
69 u_int32_t hfl_magic;
70 u_int32_t hfl_version;
71 time_t hfl_duration; /* duration of sample period */
72 int hfl_count; /* count of hot files recorded */
73 int hfl_next; /* next file to move */
74 int hfl_totalblocks; /* total hot file blocks */
75 int hfl_reclaimblks; /* blocks to reclaim in HFV */
76 u_int32_t hfl_spare[2];
77 hotfileinfo_t hfl_hotfile[1]; /* array of hot files */
78 } hotfilelist_t;
79
80
81 /*
82 * Hot File Entry (runtime).
83 */
84 typedef struct hotfile_entry {
85 struct hotfile_entry *left;
86 struct hotfile_entry *right;
87 u_int32_t fileid;
88 u_int32_t temperature;
89 u_int32_t blocks;
90 } hotfile_entry_t;
91
92
93 //
94 // We cap the max temperature for non-system files to "MAX_NORMAL_TEMP"
95 // so that they will always have a lower temperature than system (aka
96 // "auto-cached") files. System files have MAX_NORMAL_TEMP added to
97 // their temperature which produces two bands of files (all non-system
98 // files will have a temp less than MAX_NORMAL_TEMP and all system
99 // files will have a temp greatern than MAX_NORMAL_TEMP).
100 //
101 // This puts non-system files on the left side of the hotfile btree
102 // (and we start evicting from the left-side of the tree). The idea is
103 // that we will evict non-system files more aggressively since their
104 // working set changes much more dynamically than system files (which
105 // are for the most part, static).
106 //
107 // NOTE: these values have to fit into a 32-bit int. We use a
108 // value of 1-billion which gives a pretty broad range
109 // and yet should not run afoul of any sign issues.
110 //
111 #define MAX_NORMAL_TEMP 1000000000
112 #define HF_TEMP_RANGE MAX_NORMAL_TEMP
113
114
115 //
116 // These used to be defines of the hard coded values. But if
117 // we're on an cooperative fusion (CF) system we need to change
118 // the values (which happens in hfs_recording_init()
119 //
120 uint32_t hfc_default_file_count = 1000;
121 uint32_t hfc_default_duration = (3600 * 60);
122 uint32_t hfc_max_file_count = 5000;
123 uint64_t hfc_max_file_size = (10 * 1024 * 1024);
124
125
126 /*
127 * Hot File Recording Data (runtime).
128 */
129 typedef struct hotfile_data {
130 struct hfsmount *hfsmp;
131 long refcount;
132 u_int32_t activefiles; /* active number of hot files */
133 u_int32_t threshold;
134 u_int32_t maxblocks;
135 hotfile_entry_t *rootentry;
136 hotfile_entry_t *freelist;
137 hotfile_entry_t *coldest;
138 hotfile_entry_t entries[1];
139 } hotfile_data_t;
140
141 static int hfs_recording_start (struct hfsmount *);
142 static int hfs_recording_stop (struct hfsmount *);
143
144 /* Hotfiles pinning routines */
145 static int hfs_getvnode_and_pin (struct hfsmount *hfsmp, uint32_t fileid, uint32_t *pinned);
146 static int hfs_pin_extent_record (struct hfsmount *hfsmp, HFSPlusExtentRecord extents, uint32_t *pinned);
147 static int hfs_pin_catalog_rec (struct hfsmount *hfsmp, HFSPlusCatalogFile *cfp, int rsrc);
148
149 /*
150 * Hot File Data recording functions (in-memory binary tree).
151 */
152 static int hf_insert (hotfile_data_t *, hotfile_entry_t *);
153 static void hf_delete (hotfile_data_t *, u_int32_t, u_int32_t);
154 static hotfile_entry_t * hf_coldest (hotfile_data_t *);
155 static hotfile_entry_t * hf_getnewentry (hotfile_data_t *);
156 static void hf_getsortedlist (hotfile_data_t *, hotfilelist_t *);
157
158 #if HFC_DEBUG
159 static hotfile_entry_t * hf_lookup (hotfile_data_t *, u_int32_t, u_int32_t);
160 static void hf_maxdepth(hotfile_entry_t *, int, int *);
161 static void hf_printtree (hotfile_entry_t *);
162 #endif
163
164 /*
165 * Hot File misc support functions.
166 */
167 static int hotfiles_collect (struct hfsmount *);
168 static int hotfiles_age (struct hfsmount *);
169 static int hotfiles_adopt (struct hfsmount *, vfs_context_t);
170 static int hotfiles_evict (struct hfsmount *, vfs_context_t);
171 static int hotfiles_refine (struct hfsmount *);
172 static int hotextents(struct hfsmount *, HFSPlusExtentDescriptor *);
173 static int hfs_addhotfile_internal(struct vnode *);
174 static int hfs_hotfile_cur_freeblks(hfsmount_t *hfsmp);
175
176
177 /*
178 * Hot File Cluster B-tree (on disk) functions.
179 */
180 static int hfc_btree_create (struct hfsmount *, unsigned int, unsigned int);
181 static int hfc_btree_open (struct hfsmount *, struct vnode **);
182 static int hfc_btree_open_ext(struct hfsmount *hfsmp, struct vnode **vpp, int ignore_btree_errs);
183 static int hfc_btree_close (struct hfsmount *, struct vnode *);
184 static int hfc_btree_delete_record(struct hfsmount *hfsmp, BTreeIterator *iterator, HotFileKey *key);
185 static int hfc_btree_delete(struct hfsmount *hfsmp);
186 static int hfc_comparekeys (HotFileKey *, HotFileKey *);
187
188
189 char hfc_tag[] = "CLUSTERED HOT FILES B-TREE ";
190
191
192 /*
193 *========================================================================
194 * HOT FILE INTERFACE ROUTINES
195 *========================================================================
196 */
197
198 /*
199 * Start recording the hottest files on a file system.
200 *
201 * Requires that the hfc_mutex be held.
202 */
203 static int
204 hfs_recording_start(struct hfsmount *hfsmp)
205 {
206 hotfile_data_t *hotdata;
207 struct timeval tv;
208 int maxentries;
209 size_t size;
210 int i;
211 int error;
212
213 if ((hfsmp->hfs_flags & HFS_READ_ONLY) ||
214 (hfsmp->jnl == NULL) ||
215 (hfsmp->hfs_flags & HFS_METADATA_ZONE) == 0) {
216 return (EPERM);
217 }
218 if (HFSTOVCB(hfsmp)->freeBlocks < (2 * (u_int32_t)hfsmp->hfs_hotfile_maxblks)) {
219 return (ENOSPC);
220 }
221 if (hfsmp->hfc_stage != HFC_IDLE) {
222 return (EBUSY);
223 }
224 hfsmp->hfc_stage = HFC_BUSY;
225
226 /*
227 * Dump previous recording data.
228 */
229 if (hfsmp->hfc_recdata) {
230 void * tmp;
231
232 tmp = hfsmp->hfc_recdata;
233 hfsmp->hfc_recdata = NULL;
234 FREE(tmp, M_TEMP);
235 }
236
237 microtime(&tv); /* Times are base on GMT time. */
238
239 /*
240 * On first startup check for suspended recording.
241 */
242 if (hfsmp->hfc_timebase == 0 &&
243 hfc_btree_open(hfsmp, &hfsmp->hfc_filevp) == 0) {
244 HotFilesInfo hotfileinfo;
245
246 if ((BTGetUserData(VTOF(hfsmp->hfc_filevp), &hotfileinfo,
247 sizeof(hotfileinfo)) == 0) &&
248 (SWAP_BE32 (hotfileinfo.magic) == HFC_MAGIC) &&
249 (SWAP_BE32 (hotfileinfo.timeleft) > 0) &&
250 (SWAP_BE32 (hotfileinfo.timebase) > 0)) {
251 if (hfsmp->hfs_flags & HFS_CS_HOTFILE_PIN) {
252 if (hfsmp->hfs_hotfile_freeblks == 0) {
253 hfsmp->hfs_hotfile_freeblks = hfsmp->hfs_hotfile_maxblks - SWAP_BE32 (hotfileinfo.usedblocks);
254 }
255 hfsmp->hfc_maxfiles = 0x7fffffff;
256 printf("hfs: %s: %s: hotfile freeblocks: %d, max: %d\n", hfsmp->vcbVN, __FUNCTION__,
257 hfsmp->hfs_hotfile_freeblks, hfsmp->hfs_hotfile_maxblks);
258 } else {
259 hfsmp->hfc_maxfiles = SWAP_BE32 (hotfileinfo.maxfilecnt);
260 }
261 hfsmp->hfc_timebase = SWAP_BE32 (hotfileinfo.timebase);
262 int timeleft = (int)SWAP_BE32(hotfileinfo.timeleft);
263 if (timeleft < 0 || timeleft > (int)(HFC_DEFAULT_DURATION*2)) {
264 // in case this field got botched, don't let it screw things up
265 // printf("hfs: hotfiles: bogus looking timeleft: %d\n", timeleft);
266 timeleft = HFC_DEFAULT_DURATION;
267 }
268 hfsmp->hfc_timeout = timeleft + tv.tv_sec ;
269 /* Fix up any bogus timebase values. */
270 if (hfsmp->hfc_timebase < HFC_MIN_BASE_TIME) {
271 hfsmp->hfc_timebase = hfsmp->hfc_timeout - HFC_DEFAULT_DURATION;
272 }
273 #if HFC_VERBOSE
274 printf("hfs: Resume recording hot files on %s (%d secs left (%d); timeout %ld)\n",
275 hfsmp->vcbVN, SWAP_BE32 (hotfileinfo.timeleft), timeleft, hfsmp->hfc_timeout - tv.tv_sec);
276 #endif
277 } else {
278 hfsmp->hfc_maxfiles = HFC_DEFAULT_FILE_COUNT;
279 hfsmp->hfc_timebase = tv.tv_sec + 1;
280 hfsmp->hfc_timeout = hfsmp->hfc_timebase + HFC_DEFAULT_DURATION;
281 }
282 (void) hfc_btree_close(hfsmp, hfsmp->hfc_filevp);
283 hfsmp->hfc_filevp = NULL;
284 } else {
285 struct cat_attr cattr;
286 u_int32_t cnid;
287
288 /*
289 * Make sure a btree file exists.
290 */
291 cnid = GetFileInfo(HFSTOVCB(hfsmp), kRootDirID, HFC_FILENAME, &cattr, NULL);
292 if ((cnid == 0) &&
293 !S_ISREG(cattr.ca_mode) &&
294 (error = hfc_btree_create(hfsmp, HFSTOVCB(hfsmp)->blockSize, HFC_DEFAULT_FILE_COUNT))) {
295 hfsmp->hfc_stage = HFC_IDLE;
296 wakeup((caddr_t)&hfsmp->hfc_stage);
297 return (error);
298 }
299 #if HFC_VERBOSE
300 printf("hfs: begin recording hot files on %s (hotfile start/end block: %d - %d; max/free: %d/%d; maxfiles: %d)\n",
301 hfsmp->vcbVN,
302 hfsmp->hfs_hotfile_start, hfsmp->hfs_hotfile_end,
303 hfsmp->hfs_hotfile_maxblks, hfsmp->hfs_hotfile_freeblks, hfsmp->hfc_maxfiles);
304 #endif
305 hfsmp->hfc_maxfiles = HFC_DEFAULT_FILE_COUNT;
306 hfsmp->hfc_timeout = tv.tv_sec + HFC_DEFAULT_DURATION;
307
308 /* Reset time base. */
309 if (hfsmp->hfc_timebase == 0) {
310 hfsmp->hfc_timebase = tv.tv_sec + 1;
311 } else {
312 time_t cumulativebase;
313
314 cumulativebase = hfsmp->hfc_timeout - (HFC_CUMULATIVE_CYCLES * HFC_DEFAULT_DURATION);
315 hfsmp->hfc_timebase = MAX(hfsmp->hfc_timebase, cumulativebase);
316 }
317 }
318
319 if ((hfsmp->hfc_maxfiles == 0) ||
320 (hfsmp->hfc_maxfiles > HFC_MAXIMUM_FILE_COUNT)) {
321 hfsmp->hfc_maxfiles = HFC_DEFAULT_FILE_COUNT;
322 }
323 maxentries = hfsmp->hfc_maxfiles;
324
325 size = sizeof(hotfile_data_t) + (maxentries * sizeof(hotfile_entry_t));
326 MALLOC(hotdata, hotfile_data_t *, size, M_TEMP, M_WAITOK);
327 if (hotdata == NULL) {
328 hfsmp->hfc_recdata = NULL;
329 hfsmp->hfc_stage = HFC_IDLE;
330 wakeup((caddr_t)&hfsmp->hfc_stage);
331 return(ENOMEM);
332 }
333
334 bzero(hotdata, size);
335
336 for (i = 1; i < maxentries ; i++)
337 hotdata->entries[i-1].right = &hotdata->entries[i];
338
339 hotdata->freelist = &hotdata->entries[0];
340 /*
341 * Establish minimum temperature and maximum file size.
342 */
343 hotdata->threshold = HFC_MINIMUM_TEMPERATURE;
344 hotdata->maxblocks = HFC_MAXIMUM_FILESIZE / HFSTOVCB(hfsmp)->blockSize;
345 hotdata->hfsmp = hfsmp;
346
347 hfsmp->hfc_recdata = hotdata;
348 hfsmp->hfc_stage = HFC_RECORDING;
349 wakeup((caddr_t)&hfsmp->hfc_stage);
350 return (0);
351 }
352
353 /*
354 * Stop recording the hotest files on a file system.
355 *
356 * Requires that the hfc_mutex be held.
357 */
358 static int
359 hfs_recording_stop(struct hfsmount *hfsmp)
360 {
361 hotfile_data_t *hotdata;
362 hotfilelist_t *listp;
363 struct timeval tv;
364 size_t size;
365 enum hfc_stage newstage = HFC_IDLE;
366 int error;
367
368 if (hfsmp->hfc_stage != HFC_RECORDING)
369 return (EPERM);
370
371 hfsmp->hfc_stage = HFC_BUSY;
372
373 hotfiles_collect(hfsmp);
374
375
376 /*
377 * Convert hot file data into a simple file id list....
378 *
379 * then dump the sample data
380 */
381 #if HFC_VERBOSE
382 printf("hfs: end of hot file recording on %s\n", hfsmp->vcbVN);
383 #endif
384 hotdata = (hotfile_data_t *)hfsmp->hfc_recdata;
385 if (hotdata == NULL)
386 return (0);
387 hfsmp->hfc_recdata = NULL;
388 hfsmp->hfc_stage = HFC_EVALUATION;
389 wakeup((caddr_t)&hfsmp->hfc_stage);
390
391 #if HFC_VERBOSE
392 printf("hfs: curentries: %d\n", hotdata->activefiles);
393 #endif
394 /*
395 * If no hot files recorded then we're done.
396 */
397 if (hotdata->rootentry == NULL) {
398 error = 0;
399 goto out;
400 }
401
402 /* Open the B-tree file for writing... */
403 if (hfsmp->hfc_filevp)
404 panic("hfs_recording_stop: hfc_filevp exists (vp = %p)", hfsmp->hfc_filevp);
405
406 error = hfc_btree_open(hfsmp, &hfsmp->hfc_filevp);
407 if (error) {
408 goto out;
409 }
410
411 /*
412 * Age the previous set of clustered hot files.
413 */
414 error = hotfiles_age(hfsmp);
415 if (error) {
416 (void) hfc_btree_close(hfsmp, hfsmp->hfc_filevp);
417 hfsmp->hfc_filevp = NULL;
418 goto out;
419 }
420
421 /*
422 * Create a sorted list of hotest files.
423 */
424 size = sizeof(hotfilelist_t);
425 size += sizeof(hotfileinfo_t) * (hotdata->activefiles - 1);
426 MALLOC(listp, hotfilelist_t *, size, M_TEMP, M_WAITOK);
427 if (listp == NULL) {
428 error = ENOMEM;
429 (void) hfc_btree_close(hfsmp, hfsmp->hfc_filevp);
430 hfsmp->hfc_filevp = NULL;
431 goto out;
432 }
433
434 bzero(listp, size);
435
436 hf_getsortedlist(hotdata, listp); /* NOTE: destroys hot file tree! */
437 microtime(&tv);
438 listp->hfl_duration = tv.tv_sec - hfsmp->hfc_timebase;
439 hfsmp->hfc_recdata = listp;
440
441 /*
442 * Account for duplicates.
443 */
444 error = hotfiles_refine(hfsmp);
445 if (error) {
446 (void) hfc_btree_close(hfsmp, hfsmp->hfc_filevp);
447 hfsmp->hfc_filevp = NULL;
448 goto out;
449 }
450
451 /*
452 * Compute the amount of space to reclaim...
453 */
454 if (listp->hfl_totalblocks > hfs_hotfile_cur_freeblks(hfsmp)) {
455 listp->hfl_reclaimblks =
456 MIN(listp->hfl_totalblocks, hfsmp->hfs_hotfile_maxblks) -
457 hfsmp->hfs_hotfile_freeblks;
458 #if HFC_VERBOSE
459 printf("hfs_recording_stop: need to reclaim %d blocks\n", listp->hfl_reclaimblks);
460 #endif
461 if (listp->hfl_reclaimblks)
462 newstage = HFC_EVICTION;
463 else
464 newstage = HFC_ADOPTION;
465 } else {
466 newstage = HFC_ADOPTION;
467 }
468
469 if (newstage == HFC_ADOPTION && listp->hfl_totalblocks == 0) {
470 (void) hfc_btree_close(hfsmp, hfsmp->hfc_filevp);
471 hfsmp->hfc_filevp = NULL;
472 newstage = HFC_IDLE;
473 }
474 out:
475 #if HFC_VERBOSE
476 if (newstage == HFC_EVICTION)
477 printf("hfs: evicting coldest files\n");
478 else if (newstage == HFC_ADOPTION)
479 printf("hfs: adopting hotest files\n");
480 #endif
481 FREE(hotdata, M_TEMP);
482
483 hfsmp->hfc_stage = newstage;
484 wakeup((caddr_t)&hfsmp->hfc_stage);
485 return (error);
486 }
487
488 static void
489 save_btree_user_info(struct hfsmount *hfsmp)
490 {
491 HotFilesInfo hotfileinfo;
492 struct timeval tv;
493
494 microtime(&tv);
495 hotfileinfo.magic = SWAP_BE32 (HFC_MAGIC);
496 hotfileinfo.version = SWAP_BE32 (HFC_VERSION);
497 hotfileinfo.duration = SWAP_BE32 (HFC_DEFAULT_DURATION);
498 hotfileinfo.timebase = SWAP_BE32 (hfsmp->hfc_timebase);
499 hotfileinfo.timeleft = SWAP_BE32 (hfsmp->hfc_timeout - tv.tv_sec);
500 hotfileinfo.threshold = SWAP_BE32 (HFC_MINIMUM_TEMPERATURE);
501 hotfileinfo.maxfileblks = SWAP_BE32 (HFC_MAXIMUM_FILESIZE / HFSTOVCB(hfsmp)->blockSize);
502 if (hfsmp->hfs_flags & HFS_CS_HOTFILE_PIN) {
503 hotfileinfo.usedblocks = SWAP_BE32 (hfsmp->hfs_hotfile_maxblks - hfs_hotfile_cur_freeblks(hfsmp));
504 #if HFC_VERBOSE
505 printf("hfs: %s: saving usedblocks = %d (timeleft: %d; timeout %ld)\n", hfsmp->vcbVN, (hfsmp->hfs_hotfile_maxblks - hfsmp->hfs_hotfile_freeblks),
506 SWAP_BE32(hotfileinfo.timeleft), hfsmp->hfc_timeout);
507 #endif
508 } else {
509 hotfileinfo.maxfilecnt = SWAP_BE32 (HFC_DEFAULT_FILE_COUNT);
510 }
511 strlcpy((char *)hotfileinfo.tag, hfc_tag, sizeof hotfileinfo.tag);
512 (void) BTSetUserData(VTOF(hfsmp->hfc_filevp), &hotfileinfo, sizeof(hotfileinfo));
513 }
514
515 /*
516 * Suspend recording the hotest files on a file system.
517 */
518 int
519 hfs_recording_suspend(struct hfsmount *hfsmp)
520 {
521 hotfile_data_t *hotdata = NULL;
522 int error;
523
524 if (hfsmp->hfc_stage == HFC_DISABLED)
525 return (0);
526
527 lck_mtx_lock(&hfsmp->hfc_mutex);
528
529 /*
530 * XXX NOTE
531 * A suspend can occur during eval/evict/adopt stage.
532 * In that case we would need to write out info and
533 * flush our HFBT vnode. Currently we just bail.
534 */
535
536 hotdata = (hotfile_data_t *)hfsmp->hfc_recdata;
537 if (hotdata == NULL || hfsmp->hfc_stage != HFC_RECORDING) {
538 error = 0;
539 goto out;
540 }
541 hfsmp->hfc_stage = HFC_BUSY;
542
543 #if HFC_VERBOSE
544 printf("hfs: suspend hot file recording on %s\n", hfsmp->vcbVN);
545 #endif
546 error = hfc_btree_open(hfsmp, &hfsmp->hfc_filevp);
547 if (error) {
548 printf("hfs_recording_suspend: err %d opening btree\n", error);
549 goto out;
550 }
551
552 if (hfs_start_transaction(hfsmp) != 0) {
553 goto out;
554 }
555 if (hfs_lock(VTOC(hfsmp->hfc_filevp), HFS_EXCLUSIVE_LOCK, HFS_LOCK_DEFAULT) != 0) {
556 goto end_transaction;
557 }
558
559 save_btree_user_info(hfsmp);
560
561 hfs_unlock(VTOC(hfsmp->hfc_filevp));
562
563 end_transaction:
564 hfs_end_transaction(hfsmp);
565
566 out:
567 if (hfsmp->hfc_filevp) {
568 (void) hfc_btree_close(hfsmp, hfsmp->hfc_filevp);
569 hfsmp->hfc_filevp = NULL;
570 }
571 if (hotdata) {
572 FREE(hotdata, M_TEMP);
573 hfsmp->hfc_recdata = NULL;
574 }
575 hfsmp->hfc_stage = HFC_DISABLED;
576 wakeup((caddr_t)&hfsmp->hfc_stage);
577
578 lck_mtx_unlock(&hfsmp->hfc_mutex);
579 return (error);
580 }
581
582
583 static void
584 reset_file_ids(struct hfsmount *hfsmp, uint32_t *fileid_table, int num_ids)
585 {
586 int i, error;
587
588 for(i=0; i < num_ids; i++) {
589 struct vnode *vp;
590
591 error = hfs_vget(hfsmp, fileid_table[i], &vp, 0, 0);
592 if (error) {
593 if (error == ENOENT) {
594 error = 0;
595 continue; /* stale entry, go to next */
596 }
597 continue;
598 }
599
600 // hfs_vget returns a locked cnode so no need to lock here
601
602 if ((hfsmp->hfs_flags & HFS_CS_HOTFILE_PIN) && (VTOC(vp)->c_attr.ca_recflags & kHFSFastDevPinnedMask)) {
603 error = hfs_pin_vnode(hfsmp, vp, HFS_UNPIN_IT, NULL, vfs_context_kernel());
604 }
605
606 /*
607 * The updates to the catalog must be journaled
608 */
609 hfs_start_transaction(hfsmp);
610
611 //
612 // turn off _all_ the hotfile related bits since we're resetting state
613 //
614 if (VTOC(vp)->c_attr.ca_recflags & kHFSFastDevCandidateMask) {
615 vnode_clearfastdevicecandidate(vp);
616 }
617
618 VTOC(vp)->c_attr.ca_recflags &= ~(kHFSFastDevPinnedMask|kHFSDoNotFastDevPinMask|kHFSFastDevCandidateMask|kHFSAutoCandidateMask);
619 VTOC(vp)->c_flag |= C_MODIFIED;
620
621 hfs_update(vp, 0);
622
623 hfs_end_transaction(hfsmp);
624
625 hfs_unlock(VTOC(vp));
626 vnode_put(vp);
627 }
628 }
629
630 static int
631 flag_hotfile(struct hfsmount *hfsmp, const char *filename)
632 {
633 struct vnode *dvp = NULL, *fvp = NULL;
634 vfs_context_t ctx = vfs_context_kernel();
635 struct componentname cname;
636 int error=0;
637 size_t fname_len;
638 const char *orig_fname = filename;
639
640 if (filename == NULL) {
641 return EINVAL;
642 }
643
644 fname_len = strlen(filename); // do NOT include the trailing '\0' so that we break out of the loop below
645
646 error = VFS_ROOT(HFSTOVFS(hfsmp), &dvp, ctx);
647 if (error) {
648 return (error);
649 }
650
651 /* At this point, 'dvp' must be considered iocounted */
652 const char *ptr;
653 ptr = filename;
654
655 while (ptr < (orig_fname + fname_len - 1)) {
656 for(; ptr < (orig_fname + fname_len) && *ptr && *ptr != '/'; ptr++) {
657 /* just keep advancing till we reach the end of the string or a slash */
658 }
659
660 cname.cn_nameiop = LOOKUP;
661 cname.cn_flags = ISLASTCN;
662 cname.cn_context = ctx;
663 cname.cn_ndp = NULL;
664 cname.cn_pnbuf = __DECONST(char *, orig_fname);
665 cname.cn_nameptr = __DECONST(char *, filename);
666 cname.cn_pnlen = fname_len;
667 cname.cn_namelen = ptr - filename;
668 cname.cn_hash = 0;
669 cname.cn_consume = 0;
670
671 error = VNOP_LOOKUP(dvp, &fvp, &cname, ctx);
672 if (error) {
673 /*
674 * If 'dvp' is non-NULL, then it has an iocount. Make sure to release it
675 * before bailing out. VNOP_LOOKUP could legitimately return ENOENT
676 * if the item didn't exist or if we raced with a delete.
677 */
678 if (dvp) {
679 vnode_put(dvp);
680 dvp = NULL;
681 }
682 return error;
683 }
684
685 if (ptr < orig_fname + fname_len - 1) {
686 //
687 // we've got a multi-part pathname so drop the ref on the dir,
688 // make dvp become what we just looked up, and advance over
689 // the slash character in the pathname to get to the next part
690 // of the component
691 //
692 vnode_put(dvp);
693 dvp = fvp;
694 fvp = NULL;
695
696 filename = ++ptr; // skip the slash character
697 }
698 }
699
700 if (fvp == NULL) {
701 error = ENOENT;
702 goto out;
703 }
704
705 struct cnode *cp = VTOC(fvp);
706 if ((error = hfs_lock(cp, HFS_EXCLUSIVE_LOCK, HFS_LOCK_DEFAULT)) != 0) {
707 goto out;
708 }
709
710 hfs_start_transaction(hfsmp);
711
712 cp->c_attr.ca_recflags |= (kHFSFastDevCandidateMask|kHFSAutoCandidateMask);
713 cp->c_flag |= C_MODIFIED;
714
715 hfs_update(fvp, 0);
716
717 hfs_end_transaction(hfsmp);
718
719 hfs_unlock(cp);
720 //printf("hfs: flagged /%s with the fast-dev-candidate|auto-candidate flags\n", filename);
721
722
723 out:
724 if (fvp) {
725 vnode_put(fvp);
726 fvp = NULL;
727 }
728
729 if (dvp) {
730 vnode_put(dvp);
731 dvp = NULL;
732 }
733
734 return error;
735 }
736
737
738 static void
739 hfs_setup_default_cf_hotfiles(struct hfsmount *hfsmp)
740 {
741 const char *system_default_hotfiles[] = {
742 "usr",
743 "System",
744 "Applications",
745 "private/var/db/dyld"
746 };
747 int i;
748
749 for(i=0; i < (int)(sizeof(system_default_hotfiles)/sizeof(char *)); i++) {
750 flag_hotfile(hfsmp, system_default_hotfiles[i]);
751 }
752 }
753
754
755 #define NUM_FILE_RESET_IDS 4096 // so we allocate 16k to hold file-ids
756
757 static void
758 hfs_hotfile_reset(struct hfsmount *hfsmp)
759 {
760 CatalogKey * keyp;
761 CatalogRecord * datap;
762 u_int32_t dataSize;
763 BTScanState scanstate;
764 BTreeIterator * iterator = NULL;
765 FSBufferDescriptor record;
766 u_int32_t data;
767 u_int32_t cnid;
768 int error = 0;
769 uint32_t *fileids=NULL;
770 int cur_id_index = 0;
771
772 int cleared = 0; /* debug variables */
773 int filecount = 0;
774 int dircount = 0;
775
776 #if HFC_VERBOSE
777 printf("hfs: %s: %s\n", hfsmp->vcbVN, __FUNCTION__);
778 #endif
779
780 MALLOC(iterator, BTreeIterator *, sizeof(*iterator), M_TEMP, M_WAITOK);
781 if (iterator == NULL) {
782 error = ENOMEM;
783 goto out;
784 }
785 bzero(iterator, sizeof(*iterator));
786
787 MALLOC(fileids, uint32_t *, NUM_FILE_RESET_IDS * sizeof(uint32_t), M_TEMP, M_WAITOK);
788 if (fileids == NULL) {
789 error = ENOMEM;
790 goto out;
791 }
792
793 record.bufferAddress = &data;
794 record.itemSize = sizeof(u_int32_t);
795 record.itemCount = 1;
796
797 /*
798 * Get ready to scan the Catalog file.
799 */
800 error = BTScanInitialize(VTOF(HFSTOVCB(hfsmp)->catalogRefNum), 0, 0, 0,
801 kCatSearchBufferSize, &scanstate);
802 if (error) {
803 printf("hfs_hotfile_reset: err %d BTScanInit\n", error);
804 goto out;
805 }
806
807 /*
808 * Visit all the catalog btree leaf records, clearing any that have the
809 * HotFileCached bit set.
810 */
811 for (;;) {
812 error = BTScanNextRecord(&scanstate, 0, (void **)&keyp, (void **)&datap, &dataSize);
813 if (error) {
814 if (error == btNotFound)
815 error = 0;
816 else
817 printf("hfs_hotfile_reset: err %d BTScanNext\n", error);
818 break;
819 }
820
821 if (datap->recordType == kHFSPlusFolderRecord && (dataSize == sizeof(HFSPlusCatalogFolder))) {
822 HFSPlusCatalogFolder *dirp = (HFSPlusCatalogFolder *)datap;
823
824 dircount++;
825
826 if ((dirp->flags & (kHFSFastDevPinnedMask|kHFSDoNotFastDevPinMask|kHFSFastDevCandidateMask|kHFSAutoCandidateMask)) == 0) {
827 continue;
828 }
829
830 cnid = dirp->folderID;
831 } else if ((datap->recordType == kHFSPlusFileRecord) && (dataSize == sizeof(HFSPlusCatalogFile))) {
832 HFSPlusCatalogFile *filep = (HFSPlusCatalogFile *)datap;
833
834 filecount++;
835
836 /*
837 * If the file doesn't have any of the HotFileCached bits set, ignore it.
838 */
839 if ((filep->flags & (kHFSFastDevPinnedMask|kHFSDoNotFastDevPinMask|kHFSFastDevCandidateMask|kHFSAutoCandidateMask)) == 0) {
840 continue;
841 }
842
843 cnid = filep->fileID;
844 } else {
845 continue;
846 }
847
848 /* Skip over journal files. */
849 if (cnid == hfsmp->hfs_jnlfileid || cnid == hfsmp->hfs_jnlinfoblkid) {
850 continue;
851 }
852
853 //
854 // Just record the cnid of the file for now. We will modify it separately
855 // because we can't modify the catalog while we're scanning it.
856 //
857 fileids[cur_id_index++] = cnid;
858 if (cur_id_index >= NUM_FILE_RESET_IDS) {
859 //
860 // We're over the limit of file-ids so we have to terminate this
861 // scan, go modify all the catalog records, then restart the scan.
862 // This is required because it's not permissible to modify the
863 // catalog while scanning it.
864 //
865 (void) BTScanTerminate(&scanstate, &data, &data, &data);
866
867 reset_file_ids(hfsmp, fileids, cur_id_index);
868 cleared += cur_id_index;
869 cur_id_index = 0;
870
871 // restart the scan
872 error = BTScanInitialize(VTOF(HFSTOVCB(hfsmp)->catalogRefNum), 0, 0, 0,
873 kCatSearchBufferSize, &scanstate);
874 if (error) {
875 printf("hfs_hotfile_reset: err %d BTScanInit\n", error);
876 goto out;
877 }
878 continue;
879 }
880 }
881
882 if (cur_id_index) {
883 reset_file_ids(hfsmp, fileids, cur_id_index);
884 cleared += cur_id_index;
885 cur_id_index = 0;
886 }
887
888 printf("hfs: cleared HotFileCache related bits on %d files out of %d (dircount %d)\n", cleared, filecount, dircount);
889
890 (void) BTScanTerminate(&scanstate, &data, &data, &data);
891
892 out:
893 if (fileids)
894 FREE(fileids, M_TEMP);
895
896 if (iterator)
897 FREE(iterator, M_TEMP);
898
899 //
900 // If the hotfile btree exists, delete it. We need to open
901 // it to be able to delete it because we need the hfc_filevp
902 // for deletion.
903 //
904 error = hfc_btree_open_ext(hfsmp, &hfsmp->hfc_filevp, 1);
905 if (!error) {
906 printf("hfs: hotfile_reset: deleting existing hotfile btree\n");
907 hfc_btree_delete(hfsmp);
908 }
909
910 if (hfsmp->hfc_filevp) {
911 (void) hfc_btree_close(hfsmp, hfsmp->hfc_filevp);
912 hfsmp->hfc_filevp = NULL;
913 }
914
915 hfsmp->hfs_hotfile_blk_adjust = 0;
916 hfsmp->hfs_hotfile_freeblks = hfsmp->hfs_hotfile_maxblks;
917 }
918
919
920 //
921 // This should ONLY be called by hfs_recording_init() and the special fsctl.
922 //
923 // We assume that the hotfile btree is already opened.
924 //
925 static int
926 hfs_hotfile_repin_files(struct hfsmount *hfsmp)
927 {
928 BTreeIterator * iterator = NULL;
929 HotFileKey * key;
930 filefork_t * filefork;
931 int error = 0;
932 int bt_op;
933 enum hfc_stage stage;
934 uint32_t pinned_blocks;
935 uint32_t num_files=0, nrsrc=0;
936 uint32_t total_pinned=0;
937
938 if (!(hfsmp->hfs_flags & HFS_CS_HOTFILE_PIN) || !hfsmp->hfc_filevp) {
939 //
940 // this is only meaningful if we're pinning hotfiles
941 // (as opposed to the regular form of hotfiles that
942 // get relocated to the hotfile zone)
943 //
944 return 0;
945 }
946
947 #if HFC_VERBOSE
948 printf("hfs: %s: %s\n", hfsmp->vcbVN, __FUNCTION__);
949 #endif
950
951 if (hfs_lock(VTOC(hfsmp->hfc_filevp), HFS_EXCLUSIVE_LOCK, HFS_LOCK_DEFAULT) != 0) {
952 return (EPERM);
953 }
954
955
956 MALLOC(iterator, BTreeIterator *, sizeof(*iterator), M_TEMP, M_WAITOK);
957 if (iterator == NULL) {
958 hfs_unlock(VTOC(hfsmp->hfc_filevp));
959 return (ENOMEM);
960 }
961
962 stage = hfsmp->hfc_stage;
963 hfsmp->hfc_stage = HFC_BUSY;
964
965 bt_op = kBTreeFirstRecord;
966
967 bzero(iterator, sizeof(*iterator));
968 key = (HotFileKey*) &iterator->key;
969
970 filefork = VTOF(hfsmp->hfc_filevp);
971 int lockflags;
972
973 while (1) {
974
975 lockflags = 0;
976 /*
977 * Obtain the first record (ie the coldest one).
978 */
979 if (BTIterateRecord(filefork, bt_op, iterator, NULL, NULL) != 0) {
980 // no more records
981 error = 0;
982 break;
983 }
984 if (key->keyLength != HFC_KEYLENGTH) {
985 // printf("hfs: hotfiles_repin_files: invalid key length %d\n", key->keyLength);
986 error = EFTYPE;
987 break;
988 }
989 if (key->temperature == HFC_LOOKUPTAG) {
990 // ran into thread records in the hotfile btree
991 error = 0;
992 break;
993 }
994
995 //
996 // Just lookup the records in the catalog and pin the direct
997 // mapped extents. Faster than instantiating full vnodes
998 // (and thereby thrashing the system vnode cache).
999 //
1000 struct cat_desc fdesc;
1001 struct cat_attr attr;
1002 struct cat_fork fork;
1003 uint8_t forktype = 0;
1004
1005 lockflags = hfs_systemfile_lock(hfsmp, (SFL_CATALOG | SFL_EXTENTS), HFS_SHARED_LOCK);
1006 /*
1007 * Snoop the cnode hash to find out if the item we want is in-core already.
1008 *
1009 * We largely expect this function to fail (the items we want are probably not in the hash).
1010 * we use the special variant which bails out as soon as it finds a vnode (even if it is
1011 * marked as open-unlinked or actually removed on-disk. If we find a vnode, then we
1012 * release the systemfile locks and go through the pin-vnode path instead.
1013 */
1014 if (hfs_chash_snoop (hfsmp, key->fileID, 1, NULL, NULL) == 0) {
1015 pinned_blocks = 0;
1016
1017 /* unlock immediately and go through the in-core path */
1018 hfs_systemfile_unlock(hfsmp, lockflags);
1019 lockflags = 0;
1020
1021 error = hfs_getvnode_and_pin (hfsmp, key->fileID, &pinned_blocks);
1022 if (error) {
1023 /* if ENOENT, then it was deleted in the catalog. Remove from our hotfiles tracking */
1024 if (error == ENOENT) {
1025 hfc_btree_delete_record(hfsmp, iterator, key);
1026 }
1027 /* other errors, just ignore and move on with life */
1028 }
1029 else { //!error
1030 total_pinned += pinned_blocks;
1031 num_files++;
1032 }
1033
1034 goto next;
1035 }
1036
1037 /* If we get here, we're still holding the systemfile locks */
1038 error = cat_idlookup(hfsmp, key->fileID, 1, 0, &fdesc, &attr, &fork);
1039 if (error) {
1040 //
1041 // this file system could have been mounted while booted from a
1042 // different partition and thus the hotfile btree would not have
1043 // been maintained. thus a file that was hotfile cached could
1044 // have been deleted while booted from a different partition which
1045 // means we need to delete it from the hotfile btree.
1046 //
1047 // block accounting is taken care of at the end: we re-assign
1048 // hfsmp->hfs_hotfile_freeblks based on how many blocks we actually
1049 // pinned.
1050 //
1051 hfc_btree_delete_record(hfsmp, iterator, key);
1052
1053 goto next;
1054 }
1055
1056 if (fork.cf_size == 0) {
1057 // hmmm, the data is probably in the resource fork (aka a compressed file)
1058 error = cat_idlookup(hfsmp, key->fileID, 1, 1, &fdesc, &attr, &fork);
1059 if (error) {
1060 hfc_btree_delete_record(hfsmp, iterator, key);
1061 goto next;
1062 }
1063 forktype = 0xff;
1064 nrsrc++;
1065 }
1066
1067 pinned_blocks = 0;
1068
1069 /* Can't release the catalog /extents lock yet, we may need to go find the overflow blocks */
1070 error = hfs_pin_extent_record (hfsmp, fork.cf_extents, &pinned_blocks);
1071 if (error) {
1072 goto next; //skip to next
1073 }
1074 /* add in the blocks from the inline 8 */
1075 total_pinned += pinned_blocks;
1076 pinned_blocks = 0;
1077
1078 /* Could this file have overflow extents? */
1079 if (fork.cf_extents[kHFSPlusExtentDensity-1].startBlock) {
1080 /* better pin them, too */
1081 error = hfs_pin_overflow_extents (hfsmp, key->fileID, forktype, &pinned_blocks);
1082 if (error) {
1083 /* If we fail to pin all of the overflow extents, then just skip to the next file */
1084 goto next;
1085 }
1086 }
1087
1088 num_files++;
1089 if (pinned_blocks) {
1090 /* now add in any overflow also */
1091 total_pinned += pinned_blocks;
1092 }
1093
1094 next:
1095 if (lockflags) {
1096 hfs_systemfile_unlock(hfsmp, lockflags);
1097 lockflags = 0;
1098 }
1099 bt_op = kBTreeNextRecord;
1100
1101 } /* end while */
1102
1103 #if HFC_VERBOSE
1104 printf("hfs: hotfiles_repin_files: re-pinned %d files (nrsrc %d, total pinned %d blks; freeblock %d, maxblocks %d, calculated free: %d)\n",
1105 num_files, nrsrc, total_pinned, hfsmp->hfs_hotfile_freeblks, hfsmp->hfs_hotfile_maxblks,
1106 hfsmp->hfs_hotfile_maxblks - total_pinned);
1107 #endif
1108 //
1109 // make sure this is accurate based on how many blocks we actually pinned
1110 //
1111 hfsmp->hfs_hotfile_freeblks = hfsmp->hfs_hotfile_maxblks - total_pinned;
1112
1113 hfs_unlock(VTOC(hfsmp->hfc_filevp));
1114
1115 FREE(iterator, M_TEMP);
1116 hfsmp->hfc_stage = stage;
1117 wakeup((caddr_t)&hfsmp->hfc_stage);
1118 return (error);
1119 }
1120
1121 void
1122 hfs_repin_hotfiles(struct hfsmount *hfsmp)
1123 {
1124 int error, need_close;
1125
1126 lck_mtx_lock(&hfsmp->hfc_mutex);
1127
1128 if (hfsmp->hfc_filevp == NULL) {
1129 error = hfc_btree_open(hfsmp, &hfsmp->hfc_filevp);
1130 if (!error) {
1131 need_close = 1;
1132 } else {
1133 printf("hfs: failed to open the btree err=%d. Unable to re-pin hotfiles.\n", error);
1134 lck_mtx_unlock(&hfsmp->hfc_mutex);
1135 return;
1136 }
1137 } else {
1138 need_close = 0;
1139 }
1140
1141 hfs_pin_vnode(hfsmp, hfsmp->hfc_filevp, HFS_PIN_IT, NULL, vfs_context_kernel());
1142
1143 hfs_hotfile_repin_files(hfsmp);
1144
1145 if (need_close) {
1146 (void) hfc_btree_close(hfsmp, hfsmp->hfc_filevp);
1147 hfsmp->hfc_filevp = NULL;
1148 }
1149
1150 lck_mtx_unlock(&hfsmp->hfc_mutex);
1151 }
1152
1153 /*
1154 * For a given file ID, find and pin all of its overflow extents to the underlying CS
1155 * device. Assumes that the extents overflow b-tree is locked for the duration of this call.
1156 *
1157 * Emit the number of blocks pinned in output argument 'pinned'
1158 *
1159 * Return success or failure (errno) in return value.
1160 *
1161 */
1162 int hfs_pin_overflow_extents (struct hfsmount *hfsmp, uint32_t fileid,
1163 uint8_t forktype, uint32_t *pinned) {
1164
1165 struct BTreeIterator *ext_iter = NULL;
1166 ExtentKey *ext_key_ptr = NULL;
1167 ExtentRecord ext_data;
1168 FSBufferDescriptor btRecord;
1169 uint16_t btRecordSize;
1170 int error = 0;
1171
1172 uint32_t pinned_blocks = 0;
1173
1174
1175 MALLOC (ext_iter, struct BTreeIterator*, sizeof (struct BTreeIterator), M_TEMP, M_WAITOK);
1176 if (ext_iter == NULL) {
1177 return ENOMEM;
1178 }
1179 bzero (ext_iter, sizeof(*ext_iter));
1180
1181 BTInvalidateHint (ext_iter);
1182 ext_key_ptr = (ExtentKey*)&ext_iter->key;
1183 btRecord.bufferAddress = &ext_data;
1184 btRecord.itemCount = 1;
1185
1186 /*
1187 * This is like when you delete a file; we don't actually need most of the search machinery because
1188 * we are going to need all of the extent records that belong to this file (for a given fork type),
1189 * so we might as well use a straight-up iterator.
1190 *
1191 * Position the B-Tree iterator at the first record with this file ID
1192 */
1193 btRecord.itemSize = sizeof (HFSPlusExtentRecord);
1194 ext_key_ptr->hfsPlus.keyLength = kHFSPlusExtentKeyMaximumLength;
1195 ext_key_ptr->hfsPlus.forkType = forktype;
1196 ext_key_ptr->hfsPlus.pad = 0;
1197 ext_key_ptr->hfsPlus.fileID = fileid;
1198 ext_key_ptr->hfsPlus.startBlock = 0;
1199
1200 error = BTSearchRecord (VTOF(hfsmp->hfs_extents_vp), ext_iter, &btRecord, &btRecordSize, ext_iter);
1201 if (error == btNotFound) {
1202 /* empty b-tree, so that's ok. we'll fall out during error check below. */
1203 error = 0;
1204 }
1205
1206 while (1) {
1207 uint32_t found_fileid;
1208 uint32_t pblocks;
1209
1210 error = BTIterateRecord (VTOF(hfsmp->hfs_extents_vp), kBTreeNextRecord, ext_iter, &btRecord, &btRecordSize);
1211 if (error) {
1212 /* swallow it if it's btNotFound, otherwise just bail out */
1213 if (error == btNotFound)
1214 error = 0;
1215 break;
1216 }
1217
1218 found_fileid = ext_key_ptr->hfsPlus.fileID;
1219 /*
1220 * We only do one fork type at a time. So if either the fork-type doesn't
1221 * match what we are looking for (resource or data), OR the file id doesn't match
1222 * which indicates that there's nothing more with this file ID as the key, then bail out
1223 */
1224 if ((found_fileid != fileid) || (ext_key_ptr->hfsPlus.forkType != forktype)) {
1225 error = 0;
1226 break;
1227 }
1228
1229 /* Otherwise, we now have an extent record. Process and pin all of the file extents. */
1230 pblocks = 0;
1231 error = hfs_pin_extent_record (hfsmp, ext_data.hfsPlus, &pblocks);
1232
1233 if (error) {
1234 break;
1235 }
1236 pinned_blocks += pblocks;
1237
1238 /* if 8th extent is empty, then bail out */
1239 if (ext_data.hfsPlus[kHFSPlusExtentDensity-1].startBlock == 0) {
1240 error = 0;
1241 break;
1242 }
1243
1244 } // end extent-getting loop
1245
1246 /* dump the iterator */
1247 FREE (ext_iter, M_TEMP);
1248
1249 if (error == 0) {
1250 /*
1251 * In the event that the file has no overflow extents, pinned_blocks
1252 * will never be updated, so we'll properly export 0 pinned blocks to caller
1253 */
1254 *pinned = pinned_blocks;
1255 }
1256
1257 return error;
1258
1259 }
1260
1261
1262 static int
1263 hfs_getvnode_and_pin (struct hfsmount *hfsmp, uint32_t fileid, uint32_t *pinned) {
1264 struct vnode *vp;
1265 int error = 0;
1266 *pinned = 0;
1267 uint32_t pblocks;
1268
1269 /*
1270 * Acquire the vnode for this file. This returns a locked cnode on success
1271 */
1272 error = hfs_vget(hfsmp, fileid, &vp, 0, 0);
1273 if (error) {
1274 /* It's possible the file was open-unlinked. In this case, we'll get ENOENT back. */
1275 return error;
1276 }
1277
1278 /*
1279 * Symlinks that may have been inserted into the hotfile zone during a previous OS are now stuck
1280 * here. We do not want to move them.
1281 */
1282 if (!vnode_isreg(vp)) {
1283 hfs_unlock(VTOC(vp));
1284 vnode_put(vp);
1285 return EPERM;
1286 }
1287
1288 if (!(VTOC(vp)->c_attr.ca_recflags & kHFSFastDevPinnedMask)) {
1289 hfs_unlock(VTOC(vp));
1290 vnode_put(vp);
1291 return EINVAL;
1292 }
1293
1294 error = hfs_pin_vnode(hfsmp, vp, HFS_PIN_IT, &pblocks, vfs_context_kernel());
1295 if (error == 0) {
1296 *pinned = pblocks;
1297 }
1298
1299 hfs_unlock(VTOC(vp));
1300 vnode_put(vp);
1301
1302 return error;
1303
1304 }
1305
1306 /*
1307 * Pins an HFS Extent record to the underlying CoreStorage. Assumes that Catalog & Extents overflow
1308 * B-trees are held locked, as needed.
1309 *
1310 * Returns the number of blocks pinned in the output argument 'pinned'
1311 *
1312 * Returns error status (0 || errno) in return value.
1313 */
1314 static int hfs_pin_extent_record (struct hfsmount *hfsmp, HFSPlusExtentRecord extents, uint32_t *pinned) {
1315 uint32_t pb = 0;
1316 int i;
1317 int error;
1318
1319 if (pinned == NULL) {
1320 return EINVAL;
1321 }
1322 *pinned = 0;
1323
1324
1325
1326 /* iterate through the extents */
1327 for ( i = 0; i < kHFSPlusExtentDensity; i++) {
1328 if (extents[i].startBlock == 0) {
1329 break;
1330 }
1331
1332 error = hfs_pin_block_range (hfsmp, HFS_PIN_IT, extents[i].startBlock,
1333 extents[i].blockCount, vfs_context_kernel());
1334
1335 if (error) {
1336 break;
1337 }
1338 pb += extents[i].blockCount;
1339 }
1340
1341 *pinned = pb;
1342
1343 return error;
1344 }
1345
1346 /*
1347 * Consume an HFS Plus on-disk catalog record and pin its blocks
1348 * to the underlying CS devnode.
1349 *
1350 * NOTE: This is an important distinction!
1351 * This function takes in an HFSPlusCatalogFile* which is the actual
1352 * 200-some-odd-byte on-disk representation in the Catalog B-Tree (not
1353 * one of the run-time structs that we normally use.
1354 *
1355 * This assumes that the catalog and extents-overflow btrees
1356 * are locked, at least in shared mode
1357 */
1358 static int hfs_pin_catalog_rec (struct hfsmount *hfsmp, HFSPlusCatalogFile *cfp, int rsrc) {
1359 uint32_t pinned_blocks = 0;
1360 HFSPlusForkData *forkdata;
1361 int error = 0;
1362 uint8_t forktype = 0;
1363
1364 if (rsrc) {
1365 forkdata = &cfp->resourceFork;
1366 forktype = 0xff;
1367 }
1368 else {
1369 forkdata = &cfp->dataFork;
1370 }
1371
1372 uint32_t pblocks = 0;
1373
1374 /* iterate through the inline extents */
1375 error = hfs_pin_extent_record (hfsmp, forkdata->extents, &pblocks);
1376 if (error) {
1377 return error;
1378 }
1379
1380 pinned_blocks += pblocks;
1381 pblocks = 0;
1382
1383 /* it may have overflow extents */
1384 if (forkdata->extents[kHFSPlusExtentDensity-1].startBlock != 0) {
1385 error = hfs_pin_overflow_extents (hfsmp, cfp->fileID, forktype, &pblocks);
1386 }
1387 pinned_blocks += pblocks;
1388
1389 hfsmp->hfs_hotfile_freeblks -= pinned_blocks;
1390
1391 return error;
1392 }
1393
1394
1395 /*
1396 *
1397 */
1398 int
1399 hfs_recording_init(struct hfsmount *hfsmp)
1400 {
1401 CatalogKey * keyp;
1402 CatalogRecord * datap;
1403 u_int32_t dataSize;
1404 HFSPlusCatalogFile *filep;
1405 BTScanState scanstate;
1406 BTreeIterator * iterator = NULL;
1407 FSBufferDescriptor record;
1408 HotFileKey * key;
1409 filefork_t * filefork;
1410 u_int32_t data;
1411 struct cat_attr cattr;
1412 u_int32_t cnid;
1413 int error = 0;
1414 long starting_temp;
1415
1416 int started_tr = 0;
1417 int started_scan = 0;
1418
1419 int inserted = 0; /* debug variables */
1420 int filecount = 0;
1421 int uncacheable = 0;
1422
1423 /*
1424 * For now, only the boot volume is supported.
1425 */
1426 if ((vfs_flags(HFSTOVFS(hfsmp)) & MNT_ROOTFS) == 0) {
1427 hfsmp->hfc_stage = HFC_DISABLED;
1428 return (EPERM);
1429 }
1430
1431 /* We grab the HFC mutex even though we're not fully mounted yet, just for orderliness */
1432 lck_mtx_lock (&hfsmp->hfc_mutex);
1433
1434 /*
1435 * Tracking of hot files requires up-to-date access times.
1436 * So if access time updates are disabled, then we disable
1437 * hot files, too.
1438 */
1439 if (vfs_flags(HFSTOVFS(hfsmp)) & MNT_NOATIME) {
1440 hfsmp->hfc_stage = HFC_DISABLED;
1441 lck_mtx_unlock (&hfsmp->hfc_mutex);
1442 return EPERM;
1443 }
1444
1445 //
1446 // Check if we've been asked to suspend operation
1447 //
1448 cnid = GetFileInfo(HFSTOVCB(hfsmp), kRootDirID, ".hotfile-suspend", &cattr, NULL);
1449 if (cnid != 0) {
1450 printf("hfs: %s: %s: hotfiles explicitly disabled! remove /.hotfiles-suspend to re-enable\n", hfsmp->vcbVN, __FUNCTION__);
1451 hfsmp->hfc_stage = HFC_DISABLED;
1452 lck_mtx_unlock (&hfsmp->hfc_mutex);
1453 return EPERM;
1454 }
1455
1456 //
1457 // Check if we've been asked to reset our state.
1458 //
1459 cnid = GetFileInfo(HFSTOVCB(hfsmp), kRootDirID, ".hotfile-reset", &cattr, NULL);
1460 if (cnid != 0) {
1461 hfs_hotfile_reset(hfsmp);
1462 }
1463
1464 if (hfsmp->hfs_flags & HFS_CS_HOTFILE_PIN) {
1465 //
1466 // Cooperative Fusion (CF) systems use different constants
1467 // than traditional hotfile systems. These were picked after a bit of
1468 // experimentation - we can cache many more files on the
1469 // ssd in an CF system and we can do so more rapidly
1470 // so bump the limits considerably (and turn down the
1471 // duration so that it doesn't take weeks to adopt all
1472 // the files).
1473 //
1474 hfc_default_file_count = 20000;
1475 hfc_default_duration = 300; // 5min
1476 hfc_max_file_count = 50000;
1477 hfc_max_file_size = (512ULL * 1024ULL * 1024ULL);
1478 }
1479
1480 /*
1481 * If the Hot File btree exists then metadata zone is ready.
1482 */
1483 cnid = GetFileInfo(HFSTOVCB(hfsmp), kRootDirID, HFC_FILENAME, &cattr, NULL);
1484 if (cnid != 0 && S_ISREG(cattr.ca_mode)) {
1485 int recreate = 0;
1486
1487 if (hfsmp->hfc_stage == HFC_DISABLED)
1488 hfsmp->hfc_stage = HFC_IDLE;
1489 hfsmp->hfs_hotfile_freeblks = 0;
1490
1491 if ((hfsmp->hfs_flags & HFS_CS_HOTFILE_PIN) && cattr.ca_blocks > 0) {
1492 //
1493 // make sure the hotfile btree is pinned
1494 //
1495 error = hfc_btree_open(hfsmp, &hfsmp->hfc_filevp);
1496 if (!error) {
1497 /* XXX: must fix hfs_pin_vnode too */
1498 hfs_pin_vnode(hfsmp, hfsmp->hfc_filevp, HFS_PIN_IT, NULL, vfs_context_kernel());
1499
1500 } else {
1501 printf("hfs: failed to open the btree err=%d. Recreating hotfile btree.\n", error);
1502 recreate = 1;
1503 }
1504
1505 hfs_hotfile_repin_files(hfsmp);
1506
1507 if (hfsmp->hfc_filevp) {
1508 (void) hfc_btree_close(hfsmp, hfsmp->hfc_filevp);
1509 hfsmp->hfc_filevp = NULL;
1510 }
1511
1512 } else if (hfsmp->hfs_flags & HFS_CS_HOTFILE_PIN) {
1513 // hmmm, the hotfile btree is zero bytes long? how odd. let's recreate it.
1514 printf("hfs: hotfile btree is zero bytes long?! recreating it.\n");
1515 recreate = 1;
1516 }
1517
1518 if (!recreate) {
1519 /* don't forget to unlock the mutex */
1520 lck_mtx_unlock (&hfsmp->hfc_mutex);
1521 return (0);
1522 } else {
1523 //
1524 // open the hotfile btree file ignoring errors because
1525 // we need the vnode pointer for hfc_btree_delete() to
1526 // be able to do its work
1527 //
1528 error = hfc_btree_open_ext(hfsmp, &hfsmp->hfc_filevp, 1);
1529 if (!error) {
1530 // and delete it!
1531 error = hfc_btree_delete(hfsmp);
1532 (void) hfc_btree_close(hfsmp, hfsmp->hfc_filevp);
1533 hfsmp->hfc_filevp = NULL;
1534 }
1535 }
1536 }
1537
1538 printf("hfs: %s: %s: creating the hotfile btree\n", hfsmp->vcbVN, __FUNCTION__);
1539 if (hfs_start_transaction(hfsmp) != 0) {
1540 lck_mtx_unlock (&hfsmp->hfc_mutex);
1541 return EINVAL;
1542 }
1543
1544 /* B-tree creation must be journaled */
1545 started_tr = 1;
1546
1547 error = hfc_btree_create(hfsmp, HFSTOVCB(hfsmp)->blockSize, HFC_DEFAULT_FILE_COUNT);
1548 if (error) {
1549 #if HFC_VERBOSE
1550 printf("hfs: Error %d creating hot file b-tree on %s \n", error, hfsmp->vcbVN);
1551 #endif
1552 goto recording_init_out;
1553 }
1554
1555 hfs_end_transaction (hfsmp);
1556 started_tr = 0;
1557 /*
1558 * Do a journal flush + flush track cache. We have to ensure that the async I/Os have been issued to the media
1559 * before proceeding.
1560 */
1561 hfs_flush (hfsmp, HFS_FLUSH_FULL);
1562
1563 /* now re-start a new transaction */
1564 if (hfs_start_transaction (hfsmp) != 0) {
1565 lck_mtx_unlock (&hfsmp->hfc_mutex);
1566 return EINVAL;
1567 }
1568 started_tr = 1;
1569
1570 /*
1571 * Open the Hot File B-tree file for writing.
1572 */
1573 if (hfsmp->hfc_filevp)
1574 panic("hfs_recording_init: hfc_filevp exists (vp = %p)", hfsmp->hfc_filevp);
1575
1576 error = hfc_btree_open(hfsmp, &hfsmp->hfc_filevp);
1577 if (error) {
1578 #if HFC_VERBOSE
1579 printf("hfs: Error %d opening hot file b-tree on %s \n", error, hfsmp->vcbVN);
1580 #endif
1581 goto recording_init_out;
1582 }
1583
1584 /*
1585 * This function performs work similar to namei; we must NOT hold the catalog lock while
1586 * calling it. This will decorate catalog records as being pinning candidates. (no hotfiles work)
1587 */
1588 hfs_setup_default_cf_hotfiles(hfsmp);
1589
1590 /*
1591 * now grab the hotfiles b-tree vnode/cnode lock first, as it is not classified as a systemfile.
1592 */
1593 if (hfs_lock(VTOC(hfsmp->hfc_filevp), HFS_EXCLUSIVE_LOCK, HFS_LOCK_DEFAULT) != 0) {
1594 error = EPERM;
1595 (void) hfc_btree_close(hfsmp, hfsmp->hfc_filevp);
1596 /* zero it out to avoid pinning later on */
1597 hfsmp->hfc_filevp = NULL;
1598 goto recording_init_out;
1599 }
1600
1601 MALLOC(iterator, BTreeIterator *, sizeof(*iterator), M_TEMP, M_WAITOK);
1602 if (iterator == NULL) {
1603 error = ENOMEM;
1604 hfs_unlock (VTOC(hfsmp->hfc_filevp));
1605 (void) hfc_btree_close(hfsmp, hfsmp->hfc_filevp);
1606 /* zero it out to avoid pinning */
1607 hfsmp->hfc_filevp = NULL;
1608 goto recording_init_out;
1609 }
1610
1611 bzero(iterator, sizeof(*iterator));
1612 key = (HotFileKey*) &iterator->key;
1613 key->keyLength = HFC_KEYLENGTH;
1614
1615 record.bufferAddress = &data;
1616 record.itemSize = sizeof(u_int32_t);
1617 record.itemCount = 1;
1618
1619 #if HFC_VERBOSE
1620 printf("hfs: Evaluating space for \"%s\" metadata zone... (freeblks %d)\n", HFSTOVCB(hfsmp)->vcbVN,
1621 hfsmp->hfs_hotfile_freeblks);
1622 #endif
1623
1624 /*
1625 * Get ready to scan the Catalog file. We explicitly do NOT grab the catalog lock because
1626 * we're fully single-threaded at the moment (by virtue of being called during mount()),
1627 * and if we have to grow the hotfile btree, then we would need to grab the catalog lock
1628 * and if we take a shared lock here, it would deadlock (see <rdar://problem/21486585>)
1629 *
1630 * We already started a transaction so we should already be holding the journal lock at this point.
1631 * Note that we have to hold the journal lock / start a txn BEFORE the systemfile locks.
1632 */
1633
1634 error = BTScanInitialize(VTOF(HFSTOVCB(hfsmp)->catalogRefNum), 0, 0, 0,
1635 kCatSearchBufferSize, &scanstate);
1636 if (error) {
1637 printf("hfs_recording_init: err %d BTScanInit\n", error);
1638
1639 /* drop the systemfile locks */
1640 hfs_unlock(VTOC(hfsmp->hfc_filevp));
1641
1642 (void) hfc_btree_close(hfsmp, hfsmp->hfc_filevp);
1643
1644 /* zero it out to avoid pinning */
1645 hfsmp->hfc_filevp = NULL;
1646 goto recording_init_out;
1647 }
1648
1649 started_scan = 1;
1650
1651 filefork = VTOF(hfsmp->hfc_filevp);
1652
1653 starting_temp = random() % HF_TEMP_RANGE;
1654
1655 /*
1656 * Visit all the catalog btree leaf records. We have to hold the catalog lock to do this.
1657 *
1658 * NOTE: The B-Tree scanner reads from the media itself. Under normal circumstances it would be
1659 * fine to simply use b-tree routines to read blocks that correspond to b-tree nodes, because the
1660 * block cache is going to ensure you always get the cached copy of a block (even if a journal
1661 * txn has modified one of those blocks). That is NOT true when
1662 * using the scanner. In particular, it will always read whatever is on-disk. So we have to ensure
1663 * that the journal has flushed and that the async I/Os to the metadata files have been issued.
1664 */
1665 for (;;) {
1666 error = BTScanNextRecord(&scanstate, 0, (void **)&keyp, (void **)&datap, &dataSize);
1667 if (error) {
1668 if (error == btNotFound)
1669 error = 0;
1670 else
1671 printf("hfs_recording_init: err %d BTScanNext\n", error);
1672 break;
1673 }
1674 if ((datap->recordType != kHFSPlusFileRecord) ||
1675 (dataSize != sizeof(HFSPlusCatalogFile))) {
1676 continue;
1677 }
1678 filep = (HFSPlusCatalogFile *)datap;
1679 filecount++;
1680
1681 if (hfsmp->hfs_flags & HFS_CS_HOTFILE_PIN) {
1682 if (filep->flags & kHFSDoNotFastDevPinMask) {
1683 uncacheable++;
1684 }
1685
1686 //
1687 // If the file does not have the FastDevPinnedMask set, we
1688 // can ignore it and just go to the next record.
1689 //
1690 if ((filep->flags & kHFSFastDevPinnedMask) == 0) {
1691 continue;
1692 }
1693 } else if (filep->dataFork.totalBlocks == 0) {
1694 continue;
1695 }
1696
1697 /*
1698 * On a regular hdd, any file that has blocks inside
1699 * the hot file space is recorded for later eviction.
1700 *
1701 * For now, resource forks are ignored.
1702 *
1703 * We don't do this on CF systems as there is no real
1704 * hotfile area - we just pin/unpin blocks belonging to
1705 * interesting files.
1706 */
1707 if (!(hfsmp->hfs_flags & HFS_CS_HOTFILE_PIN) && !hotextents(hfsmp, &filep->dataFork.extents[0])) {
1708 continue;
1709 }
1710 cnid = filep->fileID;
1711
1712 /* Skip over journal files and the hotfiles B-Tree file. */
1713 if (cnid == hfsmp->hfs_jnlfileid
1714 || cnid == hfsmp->hfs_jnlinfoblkid
1715 || cnid == VTOC(hfsmp->hfc_filevp)->c_fileid) {
1716 continue;
1717 }
1718 /*
1719 * XXX - need to skip quota files as well.
1720 */
1721
1722 uint32_t temp;
1723
1724 if (hfsmp->hfs_flags & HFS_CS_HOTFILE_PIN) {
1725 int rsrc = 0;
1726
1727 temp = (uint32_t)starting_temp++;
1728 if (filep->flags & kHFSAutoCandidateMask) {
1729 temp += MAX_NORMAL_TEMP;
1730 }
1731
1732 /* use the data fork by default */
1733 if (filep->dataFork.totalBlocks == 0) {
1734 /*
1735 * but if empty, switch to rsrc as its likely
1736 * a compressed file
1737 */
1738 rsrc = 1;
1739 }
1740
1741 error = hfs_pin_catalog_rec (hfsmp, filep, rsrc);
1742 if (error)
1743 break;
1744
1745 } else {
1746 temp = HFC_MINIMUM_TEMPERATURE;
1747 }
1748
1749 /* Insert a hot file entry. */
1750 key->keyLength = HFC_KEYLENGTH;
1751 key->temperature = temp;
1752 key->fileID = cnid;
1753 key->forkType = 0;
1754 data = 0x3f3f3f3f;
1755 error = BTInsertRecord(filefork, iterator, &record, record.itemSize);
1756 if (error) {
1757 printf("hfs_recording_init: BTInsertRecord failed %d (fileid %d)\n", error, key->fileID);
1758 error = MacToVFSError(error);
1759 break;
1760 }
1761
1762 /* Insert the corresponding thread record. */
1763 key->keyLength = HFC_KEYLENGTH;
1764 key->temperature = HFC_LOOKUPTAG;
1765 key->fileID = cnid;
1766 key->forkType = 0;
1767 data = temp;
1768 error = BTInsertRecord(filefork, iterator, &record, record.itemSize);
1769 if (error) {
1770 printf("hfs_recording_init: BTInsertRecord failed %d (fileid %d)\n", error, key->fileID);
1771 error = MacToVFSError(error);
1772 break;
1773 }
1774 inserted++;
1775 } // end catalog iteration loop
1776
1777 save_btree_user_info(hfsmp);
1778 (void) BTFlushPath(filefork);
1779
1780 recording_init_out:
1781
1782 /* Unlock first, then pin after releasing everything else */
1783 if (hfsmp->hfc_filevp) {
1784 hfs_unlock (VTOC(hfsmp->hfc_filevp));
1785 }
1786
1787 if (started_scan) {
1788 (void) BTScanTerminate (&scanstate, &data, &data, &data);
1789 }
1790
1791 if (started_tr) {
1792 hfs_end_transaction(hfsmp);
1793 }
1794
1795 #if HFC_VERBOSE
1796 printf("hfs: %d files identified out of %d (freeblocks is now: %d)\n", inserted, filecount, hfsmp->hfs_hotfile_freeblks);
1797 if (uncacheable) {
1798 printf("hfs: %d files were marked as uncacheable\n", uncacheable);
1799 }
1800 #endif
1801
1802 if (iterator)
1803 FREE(iterator, M_TEMP);
1804
1805 if (hfsmp->hfc_filevp) {
1806 if (hfsmp->hfs_flags & HFS_CS_HOTFILE_PIN) {
1807 hfs_pin_vnode(hfsmp, hfsmp->hfc_filevp, HFS_PIN_IT, NULL, vfs_context_kernel());
1808 }
1809 (void) hfc_btree_close(hfsmp, hfsmp->hfc_filevp);
1810 hfsmp->hfc_filevp = NULL;
1811 }
1812
1813 if (error == 0)
1814 hfsmp->hfc_stage = HFC_IDLE;
1815
1816 /* Finally, unlock the HFC mutex */
1817 lck_mtx_unlock (&hfsmp->hfc_mutex);
1818
1819 return (error);
1820 }
1821
1822 /*
1823 * Use sync to perform ocassional background work.
1824 */
1825 int
1826 hfs_hotfilesync(struct hfsmount *hfsmp, vfs_context_t ctx)
1827 {
1828 if (hfsmp->hfc_stage) {
1829 struct timeval tv;
1830
1831 lck_mtx_lock(&hfsmp->hfc_mutex);
1832
1833 switch (hfsmp->hfc_stage) {
1834 case HFC_IDLE:
1835 (void) hfs_recording_start(hfsmp);
1836 break;
1837
1838 case HFC_RECORDING:
1839 microtime(&tv);
1840 if (tv.tv_sec > hfsmp->hfc_timeout)
1841 (void) hfs_recording_stop(hfsmp);
1842 break;
1843
1844 case HFC_EVICTION:
1845 (void) hotfiles_evict(hfsmp, ctx);
1846 break;
1847
1848 case HFC_ADOPTION:
1849 (void) hotfiles_adopt(hfsmp, ctx);
1850 break;
1851 default:
1852 break;
1853 }
1854
1855 lck_mtx_unlock(&hfsmp->hfc_mutex);
1856 }
1857 return (0);
1858 }
1859
1860 /*
1861 * Add a hot file to the recording list.
1862 *
1863 * This can happen when a hot file gets reclaimed or at the
1864 * end of the recording period for any active hot file.
1865 *
1866 * NOTE: Since both the data and resource fork can be hot,
1867 * there can be two entries for the same file id.
1868 *
1869 * Note: the cnode is locked on entry.
1870 */
1871 int
1872 hfs_addhotfile(struct vnode *vp)
1873 {
1874 hfsmount_t *hfsmp;
1875 int error;
1876
1877 hfsmp = VTOHFS(vp);
1878 if (hfsmp->hfc_stage != HFC_RECORDING)
1879 return (0);
1880
1881 lck_mtx_lock(&hfsmp->hfc_mutex);
1882 error = hfs_addhotfile_internal(vp);
1883 lck_mtx_unlock(&hfsmp->hfc_mutex);
1884 return (error);
1885 }
1886
1887 static int
1888 hf_ignore_process(const char *pname, size_t maxlen)
1889 {
1890 if ( strncmp(pname, "mds", maxlen) == 0
1891 || strncmp(pname, "mdworker", maxlen) == 0
1892 || strncmp(pname, "mds_stores", maxlen) == 0
1893 || strncmp(pname, "makewhatis", maxlen) == 0) {
1894 return 1;
1895 }
1896
1897 return 0;
1898
1899 }
1900
1901 static int
1902 hfs_addhotfile_internal(struct vnode *vp)
1903 {
1904 hotfile_data_t *hotdata;
1905 hotfile_entry_t *entry;
1906 hfsmount_t *hfsmp;
1907 cnode_t *cp;
1908 filefork_t *ffp;
1909 u_int32_t temperature;
1910
1911 hfsmp = VTOHFS(vp);
1912 if (hfsmp->hfc_stage != HFC_RECORDING)
1913 return (0);
1914
1915 /*
1916 * Only regular files are eligible for hotfiles addition.
1917 *
1918 * Symlinks were previously added to the list and may exist in
1919 * extant hotfiles regions, but no new ones will be added, and no
1920 * symlinks will now be relocated/evicted from the hotfiles region.
1921 */
1922 if (!vnode_isreg(vp) || vnode_issystem(vp)) {
1923 return (0);
1924 }
1925
1926 /* Skip resource forks for now. */
1927 if (VNODE_IS_RSRC(vp)) {
1928 return (0);
1929 }
1930 if ((hotdata = (hotfile_data_t *)hfsmp->hfc_recdata) == NULL) {
1931 return (0);
1932 }
1933 ffp = VTOF(vp);
1934 cp = VTOC(vp);
1935
1936 if (cp->c_attr.ca_recflags & (kHFSFastDevPinnedMask|kHFSDoNotFastDevPinMask)) {
1937 // it's already a hotfile or can't be a hotfile...
1938 return 0;
1939 }
1940
1941 if (vnode_isdir(vp) || vnode_issystem(vp) || (cp->c_flag & (C_DELETED | C_NOEXISTS))) {
1942 return 0;
1943 }
1944
1945 if ((hfsmp->hfs_flags & HFS_CS_HOTFILE_PIN) && vnode_isfastdevicecandidate(vp)) {
1946 //
1947 // On cooperative fusion (CF) systems we have different criteria for whether something
1948 // can be pinned to the ssd.
1949 //
1950 if (cp->c_flag & (C_DELETED|C_NOEXISTS)) {
1951 //
1952 // dead files are definitely not worth caching
1953 //
1954 return 0;
1955 } else if (ffp->ff_blocks == 0 && !(cp->c_bsdflags & UF_COMPRESSED) && !(cp->c_attr.ca_recflags & kHFSFastDevCandidateMask)) {
1956 //
1957 // empty files aren't worth caching but compressed ones might be, as are
1958 // newly created files that live in WorthCaching directories...
1959 //
1960 return 0;
1961 }
1962
1963 char pname[256];
1964 pname[0] = '\0';
1965 proc_selfname(pname, sizeof(pname));
1966 if (hf_ignore_process(pname, sizeof(pname))) {
1967 // ignore i/o's from certain system daemons
1968 return 0;
1969 }
1970
1971 temperature = cp->c_fileid; // in memory we just keep it sorted by file-id
1972 } else {
1973 // the normal hard drive based hotfile checks
1974 if ((ffp->ff_bytesread == 0) ||
1975 (ffp->ff_blocks == 0) ||
1976 (ffp->ff_size == 0) ||
1977 (ffp->ff_blocks > hotdata->maxblocks) ||
1978 (cp->c_bsdflags & (UF_NODUMP | UF_COMPRESSED)) ||
1979 (cp->c_atime < hfsmp->hfc_timebase)) {
1980 return (0);
1981 }
1982
1983 temperature = ffp->ff_bytesread / ffp->ff_size;
1984 if (temperature < hotdata->threshold) {
1985 return (0);
1986 }
1987 }
1988
1989 /*
1990 * If there is room or this file is hotter than
1991 * the coldest one then add it to the list.
1992 *
1993 */
1994 if ((hotdata->activefiles < hfsmp->hfc_maxfiles) ||
1995 (hotdata->coldest == NULL) ||
1996 (temperature >= hotdata->coldest->temperature)) {
1997 ++hotdata->refcount;
1998 entry = hf_getnewentry(hotdata);
1999 entry->temperature = temperature;
2000 entry->fileid = cp->c_fileid;
2001 //
2002 // if ffp->ff_blocks is zero, it might be compressed so make sure we record
2003 // that there's at least one block.
2004 //
2005 entry->blocks = ffp->ff_blocks ? ffp->ff_blocks : 1;
2006 if (hf_insert(hotdata, entry) == EEXIST) {
2007 // entry is already present, don't need to add it again
2008 entry->right = hotdata->freelist;
2009 hotdata->freelist = entry;
2010 }
2011 --hotdata->refcount;
2012 }
2013
2014 return (0);
2015 }
2016
2017 /*
2018 * Remove a hot file from the recording list.
2019 *
2020 * This can happen when a hot file becomes
2021 * an active vnode (active hot files are
2022 * not kept in the recording list until the
2023 * end of the recording period).
2024 *
2025 * Note: the cnode is locked on entry.
2026 */
2027 int
2028 hfs_removehotfile(struct vnode *vp)
2029 {
2030 hotfile_data_t *hotdata;
2031 hfsmount_t *hfsmp;
2032 cnode_t *cp;
2033 filefork_t *ffp;
2034 u_int32_t temperature;
2035
2036 hfsmp = VTOHFS(vp);
2037 if (hfsmp->hfc_stage != HFC_RECORDING)
2038 return (0);
2039
2040 if ((!vnode_isreg(vp)) || vnode_issystem(vp)) {
2041 return (0);
2042 }
2043
2044 ffp = VTOF(vp);
2045 cp = VTOC(vp);
2046
2047 if ((ffp->ff_bytesread == 0) || (ffp->ff_blocks == 0) ||
2048 (ffp->ff_size == 0) || (cp->c_atime < hfsmp->hfc_timebase)) {
2049 return (0);
2050 }
2051
2052 lck_mtx_lock(&hfsmp->hfc_mutex);
2053 if (hfsmp->hfc_stage != HFC_RECORDING)
2054 goto out;
2055 if ((hotdata = (hotfile_data_t *)hfsmp->hfc_recdata) == NULL)
2056 goto out;
2057
2058 temperature = ffp->ff_bytesread / ffp->ff_size;
2059 if (temperature < hotdata->threshold)
2060 goto out;
2061
2062 if (hotdata->coldest && (temperature >= hotdata->coldest->temperature)) {
2063 ++hotdata->refcount;
2064 hf_delete(hotdata, VTOC(vp)->c_fileid, temperature);
2065 --hotdata->refcount;
2066 }
2067 out:
2068 lck_mtx_unlock(&hfsmp->hfc_mutex);
2069 return (0);
2070 }
2071
2072 int
2073 hfs_hotfile_deleted(__unused struct vnode *vp)
2074 {
2075 #if 1
2076 return 0;
2077 #else
2078 //
2079 // XXXdbg - this code, while it would work, would introduce a huge inefficiency
2080 // to deleting files as the way it's written would require us to open
2081 // the hotfile btree on every open, delete two records in it and then
2082 // close the hotfile btree (which involves more writes).
2083 //
2084 // We actually can be lazy about deleting hotfile records for files
2085 // that get deleted. When it's time to evict things, if we encounter
2086 // a record that references a dead file (i.e. a fileid which no
2087 // longer exists), the eviction code will remove the records. Likewise
2088 // the code that scans the HotFile B-Tree at boot time to re-pin files
2089 // will remove dead records.
2090 //
2091
2092 hotfile_data_t *hotdata;
2093 hfsmount_t *hfsmp;
2094 cnode_t *cp;
2095 filefork_t *filefork;
2096 u_int32_t temperature;
2097 BTreeIterator * iterator = NULL;
2098 FSBufferDescriptor record;
2099 HotFileKey *key;
2100 u_int32_t data;
2101 int error=0;
2102
2103 cp = VTOC(vp);
2104 if (cp == NULL || !(cp->c_attr.ca_recflags & kHFSFastDevPinnedMask)) {
2105 return 0;
2106 }
2107
2108 hfsmp = VTOHFS(vp);
2109 if (!(hfsmp->hfs_flags & HFS_CS_HOTFILE_PIN)) {
2110 return 0;
2111 }
2112
2113 if (hfc_btree_open(hfsmp, &hfsmp->hfc_filevp) != 0 || hfsmp->hfc_filevp == NULL) {
2114 // either there is no hotfile info or it's damaged
2115 return EINVAL;
2116 }
2117
2118 filefork = VTOF(hfsmp->hfc_filevp);
2119 if (filefork == NULL) {
2120 return 0;
2121 }
2122
2123 MALLOC(iterator, BTreeIterator *, sizeof(*iterator), M_TEMP, M_WAITOK);
2124 if (iterator == NULL) {
2125 return ENOMEM;
2126 }
2127 bzero(iterator, sizeof(*iterator));
2128 key = (HotFileKey*) &iterator->key;
2129
2130 record.bufferAddress = &data;
2131 record.itemSize = sizeof(u_int32_t);
2132 record.itemCount = 1;
2133
2134 key->keyLength = HFC_KEYLENGTH;
2135 key->temperature = HFC_LOOKUPTAG;
2136 key->fileID = cp->c_fileid;
2137 key->forkType = 0;
2138
2139 lck_mtx_lock(&hfsmp->hfc_mutex);
2140 (void) BTInvalidateHint(iterator);
2141 if (BTSearchRecord(filefork, iterator, &record, NULL, iterator) == 0) {
2142 temperature = key->temperature;
2143 hfc_btree_delete_record(hfsmp, iterator, key);
2144 } else {
2145 //printf("hfs: hotfile_deleted: did not find fileid %d\n", cp->c_fileid);
2146 error = ENOENT;
2147 }
2148
2149 if ((hotdata = (hotfile_data_t *)hfsmp->hfc_recdata) != NULL) {
2150 // just in case, also make sure it's removed from the in-memory list as well
2151 ++hotdata->refcount;
2152 hf_delete(hotdata, cp->c_fileid, cp->c_fileid);
2153 --hotdata->refcount;
2154 }
2155
2156 lck_mtx_unlock(&hfsmp->hfc_mutex);
2157 FREE(iterator, M_TEMP);
2158
2159 hfc_btree_close(hfsmp, hfsmp->hfc_filevp);
2160
2161 return error;
2162 #endif
2163 }
2164
2165 int
2166 hfs_hotfile_adjust_blocks(struct vnode *vp, int64_t num_blocks)
2167 {
2168 hfsmount_t *hfsmp;
2169
2170 if (vp == NULL) {
2171 return 0;
2172 }
2173
2174 hfsmp = VTOHFS(vp);
2175
2176 if (!(hfsmp->hfs_flags & HFS_CS_HOTFILE_PIN) || num_blocks == 0 || vp == NULL) {
2177 return 0;
2178 }
2179
2180 //
2181 // if file is not HotFileCached or it has the CanNotHotFile cache
2182 // bit set then there is nothing to do
2183 //
2184 if (!(VTOC(vp)->c_attr.ca_recflags & kHFSFastDevPinnedMask) || (VTOC(vp)->c_attr.ca_recflags & kHFSDoNotFastDevPinMask)) {
2185 // it's not a hot file or can't be one so don't bother tracking
2186 return 0;
2187 }
2188
2189 OSAddAtomic(num_blocks, &hfsmp->hfs_hotfile_blk_adjust);
2190
2191 return (0);
2192 }
2193
2194 //
2195 // Assumes hfsmp->hfc_mutex is LOCKED
2196 //
2197 static int
2198 hfs_hotfile_cur_freeblks(hfsmount_t *hfsmp)
2199 {
2200 if (hfsmp->hfc_stage < HFC_IDLE) {
2201 return 0;
2202 }
2203
2204 int cur_blk_adjust = hfsmp->hfs_hotfile_blk_adjust; // snap a copy of this value
2205
2206 if (cur_blk_adjust) {
2207 OSAddAtomic(-cur_blk_adjust, &hfsmp->hfs_hotfile_blk_adjust);
2208 hfsmp->hfs_hotfile_freeblks += cur_blk_adjust;
2209 }
2210
2211 return hfsmp->hfs_hotfile_freeblks;
2212 }
2213
2214
2215 /*
2216 *========================================================================
2217 * HOT FILE MAINTENANCE ROUTINES
2218 *========================================================================
2219 */
2220
2221 static int
2222 hotfiles_collect_callback(struct vnode *vp, __unused void *cargs)
2223 {
2224 if ((vnode_isreg(vp)) && !vnode_issystem(vp))
2225 (void) hfs_addhotfile_internal(vp);
2226
2227 return (VNODE_RETURNED);
2228 }
2229
2230 /*
2231 * Add all active hot files to the recording list.
2232 */
2233 static int
2234 hotfiles_collect(struct hfsmount *hfsmp)
2235 {
2236 struct mount *mp = HFSTOVFS(hfsmp);
2237
2238 if (vfs_busy(mp, LK_NOWAIT))
2239 return (0);
2240
2241 /*
2242 * hotfiles_collect_callback will be called for each vnode
2243 * hung off of this mount point
2244 * the vnode will be
2245 * properly referenced and unreferenced around the callback
2246 */
2247 vnode_iterate(mp, 0, hotfiles_collect_callback, (void *)NULL);
2248
2249 vfs_unbusy(mp);
2250
2251 return (0);
2252 }
2253
2254
2255 /*
2256 * Update the data of a btree record
2257 * This is called from within BTUpdateRecord.
2258 */
2259 static int
2260 update_callback(const HotFileKey *key, u_int32_t *data, u_int32_t *state)
2261 {
2262 if (key->temperature == HFC_LOOKUPTAG)
2263 *data = *state;
2264 return (0);
2265 }
2266
2267 /*
2268 * Identify files already in hot area.
2269 */
2270 static int
2271 hotfiles_refine(struct hfsmount *hfsmp)
2272 {
2273 BTreeIterator * iterator = NULL;
2274 struct mount *mp;
2275 filefork_t * filefork;
2276 hotfilelist_t *listp;
2277 FSBufferDescriptor record;
2278 HotFileKey * key;
2279 u_int32_t data;
2280 int i;
2281 int error = 0;
2282
2283 if ((listp = (hotfilelist_t *)hfsmp->hfc_recdata) == NULL)
2284 return (0);
2285
2286 if (hfsmp->hfs_flags & HFS_CS_HOTFILE_PIN) {
2287 // on ssd's we don't refine the temperature since the
2288 // replacement algorithm is simply random
2289 return 0;
2290 }
2291
2292 mp = HFSTOVFS(hfsmp);
2293
2294 MALLOC(iterator, BTreeIterator *, sizeof(*iterator), M_TEMP, M_WAITOK);
2295 if (iterator == NULL) {
2296 error = ENOMEM;
2297 goto out;
2298 }
2299 bzero(iterator, sizeof(*iterator));
2300 key = (HotFileKey*) &iterator->key;
2301
2302 record.bufferAddress = &data;
2303 record.itemSize = sizeof(u_int32_t);
2304 record.itemCount = 1;
2305
2306 if (hfs_start_transaction(hfsmp) != 0) {
2307 error = EINVAL;
2308 goto out;
2309 }
2310 if (hfs_lock(VTOC(hfsmp->hfc_filevp), HFS_EXCLUSIVE_LOCK, HFS_LOCK_DEFAULT) != 0) {
2311 error = EPERM;
2312 goto out1;
2313 }
2314 filefork = VTOF(hfsmp->hfc_filevp);
2315
2316 for (i = 0; i < listp->hfl_count; ++i) {
2317 /*
2318 * Check if entry (thread) is already in hot area.
2319 */
2320 key->keyLength = HFC_KEYLENGTH;
2321 key->temperature = HFC_LOOKUPTAG;
2322 key->fileID = listp->hfl_hotfile[i].hf_fileid;
2323 key->forkType = 0;
2324 (void) BTInvalidateHint(iterator);
2325 if (BTSearchRecord(filefork, iterator, &record, NULL, iterator) != 0) {
2326 continue; /* not in hot area, so skip */
2327 }
2328
2329 /*
2330 * Update thread entry with latest temperature.
2331 */
2332 error = BTUpdateRecord(filefork, iterator,
2333 (IterateCallBackProcPtr)update_callback,
2334 &listp->hfl_hotfile[i].hf_temperature);
2335 if (error) {
2336 printf("hfs: hotfiles_refine: BTUpdateRecord failed %d (file %d)\n", error, key->fileID);
2337 error = MacToVFSError(error);
2338 // break;
2339 }
2340 /*
2341 * Re-key entry with latest temperature.
2342 */
2343 key->keyLength = HFC_KEYLENGTH;
2344 key->temperature = data;
2345 key->fileID = listp->hfl_hotfile[i].hf_fileid;
2346 key->forkType = 0;
2347 /* Pick up record data. */
2348 (void) BTInvalidateHint(iterator);
2349 (void) BTSearchRecord(filefork, iterator, &record, NULL, iterator);
2350 error = BTDeleteRecord(filefork, iterator);
2351 if (error) {
2352 printf("hfs: hotfiles_refine: BTDeleteRecord failed %d (file %d)\n", error, key->fileID);
2353 error = MacToVFSError(error);
2354 break;
2355 }
2356 key->keyLength = HFC_KEYLENGTH;
2357 key->temperature = listp->hfl_hotfile[i].hf_temperature;
2358 key->fileID = listp->hfl_hotfile[i].hf_fileid;
2359 key->forkType = 0;
2360 error = BTInsertRecord(filefork, iterator, &record, record.itemSize);
2361 if (error) {
2362 printf("hfs: hotfiles_refine: BTInsertRecord failed %d (file %d)\n", error, key->fileID);
2363 error = MacToVFSError(error);
2364 break;
2365 }
2366 /*
2367 * Invalidate this entry in the list.
2368 */
2369 listp->hfl_hotfile[i].hf_temperature = 0;
2370 listp->hfl_totalblocks -= listp->hfl_hotfile[i].hf_blocks;
2371
2372 } /* end for */
2373
2374 (void) BTFlushPath(filefork);
2375 hfs_unlock(VTOC(hfsmp->hfc_filevp));
2376
2377 out1:
2378 hfs_end_transaction(hfsmp);
2379 out:
2380 if (iterator)
2381 FREE(iterator, M_TEMP);
2382 return (error);
2383 }
2384
2385 /*
2386 * Move new hot files into hot area.
2387 *
2388 * Requires that the hfc_mutex be held.
2389 */
2390 static int
2391 hotfiles_adopt(struct hfsmount *hfsmp, vfs_context_t ctx)
2392 {
2393 BTreeIterator * iterator = NULL;
2394 struct vnode *vp;
2395 filefork_t * filefork;
2396 hotfilelist_t *listp;
2397 FSBufferDescriptor record;
2398 HotFileKey * key;
2399 u_int32_t data;
2400 enum hfc_stage stage;
2401 int fileblocks;
2402 int blksmoved;
2403 int i;
2404 int last;
2405 int error = 0;
2406 int startedtrans = 0;
2407 //
2408 // all files in a given adoption phase have a temperature
2409 // that starts at a random value and then increases linearly.
2410 // the idea is that during eviction, files that were adopted
2411 // together will be evicted together
2412 //
2413 long starting_temp = random() % HF_TEMP_RANGE;
2414 long temp_adjust = 0;
2415
2416 if ((listp = (hotfilelist_t *)hfsmp->hfc_recdata) == NULL)
2417 return (0);
2418
2419 if (hfsmp->hfc_stage != HFC_ADOPTION) {
2420 return (EBUSY);
2421 }
2422 if (hfs_lock(VTOC(hfsmp->hfc_filevp), HFS_EXCLUSIVE_LOCK, HFS_LOCK_DEFAULT) != 0) {
2423 return (EPERM);
2424 }
2425
2426 MALLOC(iterator, BTreeIterator *, sizeof(*iterator), M_TEMP, M_WAITOK);
2427 if (iterator == NULL) {
2428 hfs_unlock(VTOC(hfsmp->hfc_filevp));
2429 return (ENOMEM);
2430 }
2431
2432 #if HFC_VERBOSE
2433 printf("hfs:%s: hotfiles_adopt: (hfl_next: %d, hotfile start/end block: %d - %d; max/free: %d/%d; maxfiles: %d)\n",
2434 hfsmp->vcbVN,
2435 listp->hfl_next,
2436 hfsmp->hfs_hotfile_start, hfsmp->hfs_hotfile_end,
2437 hfsmp->hfs_hotfile_maxblks, hfsmp->hfs_hotfile_freeblks, hfsmp->hfc_maxfiles);
2438 #endif
2439
2440 stage = hfsmp->hfc_stage;
2441 hfsmp->hfc_stage = HFC_BUSY;
2442
2443 blksmoved = 0;
2444 last = listp->hfl_next + HFC_FILESPERSYNC;
2445 if (last > listp->hfl_count)
2446 last = listp->hfl_count;
2447
2448 bzero(iterator, sizeof(*iterator));
2449 key = (HotFileKey*) &iterator->key;
2450 key->keyLength = HFC_KEYLENGTH;
2451
2452 record.bufferAddress = &data;
2453 record.itemSize = sizeof(u_int32_t);
2454 record.itemCount = 1;
2455
2456 filefork = VTOF(hfsmp->hfc_filevp);
2457
2458 for (i = listp->hfl_next; (i < last) && (blksmoved < HFC_BLKSPERSYNC); ++i) {
2459 /*
2460 * Skip entries that aren't going to work.
2461 */
2462 if (listp->hfl_hotfile[i].hf_temperature == 0) {
2463 //printf("hfs: zero temp on file-id %d\n", listp->hfl_hotfile[i].hf_fileid);
2464 listp->hfl_next++;
2465 continue;
2466 }
2467 if (listp->hfl_hotfile[i].hf_fileid == VTOC(hfsmp->hfc_filevp)->c_fileid) {
2468 //printf("hfs: cannot adopt the hotfile b-tree itself! (file-id %d)\n", listp->hfl_hotfile[i].hf_fileid);
2469 listp->hfl_next++;
2470 continue;
2471 }
2472 if (listp->hfl_hotfile[i].hf_fileid < kHFSFirstUserCatalogNodeID) {
2473 //printf("hfs: cannot adopt system files (file-id %d)\n", listp->hfl_hotfile[i].hf_fileid);
2474 listp->hfl_next++;
2475 continue;
2476 }
2477
2478 /*
2479 * Acquire a vnode for this file.
2480 */
2481 error = hfs_vget(hfsmp, listp->hfl_hotfile[i].hf_fileid, &vp, 0, 0);
2482 if (error) {
2483 //printf("failed to get fileid %d (err %d)\n", listp->hfl_hotfile[i].hf_fileid, error);
2484 if (error == ENOENT) {
2485 error = 0;
2486 listp->hfl_next++;
2487 continue; /* stale entry, go to next */
2488 }
2489 break;
2490 }
2491
2492 //printf("hfs: examining hotfile entry w/fileid %d, temp %d, blocks %d (HotFileCached: %s)\n",
2493 // listp->hfl_hotfile[i].hf_fileid, listp->hfl_hotfile[i].hf_temperature,
2494 // listp->hfl_hotfile[i].hf_blocks,
2495 // (VTOC(vp)->c_attr.ca_recflags & kHFSFastDevPinnedMask) ? "YES" : "NO");
2496
2497 if (!vnode_isreg(vp)) {
2498 /* Symlinks are ineligible for adoption into the hotfile zone. */
2499 //printf("hfs: hotfiles_adopt: huh, not a file %d (%d)\n", listp->hfl_hotfile[i].hf_fileid, VTOC(vp)->c_cnid);
2500 hfs_unlock(VTOC(vp));
2501 vnode_put(vp);
2502 listp->hfl_hotfile[i].hf_temperature = 0;
2503 listp->hfl_next++;
2504 continue; /* stale entry, go to next */
2505 }
2506 if ( (VTOC(vp)->c_flag & (C_DELETED | C_NOEXISTS))
2507 || (!(hfsmp->hfs_flags & HFS_CS_HOTFILE_PIN) && hotextents(hfsmp, &VTOF(vp)->ff_extents[0]))
2508 || (VTOC(vp)->c_attr.ca_recflags & (kHFSFastDevPinnedMask|kHFSDoNotFastDevPinMask))) {
2509 hfs_unlock(VTOC(vp));
2510 vnode_put(vp);
2511 listp->hfl_hotfile[i].hf_temperature = 0;
2512 listp->hfl_next++;
2513 listp->hfl_totalblocks -= listp->hfl_hotfile[i].hf_blocks;
2514 continue; /* stale entry, go to next */
2515 }
2516
2517 fileblocks = VTOF(vp)->ff_blocks;
2518
2519 //
2520 // for CF, if the file is empty (and not compressed) or it is too large,
2521 // do not try to pin it. (note: if fileblocks == 0 but the file is marked
2522 // as compressed, we may still be able to cache it).
2523 //
2524 if ((hfsmp->hfs_flags & HFS_CS_HOTFILE_PIN) &&
2525 ((fileblocks == 0 && !(VTOC(vp)->c_bsdflags & UF_COMPRESSED)) ||
2526 (unsigned int)fileblocks > (HFC_MAXIMUM_FILESIZE / (uint64_t)HFSTOVCB(hfsmp)->blockSize))) {
2527 // don't try to cache something too large or that's zero-bytes
2528
2529 vnode_clearfastdevicecandidate(vp); // turn off the fast-dev-candidate flag so we don't keep trying to cache it.
2530
2531 hfs_unlock(VTOC(vp));
2532 vnode_put(vp);
2533 listp->hfl_hotfile[i].hf_temperature = 0;
2534 listp->hfl_next++;
2535 listp->hfl_totalblocks -= listp->hfl_hotfile[i].hf_blocks;
2536 continue; /* entry is too big, just carry on with the next guy */
2537 }
2538
2539 //
2540 // If a file is not an autocandidate (i.e. it's a user-tagged file desirous of
2541 // being hotfile cached) but it is already bigger than 4 megs, don't bother
2542 // hotfile caching it. Note that if a user tagged file starts small, gets
2543 // adopted and then grows over time we will allow it to grow bigger than 4 megs
2544 // which is intentional for things like the Mail or Photos database files which
2545 // grow slowly over time and benefit from being on the FastDevice.
2546 //
2547 if ((hfsmp->hfs_flags & HFS_CS_HOTFILE_PIN) &&
2548 !(VTOC(vp)->c_attr.ca_recflags & kHFSAutoCandidateMask) &&
2549 (VTOC(vp)->c_attr.ca_recflags & kHFSFastDevCandidateMask) &&
2550 (unsigned int)fileblocks > ((4*1024*1024) / (uint64_t)HFSTOVCB(hfsmp)->blockSize)) {
2551
2552 vnode_clearfastdevicecandidate(vp); // turn off the fast-dev-candidate flag so we don't keep trying to cache it.
2553
2554 hfs_unlock(VTOC(vp));
2555 vnode_put(vp);
2556 listp->hfl_hotfile[i].hf_temperature = 0;
2557 listp->hfl_next++;
2558 listp->hfl_totalblocks -= listp->hfl_hotfile[i].hf_blocks;
2559 continue; /* entry is too big, just carry on with the next guy */
2560 }
2561
2562 if (fileblocks > hfs_hotfile_cur_freeblks(hfsmp)) {
2563 //
2564 // No room for this file. Although eviction should have made space
2565 // it's best that we check here as well since writes to existing
2566 // hotfiles may have eaten up space since we performed eviction
2567 //
2568 hfs_unlock(VTOC(vp));
2569 vnode_put(vp);
2570 listp->hfl_next++;
2571 listp->hfl_totalblocks -= fileblocks;
2572 continue; /* entry too big, go to next */
2573 }
2574
2575 if ((blksmoved > 0) &&
2576 (blksmoved + fileblocks) > HFC_BLKSPERSYNC) {
2577 //
2578 // we've done enough work, let's be nice to the system and
2579 // stop until the next iteration
2580 //
2581 hfs_unlock(VTOC(vp));
2582 vnode_put(vp);
2583 break; /* adopt this entry the next time around */
2584 }
2585 if (VTOC(vp)->c_desc.cd_nameptr)
2586 data = *(const u_int32_t *)(VTOC(vp)->c_desc.cd_nameptr);
2587 else
2588 data = 0x3f3f3f3f;
2589
2590
2591 if (hfsmp->hfs_flags & HFS_CS_HOTFILE_PIN) {
2592 //
2593 // For CF we pin the blocks belonging to the file
2594 // to the "fast" (aka ssd) media
2595 //
2596 uint32_t pinned_blocks;
2597
2598 if (vnode_isautocandidate(vp)) {
2599 VTOC(vp)->c_attr.ca_recflags |= kHFSAutoCandidateMask;
2600 }
2601 if (VTOC(vp)->c_attr.ca_recflags & kHFSAutoCandidateMask) {
2602 //
2603 // this moves auto-cached files to the higher tier
2604 // of "temperatures" which means they are less likely
2605 // to get evicted (user selected hotfiles will get
2606 // evicted first in the theory that they change more
2607 // frequently compared to system files)
2608 //
2609 temp_adjust = MAX_NORMAL_TEMP;
2610 } else {
2611 temp_adjust = 0;
2612 }
2613
2614 hfs_unlock(VTOC(vp)); // don't need an exclusive lock for this
2615 hfs_lock(VTOC(vp), HFS_SHARED_LOCK, HFS_LOCK_ALLOW_NOEXISTS);
2616
2617 error = hfs_pin_vnode(hfsmp, vp, HFS_PIN_IT, &pinned_blocks, ctx);
2618
2619 fileblocks = pinned_blocks;
2620
2621 // go back to an exclusive lock since we're going to modify the cnode again
2622 hfs_unlock(VTOC(vp));
2623 hfs_lock(VTOC(vp), HFS_EXCLUSIVE_LOCK, HFS_LOCK_ALLOW_NOEXISTS);
2624 } else {
2625 //
2626 // Old style hotfiles moves the data to the center (aka "hot")
2627 // region of the disk
2628 //
2629 error = hfs_relocate(vp, hfsmp->hfs_hotfile_start, kauth_cred_get(), current_proc());
2630 }
2631
2632 if (!error) {
2633 VTOC(vp)->c_attr.ca_recflags |= kHFSFastDevPinnedMask;
2634 VTOC(vp)->c_flag |= C_MODIFIED;
2635 } else if ((hfsmp->hfs_flags & HFS_CS_HOTFILE_PIN) && error == EALREADY) {
2636 //
2637 // If hfs_pin_vnode() returned EALREADY then this file is not
2638 // ever able to be hotfile cached the normal way. This can
2639 // happen with compressed files which have their data stored
2640 // in an extended attribute. We flag them so that we won't
2641 // bother to try and hotfile cache them again the next time
2642 // they're read.
2643 //
2644 VTOC(vp)->c_attr.ca_recflags |= kHFSDoNotFastDevPinMask;
2645 VTOC(vp)->c_flag |= C_MODIFIED;
2646 }
2647
2648 hfs_unlock(VTOC(vp));
2649 vnode_put(vp);
2650 if (error) {
2651 #if HFC_VERBOSE
2652 if (error != EALREADY) {
2653 printf("hfs: hotfiles_adopt: could not relocate file %d (err %d)\n", listp->hfl_hotfile[i].hf_fileid, error);
2654 }
2655 #endif
2656
2657 if (last < listp->hfl_count) {
2658 last++;
2659 }
2660 /* Move on to next item. */
2661 listp->hfl_next++;
2662 continue;
2663 }
2664 /* Keep hot file free space current. */
2665 hfsmp->hfs_hotfile_freeblks -= fileblocks;
2666 listp->hfl_totalblocks -= fileblocks;
2667
2668 /* Insert hot file entry */
2669 key->keyLength = HFC_KEYLENGTH;
2670
2671 if (hfsmp->hfs_flags & HFS_CS_HOTFILE_PIN) {
2672 //
2673 // The "temperature" for a CF hotfile is simply a random
2674 // number that we sequentially increment for each file in
2675 // the set of files we're currently adopting. This has the
2676 // nice property that all of the files we pin to the ssd
2677 // in the current phase will sort together in the hotfile
2678 // btree. When eviction time comes we will evict them
2679 // together as well. This gives the eviction phase temporal
2680 // locality - things written together get evicted together
2681 // which is what ssd's like.
2682 //
2683 listp->hfl_hotfile[i].hf_temperature = (uint32_t)temp_adjust + starting_temp++;
2684 }
2685
2686 key->temperature = listp->hfl_hotfile[i].hf_temperature;
2687 key->fileID = listp->hfl_hotfile[i].hf_fileid;
2688 key->forkType = 0;
2689
2690 /* Start a new transaction before calling BTree code. */
2691 if (hfs_start_transaction(hfsmp) != 0) {
2692 error = EINVAL;
2693 break;
2694 }
2695 startedtrans = 1;
2696
2697 error = BTInsertRecord(filefork, iterator, &record, record.itemSize);
2698 if (error) {
2699 int orig_error = error;
2700 error = MacToVFSError(error);
2701 printf("hfs: hotfiles_adopt:1: BTInsertRecord failed %d/%d (fileid %d)\n", error, orig_error, key->fileID);
2702 stage = HFC_IDLE;
2703 break;
2704 }
2705
2706 /* Insert thread record */
2707 key->keyLength = HFC_KEYLENGTH;
2708 key->temperature = HFC_LOOKUPTAG;
2709 key->fileID = listp->hfl_hotfile[i].hf_fileid;
2710 key->forkType = 0;
2711 data = listp->hfl_hotfile[i].hf_temperature;
2712 error = BTInsertRecord(filefork, iterator, &record, record.itemSize);
2713 if (error) {
2714 int orig_error = error;
2715 error = MacToVFSError(error);
2716 printf("hfs: hotfiles_adopt:2: BTInsertRecord failed %d/%d (fileid %d)\n", error, orig_error, key->fileID);
2717 stage = HFC_IDLE;
2718 break;
2719 } else {
2720 (void) BTFlushPath(filefork);
2721 blksmoved += fileblocks;
2722 }
2723
2724 listp->hfl_next++;
2725 if (listp->hfl_next >= listp->hfl_count) {
2726 break;
2727 }
2728
2729 /* Transaction complete. */
2730 if (startedtrans) {
2731 hfs_end_transaction(hfsmp);
2732 startedtrans = 0;
2733 }
2734
2735 if (hfs_hotfile_cur_freeblks(hfsmp) <= 0) {
2736 #if HFC_VERBOSE
2737 printf("hfs: hotfiles_adopt: free space exhausted (%d)\n", hfsmp->hfs_hotfile_freeblks);
2738 #endif
2739 break;
2740 }
2741 } /* end for */
2742
2743 #if HFC_VERBOSE
2744 printf("hfs: hotfiles_adopt: [%d] adopted %d blocks (%d files left)\n", listp->hfl_next, blksmoved, listp->hfl_count - i);
2745 #endif
2746 if (!startedtrans) {
2747 // start a txn so we'll save the btree summary info
2748 if (hfs_start_transaction(hfsmp) == 0) {
2749 startedtrans = 1;
2750 }
2751 }
2752
2753 /* Finish any outstanding transactions. */
2754 if (startedtrans) {
2755 save_btree_user_info(hfsmp);
2756
2757 (void) BTFlushPath(filefork);
2758 hfs_end_transaction(hfsmp);
2759 startedtrans = 0;
2760 }
2761 hfs_unlock(VTOC(hfsmp->hfc_filevp));
2762
2763 if ((listp->hfl_next >= listp->hfl_count) || (hfsmp->hfs_hotfile_freeblks <= 0)) {
2764 #if HFC_VERBOSE
2765 printf("hfs: hotfiles_adopt: all done relocating %d files\n", listp->hfl_count);
2766 printf("hfs: hotfiles_adopt: %d blocks free in hot file band\n", hfsmp->hfs_hotfile_freeblks);
2767 #endif
2768 stage = HFC_IDLE;
2769 }
2770 FREE(iterator, M_TEMP);
2771
2772 if (stage != HFC_ADOPTION && hfsmp->hfc_filevp) {
2773 (void) hfc_btree_close(hfsmp, hfsmp->hfc_filevp);
2774 hfsmp->hfc_filevp = NULL;
2775 }
2776 hfsmp->hfc_stage = stage;
2777 wakeup((caddr_t)&hfsmp->hfc_stage);
2778 return (error);
2779 }
2780
2781 /*
2782 * Reclaim space by evicting the coldest files.
2783 *
2784 * Requires that the hfc_mutex be held.
2785 */
2786 static int
2787 hotfiles_evict(struct hfsmount *hfsmp, vfs_context_t ctx)
2788 {
2789 BTreeIterator * iterator = NULL;
2790 struct vnode *vp;
2791 HotFileKey * key;
2792 filefork_t * filefork;
2793 hotfilelist_t *listp;
2794 enum hfc_stage stage;
2795 u_int32_t savedtemp;
2796 int blksmoved;
2797 int filesmoved;
2798 int fileblocks;
2799 int error = 0;
2800 int startedtrans = 0;
2801 int bt_op;
2802
2803 if (hfsmp->hfc_stage != HFC_EVICTION) {
2804 return (EBUSY);
2805 }
2806
2807 if ((listp = (hotfilelist_t *)hfsmp->hfc_recdata) == NULL)
2808 return (0);
2809
2810 if (hfs_lock(VTOC(hfsmp->hfc_filevp), HFS_EXCLUSIVE_LOCK, HFS_LOCK_DEFAULT) != 0) {
2811 return (EPERM);
2812 }
2813
2814 #if HFC_VERBOSE
2815 printf("hfs:%s: hotfiles_evict (hotfile start/end block: %d - %d; max/free: %d/%d; maxfiles: %d)\n",
2816 hfsmp->vcbVN,
2817 hfsmp->hfs_hotfile_start, hfsmp->hfs_hotfile_end,
2818 hfsmp->hfs_hotfile_maxblks, hfsmp->hfs_hotfile_freeblks, hfsmp->hfc_maxfiles);
2819 #endif
2820
2821 MALLOC(iterator, BTreeIterator *, sizeof(*iterator), M_TEMP, M_WAITOK);
2822 if (iterator == NULL) {
2823 hfs_unlock(VTOC(hfsmp->hfc_filevp));
2824 return (ENOMEM);
2825 }
2826
2827 stage = hfsmp->hfc_stage;
2828 hfsmp->hfc_stage = HFC_BUSY;
2829
2830 filesmoved = blksmoved = 0;
2831 bt_op = kBTreeFirstRecord;
2832
2833 bzero(iterator, sizeof(*iterator));
2834 key = (HotFileKey*) &iterator->key;
2835
2836 filefork = VTOF(hfsmp->hfc_filevp);
2837
2838 #if HFC_VERBOSE
2839 printf("hfs: hotfiles_evict: reclaim blks %d\n", listp->hfl_reclaimblks);
2840 #endif
2841
2842 while (listp->hfl_reclaimblks > 0 &&
2843 blksmoved < HFC_BLKSPERSYNC &&
2844 filesmoved < HFC_FILESPERSYNC) {
2845
2846 /*
2847 * Obtain the first record (ie the coldest one).
2848 */
2849 if (BTIterateRecord(filefork, bt_op, iterator, NULL, NULL) != 0) {
2850 #if HFC_VERBOSE
2851 printf("hfs: hotfiles_evict: no more records\n");
2852 #endif
2853 error = 0;
2854 stage = HFC_ADOPTION;
2855 break;
2856 }
2857 if (key->keyLength != HFC_KEYLENGTH) {
2858 printf("hfs: hotfiles_evict: invalid key length %d\n", key->keyLength);
2859 error = EFTYPE;
2860 break;
2861 }
2862 if (key->temperature == HFC_LOOKUPTAG) {
2863 #if HFC_VERBOSE
2864 printf("hfs: hotfiles_evict: ran into thread records\n");
2865 #endif
2866 error = 0;
2867 stage = HFC_ADOPTION;
2868 break;
2869 }
2870
2871 // Jump straight to delete for some files...
2872 if (key->fileID == VTOC(hfsmp->hfc_filevp)->c_fileid
2873 || key->fileID == hfsmp->hfs_jnlfileid
2874 || key->fileID == hfsmp->hfs_jnlinfoblkid
2875 || key->fileID < kHFSFirstUserCatalogNodeID) {
2876 goto delete;
2877 }
2878
2879 /*
2880 * Aquire the vnode for this file.
2881 */
2882 error = hfs_vget(hfsmp, key->fileID, &vp, 0, 0);
2883 if (error) {
2884 if (error == ENOENT) {
2885 goto delete; /* stale entry, go to next */
2886 } else {
2887 printf("hfs: hotfiles_evict: err %d getting file %d\n",
2888 error, key->fileID);
2889 }
2890 break;
2891 }
2892
2893 /*
2894 * Symlinks that may have been inserted into the hotfile zone during a previous OS are now stuck
2895 * here. We do not want to move them.
2896 */
2897 if (!vnode_isreg(vp)) {
2898 //printf("hfs: hotfiles_evict: huh, not a file %d\n", key->fileID);
2899 hfs_unlock(VTOC(vp));
2900 vnode_put(vp);
2901 goto delete; /* invalid entry, go to next */
2902 }
2903
2904 fileblocks = VTOF(vp)->ff_blocks;
2905 if ((blksmoved > 0) &&
2906 (blksmoved + fileblocks) > HFC_BLKSPERSYNC) {
2907 hfs_unlock(VTOC(vp));
2908 vnode_put(vp);
2909 break;
2910 }
2911 /*
2912 * Make sure file is in the hot area.
2913 */
2914 if (!hotextents(hfsmp, &VTOF(vp)->ff_extents[0]) && !(VTOC(vp)->c_attr.ca_recflags & kHFSFastDevPinnedMask)) {
2915 #if HFC_VERBOSE
2916 printf("hfs: hotfiles_evict: file %d isn't hot!\n", key->fileID);
2917 #endif
2918 hfs_unlock(VTOC(vp));
2919 vnode_put(vp);
2920 goto delete; /* stale entry, go to next */
2921 }
2922
2923 /*
2924 * Relocate file out of hot area. On cooperative fusion (CF) that just
2925 * means un-pinning the data from the ssd. For traditional hotfiles that means moving
2926 * the file data out of the hot region of the disk.
2927 */
2928 if (hfsmp->hfs_flags & HFS_CS_HOTFILE_PIN) {
2929 uint32_t pinned_blocks;
2930
2931 hfs_unlock(VTOC(vp)); // don't need an exclusive lock for this
2932 hfs_lock(VTOC(vp), HFS_SHARED_LOCK, HFS_LOCK_ALLOW_NOEXISTS);
2933
2934 error = hfs_pin_vnode(hfsmp, vp, HFS_UNPIN_IT, &pinned_blocks, ctx);
2935 fileblocks = pinned_blocks;
2936
2937 if (!error) {
2938 // go back to an exclusive lock since we're going to modify the cnode again
2939 hfs_unlock(VTOC(vp));
2940 hfs_lock(VTOC(vp), HFS_EXCLUSIVE_LOCK, HFS_LOCK_ALLOW_NOEXISTS);
2941 }
2942 } else {
2943 error = hfs_relocate(vp, HFSTOVCB(hfsmp)->nextAllocation, vfs_context_ucred(ctx), vfs_context_proc(ctx));
2944 }
2945 if (error) {
2946 #if HFC_VERBOSE
2947 printf("hfs: hotfiles_evict: err %d relocating file %d\n", error, key->fileID);
2948 #endif
2949 hfs_unlock(VTOC(vp));
2950 vnode_put(vp);
2951 bt_op = kBTreeNextRecord;
2952 goto next; /* go to next */
2953 } else {
2954 VTOC(vp)->c_attr.ca_recflags &= ~kHFSFastDevPinnedMask;
2955 VTOC(vp)->c_flag |= C_MODIFIED;
2956 }
2957
2958 //
2959 // We do not believe that this call to hfs_fsync() is
2960 // necessary and it causes a journal transaction
2961 // deadlock so we are removing it.
2962 //
2963 // (void) hfs_fsync(vp, MNT_WAIT, 0, p);
2964
2965 hfs_unlock(VTOC(vp));
2966 vnode_put(vp);
2967
2968 hfsmp->hfs_hotfile_freeblks += fileblocks;
2969 listp->hfl_reclaimblks -= fileblocks;
2970 if (listp->hfl_reclaimblks < 0)
2971 listp->hfl_reclaimblks = 0;
2972 blksmoved += fileblocks;
2973 filesmoved++;
2974 delete:
2975 /* Start a new transaction before calling BTree code. */
2976 if (hfs_start_transaction(hfsmp) != 0) {
2977 error = EINVAL;
2978 break;
2979 }
2980 startedtrans = 1;
2981
2982 error = BTDeleteRecord(filefork, iterator);
2983 if (error) {
2984 error = MacToVFSError(error);
2985 break;
2986 }
2987 savedtemp = key->temperature;
2988 key->temperature = HFC_LOOKUPTAG;
2989 error = BTDeleteRecord(filefork, iterator);
2990 if (error) {
2991 error = MacToVFSError(error);
2992 break;
2993 }
2994 key->temperature = savedtemp;
2995 next:
2996 (void) BTFlushPath(filefork);
2997
2998 /* Transaction complete. */
2999 if (startedtrans) {
3000 hfs_end_transaction(hfsmp);
3001 startedtrans = 0;
3002 }
3003
3004 } /* end while */
3005
3006 #if HFC_VERBOSE
3007 printf("hfs: hotfiles_evict: moved %d files (%d blks, %d to go)\n", filesmoved, blksmoved, listp->hfl_reclaimblks);
3008 #endif
3009 /* Finish any outstanding transactions. */
3010 if (startedtrans) {
3011 save_btree_user_info(hfsmp);
3012
3013 (void) BTFlushPath(filefork);
3014 hfs_end_transaction(hfsmp);
3015 startedtrans = 0;
3016 }
3017 hfs_unlock(VTOC(hfsmp->hfc_filevp));
3018
3019 /*
3020 * Move to next stage when finished.
3021 */
3022 if (listp->hfl_reclaimblks <= 0) {
3023 stage = HFC_ADOPTION;
3024 #if HFC_VERBOSE
3025 printf("hfs: hotfiles_evict: %d blocks free in hot file band\n", hfsmp->hfs_hotfile_freeblks);
3026 #endif
3027 }
3028 FREE(iterator, M_TEMP);
3029 hfsmp->hfc_stage = stage;
3030 wakeup((caddr_t)&hfsmp->hfc_stage);
3031 return (error);
3032 }
3033
3034 /*
3035 * Age the existing records in the hot files b-tree.
3036 */
3037 static int
3038 hotfiles_age(struct hfsmount *hfsmp)
3039 {
3040 BTreeInfoRec btinfo;
3041 BTreeIterator * iterator = NULL;
3042 BTreeIterator * prev_iterator;
3043 FSBufferDescriptor record;
3044 FSBufferDescriptor prev_record;
3045 HotFileKey * key;
3046 HotFileKey * prev_key;
3047 filefork_t * filefork;
3048 u_int32_t data;
3049 u_int32_t prev_data;
3050 u_int32_t newtemp;
3051 int error;
3052 int i;
3053 int numrecs;
3054 int aged = 0;
3055 u_int16_t reclen;
3056
3057
3058 if (hfsmp->hfs_flags & HFS_CS_HOTFILE_PIN) {
3059 //
3060 // hotfiles don't age on CF
3061 //
3062 return 0;
3063 }
3064
3065 MALLOC(iterator, BTreeIterator *, 2 * sizeof(*iterator), M_TEMP, M_WAITOK);
3066 if (iterator == NULL) {
3067 error = ENOMEM;
3068 goto out2;
3069 }
3070 bzero(iterator, 2 * sizeof(*iterator));
3071 key = (HotFileKey*) &iterator->key;
3072
3073 prev_iterator = &iterator[1];
3074 prev_key = (HotFileKey*) &prev_iterator->key;
3075
3076 record.bufferAddress = &data;
3077 record.itemSize = sizeof(data);
3078 record.itemCount = 1;
3079 prev_record.bufferAddress = &prev_data;
3080 prev_record.itemSize = sizeof(prev_data);
3081 prev_record.itemCount = 1;
3082
3083 /*
3084 * Capture b-tree changes inside a transaction
3085 */
3086 if (hfs_start_transaction(hfsmp) != 0) {
3087 error = EINVAL;
3088 goto out2;
3089 }
3090 if (hfs_lock(VTOC(hfsmp->hfc_filevp), HFS_EXCLUSIVE_LOCK, HFS_LOCK_DEFAULT) != 0) {
3091 error = EPERM;
3092 goto out1;
3093 }
3094 filefork = VTOF(hfsmp->hfc_filevp);
3095
3096 error = BTGetInformation(filefork, 0, &btinfo);
3097 if (error) {
3098 error = MacToVFSError(error);
3099 goto out;
3100 }
3101 if (btinfo.numRecords < 2) {
3102 error = 0;
3103 goto out;
3104 }
3105
3106 /* Only want 1st half of leaf records */
3107 numrecs = (btinfo.numRecords /= 2) - 1;
3108
3109 error = BTIterateRecord(filefork, kBTreeFirstRecord, iterator, &record, &reclen);
3110 if (error) {
3111 printf("hfs_agehotfiles: BTIterateRecord: %d\n", error);
3112 error = MacToVFSError(error);
3113 goto out;
3114 }
3115 bcopy(iterator, prev_iterator, sizeof(BTreeIterator));
3116 prev_data = data;
3117
3118 for (i = 0; i < numrecs; ++i) {
3119 error = BTIterateRecord(filefork, kBTreeNextRecord, iterator, &record, &reclen);
3120 if (error == 0) {
3121 if (key->temperature < prev_key->temperature) {
3122 printf("hfs_agehotfiles: out of order keys!\n");
3123 error = EFTYPE;
3124 break;
3125 }
3126 if (reclen != sizeof(data)) {
3127 printf("hfs_agehotfiles: invalid record length %d\n", reclen);
3128 error = EFTYPE;
3129 break;
3130 }
3131 if (key->keyLength != HFC_KEYLENGTH) {
3132 printf("hfs_agehotfiles: invalid key length %d\n", key->keyLength);
3133 error = EFTYPE;
3134 break;
3135 }
3136 } else if ((error == fsBTEndOfIterationErr || error == fsBTRecordNotFoundErr) &&
3137 (i == (numrecs - 1))) {
3138 error = 0;
3139 } else if (error) {
3140 printf("hfs_agehotfiles: %d of %d BTIterateRecord: %d\n", i, numrecs, error);
3141 error = MacToVFSError(error);
3142 break;
3143 }
3144 if (prev_key->temperature == HFC_LOOKUPTAG) {
3145 #if HFC_VERBOSE
3146 printf("hfs_agehotfiles: ran into thread record\n");
3147 #endif
3148 error = 0;
3149 break;
3150 }
3151 error = BTDeleteRecord(filefork, prev_iterator);
3152 if (error) {
3153 printf("hfs_agehotfiles: BTDeleteRecord failed %d (file %d)\n", error, prev_key->fileID);
3154 error = MacToVFSError(error);
3155 break;
3156 }
3157
3158 /* Age by halving the temperature (floor = 4) */
3159 newtemp = MAX(prev_key->temperature >> 1, 4);
3160 prev_key->temperature = newtemp;
3161
3162 error = BTInsertRecord(filefork, prev_iterator, &prev_record, prev_record.itemSize);
3163 if (error) {
3164 printf("hfs_agehotfiles: BTInsertRecord failed %d (file %d)\n", error, prev_key->fileID);
3165 error = MacToVFSError(error);
3166 break;
3167 }
3168 ++aged;
3169 /*
3170 * Update thread entry with latest temperature.
3171 */
3172 prev_key->temperature = HFC_LOOKUPTAG;
3173 error = BTUpdateRecord(filefork, prev_iterator,
3174 (IterateCallBackProcPtr)update_callback,
3175 &newtemp);
3176 if (error) {
3177 printf("hfs_agehotfiles: %d of %d BTUpdateRecord failed %d (file %d, %d)\n",
3178 i, numrecs, error, prev_key->fileID, newtemp);
3179 error = MacToVFSError(error);
3180 // break;
3181 }
3182
3183 bcopy(iterator, prev_iterator, sizeof(BTreeIterator));
3184 prev_data = data;
3185
3186 } /* end for */
3187
3188 #if HFC_VERBOSE
3189 if (error == 0)
3190 printf("hfs_agehotfiles: aged %d records out of %d\n", aged, btinfo.numRecords);
3191 #endif
3192 (void) BTFlushPath(filefork);
3193 out:
3194 hfs_unlock(VTOC(hfsmp->hfc_filevp));
3195 out1:
3196 hfs_end_transaction(hfsmp);
3197 out2:
3198 if (iterator)
3199 FREE(iterator, M_TEMP);
3200 return (error);
3201 }
3202
3203 /*
3204 * Return true if any blocks (or all blocks if all is true)
3205 * are contained in the hot file region.
3206 */
3207 static int
3208 hotextents(struct hfsmount *hfsmp, HFSPlusExtentDescriptor * extents)
3209 {
3210 u_int32_t b1, b2;
3211 int i;
3212 int inside = 0;
3213
3214 for (i = 0; i < kHFSPlusExtentDensity; ++i) {
3215 b1 = extents[i].startBlock;
3216 if (b1 == 0)
3217 break;
3218 b2 = b1 + extents[i].blockCount - 1;
3219 if ((b1 >= hfsmp->hfs_hotfile_start &&
3220 b2 <= hfsmp->hfs_hotfile_end) ||
3221 (b1 < hfsmp->hfs_hotfile_end &&
3222 b2 > hfsmp->hfs_hotfile_end)) {
3223 inside = 1;
3224 break;
3225 }
3226 }
3227 return (inside);
3228 }
3229
3230
3231 /*
3232 *========================================================================
3233 * HOT FILE B-TREE ROUTINES
3234 *========================================================================
3235 */
3236
3237 /*
3238 * Open the hot files b-tree for writing.
3239 *
3240 * On successful exit the vnode has a reference but not an iocount.
3241 */
3242 static int
3243 hfc_btree_open(struct hfsmount *hfsmp, struct vnode **vpp)
3244 {
3245 return hfc_btree_open_ext(hfsmp, vpp, 0);
3246 }
3247
3248 static int
3249 hfc_btree_open_ext(struct hfsmount *hfsmp, struct vnode **vpp, int ignore_btree_errs)
3250 {
3251 proc_t p;
3252 struct vnode *vp;
3253 struct cat_desc cdesc;
3254 struct cat_attr cattr;
3255 struct cat_fork cfork;
3256 static char filename[] = HFC_FILENAME;
3257 int error;
3258 int retry = 0;
3259 int lockflags;
3260 int newvnode_flags = 0;
3261
3262 *vpp = NULL;
3263 p = current_proc();
3264
3265 bzero(&cdesc, sizeof(cdesc));
3266 cdesc.cd_parentcnid = kRootDirID;
3267 cdesc.cd_nameptr = (const u_int8_t *)filename;
3268 cdesc.cd_namelen = strlen(filename);
3269
3270 lockflags = hfs_systemfile_lock(hfsmp, SFL_CATALOG, HFS_SHARED_LOCK);
3271
3272 error = cat_lookup(hfsmp, &cdesc, 0, 0, &cdesc, &cattr, &cfork, NULL);
3273
3274 hfs_systemfile_unlock(hfsmp, lockflags);
3275
3276 if (error) {
3277 printf("hfs: hfc_btree_open: cat_lookup error %d\n", error);
3278 return (error);
3279 }
3280 again:
3281 cdesc.cd_flags |= CD_ISMETA;
3282 error = hfs_getnewvnode(hfsmp, NULL, NULL, &cdesc, 0, &cattr,
3283 &cfork, &vp, &newvnode_flags);
3284 if (error) {
3285 printf("hfs: hfc_btree_open: hfs_getnewvnode error %d\n", error);
3286 cat_releasedesc(&cdesc);
3287 return (error);
3288 }
3289 if (!vnode_issystem(vp)) {
3290 #if HFC_VERBOSE
3291 printf("hfs: hfc_btree_open: file has UBC, try again\n");
3292 #endif
3293 hfs_unlock(VTOC(vp));
3294 vnode_recycle(vp);
3295 vnode_put(vp);
3296 if (retry++ == 0)
3297 goto again;
3298 else
3299 return (EBUSY);
3300 }
3301
3302 /* Open the B-tree file for writing... */
3303 error = BTOpenPath(VTOF(vp), (KeyCompareProcPtr) hfc_comparekeys);
3304 if (error) {
3305 if (!ignore_btree_errs) {
3306 printf("hfs: hfc_btree_open: BTOpenPath error %d; filesize %lld\n", error, VTOF(vp)->ff_size);
3307 error = MacToVFSError(error);
3308 } else {
3309 error = 0;
3310 }
3311 }
3312
3313 hfs_unlock(VTOC(vp));
3314 if (error == 0) {
3315 *vpp = vp;
3316 vnode_ref(vp); /* keep a reference while its open */
3317 }
3318 vnode_put(vp);
3319
3320 if (!vnode_issystem(vp))
3321 panic("hfs: hfc_btree_open: not a system file (vp = %p)", vp);
3322
3323 HotFilesInfo hotfileinfo;
3324
3325 if (error == 0 && (hfsmp->hfs_flags & HFS_CS_HOTFILE_PIN)) {
3326 if ((BTGetUserData(VTOF(vp), &hotfileinfo, sizeof(hotfileinfo)) == 0) && (SWAP_BE32 (hotfileinfo.magic) == HFC_MAGIC)) {
3327 if (hfsmp->hfs_hotfile_freeblks == 0) {
3328 hfsmp->hfs_hotfile_freeblks = hfsmp->hfs_hotfile_maxblks - SWAP_BE32 (hotfileinfo.usedblocks);
3329 }
3330
3331 hfs_hotfile_cur_freeblks(hfsmp); // factors in any adjustments that happened at run-time
3332 }
3333 }
3334
3335 return (error);
3336 }
3337
3338 /*
3339 * Close the hot files b-tree.
3340 *
3341 * On entry the vnode has a reference.
3342 */
3343 static int
3344 hfc_btree_close(struct hfsmount *hfsmp, struct vnode *vp)
3345 {
3346 proc_t p = current_proc();
3347 int error = 0;
3348
3349
3350 if (hfsmp->jnl) {
3351 hfs_flush(hfsmp, HFS_FLUSH_JOURNAL);
3352 }
3353
3354 if (vnode_get(vp) == 0) {
3355 error = hfs_lock(VTOC(vp), HFS_EXCLUSIVE_LOCK, HFS_LOCK_DEFAULT);
3356 if (error == 0) {
3357 (void) hfs_fsync(vp, MNT_WAIT, 0, p);
3358 error = BTClosePath(VTOF(vp));
3359 hfs_unlock(VTOC(vp));
3360 }
3361 vnode_rele(vp);
3362 vnode_recycle(vp);
3363 vnode_put(vp);
3364 }
3365
3366 return (error);
3367 }
3368
3369 //
3370 // Assumes that hfsmp->hfc_filevp points to the hotfile btree vnode
3371 // (i.e. you called hfc_btree_open() ahead of time)
3372 //
3373 static int
3374 hfc_btree_delete_record(struct hfsmount *hfsmp, BTreeIterator *iterator, HotFileKey *key)
3375 {
3376 int error;
3377 filefork_t *filefork=VTOF(hfsmp->hfc_filevp);
3378
3379 /* Start a new transaction before calling BTree code. */
3380 if (hfs_start_transaction(hfsmp) != 0) {
3381 return EINVAL;
3382 }
3383
3384 error = BTDeleteRecord(filefork, iterator);
3385 if (error) {
3386 error = MacToVFSError(error);
3387 printf("hfs: failed to delete record for file-id %d : err %d\n", key->fileID, error);
3388 goto out;
3389 }
3390
3391 int savedtemp;
3392 savedtemp = key->temperature;
3393 key->temperature = HFC_LOOKUPTAG;
3394 error = BTDeleteRecord(filefork, iterator);
3395 if (error) {
3396 error = MacToVFSError(error);
3397 printf("hfs:2: failed to delete record for file-id %d : err %d\n", key->fileID, error);
3398 }
3399 key->temperature = savedtemp;
3400
3401 (void) BTFlushPath(filefork);
3402
3403 out:
3404 /* Transaction complete. */
3405 hfs_end_transaction(hfsmp);
3406
3407 return error;
3408 }
3409
3410 //
3411 // You have to have already opened the hotfile btree so
3412 // that hfsmp->hfc_filevp is filled in.
3413 //
3414 static int
3415 hfc_btree_delete(struct hfsmount *hfsmp)
3416 {
3417 struct vnode *dvp = NULL;
3418 vfs_context_t ctx = vfs_context_current();
3419 struct vnode_attr va;
3420 struct componentname cname;
3421 static char filename[] = HFC_FILENAME;
3422 int error;
3423
3424 error = VFS_ROOT(HFSTOVFS(hfsmp), &dvp, ctx);
3425 if (error) {
3426 return (error);
3427 }
3428 cname.cn_nameiop = DELETE;
3429 cname.cn_flags = ISLASTCN;
3430 cname.cn_context = ctx;
3431 cname.cn_pnbuf = filename;
3432 cname.cn_pnlen = sizeof(filename);
3433 cname.cn_nameptr = filename;
3434 cname.cn_namelen = strlen(filename);
3435 cname.cn_hash = 0;
3436 cname.cn_consume = 0;
3437
3438 VATTR_INIT(&va);
3439 VATTR_SET(&va, va_type, VREG);
3440 VATTR_SET(&va, va_mode, S_IFREG | S_IRUSR | S_IWUSR);
3441 VATTR_SET(&va, va_uid, 0);
3442 VATTR_SET(&va, va_gid, 0);
3443
3444 if (hfs_start_transaction(hfsmp) != 0) {
3445 error = EINVAL;
3446 goto out;
3447 }
3448
3449 /* call ourselves directly, ignore the higher-level VFS file creation code */
3450 error = VNOP_REMOVE(dvp, hfsmp->hfc_filevp, &cname, 0, ctx);
3451 if (error) {
3452 printf("hfs: error %d removing HFBT on %s\n", error, HFSTOVCB(hfsmp)->vcbVN);
3453 }
3454
3455 hfs_end_transaction(hfsmp);
3456
3457 out:
3458 if (dvp) {
3459 vnode_put(dvp);
3460 dvp = NULL;
3461 }
3462
3463 return 0;
3464 }
3465
3466
3467
3468
3469 /*
3470 * Create a hot files btree file.
3471 *
3472 */
3473 static int
3474 hfc_btree_create(struct hfsmount *hfsmp, unsigned int nodesize, unsigned int entries)
3475 {
3476 struct vnode *dvp = NULL;
3477 struct vnode *vp = NULL;
3478 struct cnode *cp = NULL;
3479 vfs_context_t ctx = vfs_context_current();
3480 struct vnode_attr va;
3481 struct componentname cname;
3482 static char filename[] = HFC_FILENAME;
3483 int error;
3484
3485 if (hfsmp->hfc_filevp)
3486 panic("hfs: hfc_btree_create: hfc_filevp exists (vp = %p)", hfsmp->hfc_filevp);
3487
3488 error = VFS_ROOT(HFSTOVFS(hfsmp), &dvp, ctx);
3489 if (error) {
3490 return (error);
3491 }
3492 cname.cn_nameiop = CREATE;
3493 cname.cn_flags = ISLASTCN;
3494 cname.cn_context = ctx;
3495 cname.cn_pnbuf = filename;
3496 cname.cn_pnlen = sizeof(filename);
3497 cname.cn_nameptr = filename;
3498 cname.cn_namelen = strlen(filename);
3499 cname.cn_hash = 0;
3500 cname.cn_consume = 0;
3501
3502 VATTR_INIT(&va);
3503 VATTR_SET(&va, va_type, VREG);
3504 VATTR_SET(&va, va_mode, S_IFREG | S_IRUSR | S_IWUSR);
3505 VATTR_SET(&va, va_uid, 0);
3506 VATTR_SET(&va, va_gid, 0);
3507
3508 if (hfs_start_transaction(hfsmp) != 0) {
3509 error = EINVAL;
3510 goto out;
3511 }
3512
3513 /* call ourselves directly, ignore the higher-level VFS file creation code */
3514 error = VNOP_CREATE(dvp, &vp, &cname, &va, ctx);
3515 if (error) {
3516 printf("hfs: error %d creating HFBT on %s\n", error, HFSTOVCB(hfsmp)->vcbVN);
3517 goto out;
3518 }
3519 if (dvp) {
3520 vnode_put(dvp);
3521 dvp = NULL;
3522 }
3523 if ((error = hfs_lock(VTOC(vp), HFS_EXCLUSIVE_LOCK, HFS_LOCK_DEFAULT))) {
3524 goto out;
3525 }
3526 cp = VTOC(vp);
3527
3528 /* Don't use non-regular files or files with links. */
3529 if (!vnode_isreg(vp) || cp->c_linkcount != 1) {
3530 error = EFTYPE;
3531 goto out;
3532 }
3533
3534 printf("hfs: created HFBT on %s\n", HFSTOVCB(hfsmp)->vcbVN);
3535
3536 if (VTOF(vp)->ff_size < nodesize) {
3537 caddr_t buffer;
3538 u_int16_t *index;
3539 u_int16_t offset;
3540 BTNodeDescriptor *ndp;
3541 BTHeaderRec *bthp;
3542 HotFilesInfo *hotfileinfo;
3543 int nodecnt;
3544 int filesize;
3545 int entirespernode;
3546
3547 /*
3548 * Mark it invisible (truncate will pull these changes).
3549 */
3550 ((FndrFileInfo *)&cp->c_finderinfo[0])->fdFlags |=
3551 SWAP_BE16 (kIsInvisible + kNameLocked);
3552
3553 if (kmem_alloc(kernel_map, (vm_offset_t *)&buffer, nodesize, VM_KERN_MEMORY_FILE)) {
3554 error = ENOMEM;
3555 goto out;
3556 }
3557 bzero(buffer, nodesize);
3558 index = (u_int16_t *)buffer;
3559
3560 entirespernode = (nodesize - sizeof(BTNodeDescriptor) - 2) /
3561 (sizeof(HotFileKey) + 6);
3562 nodecnt = 2 + howmany(entries * 2, entirespernode);
3563 nodecnt = roundup(nodecnt, 8);
3564 filesize = nodecnt * nodesize;
3565
3566 /* FILL IN THE NODE DESCRIPTOR: */
3567 ndp = (BTNodeDescriptor *)buffer;
3568 ndp->kind = kBTHeaderNode;
3569 ndp->numRecords = SWAP_BE16 (3);
3570 offset = sizeof(BTNodeDescriptor);
3571 index[(nodesize / 2) - 1] = SWAP_BE16 (offset);
3572
3573 /* FILL IN THE HEADER RECORD: */
3574 bthp = (BTHeaderRec *)((u_int8_t *)buffer + offset);
3575 bthp->nodeSize = SWAP_BE16 (nodesize);
3576 bthp->totalNodes = SWAP_BE32 (filesize / nodesize);
3577 bthp->freeNodes = SWAP_BE32 (nodecnt - 1);
3578 bthp->clumpSize = SWAP_BE32 (filesize);
3579 bthp->btreeType = kUserBTreeType; /* non-metadata */
3580 bthp->attributes |= SWAP_BE32 (kBTBigKeysMask);
3581 bthp->maxKeyLength = SWAP_BE16 (HFC_KEYLENGTH);
3582 offset += sizeof(BTHeaderRec);
3583 index[(nodesize / 2) - 2] = SWAP_BE16 (offset);
3584
3585 /* FILL IN THE USER RECORD: */
3586 hotfileinfo = (HotFilesInfo *)((u_int8_t *)buffer + offset);
3587 hotfileinfo->magic = SWAP_BE32 (HFC_MAGIC);
3588 hotfileinfo->version = SWAP_BE32 (HFC_VERSION);
3589 hotfileinfo->duration = SWAP_BE32 (HFC_DEFAULT_DURATION);
3590 hotfileinfo->timebase = 0;
3591 hotfileinfo->timeleft = 0;
3592 hotfileinfo->threshold = SWAP_BE32 (HFC_MINIMUM_TEMPERATURE);
3593 hotfileinfo->maxfileblks = SWAP_BE32 (HFC_MAXIMUM_FILESIZE / HFSTOVCB(hfsmp)->blockSize);
3594 if (hfsmp->hfs_flags & HFS_CS_HOTFILE_PIN) {
3595 if (hfsmp->hfs_hotfile_freeblks == 0) {
3596 hfsmp->hfs_hotfile_freeblks = hfsmp->hfs_hotfile_maxblks;
3597 }
3598 hotfileinfo->usedblocks = SWAP_BE32 (hfsmp->hfs_hotfile_maxblks - hfsmp->hfs_hotfile_freeblks);
3599 } else {
3600 hotfileinfo->maxfilecnt = SWAP_BE32 (HFC_DEFAULT_FILE_COUNT);
3601 }
3602 strlcpy((char *)hotfileinfo->tag, hfc_tag,
3603 sizeof hotfileinfo->tag);
3604 offset += kBTreeHeaderUserBytes;
3605 index[(nodesize / 2) - 3] = SWAP_BE16 (offset);
3606
3607 /* FILL IN THE MAP RECORD (only one node in use). */
3608 *((u_int8_t *)buffer + offset) = 0x80;
3609 offset += nodesize - sizeof(BTNodeDescriptor) - sizeof(BTHeaderRec)
3610 - kBTreeHeaderUserBytes - (4 * sizeof(int16_t));
3611 index[(nodesize / 2) - 4] = SWAP_BE16 (offset);
3612
3613 vnode_setnoflush(vp);
3614 error = hfs_truncate(vp, (off_t)filesize, IO_NDELAY, 0, ctx);
3615 if (error) {
3616 printf("hfs: error %d growing HFBT on %s\n", error, HFSTOVCB(hfsmp)->vcbVN);
3617 goto out;
3618 }
3619 cp->c_flag |= C_ZFWANTSYNC;
3620 cp->c_zftimeout = 1;
3621
3622 if (error == 0) {
3623 struct vnop_write_args args;
3624 uio_t auio;
3625
3626 auio = uio_create(1, 0, UIO_SYSSPACE, UIO_WRITE);
3627 uio_addiov(auio, (uintptr_t)buffer, nodesize);
3628
3629 args.a_desc = &vnop_write_desc;
3630 args.a_vp = vp;
3631 args.a_uio = auio;
3632 args.a_ioflag = 0;
3633 args.a_context = ctx;
3634
3635 hfs_unlock(cp);
3636 cp = NULL;
3637
3638 error = hfs_vnop_write(&args);
3639 if (error)
3640 printf("hfs: error %d writing HFBT on %s\n", error, HFSTOVCB(hfsmp)->vcbVN);
3641
3642 uio_free(auio);
3643 }
3644 kmem_free(kernel_map, (vm_offset_t)buffer, nodesize);
3645 }
3646 out:
3647 hfs_end_transaction(hfsmp);
3648 if (dvp) {
3649 vnode_put(dvp);
3650 }
3651 if (vp) {
3652 if (cp)
3653 hfs_unlock(cp);
3654 vnode_recycle(vp);
3655 vnode_put(vp);
3656 }
3657 return (error);
3658 }
3659
3660 /*
3661 * Compare two hot file b-tree keys.
3662 *
3663 * Result: +n search key > trial key
3664 * 0 search key = trial key
3665 * -n search key < trial key
3666 */
3667 static int
3668 hfc_comparekeys(HotFileKey *searchKey, HotFileKey *trialKey)
3669 {
3670 /*
3671 * Compared temperatures first.
3672 */
3673 if (searchKey->temperature == trialKey->temperature) {
3674 /*
3675 * Temperatures are equal so compare file ids.
3676 */
3677 if (searchKey->fileID == trialKey->fileID) {
3678 /*
3679 * File ids are equal so compare fork types.
3680 */
3681 if (searchKey->forkType == trialKey->forkType) {
3682 return (0);
3683 } else if (searchKey->forkType > trialKey->forkType) {
3684 return (1);
3685 }
3686 } else if (searchKey->fileID > trialKey->fileID) {
3687 return (1);
3688 }
3689 } else if (searchKey->temperature > trialKey->temperature) {
3690 return (1);
3691 }
3692
3693 return (-1);
3694 }
3695
3696
3697 /*
3698 *========================================================================
3699 * HOT FILE DATA COLLECTING ROUTINES
3700 *========================================================================
3701 */
3702
3703 /*
3704 * Lookup a hot file entry in the tree.
3705 */
3706 #if HFC_DEBUG
3707 static hotfile_entry_t *
3708 hf_lookup(hotfile_data_t *hotdata, u_int32_t fileid, u_int32_t temperature)
3709 {
3710 hotfile_entry_t *entry = hotdata->rootentry;
3711
3712 while (entry &&
3713 entry->temperature != temperature &&
3714 entry->fileid != fileid) {
3715
3716 if (temperature > entry->temperature)
3717 entry = entry->right;
3718 else if (temperature < entry->temperature)
3719 entry = entry->left;
3720 else if (fileid > entry->fileid)
3721 entry = entry->right;
3722 else
3723 entry = entry->left;
3724 }
3725 return (entry);
3726 }
3727 #endif
3728
3729 /*
3730 * Insert a hot file entry into the tree.
3731 */
3732 static int
3733 hf_insert(hotfile_data_t *hotdata, hotfile_entry_t *newentry)
3734 {
3735 hotfile_entry_t *entry = hotdata->rootentry;
3736 u_int32_t fileid = newentry->fileid;
3737 u_int32_t temperature = newentry->temperature;
3738
3739 if (entry == NULL) {
3740 hotdata->rootentry = newentry;
3741 hotdata->coldest = newentry;
3742 hotdata->activefiles++;
3743 return 0;
3744 }
3745
3746 while (entry) {
3747 if (temperature > entry->temperature) {
3748 if (entry->right) {
3749 entry = entry->right;
3750 } else {
3751 entry->right = newentry;
3752 break;
3753 }
3754 } else if (temperature < entry->temperature) {
3755 if (entry->left) {
3756 entry = entry->left;
3757 } else {
3758 entry->left = newentry;
3759 break;
3760 }
3761 } else if (fileid > entry->fileid) {
3762 if (entry->right) {
3763 entry = entry->right;
3764 } else {
3765 if (entry->fileid != fileid)
3766 entry->right = newentry;
3767 break;
3768 }
3769 } else {
3770 if (entry->left) {
3771 entry = entry->left;
3772 } else {
3773 if (entry->fileid != fileid) {
3774 entry->left = newentry;
3775 } else {
3776 return EEXIST;
3777 }
3778 break;
3779 }
3780 }
3781 }
3782
3783 hotdata->activefiles++;
3784 return 0;
3785 }
3786
3787 /*
3788 * Find the coldest entry in the tree.
3789 */
3790 static hotfile_entry_t *
3791 hf_coldest(hotfile_data_t *hotdata)
3792 {
3793 hotfile_entry_t *entry = hotdata->rootentry;
3794
3795 if (entry) {
3796 while (entry->left)
3797 entry = entry->left;
3798 }
3799 return (entry);
3800 }
3801
3802 /*
3803 * Find the hottest entry in the tree.
3804 */
3805 static hotfile_entry_t *
3806 hf_hottest(hotfile_data_t *hotdata)
3807 {
3808 hotfile_entry_t *entry = hotdata->rootentry;
3809
3810 if (entry) {
3811 while (entry->right)
3812 entry = entry->right;
3813 }
3814 return (entry);
3815 }
3816
3817 /*
3818 * Delete a hot file entry from the tree.
3819 */
3820 static void
3821 hf_delete(hotfile_data_t *hotdata, u_int32_t fileid, u_int32_t temperature)
3822 {
3823 hotfile_entry_t *entry, *parent, *next;
3824
3825 parent = NULL;
3826 entry = hotdata->rootentry;
3827
3828 while (entry &&
3829 entry->temperature != temperature &&
3830 entry->fileid != fileid) {
3831
3832 parent = entry;
3833 if (temperature > entry->temperature)
3834 entry = entry->right;
3835 else if (temperature < entry->temperature)
3836 entry = entry->left;
3837 else if (fileid > entry->fileid)
3838 entry = entry->right;
3839 else
3840 entry = entry->left;
3841 }
3842
3843 if (entry) {
3844 /*
3845 * Reorganize the sub-trees spanning from our entry.
3846 */
3847 if ((next = entry->right)) {
3848 hotfile_entry_t *pnextl, *psub;
3849 /*
3850 * Tree pruning: take the left branch of the
3851 * current entry and place it at the lowest
3852 * left branch of the current right branch
3853 */
3854 psub = next;
3855
3856 /* Walk the Right/Left sub tree from current entry */
3857 while ((pnextl = psub->left))
3858 psub = pnextl;
3859
3860 /* Plug the old left tree to the new ->Right leftmost entry */
3861 psub->left = entry->left;
3862
3863 } else /* only left sub-tree, simple case */ {
3864 next = entry->left;
3865 }
3866 /*
3867 * Now, plug the current entry sub tree to
3868 * the good pointer of our parent entry.
3869 */
3870 if (parent == NULL)
3871 hotdata->rootentry = next;
3872 else if (parent->left == entry)
3873 parent->left = next;
3874 else
3875 parent->right = next;
3876
3877 /* Place entry back on the free-list */
3878 entry->left = 0;
3879 entry->fileid = 0;
3880 entry->temperature = 0;
3881
3882 entry->right = hotdata->freelist;
3883 hotdata->freelist = entry;
3884 hotdata->activefiles--;
3885
3886 if (hotdata->coldest == entry || hotdata->coldest == NULL) {
3887 hotdata->coldest = hf_coldest(hotdata);
3888 }
3889
3890 }
3891 }
3892
3893 /*
3894 * Get a free hot file entry.
3895 */
3896 static hotfile_entry_t *
3897 hf_getnewentry(hotfile_data_t *hotdata)
3898 {
3899 hotfile_entry_t * entry;
3900
3901 /*
3902 * When the free list is empty then steal the coldest one
3903 */
3904 if (hotdata->freelist == NULL) {
3905 entry = hf_coldest(hotdata);
3906 hf_delete(hotdata, entry->fileid, entry->temperature);
3907 }
3908 entry = hotdata->freelist;
3909 hotdata->freelist = entry->right;
3910 entry->right = 0;
3911
3912 return (entry);
3913 }
3914
3915
3916 /*
3917 * Generate a sorted list of hot files (hottest to coldest).
3918 *
3919 * As a side effect, every node in the hot file tree will be
3920 * deleted (moved to the free list).
3921 */
3922 static void
3923 hf_getsortedlist(hotfile_data_t * hotdata, hotfilelist_t *sortedlist)
3924 {
3925 int i = 0;
3926 hotfile_entry_t *entry;
3927
3928 while ((entry = hf_hottest(hotdata)) != NULL) {
3929 sortedlist->hfl_hotfile[i].hf_fileid = entry->fileid;
3930 sortedlist->hfl_hotfile[i].hf_temperature = entry->temperature;
3931 sortedlist->hfl_hotfile[i].hf_blocks = entry->blocks;
3932 sortedlist->hfl_totalblocks += entry->blocks;
3933 ++i;
3934
3935 hf_delete(hotdata, entry->fileid, entry->temperature);
3936 }
3937
3938 sortedlist->hfl_count = i;
3939
3940 #if HFC_VERBOSE
3941 printf("hfs: hf_getsortedlist returning %d entries w/%d total blocks\n", i, sortedlist->hfl_totalblocks);
3942 #endif
3943 }
3944
3945
3946 #if HFC_DEBUG
3947 static void
3948 hf_maxdepth(hotfile_entry_t * root, int depth, int *maxdepth)
3949 {
3950 if (root) {
3951 depth++;
3952 if (depth > *maxdepth)
3953 *maxdepth = depth;
3954 hf_maxdepth(root->left, depth, maxdepth);
3955 hf_maxdepth(root->right, depth, maxdepth);
3956 }
3957 }
3958
3959 static void
3960 hf_printtree(hotfile_entry_t * root)
3961 {
3962 if (root) {
3963 hf_printtree(root->left);
3964 printf("hfs: temperature: % 8d, fileid %d\n", root->temperature, root->fileid);
3965 hf_printtree(root->right);
3966 }
3967 }
3968 #endif