osfmk/kern/priority.c

   1 /*
   2  * Copyright (c) 2000-2010 Apple Inc. All rights reserved.
   3  *
   4  * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
   5  *
   6  * This file contains Original Code and/or Modifications of Original Code
   7  * as defined in and that are subject to the Apple Public Source License
   8  * Version 2.0 (the 'License'). You may not use this file except in
   9  * compliance with the License. The rights granted to you under the License
  10  * may not be used to create, or enable the creation or redistribution of,
  11  * unlawful or unlicensed copies of an Apple operating system, or to
  12  * circumvent, violate, or enable the circumvention or violation of, any
  13  * terms of an Apple operating system software license agreement.
  14  *
  15  * Please obtain a copy of the License at
  16  * http://www.opensource.apple.com/apsl/ and read it before using this file.
  17  *
  18  * The Original Code and all software distributed under the License are
  19  * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
  20  * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
  21  * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
  22  * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
  23  * Please see the License for the specific language governing rights and
  24  * limitations under the License.
  25  *
  26  * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
  27  */
  28 /*
  29  * @OSF_COPYRIGHT@
  30  */
  31 /*
  32  * Mach Operating System
  33  * Copyright (c) 1991,1990,1989,1988,1987 Carnegie Mellon University
  34  * All Rights Reserved.
  35  *
  36  * Permission to use, copy, modify and distribute this software and its
  37  * documentation is hereby granted, provided that both the copyright
  38  * notice and this permission notice appear in all copies of the
  39  * software, derivative works or modified versions, and any portions
  40  * thereof, and that both notices appear in supporting documentation.
  41  *
  42  * CARNEGIE MELLON ALLOWS FREE USE OF THIS SOFTWARE IN ITS "AS IS"
  43  * CONDITION.  CARNEGIE MELLON DISCLAIMS ANY LIABILITY OF ANY KIND FOR
  44  * ANY DAMAGES WHATSOEVER RESULTING FROM THE USE OF THIS SOFTWARE.
  45  *
  46  * Carnegie Mellon requests users of this software to return to
  47  *
  48  *  Software Distribution Coordinator  or  Software.Distribution@CS.CMU.EDU
  49  *  School of Computer Science
  50  *  Carnegie Mellon University
  51  *  Pittsburgh PA 15213-3890
  52  *
  53  * any improvements or extensions that they make and grant Carnegie Mellon
  54  * the rights to redistribute these changes.
  55  */
  56 /*
  57  */
  58 /*
  59  *      File:   priority.c
  60  *      Author: Avadis Tevanian, Jr.
  61  *      Date:   1986
  62  *
  63  *      Priority related scheduler bits.
  64  */
  65
  66 #include <mach/boolean.h>
  67 #include <mach/kern_return.h>
  68 #include <mach/machine.h>
  69 #include <kern/host.h>
  70 #include <kern/mach_param.h>
  71 #include <kern/sched.h>
  72 #include <sys/kdebug.h>
  73 #include <kern/spl.h>
  74 #include <kern/thread.h>
  75 #include <kern/processor.h>
  76 #include <kern/ledger.h>
  77 #include <machine/machparam.h>
  78 #include <kern/machine.h>
  79
  80 #ifdef CONFIG_MACH_APPROXIMATE_TIME
  81 #include <machine/commpage.h>  /* for commpage_update_mach_approximate_time */
  82 #endif
  83
  84 /*
  85  *      thread_quantum_expire:
  86  *
  87  *      Recalculate the quantum and priority for a thread.
  88  *
  89  *      Called at splsched.
  90  */
  91
  92 void
  93 thread_quantum_expire(
  94         timer_call_param_t      p0,
  95         timer_call_param_t      p1)
  96 {
  97         processor_t                     processor = p0;
  98         thread_t                        thread = p1;
  99         ast_t                           preempt;
 100         uint64_t                        ctime;
 101         int                                     urgency;
 102         uint64_t                        ignore1, ignore2;
 103
 104         assert(processor == current_processor());
 105         assert(thread == current_thread());
 106
 107         SCHED_STATS_QUANTUM_TIMER_EXPIRATION(processor);
 108
 109         /*
 110          * We bill CPU time to both the individual thread and its task.
 111          *
 112          * Because this balance adjustment could potentially attempt to wake this very
 113          * thread, we must credit the ledger before taking the thread lock. The ledger
 114          * pointers are only manipulated by the thread itself at the ast boundary.
 115          */
 116         ledger_credit(thread->t_ledger, task_ledgers.cpu_time, thread->quantum_remaining);
 117         ledger_credit(thread->t_threadledger, thread_ledgers.cpu_time, thread->quantum_remaining);
 118 #ifdef CONFIG_BANK
 119         if (thread->t_bankledger) {
 120                 ledger_credit(thread->t_bankledger, bank_ledgers.cpu_time,
 121                                 (thread->quantum_remaining - thread->t_deduct_bank_ledger_time));
 122         }
 123         thread->t_deduct_bank_ledger_time = 0;
 124 #endif
 125
 126         ctime = mach_absolute_time();
 127
 128 #ifdef CONFIG_MACH_APPROXIMATE_TIME
 129         commpage_update_mach_approximate_time(ctime);
 130 #endif
 131
 132         thread_lock(thread);
 133
 134         /*
 135          * We've run up until our quantum expiration, and will (potentially)
 136          * continue without re-entering the scheduler, so update this now.
 137          */
 138         processor->last_dispatch = ctime;
 139         thread->last_run_time = ctime;
 140
 141         /*
 142          *      Check for fail-safe trip.
 143          */
 144         if ((thread->sched_mode == TH_MODE_REALTIME || thread->sched_mode == TH_MODE_FIXED) &&
 145             !(thread->sched_flags & TH_SFLAG_PROMOTED_MASK) &&
 146             !(thread->options & TH_OPT_SYSTEM_CRITICAL)) {
 147                 uint64_t new_computation;
 148
 149                 new_computation = ctime - thread->computation_epoch;
 150                 new_computation += thread->computation_metered;
 151                 if (new_computation > max_unsafe_computation) {
 152                         KERNEL_DEBUG_CONSTANT(MACHDBG_CODE(DBG_MACH_SCHED, MACH_FAILSAFE)|DBG_FUNC_NONE,
 153                                         (uintptr_t)thread->sched_pri, (uintptr_t)thread->sched_mode, 0, 0, 0);
 154
 155                         thread->safe_release = ctime + sched_safe_duration;
 156
 157                         sched_thread_mode_demote(thread, TH_SFLAG_FAILSAFE);
 158                 }
 159         }
 160
 161         /*
 162          *      Recompute scheduled priority if appropriate.
 163          */
 164         if (SCHED(can_update_priority)(thread))
 165                 SCHED(update_priority)(thread);
 166         else
 167                 SCHED(lightweight_update_priority)(thread);
 168
 169         if (thread->sched_mode != TH_MODE_REALTIME)
 170                 SCHED(quantum_expire)(thread);
 171
 172         processor->current_pri = thread->sched_pri;
 173         processor->current_thmode = thread->sched_mode;
 174
 175         /* Tell platform layer that we are still running this thread */
 176         urgency = thread_get_urgency(thread, &ignore1, &ignore2);
 177         machine_thread_going_on_core(thread, urgency, 0);
 178
 179         /*
 180          *      This quantum is up, give this thread another.
 181          */
 182         processor->first_timeslice = FALSE;
 183
 184         thread_quantum_init(thread);
 185
 186         /* Reload precise timing global policy to thread-local policy */
 187         thread->precise_user_kernel_time = use_precise_user_kernel_time(thread);
 188
 189         /*
 190          * Since non-precise user/kernel time doesn't update the state/thread timer
 191          * during privilege transitions, synthesize an event now.
 192          */
 193         if (!thread->precise_user_kernel_time) {
 194                 timer_switch(PROCESSOR_DATA(processor, current_state),
 195                                          ctime,
 196                                          PROCESSOR_DATA(processor, current_state));
 197                 timer_switch(PROCESSOR_DATA(processor, thread_timer),
 198                                          ctime,
 199                                          PROCESSOR_DATA(processor, thread_timer));
 200         }
 201
 202         processor->quantum_end = ctime + thread->quantum_remaining;
 203
 204         /*
 205          *      Context switch check.
 206          */
 207         if ((preempt = csw_check(processor, AST_QUANTUM)) != AST_NONE)
 208                 ast_on(preempt);
 209
 210         thread_unlock(thread);
 211
 212         timer_call_enter1(&processor->quantum_timer, thread,
 213             processor->quantum_end, TIMER_CALL_SYS_CRITICAL | TIMER_CALL_LOCAL);
 214
 215 #if defined(CONFIG_SCHED_TIMESHARE_CORE)
 216         sched_timeshare_consider_maintenance(ctime);
 217 #endif /* CONFIG_SCHED_TIMESHARE_CORE */
 218
 219 }
 220
 221 /*
 222  *      sched_set_thread_base_priority:
 223  *
 224  *      Set the base priority of the thread
 225  *      and reset its scheduled priority.
 226  *
 227  *      This is the only path to change base_pri.
 228  *
 229  *      Called with the thread locked.
 230  */
 231 void
 232 sched_set_thread_base_priority(thread_t thread, int priority)
 233 {
 234         thread->base_pri = priority;
 235
 236         thread_recompute_sched_pri(thread, FALSE);
 237 }
 238
 239 /*
 240  *      thread_recompute_sched_pri:
 241  *
 242  *      Reset the scheduled priority of the thread
 243  *      according to its base priority if the
 244  *      thread has not been promoted or depressed.
 245  *
 246  *      This is the standard way to push base_pri changes into sched_pri,
 247  *      or to recalculate the appropriate sched_pri after clearing
 248  *      a promotion or depression.
 249  *
 250  *      Called at splsched with the thread locked.
 251  */
 252 void
 253 thread_recompute_sched_pri(
 254                            thread_t thread,
 255                            boolean_t override_depress)
 256 {
 257         int priority;
 258
 259         if (thread->sched_mode == TH_MODE_TIMESHARE)
 260                 priority = SCHED(compute_timeshare_priority)(thread);
 261         else
 262                 priority = thread->base_pri;
 263
 264         if ((!(thread->sched_flags & TH_SFLAG_PROMOTED_MASK)  || (priority > thread->sched_pri)) &&
 265             (!(thread->sched_flags & TH_SFLAG_DEPRESSED_MASK) || override_depress)) {
 266                 set_sched_pri(thread, priority);
 267         }
 268 }
 269
 270 void
 271 sched_default_quantum_expire(thread_t thread __unused)
 272 {
 273       /*
 274        * No special behavior when a timeshare, fixed, or realtime thread
 275        * uses up its entire quantum
 276        */
 277 }
 278
 279 #if defined(CONFIG_SCHED_TIMESHARE_CORE)
 280
 281 /*
 282  *      lightweight_update_priority:
 283  *
 284  *      Update the scheduled priority for
 285  *      a timesharing thread.
 286  *
 287  *      Only for use on the current thread.
 288  *
 289  *      Called with the thread locked.
 290  */
 291 void
 292 lightweight_update_priority(thread_t thread)
 293 {
 294         assert(thread->runq == PROCESSOR_NULL);
 295         assert(thread == current_thread());
 296
 297         if (thread->sched_mode == TH_MODE_TIMESHARE) {
 298                 int priority;
 299                 uint32_t delta;
 300
 301                 thread_timer_delta(thread, delta);
 302
 303                 /*
 304                  *      Accumulate timesharing usage only
 305                  *      during contention for processor
 306                  *      resources.
 307                  */
 308                 if (thread->pri_shift < INT8_MAX)
 309                         thread->sched_usage += delta;
 310
 311                 thread->cpu_delta += delta;
 312
 313                 priority = sched_compute_timeshare_priority(thread);
 314
 315                 /*
 316                  * Adjust the scheduled priority like thread_recompute_sched_pri,
 317                  * except with the benefit of knowing the thread is on this core.
 318                  */
 319                 if ((!(thread->sched_flags & TH_SFLAG_PROMOTED_MASK)  || (priority > thread->sched_pri)) &&
 320                     (!(thread->sched_flags & TH_SFLAG_DEPRESSED_MASK)) &&
 321                     priority != thread->sched_pri) {
 322
 323                         thread->sched_pri = priority;
 324
 325                         KERNEL_DEBUG_CONSTANT(MACHDBG_CODE(DBG_MACH_SCHED, MACH_SCHED_CHANGE_PRIORITY),
 326                                               (uintptr_t)thread_tid(thread),
 327                                               thread->base_pri,
 328                                               thread->sched_pri,
 329                                               0, /* eventually, 'reason' */
 330                                               0);
 331                 }
 332         }
 333 }
 334
 335 /*
 336  *      Define shifts for simulating (5/8) ** n
 337  *
 338  *      Shift structures for holding update shifts.  Actual computation
 339  *      is  usage = (usage >> shift1) +/- (usage >> abs(shift2))  where the
 340  *      +/- is determined by the sign of shift 2.
 341  */
 342 struct shift_data {
 343         int     shift1;
 344         int     shift2;
 345 };
 346
 347 #define SCHED_DECAY_TICKS       32
 348 static struct shift_data        sched_decay_shifts[SCHED_DECAY_TICKS] = {
 349         {1,1},{1,3},{1,-3},{2,-7},{3,5},{3,-5},{4,-8},{5,7},
 350         {5,-7},{6,-10},{7,10},{7,-9},{8,-11},{9,12},{9,-11},{10,-13},
 351         {11,14},{11,-13},{12,-15},{13,17},{13,-15},{14,-17},{15,19},{16,18},
 352         {16,-19},{17,22},{18,20},{18,-20},{19,26},{20,22},{20,-22},{21,-27}
 353 };
 354
 355 /*
 356  *      sched_compute_timeshare_priority:
 357  *
 358  *      Calculate the timesharing priority based upon usage and load.
 359  */
 360 extern int sched_pri_decay_band_limit;
 361
 362
 363 int
 364 sched_compute_timeshare_priority(thread_t thread)
 365 {
 366         /* start with base priority */
 367         int priority = thread->base_pri - (thread->sched_usage >> thread->pri_shift);
 368
 369         if (priority < MINPRI_USER)
 370                 priority = MINPRI_USER;
 371         else if (priority > MAXPRI_KERNEL)
 372                 priority = MAXPRI_KERNEL;
 373
 374         return priority;
 375 }
 376
 377
 378 /*
 379  *      can_update_priority
 380  *
 381  *      Make sure we don't do re-dispatches more frequently than a scheduler tick.
 382  *
 383  *      Called with the thread locked.
 384  */
 385 boolean_t
 386 can_update_priority(
 387                                         thread_t        thread)
 388 {
 389         if (sched_tick == thread->sched_stamp)
 390                 return (FALSE);
 391         else
 392                 return (TRUE);
 393 }
 394
 395 /*
 396  *      update_priority
 397  *
 398  *      Perform housekeeping operations driven by scheduler tick.
 399  *
 400  *      Called with the thread locked.
 401  */
 402 void
 403 update_priority(
 404         register thread_t       thread)
 405 {
 406         register unsigned       ticks;
 407         register uint32_t       delta;
 408
 409         ticks = sched_tick - thread->sched_stamp;
 410         assert(ticks != 0);
 411         thread->sched_stamp += ticks;
 412         if (sched_use_combined_fgbg_decay)
 413                 thread->pri_shift = sched_combined_fgbg_pri_shift;
 414         else if (thread->sched_flags & TH_SFLAG_THROTTLED)
 415                 thread->pri_shift = sched_background_pri_shift;
 416         else
 417                 thread->pri_shift = sched_pri_shift;
 418
 419         /* If requested, accelerate aging of sched_usage */
 420         if (sched_decay_usage_age_factor > 1)
 421                 ticks *= sched_decay_usage_age_factor;
 422
 423         /*
 424          *      Gather cpu usage data.
 425          */
 426         thread_timer_delta(thread, delta);
 427         if (ticks < SCHED_DECAY_TICKS) {
 428                 register struct shift_data      *shiftp;
 429
 430                 /*
 431                  *      Accumulate timesharing usage only
 432                  *      during contention for processor
 433                  *      resources.
 434                  */
 435                 if (thread->pri_shift < INT8_MAX)
 436                         thread->sched_usage += delta;
 437
 438                 thread->cpu_usage += delta + thread->cpu_delta;
 439                 thread->cpu_delta = 0;
 440
 441                 shiftp = &sched_decay_shifts[ticks];
 442                 if (shiftp->shift2 > 0) {
 443                     thread->cpu_usage =
 444                                                 (thread->cpu_usage >> shiftp->shift1) +
 445                                                 (thread->cpu_usage >> shiftp->shift2);
 446                     thread->sched_usage =
 447                                                 (thread->sched_usage >> shiftp->shift1) +
 448                                                 (thread->sched_usage >> shiftp->shift2);
 449                 }
 450                 else {
 451                     thread->cpu_usage =
 452                                                 (thread->cpu_usage >> shiftp->shift1) -
 453                                                 (thread->cpu_usage >> -(shiftp->shift2));
 454                     thread->sched_usage =
 455                                                 (thread->sched_usage >> shiftp->shift1) -
 456                                                 (thread->sched_usage >> -(shiftp->shift2));
 457                 }
 458         }
 459         else {
 460                 thread->cpu_usage = thread->cpu_delta = 0;
 461                 thread->sched_usage = 0;
 462         }
 463
 464         /*
 465          *      Check for fail-safe release.
 466          */
 467         if ((thread->sched_flags & TH_SFLAG_FAILSAFE) &&
 468             mach_absolute_time() >= thread->safe_release) {
 469                 sched_thread_mode_undemote(thread, TH_SFLAG_FAILSAFE);
 470         }
 471
 472         /*
 473          *      Recompute scheduled priority if appropriate.
 474          */
 475         if (thread->sched_mode == TH_MODE_TIMESHARE) {
 476                 int priority = sched_compute_timeshare_priority(thread);
 477
 478                 /*
 479                  * Adjust the scheduled priority like thread_recompute_sched_pri,
 480                  * except without setting an AST.
 481                  */
 482                 if ((!(thread->sched_flags & TH_SFLAG_PROMOTED_MASK)  || (priority > thread->sched_pri)) &&
 483                     (!(thread->sched_flags & TH_SFLAG_DEPRESSED_MASK)) &&
 484                     priority != thread->sched_pri) {
 485
 486                         boolean_t removed = thread_run_queue_remove(thread);
 487
 488                         thread->sched_pri = priority;
 489
 490                         KERNEL_DEBUG_CONSTANT(MACHDBG_CODE(DBG_MACH_SCHED, MACH_SCHED_CHANGE_PRIORITY),
 491                                               (uintptr_t)thread_tid(thread),
 492                                               thread->base_pri,
 493                                               thread->sched_pri,
 494                                               0, /* eventually, 'reason' */
 495                                               0);
 496
 497                         if (removed)
 498                                 thread_run_queue_reinsert(thread, SCHED_TAILQ);
 499                 }
 500         }
 501
 502         return;
 503 }
 504
 505 #endif /* CONFIG_SCHED_TIMESHARE_CORE */
 506
 507 #if MACH_ASSERT
 508 /* sched_mode == TH_MODE_TIMESHARE controls whether a thread has a timeshare count when it has a run count */
 509
 510 void sched_share_incr(thread_t thread) {
 511         assert((thread->state & (TH_RUN|TH_IDLE)) == TH_RUN);
 512         assert(thread->sched_mode == TH_MODE_TIMESHARE);
 513         assert(thread->SHARE_COUNT == 0);
 514         thread->SHARE_COUNT++;
 515         (void)hw_atomic_add(&sched_share_count, 1);
 516 }
 517
 518 void sched_share_decr(thread_t thread) {
 519         assert((thread->state & (TH_RUN|TH_IDLE)) != TH_RUN || thread->sched_mode != TH_MODE_TIMESHARE);
 520         assert(thread->SHARE_COUNT == 1);
 521         (void)hw_atomic_sub(&sched_share_count, 1);
 522         thread->SHARE_COUNT--;
 523 }
 524
 525 /* TH_SFLAG_THROTTLED controls whether a thread has a background count when it has a run count and a share count */
 526
 527 void sched_background_incr(thread_t thread) {
 528         assert((thread->state & (TH_RUN|TH_IDLE)) == TH_RUN);
 529         assert(thread->sched_mode == TH_MODE_TIMESHARE);
 530         assert((thread->sched_flags & TH_SFLAG_THROTTLED) == TH_SFLAG_THROTTLED);
 531
 532         assert(thread->BG_COUNT == 0);
 533         thread->BG_COUNT++;
 534         int val = hw_atomic_add(&sched_background_count, 1);
 535         assert(val >= 0);
 536
 537         /* Always do the background change while holding a share count */
 538         assert(thread->SHARE_COUNT == 1);
 539 }
 540
 541 void sched_background_decr(thread_t thread) {
 542         if ((thread->state & (TH_RUN|TH_IDLE)) == TH_RUN && thread->sched_mode == TH_MODE_TIMESHARE)
 543                 assert((thread->sched_flags & TH_SFLAG_THROTTLED) != TH_SFLAG_THROTTLED);
 544         assert(thread->BG_COUNT == 1);
 545         int val = hw_atomic_sub(&sched_background_count, 1);
 546         thread->BG_COUNT--;
 547         assert(val >= 0);
 548         assert(thread->BG_COUNT == 0);
 549
 550         /* Always do the background change while holding a share count */
 551         assert(thread->SHARE_COUNT == 1);
 552 }
 553
 554
 555 void
 556 assert_thread_sched_count(thread_t thread) {
 557         /* Only 0 or 1 are acceptable values */
 558         assert(thread->BG_COUNT    == 0 || thread->BG_COUNT    == 1);
 559         assert(thread->SHARE_COUNT == 0 || thread->SHARE_COUNT == 1);
 560
 561         /* BG is only allowed when you already have a share count */
 562         if (thread->BG_COUNT == 1)
 563                 assert(thread->SHARE_COUNT == 1);
 564         if (thread->SHARE_COUNT == 0)
 565                 assert(thread->BG_COUNT == 0);
 566
 567         if ((thread->state & (TH_RUN|TH_IDLE)) != TH_RUN ||
 568             (thread->sched_mode != TH_MODE_TIMESHARE))
 569                 assert(thread->SHARE_COUNT == 0);
 570
 571         if ((thread->state & (TH_RUN|TH_IDLE)) == TH_RUN &&
 572             (thread->sched_mode == TH_MODE_TIMESHARE))
 573                 assert(thread->SHARE_COUNT == 1);
 574
 575         if ((thread->state & (TH_RUN|TH_IDLE)) != TH_RUN ||
 576             (thread->sched_mode != TH_MODE_TIMESHARE)    ||
 577             !(thread->sched_flags & TH_SFLAG_THROTTLED))
 578                 assert(thread->BG_COUNT == 0);
 579
 580         if ((thread->state & (TH_RUN|TH_IDLE)) == TH_RUN &&
 581             (thread->sched_mode == TH_MODE_TIMESHARE)    &&
 582             (thread->sched_flags & TH_SFLAG_THROTTLED))
 583                 assert(thread->BG_COUNT == 1);
 584 }
 585
 586 #endif /* MACH_ASSERT */
 587
 588 /*
 589  * Set the thread's true scheduling mode
 590  * Called with thread mutex and thread locked
 591  * The thread has already been removed from the runqueue.
 592  *
 593  * (saved_mode is handled before this point)
 594  */
 595 void
 596 sched_set_thread_mode(thread_t thread, sched_mode_t new_mode)
 597 {
 598         assert_thread_sched_count(thread);
 599         assert(thread->runq == PROCESSOR_NULL);
 600
 601         sched_mode_t old_mode = thread->sched_mode;
 602
 603         thread->sched_mode = new_mode;
 604
 605         switch (new_mode) {
 606                 case TH_MODE_FIXED:
 607                 case TH_MODE_REALTIME:
 608                         if (old_mode == TH_MODE_TIMESHARE) {
 609                                 if ((thread->state & (TH_RUN|TH_IDLE)) == TH_RUN) {
 610                                         if (thread->sched_flags & TH_SFLAG_THROTTLED)
 611                                                 sched_background_decr(thread);
 612
 613                                         sched_share_decr(thread);
 614                                 }
 615                         }
 616                         break;
 617
 618                 case TH_MODE_TIMESHARE:
 619                         if (old_mode != TH_MODE_TIMESHARE) {
 620                                 if ((thread->state & (TH_RUN|TH_IDLE)) == TH_RUN) {
 621                                         sched_share_incr(thread);
 622
 623                                         if (thread->sched_flags & TH_SFLAG_THROTTLED)
 624                                                 sched_background_incr(thread);
 625                                 }
 626                         }
 627                         break;
 628
 629                 default:
 630                         panic("unexpected mode: %d", new_mode);
 631                         break;
 632         }
 633
 634         assert_thread_sched_count(thread);
 635 }
 636
 637 /*
 638  * Demote the true scheduler mode to timeshare (called with the thread locked)
 639  */
 640 void
 641 sched_thread_mode_demote(thread_t thread, uint32_t reason)
 642 {
 643         assert(reason & TH_SFLAG_DEMOTED_MASK);
 644         assert((thread->sched_flags & reason) != reason);
 645         assert_thread_sched_count(thread);
 646
 647         if (thread->policy_reset)
 648                 return;
 649
 650         if (thread->sched_flags & TH_SFLAG_DEMOTED_MASK) {
 651                 /* Another demotion reason is already active */
 652                 thread->sched_flags |= reason;
 653                 return;
 654         }
 655
 656         assert(thread->saved_mode == TH_MODE_NONE);
 657
 658         boolean_t removed = thread_run_queue_remove(thread);
 659
 660         thread->sched_flags |= reason;
 661
 662         thread->saved_mode = thread->sched_mode;
 663
 664         sched_set_thread_mode(thread, TH_MODE_TIMESHARE);
 665
 666         thread_recompute_priority(thread);
 667
 668         if (removed)
 669                 thread_run_queue_reinsert(thread, SCHED_TAILQ);
 670
 671         assert_thread_sched_count(thread);
 672 }
 673
 674 /*
 675  * Un-demote the true scheduler mode back to the saved mode (called with the thread locked)
 676  */
 677 void
 678 sched_thread_mode_undemote(thread_t thread, uint32_t reason)
 679 {
 680         assert(reason & TH_SFLAG_DEMOTED_MASK);
 681         assert((thread->sched_flags & reason) == reason);
 682         assert(thread->saved_mode != TH_MODE_NONE);
 683         assert(thread->sched_mode == TH_MODE_TIMESHARE);
 684         assert(thread->policy_reset == 0);
 685
 686         assert_thread_sched_count(thread);
 687
 688         thread->sched_flags &= ~reason;
 689
 690         if (thread->sched_flags & TH_SFLAG_DEMOTED_MASK) {
 691                 /* Another demotion reason is still active */
 692                 return;
 693         }
 694
 695         boolean_t removed = thread_run_queue_remove(thread);
 696
 697         sched_set_thread_mode(thread, thread->saved_mode);
 698
 699         thread->saved_mode = TH_MODE_NONE;
 700
 701         thread_recompute_priority(thread);
 702
 703         if (removed)
 704                 thread_run_queue_reinsert(thread, SCHED_TAILQ);
 705 }
 706
 707 /*
 708  * Set the thread to be categorized as 'background'
 709  * Called with thread mutex and thread lock held
 710  *
 711  * TODO: Eventually, 'background' should be a true sched_mode.
 712  */
 713 void
 714 sched_set_thread_throttled(thread_t thread, boolean_t wants_throttle)
 715 {
 716         if (thread->policy_reset)
 717                 return;
 718
 719         assert(((thread->sched_flags & TH_SFLAG_THROTTLED) ? TRUE : FALSE) != wants_throttle);
 720
 721         assert_thread_sched_count(thread);
 722
 723         /*
 724          * When backgrounding a thread, iOS has the semantic that
 725          * realtime and fixed priority threads should be demoted
 726          * to timeshare background threads.
 727          *
 728          * On OSX, realtime and fixed priority threads don't lose their mode.
 729          */
 730
 731         if (wants_throttle) {
 732                 thread->sched_flags |= TH_SFLAG_THROTTLED;
 733                 if ((thread->state & (TH_RUN|TH_IDLE)) == TH_RUN && thread->sched_mode == TH_MODE_TIMESHARE) {
 734                         sched_background_incr(thread);
 735                 }
 736
 737                 assert_thread_sched_count(thread);
 738
 739         } else {
 740                 thread->sched_flags &= ~TH_SFLAG_THROTTLED;
 741                 if ((thread->state & (TH_RUN|TH_IDLE)) == TH_RUN && thread->sched_mode == TH_MODE_TIMESHARE) {
 742                         sched_background_decr(thread);
 743                 }
 744
 745                 assert_thread_sched_count(thread);
 746
 747         }
 748
 749         assert_thread_sched_count(thread);
 750 }
 751