X-Git-Url: https://git.saurik.com/apple/xnu.git/blobdiff_plain/cb3231590a3c94ab4375e2228bd5e86b0cf1ad7e..c3c9b80d004dbbfdf763edeb97968c6997e3b45b:/osfmk/kern/priority.c

diff --git a/osfmk/kern/priority.c b/osfmk/kern/priority.c
index 5ac1ce756..abdfa868e 100644
--- a/osfmk/kern/priority.c
+++ b/osfmk/kern/priority.c
@@ -110,7 +110,7 @@ thread_quantum_expire(
 	KERNEL_DEBUG_CONSTANT(MACHDBG_CODE(DBG_MACH_SCHED, MACH_SCHED_QUANTUM_EXPIRED) | DBG_FUNC_START,
 	    0, 0, 0, 0, 0);
 
-	SCHED_STATS_QUANTUM_TIMER_EXPIRATION(processor);
+	SCHED_STATS_INC(quantum_timer_expirations);
 
 	/*
 	 * We bill CPU time to both the individual thread and its task.
@@ -131,12 +131,12 @@ thread_quantum_expire(
 	    (thread->quantum_remaining - thread->t_deduct_bank_ledger_time));
 	}
 	thread->t_deduct_bank_ledger_time = 0;
-
 	ctime = mach_absolute_time();
 
 #ifdef CONFIG_MACH_APPROXIMATE_TIME
 	commpage_update_mach_approximate_time(ctime);
 #endif
+	sched_update_pset_avg_execution_time(processor->processor_set, thread->quantum_remaining, ctime, thread->th_sched_bucket);
 
 #if MONOTONIC
 	mt_sched_update(thread);
@@ -201,8 +201,8 @@ thread_quantum_expire(
 	 * during privilege transitions, synthesize an event now.
 	 */
 	if (!thread->precise_user_kernel_time) {
-		timer_update(PROCESSOR_DATA(processor, current_state), ctime);
-		timer_update(PROCESSOR_DATA(processor, thread_timer), ctime);
+		timer_update(processor->current_state, ctime);
+		timer_update(processor->thread_timer, ctime);
 		timer_update(&thread->runnable_timer, ctime);
 	}
 
@@ -233,8 +233,7 @@ thread_quantum_expire(
 	ast_propagate(thread);
 
 	thread_unlock(thread);
-
-	timer_call_quantum_timer_enter(&processor->quantum_timer, thread,
+	running_timer_enter(processor, RUNNING_TIMER_QUANTUM, thread,
 	    processor->quantum_end, ctime);
 
 	/* Tell platform layer that we are still running this thread */
@@ -279,11 +278,11 @@ sched_set_thread_base_priority(thread_t thread, int priority)
 	}
 
 	int old_base_pri = thread->base_pri;
-	thread->req_base_pri = priority;
+	thread->req_base_pri = (int16_t)priority;
 	if (thread->sched_flags & TH_SFLAG_BASE_PRI_FROZEN) {
 		priority = MAX(priority, old_base_pri);
 	}
-	thread->base_pri = priority;
+	thread->base_pri = (int16_t)priority;
 
 	if ((thread->state & TH_RUN) == TH_RUN) {
 		assert(thread->last_made_runnable_time != THREAD_NOT_RUNNABLE);
@@ -335,11 +334,11 @@ sched_set_kernel_thread_priority(thread_t thread, int new_priority)
 	if (new_priority > thread->max_priority) {
 		new_priority = thread->max_priority;
 	}
-#if CONFIG_EMBEDDED
+#if !defined(XNU_TARGET_OS_OSX)
 	if (new_priority < MAXPRI_THROTTLE) {
 		new_priority = MAXPRI_THROTTLE;
 	}
-#endif /* CONFIG_EMBEDDED */
+#endif /* !defined(XNU_TARGET_OS_OSX) */
 
 	thread->importance = new_priority - thread->task_priority;
 
@@ -370,10 +369,10 @@ thread_recompute_sched_pri(thread_t thread, set_sched_pri_options_t options)
 	uint32_t sched_flags = thread->sched_flags;
 	sched_mode_t sched_mode = thread->sched_mode;
 
-	int priority = thread->base_pri;
+	int16_t priority = thread->base_pri;
 
 	if (sched_mode == TH_MODE_TIMESHARE) {
-		priority = SCHED(compute_timeshare_priority)(thread);
+		priority = (int16_t)SCHED(compute_timeshare_priority)(thread);
 	}
 
 	if (sched_flags & TH_SFLAG_DEPRESS) {
@@ -428,6 +427,9 @@ sched_default_quantum_expire(thread_t thread __unused)
 	 */
 }
 
+int smt_timeshare_enabled = 1;
+int smt_sched_bonus_16ths = 8;
+
 #if defined(CONFIG_SCHED_TIMESHARE_CORE)
 
 /*
@@ -458,7 +460,11 @@ lightweight_update_priority(thread_t thread)
 	 * resources.
 	 */
 	if (thread->pri_shift < INT8_MAX) {
-		thread->sched_usage += delta;
+		if (thread_no_smt(thread) && smt_timeshare_enabled) {
+			thread->sched_usage += (delta + ((delta * smt_sched_bonus_16ths) >> 4));
+		} else {
+			thread->sched_usage += delta;
+		}
 	}
 
 	thread->cpu_delta += delta;
@@ -531,19 +537,25 @@ const struct shift_data sched_decay_shifts[SCHED_DECAY_TICKS] = {
 
 extern int sched_pri_decay_band_limit;
 
-/* Only use the decay floor logic on embedded non-clutch schedulers */
-#if CONFIG_EMBEDDED && !CONFIG_SCHED_CLUTCH
+/* Only use the decay floor logic on non-macOS and non-clutch schedulers */
+#if !defined(XNU_TARGET_OS_OSX) && !CONFIG_SCHED_CLUTCH
 
 int
 sched_compute_timeshare_priority(thread_t thread)
 {
-	int decay_amount = (thread->sched_usage >> thread->pri_shift);
+	int decay_amount;
 	int decay_limit = sched_pri_decay_band_limit;
 
 	if (thread->base_pri > BASEPRI_FOREGROUND) {
 		decay_limit += (thread->base_pri - BASEPRI_FOREGROUND);
 	}
 
+	if (thread->pri_shift == INT8_MAX) {
+		decay_amount = 0;
+	} else {
+		decay_amount = (thread->sched_usage >> thread->pri_shift);
+	}
+
 	if (decay_amount > decay_limit) {
 		decay_amount = decay_limit;
 	}
@@ -564,13 +576,17 @@ sched_compute_timeshare_priority(thread_t thread)
 	return priority;
 }
 
-#else /* CONFIG_EMBEDDED && !CONFIG_SCHED_CLUTCH */
+#else /* !defined(XNU_TARGET_OS_OSX) && !CONFIG_SCHED_CLUTCH */
 
 int
 sched_compute_timeshare_priority(thread_t thread)
 {
 	/* start with base priority */
-	int priority = thread->base_pri - (thread->sched_usage >> thread->pri_shift);
+	int priority = thread->base_pri;
+
+	if (thread->pri_shift != INT8_MAX) {
+		priority -= (thread->sched_usage >> thread->pri_shift);
+	}
 
 	if (priority < MINPRI_USER) {
 		priority = MINPRI_USER;
@@ -581,7 +597,7 @@ sched_compute_timeshare_priority(thread_t thread)
 	return priority;
 }
 
-#endif /* CONFIG_EMBEDDED && !CONFIG_SCHED_CLUTCH */
+#endif /* !defined(XNU_TARGET_OS_OSX) && !CONFIG_SCHED_CLUTCH */
 
 /*
  * can_update_priority
@@ -635,7 +651,11 @@ update_priority(
 	 * determine if the system was in a contended state.
 	 */
 	if (thread->pri_shift < INT8_MAX) {
-		thread->sched_usage += delta;
+		if (thread_no_smt(thread) && smt_timeshare_enabled) {
+			thread->sched_usage += (delta + ((delta * smt_sched_bonus_16ths) >> 4));
+		} else {
+			thread->sched_usage += delta;
+		}
 	}
 
 	thread->cpu_usage += delta + thread->cpu_delta;
@@ -729,6 +749,26 @@ sched_decr_bucket(sched_bucket_t bucket)
 	os_atomic_dec(&sched_run_buckets[bucket], relaxed);
 }
 
+static void
+sched_add_bucket(sched_bucket_t bucket, uint8_t run_weight)
+{
+	assert(bucket >= TH_BUCKET_FIXPRI &&
+	    bucket <= TH_BUCKET_SHARE_BG);
+
+	os_atomic_add(&sched_run_buckets[bucket], run_weight, relaxed);
+}
+
+static void
+sched_sub_bucket(sched_bucket_t bucket, uint8_t run_weight)
+{
+	assert(bucket >= TH_BUCKET_FIXPRI &&
+	    bucket <= TH_BUCKET_SHARE_BG);
+
+	assert(os_atomic_load(&sched_run_buckets[bucket], relaxed) > 0);
+
+	os_atomic_sub(&sched_run_buckets[bucket], run_weight, relaxed);
+}
+
 uint32_t
 sched_run_incr(thread_t thread)
 {
@@ -753,6 +793,35 @@ sched_run_decr(thread_t thread)
 	return new_count;
 }
 
+uint32_t
+sched_smt_run_incr(thread_t thread)
+{
+	assert((thread->state & (TH_RUN | TH_IDLE)) == TH_RUN);
+
+	uint8_t run_weight = (thread_no_smt(thread) && smt_timeshare_enabled) ? 2 : 1;
+	thread->sched_saved_run_weight = run_weight;
+
+	uint32_t new_count = os_atomic_add(&sched_run_buckets[TH_BUCKET_RUN], run_weight, relaxed);
+
+	sched_add_bucket(thread->th_sched_bucket, run_weight);
+
+	return new_count;
+}
+
+uint32_t
+sched_smt_run_decr(thread_t thread)
+{
+	assert((thread->state & (TH_RUN | TH_IDLE)) != TH_RUN);
+
+	uint8_t run_weight = thread->sched_saved_run_weight;
+
+	sched_sub_bucket(thread->th_sched_bucket, run_weight);
+
+	uint32_t new_count = os_atomic_sub(&sched_run_buckets[TH_BUCKET_RUN], run_weight, relaxed);
+
+	return new_count;
+}
+
 void
 sched_update_thread_bucket(thread_t thread)
 {
@@ -793,6 +862,46 @@ sched_update_thread_bucket(thread)
 	}
 }
 
+void
+sched_smt_update_thread_bucket(thread_t thread)
+{
+	sched_bucket_t old_bucket = thread->th_sched_bucket;
+	sched_bucket_t new_bucket = TH_BUCKET_RUN;
+
+	switch (thread->sched_mode) {
+	case TH_MODE_FIXED:
+	case TH_MODE_REALTIME:
+		new_bucket = TH_BUCKET_FIXPRI;
+		break;
+
+	case TH_MODE_TIMESHARE:
+		if (thread->base_pri > BASEPRI_DEFAULT) {
+			new_bucket = TH_BUCKET_SHARE_FG;
+		} else if (thread->base_pri > BASEPRI_UTILITY) {
+			new_bucket = TH_BUCKET_SHARE_DF;
+		} else if (thread->base_pri > MAXPRI_THROTTLE) {
+			new_bucket = TH_BUCKET_SHARE_UT;
+		} else {
+			new_bucket = TH_BUCKET_SHARE_BG;
+		}
+		break;
+
+	default:
+		panic("unexpected mode: %d", thread->sched_mode);
+		break;
+	}
+
+	if (old_bucket != new_bucket) {
+		thread->th_sched_bucket = new_bucket;
+		thread->pri_shift = sched_pri_shifts[new_bucket];
+
+		if ((thread->state & (TH_RUN | TH_IDLE)) == TH_RUN) {
+			sched_sub_bucket(old_bucket, thread->sched_saved_run_weight);
+			sched_add_bucket(new_bucket, thread->sched_saved_run_weight);
+		}
+	}
+}
+
 /*
  * Set the thread's true scheduling mode
  * Called with thread mutex and thread locked
@@ -816,6 +925,18 @@ sched_set_thread_mode(thread_t thread, sched_mode_t new_mode)
 		break;
 	}
 
+#if CONFIG_SCHED_AUTO_JOIN
+	/*
+	 * Realtime threads might have auto-joined a work interval based on
+	 * make runnable relationships. If such an RT thread is now being demoted
+	 * to non-RT, unjoin the thread from the work interval.
+	 */
+	if ((thread->sched_flags & TH_SFLAG_THREAD_GROUP_AUTO_JOIN) && (new_mode != TH_MODE_REALTIME)) {
+		assert((thread->sched_mode == TH_MODE_REALTIME) || (thread->th_work_interval_flags & TH_WORK_INTERVAL_FLAGS_AUTO_JOIN_LEAK));
+		work_interval_auto_join_demote(thread);
+	}
+#endif /* CONFIG_SCHED_AUTO_JOIN */
+
 	thread->sched_mode = new_mode;
 
 	SCHED(update_thread_bucket)(thread);
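
Note (illustrative, not part of the patch above): the new SMT-aware timeshare
accounting charges a thread that has opted out of SMT (thread_no_smt()) an
extra smt_sched_bonus_16ths/16 of its measured CPU delta, and counts it with a
run weight of 2 instead of 1 in the run buckets, reflecting that it occupies
both hardware threads of a core. With the default smt_sched_bonus_16ths = 8
that is a 1.5x usage charge, so such a thread's priority decays faster. The
standalone sketch below reproduces only the charging arithmetic seen in
lightweight_update_priority()/update_priority(); the helper name and the
sample delta value are hypothetical, chosen just to show the math.

	/* usage_charge_sketch.c -- hypothetical user-space illustration, not kernel code */
	#include <stdint.h>
	#include <stdio.h>

	static uint64_t
	charged_usage(uint64_t delta, int no_smt, int smt_timeshare_enabled,
	    int smt_sched_bonus_16ths)
	{
		if (no_smt && smt_timeshare_enabled) {
			/* same expression as the patched scheduler paths */
			return delta + ((delta * smt_sched_bonus_16ths) >> 4);
		}
		return delta;
	}

	int
	main(void)
	{
		uint64_t delta = 10000;	/* hypothetical CPU delta in abstime units */

		/* SMT-willing thread: charged exactly its delta (10000) */
		printf("smt-willing: %llu\n",
		    (unsigned long long)charged_usage(delta, 0, 1, 8));

		/* no-SMT thread: charged delta + delta*8/16 = 15000, i.e. 1.5x */
		printf("no-smt:      %llu\n",
		    (unsigned long long)charged_usage(delta, 1, 1, 8));
		return 0;
	}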