X-Git-Url: https://git.saurik.com/apple/xnu.git/blobdiff_plain/378393581903b274cb7a4d18e0d978071a6b592d..c18c124eaa464aaaa5549e99e5a70fc9cbb50944:/osfmk/kern/clock.c diff --git a/osfmk/kern/clock.c b/osfmk/kern/clock.c index 25fecf46f..1bd578496 100644 --- a/osfmk/kern/clock.c +++ b/osfmk/kern/clock.c @@ -1,131 +1,152 @@ /* - * Copyright (c) 2000-2004 Apple Computer, Inc. All rights reserved. + * Copyright (c) 2000-2008 Apple Inc. All rights reserved. * - * @APPLE_LICENSE_HEADER_START@ + * @APPLE_OSREFERENCE_LICENSE_HEADER_START@ * - * The contents of this file constitute Original Code as defined in and - * are subject to the Apple Public Source License Version 1.1 (the - * "License"). You may not use this file except in compliance with the - * License. Please obtain a copy of the License at - * http://www.apple.com/publicsource and read it before using this file. + * This file contains Original Code and/or Modifications of Original Code + * as defined in and that are subject to the Apple Public Source License + * Version 2.0 (the 'License'). You may not use this file except in + * compliance with the License. The rights granted to you under the License + * may not be used to create, or enable the creation or redistribution of, + * unlawful or unlicensed copies of an Apple operating system, or to + * circumvent, violate, or enable the circumvention or violation of, any + * terms of an Apple operating system software license agreement. * - * This Original Code and all software distributed under the License are - * distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY KIND, EITHER + * Please obtain a copy of the License at + * http://www.opensource.apple.com/apsl/ and read it before using this file. + * + * The Original Code and all software distributed under the License are + * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES, * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY, - * FITNESS FOR A PARTICULAR PURPOSE OR NON-INFRINGEMENT. Please see the - * License for the specific language governing rights and limitations - * under the License. + * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT. + * Please see the License for the specific language governing rights and + * limitations under the License. * - * @APPLE_LICENSE_HEADER_END@ + * @APPLE_OSREFERENCE_LICENSE_HEADER_END@ */ /* * @OSF_COPYRIGHT@ */ /* - * File: kern/clock.c - * Purpose: Routines for the creation and use of kernel - * alarm clock services. This file and the ipc - * routines in kern/ipc_clock.c constitute the - * machine-independent clock service layer. */ -#include - #include -#include -#include -#include - -#include -#include -#include -#include + #include #include #include -#include #include -#include +#include + +#include -#include -#include +#include #include -#include #include -#include -#include -#include +uint32_t hz_tick_interval = 1; + + +decl_simple_lock_data(,clock_lock) + +#define clock_lock() \ + simple_lock(&clock_lock) + +#define clock_unlock() \ + simple_unlock(&clock_lock) + +#define clock_lock_init() \ + simple_lock_init(&clock_lock, 0) + + +/* + * Time of day (calendar) variables. + * + * Algorithm: + * + * TOD <- (seconds + epoch, fraction) <- CONV(current absolute time + offset) + * + * where CONV converts absolute time units into seconds and a fraction. + */ +static struct clock_calend { + uint64_t epoch; + uint64_t offset; + + int32_t adjdelta; /* Nanosecond time delta for this adjustment period */ + uint64_t adjstart; /* Absolute time value for start of this adjustment period */ + uint32_t adjoffset; /* Absolute time offset for this adjustment period as absolute value */ +} clock_calend; + +#if CONFIG_DTRACE /* - * Exported interface + * Unlocked calendar flipflop; this is used to track a clock_calend such + * that we can safely access a snapshot of a valid clock_calend structure + * without needing to take any locks to do it. + * + * The trick is to use a generation count and set the low bit when it is + * being updated/read; by doing this, we guarantee, through use of the + * hw_atomic functions, that the generation is incremented when the bit + * is cleared atomically (by using a 1 bit add). */ +static struct unlocked_clock_calend { + struct clock_calend calend; /* copy of calendar */ + uint32_t gen; /* generation count */ +} flipflop[ 2]; -#include -#include +static void clock_track_calend_nowait(void); -/* local data declarations */ -decl_simple_lock_data(static,ClockLock) /* clock system synchronization */ -static struct zone *alarm_zone; /* zone for user alarms */ -static struct alarm *alrmfree; /* alarm free list pointer */ -static struct alarm *alrmdone; /* alarm done list pointer */ -static long alrm_seqno; /* uniquely identifies alarms */ -static thread_call_data_t alarm_deliver; +#endif -decl_simple_lock_data(static,calend_adjlock) +/* + * Calendar adjustment variables and values. + */ +#define calend_adjperiod (NSEC_PER_SEC / 100) /* adjustment period, ns */ +#define calend_adjskew (40 * NSEC_PER_USEC) /* "standard" skew, ns / period */ +#define calend_adjbig (NSEC_PER_SEC) /* use 10x skew above adjbig ns */ + +static int64_t calend_adjtotal; /* Nanosecond remaining total adjustment */ +static uint64_t calend_adjdeadline; /* Absolute time value for next adjustment period */ +static uint32_t calend_adjinterval; /* Absolute time interval of adjustment period */ static timer_call_data_t calend_adjcall; -static uint64_t calend_adjdeadline; +static uint32_t calend_adjactive; + +static uint32_t calend_set_adjustment( + long *secs, + int *microsecs); + +static void calend_adjust_call(void); +static uint32_t calend_adjust(void); static thread_call_data_t calend_wakecall; -/* external declarations */ -extern struct clock clock_list[]; -extern int clock_count; - -/* local clock subroutines */ -static -void flush_alarms( - clock_t clock); - -static -void post_alarm( - clock_t clock, - alarm_t alarm); - -static -int check_time( - alarm_type_t alarm_type, - mach_timespec_t *alarm_time, - mach_timespec_t *clock_time); - -static -void clock_alarm_deliver( - thread_call_param_t p0, - thread_call_param_t p1); - -static -void calend_adjust_call( - timer_call_param_t p0, - timer_call_param_t p1); - -static -void calend_dowakeup( - thread_call_param_t p0, - thread_call_param_t p1); +extern void IOKitResetTime(void); -/* - * Macros to lock/unlock clock system. - */ -#define LOCK_CLOCK(s) \ - s = splclock(); \ - simple_lock(&ClockLock); +void _clock_delay_until_deadline(uint64_t interval, + uint64_t deadline); -#define UNLOCK_CLOCK(s) \ - simple_unlock(&ClockLock); \ - splx(s); +static uint64_t clock_boottime; /* Seconds boottime epoch */ + +#define TIME_ADD(rsecs, secs, rfrac, frac, unit) \ +MACRO_BEGIN \ + if (((rfrac) += (frac)) >= (unit)) { \ + (rfrac) -= (unit); \ + (rsecs) += 1; \ + } \ + (rsecs) += (secs); \ +MACRO_END + +#define TIME_SUB(rsecs, secs, rfrac, frac, unit) \ +MACRO_BEGIN \ + if ((int)((rfrac) -= (frac)) < 0) { \ + (rfrac) += (unit); \ + (rsecs) -= 1; \ + } \ + (rsecs) -= (secs); \ +MACRO_END /* * clock_config: @@ -135,37 +156,12 @@ void calend_dowakeup( void clock_config(void) { - clock_t clock; - register int i; - - assert(cpu_number() == master_cpu); - - simple_lock_init(&ClockLock, 0); - thread_call_setup(&alarm_deliver, clock_alarm_deliver, NULL); - - simple_lock_init(&calend_adjlock, 0); - timer_call_setup(&calend_adjcall, calend_adjust_call, NULL); - - thread_call_setup(&calend_wakecall, calend_dowakeup, NULL); + clock_lock_init(); - /* - * Configure clock devices. - */ - for (i = 0; i < clock_count; i++) { - clock = &clock_list[i]; - if (clock->cl_ops) { - if ((*clock->cl_ops->c_config)() == 0) - clock->cl_ops = 0; - } - } - - /* - * Initialize the timer callouts. - */ - timer_call_initialize(); + timer_call_setup(&calend_adjcall, (timer_call_func_t)calend_adjust_call, NULL); + thread_call_setup(&calend_wakecall, (thread_call_func_t)IOKitResetTime, NULL); - /* start alarm sequence numbers at 0 */ - alrm_seqno = 0; + clock_oldconfig(); } /* @@ -176,696 +172,623 @@ clock_config(void) void clock_init(void) { - clock_t clock; - register int i; - - /* - * Initialize basic clock structures. - */ - for (i = 0; i < clock_count; i++) { - clock = &clock_list[i]; - if (clock->cl_ops && clock->cl_ops->c_init) - (*clock->cl_ops->c_init)(); - } + clock_oldinit(); } /* - * Called by machine dependent code - * to initialize areas dependent on the - * timebase value. May be called multiple - * times during start up. + * clock_timebase_init: + * + * Called by machine dependent code + * to initialize areas dependent on the + * timebase value. May be called multiple + * times during start up. */ void clock_timebase_init(void) { - sched_timebase_init(); -} + uint64_t abstime; -/* - * Initialize the clock ipc service facility. - */ -void -clock_service_create(void) -{ - clock_t clock; - register int i; + nanoseconds_to_absolutetime(calend_adjperiod, &abstime); + calend_adjinterval = (uint32_t)abstime; - /* - * Initialize ipc clock services. - */ - for (i = 0; i < clock_count; i++) { - clock = &clock_list[i]; - if (clock->cl_ops) { - ipc_clock_init(clock); - ipc_clock_enable(clock); - } - } + nanoseconds_to_absolutetime(NSEC_PER_SEC / 100, &abstime); + hz_tick_interval = (uint32_t)abstime; - /* - * Perform miscellaneous late - * initialization. - */ - i = sizeof(struct alarm); - alarm_zone = zinit(i, (4096/i)*i, 10*i, "alarms"); + sched_timebase_init(); } /* - * Get the service port on a clock. + * mach_timebase_info_trap: + * + * User trap returns timebase constant. */ kern_return_t -host_get_clock_service( - host_t host, - clock_id_t clock_id, - clock_t *clock) /* OUT */ +mach_timebase_info_trap( + struct mach_timebase_info_trap_args *args) { - if (host == HOST_NULL || clock_id < 0 || clock_id >= clock_count) { - *clock = CLOCK_NULL; - return (KERN_INVALID_ARGUMENT); - } + mach_vm_address_t out_info_addr = args->info; + mach_timebase_info_data_t info; - *clock = &clock_list[clock_id]; - if ((*clock)->cl_ops == 0) - return (KERN_FAILURE); - return (KERN_SUCCESS); -} + clock_timebase_info(&info); -/* - * Get the control port on a clock. - */ -kern_return_t -host_get_clock_control( - host_priv_t host_priv, - clock_id_t clock_id, - clock_t *clock) /* OUT */ -{ - if (host_priv == HOST_PRIV_NULL || clock_id < 0 || clock_id >= clock_count) { - *clock = CLOCK_NULL; - return (KERN_INVALID_ARGUMENT); - } + copyout((void *)&info, out_info_addr, sizeof (info)); - *clock = &clock_list[clock_id]; - if ((*clock)->cl_ops == 0) - return (KERN_FAILURE); return (KERN_SUCCESS); } /* - * Get the current clock time. + * Calendar routines. */ -kern_return_t -clock_get_time( - clock_t clock, - mach_timespec_t *cur_time) /* OUT */ -{ - if (clock == CLOCK_NULL) - return (KERN_INVALID_ARGUMENT); - return ((*clock->cl_ops->c_gettime)(cur_time)); -} /* - * Get clock attributes. + * clock_get_calendar_microtime: + * + * Returns the current calendar value, + * microseconds as the fraction. */ -kern_return_t -clock_get_attributes( - clock_t clock, - clock_flavor_t flavor, - clock_attr_t attr, /* OUT */ - mach_msg_type_number_t *count) /* IN/OUT */ +void +clock_get_calendar_microtime( + clock_sec_t *secs, + clock_usec_t *microsecs) { - if (clock == CLOCK_NULL) - return (KERN_INVALID_ARGUMENT); - if (clock->cl_ops->c_getattr) - return(clock->cl_ops->c_getattr(flavor, attr, count)); - else - return (KERN_FAILURE); + clock_get_calendar_absolute_and_microtime(secs, microsecs, NULL); } /* - * Set the current clock time. + * clock_get_calendar_absolute_and_microtime: + * + * Returns the current calendar value, + * microseconds as the fraction. Also + * returns mach_absolute_time if abstime + * is not NULL. */ -kern_return_t -clock_set_time( - clock_t clock, - mach_timespec_t new_time) +void +clock_get_calendar_absolute_and_microtime( + clock_sec_t *secs, + clock_usec_t *microsecs, + uint64_t *abstime) { - mach_timespec_t *clock_time; + uint64_t now; + spl_t s; - if (clock == CLOCK_NULL) - return (KERN_INVALID_ARGUMENT); - if (clock->cl_ops->c_settime == NULL) - return (KERN_FAILURE); - clock_time = &new_time; - if (BAD_MACH_TIMESPEC(clock_time)) - return (KERN_INVALID_VALUE); + s = splclock(); + clock_lock(); + + now = mach_absolute_time(); + if (abstime) + *abstime = now; + + if (clock_calend.adjdelta < 0) { + uint32_t t32; + + /* + * Since offset is decremented during a negative adjustment, + * ensure that time increases monotonically without going + * temporarily backwards. + * If the delta has not yet passed, now is set to the start + * of the current adjustment period; otherwise, we're between + * the expiry of the delta and the next call to calend_adjust(), + * and we offset accordingly. + */ + if (now > clock_calend.adjstart) { + t32 = (uint32_t)(now - clock_calend.adjstart); - /* - * Flush all outstanding alarms. - */ - flush_alarms(clock); + if (t32 > clock_calend.adjoffset) + now -= clock_calend.adjoffset; + else + now = clock_calend.adjstart; + } + } - /* - * Set the new time. - */ - return (clock->cl_ops->c_settime(clock_time)); + now += clock_calend.offset; + + absolutetime_to_microtime(now, secs, microsecs); + + *secs += (clock_sec_t)clock_calend.epoch; + + clock_unlock(); + splx(s); } /* - * Set the clock alarm resolution. + * clock_get_calendar_nanotime: + * + * Returns the current calendar value, + * nanoseconds as the fraction. + * + * Since we do not have an interface to + * set the calendar with resolution greater + * than a microsecond, we honor that here. */ -kern_return_t -clock_set_attributes( - clock_t clock, - clock_flavor_t flavor, - clock_attr_t attr, - mach_msg_type_number_t count) +void +clock_get_calendar_nanotime( + clock_sec_t *secs, + clock_nsec_t *nanosecs) { - if (clock == CLOCK_NULL) - return (KERN_INVALID_ARGUMENT); - if (clock->cl_ops->c_setattr) - return (clock->cl_ops->c_setattr(flavor, attr, count)); - else - return (KERN_FAILURE); + uint64_t now; + spl_t s; + + s = splclock(); + clock_lock(); + + now = mach_absolute_time(); + + if (clock_calend.adjdelta < 0) { + uint32_t t32; + + if (now > clock_calend.adjstart) { + t32 = (uint32_t)(now - clock_calend.adjstart); + + if (t32 > clock_calend.adjoffset) + now -= clock_calend.adjoffset; + else + now = clock_calend.adjstart; + } + } + + now += clock_calend.offset; + + absolutetime_to_microtime(now, secs, nanosecs); + + *nanosecs *= NSEC_PER_USEC; + + *secs += (clock_sec_t)clock_calend.epoch; + + clock_unlock(); + splx(s); } /* - * Setup a clock alarm. + * clock_gettimeofday: + * + * Kernel interface for commpage implementation of + * gettimeofday() syscall. + * + * Returns the current calendar value, and updates the + * commpage info as appropriate. Because most calls to + * gettimeofday() are handled in user mode by the commpage, + * this routine should be used infrequently. */ -kern_return_t -clock_alarm( - clock_t clock, - alarm_type_t alarm_type, - mach_timespec_t alarm_time, - ipc_port_t alarm_port, - mach_msg_type_name_t alarm_port_type) +void +clock_gettimeofday( + clock_sec_t *secs, + clock_usec_t *microsecs) { - alarm_t alarm; - mach_timespec_t clock_time; - int chkstat; - kern_return_t reply_code; - spl_t s; - - if (clock == CLOCK_NULL) - return (KERN_INVALID_ARGUMENT); - if (clock->cl_ops->c_setalrm == 0) - return (KERN_FAILURE); - if (IP_VALID(alarm_port) == 0) - return (KERN_INVALID_CAPABILITY); + uint64_t now; + spl_t s; - /* - * Check alarm parameters. If parameters are invalid, - * send alarm message immediately. - */ - (*clock->cl_ops->c_gettime)(&clock_time); - chkstat = check_time(alarm_type, &alarm_time, &clock_time); - if (chkstat <= 0) { - reply_code = (chkstat < 0 ? KERN_INVALID_VALUE : KERN_SUCCESS); - clock_alarm_reply(alarm_port, alarm_port_type, - reply_code, alarm_type, clock_time); - return (KERN_SUCCESS); + s = splclock(); + clock_lock(); + + now = mach_absolute_time(); + + if (clock_calend.adjdelta >= 0) { + clock_gettimeofday_set_commpage(now, clock_calend.epoch, clock_calend.offset, secs, microsecs); } + else { + uint32_t t32; - /* - * Get alarm and add to clock alarm list. - */ + if (now > clock_calend.adjstart) { + t32 = (uint32_t)(now - clock_calend.adjstart); + + if (t32 > clock_calend.adjoffset) + now -= clock_calend.adjoffset; + else + now = clock_calend.adjstart; + } + + now += clock_calend.offset; + + absolutetime_to_microtime(now, secs, microsecs); - LOCK_CLOCK(s); - if ((alarm = alrmfree) == 0) { - UNLOCK_CLOCK(s); - alarm = (alarm_t) zalloc(alarm_zone); - if (alarm == 0) - return (KERN_RESOURCE_SHORTAGE); - LOCK_CLOCK(s); + *secs += (clock_sec_t)clock_calend.epoch; } - else - alrmfree = alarm->al_next; - - alarm->al_status = ALARM_CLOCK; - alarm->al_time = alarm_time; - alarm->al_type = alarm_type; - alarm->al_port = alarm_port; - alarm->al_port_type = alarm_port_type; - alarm->al_clock = clock; - alarm->al_seqno = alrm_seqno++; - post_alarm(clock, alarm); - UNLOCK_CLOCK(s); - return (KERN_SUCCESS); + clock_unlock(); + splx(s); } /* - * Sleep on a clock. System trap. User-level libmach clock_sleep - * interface call takes a mach_timespec_t sleep_time argument which it - * converts to sleep_sec and sleep_nsec arguments which are then - * passed to clock_sleep_trap. + * clock_set_calendar_microtime: + * + * Sets the current calendar value by + * recalculating the epoch and offset + * from the system clock. + * + * Also adjusts the boottime to keep the + * value consistent, writes the new + * calendar value to the platform clock, + * and sends calendar change notifications. */ -kern_return_t -clock_sleep_trap( - struct clock_sleep_trap_args *args) +void +clock_set_calendar_microtime( + clock_sec_t secs, + clock_usec_t microsecs) { - mach_port_name_t clock_name = args->clock_name; - sleep_type_t sleep_type = args->sleep_type; - int sleep_sec = args->sleep_sec; - int sleep_nsec = args->sleep_nsec; - mach_vm_address_t wakeup_time_addr = args->wakeup_time; - clock_t clock; - mach_timespec_t swtime; - kern_return_t rvalue; + clock_sec_t sys; + clock_usec_t microsys; + clock_sec_t newsecs; + clock_usec_t newmicrosecs; + spl_t s; - /* - * Convert the trap parameters. - */ - if (clock_name != MACH_PORT_NULL) - clock = port_name_to_clock(clock_name); - else - clock = &clock_list[SYSTEM_CLOCK]; + newsecs = secs; + newmicrosecs = microsecs; + + s = splclock(); + clock_lock(); - swtime.tv_sec = sleep_sec; - swtime.tv_nsec = sleep_nsec; + commpage_disable_timestamp(); /* - * Call the actual clock_sleep routine. + * Calculate the new calendar epoch based on + * the new value and the system clock. */ - rvalue = clock_sleep_internal(clock, sleep_type, &swtime); + clock_get_system_microtime(&sys, µsys); + TIME_SUB(secs, sys, microsecs, microsys, USEC_PER_SEC); /* - * Return current time as wakeup time. + * Adjust the boottime based on the delta. */ - if (rvalue != KERN_INVALID_ARGUMENT && rvalue != KERN_FAILURE) { - copyout((char *)&swtime, wakeup_time_addr, sizeof(mach_timespec_t)); - } - return (rvalue); -} - -/* - * Kernel internally callable clock sleep routine. The calling - * thread is suspended until the requested sleep time is reached. - */ -kern_return_t -clock_sleep_internal( - clock_t clock, - sleep_type_t sleep_type, - mach_timespec_t *sleep_time) -{ - alarm_t alarm; - mach_timespec_t clock_time; - kern_return_t rvalue; - int chkstat; - spl_t s; - - if (clock == CLOCK_NULL) - return (KERN_INVALID_ARGUMENT); - if (clock->cl_ops->c_setalrm == 0) - return (KERN_FAILURE); + clock_boottime += secs - clock_calend.epoch; /* - * Check sleep parameters. If parameters are invalid - * return an error, otherwise post alarm request. + * Set the new calendar epoch. */ - (*clock->cl_ops->c_gettime)(&clock_time); + clock_calend.epoch = secs; - chkstat = check_time(sleep_type, sleep_time, &clock_time); - if (chkstat < 0) - return (KERN_INVALID_VALUE); - rvalue = KERN_SUCCESS; - if (chkstat > 0) { - wait_result_t wait_result; + nanoseconds_to_absolutetime((uint64_t)microsecs * NSEC_PER_USEC, &clock_calend.offset); - /* - * Get alarm and add to clock alarm list. - */ - - LOCK_CLOCK(s); - if ((alarm = alrmfree) == 0) { - UNLOCK_CLOCK(s); - alarm = (alarm_t) zalloc(alarm_zone); - if (alarm == 0) - return (KERN_RESOURCE_SHORTAGE); - LOCK_CLOCK(s); - } - else - alrmfree = alarm->al_next; + /* + * Cancel any adjustment in progress. + */ + calend_adjtotal = clock_calend.adjdelta = 0; - /* - * Wait for alarm to occur. - */ - wait_result = assert_wait((event_t)alarm, THREAD_ABORTSAFE); - if (wait_result == THREAD_WAITING) { - alarm->al_time = *sleep_time; - alarm->al_status = ALARM_SLEEP; - post_alarm(clock, alarm); - UNLOCK_CLOCK(s); + clock_unlock(); - wait_result = thread_block(THREAD_CONTINUE_NULL); + /* + * Set the new value for the platform clock. + */ + PESetUTCTimeOfDay(newsecs, newmicrosecs); - /* - * Note if alarm expired normally or whether it - * was aborted. If aborted, delete alarm from - * clock alarm list. Return alarm to free list. - */ - LOCK_CLOCK(s); - if (alarm->al_status != ALARM_DONE) { - assert(wait_result != THREAD_AWAKENED); - if (((alarm->al_prev)->al_next = alarm->al_next) != NULL) - (alarm->al_next)->al_prev = alarm->al_prev; - rvalue = KERN_ABORTED; - } - *sleep_time = alarm->al_time; - alarm->al_status = ALARM_FREE; - } else { - assert(wait_result == THREAD_INTERRUPTED); - assert(alarm->al_status == ALARM_FREE); - rvalue = KERN_ABORTED; - } - alarm->al_next = alrmfree; - alrmfree = alarm; - UNLOCK_CLOCK(s); - } - else - *sleep_time = clock_time; + splx(s); - return (rvalue); + /* + * Send host notifications. + */ + host_notify_calendar_change(); + +#if CONFIG_DTRACE + clock_track_calend_nowait(); +#endif } /* - * CLOCK INTERRUPT SERVICE ROUTINES. - */ - -/* - * Service clock alarm interrupts. Called from machine dependent - * layer at splclock(). The clock_id argument specifies the clock, - * and the clock_time argument gives that clock's current time. + * clock_initialize_calendar: + * + * Set the calendar and related clocks + * from the platform clock at boot or + * wake event. + * + * Also sends host notifications. */ void -clock_alarm_intr( - clock_id_t clock_id, - mach_timespec_t *clock_time) +clock_initialize_calendar(void) { - clock_t clock; - register alarm_t alrm1; - register alarm_t alrm2; - mach_timespec_t *alarm_time; + clock_sec_t sys, secs; + clock_usec_t microsys, microsecs; spl_t s; - clock = &clock_list[clock_id]; + PEGetUTCTimeOfDay(&secs, µsecs); - /* - * Update clock alarm list. All alarms that are due are moved - * to the alarmdone list to be serviced by the alarm_thread. - */ + s = splclock(); + clock_lock(); - LOCK_CLOCK(s); - alrm1 = (alarm_t) &clock->cl_alarm; - while ((alrm2 = alrm1->al_next) != NULL) { - alarm_time = &alrm2->al_time; - if (CMP_MACH_TIMESPEC(alarm_time, clock_time) > 0) - break; + commpage_disable_timestamp(); + if ((long)secs >= (long)clock_boottime) { /* - * Alarm has expired, so remove it from the - * clock alarm list. - */ - if ((alrm1->al_next = alrm2->al_next) != NULL) - (alrm1->al_next)->al_prev = alrm1; + * Initialize the boot time based on the platform clock. + */ + if (clock_boottime == 0) + clock_boottime = secs; /* - * If a clock_sleep() alarm, wakeup the thread - * which issued the clock_sleep() call. + * Calculate the new calendar epoch based on + * the platform clock and the system clock. */ - if (alrm2->al_status == ALARM_SLEEP) { - alrm2->al_next = 0; - alrm2->al_status = ALARM_DONE; - alrm2->al_time = *clock_time; - thread_wakeup((event_t)alrm2); - } + clock_get_system_microtime(&sys, µsys); + TIME_SUB(secs, sys, microsecs, microsys, USEC_PER_SEC); - /* - * If a clock_alarm() alarm, place the alarm on - * the alarm done list and schedule the alarm - * delivery mechanism. + /* + * Set the new calendar epoch. */ - else { - assert(alrm2->al_status == ALARM_CLOCK); - if ((alrm2->al_next = alrmdone) != NULL) - alrmdone->al_prev = alrm2; - else - thread_call_enter(&alarm_deliver); - alrm2->al_prev = (alarm_t) &alrmdone; - alrmdone = alrm2; - alrm2->al_status = ALARM_DONE; - alrm2->al_time = *clock_time; - } + clock_calend.epoch = secs; + + nanoseconds_to_absolutetime((uint64_t)microsecs * NSEC_PER_USEC, &clock_calend.offset); + + /* + * Cancel any adjustment in progress. + */ + calend_adjtotal = clock_calend.adjdelta = 0; } + clock_unlock(); + splx(s); + /* - * Setup the clock dependent layer to deliver another - * interrupt for the next pending alarm. + * Send host notifications. */ - if (alrm2) - (*clock->cl_ops->c_setalrm)(alarm_time); - UNLOCK_CLOCK(s); + host_notify_calendar_change(); + +#if CONFIG_DTRACE + clock_track_calend_nowait(); +#endif } /* - * ALARM DELIVERY ROUTINES. + * clock_get_boottime_nanotime: + * + * Return the boottime, used by sysctl. */ - -static void -clock_alarm_deliver( - __unused thread_call_param_t p0, - __unused thread_call_param_t p1) +void +clock_get_boottime_nanotime( + clock_sec_t *secs, + clock_nsec_t *nanosecs) { - register alarm_t alrm; - kern_return_t code; - spl_t s; + spl_t s; - LOCK_CLOCK(s); - while ((alrm = alrmdone) != NULL) { - if ((alrmdone = alrm->al_next) != NULL) - alrmdone->al_prev = (alarm_t) &alrmdone; - UNLOCK_CLOCK(s); - - code = (alrm->al_status == ALARM_DONE? KERN_SUCCESS: KERN_ABORTED); - if (alrm->al_port != IP_NULL) { - /* Deliver message to designated port */ - if (IP_VALID(alrm->al_port)) { - clock_alarm_reply(alrm->al_port, alrm->al_port_type, code, - alrm->al_type, alrm->al_time); - } + s = splclock(); + clock_lock(); - LOCK_CLOCK(s); - alrm->al_status = ALARM_FREE; - alrm->al_next = alrmfree; - alrmfree = alrm; - } - else - panic("clock_alarm_deliver"); - } + *secs = (clock_sec_t)clock_boottime; + *nanosecs = 0; - UNLOCK_CLOCK(s); + clock_unlock(); + splx(s); } /* - * CLOCK PRIVATE SERVICING SUBROUTINES. - */ - -/* - * Flush all pending alarms on a clock. All alarms - * are activated and timestamped correctly, so any - * programs waiting on alarms/threads will proceed - * with accurate information. + * clock_adjtime: + * + * Interface to adjtime() syscall. + * + * Calculates adjustment variables and + * initiates adjustment. */ -static void -flush_alarms( - clock_t clock) +clock_adjtime( + long *secs, + int *microsecs) { - register alarm_t alrm1, alrm2; - spl_t s; + uint32_t interval; + spl_t s; - /* - * Flush all outstanding alarms. + s = splclock(); + clock_lock(); + + interval = calend_set_adjustment(secs, microsecs); + if (interval != 0) { + calend_adjdeadline = mach_absolute_time() + interval; + if (!timer_call_enter(&calend_adjcall, calend_adjdeadline, TIMER_CALL_SYS_CRITICAL)) + calend_adjactive++; + } + else + if (timer_call_cancel(&calend_adjcall)) + calend_adjactive--; + + clock_unlock(); + splx(s); +} + +static uint32_t +calend_set_adjustment( + long *secs, + int *microsecs) +{ + uint64_t now, t64; + int64_t total, ototal; + uint32_t interval = 0; + + /* + * Compute the total adjustment time in nanoseconds. */ - LOCK_CLOCK(s); - alrm1 = (alarm_t) &clock->cl_alarm; - while ((alrm2 = alrm1->al_next) != NULL) { - /* - * Remove alarm from the clock alarm list. - */ - if ((alrm1->al_next = alrm2->al_next) != NULL) - (alrm1->al_next)->al_prev = alrm1; + total = ((int64_t)*secs * (int64_t)NSEC_PER_SEC) + (*microsecs * (int64_t)NSEC_PER_USEC); + + /* + * Disable commpage gettimeofday(). + */ + commpage_disable_timestamp(); + + /* + * Get current absolute time. + */ + now = mach_absolute_time(); + + /* + * Save the old adjustment total for later return. + */ + ototal = calend_adjtotal; + /* + * Is a new correction specified? + */ + if (total != 0) { /* - * If a clock_sleep() alarm, wakeup the thread - * which issued the clock_sleep() call. + * Set delta to the standard, small, adjustment skew. */ - if (alrm2->al_status == ALARM_SLEEP) { - alrm2->al_next = 0; - thread_wakeup((event_t)alrm2); + int32_t delta = calend_adjskew; + + if (total > 0) { + /* + * Positive adjustment. If greater than the preset 'big' + * threshold, slew at a faster rate, capping if necessary. + */ + if (total > (int64_t) calend_adjbig) + delta *= 10; + if (delta > total) + delta = (int32_t)total; + + /* + * Convert the delta back from ns to absolute time and store in adjoffset. + */ + nanoseconds_to_absolutetime((uint64_t)delta, &t64); + clock_calend.adjoffset = (uint32_t)t64; } else { /* - * If a clock_alarm() alarm, place the alarm on - * the alarm done list and wakeup the dedicated - * kernel alarm_thread to service the alarm. + * Negative adjustment; therefore, negate the delta. If + * greater than the preset 'big' threshold, slew at a faster + * rate, capping if necessary. */ - assert(alrm2->al_status == ALARM_CLOCK); - if ((alrm2->al_next = alrmdone) != NULL) - alrmdone->al_prev = alrm2; - else - thread_wakeup((event_t)&alrmdone); - alrm2->al_prev = (alarm_t) &alrmdone; - alrmdone = alrm2; + if (total < (int64_t) -calend_adjbig) + delta *= 10; + delta = -delta; + if (delta < total) + delta = (int32_t)total; + + /* + * Save the current absolute time. Subsequent time operations occuring + * during this negative correction can make use of this value to ensure + * that time increases monotonically. + */ + clock_calend.adjstart = now; + + /* + * Convert the delta back from ns to absolute time and store in adjoffset. + */ + nanoseconds_to_absolutetime((uint64_t)-delta, &t64); + clock_calend.adjoffset = (uint32_t)t64; } - } - UNLOCK_CLOCK(s); -} -/* - * Post an alarm on a clock's active alarm list. The alarm is - * inserted in time-order into the clock's active alarm list. - * Always called from within a LOCK_CLOCK() code section. - */ -static -void -post_alarm( - clock_t clock, - alarm_t alarm) -{ - register alarm_t alrm1, alrm2; - mach_timespec_t *alarm_time; - mach_timespec_t *queue_time; + /* + * Store the total adjustment time in ns. + */ + calend_adjtotal = total; + + /* + * Store the delta for this adjustment period in ns. + */ + clock_calend.adjdelta = delta; - /* - * Traverse alarm list until queue time is greater - * than alarm time, then insert alarm. - */ - alarm_time = &alarm->al_time; - alrm1 = (alarm_t) &clock->cl_alarm; - while ((alrm2 = alrm1->al_next) != NULL) { - queue_time = &alrm2->al_time; - if (CMP_MACH_TIMESPEC(queue_time, alarm_time) > 0) - break; - alrm1 = alrm2; + /* + * Set the interval in absolute time for later return. + */ + interval = calend_adjinterval; + } + else { + /* + * No change; clear any prior adjustment. + */ + calend_adjtotal = clock_calend.adjdelta = 0; } - alrm1->al_next = alarm; - alarm->al_next = alrm2; - alarm->al_prev = alrm1; - if (alrm2) - alrm2->al_prev = alarm; - /* - * If the inserted alarm is the 'earliest' alarm, - * reset the device layer alarm time accordingly. + /* + * If an prior correction was in progress, return the + * remaining uncorrected time from it. */ - if (clock->cl_alarm.al_next == alarm) - (*clock->cl_ops->c_setalrm)(alarm_time); + if (ototal != 0) { + *secs = (long)(ototal / (long)NSEC_PER_SEC); + *microsecs = (int)((ototal % (int)NSEC_PER_SEC) / (int)NSEC_PER_USEC); + } + else + *secs = *microsecs = 0; + +#if CONFIG_DTRACE + clock_track_calend_nowait(); +#endif + + return (interval); } -/* - * Check the validity of 'alarm_time' and 'alarm_type'. If either - * argument is invalid, return a negative value. If the 'alarm_time' - * is now, return a 0 value. If the 'alarm_time' is in the future, - * return a positive value. - */ -static -int -check_time( - alarm_type_t alarm_type, - mach_timespec_t *alarm_time, - mach_timespec_t *clock_time) +static void +calend_adjust_call(void) { - int result; - - if (BAD_ALRMTYPE(alarm_type)) - return (-1); - if (BAD_MACH_TIMESPEC(alarm_time)) - return (-1); - if ((alarm_type & ALRMTYPE) == TIME_RELATIVE) - ADD_MACH_TIMESPEC(alarm_time, clock_time); - - result = CMP_MACH_TIMESPEC(alarm_time, clock_time); + uint32_t interval; + spl_t s; - return ((result >= 0)? result: 0); -} + s = splclock(); + clock_lock(); -mach_timespec_t -clock_get_system_value(void) -{ - clock_t clock = &clock_list[SYSTEM_CLOCK]; - mach_timespec_t value; + if (--calend_adjactive == 0) { + interval = calend_adjust(); + if (interval != 0) { + clock_deadline_for_periodic_event(interval, mach_absolute_time(), &calend_adjdeadline); - (void) (*clock->cl_ops->c_gettime)(&value); + if (!timer_call_enter(&calend_adjcall, calend_adjdeadline, TIMER_CALL_SYS_CRITICAL)) + calend_adjactive++; + } + } - return value; + clock_unlock(); + splx(s); } -mach_timespec_t -clock_get_calendar_value(void) +static uint32_t +calend_adjust(void) { - clock_t clock = &clock_list[CALENDAR_CLOCK]; - mach_timespec_t value = MACH_TIMESPEC_ZERO; + uint64_t now, t64; + int32_t delta; + uint32_t interval = 0; - (void) (*clock->cl_ops->c_gettime)(&value); + commpage_disable_timestamp(); - return value; -} + now = mach_absolute_time(); -void -clock_deadline_for_periodic_event( - uint64_t interval, - uint64_t abstime, - uint64_t *deadline) -{ - assert(interval != 0); + delta = clock_calend.adjdelta; - *deadline += interval; + if (delta > 0) { + clock_calend.offset += clock_calend.adjoffset; - if (*deadline <= abstime) { - *deadline = abstime + interval; - abstime = mach_absolute_time(); + calend_adjtotal -= delta; + if (delta > calend_adjtotal) { + clock_calend.adjdelta = delta = (int32_t)calend_adjtotal; - if (*deadline <= abstime) - *deadline = abstime + interval; + nanoseconds_to_absolutetime((uint64_t)delta, &t64); + clock_calend.adjoffset = (uint32_t)t64; + } } -} + else + if (delta < 0) { + clock_calend.offset -= clock_calend.adjoffset; -void -mk_timebase_info_trap( - struct mk_timebase_info_trap_args *args) -{ - uint32_t *delta = args->delta; - uint32_t *abs_to_ns_numer = args->abs_to_ns_numer; - uint32_t *abs_to_ns_denom = args->abs_to_ns_denom; - uint32_t *proc_to_abs_numer = args->proc_to_abs_numer; - uint32_t *proc_to_abs_denom = args->proc_to_abs_denom; - mach_timebase_info_data_t info; - uint32_t one = 1; + calend_adjtotal -= delta; + if (delta < calend_adjtotal) { + clock_calend.adjdelta = delta = (int32_t)calend_adjtotal; - clock_timebase_info(&info); + nanoseconds_to_absolutetime((uint64_t)-delta, &t64); + clock_calend.adjoffset = (uint32_t)t64; + } - copyout((void *)&one, CAST_USER_ADDR_T(delta), sizeof (uint32_t)); + if (clock_calend.adjdelta != 0) + clock_calend.adjstart = now; + } + + if (clock_calend.adjdelta != 0) + interval = calend_adjinterval; - copyout((void *)&info.numer, CAST_USER_ADDR_T(abs_to_ns_numer), sizeof (uint32_t)); - copyout((void *)&info.denom, CAST_USER_ADDR_T(abs_to_ns_denom), sizeof (uint32_t)); +#if CONFIG_DTRACE + clock_track_calend_nowait(); +#endif - copyout((void *)&one, CAST_USER_ADDR_T(proc_to_abs_numer), sizeof (uint32_t)); - copyout((void *)&one, CAST_USER_ADDR_T(proc_to_abs_denom), sizeof (uint32_t)); + return (interval); } -kern_return_t -mach_timebase_info_trap( - struct mach_timebase_info_trap_args *args) +/* + * clock_wakeup_calendar: + * + * Interface to power management, used + * to initiate the reset of the calendar + * on wake from sleep event. + */ +void +clock_wakeup_calendar(void) { - mach_vm_address_t out_info_addr = args->info; - mach_timebase_info_data_t info; - - clock_timebase_info(&info); - - copyout((void *)&info, out_info_addr, sizeof (info)); - - return (KERN_SUCCESS); + thread_call_enter(&calend_wakecall); } +/* + * Wait / delay routines. + */ static void mach_wait_until_continue( __unused void *parameter, @@ -875,6 +798,15 @@ mach_wait_until_continue( /*NOTREACHED*/ } +/* + * mach_wait_until_trap: Suspend execution of calling thread until the specified time has passed + * + * Parameters: args->deadline Amount of time to wait + * + * Returns: 0 Success + * !0 Not success + * + */ kern_return_t mach_wait_until_trap( struct mach_wait_until_trap_args *args) @@ -882,16 +814,14 @@ mach_wait_until_trap( uint64_t deadline = args->deadline; wait_result_t wresult; - wresult = assert_wait_deadline((event_t)mach_wait_until_trap, THREAD_ABORTSAFE, deadline); + wresult = assert_wait_deadline_with_leeway((event_t)mach_wait_until_trap, THREAD_ABORTSAFE, + TIMEOUT_URGENCY_USER_NORMAL, deadline, 0); if (wresult == THREAD_WAITING) wresult = thread_block(mach_wait_until_continue); return ((wresult == THREAD_INTERRUPTED)? KERN_ABORTED: KERN_SUCCESS); } -/* - * Delay primitives. - */ void clock_delay_until( uint64_t deadline) @@ -901,27 +831,44 @@ clock_delay_until( if (now >= deadline) return; - if ( (deadline - now) < (8 * sched_cswtime) || + _clock_delay_until_deadline(deadline - now, deadline); +} + +/* + * Preserve the original precise interval that the client + * requested for comparison to the spin threshold. + */ +void +_clock_delay_until_deadline( + uint64_t interval, + uint64_t deadline) +{ + + if (interval == 0) + return; + + if ( ml_delay_should_spin(interval) || get_preemption_level() != 0 || - ml_get_interrupts_enabled() == FALSE ) - machine_delay_until(deadline); - else { - assert_wait_deadline((event_t)clock_delay_until, THREAD_UNINT, deadline - sched_cswtime); + ml_get_interrupts_enabled() == FALSE ) { + machine_delay_until(interval, deadline); + } else { + assert_wait_deadline((event_t)clock_delay_until, THREAD_UNINT, deadline); thread_block(THREAD_CONTINUE_NULL); } } + void delay_for_interval( uint32_t interval, uint32_t scale_factor) { - uint64_t end; + uint64_t abstime; - clock_interval_to_deadline(interval, scale_factor, &end); + clock_interval_to_absolutetime_interval(interval, scale_factor, &abstime); - clock_delay_until(end); + _clock_delay_until_deadline(abstime, mach_absolute_time() + abstime); } void @@ -931,69 +878,152 @@ delay( delay_for_interval((usec < 0)? -usec: usec, NSEC_PER_USEC); } +/* + * Miscellaneous routines. + */ void -clock_adjtime( - int32_t *secs, - int32_t *microsecs) +clock_interval_to_deadline( + uint32_t interval, + uint32_t scale_factor, + uint64_t *result) { - uint32_t interval; - spl_t s; + uint64_t abstime; - s = splclock(); - simple_lock(&calend_adjlock); + clock_interval_to_absolutetime_interval(interval, scale_factor, &abstime); - interval = clock_set_calendar_adjtime(secs, microsecs); - if (interval != 0) { - if (calend_adjdeadline >= interval) - calend_adjdeadline -= interval; - clock_deadline_for_periodic_event(interval, mach_absolute_time(), - &calend_adjdeadline); + *result = mach_absolute_time() + abstime; +} - timer_call_enter(&calend_adjcall, calend_adjdeadline); - } - else - timer_call_cancel(&calend_adjcall); +void +clock_absolutetime_interval_to_deadline( + uint64_t abstime, + uint64_t *result) +{ + *result = mach_absolute_time() + abstime; +} - simple_unlock(&calend_adjlock); - splx(s); +void +clock_get_uptime( + uint64_t *result) +{ + *result = mach_absolute_time(); } -static void -calend_adjust_call( - __unused timer_call_param_t p0, - __unused timer_call_param_t p1) +void +clock_deadline_for_periodic_event( + uint64_t interval, + uint64_t abstime, + uint64_t *deadline) { - uint32_t interval; - spl_t s; + assert(interval != 0); - s = splclock(); - simple_lock(&calend_adjlock); + *deadline += interval; - interval = clock_adjust_calendar(); - if (interval != 0) { - clock_deadline_for_periodic_event(interval, mach_absolute_time(), - &calend_adjdeadline); + if (*deadline <= abstime) { + *deadline = abstime + interval; + abstime = mach_absolute_time(); - timer_call_enter(&calend_adjcall, calend_adjdeadline); + if (*deadline <= abstime) + *deadline = abstime + interval; } - - simple_unlock(&calend_adjlock); - splx(s); } +#if CONFIG_DTRACE + +/* + * clock_get_calendar_nanotime_nowait + * + * Description: Non-blocking version of clock_get_calendar_nanotime() + * + * Notes: This function operates by separately tracking calendar time + * updates using a two element structure to copy the calendar + * state, which may be asynchronously modified. It utilizes + * barrier instructions in the tracking process and in the local + * stable snapshot process in order to ensure that a consistent + * snapshot is used to perform the calculation. + */ void -clock_wakeup_calendar(void) +clock_get_calendar_nanotime_nowait( + clock_sec_t *secs, + clock_nsec_t *nanosecs) { - thread_call_enter(&calend_wakecall); -} + int i = 0; + uint64_t now; + struct unlocked_clock_calend stable; -extern void IOKitResetTime(void); /* XXX */ + for (;;) { + stable = flipflop[i]; /* take snapshot */ -static void -calend_dowakeup( - __unused thread_call_param_t p0, - __unused thread_call_param_t p1) + /* + * Use a barrier instructions to ensure atomicity. We AND + * off the "in progress" bit to get the current generation + * count. + */ + (void)hw_atomic_and(&stable.gen, ~(uint32_t)1); + + /* + * If an update _is_ in progress, the generation count will be + * off by one, if it _was_ in progress, it will be off by two, + * and if we caught it at a good time, it will be equal (and + * our snapshot is threfore stable). + */ + if (flipflop[i].gen == stable.gen) + break; + + /* Switch to the oher element of the flipflop, and try again. */ + i ^= 1; + } + + now = mach_absolute_time(); + + if (stable.calend.adjdelta < 0) { + uint32_t t32; + + if (now > stable.calend.adjstart) { + t32 = (uint32_t)(now - stable.calend.adjstart); + + if (t32 > stable.calend.adjoffset) + now -= stable.calend.adjoffset; + else + now = stable.calend.adjstart; + } + } + + now += stable.calend.offset; + + absolutetime_to_microtime(now, secs, nanosecs); + *nanosecs *= NSEC_PER_USEC; + + *secs += (clock_sec_t)stable.calend.epoch; +} + +static void +clock_track_calend_nowait(void) { + int i; + + for (i = 0; i < 2; i++) { + struct clock_calend tmp = clock_calend; + + /* + * Set the low bit if the generation count; since we use a + * barrier instruction to do this, we are guaranteed that this + * will flag an update in progress to an async caller trying + * to examine the contents. + */ + (void)hw_atomic_or(&flipflop[i].gen, 1); - IOKitResetTime(); + flipflop[i].calend = tmp; + + /* + * Increment the generation count to clear the low bit to + * signal completion. If a caller compares the generation + * count after taking a copy while in progress, the count + * will be off by two. + */ + (void)hw_atomic_add(&flipflop[i].gen, 1); + } } + +#endif /* CONFIG_DTRACE */ +