xnu-4570.1.46.tar.gz

[apple/xnu.git] / osfmk / arm / machine_routines.h
diff --git a/osfmk/arm/machine_routines.h b/osfmk/arm/machine_routines.h

new file mode 100644 (file)

index 0000000..3510649
--- /dev/null
+++ b/osfmk/arm/machine_routines.h
@@ -0,0 +1,884 @@
+/*
+ * Copyright (c) 2007-2015 Apple Inc. All rights reserved.
+ *
+ * @APPLE_OSREFERENCE_LICENSE_HEADER_START@
+ *
+ * This file contains Original Code and/or Modifications of Original Code
+ * as defined in and that are subject to the Apple Public Source License
+ * Version 2.0 (the 'License'). You may not use this file except in
+ * compliance with the License. The rights granted to you under the License
+ * may not be used to create, or enable the creation or redistribution of,
+ * unlawful or unlicensed copies of an Apple operating system, or to
+ * circumvent, violate, or enable the circumvention or violation of, any
+ * terms of an Apple operating system software license agreement.
+ *
+ * Please obtain a copy of the License at
+ * http://www.opensource.apple.com/apsl/ and read it before using this file.
+ *
+ * The Original Code and all software distributed under the License are
+ * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
+ * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
+ * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
+ * Please see the License for the specific language governing rights and
+ * limitations under the License.
+ *
+ * @APPLE_OSREFERENCE_LICENSE_HEADER_END@
+ */
+/*
+ * @OSF_COPYRIGHT@
+ */
+
+#ifndef        _ARM_MACHINE_ROUTINES_H_
+#define        _ARM_MACHINE_ROUTINES_H_
+
+#include <mach/mach_types.h>
+#include <mach/boolean.h>
+#include <kern/kern_types.h>
+#include <pexpert/pexpert.h>
+
+#include <sys/cdefs.h>
+#include <sys/appleapiopts.h>
+
+#include <stdarg.h>
+
+__BEGIN_DECLS
+
+/* Interrupt handling */
+
+void ml_cpu_signal(unsigned int cpu_id);
+void ml_cpu_signal_deferred_adjust_timer(uint64_t nanosecs);
+uint64_t ml_cpu_signal_deferred_get_timer(void);
+void ml_cpu_signal_deferred(unsigned int cpu_id);
+void ml_cpu_signal_retract(unsigned int cpu_id);
+
+/* Initialize Interrupts */
+void    ml_init_interrupt(void);
+
+/* Get Interrupts Enabled */
+boolean_t ml_get_interrupts_enabled(void);
+
+/* Set Interrupts Enabled */
+boolean_t ml_set_interrupts_enabled(boolean_t enable);
+
+/* Check if running at interrupt context */
+boolean_t ml_at_interrupt_context(void);
+
+/* Generate a fake interrupt */
+void ml_cause_interrupt(void);
+
+/* Clear interrupt spin debug state for thread */
+#if INTERRUPT_MASKED_DEBUG
+void ml_spin_debug_reset(thread_t thread);
+void ml_spin_debug_clear(thread_t thread);
+void ml_spin_debug_clear_self(void);
+void ml_check_interrupts_disabled_duration(thread_t thread);
+#endif
+
+#ifdef XNU_KERNEL_PRIVATE
+extern boolean_t ml_is_quiescing(void);
+extern void ml_set_is_quiescing(boolean_t);
+extern uint64_t ml_get_booter_memory_size(void);
+#endif
+
+/* Type for the Time Base Enable function */
+typedef void (*time_base_enable_t)(cpu_id_t cpu_id, boolean_t enable);
+#if MACH_KERNEL_PRIVATE
+/* Type for the Processor Cache Dispatch function */
+typedef void (*cache_dispatch_t)(cpu_id_t cpu_id, unsigned int select, unsigned int param0, unsigned int param1);
+#endif
+
+#define CacheConfig                    0x00000000UL
+#define CacheControl                   0x00000001UL
+#define CacheClean                     0x00000002UL
+#define CacheCleanRegion               0x00000003UL
+#define CacheCleanFlush                        0x00000004UL
+#define CacheCleanFlushRegion          0x00000005UL
+#define CacheShutdown                  0x00000006UL
+
+#define CacheControlEnable             0x00000000UL
+
+#define CacheConfigCCSIDR              0x00000001UL
+#define CacheConfigSize                        0x00000100UL
+
+/* Type for the Processor Idle function */
+typedef void (*processor_idle_t)(cpu_id_t cpu_id, boolean_t enter, uint64_t *new_timeout_ticks);
+
+/* Type for the Idle Tickle function */
+typedef void (*idle_tickle_t)(void);
+
+/* Type for the Idle Timer function */
+typedef void (*idle_timer_t)(void *refcon, uint64_t *new_timeout_ticks);
+
+/* Type for the IPI Hander */
+typedef void (*ipi_handler_t)(void);
+
+/* Type for the Lockdown Hander */
+typedef void (*lockdown_handler_t)(void *);
+
+/* Type for the Platform specific Error Handler */
+typedef void (*platform_error_handler_t)(void *refcon, vm_offset_t fault_addr);
+
+/*
+ * The exception callback (ex_cb) module allows kernel drivers to 
+ * register and receive callbacks for exceptions, and indicate 
+ * actions to be taken by the platform kernel
+ * Currently this is supported for ARM64 but extending support for ARM32 
+ * should be straightforward
+ */
+
+/* Supported exception classes for callbacks */
+typedef enum
+{
+       EXCB_CLASS_ILLEGAL_INSTR_SET,
+       EXCB_CLASS_MAX          // this must be last
+}
+ex_cb_class_t;
+
+/* Actions indicated by callbacks to be taken by platform kernel */
+typedef enum
+{
+       EXCB_ACTION_RERUN,      // re-run the faulting instruction
+       EXCB_ACTION_NONE,       // continue normal exception handling
+}
+ex_cb_action_t;
+
+/* 
+ * Exception state 
+ * We cannot use a private kernel data structure such as arm_saved_state_t 
+ * The CPSR and ESR are not clobbered when the callback function is invoked so 
+ * those registers can be examined by the callback function;
+ * the same is done in the platform error handlers
+ */
+typedef struct 
+{
+       vm_offset_t far;
+}
+ex_cb_state_t;
+
+/* callback type definition */
+typedef ex_cb_action_t (*ex_cb_t) (
+       ex_cb_class_t           cb_class,
+       void                            *refcon,// provided at registration 
+       const ex_cb_state_t     *state  // exception state
+       );
+
+/* 
+ * Callback registration 
+ * Currently we support only one registered callback per class but 
+ * it should be possible to support more callbacks
+ */
+kern_return_t ex_cb_register(
+       ex_cb_class_t   cb_class, 
+       ex_cb_t                 cb,
+       void                    *refcon );
+
+/*
+ * Called internally by platform kernel to invoke the registered callback for class
+ */
+ex_cb_action_t ex_cb_invoke(
+       ex_cb_class_t   cb_class,
+    vm_offset_t                far);
+
+
+void ml_parse_cpu_topology(void);
+
+unsigned int ml_get_cpu_count(void);
+
+int ml_get_boot_cpu_number(void);
+
+int ml_get_cpu_number(uint32_t phys_id);
+
+int ml_get_max_cpu_number(void);
+
+/* Struct for ml_cpu_get_info */
+struct ml_cpu_info {
+       unsigned long           vector_unit;
+       unsigned long           cache_line_size;
+       unsigned long           l1_icache_size;
+       unsigned long           l1_dcache_size;
+       unsigned long           l2_settings;
+       unsigned long           l2_cache_size;
+       unsigned long           l3_settings;
+       unsigned long           l3_cache_size;
+};
+typedef struct ml_cpu_info ml_cpu_info_t;
+
+typedef enum {
+       CLUSTER_TYPE_SMP,
+} cluster_type_t;
+
+cluster_type_t ml_get_boot_cluster(void);
+
+/* Struct for ml_processor_register */
+struct ml_processor_info {
+       cpu_id_t                        cpu_id;
+       vm_offset_t                     start_paddr;
+       boolean_t                       supports_nap;
+       void                            *platform_cache_dispatch;
+       time_base_enable_t              time_base_enable;
+       processor_idle_t                processor_idle;
+       idle_tickle_t                   *idle_tickle;
+       idle_timer_t                    idle_timer;
+       void                            *idle_timer_refcon;
+       vm_offset_t                     powergate_stub_addr;
+       uint32_t                        powergate_stub_length;
+       uint32_t                        powergate_latency;
+       platform_error_handler_t        platform_error_handler;
+       uint64_t                        regmap_paddr;
+       uint32_t                        phys_id;
+       uint32_t                        log_id;
+       uint32_t                        l2_access_penalty;
+       uint32_t                        cluster_id;
+       cluster_type_t                  cluster_type;
+       uint32_t                        l2_cache_id;
+       uint32_t                        l2_cache_size;
+       uint32_t                        l3_cache_id;
+       uint32_t                        l3_cache_size;
+};
+typedef struct ml_processor_info ml_processor_info_t;
+
+#if    defined(PEXPERT_KERNEL_PRIVATE) || defined(MACH_KERNEL_PRIVATE)
+/* Struct for ml_init_timebase */
+struct  tbd_ops {
+       void            (*tbd_fiq_handler)(void);
+       uint32_t        (*tbd_get_decrementer)(void);
+       void            (*tbd_set_decrementer)(uint32_t dec_value);
+};
+typedef struct tbd_ops        *tbd_ops_t;
+typedef struct tbd_ops        tbd_ops_data_t;
+#endif
+
+/* Register a processor */                      
+kern_return_t  ml_processor_register(
+       ml_processor_info_t     *ml_processor_info,
+       processor_t                     *processor,
+       ipi_handler_t           *ipi_handler);
+
+/* Register a lockdown handler */
+kern_return_t ml_lockdown_handler_register(lockdown_handler_t, void *);
+
+#if XNU_KERNEL_PRIVATE
+void ml_lockdown_init(void);
+
+/* Check if the machine layer wants to intercept a panic call */
+boolean_t ml_wants_panic_trap_to_debugger(void);
+
+/* Machine layer routine for intercepting panics */
+void ml_panic_trap_to_debugger(const char *panic_format_str,
+                               va_list *panic_args,
+                               unsigned int reason,
+                               void *ctx,
+                               uint64_t panic_options_mask,
+                               unsigned long panic_caller);
+#endif /* XNU_KERNEL_PRIVATE */
+
+/* Initialize Interrupts */
+void ml_install_interrupt_handler(
+    void *nub,
+    int source,
+    void *target,
+    IOInterruptHandler handler,
+    void *refCon);
+
+vm_offset_t
+ml_static_vtop(
+       vm_offset_t);
+
+vm_offset_t
+ml_static_ptovirt(
+       vm_offset_t);
+
+/* Offset required to obtain absolute time value from tick counter */
+uint64_t ml_get_abstime_offset(void);
+
+/* Offset required to obtain continuous time value from tick counter */
+uint64_t ml_get_conttime_offset(void);
+
+#ifdef __APPLE_API_UNSTABLE
+/* PCI config cycle probing */
+boolean_t ml_probe_read(
+       vm_offset_t paddr,
+       unsigned int *val);
+boolean_t ml_probe_read_64(
+       addr64_t paddr,
+       unsigned int *val);
+
+/* Read physical address byte */
+unsigned int ml_phys_read_byte(
+       vm_offset_t paddr);
+unsigned int ml_phys_read_byte_64(
+       addr64_t paddr);
+
+/* Read physical address half word */
+unsigned int ml_phys_read_half(
+       vm_offset_t paddr);
+unsigned int ml_phys_read_half_64(
+       addr64_t paddr);
+
+/* Read physical address word*/
+unsigned int ml_phys_read(
+       vm_offset_t paddr);
+unsigned int ml_phys_read_64(
+       addr64_t paddr);
+unsigned int ml_phys_read_word(
+       vm_offset_t paddr);
+unsigned int ml_phys_read_word_64(
+       addr64_t paddr);
+
+unsigned long long ml_io_read(uintptr_t iovaddr, int iovsz);
+unsigned int ml_io_read8(uintptr_t iovaddr);
+unsigned int ml_io_read16(uintptr_t iovaddr);
+unsigned int ml_io_read32(uintptr_t iovaddr);
+unsigned long long ml_io_read64(uintptr_t iovaddr);
+
+/* Read physical address double word */
+unsigned long long ml_phys_read_double(
+       vm_offset_t paddr);
+unsigned long long ml_phys_read_double_64(
+       addr64_t paddr);
+
+/* Write physical address byte */
+void ml_phys_write_byte(
+       vm_offset_t paddr, unsigned int data);
+void ml_phys_write_byte_64(
+       addr64_t paddr, unsigned int data);
+
+/* Write physical address half word */
+void ml_phys_write_half(
+       vm_offset_t paddr, unsigned int data);
+void ml_phys_write_half_64(
+       addr64_t paddr, unsigned int data);
+
+/* Write physical address word */
+void ml_phys_write(
+       vm_offset_t paddr, unsigned int data);
+void ml_phys_write_64(
+       addr64_t paddr, unsigned int data);
+void ml_phys_write_word(
+       vm_offset_t paddr, unsigned int data);
+void ml_phys_write_word_64(
+       addr64_t paddr, unsigned int data);
+
+/* Write physical address double word */
+void ml_phys_write_double(
+       vm_offset_t paddr, unsigned long long data);
+void ml_phys_write_double_64(
+       addr64_t paddr, unsigned long long data);
+
+void ml_static_mfree(
+       vm_offset_t,
+       vm_size_t);
+
+kern_return_t
+ml_static_protect(
+    vm_offset_t start,
+    vm_size_t size,
+    vm_prot_t new_prot);
+
+/* virtual to physical on wired pages */
+vm_offset_t ml_vtophys(
+       vm_offset_t vaddr);
+
+/* Get processor info */
+void ml_cpu_get_info(ml_cpu_info_t *ml_cpu_info);
+
+#endif /* __APPLE_API_UNSTABLE */
+
+#ifdef __APPLE_API_PRIVATE
+#ifdef XNU_KERNEL_PRIVATE
+vm_size_t ml_nofault_copy(
+       vm_offset_t virtsrc, 
+       vm_offset_t virtdst, 
+       vm_size_t size);
+boolean_t ml_validate_nofault(
+       vm_offset_t virtsrc, vm_size_t size);
+#endif /* XNU_KERNEL_PRIVATE */
+#if    defined(PEXPERT_KERNEL_PRIVATE) || defined(MACH_KERNEL_PRIVATE)
+/* IO memory map services */
+
+/* Map memory map IO space */
+vm_offset_t ml_io_map(
+       vm_offset_t phys_addr, 
+       vm_size_t size);
+
+vm_offset_t ml_io_map_wcomb(
+       vm_offset_t phys_addr, 
+       vm_size_t size);
+
+void ml_get_bouncepool_info(
+       vm_offset_t *phys_addr,
+       vm_size_t   *size);
+
+vm_map_address_t ml_map_high_window(
+       vm_offset_t     phys_addr,
+       vm_size_t       len);
+
+/* boot memory allocation */
+vm_offset_t ml_static_malloc(
+       vm_size_t size);
+
+void ml_init_timebase(
+       void            *args,
+       tbd_ops_t       tbd_funcs,
+       vm_offset_t     int_address,
+       vm_offset_t     int_value);
+
+uint64_t ml_get_timebase(void);
+
+void ml_init_lock_timeout(void);
+
+boolean_t ml_delay_should_spin(uint64_t interval);
+
+uint32_t ml_get_decrementer(void);
+
+#if !CONFIG_SKIP_PRECISE_USER_KERNEL_TIME
+void timer_state_event_user_to_kernel(void);
+void timer_state_event_kernel_to_user(void);
+#endif /* !CONFIG_SKIP_PRECISE_USER_KERNEL_TIME */
+
+uint64_t ml_get_hwclock(void);
+
+#ifdef __arm64__
+boolean_t ml_get_timer_pending(void);
+#endif
+
+void platform_syscall(
+       struct arm_saved_state *);
+
+void ml_set_decrementer(
+       uint32_t dec_value);
+
+boolean_t is_user_contex(
+       void);
+
+void ml_init_arm_debug_interface(void *args, vm_offset_t virt_address);
+
+/* These calls are only valid if __ARM_USER_PROTECT__ is defined */
+uintptr_t arm_user_protect_begin(
+                                 thread_t thread);
+
+void arm_user_protect_end(
+                          thread_t thread,
+                          uintptr_t up,
+                          boolean_t disable_interrupts);
+
+#endif /* PEXPERT_KERNEL_PRIVATE || MACH_KERNEL_PRIVATE  */
+
+/* Zero bytes starting at a physical address */
+void bzero_phys(
+       addr64_t phys_address,
+       vm_size_t length);
+
+void bzero_phys_nc(addr64_t src64, vm_size_t bytes);
+
+void ml_thread_policy(
+       thread_t thread,
+       unsigned policy_id,
+       unsigned policy_info);
+
+#define MACHINE_GROUP                                  0x00000001
+#define MACHINE_NETWORK_GROUP                  0x10000000
+#define MACHINE_NETWORK_WORKLOOP               0x00000001
+#define MACHINE_NETWORK_NETISR                 0x00000002
+
+/* Initialize the maximum number of CPUs */
+void ml_init_max_cpus(
+       unsigned int max_cpus);
+
+/* Return the maximum number of CPUs set by ml_init_max_cpus() */
+unsigned int ml_get_max_cpus(
+       void);
+
+/* Return the maximum memory size */
+unsigned int ml_get_machine_mem(void);
+
+#ifdef XNU_KERNEL_PRIVATE
+/* Return max offset */
+vm_map_offset_t ml_get_max_offset(
+       boolean_t       is64,
+       unsigned int option);
+#define MACHINE_MAX_OFFSET_DEFAULT     0x01
+#define MACHINE_MAX_OFFSET_MIN         0x02
+#define MACHINE_MAX_OFFSET_MAX         0x04
+#define MACHINE_MAX_OFFSET_DEVICE      0x08
+#endif
+
+extern void    ml_cpu_up(void);
+extern void    ml_cpu_down(void);
+extern void    ml_arm_sleep(void);
+
+extern uint64_t ml_get_wake_timebase(void);
+extern uint64_t ml_get_conttime_wake_time(void);
+
+/* Time since the system was reset (as part of boot/wake) */
+uint64_t ml_get_time_since_reset(void);
+
+#ifdef XNU_KERNEL_PRIVATE
+/* Just a stub on ARM */
+extern kern_return_t ml_interrupt_prewarm(uint64_t deadline);
+#define TCOAL_DEBUG(x, a, b, c, d, e) do { } while(0)
+#endif /* XNU_KERNEL_PRIVATE */
+
+/* Bytes available on current stack */
+vm_offset_t ml_stack_remaining(void);
+
+#ifdef MACH_KERNEL_PRIVATE
+uint32_t       get_fpscr(void);
+void           set_fpscr(uint32_t);
+
+extern void            init_vfp(void);
+extern boolean_t       get_vfp_enabled(void);
+#if     (__ARM_VFP__ >= 3)
+extern unsigned int    get_mvfr0(void);
+extern unsigned int    get_mvfr1(void);
+#endif
+extern void            arm_debug_set_cp14(arm_debug_state_t *debug_state);
+extern void            fiq_context_init(boolean_t enable_fiq);
+
+extern void            reenable_async_aborts(void);
+extern void            cpu_idle_wfi(boolean_t wfi_fast);
+
+#ifdef MONITOR
+#define MONITOR_SET_ENTRY      0x800   /* Set kernel entry point from monitor */
+#define MONITOR_LOCKDOWN       0x801   /* Enforce kernel text/rodata integrity */
+unsigned long          monitor_call(uintptr_t callnum, uintptr_t arg1,
+                                    uintptr_t arg2, uintptr_t arg3);
+#endif /* MONITOR */
+
+#if defined(KERNEL_INTEGRITY_KTRR)
+void rorgn_stash_range(void);
+void rorgn_lockdown(void);
+#endif /* defined(KERNEL_INTEGRITY_KTRR)*/
+
+#endif /* MACH_KERNEL_PRIVATE */
+
+extern uint32_t        arm_debug_read_dscr(void);
+
+extern int     set_be_bit(void);
+extern int     clr_be_bit(void);
+extern int     be_tracing(void);
+
+typedef void (*broadcastFunc) (void *);
+unsigned int cpu_broadcast_xcall(uint32_t *, boolean_t, broadcastFunc, void *);
+kern_return_t cpu_xcall(int, broadcastFunc, void *);
+
+#ifdef  KERNEL_PRIVATE
+
+/* Interface to be used by the perf. controller to register a callback, in a
+ * single-threaded fashion. The callback will receive notifications of
+ * processor performance quality-of-service changes from the scheduler.
+ */
+
+#ifdef __arm64__
+typedef void (*cpu_qos_update_t)(int throughput_qos, uint64_t qos_param1, uint64_t qos_param2);
+void cpu_qos_update_register(cpu_qos_update_t);
+#endif /* __arm64__ */
+
+struct going_on_core {
+       uint64_t        thread_id;
+       uint16_t        qos_class;
+       uint16_t        urgency;        /* XCPM compatibility */
+       uint32_t        is_32_bit : 1; /* uses 32-bit ISA/register state in userspace (which may differ from address space size) */
+       uint32_t        is_kernel_thread : 1;
+       uint64_t        thread_group_id;
+       void            *thread_group_data;
+       uint64_t        scheduling_latency;     /* absolute time between when thread was made runnable and this ctx switch */
+       uint64_t        start_time;
+       uint64_t        scheduling_latency_at_same_basepri;
+       uint32_t        energy_estimate_nj;     /* return: In nanojoules */
+        /* smaller of the time between last change to base priority and ctx switch and scheduling_latency */
+};
+typedef struct going_on_core *going_on_core_t;
+
+struct going_off_core {
+       uint64_t        thread_id;
+       uint32_t        energy_estimate_nj;     /* return: In nanojoules */
+       uint32_t        reserved;
+       uint64_t        end_time;
+       uint64_t        thread_group_id;
+       void            *thread_group_data;
+};
+typedef struct going_off_core *going_off_core_t;
+
+struct thread_group_data {
+       uint64_t        thread_group_id;
+       void            *thread_group_data;
+       uint32_t        thread_group_size;
+       uint32_t        thread_group_flags;
+};
+typedef struct thread_group_data *thread_group_data_t;
+
+struct perfcontrol_max_runnable_latency {
+       uint64_t        max_scheduling_latencies[4 /* THREAD_URGENCY_MAX */];
+};
+typedef struct perfcontrol_max_runnable_latency *perfcontrol_max_runnable_latency_t;
+
+struct perfcontrol_work_interval {
+       uint64_t        thread_id;
+       uint16_t        qos_class;
+       uint16_t        urgency;
+       uint32_t        flags; // notify
+       uint64_t        work_interval_id;
+       uint64_t        start;
+       uint64_t        finish;
+       uint64_t        deadline;
+       uint64_t        next_start;
+       uint64_t        thread_group_id;
+       void            *thread_group_data;
+       uint32_t        create_flags;
+};
+typedef struct perfcontrol_work_interval *perfcontrol_work_interval_t;
+
+
+/* 
+ * Structure to export per-CPU counters as part of the CLPC callout. 
+ * Contains only the fixed CPU counters (instructions and cycles); CLPC 
+ * would call back into XNU to get the configurable counters if needed. 
+ */
+struct perfcontrol_cpu_counters {
+       uint64_t        instructions;
+       uint64_t        cycles;
+};
+
+/*
+ * Structure used to pass information about a thread to CLPC
+ */
+struct perfcontrol_thread_data {
+       /*
+        * Energy estimate (return value)
+        * The field is populated by CLPC and used to update the 
+        * energy estimate of the thread
+        */
+       uint32_t            energy_estimate_nj;
+       /* Perfcontrol class for thread */
+       perfcontrol_class_t perfctl_class;
+       /* Thread ID for the thread */
+       uint64_t            thread_id;
+       /* Thread Group ID */
+       uint64_t            thread_group_id;
+       /* 
+        * Scheduling latency for threads at the same base priority. 
+        * Calculated by the scheduler and passed into CLPC. The field is 
+        * populated only in the thread_data structure for the thread 
+        * going on-core. 
+        */
+       uint64_t            scheduling_latency_at_same_basepri;
+       /* Thread Group data pointer */
+       void                *thread_group_data;
+       /* perfctl state pointer */
+       void                *perfctl_state;
+};
+
+/*
+ * All callouts from the scheduler are executed with interrupts
+ * disabled. Callouts should be implemented in C with minimal
+ * abstractions, and only use KPI exported by the mach/libkern
+ * symbolset, restricted to routines like spinlocks and atomic
+ * operations and scheduler routines as noted below. Spinlocks that
+ * are used to synchronize data in the perfcontrol_state_t should only
+ * ever be acquired with interrupts disabled, to avoid deadlocks where
+ * an quantum expiration timer interrupt attempts to perform a callout
+ * that attempts to lock a spinlock that is already held.
+ */
+
+/*
+ * When a processor is switching between two threads (after the
+ * scheduler has chosen a new thread), the low-level platform layer
+ * will call this routine, which should perform required timestamps,
+ * MMIO register reads, or other state switching. No scheduler locks
+ * are held during this callout.
+ *
+ * This function is called with interrupts ENABLED.
+ */
+typedef void (*sched_perfcontrol_context_switch_t)(perfcontrol_state_t, perfcontrol_state_t);
+
+/*
+ * Once the processor has switched to the new thread, the offcore
+ * callout will indicate the old thread that is no longer being
+ * run. The thread's scheduler lock is held, so it will not begin
+ * running on another processor (in the case of preemption where it
+ * remains runnable) until it completes. If the "thread_terminating"
+ * boolean is TRUE, this will be the last callout for this thread_id.
+ */
+typedef void (*sched_perfcontrol_offcore_t)(perfcontrol_state_t, going_off_core_t /* populated by callee */, boolean_t);
+
+/*
+ * After the offcore callout and after the old thread can potentially
+ * start running on another processor, the oncore callout will be
+ * called with the thread's scheduler lock held. The oncore callout is
+ * also called any time one of the parameters in the going_on_core_t
+ * structure changes, like priority/QoS changes, and quantum
+ * expiration, so the callout must not assume callouts are paired with
+ * offcore callouts.
+ */
+typedef void (*sched_perfcontrol_oncore_t)(perfcontrol_state_t, going_on_core_t);
+
+/*
+ * Periodically (on hundreds of ms scale), the scheduler will perform
+ * maintenance and report the maximum latency for runnable (but not currently
+ * running) threads for each urgency class.
+ */
+typedef void (*sched_perfcontrol_max_runnable_latency_t)(perfcontrol_max_runnable_latency_t);
+
+/*
+ * When the kernel receives information about work intervals from userland,
+ * it is passed along using this callback. No locks are held, although the state
+ * object will not go away during the callout.
+ */
+typedef void (*sched_perfcontrol_work_interval_notify_t)(perfcontrol_state_t, perfcontrol_work_interval_t);
+
+/*
+ * These callbacks are used when thread groups are added, removed or properties
+ * updated.
+ * No blocking allocations (or anything else blocking) are allowed inside these
+ * callbacks. No locks allowed in these callbacks as well since the kernel might
+ * be holding the thread/task locks.
+ */
+typedef void (*sched_perfcontrol_thread_group_init_t)(thread_group_data_t);
+typedef void (*sched_perfcontrol_thread_group_deinit_t)(thread_group_data_t);
+typedef void (*sched_perfcontrol_thread_group_flags_update_t)(thread_group_data_t);
+
+/*
+ * Sometime after the timeout set by sched_perfcontrol_update_callback_deadline has passed,
+ * this function will be called, passing the timeout deadline that was previously armed as an argument.
+ *
+ * This is called inside context-switch/quantum-interrupt context and must follow the safety rules for that context.
+ */
+typedef void (*sched_perfcontrol_deadline_passed_t)(uint64_t deadline);
+
+/*
+ * Context Switch Callout
+ * 
+ * Parameters:
+ * event        - The perfcontrol_event for this callout
+ * cpu_id       - The CPU doing the context switch
+ * timestamp    - The timestamp for the context switch
+ * flags        - Flags for other relevant information
+ * offcore      - perfcontrol_data structure for thread going off-core
+ * oncore       - perfcontrol_data structure for thread going on-core
+ * cpu_counters - perfcontrol_cpu_counters for the CPU doing the switch
+ */
+typedef void (*sched_perfcontrol_csw_t)(
+       perfcontrol_event event, uint32_t cpu_id, uint64_t timestamp, uint32_t flags,
+       struct perfcontrol_thread_data *offcore, struct perfcontrol_thread_data *oncore,
+       struct perfcontrol_cpu_counters *cpu_counters, __unused void *unused);
+
+
+/*
+ * Thread State Update Callout
+ *
+ * Parameters:
+ * event        - The perfcontrol_event for this callout
+ * cpu_id       - The CPU doing the state update
+ * timestamp    - The timestamp for the state update
+ * flags        - Flags for other relevant information
+ * thr_data     - perfcontrol_data structure for the thread being updated
+ */
+typedef void (*sched_perfcontrol_state_update_t)(
+       perfcontrol_event event, uint32_t cpu_id, uint64_t timestamp, uint32_t flags,
+       struct perfcontrol_thread_data *thr_data, __unused void *unused);
+
+
+/*
+ * Callers should always use the CURRENT version so that the kernel can detect both older
+ * and newer structure layouts. New callbacks should always be added at the end of the
+ * structure, and xnu should expect existing source recompiled against newer headers
+ * to pass NULL for unimplemented callbacks. Pass NULL as the as the callbacks parameter
+ * to reset callbacks to their default in-kernel values.
+ */
+
+#define SCHED_PERFCONTROL_CALLBACKS_VERSION_0 (0) /* up-to oncore */
+#define SCHED_PERFCONTROL_CALLBACKS_VERSION_1 (1) /* up-to max_runnable_latency */
+#define SCHED_PERFCONTROL_CALLBACKS_VERSION_2 (2) /* up-to work_interval_notify */
+#define SCHED_PERFCONTROL_CALLBACKS_VERSION_3 (3) /* up-to thread_group_deinit */
+#define SCHED_PERFCONTROL_CALLBACKS_VERSION_4 (4) /* up-to deadline_passed */
+#define SCHED_PERFCONTROL_CALLBACKS_VERSION_5 (5) /* up-to state_update */
+#define SCHED_PERFCONTROL_CALLBACKS_VERSION_6 (6) /* up-to thread_group_flags_update */
+#define SCHED_PERFCONTROL_CALLBACKS_VERSION_CURRENT SCHED_PERFCONTROL_CALLBACKS_VERSION_6
+
+struct sched_perfcontrol_callbacks {
+       unsigned long version; /* Use SCHED_PERFCONTROL_CALLBACKS_VERSION_CURRENT */
+       sched_perfcontrol_offcore_t                   offcore;
+       sched_perfcontrol_context_switch_t            context_switch;
+       sched_perfcontrol_oncore_t                    oncore;
+       sched_perfcontrol_max_runnable_latency_t      max_runnable_latency;
+       sched_perfcontrol_work_interval_notify_t      work_interval_notify;
+       sched_perfcontrol_thread_group_init_t         thread_group_init;
+       sched_perfcontrol_thread_group_deinit_t       thread_group_deinit;
+       sched_perfcontrol_deadline_passed_t           deadline_passed;
+       sched_perfcontrol_csw_t                       csw;
+       sched_perfcontrol_state_update_t              state_update;
+       sched_perfcontrol_thread_group_flags_update_t thread_group_flags_update;
+};
+typedef struct sched_perfcontrol_callbacks *sched_perfcontrol_callbacks_t;
+
+extern void sched_perfcontrol_register_callbacks(sched_perfcontrol_callbacks_t callbacks, unsigned long size_of_state);
+
+/*
+ * Update the scheduler with the set of cores that should be used to dispatch new threads.
+ * Non-recommended cores can still be used to field interrupts or run bound threads.
+ * This should be called with interrupts enabled and no scheduler locks held.
+ */
+#define ALL_CORES_RECOMMENDED  (~(uint32_t)0)
+
+extern void sched_perfcontrol_update_recommended_cores(uint32_t recommended_cores);
+extern void sched_perfcontrol_thread_group_recommend(void *data, cluster_type_t recommendation);
+
+/*
+ * Update the deadline after which sched_perfcontrol_deadline_passed will be called.
+ * Returns TRUE if it successfully canceled a previously set callback,
+ * and FALSE if it did not (i.e. one wasn't set, or callback already fired / is in flight).
+ * The callback is automatically canceled when it fires, and does not repeat unless rearmed.
+ *
+ * This 'timer' executes as the scheduler switches between threads, on a non-idle core
+ *
+ * There can be only one outstanding timer globally.
+ */
+extern boolean_t sched_perfcontrol_update_callback_deadline(uint64_t deadline);
+
+typedef enum perfcontrol_callout_type {
+    PERFCONTROL_CALLOUT_ON_CORE,
+    PERFCONTROL_CALLOUT_OFF_CORE,
+    PERFCONTROL_CALLOUT_CONTEXT,
+    PERFCONTROL_CALLOUT_STATE_UPDATE,
+    /* Add other callout types here */
+    PERFCONTROL_CALLOUT_MAX
+} perfcontrol_callout_type_t;
+
+typedef enum perfcontrol_callout_stat {
+    PERFCONTROL_STAT_INSTRS,
+    PERFCONTROL_STAT_CYCLES,
+    /* Add other stat types here */
+    PERFCONTROL_STAT_MAX
+} perfcontrol_callout_stat_t;
+
+uint64_t perfcontrol_callout_stat_avg(perfcontrol_callout_type_t type,
+       perfcontrol_callout_stat_t stat);
+
+
+#endif /* KERNEL_PRIVATE */
+
+boolean_t machine_timeout_suspended(void);
+void ml_get_power_state(boolean_t *, boolean_t *);
+
+boolean_t user_cont_hwclock_allowed(void);
+boolean_t user_timebase_allowed(void);
+boolean_t ml_thread_is64bit(thread_t thread);
+void ml_task_set_rop_pid(task_t task, task_t parent_task, boolean_t inherit);
+
+#ifdef __arm64__
+void ml_set_align_checking(void);
+boolean_t arm64_wfe_allowed(void);
+#endif /* __arm64__ */
+
+void ml_timer_evaluate(void);
+boolean_t ml_timer_forced_evaluation(void);
+uint64_t ml_energy_stat(thread_t);
+void ml_gpu_stat_update(uint64_t);
+uint64_t ml_gpu_stat(thread_t);
+#endif /* __APPLE_API_PRIVATE */
+
+__END_DECLS
+
+#endif /* _ARM_MACHINE_ROUTINES_H_ */