darling-xnu/osfmk/kern/remote_time.c
2023-05-16 21:41:14 -07:00

534 lines
18 KiB
C

/*
* Copyright (c) 2017-2020 Apple Inc. All rights reserved.
*
* @APPLE_OSREFERENCE_LICENSE_HEADER_START@
*
* This file contains Original Code and/or Modifications of Original Code
* as defined in and that are subject to the Apple Public Source License
* Version 2.0 (the 'License'). You may not use this file except in
* compliance with the License. The rights granted to you under the License
* may not be used to create, or enable the creation or redistribution of,
* unlawful or unlicensed copies of an Apple operating system, or to
* circumvent, violate, or enable the circumvention or violation of, any
* terms of an Apple operating system software license agreement.
*
* Please obtain a copy of the License at
* http://www.opensource.apple.com/apsl/ and read it before using this file.
*
* The Original Code and all software distributed under the License are
* distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
* EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
* INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
* Please see the License for the specific language governing rights and
* limitations under the License.
*
* @APPLE_OSREFERENCE_LICENSE_HEADER_END@
*/
#include <mach/mach_time.h>
#include <mach/clock_types.h>
#include <kern/misc_protos.h>
#include <kern/clock.h>
#include <kern/remote_time.h>
#include <kern/spl.h>
#include <kern/locks.h>
#include <sys/kdebug.h>
#include <machine/machine_routines.h>
#include <kern/assert.h>
#include <kern/kern_types.h>
#include <kern/thread.h>
#include <machine/commpage.h>
#include <machine/atomic.h>
LCK_GRP_DECLARE(bt_lck_grp, "bridge timestamp");
LCK_SPIN_DECLARE(bt_spin_lock, &bt_lck_grp);
LCK_SPIN_DECLARE(bt_ts_conversion_lock, &bt_lck_grp);
LCK_SPIN_DECLARE(bt_maintenance_lock, &bt_lck_grp);
#if CONFIG_MACH_BRIDGE_SEND_TIME
uint32_t bt_enable_flag = 0;
_Atomic uint32_t bt_init_flag = 0;
void mach_bridge_timer_maintenance(void);
uint32_t mach_bridge_timer_enable(uint32_t new_value, int change);
/*
* When CONFIG_MACH_BRIDGE_SEND_TIME is defined, it is expected
* that a machine-specific timestamp sending routine such as
* void mach_bridge_send_timestamp(uint64_t); has also been defined.
*/
extern void mach_bridge_send_timestamp(uint64_t);
void
mach_bridge_timer_maintenance(void)
{
if (!os_atomic_load(&bt_init_flag, acquire)) {
return;
}
lck_spin_lock(&bt_maintenance_lock);
if (!bt_enable_flag) {
goto done;
}
mach_bridge_send_timestamp(0);
done:
lck_spin_unlock(&bt_maintenance_lock);
}
/*
* If change = 0, return the current value of bridge_timer_enable
* If change = 1, update bridge_timer_enable and return the updated
* value
*/
uint32_t
mach_bridge_timer_enable(uint32_t new_value, int change)
{
uint32_t current_value = 0;
assert(os_atomic_load(&bt_init_flag, relaxed));
lck_spin_lock(&bt_maintenance_lock);
if (change) {
bt_enable_flag = new_value;
}
current_value = bt_enable_flag;
lck_spin_unlock(&bt_maintenance_lock);
return current_value;
}
#endif /* CONFIG_MACH_BRIDGE_SEND_TIME */
#if CONFIG_MACH_BRIDGE_RECV_TIME
#include <machine/machine_remote_time.h>
/*
* functions used by machine-specific code
* that implements CONFIG_MACH_BRIDGE_RECV_TIME
*/
void mach_bridge_add_timestamp(uint64_t remote_timestamp, uint64_t local_timestamp);
void bt_calibration_thread_start(void);
void bt_params_add(struct bt_params *params);
/* function called by sysctl */
struct bt_params bt_params_get_latest(void);
/*
* Platform specific bridge time receiving interface.
* These variables should be exported by the platform specific time receiving code.
*/
extern _Atomic uint32_t bt_init_flag;
static uint64_t received_local_timestamp = 0;
static uint64_t received_remote_timestamp = 0;
/*
* Buffer the previous timestamp pairs and rate
* It is protected by the bt_ts_conversion_lock
*/
#define BT_PARAMS_COUNT 10
static struct bt_params bt_params_hist[BT_PARAMS_COUNT] = {};
static int bt_params_idx = -1;
void
bt_params_add(struct bt_params *params)
{
lck_spin_assert(&bt_ts_conversion_lock, LCK_ASSERT_OWNED);
bt_params_idx = (bt_params_idx + 1) % BT_PARAMS_COUNT;
bt_params_hist[bt_params_idx] = *params;
}
#if defined(XNU_TARGET_OS_BRIDGE)
static inline struct bt_params*
bt_params_find(uint64_t local_ts)
{
lck_spin_assert(&bt_ts_conversion_lock, LCK_ASSERT_OWNED);
int idx = bt_params_idx;
if (idx < 0) {
return NULL;
}
do {
if (local_ts >= bt_params_hist[idx].base_local_ts) {
return &bt_params_hist[idx];
}
if (--idx < 0) {
idx = BT_PARAMS_COUNT - 1;
}
} while (idx != bt_params_idx);
return NULL;
}
#endif /* defined(XNU_TARGET_OS_BRIDGE) */
static inline struct bt_params
bt_params_get_latest_locked(void)
{
lck_spin_assert(&bt_ts_conversion_lock, LCK_ASSERT_OWNED);
struct bt_params latest_params = {};
if (bt_params_idx >= 0) {
latest_params = bt_params_hist[bt_params_idx];
}
return latest_params;
}
struct bt_params
bt_params_get_latest(void)
{
struct bt_params latest_params = {};
/* Check if ts_converison_lock has been initialized */
if (os_atomic_load(&bt_init_flag, acquire)) {
lck_spin_lock(&bt_ts_conversion_lock);
latest_params = bt_params_get_latest_locked();
lck_spin_unlock(&bt_ts_conversion_lock);
}
return latest_params;
}
/*
* Conditions: bt_spin_lock held and called from primary interrupt context
*/
void
mach_bridge_add_timestamp(uint64_t remote_timestamp, uint64_t local_timestamp)
{
lck_spin_assert(&bt_spin_lock, LCK_ASSERT_OWNED);
/* sleep/wake might return the same mach_absolute_time as the previous timestamp pair */
if ((received_local_timestamp == local_timestamp) ||
(received_remote_timestamp == remote_timestamp)) {
return;
}
received_local_timestamp = local_timestamp;
received_remote_timestamp = remote_timestamp;
thread_wakeup((event_t)bt_params_hist);
}
static double
mach_bridge_compute_rate(uint64_t new_local_ts, uint64_t new_remote_ts,
uint64_t old_local_ts, uint64_t old_remote_ts)
{
int64_t rdiff = (int64_t)new_remote_ts - (int64_t)old_remote_ts;
int64_t ldiff = (int64_t)new_local_ts - (int64_t)old_local_ts;
double calc_rate = ((double)rdiff) / (double)ldiff;
return calc_rate;
}
#define MAX_RECALCULATE_COUNT 8
#define CUMULATIVE_RATE_DECAY_CONSTANT 0.01
#define CUMULATIVE_RATE_WEIGHT 0.99
#define INITIAL_RATE 1.0
#define MIN_INITIAL_SAMPLE_COUNT 10
#define MAX_INITIAL_SAMPLE_COUNT 50
#define MAX_SKIP_RESET_COUNT 2
#define MIN_LOCAL_TS_DISTANCE_NS 100000000 /* 100 ms */
#define MAX_LOCAL_TS_DISTANCE_NS 350000000 /* 350 ms */
#define TS_PAIR_MISMATCH_THRESHOLD_NS 50000000 /* 50 ms */
#define MAX_TS_PAIR_MISMATCHES 5
#define MAX_TS_PAIR_MISMATCH_RESET_COUNT 3
#define MIN_OBSERVED_RATE 0.8
#define MAX_OBSERVED_RATE 1.2
static void
bt_calibration_thread(void)
{
static uint64_t prev_local_ts = 0, prev_remote_ts = 0, curr_local_ts = 0, curr_remote_ts = 0;
static uint64_t prev_received_local_ts = 0, prev_received_remote_ts = 0;
static double cumulative_rate = INITIAL_RATE;
static uint32_t initial_sample_count = 1;
static uint32_t max_initial_sample_count = MAX_INITIAL_SAMPLE_COUNT;
static uint32_t skip_reset_count = MAX_SKIP_RESET_COUNT;
int recalculate_count = 1;
static bool reset = false;
bool sleep = false;
static bool skip_rcv_ts = false;
static uint64_t ts_pair_mismatch = 0;
static uint32_t ts_pair_mismatch_reset_count = 0;
spl_t s = splsched();
lck_spin_lock(&bt_spin_lock);
if (!received_remote_timestamp) {
if (PE_parse_boot_argn("rt_ini_count", &max_initial_sample_count,
sizeof(uint32_t)) == TRUE) {
if (max_initial_sample_count < MIN_INITIAL_SAMPLE_COUNT) {
max_initial_sample_count = MIN_INITIAL_SAMPLE_COUNT;
}
}
/* Nothing to do the first time */
goto block;
}
/*
* The values in bt_params are recalculated every time a new timestamp
* pair is received. Firstly, both timestamps are converted to nanoseconds.
* The current and previous timestamp pairs are used to compute the
* observed_rate of the two clocks w.r.t each other. For the first
* MIN_INITIAL_SAMPLE_COUNT number of pairs, the cumulative_rate is a simple
* average of the observed_rate. For the later pairs, the cumulative_rate
* is updated using exponential moving average of the observed_rate.
* The current and bt_params' base timestamp pairs are used to compute
* the rate_from_base. This value ensures that the bt_params base
* timestamp pair curve doesn't stay parallel to the observed timestamp
* pair curve, rather moves in the direction of the observed timestamp curve.
* The bt_params.rate is computed as a weighted average of the cumulative_rate
* and the rate_from_base. For each current local timestamp, the remote_time
* is predicted using the previous values of bt_params. After computing the new
* bt_params.rate, bt_params.base_remote_time is set to this predicted value
* and bt_params.base_local_time is set to the current local timestamp.
*/
recalculate:
assertf(recalculate_count <= MAX_RECALCULATE_COUNT, "bt_caliberation_thread: recalculate \
invocation exceeds MAX_RECALCULATE_COUNT");
if ((received_remote_timestamp == BT_RESET_SENTINEL_TS) || (received_remote_timestamp == BT_WAKE_SENTINEL_TS)) {
KDBG(MACHDBG_CODE(DBG_MACH_CLOCK, MACH_BRIDGE_RESET_TS), received_local_timestamp, received_remote_timestamp, 1);
reset = true;
skip_reset_count = MAX_SKIP_RESET_COUNT;
ts_pair_mismatch_reset_count = 0;
goto block;
} else if (received_remote_timestamp == BT_SLEEP_SENTINEL_TS) {
sleep = true;
} else if (!received_local_timestamp) {
/* If the local timestamp isn't accurately captured, the received value will be ignored */
skip_rcv_ts = true;
goto block;
}
/* Keep a copy of the prev timestamps to compute distance */
prev_received_local_ts = curr_local_ts;
prev_received_remote_ts = curr_remote_ts;
uint64_t curr_local_abs = received_local_timestamp;
absolutetime_to_nanoseconds(curr_local_abs, &curr_local_ts);
curr_remote_ts = received_remote_timestamp;
/* Prevent unusual rate changes caused by delayed timestamps */
uint64_t local_diff = curr_local_ts - prev_received_local_ts;
if (!(reset || sleep) && ((local_diff < MIN_LOCAL_TS_DISTANCE_NS) ||
(!skip_rcv_ts && (local_diff > MAX_LOCAL_TS_DISTANCE_NS)))) {
/* Skip the current timestamp */
KDBG(MACHDBG_CODE(DBG_MACH_CLOCK, MACH_BRIDGE_SKIP_TS), curr_local_ts, curr_remote_ts,
prev_received_local_ts);
goto block;
} else {
skip_rcv_ts = false;
/* Use the prev copy of timestamps only if the distance is acceptable */
prev_local_ts = prev_received_local_ts;
prev_remote_ts = prev_received_remote_ts;
}
lck_spin_unlock(&bt_spin_lock);
splx(s);
struct bt_params bt_params = {};
lck_spin_lock(&bt_ts_conversion_lock);
if (reset) {
if (skip_reset_count > 0) {
KDBG(MACHDBG_CODE(DBG_MACH_CLOCK, MACH_BRIDGE_SKIP_TS), curr_local_ts, curr_remote_ts,
prev_local_ts, skip_reset_count);
skip_reset_count--;
goto skip_reset;
}
bt_params.base_local_ts = curr_local_ts;
bt_params.base_remote_ts = curr_remote_ts;
bt_params.rate = cumulative_rate;
prev_local_ts = 0;
prev_remote_ts = 0;
ts_pair_mismatch = 0;
initial_sample_count = 1;
reset = false;
KDBG(MACHDBG_CODE(DBG_MACH_CLOCK, MACH_BRIDGE_RESET_TS), curr_local_ts, curr_remote_ts, 2);
} else if (sleep) {
absolutetime_to_nanoseconds(mach_absolute_time(), &bt_params.base_local_ts);
bt_params.base_remote_ts = 0;
bt_params.rate = 0;
sleep = false;
} else {
struct bt_params bt_params_snapshot = {};
if (bt_params_idx >= 0) {
bt_params_snapshot = bt_params_hist[bt_params_idx];
}
lck_spin_unlock(&bt_ts_conversion_lock);
if (bt_params_snapshot.rate == 0.0) {
/*
* The rate should never be 0 because we always expect a reset/wake
* sentinel after sleep, followed by valid timestamp pair data that
* will be handled by the reset clause (above). However, we should
* not rely on a paired version of the remote OS - we could actually
* be running a completely different OS! Treat a timestamp after
* a sleep as a reset condition.
*/
reset = true;
skip_reset_count = MAX_SKIP_RESET_COUNT;
ts_pair_mismatch_reset_count = 0;
KDBG(MACHDBG_CODE(DBG_MACH_CLOCK, MACH_BRIDGE_RESET_TS), curr_local_ts, curr_remote_ts, 3);
s = splsched();
lck_spin_lock(&bt_spin_lock);
goto block;
}
/* Check if the predicted remote timestamp is within the expected current remote timestamp range */
uint64_t pred_remote_ts = mach_bridge_compute_timestamp(curr_local_ts, &bt_params_snapshot);
uint64_t diff = 0;
if (initial_sample_count >= max_initial_sample_count) {
if (pred_remote_ts > curr_remote_ts) {
diff = pred_remote_ts - curr_remote_ts;
} else {
diff = curr_remote_ts - pred_remote_ts;
}
if (diff > TS_PAIR_MISMATCH_THRESHOLD_NS) {
ts_pair_mismatch++;
KDBG(MACHDBG_CODE(DBG_MACH_CLOCK, MACH_BRIDGE_TS_MISMATCH), curr_local_ts,
curr_remote_ts, pred_remote_ts, ts_pair_mismatch);
} else {
ts_pair_mismatch = 0;
}
if (ts_pair_mismatch > MAX_TS_PAIR_MISMATCHES) {
#if (DEVELOPMENT || DEBUG)
if (ts_pair_mismatch_reset_count == MAX_TS_PAIR_MISMATCH_RESET_COUNT) {
panic("remote_time: timestamp pair mismatch exceeded limit");
}
#endif /* (DEVELOPMENT || DEBUG) */
reset = true;
ts_pair_mismatch_reset_count++;
KDBG(MACHDBG_CODE(DBG_MACH_CLOCK, MACH_BRIDGE_RESET_TS), curr_local_ts, curr_remote_ts, 4);
s = splsched();
lck_spin_lock(&bt_spin_lock);
goto block;
}
}
double observed_rate, rate_from_base, new_rate;
observed_rate = mach_bridge_compute_rate(curr_local_ts, curr_remote_ts, prev_local_ts, prev_remote_ts);
/* Log bad observed rates and skip the timestamp pair */
if ((observed_rate < MIN_OBSERVED_RATE) || (observed_rate > MAX_OBSERVED_RATE)) {
KDBG(MACHDBG_CODE(DBG_MACH_CLOCK, MACH_BRIDGE_OBSV_RATE), *(uint64_t *)((void *)&observed_rate));
ts_pair_mismatch = ts_pair_mismatch > 0 ? (ts_pair_mismatch - 1) : 0;
s = splsched();
lck_spin_lock(&bt_spin_lock);
goto block;
}
if (initial_sample_count <= MIN_INITIAL_SAMPLE_COUNT) {
initial_sample_count++;
cumulative_rate = cumulative_rate + (observed_rate - cumulative_rate) / initial_sample_count;
} else {
if (initial_sample_count < max_initial_sample_count) {
initial_sample_count++;
}
cumulative_rate = cumulative_rate + CUMULATIVE_RATE_DECAY_CONSTANT * (observed_rate - cumulative_rate);
}
rate_from_base = mach_bridge_compute_rate(curr_local_ts, curr_remote_ts, bt_params_snapshot.base_local_ts,
bt_params_snapshot.base_remote_ts);
new_rate = CUMULATIVE_RATE_WEIGHT * cumulative_rate + (1 - CUMULATIVE_RATE_WEIGHT) * rate_from_base;
/*
* Acquire the lock first to ensure that bt_params.base_local_ts is always
* greater than the last value of now captured by mach_bridge_remote_time.
* This ensures that we always use the same parameters to compute remote
* timestamp for a given local timestamp.
*/
lck_spin_lock(&bt_ts_conversion_lock);
absolutetime_to_nanoseconds(mach_absolute_time(), &bt_params.base_local_ts);
bt_params.base_remote_ts = mach_bridge_compute_timestamp(bt_params.base_local_ts, &bt_params_snapshot);
bt_params.rate = new_rate;
}
bt_params_add(&bt_params);
commpage_set_remotetime_params(bt_params.rate, bt_params.base_local_ts, bt_params.base_remote_ts);
KDBG(MACHDBG_CODE(DBG_MACH_CLOCK, MACH_BRIDGE_TS_PARAMS), bt_params.base_local_ts,
bt_params.base_remote_ts, *(uint64_t *)((void *)&bt_params.rate));
skip_reset:
lck_spin_unlock(&bt_ts_conversion_lock);
s = splsched();
lck_spin_lock(&bt_spin_lock);
/* Check if a new timestamp pair was received */
if (received_local_timestamp != curr_local_abs) {
recalculate_count++;
goto recalculate;
}
block:
assert_wait((event_t)bt_params_hist, THREAD_UNINT);
lck_spin_unlock(&bt_spin_lock);
splx(s);
thread_block((thread_continue_t)bt_calibration_thread);
}
void
bt_calibration_thread_start(void)
{
thread_t thread;
kern_return_t result = kernel_thread_start_priority((thread_continue_t)bt_calibration_thread,
NULL, BASEPRI_KERNEL, &thread);
if (result != KERN_SUCCESS) {
panic("mach_bridge_add_timestamp: thread_timestamp_calibration");
}
thread_deallocate(thread);
}
#endif /* CONFIG_MACH_BRIDGE_RECV_TIME */
/**
* mach_bridge_remote_time
*
* This function is used to predict the remote CPU's clock time, given
* the local time.
*
* If local_timestamp = 0, then the remote_timestamp is calculated
* corresponding to the current mach_absolute_time.
*
* If XNU_TARGET_OS_BRIDGE is defined, then monotonicity of
* predicted time is guaranteed only for recent local_timestamp values
* lesser than the current mach_absolute_time upto 1 second.
*
* If CONFIG_MACH_BRIDGE_SEND_TIME is true, then the function is compiled
* for the remote CPU. If CONFIG_MACH_BRIDGE_RECV_TIME is true, then the
* the function is compiled for the local CPU. Both config options cannot
* be true simultaneously.
*/
uint64_t
mach_bridge_remote_time(uint64_t local_timestamp)
{
#if defined(CONFIG_MACH_BRIDGE_SEND_TIME)
#if !defined(CONFIG_MACH_BRIDGE_RECV_TIME)
/* only send side of the bridge is defined: no translation needed */
if (!local_timestamp) {
return mach_absolute_time();
}
return 0;
#else
#error "You cannot define both sides of the bridge!"
#endif /* !defined(CONFIG_MACH_BRIDGE_RECV_TIME) */
#else
#if !defined(CONFIG_MACH_BRIDGE_RECV_TIME)
/* neither the send or receive side of the bridge is defined: echo the input */
return local_timestamp;
#else
if (!os_atomic_load(&bt_init_flag, acquire)) {
return 0;
}
uint64_t remote_timestamp = 0;
lck_spin_lock(&bt_ts_conversion_lock);
uint64_t now = mach_absolute_time();
if (!local_timestamp) {
local_timestamp = now;
}
#if defined(XNU_TARGET_OS_BRIDGE)
uint64_t local_timestamp_ns = 0;
if (local_timestamp < now) {
absolutetime_to_nanoseconds(local_timestamp, &local_timestamp_ns);
struct bt_params *params = bt_params_find(local_timestamp_ns);
remote_timestamp = mach_bridge_compute_timestamp(local_timestamp_ns, params);
}
#else
struct bt_params params = bt_params_get_latest_locked();
remote_timestamp = mach_bridge_compute_timestamp(local_timestamp, &params);
#endif /* defined(XNU_TARGET_OS_BRIDGE) */
lck_spin_unlock(&bt_ts_conversion_lock);
KDBG(MACHDBG_CODE(DBG_MACH_CLOCK, MACH_BRIDGE_REMOTE_TIME), local_timestamp, remote_timestamp, now);
return remote_timestamp;
#endif /* !defined(CONFIG_MACH_BRIDGE_RECV_TIME) */
#endif /* defined(CONFIG_MACH_BRIDGE_SEND_TIME) */
}