monado/src/xrt/auxiliary/util/u_timing_render.c

427 lines
11 KiB
C

// Copyright 2020-2021, Collabora, Ltd.
// SPDX-License-Identifier: BSL-1.0
/*!
* @file
* @brief Shared frame timing code.
* @author Jakob Bornecrantz <jakob@collabora.com>
* @ingroup aux_util
*/
#include "os/os_time.h"
#include "util/u_time.h"
#include "util/u_misc.h"
#include "util/u_debug.h"
#include "util/u_timing.h"
#include "util/u_logging.h"
#include "util/u_trace_marker.h"
#include <stdio.h>
#include <assert.h>
#include <inttypes.h>
/*
*
* Structs enums, and defines.
*
*/
enum u_rt_state
{
U_RT_READY,
U_RT_WAIT_LEFT,
U_RT_PREDICTED,
U_RT_BEGUN,
};
struct u_rt_frame
{
//! When we predicted this frame to be shown.
uint64_t predicted_display_time_ns;
//! The selected display period.
uint64_t predicted_display_period_ns;
//! When the client should have delivered the frame.
uint64_t predicted_delivery_time_ns;
struct
{
uint64_t predicted_ns;
uint64_t wait_woke_ns;
uint64_t begin_ns;
uint64_t delivered_ns;
} when; //!< When something happened.
int64_t frame_id;
enum u_rt_state state;
};
struct render_timing
{
struct u_render_timing base;
struct u_rt_frame frames[2];
uint32_t current_frame;
uint32_t next_frame;
int64_t frame_counter;
struct
{
//! App time between wait returning and begin being called.
uint64_t cpu_time_ns;
//! Time between begin and frame rendering completeing.
uint64_t draw_time_ns;
//! Exrta time between end of draw time and when the compositor wakes up.
uint64_t margin_ns;
} app; //!< App statistics.
struct
{
//! The last display time that the thing driving this helper got.
uint64_t predicted_display_time_ns;
//! The last display period the hardware is running at.
uint64_t predicted_display_period_ns;
//! The extra time needed by the thing driving this helper.
uint64_t extra_ns;
} last_input;
uint64_t last_returned_ns;
};
/*
*
* Helpers
*
*/
static inline struct render_timing *
render_timing(struct u_render_timing *urt)
{
return (struct render_timing *)urt;
}
DEBUG_GET_ONCE_LOG_OPTION(ll, "U_TIMING_RENDER_LOG", U_LOGGING_WARN)
#define RT_LOG_T(...) U_LOG_IFL_T(debug_get_log_option_ll(), __VA_ARGS__)
#define RT_LOG_D(...) U_LOG_IFL_D(debug_get_log_option_ll(), __VA_ARGS__)
#define RT_LOG_I(...) U_LOG_IFL_I(debug_get_log_option_ll(), __VA_ARGS__)
#define RT_LOG_W(...) U_LOG_IFL_W(debug_get_log_option_ll(), __VA_ARGS__)
#define RT_LOG_E(...) U_LOG_IFL_E(debug_get_log_option_ll(), __VA_ARGS__)
#define DEBUG_PRINT_FRAME_ID() RT_LOG_T("%" PRIi64, frame_id)
#define GET_INDEX_FROM_ID(RT, ID) ((uint64_t)(ID) % ARRAY_SIZE((RT)->frames))
#define IIR_ALPHA_LT 0.8
#define IIR_ALPHA_GT 0.8
static void
do_iir_filter(uint64_t *target, double alpha_lt, double alpha_gt, uint64_t sample)
{
uint64_t t = *target;
double alpha = t < sample ? alpha_lt : alpha_gt;
double a = time_ns_to_s(t) * alpha;
double b = time_ns_to_s(sample) * (1.0 - alpha);
*target = time_s_to_ns(a + b);
}
static uint64_t
min_period(const struct render_timing *rt)
{
return rt->last_input.predicted_display_period_ns;
}
static uint64_t
last_sample_displayed(const struct render_timing *rt)
{
return rt->last_input.predicted_display_time_ns;
}
static uint64_t
last_return_predicted_display(const struct render_timing *rt)
{
return rt->last_returned_ns;
}
static uint64_t
total_app_time_ns(const struct render_timing *rt)
{
return rt->app.cpu_time_ns + rt->app.draw_time_ns;
}
static uint64_t
total_compositor_time_ns(const struct render_timing *rt)
{
return rt->app.margin_ns + rt->last_input.extra_ns;
}
static uint64_t
total_app_and_compositor_time_ns(const struct render_timing *rt)
{
return total_app_time_ns(rt) + total_compositor_time_ns(rt);
}
static uint64_t
calc_period(const struct render_timing *rt)
{
// Error checking.
uint64_t base_period_ns = min_period(rt);
if (base_period_ns == 0) {
assert(false && "Have not yet received and samples from timing driver.");
base_period_ns = U_TIME_1MS_IN_NS * 16; // Sure
}
// Calculate the using both values separately.
uint64_t period_ns = base_period_ns;
while (rt->app.cpu_time_ns > period_ns) {
period_ns += base_period_ns;
}
while (rt->app.draw_time_ns > period_ns) {
period_ns += base_period_ns;
}
return period_ns;
}
static uint64_t
predict_display_time(const struct render_timing *rt, uint64_t period_ns)
{
// Now
uint64_t now_ns = os_monotonic_get_ns();
// Total app and compositor time to produce a frame
uint64_t app_and_compositor_time_ns = total_app_and_compositor_time_ns(rt);
// Start from the last time that the driver displayed something.
uint64_t val = last_sample_displayed(rt);
// Return a time after the last returned display time.
while (val <= last_return_predicted_display(rt)) {
val += period_ns;
}
// Have to have enough time to perform app work.
while ((val - app_and_compositor_time_ns) <= now_ns) {
val += period_ns;
}
return val;
}
/*
*
* Member functions.
*
*/
static void
rt_predict(struct u_render_timing *urt,
int64_t *out_frame_id,
uint64_t *out_wake_up_time,
uint64_t *out_predicted_display_time,
uint64_t *out_predicted_display_period)
{
struct render_timing *rt = render_timing(urt);
int64_t frame_id = ++rt->frame_counter;
*out_frame_id = frame_id;
DEBUG_PRINT_FRAME_ID();
uint64_t period_ns = calc_period(rt);
uint64_t predict_ns = predict_display_time(rt, period_ns);
// When should the client wake up.
uint64_t wake_up_time_ns = predict_ns - total_app_and_compositor_time_ns(rt);
// When the client should deliver the frame to us.
uint64_t delivery_time_ns = predict_ns - total_compositor_time_ns(rt);
rt->last_returned_ns = predict_ns;
*out_wake_up_time = wake_up_time_ns;
*out_predicted_display_time = predict_ns;
*out_predicted_display_period = period_ns;
size_t index = GET_INDEX_FROM_ID(rt, frame_id);
assert(rt->frames[index].frame_id == -1);
assert(rt->frames[index].state == U_RT_READY);
rt->frames[index].state = U_RT_PREDICTED;
rt->frames[index].frame_id = frame_id;
rt->frames[index].predicted_delivery_time_ns = delivery_time_ns;
rt->frames[index].predicted_display_period_ns = period_ns;
rt->frames[index].when.predicted_ns = os_monotonic_get_ns();
}
static void
rt_mark_point(struct u_render_timing *urt, int64_t frame_id, enum u_timing_point point, uint64_t when_ns)
{
struct render_timing *rt = render_timing(urt);
RT_LOG_T("%" PRIi64 " (%u)", frame_id, point);
size_t index = GET_INDEX_FROM_ID(rt, frame_id);
assert(rt->frames[index].frame_id == frame_id);
switch (point) {
case U_TIMING_POINT_WAKE_UP:
assert(rt->frames[index].state == U_RT_PREDICTED);
rt->frames[index].when.wait_woke_ns = when_ns;
rt->frames[index].state = U_RT_WAIT_LEFT;
break;
case U_TIMING_POINT_BEGIN:
assert(rt->frames[index].state == U_RT_WAIT_LEFT);
rt->frames[index].when.begin_ns = os_monotonic_get_ns();
rt->frames[index].state = U_RT_BEGUN;
break;
case U_TIMING_POINT_SUBMIT:
default: assert(false);
}
}
static void
rt_mark_discarded(struct u_render_timing *urt, int64_t frame_id)
{
struct render_timing *rt = render_timing(urt);
DEBUG_PRINT_FRAME_ID();
size_t index = GET_INDEX_FROM_ID(rt, frame_id);
assert(rt->frames[index].frame_id == frame_id);
assert(rt->frames[index].state == U_RT_WAIT_LEFT || rt->frames[index].state == U_RT_BEGUN);
rt->frames[index].when.delivered_ns = os_monotonic_get_ns();
rt->frames[index].state = U_RT_READY;
rt->frames[index].frame_id = -1;
}
static void
rt_mark_delivered(struct u_render_timing *urt, int64_t frame_id)
{
struct render_timing *rt = render_timing(urt);
DEBUG_PRINT_FRAME_ID();
size_t index = GET_INDEX_FROM_ID(rt, frame_id);
struct u_rt_frame *f = &rt->frames[index];
assert(f->frame_id == frame_id);
assert(f->state == U_RT_BEGUN);
uint64_t now_ns = os_monotonic_get_ns();
// Update all data.
f->when.delivered_ns = now_ns;
/*
* Process data.
*/
int64_t diff_ns = f->predicted_delivery_time_ns - now_ns;
bool late = false;
if (diff_ns < 0) {
diff_ns = -diff_ns;
late = true;
}
#define NS_TO_MS_F(ns) (time_ns_to_s(ns) * 1000.0)
uint64_t diff_cpu_ns = f->when.begin_ns - f->when.wait_woke_ns;
uint64_t diff_draw_ns = f->when.delivered_ns - f->when.begin_ns;
RT_LOG_D(
"Delivered frame %.2fms %s." //
"\n\tperiod: %.2f" //
"\n\tcpu o: %.2f, n: %.2f" //
"\n\tdraw o: %.2f, n: %.2f", //
time_ns_to_ms_f(diff_ns), late ? "late" : "early", //
time_ns_to_ms_f(f->predicted_display_period_ns), //
time_ns_to_ms_f(rt->app.cpu_time_ns), time_ns_to_ms_f(diff_cpu_ns), //
time_ns_to_ms_f(rt->app.draw_time_ns), time_ns_to_ms_f(diff_draw_ns)); //
do_iir_filter(&rt->app.cpu_time_ns, IIR_ALPHA_LT, IIR_ALPHA_GT, diff_cpu_ns);
do_iir_filter(&rt->app.draw_time_ns, IIR_ALPHA_LT, IIR_ALPHA_GT, diff_draw_ns);
// Trace the data.
#ifdef XRT_FEATURE_TRACING
#define TE_BEG(TRACK, TIME, NAME) U_TRACE_EVENT_BEGIN_ON_TRACK_DATA(timing, TRACK, TIME, NAME, PERCETTO_I(f->frame_id))
#define TE_END(TRACK, TIME) U_TRACE_EVENT_END_ON_TRACK(timing, TRACK, TIME)
if (U_TRACE_CATEGORY_IS_ENABLED(timing)) {
TE_BEG(ft_cpu, f->when.predicted_ns, "sleep");
TE_END(ft_cpu, f->when.wait_woke_ns);
uint64_t cpu_start_ns = f->when.wait_woke_ns + 1;
TE_BEG(ft_cpu, cpu_start_ns, "cpu");
TE_END(ft_cpu, f->when.begin_ns);
TE_BEG(ft_draw, f->when.begin_ns, "draw");
TE_END(ft_draw, f->when.delivered_ns);
}
#undef TE_BEG
#undef TE_END
#endif
// Reset the frame.
f->state = U_RT_READY;
f->frame_id = -1;
}
static void
rt_info(struct u_render_timing *urt,
uint64_t predicted_display_time_ns,
uint64_t predicted_display_period_ns,
uint64_t extra_ns)
{
struct render_timing *rt = render_timing(urt);
rt->last_input.predicted_display_time_ns = predicted_display_time_ns;
rt->last_input.predicted_display_period_ns = predicted_display_period_ns;
rt->last_input.extra_ns = extra_ns;
}
static void
rt_destroy(struct u_render_timing *urt)
{
free(urt);
}
/*
*
* 'Exported' functions.
*
*/
xrt_result_t
u_rt_create(struct u_render_timing **out_urt)
{
struct render_timing *rt = U_TYPED_CALLOC(struct render_timing);
rt->base.predict = rt_predict;
rt->base.mark_point = rt_mark_point;
rt->base.mark_discarded = rt_mark_discarded;
rt->base.mark_delivered = rt_mark_delivered;
rt->base.info = rt_info;
rt->base.destroy = rt_destroy;
rt->app.cpu_time_ns = U_TIME_1MS_IN_NS * 2;
rt->app.draw_time_ns = U_TIME_1MS_IN_NS * 2;
rt->app.margin_ns = U_TIME_1MS_IN_NS / 2;
for (size_t i = 0; i < ARRAY_SIZE(rt->frames); i++) {
rt->frames[i].state = U_RT_READY;
rt->frames[i].frame_id = -1;
}
*out_urt = &rt->base;
return XRT_SUCCESS;
}