diff --git a/src/xrt/compositor/CMakeLists.txt b/src/xrt/compositor/CMakeLists.txt index a31df2d08..ca6b299a5 100644 --- a/src/xrt/compositor/CMakeLists.txt +++ b/src/xrt/compositor/CMakeLists.txt @@ -153,6 +153,7 @@ if(XRT_HAVE_VULKAN) util/comp_base.c util/comp_render.h util/comp_render_cs.c + util/comp_render_gfx.c util/comp_render_helpers.h util/comp_semaphore.h util/comp_semaphore.c diff --git a/src/xrt/compositor/util/comp_render.h b/src/xrt/compositor/util/comp_render.h index 9b1b11ae5..8be8f8ccb 100644 --- a/src/xrt/compositor/util/comp_render.h +++ b/src/xrt/compositor/util/comp_render.h @@ -22,6 +22,45 @@ extern "C" { struct comp_layer; +/*! + * Helper function that takes a set of layers, new device poses, a scratch + * images with associated @ref render_gfx_target_resources and writes the needed + * commands to the @ref render_gfx to do a full composition with distortion. + * The scratch images are optionally used to squash layers should it not be + * possible to do a @p fast_path. Will use the render passes of the targets + * which set the layout. + * + * The render passes of @p rsi_rtrs must be created with a final_layout of + * VK_IMAGE_LAYOUT_SHADER_READ_ONLY_OPTIMAL or there will be validation errors. + * + * Expected layouts: + * * Layer images: VK_IMAGE_LAYOUT_SHADER_READ_ONLY_OPTIMAL + * * Scratch images: Any (as per the @ref render_gfx_render_pass) + * * Target image: Any (as per the @ref render_gfx_render_pass) + * + * After call layouts: + * * Layer images: VK_IMAGE_LAYOUT_SHADER_READ_ONLY_OPTIMAL + * * Scratch images: VK_IMAGE_LAYOUT_SHADER_READ_ONLY_OPTIMAL + * * Target image: What the render pass of @p rtr specifies. + * + * @ingroup comp_util + */ +void +comp_render_gfx_dispatch(struct render_gfx *rr, + struct render_scratch_images *rsi, + struct render_gfx_target_resources rsi_rtrs[2], + const struct comp_layer *layers, + const uint32_t layer_count, + struct xrt_pose world_poses[2], + struct xrt_pose eye_poses[2], + struct xrt_fov fovs[2], + struct xrt_matrix_2x2 vertex_rots[2], + struct render_gfx_target_resources *rtr, + const struct render_viewport_data viewport_datas[2], + bool fast_path, + bool do_timewarp); + + /*! * Helper to dispatch the layer squasher for a single view. * diff --git a/src/xrt/compositor/util/comp_render_gfx.c b/src/xrt/compositor/util/comp_render_gfx.c new file mode 100644 index 000000000..50019b669 --- /dev/null +++ b/src/xrt/compositor/util/comp_render_gfx.c @@ -0,0 +1,632 @@ +// Copyright 2023, Collabora, Ltd. +// SPDX-License-Identifier: BSL-1.0 +/*! + * @file + * @brief Compositor gfx rendering code. + * @author Jakob Bornecrantz + * @ingroup comp_util + */ + +#include "xrt/xrt_compositor.h" + +#include "math/m_api.h" + +#include "util/u_misc.h" +#include "util/u_trace_marker.h" + +#include "vk/vk_helpers.h" + +#include "render/render_interface.h" + +#include "util/comp_render.h" +#include "util/comp_render_helpers.h" + + +/* + * + * Internal structs. + * + */ + +/* + * Internal state for a single view. + */ +struct gfx_view_state +{ + // Filled out descriptor sets. + VkDescriptorSet descriptor_sets[RENDER_MAX_LAYERS]; + + // The type of layer. + enum xrt_layer_type types[RENDER_MAX_LAYERS]; + // Is the alpha premultipled, false means unpremultiplied. + bool premultiplied_alphas[RENDER_MAX_LAYERS]; + + // Number of layers filed in. + uint32_t layer_count; + + // Full rotation and translation VP matrix, in world space. + struct xrt_matrix_4x4 world_vp_full; + // Full rotation and translation VP matrix, in view space. + struct xrt_matrix_4x4 eye_vp_full; + // Only rotation and translation VP matrix, in world space. + struct xrt_matrix_4x4 world_vp_rot_only; + // Only rotation and translation VP matrix, in view space. + struct xrt_matrix_4x4 eye_vp_rot_only; +}; + + +/* + * + * Static data. + * + */ + +static const VkClearColorValue background_color_idle = { + .float32 = {0.1f, 0.1f, 0.1f, 1.0f}, +}; + +static const VkClearColorValue background_color_active = { + .float32 = {0.0f, 0.0f, 0.0f, 1.0f}, +}; + + +/* + * + * Model view projection helper functions. + * + */ + +static inline void +calc_mvp_full(struct gfx_view_state *state, + const struct xrt_layer_data *layer_data, + const struct xrt_pose *pose, + const struct xrt_vec3 *scale, + struct xrt_matrix_4x4 *result) +{ + struct xrt_matrix_4x4 model; + math_matrix_4x4_model(pose, scale, &model); + + if (is_layer_view_space(layer_data)) { + math_matrix_4x4_multiply(&state->eye_vp_full, &model, result); + } else { + math_matrix_4x4_multiply(&state->world_vp_full, &model, result); + } +} + +static inline void +calc_mvp_rot_only(struct gfx_view_state *state, + const struct xrt_layer_data *data, + const struct xrt_pose *pose, + const struct xrt_vec3 *scale, + struct xrt_matrix_4x4 *result) +{ + struct xrt_matrix_4x4 model; + struct xrt_pose rot_only = { + .orientation = pose->orientation, + .position = XRT_VEC3_ZERO, + }; + math_matrix_4x4_model(&rot_only, scale, &model); + + if (is_layer_view_space(data)) { + math_matrix_4x4_multiply(&state->eye_vp_rot_only, &model, result); + } else { + math_matrix_4x4_multiply(&state->world_vp_rot_only, &model, result); + } +} + + +/* + * + * Graphics layer data builders. + * + */ + +static inline void +add_layer(struct gfx_view_state *state, const struct xrt_layer_data *data, VkDescriptorSet descriptor_set) +{ + uint32_t cur_layer = state->layer_count++; + state->descriptor_sets[cur_layer] = descriptor_set; + state->types[cur_layer] = data->type; + state->premultiplied_alphas[cur_layer] = !is_layer_unpremultiplied(data); +} + +static VkResult +do_projection_layer(struct render_gfx *rr, + const struct comp_layer *layer, + uint32_t view_index, + VkSampler clamp_to_edge, + VkSampler clamp_to_border_black, + struct gfx_view_state *state) +{ + const struct xrt_layer_data *layer_data = &layer->data; + const struct xrt_layer_projection_view_data *vd = NULL; + const struct xrt_layer_depth_data *dvd = NULL; + struct vk_bundle *vk = rr->r->vk; + VkResult ret; + + if (layer_data->type == XRT_LAYER_STEREO_PROJECTION) { + view_index_to_projection_data(view_index, layer_data, &vd); + } else { + view_index_to_depth_data(view_index, layer_data, &vd, &dvd); + } + + uint32_t sc_array_index = is_view_index_right(view_index) ? 1 : 0; + uint32_t array_index = vd->sub.array_index; + const struct comp_swapchain_image *image = &layer->sc_array[sc_array_index]->images[vd->sub.image_index]; + + // Color + VkSampler src_sampler = clamp_to_border_black; + VkImageView src_image_view = get_image_view(image, layer_data->flags, array_index); + + // Fully initialised below. + struct render_gfx_layer_projection_data data; + + // Used for Subimage and OpenGL flip. + set_post_transform_rect( // + layer_data, // data + &vd->sub.norm_rect, // src_norm_rect + false, // invert_flip + &data.post_transform); // out_norm_rect + + // Used to go from UV to tangent space. + render_calc_uv_to_tangent_lengths_rect(&vd->fov, &data.to_tanget); + + // Create MVP matrix, rotation only so we get 3dof timewarp. + struct xrt_vec3 scale = {1, 1, 1}; + calc_mvp_rot_only(state, layer_data, &vd->pose, &scale, &data.mvp); + + // Can fail if we have too many layers. + VkDescriptorSet descriptor_set = VK_NULL_HANDLE; + ret = render_gfx_layer_projection_alloc_and_write( // + rr, // rr + &data, // data + src_sampler, // src_sampler + src_image_view, // src_image_view + &descriptor_set); // out_descriptor_set + VK_CHK_AND_RET(ret, "render_gfx_layer_projection_alloc_and_write"); + + add_layer(state, layer_data, descriptor_set); + + return VK_SUCCESS; +} + +static VkResult +do_quad_layer(struct render_gfx *rr, + const struct comp_layer *layer, + uint32_t view_index, + VkSampler clamp_to_edge, + VkSampler clamp_to_border_black, + struct gfx_view_state *state) +{ + const struct xrt_layer_data *layer_data = &layer->data; + const struct xrt_layer_quad_data *q = &layer_data->quad; + struct vk_bundle *vk = rr->r->vk; + VkResult ret; + + // Should we actually do a layer here? + if (!is_view_index_visible(view_index, q->visibility)) { + return VK_SUCCESS; + } + + const uint32_t array_index = q->sub.array_index; + const struct comp_swapchain_image *image = &layer->sc_array[0]->images[q->sub.image_index]; + + // Color + VkSampler src_sampler = clamp_to_edge; + VkImageView src_image_view = get_image_view(image, layer_data->flags, array_index); + + // Fully initialised below. + struct render_gfx_layer_quad_data data; + + // Used for Subimage and OpenGL flip. + set_post_transform_rect( // + layer_data, // data + &q->sub.norm_rect, // src_norm_rect + false, // invert_flip + &data.post_transform); // out_norm_rect + + // Create MVP matrix, full 6dof mvp needed. + struct xrt_vec3 scale = {q->size.x, q->size.y, 1}; + calc_mvp_full(state, layer_data, &q->pose, &scale, &data.mvp); + + // Can fail if we have too many layers. + VkDescriptorSet descriptor_set = VK_NULL_HANDLE; + ret = render_gfx_layer_quad_alloc_and_write( // + rr, // rr + &data, // data + src_sampler, // src_sampler + src_image_view, // src_image_view + &descriptor_set); // out_descriptor_set + VK_CHK_AND_RET(ret, "render_gfx_layer_quad_alloc_and_write"); + + add_layer(state, layer_data, descriptor_set); + + return VK_SUCCESS; +} + +static void +do_layers(struct render_gfx *rr, + struct render_gfx_target_resources rtrs[2], + const struct render_viewport_data viewport_datas[2], + const struct xrt_fov new_fovs[2], + const struct xrt_pose world_poses[2], + const struct xrt_pose eye_poses[2], + const struct comp_layer *layers, + uint32_t layer_count) +{ + COMP_TRACE_MARKER(); + + struct vk_bundle *vk = rr->r->vk; + VkResult ret; + + // Hardcoded to stereo. + struct gfx_view_state views[2] = XRT_STRUCT_INIT; + + for (uint32_t view = 0; view < ARRAY_SIZE(views); view++) { + + // Projection + struct xrt_matrix_4x4 p; + math_matrix_4x4_projection_vulkan_infinite_reverse(&new_fovs[view], 0.1, &p); + + // Reused view matrix. + struct xrt_matrix_4x4 v; + + // World + math_matrix_4x4_view_from_pose(&world_poses[view], &v); + math_matrix_4x4_multiply(&p, &v, &views[view].world_vp_full); + + struct xrt_pose world_rot_only = {world_poses[view].orientation, XRT_VEC3_ZERO}; + math_matrix_4x4_view_from_pose(&world_rot_only, &v); + math_matrix_4x4_multiply(&p, &v, &views[view].world_vp_rot_only); + + // Eye + math_matrix_4x4_view_from_pose(&eye_poses[view], &v); + math_matrix_4x4_multiply(&p, &v, &views[view].eye_vp_full); + + struct xrt_pose eye_rot_only = {eye_poses[view].orientation, XRT_VEC3_ZERO}; + math_matrix_4x4_view_from_pose(&eye_rot_only, &v); + math_matrix_4x4_multiply(&p, &v, &views[view].eye_vp_rot_only); + } + + /* + * Reserve UBOs, create descriptor sets, and fill in any data a head of + * time, if we ever want to copy UBO data this lets us do that easily + * write a copy command before the other gfx commands. + */ + + assert(layer_count <= RENDER_MAX_LAYERS && "Too many layers"); + + VkSampler clamp_to_edge = rr->r->samplers.clamp_to_edge; + VkSampler clamp_to_border_black = rr->r->samplers.clamp_to_border_black; + + for (uint32_t view = 0; view < ARRAY_SIZE(views); view++) { + for (uint32_t i = 0; i < layer_count; i++) { + switch (layers[i].data.type) { + case XRT_LAYER_STEREO_PROJECTION: + case XRT_LAYER_STEREO_PROJECTION_DEPTH: + ret = do_projection_layer( // + rr, // rr + &layers[i], // layer + view, // view_index + clamp_to_edge, // clamp_to_edge + clamp_to_border_black, // clamp_to_border_black + &views[view]); // state + VK_CHK_WITH_GOTO(ret, "do_projection_layer", err_layer); + break; + case XRT_LAYER_QUAD: + ret = do_quad_layer( // + rr, // rr + &layers[i], // layer + view, // view_index + clamp_to_edge, // clamp_to_edge + clamp_to_border_black, // clamp_to_border_black + &views[view]); // state + VK_CHK_WITH_GOTO(ret, "do_quad_layer", err_layer); + break; + default: break; + } + } + } + + + /* + * Do command writing here. + */ + + const VkClearColorValue *color = layer_count == 0 ? &background_color_idle : &background_color_active; + + for (uint32_t view = 0; view < ARRAY_SIZE(views); view++) { + render_gfx_begin_target( // + rr, // + &rtrs[view], // + color); // + + render_gfx_begin_view( // + rr, // + view, // view_index + &viewport_datas[view]); // viewport_data + + struct gfx_view_state *state = &views[view]; + + for (uint32_t i = 0; i < state->layer_count; i++) { + switch (state->types[i]) { + case XRT_LAYER_STEREO_PROJECTION: + case XRT_LAYER_STEREO_PROJECTION_DEPTH: + render_gfx_layer_projection( // + rr, // + state->premultiplied_alphas[i], // + state->descriptor_sets[i]); // + break; + case XRT_LAYER_QUAD: + render_gfx_layer_quad( // + rr, // + state->premultiplied_alphas[i], // + state->descriptor_sets[i]); // + break; + default: break; + } + } + + render_gfx_end_view(rr); + + render_gfx_end_target(rr); + } + + + return; + +err_layer: + // Allocator reset at end of frame, nothing to clean up. + VK_ERROR(vk, "Layer processing failed, that shouldn't happen!"); +} + + +/* + * + * Graphics distortion helpers. + * + */ + +static void +do_mesh(struct render_gfx *rr, + struct render_gfx_target_resources *rtr, + const struct render_viewport_data viewport_datas[2], + const struct xrt_matrix_2x2 vertex_rots[2], + VkSampler src_samplers[2], + VkImageView src_image_views[2], + const struct xrt_normalized_rect src_norm_rects[2], + const struct xrt_pose src_poses[2], + const struct xrt_fov src_fovs[2], + const struct xrt_pose new_poses[2], + bool do_timewarp) +{ + struct vk_bundle *vk = rr->r->vk; + VkResult ret; + + /* + * Reserve UBOs, create descriptor sets, and fill in any data a head of + * time, if we ever want to copy UBO data this lets us do that easily + * write a copy command before the other gfx commands. + */ + + VkDescriptorSet descriptor_sets[2] = XRT_STRUCT_INIT; + for (uint32_t i = 0; i < 2; i++) { + + struct render_gfx_mesh_ubo_data data = { + .vertex_rot = vertex_rots[i], + .post_transform = src_norm_rects[i], + }; + + // Extra arguments for timewarp. + if (do_timewarp) { + data.pre_transform = rr->r->distortion.uv_to_tanangle[i]; + + render_calc_time_warp_matrix( // + &src_poses[i], // + &src_fovs[i], // + &new_poses[i], // + &data.transform); // + } + + ret = render_gfx_mesh_alloc_and_write( // + rr, // + &data, // + src_samplers[i], // + src_image_views[i], // + &descriptor_sets[i]); // + VK_CHK_WITH_GOTO(ret, "render_gfx_mesh_alloc", err_no_memory); + } + + + /* + * Do command writing here. + */ + + render_gfx_begin_target( // + rr, // + rtr, // + &background_color_active); // + + for (uint32_t i = 0; i < 2; i++) { + render_gfx_begin_view( // + rr, // + i, // view_index + &viewport_datas[i]); // viewport_data + + render_gfx_mesh_draw( // + rr, // rr + i, // mesh_index + descriptor_sets[i], // descriptor_set + do_timewarp); // do_timewarp + + render_gfx_end_view(rr); + } + + render_gfx_end_target(rr); + + return; + +err_no_memory: + // Allocator reset at end of frame, nothing to clean up. + VK_ERROR(vk, "Could not allocate all UBOs for frame, that's really strange and shouldn't happen!"); +} + +static void +do_mesh_from_proj(struct render_gfx *rr, + struct render_gfx_target_resources *rts, + const struct render_viewport_data viewport_datas[2], + const struct xrt_matrix_2x2 vertex_rots[2], + const struct comp_layer *layer, + const struct xrt_layer_projection_view_data *lvd, + const struct xrt_layer_projection_view_data *rvd, + const struct xrt_pose new_poses[2], + bool do_timewarp) +{ + const struct xrt_layer_data *data = &layer->data; + const uint32_t left_array_index = lvd->sub.array_index; + const uint32_t right_array_index = rvd->sub.array_index; + const struct comp_swapchain_image *left = &layer->sc_array[0]->images[lvd->sub.image_index]; + const struct comp_swapchain_image *right = &layer->sc_array[1]->images[rvd->sub.image_index]; + + struct xrt_normalized_rect src_norm_rects[2] = {lvd->sub.norm_rect, rvd->sub.norm_rect}; + if (data->flip_y) { + src_norm_rects[0].h = -src_norm_rects[0].h; + src_norm_rects[0].y = 1 + src_norm_rects[0].y; + src_norm_rects[1].h = -src_norm_rects[1].h; + src_norm_rects[1].y = 1 + src_norm_rects[1].y; + } + + VkSampler clamp_to_border_black = rr->r->samplers.clamp_to_border_black; + VkSampler src_samplers[2] = { + clamp_to_border_black, + clamp_to_border_black, + }; + + VkImageView src_image_views[2] = { + get_image_view(left, data->flags, left_array_index), + get_image_view(right, data->flags, right_array_index), + }; + + const struct xrt_pose src_poses[2] = {lvd->pose, rvd->pose}; + const struct xrt_fov src_fovs[2] = {lvd->fov, rvd->fov}; + + do_mesh( // + rr, // + rts, // + viewport_datas, // + vertex_rots, // + src_samplers, // + src_image_views, // + src_norm_rects, // + src_poses, // + src_fovs, // + new_poses, // + do_timewarp); // +} + + +void +comp_render_gfx_dispatch(struct render_gfx *rr, + struct render_scratch_images *rsi, + struct render_gfx_target_resources rsi_rtrs[2], + const struct comp_layer *layers, + const uint32_t layer_count, + struct xrt_pose world_poses[2], + struct xrt_pose eye_poses[2], + struct xrt_fov fovs[2], + struct xrt_matrix_2x2 vertex_rots[2], + struct render_gfx_target_resources *rtr, + const struct render_viewport_data viewport_datas[2], + bool fast_path, + bool do_timewarp) +{ + // Only used if fast_path is true. + const struct comp_layer *layer = &layers[0]; + + // Sanity check. + assert(!fast_path || layer_count >= 1); + + if (fast_path && layer->data.type == XRT_LAYER_STEREO_PROJECTION) { + // Fast path. + const struct xrt_layer_stereo_projection_data *stereo = &layer->data.stereo; + const struct xrt_layer_projection_view_data *lvd = &stereo->l; + const struct xrt_layer_projection_view_data *rvd = &stereo->r; + + do_mesh_from_proj( // + rr, // + rtr, // + viewport_datas, // + vertex_rots, // + layer, // + lvd, // + rvd, // + world_poses, // + do_timewarp); // + + } else if (fast_path && layer->data.type == XRT_LAYER_STEREO_PROJECTION_DEPTH) { + // Fast path. + const struct xrt_layer_stereo_projection_depth_data *stereo = &layer->data.stereo_depth; + const struct xrt_layer_projection_view_data *lvd = &stereo->l; + const struct xrt_layer_projection_view_data *rvd = &stereo->r; + + do_mesh_from_proj( // + rr, // + rtr, // + viewport_datas, // + vertex_rots, // + layer, // + lvd, // + rvd, // + world_poses, // + do_timewarp); // + + } else { + if (fast_path) { + U_LOG_W("Wanted fast path but no projection layer, falling back to layer squasher."); + } + + struct render_viewport_data layer_viewport_datas[2] = { + {.x = 0, .y = 0, .w = rsi->extent.width, .h = rsi->extent.height}, + {.x = 0, .y = 0, .w = rsi->extent.width, .h = rsi->extent.height}, + }; + + do_layers( // + rr, // rr + rsi_rtrs, // rtrs + layer_viewport_datas, // viewport_datas + fovs, // new_fovs + world_poses, // world_poses + eye_poses, // eye_poses + layers, // layers + layer_count); // layer_count + + VkSampler clamp_to_border_black = rr->r->samplers.clamp_to_border_black; + VkSampler src_samplers[2] = { + clamp_to_border_black, + clamp_to_border_black, + }; + VkImageView src_image_views[2] = { + rsi->color[0].srgb_view, + rsi->color[1].srgb_view, + }; + + struct xrt_normalized_rect src_norm_rects[2] = { + {.x = 0, .y = 0, .w = 1, .h = 1}, + {.x = 0, .y = 0, .w = 1, .h = 1}, + }; + + // We are passing in the same old and new poses. + do_mesh( // + rr, // + rtr, // + viewport_datas, // + vertex_rots, // + src_samplers, // + src_image_views, // + src_norm_rects, // + world_poses, // + fovs, // + world_poses, // + false); // + } +}