aux/vive: Parse camera calibration

This commit is contained in:
Moses Turner 2021-09-02 01:41:21 -05:00 committed by Moses Turner
parent efbc4cd9e5
commit cef922946a
4 changed files with 259 additions and 2 deletions

View file

@ -291,7 +291,7 @@ if (XRT_BUILD_DRIVER_VIVE OR XRT_BUILD_DRIVER_SURVIVE)
vive/vive_config.c vive/vive_config.c
) )
add_library(aux_vive STATIC ${VIVE_CONFIG_SOURCE_FILES}) add_library(aux_vive STATIC ${VIVE_CONFIG_SOURCE_FILES})
target_link_libraries(aux_vive PRIVATE xrt-interfaces aux_util aux_math xrt-external-cjson) target_link_libraries(aux_vive PRIVATE xrt-interfaces aux_util aux_math aux_tracking xrt-external-cjson)
target_link_libraries(aux_vive PRIVATE ${ZLIB_LIBRARIES}) target_link_libraries(aux_vive PRIVATE ${ZLIB_LIBRARIES})
target_include_directories(aux_vive PRIVATE ${ZLIB_INCLUDE_DIRS}) target_include_directories(aux_vive PRIVATE ${ZLIB_INCLUDE_DIRS})
endif() endif()

View file

@ -247,7 +247,7 @@ lib_aux_vive = static_library(
xrt_include, xrt_include,
cjson_include, cjson_include,
], ],
dependencies: [zlib], dependencies: [zlib, aux_tracking],
) )
aux_vive = declare_dependency( aux_vive = declare_dependency(

View file

@ -4,6 +4,7 @@
* @file * @file
* @brief Vive json implementation * @brief Vive json implementation
* @author Lubosz Sarnecki <lubosz.sarnecki@collabora.com> * @author Lubosz Sarnecki <lubosz.sarnecki@collabora.com>
* @author Moses Turner <moses@collabora.com>
* @ingroup drv_vive * @ingroup drv_vive
*/ */
@ -17,6 +18,10 @@
#include "math/m_api.h" #include "math/m_api.h"
#include "tracking/t_tracking.h"
#include "math/m_vec3.h"
#include "math/m_space.h"
#define VIVE_TRACE(d, ...) U_LOG_IFL_T(d->ll, __VA_ARGS__) #define VIVE_TRACE(d, ...) U_LOG_IFL_T(d->ll, __VA_ARGS__)
#define VIVE_DEBUG(d, ...) U_LOG_IFL_D(d->ll, __VA_ARGS__) #define VIVE_DEBUG(d, ...) U_LOG_IFL_D(d->ll, __VA_ARGS__)
@ -31,6 +36,10 @@
#define JSON_MATRIX_3X3(a, b, c) u_json_get_matrix_3x3(u_json_get(a, b), c) #define JSON_MATRIX_3X3(a, b, c) u_json_get_matrix_3x3(u_json_get(a, b), c)
#define JSON_STRING(a, b, c) u_json_get_string_into_array(u_json_get(a, b), c, sizeof(c)) #define JSON_STRING(a, b, c) u_json_get_string_into_array(u_json_get(a, b), c, sizeof(c))
#define printf_pose(pose) \
printf("%f %f %f %f %f %f %f\n", pose.position.x, pose.position.y, pose.position.z, pose.orientation.x, \
pose.orientation.y, pose.orientation.z, pose.orientation.w);
static void static void
_get_color_coeffs(struct u_vive_values *values, const cJSON *coeffs, uint8_t eye, uint8_t channel) _get_color_coeffs(struct u_vive_values *values, const cJSON *coeffs, uint8_t eye, uint8_t channel)
{ {
@ -180,6 +189,170 @@ _print_vec3(const char *title, struct xrt_vec3 *vec)
U_LOG_D("%s = %f %f %f", title, (double)vec->x, (double)vec->y, (double)vec->z); U_LOG_D("%s = %f %f %f", title, (double)vec->x, (double)vec->y, (double)vec->z);
} }
static bool
_get_camera(struct index_camera *cam, const cJSON *cam_json)
{
bool succeeded = true;
const cJSON *extrinsics = u_json_get(cam_json, "extrinsics");
succeeded = succeeded && JSON_VEC3(extrinsics, "plus_x", &cam->extrinsics.plus_x);
succeeded = succeeded && JSON_VEC3(extrinsics, "plus_z", &cam->extrinsics.plus_z);
succeeded = succeeded && JSON_VEC3(extrinsics, "position", &cam->extrinsics.position);
const cJSON *intrinsics = u_json_get(cam_json, "intrinsics");
succeeded = succeeded && u_json_get_double_array(u_json_get(u_json_get(intrinsics, "distort"), "coeffs"),
cam->intrinsics.distortion, 4);
succeeded = succeeded && u_json_get_double(u_json_get(intrinsics, "center_x"), &cam->intrinsics.center_x);
succeeded = succeeded && u_json_get_double(u_json_get(intrinsics, "center_y"), &cam->intrinsics.center_y);
succeeded = succeeded && u_json_get_double(u_json_get(intrinsics, "focal_x"), &cam->intrinsics.focal_x);
succeeded = succeeded && u_json_get_double(u_json_get(intrinsics, "focal_y"), &cam->intrinsics.focal_y);
succeeded = succeeded && u_json_get_int(u_json_get(intrinsics, "height"), &cam->intrinsics.image_size_pixels.h);
succeeded = succeeded && u_json_get_int(u_json_get(intrinsics, "width"), &cam->intrinsics.image_size_pixels.w);
if (!succeeded) {
return false;
}
return true;
}
bool
vive_get_stereo_camera_calibration(struct vive_config *d,
struct t_stereo_camera_calibration **out_calibration,
struct xrt_pose *head_in_left_camera)
{
// Note! This doesn't feel exactly correct - some parts of the math seem weird, and when undistorting the
// images with the data produced by this function, things don't quite line up along epipolar lines. If you're
// really good at this kind of math and very bored, you could try to figure out what the problem is here. I for
// one have to accept that I don't have time for this and have to merge it as-is.
if (!d->cameras.valid) {
U_LOG_W("Why did you call me?");
return false;
}
struct index_camera *cameras = d->cameras.view;
bool print_debug = false;
struct t_stereo_camera_calibration *out_calib = NULL;
t_stereo_camera_calibration_alloc(&out_calib, 5);
*out_calibration = out_calib;
struct xrt_matrix_3x3 rotate_hmd_to_camera[2];
struct xrt_matrix_3x3 rotate_camera_to_hmd[2];
for (int i = 0; i < 2; i++) {
out_calib->view[i].use_fisheye = true;
out_calib->view[i].image_size_pixels.h = 960;
out_calib->view[i].image_size_pixels.w = 960;
// This better be row-major!
out_calib->view[i].intrinsics[0][0] = cameras[i].intrinsics.focal_x;
out_calib->view[i].intrinsics[0][1] = 0.0f;
out_calib->view[i].intrinsics[0][2] = cameras[i].intrinsics.center_x;
out_calib->view[i].intrinsics[1][0] = 0.0f;
out_calib->view[i].intrinsics[1][1] = cameras[i].intrinsics.focal_y;
out_calib->view[i].intrinsics[1][2] = cameras[i].intrinsics.center_y;
out_calib->view[i].intrinsics[2][0] = 0.0f;
out_calib->view[i].intrinsics[2][1] = 0.0f;
out_calib->view[i].intrinsics[2][2] = 1.0f;
out_calib->view[i].distortion_fisheye[0] = cameras[i].intrinsics.distortion[0];
out_calib->view[i].distortion_fisheye[1] = cameras[i].intrinsics.distortion[1];
out_calib->view[i].distortion_fisheye[2] = cameras[i].intrinsics.distortion[2];
out_calib->view[i].distortion_fisheye[3] = cameras[i].intrinsics.distortion[3];
struct xrt_vec3 plus_x = m_vec3_mul_scalar(cameras[i].extrinsics.plus_x, -1.0f);
struct xrt_vec3 plus_z = m_vec3_mul_scalar(cameras[i].extrinsics.plus_z, -1.0f);
struct xrt_vec3 plus_y;
math_vec3_cross(&plus_z, &plus_x, &plus_y);
// I will have a seziure if you ask me if this is row-major or col-major. It works, okay? *OKAY?*
rotate_hmd_to_camera[i].v[0] = plus_x.x;
rotate_hmd_to_camera[i].v[1] = plus_y.x;
rotate_hmd_to_camera[i].v[2] = plus_z.x;
rotate_hmd_to_camera[i].v[3] = plus_x.y;
rotate_hmd_to_camera[i].v[4] = plus_y.y;
rotate_hmd_to_camera[i].v[5] = plus_z.y;
rotate_hmd_to_camera[i].v[6] = plus_x.z;
rotate_hmd_to_camera[i].v[7] = plus_y.z;
rotate_hmd_to_camera[i].v[8] = plus_z.z;
math_matrix_3x3_inverse(&rotate_hmd_to_camera[i], &rotate_camera_to_hmd[i]);
}
// The Index has hard-coded position intrinsics: relative to the HMD origin, both cameras have the exact same Y
// and Z coordinate, and their X-coordinates have the same magnitude but opposite signs. In other words their
// positions are mirrored across the YZ plane. So, I can do cheesy shortcuts like this.
float negative_baseline = cameras[1].extrinsics.position.x - cameras[0].extrinsics.position.x;
// Doing rotate_camera_to_hmd * (baseline, 0, 0)
out_calib->camera_translation[0] = negative_baseline * rotate_camera_to_hmd[1].v[0];
out_calib->camera_translation[1] = negative_baseline * rotate_camera_to_hmd[1].v[1];
out_calib->camera_translation[2] = negative_baseline * rotate_camera_to_hmd[1].v[2];
struct xrt_matrix_3x3 rot_left_camera_to_right_camera;
math_matrix_3x3_multiply(&rotate_hmd_to_camera[1], &rotate_camera_to_hmd[0], &rot_left_camera_to_right_camera);
out_calib->camera_rotation[0][0] = rot_left_camera_to_right_camera.v[0];
out_calib->camera_rotation[0][1] = rot_left_camera_to_right_camera.v[1];
out_calib->camera_rotation[0][2] = rot_left_camera_to_right_camera.v[2];
out_calib->camera_rotation[1][0] = rot_left_camera_to_right_camera.v[3];
out_calib->camera_rotation[1][1] = rot_left_camera_to_right_camera.v[4];
out_calib->camera_rotation[1][2] = rot_left_camera_to_right_camera.v[5];
out_calib->camera_rotation[2][0] = rot_left_camera_to_right_camera.v[6];
out_calib->camera_rotation[2][1] = rot_left_camera_to_right_camera.v[7];
out_calib->camera_rotation[2][2] = rot_left_camera_to_right_camera.v[8];
struct xrt_space_graph xsg_hmd_in_left_cam = {0};
// For some reason xrt_space_graph wants things in the opposite order as you'd expect.
// Second, we apply the position:
struct xrt_pose just_translation = {0};
just_translation.orientation.w = 1.0f;
just_translation.orientation.x = 0.0f;
just_translation.orientation.y = 0.0f;
just_translation.orientation.z = 0.0f;
// Weird that only the y-component has to be negative, right? I, the person writing this, don't really
// understand it. The Index calibration sure uses weird coordinate spaces.
just_translation.position.x = cameras[0].extrinsics.position.x;
just_translation.position.y = -cameras[0].extrinsics.position.y;
just_translation.position.z = cameras[0].extrinsics.position.z;
m_space_graph_add_pose(&xsg_hmd_in_left_cam, &just_translation);
// First, we add the rotation:
struct xrt_pose just_rotation = {0};
math_quat_from_matrix_3x3(&rotate_camera_to_hmd[0], &just_rotation.orientation);
m_space_graph_add_pose(&xsg_hmd_in_left_cam, &just_rotation);
struct xrt_space_relation head_in_left_cam = {0};
m_space_graph_resolve(&xsg_hmd_in_left_cam, &head_in_left_cam);
if (print_debug) {
printf_pose(head_in_left_cam.pose);
}
*head_in_left_camera = head_in_left_cam.pose;
return true;
}
static void static void
vive_init_defaults(struct vive_config *d) vive_init_defaults(struct vive_config *d)
{ {
@ -200,6 +373,8 @@ vive_init_defaults(struct vive_config *d)
d->imu.gyro_scale.y = 1.0f; d->imu.gyro_scale.y = 1.0f;
d->imu.gyro_scale.z = 1.0f; d->imu.gyro_scale.z = 1.0f;
d->cameras.valid = false;
for (int view = 0; view < 2; view++) { for (int view = 0; view < 2; view++) {
d->distortion[view].aspect_x_over_y = 0.89999997615814209f; d->distortion[view].aspect_x_over_y = 0.89999997615814209f;
d->distortion[view].grow_for_undistort = 0.5f; d->distortion[view].grow_for_undistort = 0.5f;
@ -279,6 +454,45 @@ vive_config_parse(struct vive_config *d, char *json_string, enum u_logging_level
math_pose_transform(&trackref_to_head, &d->imu.trackref, &imu_to_head); math_pose_transform(&trackref_to_head, &d->imu.trackref, &imu_to_head);
d->display.imuref = imu_to_head; d->display.imuref = imu_to_head;
// Hey! Moses wrote this part in a pretty big hurry; you will definitely see some suspect things here.
// If you're bored, please fix them!
const cJSON *cms = u_json_get(json, "tracked_cameras");
const cJSON *cmr;
bool found_camera_json = false;
bool succeeded_parsing_json = false;
cJSON_ArrayForEach(cmr, cms)
{
found_camera_json = true;
const cJSON *name_json = u_json_get(cmr, "name");
const char *name = name_json->valuestring;
bool is_left = !strcmp("left", name);
bool is_right = !strcmp("right", name);
if (!is_left && !is_right) {
continue;
}
if (!_get_camera(&d->cameras.view[is_right], cmr)) {
succeeded_parsing_json = false;
break;
}
succeeded_parsing_json = true;
}
if (!found_camera_json) {
U_LOG_W("HMD is Index, but no cameras in json file!");
} else if (!succeeded_parsing_json) {
U_LOG_E("Failed to parse Index camera calibration!");
} else {
d->cameras.valid = true;
}
} break; } break;
default: default:
VIVE_ERROR(d, "Unknown Vive variant."); VIVE_ERROR(d, "Unknown Vive variant.");

View file

@ -4,6 +4,7 @@
* @file * @file
* @brief vive json header * @brief vive json header
* @author Lubosz Sarnecki <lubosz.sarnecki@collabora.com> * @author Lubosz Sarnecki <lubosz.sarnecki@collabora.com>
* @author Moses Turner <moses@collabora.com>
* @ingroup drv_vive * @ingroup drv_vive
*/ */
@ -14,6 +15,7 @@
#include "xrt/xrt_defines.h" #include "xrt/xrt_defines.h"
#include "util/u_logging.h" #include "util/u_logging.h"
#include "util/u_distortion_mesh.h" #include "util/u_distortion_mesh.h"
#include "tracking/t_tracking.h"
// public documentation // public documentation
#define INDEX_MIN_IPD 0.058 #define INDEX_MIN_IPD 0.058
@ -41,6 +43,36 @@ enum VIVE_CONTROLLER_VARIANT
CONTROLLER_UNKNOWN CONTROLLER_UNKNOWN
}; };
/*!
* A calibrated camera on an Index.
*/
struct index_camera
{
// Note! All the values in this struct are directly pasted in from the JSON values.
// As such, in my opinion, plus_x, plus_z and position are all "wrong" - all the code I've had to write that
// uses this struct flips the signs of plus_x, plus_z, and the signs of the X- and Z-components of position.
// I have no idea why those sign flips were necessary - I suppose Valve/HTC just made some weird decisions when
// making the config file schemas. I figure it would be very confusing to try to "fix" these values as I'm
// parsing them, so if you're writing code downstream of this, beware and expect the values in here to be
// exactly the same as those in the compressed JSON. -Moses
struct
{
struct xrt_vec3 plus_x;
struct xrt_vec3 plus_z;
struct xrt_vec3 position; // looks like from head pose
} extrinsics;
struct
{
double distortion[4]; // Kannala-Brandt
double center_x;
double center_y;
double focal_x;
double focal_y;
struct xrt_size image_size_pixels;
} intrinsics;
};
/*! /*!
* A single lighthouse senosor point and normal, in IMU space. * A single lighthouse senosor point and normal, in IMU space.
*/ */
@ -113,6 +145,12 @@ struct vive_config
struct u_vive_values distortion[2]; struct u_vive_values distortion[2];
struct
{
struct index_camera view[2];
bool valid;
} cameras;
struct lh_model lh; struct lh_model lh;
}; };
@ -161,3 +199,8 @@ struct vive_controller_device;
bool bool
vive_config_parse_controller(struct vive_controller_config *d, char *json_string, enum u_logging_level ll); vive_config_parse_controller(struct vive_controller_config *d, char *json_string, enum u_logging_level ll);
bool
vive_get_stereo_camera_calibration(struct vive_config *d,
struct t_stereo_camera_calibration **out_calibration,
struct xrt_pose *head_in_left_camera);