scripts/step_05_align3D.R

# this is where we will align the marker 3d data using mousetrap.

library(tidyverse)
library(mousetrap)
library(ggprism)
library(conflicted)
# library(cowplot)


# load the data
dat <- read_tsv("data/combined_data_long.tsv.bz2",
  col_types = cols(
    index = col_integer(),
    REF_D_x = col_double(),
    REF_D_y = col_double(),
    REF_D_z = col_double(),
    REF_W_x = col_double(),
    REF_W_y = col_double(),
    REF_W_z = col_double(),
    condition = col_factor(),
    trial = col_factor(),
    trial_elapsed_time = col_double(),
    experiment_id = col_factor(),
    subj_pos = col_factor(),
    subj = col_factor(),
    CAR_x = col_double(),
    CAR_y = col_double(),
    CAR_z = col_double(),
    filename = col_factor()
  ))

# add a unique trial ID which is a combination of experiment_id, subj, condition, trial
dat <- dat %>%
  mutate(
    mt_id = paste0(experiment_id, subj, condition, trial)
  )

# now we can remove every column except the ones used for mousetrap
dat <- dat %>%
  select(
    mt_id,
    index,
    trial_elapsed_time,
    CAR_x,
    CAR_y,
    CAR_z,
    trial,
    subj,
    subj_pos,
    condition,
    experiment_id
  )
# we can also remove all trial "1" data since that is the practice trial
# dat <- dat %>%
#   dplyr::filter(trial != "1")

# let's get the unique trial count
trial_counts <- dat %>% 
  group_by(mt_id) %>%
  summarise(
    trial_count = n_distinct(trial)
  ) %>%
  ungroup()
# instead let's remove trials under 30 seconds (practice trial is 30 seconds)
# first we need to find the max trial_elapsed_time for each trial
dat <- dat %>%
  group_by(mt_id) %>%
  mutate(
    max_trial_elapsed_time = max(trial_elapsed_time)
  ) %>%
  ungroup() %>%
  dplyr::filter(max_trial_elapsed_time > 30) %>%
  select(-max_trial_elapsed_time)

trial_counts <- dat %>% 
  group_by(mt_id) %>%
  summarise(
    trial_count = n_distinct(trial)
  ) %>%
  ungroup()


# timestamps seem to be required to be an integer, right now they are doubles
# number of seconds with 5 decimal places
# dat <- dat %>%
#  mutate(trial_elapsed_time = as.integer(trial_elapsed_time * 100000))

levels(dat$experiment_id) <- paste("Subject Pair", levels(dat$experiment_id))

levels(dat$trial) <- paste("Trial", as.integer(levels(dat$trial)) - 1)

levels(dat$condition) <- c("Sync", "Task", "No Sonification")

# based on the data (you can see if you comment out the filters below)
# we need to completely exclude
# - Subject Pair 2, No Sonification, Trial 2
# - Subject Pair 3, Sync, Trial 0
# - Subject Pair 4, Task, Trial 1
# And we need to only include partial data for the following:
# - Subject Pair 1, Sync, Trial 3, only include up to 45 seconds
# - Subject Pair 2, Sync, Trial 3, only include up to 60 seconds
# - Subject Pair 5, Sync, Trial 2, only include up to 55 seconds
# - Subject Pair 5, Sync, Trial 4, only include up to 80 seconds
# - Subject Pair 2, Task, Trial 2, only include up to 20 seconds
# - Subject Pair 4, Task, Trial 2, only include up to 65 seconds

# let's remove the above

dat <- dat %>%
  dplyr::filter(
    !(experiment_id == "Subject Pair 2" & condition == "No Sonification" & trial == "Trial 2") &
      !(experiment_id == "Subject Pair 3" & condition == "Sync" & trial == "Trial 0") &
      !(experiment_id == "Subject Pair 4" & condition == "Task" & trial == "Trial 1")
  )

# now let's remove the partial data
dat <- dat %>%
  dplyr::filter(
    !(experiment_id == "Subject Pair 1" & condition == "Sync" & trial == "Trial 3" & trial_elapsed_time > 45) &
      !(experiment_id == "Subject Pair 2" & condition == "Sync" & trial == "Trial 3" & trial_elapsed_time > 60) &
      !(experiment_id == "Subject Pair 5" & condition == "Sync" & trial == "Trial 2" & trial_elapsed_time > 52) &
      !(experiment_id == "Subject Pair 5" & condition == "Sync" & trial == "Trial 4" & trial_elapsed_time > 78) &
      !(experiment_id == "Subject Pair 2" & condition == "Task" & trial == "Trial 2" & trial_elapsed_time > 20) &
      !(experiment_id == "Subject Pair 4" & condition == "Task" & trial == "Trial 2" & trial_elapsed_time > 65)
  )

# Now we just need to reindex the trials so
# - Subject Pair 2, No Sonification, Trial 3 becomes Trial 2
# - Subject Pair 5, Sync, Trial 4 becomes Trial 3
# - Subject Pair 4, Task, Trial 2 becomes Trial 1
# - Subject Pair 4, Task, Trial 3 becomes Trial 2
# - Subject Pair 4, Task, Trial 4 becomes Trial 3
# we need to account for the trial being a factor
# and case_when is fussy so let's use base r
# to update the variables
dat$trial[dat$experiment_id == "Subject Pair 2" & dat$condition == "No Sonification" & dat$trial == "Trial 3"] <- "Trial 2"
dat$trial[dat$experiment_id == "Subject Pair 5" & dat$condition == "Sync" & dat$trial == "Trial 4"] <- "Trial 3"
dat$trial[dat$experiment_id == "Subject Pair 4" & dat$condition == "Task" & dat$trial == "Trial 2"] <- "Trial 1"
dat$trial[dat$experiment_id == "Subject Pair 4" & dat$condition == "Task" & dat$trial == "Trial 3"] <- "Trial 2"
dat$trial[dat$experiment_id == "Subject Pair 4" & dat$condition == "Task" & dat$trial == "Trial 4"] <- "Trial 3"


#### OK THE DATA IS ALL READY TO GO

dat_mt <- mt_import_long(dat,
  xpos_label = "CAR_x",
  ypos_label = "CAR_y",
  zpos_label = "CAR_z",
  timestamps_label = "trial_elapsed_time",
  mt_id_label = "mt_id",
  mt_seq_label = "index")

dat_mt_aligned <- mt_align_start(dat_mt, start = c(0, 0, 0))

# dat_mt_aligned_normalized <- mt_length_normalize(
#     dat_mt_aligned,
#     dimensions = c("xpos", "ypos", "zpos"))

# ln_trajectories

# mt_plot(dat_mt_aligned_normalized,
#   use = "ln_trajectories",
#   x = "timestamps",
#   color = "experiment_id")
grid::current.viewport()
# plt <- mt_plot(dat_mt_aligned,
#   use = "trajectories",
#   x = "timestamps",
#   color = "experiment_id")

# dat_mt_aligned <- mt_measures(dat_mt_aligned)

dat_mt_scaled <- mt_scale_trajectories(
    dat_mt_aligned,
    within_trajectory = TRUE,
    var_names = c("ypos"), prefix = "z_")

trajectories <- mt_reshape(dat_mt_scaled,
        use2_variables = c("trial", "experiment_id", "subj", "condition"),
        aggregate = FALSE, subset = condition == "No Sonification")


plt <- ggplot(
  trajectories,
  aes(x = timestamps, y = z_ypos, color = subj)) +
  geom_path(alpha = 0.6) +
  scale_color_prism("floral") +
  guides(y = "prism_offset_minor") +
  theme_prism(base_size = 16) +
  theme(legend.position = "none") +
  labs(
    y = "Standardized Y Position",
    x = "Time (s)",
    title = "Subject Pair Trajectories: No Sonification") +
  facet_grid(
    rows = vars(trial),
    cols = vars(experiment_id),
    scales = "free_x",
    space = "free_x"
  )

ggsave(
  "docs/figures/mt_trajectories_no_sonification.png",
  plt,
  width = 16,
  height = 9,
  units = "in",
  dpi = 300
)


trajectories <- mt_reshape(dat_mt_scaled,
        use2_variables = c("trial", "experiment_id", "subj", "condition"),
        aggregate = FALSE, subset = condition == "Sync")


plt <- ggplot(
  trajectories,
  aes(x = timestamps, y = z_ypos, color = subj)) +
  geom_path(alpha = 0.6) +
  scale_color_prism("floral") +
  guides(y = "prism_offset_minor") +
  theme_prism(base_size = 16) +
  theme(legend.position = "none") +
  labs(
    y = "Standardized Y Position",
    x = "Time (s)",
    title = "Subject Pair Trajectories: Sync Sonification") +
  facet_grid(
    rows = vars(trial),
    cols = vars(experiment_id),
    scales = "free_x",
    space = "free_x"
  )

ggsave(
  "docs/figures/mt_trajectories_sync_sonification.png",
  plt,
  width = 16,
  height = 9,
  units = "in",
  dpi = 300
)


trajectories <- mt_reshape(dat_mt_scaled,
        use2_variables = c("trial", "experiment_id", "subj", "condition"),
        aggregate = FALSE, subset = condition == "Task")


plt <- ggplot(
  trajectories,
  aes(x = timestamps, y = z_ypos, color = subj)) +
  geom_path(alpha = 0.6) +
  scale_color_prism("floral") +
  guides(y = "prism_offset_minor") +
  theme_prism(base_size = 16) +
  theme(legend.position = "none") +
  labs(
    y = "Standardized Y Position",
    x = "Time (s)",
    title = "Subject Pair Trajectories: Task Sonification") +
  facet_grid(
    rows = vars(trial),
    cols = vars(experiment_id),
    scales = "free_x",
    space = "free_x"
  )

ggsave(
  "docs/figures/mt_trajectories_task_sonification.png",
  plt,
  width = 16,
  height = 9,
  units = "in",
  dpi = 300
)


# now let's save the standardized trajectories

trajectories <- mt_reshape(dat_mt_scaled,
        use2_variables = c("trial", "experiment_id", "subj", "condition"),
        aggregate = FALSE)

# we can remove xpos and zpos, since we are only analyzing one axis
# we also do not need the mt_id, but we will keep the mt_seq (index)
trajectories <- trajectories %>% select(-xpos, -zpos, -mt_id)


save(
  trajectories,
  file = "data/standardized_trajectories.Rda.bz2",
  compress = "bzip2")

# also save as a bzipped tsv for compatibility with other tools
con <- bzfile("data/standardized_trajectories.tsv.bz2")
write_tsv(trajectories, con)