knitr::opts_chunk$set(echo = TRUE, 
                      cache.lazy = FALSE,
                      dev = c("svglite", "pdf", "png"),
                      dpi = 300,
                      fig.path = 'figures/',
                      fig.keep = "high")


#added from: https://github.com/yihui/knitr-examples/blob/master/077-wrap-output.Rmd
library(knitr)
hook_output = knit_hooks$get('output')
knit_hooks$set(output = function(x, options) {
  # this hook is used only when the linewidth option is not NULL
  if (!is.null(n <- options$linewidth)) {
    x = knitr:::split_lines(x)
    # any lines wider than n should be wrapped
    if (any(nchar(x) > n)) x = strwrap(x, width = n)
    x = paste(x, collapse = '\n')
  }
  hook_output(x, options)
})


library(tidyverse) # A collection of packages for data science. More about it on 
                   # www.tidyverse.com
library(magrittr)  # A package that provides pipe operators like %>%
library(lme4)      # A package 
library(glue)      # A package that provides interpolated string functions.
library(latex2exp) # A package that converts latex to plotmath expressions.library(lmerTest)
library(lmerTest)  # A package that improves inference for LMEM.
library(emmeans)   # A package that allows to conduct post-hoc tests.
library(optimx)    # A package that contains additional optimizer. 
library(data.table)
library(glue)
library(mgcv)


ICC_nested <- function(model) {

  nested_terms <-  
    formula(model) %>%
    as.character(.) %>%
    str_extract_all(., "(?<=[|] ?)[[:word:]]+[/][[:word:]]+(?= ?[)])") %>%
    unlist(.) %>%
    na.omit(.) %>%
    as.vector(.) %>%
    str_trim(.)
  
  variances <- 
    as_tibble(VarCorr(model)) %>%
    select(effect    = grp,
           variance  = vcov) 
             

  rpl_effect <- function(x, str) {
  
    x <- str_trim(x)
    
    nested_hyperPar <- 
    strsplit(str, "/", fixed = TRUE)[[1]][1] %>%
    str_trim(.) %>%
    #add regx condition to prevent substring matching:
    paste0(., "($|:)")  
  
    x[grepl(nested_hyperPar, x)] <- str  
  
    return(x)
  }

  variances$effect <-    
    reduce(.x    = nested_terms,
           .f    = rpl_effect,
           .init = variances$effect,
           .dir  = "forward")

  variances %<>%
    group_by(effect) %>%
    summarize(variance = sum(variance, na.rm = TRUE)) %>%
    ungroup() %>%
    mutate(icc      = variance / sum(variance, na.rm = TRUE),
           icc_perc = icc * 100) %>%
    arrange(desc(icc))
  
  return(variances)
}


grid_data <- 
  readRDS("data/reliability_gridsearch_results.rds")


summary(select(grid_data, -system, -accuracy))

 dropout     hidden_size_max hidden_number learning_rate batch_size
 0   :2430   16 :2430        3:4050        0.001:4050    1 :2025   
 0.05:2430   32 :2430        5:4050        0.01 :4050    4 :2025   
 0.1 :2430   64 :2430        7:4050        0.1  :4050    8 :2025   
 0.15:2430   128:2430                                    16:2025   
 0.2 :2430   256:2430                                    32:2025   
                                                         64:2025   
 random_seed  epochs   
 -7712:4050   1 :4050  
 6483 :4050   5 :4050  
 20777:4050   10:4050


summary(select(grid_data, accuracy))

    accuracy     
 Min.   :0.7465  
 1st Qu.:0.7649  
 Median :0.7649  
 Mean   :0.7671  
 3rd Qu.:0.7649  
 Max.   :0.7920


data_plot <-
  grid_data      %>%
  select(-system) %>%
  pivot_longer(cols = !accuracy, 
               names_to = "parameter", 
               values_to = "parameter_value",
               values_transform = list(parameter_value = as.character)) %>%
  group_by(parameter, parameter_value) %>%
  summarize(mean_acc = mean(accuracy),
            sd_acc   = sd(accuracy)) 

ggplot(data = data_plot, 
       aes(y = mean_acc, x = factor(as.numeric(parameter_value)))) +
  theme_bw() + 
  xlab("") +
  ylab("mean accuracy") + 
  facet_wrap(vars(parameter), ncol = 2, scales = "free_x") +
  geom_point(size = .001) +
  geom_pointrange(aes(ymin = mean_acc - sd_acc, 
                      ymax = mean_acc + sd_acc))

`summarise()` has grouped output by 'parameter'. You can override using the `.groups` argument.


mod_form <- 
  #remove seed, so that it is identical with residual
  glue("(1|{names(grid_data)[-c(1,2,9)]})") %>% 
    glue_collapse(., sep = " + ") %>%
    glue("accuracy ~ ", .)

var_decomp <-   
  lmer(as.formula(mod_form), 
       data = grid_data)

#model2 <- 
#  update(var_decomp, ~ . + (1 | hidden_number:hidden_size_max))

Warning message in checkConv(attr(opt, "derivs"), opt$par, ctrl = control$checkConv, :
“Model failed to converge with max|grad| = 0.0131237 (tol = 0.002, component 1)”


ICC_nested(var_decomp)

effect	variance	icc	icc_perc
<chr>	<dbl>	<dbl>	<dbl>
Residual	3.143517e-05	6.115291e-01	61.152911971
hidden_number	1.594349e-05	3.101593e-01	31.015926717
learning_rate	3.184632e-06	6.195275e-02	6.195275409
batch_size	5.152907e-07	1.002429e-02	1.002429095
hidden_size_max	2.614108e-07	5.085398e-03	0.508539795
dropout	6.015225e-08	1.170182e-03	0.117018154
random_seed	4.060346e-09	7.898859e-05	0.007898859

Hyperparamter: Grid Serach from scratch¶