Revision 215dc19479aad7da6918390886e04de4fd2194ca authored by didacvp on 28 December 2020, 12:12:50 UTC, committed by GitHub on 28 December 2020, 12:12:50 UTC
1 parent de18867
Raw File
BrainAgeFull.R
# Positional command-line arguments, in order:
#   1 eta, 2 max_depth, 3 gamma, 4 min_child_weight, 5 nrounds,
#   6 data_folder, 7 sex_split (optional).
args <- commandArgs(trailingOnly = TRUE)

eta <- as.numeric(args[1])
max_depth <- as.numeric(args[2])
gamma <- as.numeric(args[3])
min_child_weight <- as.numeric(args[4])
nrounds <- as.numeric(args[5])
data_folder <- as.character(args[6])

# as.logical() returns NA (it does not raise) when the 7th argument is absent
# or is not a recognised logical string, so wrapping it in try() caught
# nothing and the NA later broke `if (sex_split == T)`. Fall back to FALSE.
sex_split <- as.logical(args[7])
if (is.na(sex_split)) {
  sex_split <- FALSE
}


#' Fit XGBoost age-regression model(s) on the training subjects and save them.
#'
#' Loads "vars.Rda", "All_raw.Rda" and "All_preproc.Rda" from `data_folder`
#' (resolved relative to a fixed project base folder), keeps the rows of `df`
#' whose `eid` is not in `subs.long`, and fits `age` on the `T1w_vars` columns
#' with `xgboost()`. Each fitted booster is saved under the object name `bst`.
#'
#' NOTE(review): `df`, `subs.long` and `T1w_vars` are not defined in this
#' function; presumably they are created by the `load()` calls below. Confirm
#' against the contents of the .Rda files.
#'
#' @param eta,max_depth,gamma,min_child_weight,nrounds Passed unchanged to
#'   `xgboost()`.
#' @param data_folder Folder name, relative to the project base folder, that
#'   holds the input .Rda files and receives the saved model(s).
#' @param sex_split If TRUE, fit one model per distinct value of `df$sex` and
#'   save each as "xgbcv.full<sex>.Rda"; otherwise fit a single model saved as
#'   "xgbcv.full.Rda". Missing, NA or non-logical values are treated as FALSE.
#' @return Called for its side effect of writing model files.
BrainAgeFull <- function(eta, max_depth, gamma, min_child_weight, nrounds, data_folder, sex_split) {

  # Normalise the flag to a single TRUE/FALSE. An NA (e.g. from an absent
  # command-line argument) used to reach `if (sex_split == T)` and abort.
  sex_split <- if (missing(sex_split)) FALSE else isTRUE(as.logical(sex_split))

  basefolder <- "/cluster/projects/p274/projects/p024-modes_of_variation"
  data_folder <- file.path(basefolder, data_folder)

  list.of.packages <- c("dplyr", "xgboost", "caret")
  new.packages <- list.of.packages[!(list.of.packages %in% installed.packages()[, "Package"])]
  if (length(new.packages) > 0) {
    install.packages(new.packages, repos = "file://tsd/shared/R/cran")
  }
  # library() stops when a package cannot be attached; require() only returned
  # FALSE, deferring the failure to the first use of `%>%` or xgboost().
  for (pkg in list.of.packages) {
    library(pkg, character.only = TRUE)
  }

  load(file.path(data_folder, "vars.Rda"))
  load(file.path(data_folder, "All_raw.Rda"))
  load(file.path(data_folder, "All_preproc.Rda"))

  # Build one training set per model, together with the suffix that goes into
  # its output file name. Keying by the sex code itself (instead of using
  # code + 1 as a list index) avoids NULL slots when the codes are not 0/1;
  # for 0/1 coding the resulting file names are unchanged.
  if (sex_split) {
    sex_codes <- sort(unique(df$sex))
    train_sets <- lapply(sex_codes, function(code) {
      df %>% filter(!eid %in% subs.long & sex == code)
    })
    suffixes <- as.character(sex_codes)
  } else {
    train_sets <- list(df %>% filter(!eid %in% subs.long))
    suffixes <- ""
  }

  for (i in seq_along(train_sets)) {
    # drop = FALSE keeps a (named) column even if T1w_vars has length one.
    features <- as.matrix(train_sets[[i]][, T1w_vars, drop = FALSE])
    ages <- as.matrix(train_sets[[i]]$age)

    # The object must stay named `bst`: save() stores it under that name.
    bst <- xgboost(data = features,   # cth + subcortical volumes
                   objective = "reg:squarederror",
                   label = ages,      # fit age
                   eta = eta,
                   max_depth = max_depth,
                   gamma = gamma,
                   min_child_weight = min_child_weight,
                   nrounds = nrounds,
                   nthread = 5,
                   verbose = 0)

    save(bst, file = file.path(data_folder, paste0("xgbcv.full", suffixes[i], ".Rda")))
  }
}

# Run the fit with the values parsed from the command line.
BrainAgeFull(
  eta = eta,
  max_depth = max_depth,
  gamma = gamma,
  min_child_weight = min_child_weight,
  nrounds = nrounds,
  data_folder = data_folder,
  sex_split = sex_split
)
back to top