1 Arrange folders, sort files, read and merge

1.1 Create folders by conditions, copy files to them

# !!!!EVAL = FALSE
##################### Read file names ##################################################################################
file_names <- dir(pattern = "\\.xls$")
## if above isn't good enough try the following:
# file_names <- list.files(wd)
# file_names <- sop_files[!file.info(sop_files)$isdir]   # exclude directories
# file_names <- sop_files[grep(".xls", sop_files, fixed = TRUE)]


##################### Create folders with Condition names ###############################################################
# this part of script may be re-run if files from wd are updated
dir_names <- c("Unic_CTRL_Instr", "Unic_CTRL_Solo", "Unic_OGL_Instr", "Unic_OGL_Solo",
              "Repetat_CTRL_Instr", "Repetat_CTRL_Solo", "Repetat_OGL_Instr", "Repetat_OGL_Solo")
             
for(dir in dir_names){
  if(!dir.exists(file.path(wd, dir)))
  dir.create(file.path(wd, dir), showWarnings = FALSE)
}


##################### Use file names to sort them to folders ############################################################
sort_files_to_dirs <- function(wd, pattern, dir) {
  check_pattern <- outer(file_names, pattern, stringr::str_detect)               # if all TRUE bye row then it has full pattern
  index <- which(apply(check_pattern, 1, function(x) all(x==TRUE)))              # get index of file_names where all are TRUE
  sorted_files <- file_names[index]                                              # get names of files from indexes
  
  for(files in sorted_files) {                                                   # copy the files to corresponding folder
    file.copy(from = file.path(wd, files), to = file.path(wd, dir))
  }  
}

sort_files_to_dirs(wd = wd, pattern = c("unic", "ecran", "instructor"), dir = "Unic_CTRL_Instr")
sort_files_to_dirs(wd = wd, pattern = c("unic", "ecran", "solo"), dir = "Unic_CTRL_Solo")
sort_files_to_dirs(wd = wd, pattern = c("unic", "oglinda", "instructor"), dir = "Unic_OGL_Instr")
sort_files_to_dirs(wd = wd, pattern = c("unic", "oglinda", "solo"), dir = "Unic_OGL_Solo")

1.2 Reading the data

############ Read in all the .xls from folders and merge them in datasets named after corresponding folder ##############
# this part of script may be re-run if files from wd are updated
# RE-RUN FROM HERE IF FOLDERS AND SORTING WAS ALREADY DONE
wd <- "C:/Users/Mihai/Desktop/EEG_O.4c_1/O.4c - Poster/Date Studiu"
setwd(wd)
The working directory was changed to C:/Users/Mihai/Desktop/EEG_O.4c_1/O.4c - Poster/Date Studiu inside a notebook chunk. The working directory will be reset when the chunk is finished running. Use the knitr root.dir option in the setup chunk to change the working directory for notebook chunks.
folders <- list.files(wd)
folders <- folders[file.info(folders)$isdir]   # luam doar folderele
datasetnames <- NULL
for (i in 1:length(folders)) {
  datasetname <- folders[i]
  datasetnames <- c(datasetnames, datasetname)
  current_dir <- setwd(file.path(wd, folders[i]))
  print(paste0("current_dir: ", current_dir))
  
  paths <- dir(pattern = "\\.xls$")
  names(paths) <- basename(paths)
  assign( paste(datasetname), plyr::ldply(paths, rio::import) )
}
[1] "current_dir: C:/Users/Mihai/Desktop/EEG_O.4c_1/O.4c - Poster/Date Studiu"
[1] "current_dir: C:/Users/Mihai/Desktop/EEG_O.4c_1/O.4c - Poster/Date Studiu/Unic_CTRL_Instr"
[1] "current_dir: C:/Users/Mihai/Desktop/EEG_O.4c_1/O.4c - Poster/Date Studiu/Unic_CTRL_Solo"
[1] "current_dir: C:/Users/Mihai/Desktop/EEG_O.4c_1/O.4c - Poster/Date Studiu/Unic_OGL_Instr"
setwd(wd)
# detach("package:plyr", unload=TRUE)                                                   # detach plyr because of conflicts with dplyr

1.3 Cleaning the data

#################################### Data Cleaning #####################################################################
# Check if ids have > 1 row of data (empty .xls have only 1 row)
# Careful! This function modfies the datasets in the global envinronment
delete_empty_id <- function(df){
  list_empty_id <- 
    df %>%
    dplyr::group_by(.id) %>%
    dplyr::summarise(row_count = n()) %>%
    dplyr::rename("empty_id" = .id) %>%
    mutate(delete_id = if_else(row_count < 3, TRUE, FALSE)) %>%
    filter(delete_id == TRUE)
  
  df_modif <- 
    df %>%
    filter(!.id %in% list_empty_id$empty_id)
  
  if(!identical(df, df_modif)){
    df <- deparse(substitute(df))
    cat("Deleting from ", print(as.name(df))); print(list_empty_id)                    # print out which ids are deleted from which dataset
    assign(df, df_modif, envir = globalenv())                                          # assign modified df to original dataset from Global
  }else cat("No empty datasets. Nothing to delete")
}
# Apply function to all datasets (tricky to do in for loop because of super assignment)
delete_empty_id(Unic_CTRL_Instr)
No empty datasets. Nothing to delete
delete_empty_id(Unic_CTRL_Solo)
No empty datasets. Nothing to delete
delete_empty_id(Unic_OGL_Instr)
No empty datasets. Nothing to delete
delete_empty_id(Unic_OGL_Solo)
No empty datasets. Nothing to delete

1.4 Exclude SAM_resp based on RT outliers

# !!!!EVAL = FALSE
############################### Exclude Outliers based on RT (by subject and stimulus type) #######################################
## DONT RUN (unless it is needed) ----> eval=FALSE
# Exclude RT outliers (=- 2SD) - instead of simple filter, makeing them NA  is better for paired comparison
remove_outliers <- function(df) {
  df_modif <-
    df %>%
    dplyr::group_by(.id, `Stimulus type`) %>%                  # we could have done before:  dplyr::rename("Stim_type" = `Stimulus type`) 
    mutate(SAM_Resp = if_else(abs(SAM_RT - mean(SAM_RT, na.rm=TRUE)) > 2*sd(SAM_RT, na.rm=TRUE), as.numeric(NA), SAM_Resp))
  
  if(!identical(df, df_modif)){
    df <- deparse(substitute(df))
    cat("Deleting outliers from ", print(as.name(df)));                               # print out datasets which have been modified
    assign(df, df_modif, envir = globalenv())                                          # assign modified df to original dataset from Global
  }else cat("No outlier")
}

remove_outliers(Unic_CTRL_Instr)
remove_outliers(Unic_CTRL_Solo)
remove_outliers(Unic_OGL_Instr)
remove_outliers(Unic_OGL_Solo)

1.5 Test if datasets have same columns

unic_df_obj <- mget(c("Unic_CTRL_Instr", "Unic_CTRL_Solo", "Unic_OGL_Instr", "Unic_OGL_Solo"))
unic_df_obj <-lapply(unic_df_obj, colnames)
outer(unic_df_obj, unic_df_obj, Vectorize(identical))                           # if all are TRUE, all df have same columns
                Unic_CTRL_Instr Unic_CTRL_Solo Unic_OGL_Instr Unic_OGL_Solo
Unic_CTRL_Instr            TRUE           TRUE           TRUE          TRUE
Unic_CTRL_Solo             TRUE           TRUE           TRUE          TRUE
Unic_OGL_Instr             TRUE           TRUE           TRUE          TRUE
Unic_OGL_Solo              TRUE           TRUE           TRUE          TRUE



2 Analysis - UNICE

2.1 Descriptives

##########################################################################################################################
#################################### Analyses - UNICE ####################################################################
## Descriptives by condition dataset
descriptive_func <- function(df, Stim_type, By_ID = FALSE){
  df_name <- deparse(substitute(df))
  suppressWarnings({                                                                # if all NAs in SAM_Resp, NaNs and Infs will be produced
    df_modif <- 
      df %>%
      dplyr::rename("ID" = .id) %>%
      select_all(~gsub("\\s+|\\.", "_", .)) %>%                                     # replaces blancks with "_" in colnames 
      filter(Stimulus_type == Stim_type)                                            # filter by stimulus type
      
    if(isTRUE(By_ID)){                                                              # if true group by id, if not return descriptives for all ids
      by_id_text <- " by subject"
      df_modif %>%
      dplyr::group_by(ID) %>%
      tidystats::describe_data(SAM_Resp, SAM_RT, na.rm = TRUE) %>%
        knitr::kable(caption = paste(as.name(df_name), " ", Stim_type, by_id_text), format = "pandoc", digits = 2)
    }else{ 
      by_id_text <- " all subjects"
      df_modif %>%
      ungroup() %>%  
      tidystats::describe_data(SAM_Resp, SAM_RT, na.rm = TRUE) %>%
        knitr::kable(caption = paste(as.name(df_name), " ", Stim_type, by_id_text), format = "pandoc", digits = 2)
    }
  })
}  
descriptive_func(df = Unic_CTRL_Instr, Stim_type = "negativ", By_ID = FALSE)           # Negative - General

Unic_CTRL_Instr negativ all subjects
var missing n M SD SE min max range median mode skew kurtosis
SAM_Resp 0 105 2.80 1.50 0.15 1 8.00 7.00 3.00 2.00 0.83 3.49
SAM_RT 0 105 1.89 0.88 0.09 1 4.38 3.38 1.56 2.51 0.99 2.94

descriptive_func(df = Unic_CTRL_Solo, Stim_type = "negativ", By_ID = FALSE)

Unic_CTRL_Solo negativ all subjects
var missing n M SD SE min max range median mode skew kurtosis
SAM_Resp 0 105 3.33 1.75 0.17 1 8.00 7.00 3.00 2.00 0.62 2.56
SAM_RT 0 105 2.53 1.66 0.16 1 10.12 9.12 2.05 1.59 2.25 9.40

descriptive_func(df = Unic_OGL_Instr, Stim_type = "negativ", By_ID = FALSE)

Unic_OGL_Instr negativ all subjects
var missing n M SD SE min max range median mode skew kurtosis
SAM_Resp 0 105 2.80 1.83 0.18 1 8.00 7.00 2.00 2.00 1.11 3.5
SAM_RT 0 105 1.91 0.80 0.08 1 4.54 3.54 1.75 1.42 0.88 3.2

descriptive_func(df = Unic_OGL_Solo, Stim_type = "negativ", By_ID = FALSE)

Unic_OGL_Solo negativ all subjects
var missing n M SD SE min max range median mode skew kurtosis
SAM_Resp 0 105 2.66 1.60 0.16 1 8.00 7.00 2.00 1 1.00 3.60
SAM_RT 0 105 1.91 0.83 0.08 1 5.27 4.27 1.73 1 1.28 5.01

descriptive_func(df = Unic_CTRL_Instr, Stim_type = "negativ", By_ID = TRUE)            # Negative - by id

Unic_CTRL_Instr negativ by subject
var ID missing n M SD SE min max range median mode skew kurtosis
SAM_Resp O4c_2_ID17ecraninstructorunic .xls 0 35 2.23 0.91 0.15 1 4.00 3.00 2.00 2.00 0.25 2.26
SAM_Resp O4c_Run2_ID12ecraninstructorunic .xls 0 35 3.14 1.42 0.24 1 5.00 4.00 3.00 5.00 0.00 1.72
SAM_Resp O4c_Run4_ID10ecraninstructorunic .xls 0 35 3.03 1.87 0.32 1 8.00 7.00 3.00 1.00 0.83 3.03
SAM_RT O4c_2_ID17ecraninstructorunic .xls 0 35 2.84 0.75 0.13 1 4.38 3.38 2.65 2.51 0.04 2.81
SAM_RT O4c_Run2_ID12ecraninstructorunic .xls 0 35 1.43 0.32 0.05 1 2.26 1.26 1.37 1.00 0.69 2.88
SAM_RT O4c_Run4_ID10ecraninstructorunic .xls 0 35 1.40 0.57 0.10 1 3.26 2.26 1.23 1.22 2.15 6.83

descriptive_func(df = Unic_CTRL_Solo, Stim_type = "negativ", By_ID = TRUE)

Unic_CTRL_Solo negativ by subject
var ID missing n M SD SE min max range median mode skew kurtosis
SAM_Resp O4c_Run1_ID12ecransolo unic .xls 0 35 3.69 1.59 0.27 1.00 6.00 5.00 4.00 5.00 -0.19 1.75
SAM_Resp O4c_Run1_ID17ecransolo unic .xls 0 35 3.14 1.68 0.28 1.00 7.00 6.00 3.00 2.00 0.75 2.60
SAM_Resp O4c_Run3_ID10ecransolo unic .xls 0 35 3.17 1.95 0.33 1.00 8.00 7.00 3.00 2.00 1.11 3.36
SAM_RT O4c_Run1_ID12ecransolo unic .xls 0 35 1.79 0.69 0.12 1.00 4.23 3.23 1.56 1.59 1.47 5.65
SAM_RT O4c_Run1_ID17ecransolo unic .xls 0 35 3.48 1.71 0.29 1.18 10.12 8.94 3.24 1.18 1.91 8.09
SAM_RT O4c_Run3_ID10ecransolo unic .xls 0 35 2.31 1.88 0.32 1.00 9.63 8.63 1.65 1.28 2.47 9.08

descriptive_func(df = Unic_OGL_Instr, Stim_type = "negativ", By_ID = TRUE)

Unic_OGL_Instr negativ by subject
var ID missing n M SD SE min max range median mode skew kurtosis
SAM_Resp O4c_3_ID12oglindainstructorunic X.xls 0 35 2.77 1.46 0.25 1.00 5.00 4.00 3.00 1.00 0.23 1.70
SAM_Resp O4c_Run1_ID10oglindainstructorunic .xls 0 35 3.86 2.30 0.39 1.00 8.00 7.00 3.00 2.00 0.38 1.82
SAM_Resp O4c_RunN(modifica N!)_ID1717oglindainstructorunic .xls 0 35 1.77 0.73 0.12 1.00 3.00 2.00 2.00 2.00 0.37 1.98
SAM_RT O4c_3_ID12oglindainstructorunic X.xls 0 35 1.28 0.24 0.04 1.00 1.79 0.79 1.22 1.42 0.89 2.80
SAM_RT O4c_Run1_ID10oglindainstructorunic .xls 0 35 2.00 0.89 0.15 1.00 4.04 3.04 1.78 3.11 0.71 2.47
SAM_RT O4c_RunN(modifica N!)_ID1717oglindainstructorunic .xls 0 35 2.45 0.63 0.11 1.38 4.54 3.17 2.40 2.26 0.91 4.88

descriptive_func(df = Unic_OGL_Solo, Stim_type = "negativ", By_ID = TRUE)

Unic_OGL_Solo negativ by subject
var ID missing n M SD SE min max range median mode skew kurtosis
SAM_Resp O4c_4_ID12oglindasolo unic .xls 0 35 2.91 1.46 0.25 1.00 5.00 4.00 3.00 1.00 -0.02 1.65
SAM_Resp O4c_Run2_ID10oglindasolo unic .xls 0 35 3.34 1.94 0.33 1.00 8.00 7.00 3.00 3.00 0.66 2.62
SAM_Resp O4c_RunN(modifica N!)_ID1717oglindasolo unic .xls 0 35 1.71 0.67 0.11 1.00 3.00 2.00 2.00 2.00 0.38 2.24
SAM_RT O4c_4_ID12oglindasolo unic .xls 0 35 1.35 0.33 0.05 1.00 2.30 1.30 1.28 1.00 1.23 3.79
SAM_RT O4c_Run2_ID10oglindasolo unic .xls 0 35 2.01 1.05 0.18 1.00 5.27 4.27 1.73 1.24 1.42 4.56
SAM_RT O4c_RunN(modifica N!)_ID1717oglindasolo unic .xls 0 35 2.38 0.57 0.10 1.46 3.74 2.28 2.30 3.04 0.19 2.37

descriptive_func(df = Unic_CTRL_Instr, Stim_type = "pozitiv", By_ID = FALSE)           # Positive - General

Unic_CTRL_Instr pozitiv all subjects
var missing n M SD SE min max range median mode skew kurtosis
SAM_Resp 0 105 1.73 0.96 0.09 1 5.00 4.00 1.00 1.00 1.20 3.66
SAM_RT 0 105 1.69 0.70 0.07 1 4.08 3.08 1.39 2.33 1.12 3.51

descriptive_func(df = Unic_CTRL_Solo, Stim_type = "pozitiv", By_ID = FALSE)

Unic_CTRL_Solo pozitiv all subjects
var missing n M SD SE min max range median mode skew kurtosis
SAM_Resp 0 105 2.01 1.27 0.12 1 6.00 5.00 2.00 1.00 1.21 3.71
SAM_RT 0 105 2.13 1.29 0.13 1 9.16 8.16 1.78 1.21 2.52 12.52

descriptive_func(df = Unic_OGL_Instr, Stim_type = "pozitiv", By_ID = FALSE)

Unic_OGL_Instr pozitiv all subjects
var missing n M SD SE min max range median mode skew kurtosis
SAM_Resp 0 105 2.15 1.57 0.15 1 8.00 7.00 2.00 1 1.46 4.49
SAM_RT 0 105 1.85 0.82 0.08 1 5.14 4.14 1.59 1 1.64 6.04

descriptive_func(df = Unic_OGL_Solo, Stim_type = "pozitiv", By_ID = FALSE)

Unic_OGL_Solo pozitiv all subjects
var missing n M SD SE min max range median mode skew kurtosis
SAM_Resp 0 105 2.02 1.26 0.12 1 7.00 6.00 2.00 1.00 1.57 5.56
SAM_RT 0 105 1.84 1.03 0.10 1 6.72 5.71 1.47 1.42 2.25 9.10

descriptive_func(df = Unic_CTRL_Instr, Stim_type = "pozitiv", By_ID = TRUE)            # Positive - by id

Unic_CTRL_Instr pozitiv by subject
var ID missing n M SD SE min max range median mode skew kurtosis
SAM_Resp O4c_2_ID17ecraninstructorunic .xls 0 35 1.69 0.76 0.13 1.00 3.00 2.00 2.00 1.00 0.58 2.00
SAM_Resp O4c_Run2_ID12ecraninstructorunic .xls 0 35 1.00 0.00 0.00 1.00 1.00 0.00 1.00 1.00 NaN NaN
SAM_Resp O4c_Run4_ID10ecraninstructorunic .xls 0 35 2.51 1.04 0.18 1.00 5.00 4.00 2.00 2.00 0.44 2.47
SAM_RT O4c_2_ID17ecraninstructorunic .xls 0 35 2.41 0.59 0.10 1.39 4.08 2.69 2.41 2.33 0.40 3.21
SAM_RT O4c_Run2_ID12ecraninstructorunic .xls 0 35 1.25 0.29 0.05 1.00 2.50 1.50 1.18 1.14 2.48 10.70
SAM_RT O4c_Run4_ID10ecraninstructorunic .xls 0 35 1.41 0.49 0.08 1.00 3.55 2.54 1.27 1.76 2.59 11.43

descriptive_func(df = Unic_CTRL_Solo, Stim_type = "pozitiv", By_ID = TRUE)

Unic_CTRL_Solo pozitiv by subject
var ID missing n M SD SE min max range median mode skew kurtosis
SAM_Resp O4c_Run1_ID12ecransolo unic .xls 0 35 1.00 0.00 0.00 1.00 1.00 0.00 1.00 1.00 NaN NaN
SAM_Resp O4c_Run1_ID17ecransolo unic .xls 0 35 1.94 0.84 0.14 1.00 4.00 3.00 2.00 2.00 0.41 2.29
SAM_Resp O4c_Run3_ID10ecransolo unic .xls 0 35 3.09 1.40 0.24 1.00 6.00 5.00 3.00 2.00 0.30 2.22
SAM_RT O4c_Run1_ID12ecransolo unic .xls 0 35 1.39 0.42 0.07 1.00 2.91 1.91 1.27 1.21 1.83 6.56
SAM_RT O4c_Run1_ID17ecransolo unic .xls 0 35 2.89 0.68 0.12 1.23 4.85 3.61 2.84 2.81 0.71 4.47
SAM_RT O4c_Run3_ID10ecransolo unic .xls 0 35 2.11 1.81 0.31 1.00 9.16 8.16 1.40 2.99 2.67 9.78

descriptive_func(df = Unic_OGL_Instr, Stim_type = "pozitiv", By_ID = TRUE)

Unic_OGL_Instr pozitiv by subject
var ID missing n M SD SE min max range median mode skew kurtosis
SAM_Resp O4c_3_ID12oglindainstructorunic X.xls 0 35 1.29 0.52 0.09 1.00 3.00 2.00 1.00 1.00 1.57 4.56
SAM_Resp O4c_Run1_ID10oglindainstructorunic .xls 0 35 3.86 1.59 0.27 1.00 8.00 7.00 4.00 4.00 0.33 2.85
SAM_Resp O4c_RunN(modifica N!)_ID1717oglindainstructorunic .xls 0 35 1.31 0.47 0.08 1.00 2.00 1.00 1.00 1.00 0.80 1.64
SAM_RT O4c_3_ID12oglindainstructorunic X.xls 0 35 1.29 0.24 0.04 1.00 1.84 0.84 1.20 1.00 0.68 2.48
SAM_RT O4c_Run1_ID10oglindainstructorunic .xls 0 35 2.09 1.07 0.18 1.01 5.14 4.13 1.68 2.79 1.37 4.13
SAM_RT O4c_RunN(modifica N!)_ID1717oglindainstructorunic .xls 0 35 2.17 0.59 0.10 1.27 3.66 2.38 2.11 3.66 0.65 2.83

descriptive_func(df = Unic_OGL_Solo, Stim_type = "pozitiv", By_ID = TRUE)

Unic_OGL_Solo pozitiv by subject
var ID missing n M SD SE min max range median mode skew kurtosis
SAM_Resp O4c_4_ID12oglindasolo unic .xls 0 35 1.34 0.48 0.08 1 2.00 1.00 1.00 1.00 0.66 1.44
SAM_Resp O4c_Run2_ID10oglindasolo unic .xls 0 35 3.23 1.44 0.24 1 7.00 6.00 3.00 4.00 0.50 3.19
SAM_Resp O4c_RunN(modifica N!)_ID1717oglindasolo unic .xls 0 35 1.49 0.51 0.09 1 2.00 1.00 1.00 1.00 0.06 1.00
SAM_RT O4c_4_ID12oglindasolo unic .xls 0 35 1.24 0.43 0.07 1 3.48 2.48 1.14 1.42 4.27 22.86
SAM_RT O4c_Run2_ID10oglindasolo unic .xls 0 35 2.12 1.35 0.23 1 6.72 5.71 1.59 1.21 2.06 6.70
SAM_RT O4c_RunN(modifica N!)_ID1717oglindasolo unic .xls 0 35 2.16 0.83 0.14 1 4.54 3.53 1.98 1.79 0.87 3.30

descriptive_func(df = Unic_CTRL_Instr, Stim_type = "neutru", By_ID = FALSE)           # Neutral - General

Unic_CTRL_Instr neutru all subjects
var missing n M SD SE min max range median mode skew kurtosis
SAM_Resp 0 105 1.43 0.95 0.09 1 5.00 4.00 1.00 1.00 2.51 8.86
SAM_RT 0 105 1.57 0.58 0.06 1 3.47 2.47 1.42 2.12 1.08 3.82

descriptive_func(df = Unic_CTRL_Solo, Stim_type = "neutru", By_ID = FALSE)

Unic_CTRL_Solo neutru all subjects
var missing n M SD SE min max range median mode skew kurtosis
SAM_Resp 0 105 1.54 1.05 0.1 1 5.0 4.0 1.00 1.00 2.01 6.14
SAM_RT 0 105 1.88 0.98 0.1 1 5.9 4.9 1.51 1.61 1.62 5.84

descriptive_func(df = Unic_OGL_Instr, Stim_type = "neutru", By_ID = FALSE)

Unic_OGL_Instr neutru all subjects
var missing n M SD SE min max range median mode skew kurtosis
SAM_Resp 0 105 1.37 0.90 0.09 1 6.00 5.00 1.00 1.00 3.16 13.51
SAM_RT 0 105 1.67 0.62 0.06 1 3.98 2.98 1.57 1.21 1.36 5.02

descriptive_func(df = Unic_OGL_Solo, Stim_type = "neutru", By_ID = FALSE)

Unic_OGL_Solo neutru all subjects
var missing n M SD SE min max range median mode skew kurtosis
SAM_Resp 0 105 1.43 0.91 0.09 1 5.00 4.00 1.00 1.00 2.46 8.81
SAM_RT 0 105 1.56 0.60 0.06 1 3.73 2.73 1.37 1.55 1.33 4.12

descriptive_func(df = Unic_CTRL_Instr, Stim_type = "neutru", By_ID = TRUE)            # Neutral - by id

Unic_CTRL_Instr neutru by subject
var ID missing n M SD SE min max range median mode skew kurtosis
SAM_Resp O4c_2_ID17ecraninstructorunic .xls 0 35 1.23 0.60 0.10 1.0 3.00 2.00 1.00 1.00 2.40 7.17
SAM_Resp O4c_Run2_ID12ecraninstructorunic .xls 0 35 1.03 0.17 0.03 1.0 2.00 1.00 1.00 1.00 5.66 33.03
SAM_Resp O4c_Run4_ID10ecraninstructorunic .xls 0 35 2.03 1.34 0.23 1.0 5.00 4.00 2.00 1.00 1.21 3.29
SAM_RT O4c_2_ID17ecraninstructorunic .xls 0 35 2.17 0.51 0.09 1.3 3.47 2.16 2.13 2.12 0.84 3.42
SAM_RT O4c_Run2_ID12ecraninstructorunic .xls 0 35 1.33 0.35 0.06 1.0 2.09 1.09 1.22 2.09 0.74 2.23
SAM_RT O4c_Run4_ID10ecraninstructorunic .xls 0 35 1.20 0.26 0.04 1.0 1.87 0.87 1.09 1.00 1.47 3.91

descriptive_func(df = Unic_CTRL_Solo, Stim_type = "neutru", By_ID = TRUE)

Unic_CTRL_Solo neutru by subject
var ID missing n M SD SE min max range median mode skew kurtosis
SAM_Resp O4c_Run1_ID12ecransolo unic .xls 0 35 1.09 0.51 0.09 1.00 4.00 3.00 1.00 1.00 5.66 33.03
SAM_Resp O4c_Run1_ID17ecransolo unic .xls 0 35 1.49 0.98 0.17 1.00 5.00 4.00 1.00 1.00 2.12 6.86
SAM_Resp O4c_Run3_ID10ecransolo unic .xls 0 35 2.06 1.28 0.22 1.00 5.00 4.00 2.00 1.00 1.08 3.11
SAM_RT O4c_Run1_ID12ecransolo unic .xls 0 35 1.36 0.55 0.09 1.00 3.53 2.53 1.18 1.61 2.47 9.05
SAM_RT O4c_Run1_ID17ecransolo unic .xls 0 35 2.54 0.90 0.15 1.46 5.03 3.57 2.34 2.71 1.30 4.16
SAM_RT O4c_Run3_ID10ecransolo unic .xls 0 35 1.75 1.05 0.18 1.00 5.90 4.90 1.35 1.45 2.22 8.35

descriptive_func(df = Unic_OGL_Instr, Stim_type = "neutru", By_ID = TRUE)

Unic_OGL_Instr neutru by subject
var ID missing n M SD SE min max range median mode skew kurtosis
SAM_Resp O4c_3_ID12oglindainstructorunic X.xls 0 35 1.17 0.57 0.10 1.00 4.00 3.00 1.00 1.00 3.94 19.03
SAM_Resp O4c_Run1_ID10oglindainstructorunic .xls 0 35 1.80 1.32 0.22 1.00 6.00 5.00 1.00 1.00 1.84 5.49
SAM_Resp O4c_RunN(modifica N!)_ID1717oglindainstructorunic .xls 0 35 1.14 0.36 0.06 1.00 2.00 1.00 1.00 1.00 2.04 5.17
SAM_RT O4c_3_ID12oglindainstructorunic X.xls 0 35 1.25 0.23 0.04 1.00 1.83 0.83 1.22 1.21 0.80 2.74
SAM_RT O4c_Run1_ID10oglindainstructorunic .xls 0 35 1.90 0.73 0.12 1.00 3.98 2.98 1.71 3.98 0.93 3.43
SAM_RT O4c_RunN(modifica N!)_ID1717oglindainstructorunic .xls 0 35 1.86 0.56 0.09 1.05 3.75 2.70 1.84 2.87 1.09 5.12

descriptive_func(df = Unic_OGL_Solo, Stim_type = "neutru", By_ID = TRUE)
Unic_OGL_Solo neutru by subject
var ID missing n M SD SE min max range median mode skew kurtosis
SAM_Resp O4c_4_ID12oglindasolo unic .xls 0 35 1.20 0.41 0.07 1.00 2.00 1.00 1.00 1.00 1.50 3.25
SAM_Resp O4c_Run2_ID10oglindasolo unic .xls 0 35 1.94 1.33 0.22 1.00 5.00 4.00 1.00 1.00 1.18 3.12
SAM_Resp O4c_RunN(modifica N!)_ID1717oglindasolo unic .xls 0 35 1.14 0.43 0.07 1.00 3.00 2.00 1.00 1.00 3.08 11.98
SAM_RT O4c_4_ID12oglindasolo unic .xls 0 35 1.20 0.20 0.03 1.00 1.57 0.56 1.15 1.55 0.64 1.91
SAM_RT O4c_Run2_ID10oglindasolo unic .xls 0 35 1.77 0.78 0.13 1.00 3.73 2.73 1.38 1.95 0.82 2.43
SAM_RT O4c_RunN(modifica N!)_ID1717oglindasolo unic .xls 0 35 1.71 0.52 0.09 1.04 2.83 1.80 1.68 1.22 0.55 2.39

2.2 Merge

############################## Merge condition dataset ############################################################
# Must first rename .id to ID in oder to have .id for df names
ID_rename <- function(df){
  if(".id" %in% colnames(df)) {
    df_modif <- 
      df %>%
      dplyr::rename("ID" = .id)
    df <- deparse(substitute(df))
    cat("Changed .id to ID for: ", as.name(df))
    assign(df, df_modif, envir = globalenv())
  }  
}
ID_rename(Unic_CTRL_Instr)
Changed .id to ID for:  Unic_CTRL_Instr
ID_rename(Unic_CTRL_Solo)
Changed .id to ID for:  Unic_CTRL_Solo
ID_rename(Unic_OGL_Instr)
Changed .id to ID for:  Unic_OGL_Instr
ID_rename(Unic_OGL_Solo)
Changed .id to ID for:  Unic_OGL_Solo
# Merge into one df
list_df_merge <- list(Unic_CTRL_Instr, Unic_CTRL_Solo, Unic_OGL_Instr, Unic_OGL_Solo)
names(list_df_merge) <- c("Unic_CTRL_Instr", "Unic_CTRL_Solo", "Unic_OGL_Instr", "Unic_OGL_Solo")
Unic_merged <- plyr::ldply(list_df_merge, data.frame)                    # also works for this job bind_rows(list_df_merge, .id = "column_label")

2.3 Analyses on merged (Anova & post-hoc)

############################## Analyses on Merged ################################################################
## Just a Test 
  # Unic_merged_spread_Neg <- 
  #   Unic_merged %>%
  #   filter(!is.na(SAM_Resp)) %>%                                           # some files had only NA on SAM_Resp and SAM_RT
  #   select(.id, ID, Subj_id, 
  #          Stimuli.order, MarkerStimuli, Stimulus.type, 
  #          SAM_Resp, SAM_RT) %>%
  #   filter(Stimulus.type == "negativ") %>%                                 # dont forget to pick stymulus type
  #   spread(.id, SAM_Resp)
  # 
  # t.test(Unic_merged_spread_Neg$Unic_CTRL_Instr, Unic_merged_spread_Neg$Unic_CTRL_Solo, na.rm = TRUE)
  # t.test(Unic_merged_spread_Neg$Unic_OGL_Instr, Unic_merged_spread_Neg$Unic_OGL_Solo, na.rm = TRUE)
  # t.test(Unic_merged_spread_Neg$Unic_OGL_Instr, Unic_merged_spread_Neg$Unic_CTRL_Instr, na.rm = TRUE)
  # t.test(Unic_merged_spread_Neg$Unic_OGL_Solo, Unic_merged_spread_Neg$Unic_CTRL_Solo, na.rm = TRUE)
## Function prepair data for analyses
prepaire_merged_func <- function(Stim_type){
  Unic_merged %>%
    filter(!is.na(SAM_Resp)) %>%                                           # some files had only NA on SAM_Resp and SAM_RT
    select(.id, ID, Subj_id, 
           Stimuli.order, MarkerStimuli, Stimulus.type, 
           SAM_Resp, SAM_RT) %>%
    dplyr::rename(Cond = .id) %>% 
    filter(Stimulus.type == Stim_type) %>%                                 # dont forget to pick stymulus type
    mutate(Cond = as.factor(Cond))                                         # tunr to factor for aov family functions
}
Unic_merged_Neg <- prepaire_merged_func("negativ")
Unic_merged_Neu <- prepaire_merged_func("neutru")
Unic_merged_Poz <- prepaire_merged_func("pozitiv")
## Anova and Post-Hoc  - NEGATIV
# Stimulus type
cat("### Negativ")

2.3.1 Negativ

# Normality
cat("#### Normality Test")

2.3.1.1 Normality Test

Unic_merged_Neg %>%
  select(SAM_Resp) %>%                                                     # must select variables outside function 
  tadaatoolbox::tadaa_normtest(method = "shapiro")                         # , print = "markdown"  for Notebook
# Levene Test (p>.05 = homogeneity of variances)
cat("#### Levene Test")

2.3.1.2 Levene Test

Unic_merged_Neg %>%
  tadaatoolbox::tadaa_levene(data = ., SAM_Resp ~ Cond)                    # , print = "markdown"  for Notebook
# Anova
cat("#### Anova")

2.3.1.3 Anova

Unic_merged_Neg %>%
  #do(broom::glance(aov(.$SAM_Resp ~ .$Cond)))                             # regular anova do(broom::tidy(aov(.$SAM_Resp ~ .$Cond)))
  tadaatoolbox::tadaa_aov(data = ., SAM_Resp ~ Cond, type = 1)             # , print = "markdown"  for Notebook
# Post-Hoc 
cat("#### Post-Hoc Games Howell")

2.3.1.4 Post-Hoc Games Howell

Unic_merged_Neg %>%
  # Tukey for equal variance 
  tadaatoolbox::tadaa_pairwise_tukey(data = ., SAM_Resp, Cond)             # , print = "markdown"  for Notebook
  # Games Howell does not assume equal variances
  #tadaatoolbox::tadaa_pairwise_gh(data = ., SAM_Resp, Cond)                # , print = "markdown"  for Notebook
## Anova and Post-Hoc  - NEUTRU
# Stimulus type
cat("### Neutru")

2.3.2 Neutru

# Normality
cat("#### Normality Test")

2.3.2.1 Normality Test

Unic_merged_Neu %>%
  select(SAM_Resp) %>%                                                     # must select variables outside function 
  tadaatoolbox::tadaa_normtest(method = "shapiro")                         # , print = "markdown"  for Notebook
# Levene Test (p>.05 = homogeneity of variances)
cat("#### Levene Test")

2.3.2.2 Levene Test

Unic_merged_Neu %>%
  tadaatoolbox::tadaa_levene(data = ., SAM_Resp ~ Cond)                    # , print = "markdown"  for Notebook
# Anova
cat("#### Anova")

2.3.2.3 Anova

Unic_merged_Neu %>%
  #do(broom::glance(aov(.$SAM_Resp ~ .$Cond)))                             # regular anova do(broom::tidy(aov(.$SAM_Resp ~ .$Cond)))
  tadaatoolbox::tadaa_aov(data = ., SAM_Resp ~ Cond, type = 1)             # , print = "markdown"  for Notebook
# Post-Hoc 
cat("#### Post-Hoc Games Howell")

2.3.2.4 Post-Hoc Games Howell

Unic_merged_Neu %>%
  # Tukey for equal variance 
  tadaatoolbox::tadaa_pairwise_tukey(data = ., SAM_Resp, Cond)             # , print = "markdown"  for Notebook
  # Games Howell does not assume equal variances
  #tadaatoolbox::tadaa_pairwise_gh(data = ., SAM_Resp, Cond)                # , print = "markdown"  for Notebook
## Anova and Post-Hoc  - POZITIV
# Stimulus type
cat("### Pozitiv")

2.3.3 Pozitiv

# Normality
cat("#### Normality Test")

2.3.3.1 Normality Test

Unic_merged_Poz %>%
  select(SAM_Resp) %>%                                                     # must select variables outside function 
  tadaatoolbox::tadaa_normtest(method = "shapiro")                         # , print = "markdown"  for Notebook
# Levene Test (p>.05 = homogeneity of variances)
cat("#### Levene Test")

2.3.3.2 Levene Test

Unic_merged_Poz %>%
  tadaatoolbox::tadaa_levene(data = ., SAM_Resp ~ Cond)                    # , print = "markdown"  for Notebook
# Anova
cat("#### Anova")

2.3.3.3 Anova

Unic_merged_Poz %>%
  #do(broom::glance(aov(.$SAM_Resp ~ .$Cond)))                             # regular anova do(broom::tidy(aov(.$SAM_Resp ~ .$Cond)))
  tadaatoolbox::tadaa_aov(data = ., SAM_Resp ~ Cond, type = 1)             # , print = "markdown"  for Notebook
# Post-Hoc 
cat("#### Post-Hoc Games Howell")

2.3.3.4 Post-Hoc Games Howell

Unic_merged_Poz %>%
  # Tukey for equal variance 
  tadaatoolbox::tadaa_pairwise_tukey(data = ., SAM_Resp, Cond)             # , print = "markdown"  for Notebook
  # Games Howell does not assume equal variances
  #tadaatoolbox::tadaa_pairwise_gh(data = ., SAM_Resp, Cond)                # , print = "markdown"  for Notebook

2.4 Plots with p values

# by dataset
ggplot(Unic_merged, aes(x = Stimulus.type, y = SAM_Resp)) +
  geom_boxplot() +
  stat_summary(fun.data = mean_se,  colour = "darkred") +
  xlab("") +
  facet_wrap(~.id) +
  ggpubr::stat_compare_means(method = "t.test", 
                             label = "p.signif",                                         # to avoid scientific notation of very small p-values
                             #paired = TRUE, 
                             comparisons = list(c("negativ", "neutru"),
                                                c("neutru", "pozitiv"),
                                                c("negativ", "pozitiv")))  

# by Stimulus type
ggplot(Unic_merged, aes(x = .id, y = SAM_Resp)) +
  geom_boxplot() +
  stat_summary(fun.data = mean_se,  colour = "darkred") +
  xlab("") +
  theme(axis.text.x = element_text(angle = 90, hjust = 1)) +
  facet_wrap(~Stimulus.type) +
  ggpubr::stat_compare_means(method = "t.test",
                             label = "p.format",                                         # formated p-values
                             #paired = TRUE, 
                             comparisons = list(c("Unic_CTRL_Instr", "Unic_CTRL_Solo"),
                                                c("Unic_CTRL_Instr", "Unic_OGL_Instr"),
                                                c("Unic_CTRL_Solo", "Unic_OGL_Instr"),
                                                c("Unic_CTRL_Solo", "Unic_OGL_Solo"),
                                                c("Unic_OGL_Instr", "Unic_OGL_Solo"),
                                                c("Unic_CTRL_Instr", "Unic_OGL_Solo"))) 

# drop to CTRL vs OGL - by Stimulus type
Unic_merged %>%
  mutate(.id = case_when(.id %in% c("Unic_CTRL_Instr", "Unic_CTRL_Solo") ~ "Unic_CTRL",
                         .id %in% c("Unic_OGL_Instr", "Unic_OGL_Solo") ~ "Unic_OGL",
                         TRUE ~ as.character(.id))) %>%
    ggplot(aes(x = .id, y = SAM_Resp)) +
    geom_boxplot() +
    stat_summary(fun.data = mean_se,  colour = "darkred") +
    xlab("") +
    theme(axis.text.x = element_text(angle = 90, hjust = 1)) +
    facet_wrap(~Stimulus.type) +
    ggpubr::stat_compare_means(method = "t.test",
                               label = "p.format",                                         # formated p-values
                               #paired = TRUE, 
                               comparisons = list(c("Unic_CTRL", "Unic_OGL")))          

# drop to Instr vs Solo - by Stimulus type
Unic_merged %>%
  mutate(.id = case_when(.id %in% c("Unic_CTRL_Instr", "Unic_OGL_Instr") ~ "Unic_Instr",
                         .id %in% c("Unic_CTRL_Solo", "Unic_OGL_Solo") ~ "Unic_Solo",
                         TRUE ~ as.character(.id))) %>%
    ggplot(aes(x = .id, y = SAM_Resp)) +
    geom_boxplot() +
    stat_summary(fun.data = mean_se,  colour = "darkred") +
    xlab("") +
    theme(axis.text.x = element_text(angle = 90, hjust = 1)) +
    facet_wrap(~Stimulus.type) +
    ggpubr::stat_compare_means(method = "t.test",
                               label = "p.format",                                         # formated p-values
                               #paired = TRUE, 
                               comparisons = list(c("Unic_Instr", "Unic_Solo"))) 

3 Download Data

Unic_merged %>% 
    select(-c(3:10)) %>%
    DT::datatable(                                  # excel downloadable  DT table
      extensions = 'Buttons',
      options = list(pageLength = 20,
                     scrollX='500px', 
                     dom = 'Bfrtip', 
                     buttons = c('excel', "csv")))


4 Session Info

R version 3.5.2 (2018-12-20)
Platform: x86_64-w64-mingw32/x64 (64-bit)
Running under: Windows >= 8 x64 (build 9200)

Matrix products: default

locale:
[1] LC_COLLATE=Romanian_Romania.1250  LC_CTYPE=Romanian_Romania.1250    LC_MONETARY=Romanian_Romania.1250 LC_NUMERIC=C                     
[5] LC_TIME=Romanian_Romania.1250    

attached base packages:
[1] stats     graphics  grDevices utils     datasets  methods   base     

other attached packages:
 [1] bindrcpp_0.2.2     plyr_1.8.4         summarytools_0.9.3 DT_0.5             ggpubr_0.2         magrittr_1.5       broom_0.5.1       
 [8] papaja_0.1.0.9842  psych_1.8.10       forcats_0.3.0      stringr_1.3.1      dplyr_0.7.8        purrr_0.2.5        readr_1.3.0       
[15] tidyr_0.8.2        tibble_1.4.2       ggplot2_3.1.0      tidyverse_1.2.1    pacman_0.5.0      

loaded via a namespace (and not attached):
 [1] nlme_3.1-137        matrixStats_0.54.0  bitops_1.0-6        lubridate_1.7.4     httr_1.4.0          tools_3.5.2         backports_1.1.3    
 [8] tidystats_0.3       R6_2.3.0            nortest_1.0-4       lazyeval_0.2.1      colorspace_1.3-2    withr_2.1.2         tidyselect_0.2.5   
[15] gridExtra_2.3       mnormt_1.5-5        pixiedust_0.8.6     curl_3.2            compiler_3.5.2      tadaatoolbox_0.16.1 cli_1.0.1          
[22] rvest_0.3.2         expm_0.999-3        xml2_1.2.0          labeling_0.3        checkmate_1.8.5     scales_1.0.0        mvtnorm_1.0-10     
[29] digest_0.6.18       foreign_0.8-71      rmarkdown_1.11      rio_0.5.16          base64enc_0.1-3     pkgconfig_2.0.2     htmltools_0.3.6    
[36] manipulate_1.0.1    highr_0.7           pwr_1.2-2           htmlwidgets_1.3     rlang_0.3.1         readxl_1.1.0        pryr_0.1.4         
[43] rstudioapi_0.8      shiny_1.2.0         bindr_0.1.1         generics_0.0.2      jsonlite_1.6        crosstalk_1.0.0     zip_1.0.0          
[50] car_3.0-2           RCurl_1.95-4.11     rapportools_1.0     Matrix_1.2-15       Rcpp_1.0.0          DescTools_0.99.27   munsell_0.5.0      
[57] abind_1.4-5         viridis_0.5.1       stringi_1.2.4       yaml_2.2.0          carData_3.0-2       MASS_7.3-51.1       grid_3.5.2         
[64] parallel_3.5.2      promises_1.0.1      crayon_1.3.4        lattice_0.20-38     haven_2.1.0         pander_0.6.3        hms_0.4.2          
[71] magick_2.0          knitr_1.21          pillar_1.3.1        tcltk_3.5.2         boot_1.3-20         ggsignif_0.4.0      codetools_0.2-15   
[78] glue_1.3.0          evaluate_0.12       data.table_1.12.2   modelr_0.1.2        httpuv_1.4.5        cellranger_1.1.0    gtable_0.2.0       
[85] assertthat_0.2.0    xfun_0.4            openxlsx_4.1.0      mime_0.6            xtable_1.8-3        later_0.7.5         viridisLite_0.3.0  
 

A work by Claudiu Papasteri

claudiu.papasteri@gmail.com

 

---
title: "<br> O.4 - UCL Poster" 
subtitle: "Preliminary Report for Unice - 3 Study Participants"
author: "<br> Claudiu Papasteri"
date: "`r format(Sys.time(), '%d %m %Y')`"
output: 
    html_notebook:
            code_folding: hide
            toc: true
            toc_depth: 2
            number_sections: true
            theme: spacelab
            highlight: tango
            font-family: Arial
            fig_width: 10
            fig_height: 9
    pdf_document: 
            toc: true
            toc_depth: 2
            number_sections: true
            # fontsize: 11pt
            # geometry: margin=1in
            # fig_width: 7
            # fig_height: 6
            # fig_caption: true
    # github_document: 
            # toc: true
            # toc_depth: 2
            # html_preview: false
            # fig_width: 5
            # fig_height: 5
            # dev: jpeg
---


<!-- Setup -->


```{r setup, include=FALSE}
# kintr options
knitr::opts_chunk$set(
  comment = "#",
  collapse = TRUE,
  echo = TRUE, warning = TRUE, message = TRUE, cache = TRUE       # echo = False for github_document, but will be folded in html_notebook
)

# General R options and info
set.seed(111)               # in case we use randomized procedures       
options(scipen = 999)       # positive values bias towards fixed and negative towards scientific notation

# Load packages
if (!require("pacman")) install.packages("pacman")
packages <- c(
  "tidyverse",      # best thing that happend to me
  "psych",          # general purpose toolbox for personality, psychometric theory and experimental psychology
  "papaja",         # for APA style
  "broom",          # for tidy modelling
  "ggplot2",        # best plots
  "ggpubr",         # ggplot2 to publication quality
  "DT",             # nice searchable and downloadable tables
  "summarytools",
  "plyr", 
  "stringr"
  # , ...
)
if (!require("pacman")) install.packages("pacman")
pacman::p_load(char = packages)

# Themes for ggplot2 ploting (here used APA style)
theme_set(theme_apa())
```

```{r working_directory, include = FALSE}
### O.4 R code - Unice and Retatate
### R code for sorting, integrating and analyses 
# Task output files: 
# ID, experimental condition ("oglinda" / "ecran"), condition ("instructor", "solo"), type of task ("unic", "repetat")
wd <- "C:/Users/Mihai/Desktop/EEG_O.4c_1/O.4c - Poster"
setwd(wd)
```


<!-- Report -->


# Arrange folders, sort files, read and merge

## Create folders by conditions, copy files to them

```{r makedir_sortfiles, eval=FALSE}
# !!!!EVAL = FALSE
##################### Read file names ##################################################################################
file_names <- dir(pattern = "\\.xls$")
## if above isn't good enough try the following:
# file_names <- list.files(wd)
# file_names <- sop_files[!file.info(sop_files)$isdir]   # exclude directories
# file_names <- sop_files[grep(".xls", sop_files, fixed = TRUE)]


##################### Create folders with Condition names ###############################################################
# this part of script may be re-run if files from wd are updated
dir_names <- c("Unic_CTRL_Instr", "Unic_CTRL_Solo", "Unic_OGL_Instr", "Unic_OGL_Solo",
              "Repetat_CTRL_Instr", "Repetat_CTRL_Solo", "Repetat_OGL_Instr", "Repetat_OGL_Solo")
             
for(dir in dir_names){
  if(!dir.exists(file.path(wd, dir)))
  dir.create(file.path(wd, dir), showWarnings = FALSE)
}


##################### Use file names to sort them to folders ############################################################
sort_files_to_dirs <- function(wd, pattern, dir) {
  check_pattern <- outer(file_names, pattern, stringr::str_detect)               # if all TRUE bye row then it has full pattern
  index <- which(apply(check_pattern, 1, function(x) all(x==TRUE)))              # get index of file_names where all are TRUE
  sorted_files <- file_names[index]                                              # get names of files from indexes
  
  for(files in sorted_files) {                                                   # copy the files to corresponding folder
    file.copy(from = file.path(wd, files), to = file.path(wd, dir))
  }  
}

sort_files_to_dirs(wd = wd, pattern = c("unic", "ecran", "instructor"), dir = "Unic_CTRL_Instr")
sort_files_to_dirs(wd = wd, pattern = c("unic", "ecran", "solo"), dir = "Unic_CTRL_Solo")
sort_files_to_dirs(wd = wd, pattern = c("unic", "oglinda", "instructor"), dir = "Unic_OGL_Instr")
sort_files_to_dirs(wd = wd, pattern = c("unic", "oglinda", "solo"), dir = "Unic_OGL_Solo")
```


## Reading the data

```{r raw_read, hide=TRUE}
############ Read in all the .xls from folders and merge them in datasets named after corresponding folder ##############
# this part of script may be re-run if files from wd are updated
# RE-RUN FROM HERE IF FOLDERS AND SORTING WAS ALREADY DONE
wd <- "C:/Users/Mihai/Desktop/EEG_O.4c_1/O.4c - Poster/Date Studiu"
setwd(wd)
folders <- list.files(wd)
folders <- folders[file.info(folders)$isdir]   # luam doar folderele
datasetnames <- NULL

for (i in 1:length(folders)) {
  datasetname <- folders[i]
  datasetnames <- c(datasetnames, datasetname)
  current_dir <- setwd(file.path(wd, folders[i]))
  print(paste0("current_dir: ", current_dir))
  
  paths <- dir(pattern = "\\.xls$")
  names(paths) <- basename(paths)

  assign( paste(datasetname), plyr::ldply(paths, rio::import) )
}

setwd(wd)
# detach("package:plyr", unload=TRUE)                                                   # detach plyr because of conflicts with dplyr
```


## Cleaning the data

```{r clean_data, hide=TRUE}
#################################### Data Cleaning #####################################################################
# Check if ids have > 1 row of data (empty .xls have only 1 row)
# Careful! This function modfies the datasets in the global envinronment
delete_empty_id <- function(df){
  list_empty_id <- 
    df %>%
    dplyr::group_by(.id) %>%
    dplyr::summarise(row_count = n()) %>%
    dplyr::rename("empty_id" = .id) %>%
    mutate(delete_id = if_else(row_count < 3, TRUE, FALSE)) %>%
    filter(delete_id == TRUE)
  
  df_modif <- 
    df %>%
    filter(!.id %in% list_empty_id$empty_id)
  
  if(!identical(df, df_modif)){
    df <- deparse(substitute(df))
    cat("Deleting from ", print(as.name(df))); print(list_empty_id)                    # print out which ids are deleted from which dataset
    assign(df, df_modif, envir = globalenv())                                          # assign modified df to original dataset from Global
  }else cat("No empty datasets. Nothing to delete")
}

# Apply function to all datasets (tricky to do in for loop because of super assignment)
delete_empty_id(Unic_CTRL_Instr)
delete_empty_id(Unic_CTRL_Solo)
delete_empty_id(Unic_OGL_Instr)
delete_empty_id(Unic_OGL_Solo)
```


## Exclude SAM_resp based on RT outliers

```{r nooutlier_data, eval=FALSE}
# !!!!EVAL = FALSE
############################### Exclude Outliers based on RT (by subject and stimulus type) #######################################
## DONT RUN (unless it is needed) ----> eval=FALSE
# Exclude RT outliers (=- 2SD) - instead of simple filter, makeing them NA  is better for paired comparison
remove_outliers <- function(df) {
  df_modif <-
    df %>%
    dplyr::group_by(.id, `Stimulus type`) %>%                  # we could have done before:  dplyr::rename("Stim_type" = `Stimulus type`) 
    mutate(SAM_Resp = if_else(abs(SAM_RT - mean(SAM_RT, na.rm=TRUE)) > 2*sd(SAM_RT, na.rm=TRUE), as.numeric(NA), SAM_Resp))
  
  if(!identical(df, df_modif)){
    df <- deparse(substitute(df))
    cat("Deleting outliers from ", print(as.name(df)));                               # print out datasets which have been modified
    assign(df, df_modif, envir = globalenv())                                          # assign modified df to original dataset from Global
  }else cat("No outlier")
}

remove_outliers(Unic_CTRL_Instr)
remove_outliers(Unic_CTRL_Solo)
remove_outliers(Unic_OGL_Instr)
remove_outliers(Unic_OGL_Solo)
```


## Test if datasets have same columns

```{r test_cols}
unic_df_obj <- mget(c("Unic_CTRL_Instr", "Unic_CTRL_Solo", "Unic_OGL_Instr", "Unic_OGL_Solo"))
unic_df_obj <-lapply(unic_df_obj, colnames)
outer(unic_df_obj, unic_df_obj, Vectorize(identical))                           # if all are TRUE, all df have same columns
```

<br>
<br>


# Analysis - UNICE

## Descriptives

```{r desc_unice}
##########################################################################################################################
#################################### Analyses - UNICE ####################################################################
## Descriptives by condition dataset
descriptive_func <- function(df, Stim_type, By_ID = FALSE){
  df_name <- deparse(substitute(df))
  suppressWarnings({                                                                # if all NAs in SAM_Resp, NaNs and Infs will be produced
    df_modif <- 
      df %>%
      dplyr::rename("ID" = .id) %>%
      select_all(~gsub("\\s+|\\.", "_", .)) %>%                                     # replaces blancks with "_" in colnames 
      filter(Stimulus_type == Stim_type)                                            # filter by stimulus type
      
    if(isTRUE(By_ID)){                                                              # if true group by id, if not return descriptives for all ids
      by_id_text <- " by subject"
      df_modif %>%
      dplyr::group_by(ID) %>%
      tidystats::describe_data(SAM_Resp, SAM_RT, na.rm = TRUE) %>%
        knitr::kable(caption = paste(as.name(df_name), " ", Stim_type, by_id_text), format = "pandoc", digits = 2)
    }else{ 
      by_id_text <- " all subjects"
      df_modif %>%
      ungroup() %>%  
      tidystats::describe_data(SAM_Resp, SAM_RT, na.rm = TRUE) %>%
        knitr::kable(caption = paste(as.name(df_name), " ", Stim_type, by_id_text), format = "pandoc", digits = 2)
    }
  })
}  


descriptive_func(df = Unic_CTRL_Instr, Stim_type = "negativ", By_ID = FALSE)           # Negative - General
descriptive_func(df = Unic_CTRL_Solo, Stim_type = "negativ", By_ID = FALSE)
descriptive_func(df = Unic_OGL_Instr, Stim_type = "negativ", By_ID = FALSE)
descriptive_func(df = Unic_OGL_Solo, Stim_type = "negativ", By_ID = FALSE)

descriptive_func(df = Unic_CTRL_Instr, Stim_type = "negativ", By_ID = TRUE)            # Negative - by id
descriptive_func(df = Unic_CTRL_Solo, Stim_type = "negativ", By_ID = TRUE)
descriptive_func(df = Unic_OGL_Instr, Stim_type = "negativ", By_ID = TRUE)
descriptive_func(df = Unic_OGL_Solo, Stim_type = "negativ", By_ID = TRUE)

descriptive_func(df = Unic_CTRL_Instr, Stim_type = "pozitiv", By_ID = FALSE)           # Positive - General
descriptive_func(df = Unic_CTRL_Solo, Stim_type = "pozitiv", By_ID = FALSE)
descriptive_func(df = Unic_OGL_Instr, Stim_type = "pozitiv", By_ID = FALSE)
descriptive_func(df = Unic_OGL_Solo, Stim_type = "pozitiv", By_ID = FALSE)

descriptive_func(df = Unic_CTRL_Instr, Stim_type = "pozitiv", By_ID = TRUE)            # Positive - by id
descriptive_func(df = Unic_CTRL_Solo, Stim_type = "pozitiv", By_ID = TRUE)
descriptive_func(df = Unic_OGL_Instr, Stim_type = "pozitiv", By_ID = TRUE)
descriptive_func(df = Unic_OGL_Solo, Stim_type = "pozitiv", By_ID = TRUE)

descriptive_func(df = Unic_CTRL_Instr, Stim_type = "neutru", By_ID = FALSE)           # Neutral - General
descriptive_func(df = Unic_CTRL_Solo, Stim_type = "neutru", By_ID = FALSE)
descriptive_func(df = Unic_OGL_Instr, Stim_type = "neutru", By_ID = FALSE)
descriptive_func(df = Unic_OGL_Solo, Stim_type = "neutru", By_ID = FALSE)

descriptive_func(df = Unic_CTRL_Instr, Stim_type = "neutru", By_ID = TRUE)            # Neutral - by id
descriptive_func(df = Unic_CTRL_Solo, Stim_type = "neutru", By_ID = TRUE)
descriptive_func(df = Unic_OGL_Instr, Stim_type = "neutru", By_ID = TRUE)
descriptive_func(df = Unic_OGL_Solo, Stim_type = "neutru", By_ID = TRUE)
```


## Merge

```{r merged_unice_data, hide=TRUE}
############################## Merge condition dataset ############################################################
# Must first rename .id to ID in oder to have .id for df names
ID_rename <- function(df){
  if(".id" %in% colnames(df)) {
    df_modif <- 
      df %>%
      dplyr::rename("ID" = .id)
    df <- deparse(substitute(df))
    cat("Changed .id to ID for: ", as.name(df))
    assign(df, df_modif, envir = globalenv())
  }  
}

ID_rename(Unic_CTRL_Instr)
ID_rename(Unic_CTRL_Solo)
ID_rename(Unic_OGL_Instr)
ID_rename(Unic_OGL_Solo)

# Merge into one df
list_df_merge <- list(Unic_CTRL_Instr, Unic_CTRL_Solo, Unic_OGL_Instr, Unic_OGL_Solo)
names(list_df_merge) <- c("Unic_CTRL_Instr", "Unic_CTRL_Solo", "Unic_OGL_Instr", "Unic_OGL_Solo")
Unic_merged <- plyr::ldply(list_df_merge, data.frame)                    # also works for this job bind_rows(list_df_merge, .id = "column_label")
```


## Analyses on merged (Anova & post-hoc)

```{r anova_unice, results='asis'}
############################## Analyses on Merged ################################################################
## Just a Test 
  # Unic_merged_spread_Neg <- 
  #   Unic_merged %>%
  #   filter(!is.na(SAM_Resp)) %>%                                           # some files had only NA on SAM_Resp and SAM_RT
  #   select(.id, ID, Subj_id, 
  #          Stimuli.order, MarkerStimuli, Stimulus.type, 
  #          SAM_Resp, SAM_RT) %>%
  #   filter(Stimulus.type == "negativ") %>%                                 # dont forget to pick stymulus type
  #   spread(.id, SAM_Resp)
  # 
  # t.test(Unic_merged_spread_Neg$Unic_CTRL_Instr, Unic_merged_spread_Neg$Unic_CTRL_Solo, na.rm = TRUE)
  # t.test(Unic_merged_spread_Neg$Unic_OGL_Instr, Unic_merged_spread_Neg$Unic_OGL_Solo, na.rm = TRUE)
  # t.test(Unic_merged_spread_Neg$Unic_OGL_Instr, Unic_merged_spread_Neg$Unic_CTRL_Instr, na.rm = TRUE)
  # t.test(Unic_merged_spread_Neg$Unic_OGL_Solo, Unic_merged_spread_Neg$Unic_CTRL_Solo, na.rm = TRUE)

## Function prepair data for analyses
prepaire_merged_func <- function(Stim_type){
  Unic_merged %>%
    filter(!is.na(SAM_Resp)) %>%                                           # some files had only NA on SAM_Resp and SAM_RT
    select(.id, ID, Subj_id, 
           Stimuli.order, MarkerStimuli, Stimulus.type, 
           SAM_Resp, SAM_RT) %>%
    dplyr::rename(Cond = .id) %>% 
    filter(Stimulus.type == Stim_type) %>%                                 # dont forget to pick stymulus type
    mutate(Cond = as.factor(Cond))                                         # tunr to factor for aov family functions
}

Unic_merged_Neg <- prepaire_merged_func("negativ")
Unic_merged_Neu <- prepaire_merged_func("neutru")
Unic_merged_Poz <- prepaire_merged_func("pozitiv")


## Anova and Post-Hoc  - NEGATIV
# Stimulus type
cat("### Negativ")

# Normality
cat("#### Normality Test")
Unic_merged_Neg %>%
  select(SAM_Resp) %>%                                                     # must select variables outside function 
  tadaatoolbox::tadaa_normtest(method = "shapiro")                         # , print = "markdown"  for Notebook

# Levene Test (p>.05 = homogeneity of variances)
cat("#### Levene Test")
Unic_merged_Neg %>%
  tadaatoolbox::tadaa_levene(data = ., SAM_Resp ~ Cond)                    # , print = "markdown"  for Notebook

# Anova
cat("#### Anova")
Unic_merged_Neg %>%
  #do(broom::glance(aov(.$SAM_Resp ~ .$Cond)))                             # regular anova do(broom::tidy(aov(.$SAM_Resp ~ .$Cond)))
  tadaatoolbox::tadaa_aov(data = ., SAM_Resp ~ Cond, type = 1)             # , print = "markdown"  for Notebook

# Post-Hoc 
cat("#### Post-Hoc Games Howell")
Unic_merged_Neg %>%
  # Tukey for equal variance 
  tadaatoolbox::tadaa_pairwise_tukey(data = ., SAM_Resp, Cond)             # , print = "markdown"  for Notebook
  # Games Howell does not assume equal variances
  #tadaatoolbox::tadaa_pairwise_gh(data = ., SAM_Resp, Cond)                # , print = "markdown"  for Notebook


## Anova and Post-Hoc  - NEUTRU
# Stimulus type
cat("### Neutru")

# Normality
cat("#### Normality Test")
Unic_merged_Neu %>%
  select(SAM_Resp) %>%                                                     # must select variables outside function 
  tadaatoolbox::tadaa_normtest(method = "shapiro")                         # , print = "markdown"  for Notebook

# Levene Test (p>.05 = homogeneity of variances)
cat("#### Levene Test")
Unic_merged_Neu %>%
  tadaatoolbox::tadaa_levene(data = ., SAM_Resp ~ Cond)                    # , print = "markdown"  for Notebook

# Anova
cat("#### Anova")
Unic_merged_Neu %>%
  #do(broom::glance(aov(.$SAM_Resp ~ .$Cond)))                             # regular anova do(broom::tidy(aov(.$SAM_Resp ~ .$Cond)))
  tadaatoolbox::tadaa_aov(data = ., SAM_Resp ~ Cond, type = 1)             # , print = "markdown"  for Notebook

# Post-Hoc 
cat("#### Post-Hoc Games Howell")
Unic_merged_Neu %>%
  # Tukey for equal variance 
  tadaatoolbox::tadaa_pairwise_tukey(data = ., SAM_Resp, Cond)             # , print = "markdown"  for Notebook
  # Games Howell does not assume equal variances
  #tadaatoolbox::tadaa_pairwise_gh(data = ., SAM_Resp, Cond)                # , print = "markdown"  for Notebook


## Anova and Post-Hoc  - POZITIV
# Stimulus type
cat("### Pozitiv")

# Normality
cat("#### Normality Test")
Unic_merged_Poz %>%
  select(SAM_Resp) %>%                                                     # must select variables outside function 
  tadaatoolbox::tadaa_normtest(method = "shapiro")                         # , print = "markdown"  for Notebook

# Levene Test (p>.05 = homogeneity of variances)
cat("#### Levene Test")
Unic_merged_Poz %>%
  tadaatoolbox::tadaa_levene(data = ., SAM_Resp ~ Cond)                    # , print = "markdown"  for Notebook

# Anova
cat("#### Anova")
Unic_merged_Poz %>%
  #do(broom::glance(aov(.$SAM_Resp ~ .$Cond)))                             # regular anova do(broom::tidy(aov(.$SAM_Resp ~ .$Cond)))
  tadaatoolbox::tadaa_aov(data = ., SAM_Resp ~ Cond, type = 1)             # , print = "markdown"  for Notebook

# Post-Hoc 
cat("#### Post-Hoc Games Howell")
Unic_merged_Poz %>%
  # Tukey for equal variance 
  tadaatoolbox::tadaa_pairwise_tukey(data = ., SAM_Resp, Cond)             # , print = "markdown"  for Notebook
  # Games Howell does not assume equal variances
  #tadaatoolbox::tadaa_pairwise_gh(data = ., SAM_Resp, Cond)                # , print = "markdown"  for Notebook
```


## Plots with p values
```{r plot_unice, fig.height=7}
# by dataset
ggplot(Unic_merged, aes(x = Stimulus.type, y = SAM_Resp)) +
  geom_boxplot() +
  stat_summary(fun.data = mean_se,  colour = "darkred") +
  xlab("") +
  facet_wrap(~.id) +
  ggpubr::stat_compare_means(method = "t.test", 
                             label = "p.signif",                                         # to avoid scientific notation of very small p-values
                             #paired = TRUE, 
                             comparisons = list(c("negativ", "neutru"),
                                                c("neutru", "pozitiv"),
                                                c("negativ", "pozitiv")))  

# by Stimulus type
ggplot(Unic_merged, aes(x = .id, y = SAM_Resp)) +
  geom_boxplot() +
  stat_summary(fun.data = mean_se,  colour = "darkred") +
  xlab("") +
  theme(axis.text.x = element_text(angle = 90, hjust = 1)) +
  facet_wrap(~Stimulus.type) +
  ggpubr::stat_compare_means(method = "t.test",
                             label = "p.format",                                         # formated p-values
                             #paired = TRUE, 
                             comparisons = list(c("Unic_CTRL_Instr", "Unic_CTRL_Solo"),
                                                c("Unic_CTRL_Instr", "Unic_OGL_Instr"),
                                                c("Unic_CTRL_Solo", "Unic_OGL_Instr"),
                                                c("Unic_CTRL_Solo", "Unic_OGL_Solo"),
                                                c("Unic_OGL_Instr", "Unic_OGL_Solo"),
                                                c("Unic_CTRL_Instr", "Unic_OGL_Solo"))) 


# drop to CTRL vs OGL - by Stimulus type
Unic_merged %>%
  mutate(.id = case_when(.id %in% c("Unic_CTRL_Instr", "Unic_CTRL_Solo") ~ "Unic_CTRL",
                         .id %in% c("Unic_OGL_Instr", "Unic_OGL_Solo") ~ "Unic_OGL",
                         TRUE ~ as.character(.id))) %>%
    ggplot(aes(x = .id, y = SAM_Resp)) +
    geom_boxplot() +
    stat_summary(fun.data = mean_se,  colour = "darkred") +
    xlab("") +
    theme(axis.text.x = element_text(angle = 90, hjust = 1)) +
    facet_wrap(~Stimulus.type) +
    ggpubr::stat_compare_means(method = "t.test",
                               label = "p.format",                                         # formated p-values
                               #paired = TRUE, 
                               comparisons = list(c("Unic_CTRL", "Unic_OGL")))          

# drop to Instr vs Solo - by Stimulus type
Unic_merged %>%
  mutate(.id = case_when(.id %in% c("Unic_CTRL_Instr", "Unic_OGL_Instr") ~ "Unic_Instr",
                         .id %in% c("Unic_CTRL_Solo", "Unic_OGL_Solo") ~ "Unic_Solo",
                         TRUE ~ as.character(.id))) %>%
    ggplot(aes(x = .id, y = SAM_Resp)) +
    geom_boxplot() +
    stat_summary(fun.data = mean_se,  colour = "darkred") +
    xlab("") +
    theme(axis.text.x = element_text(angle = 90, hjust = 1)) +
    facet_wrap(~Stimulus.type) +
    ggpubr::stat_compare_means(method = "t.test",
                               label = "p.format",                                         # formated p-values
                               #paired = TRUE, 
                               comparisons = list(c("Unic_Instr", "Unic_Solo"))) 
```


# Download Data

```{r download_data}
Unic_merged %>% 
    select(-c(3:10)) %>%
    DT::datatable(                                  # excel downloadable  DT table
      extensions = 'Buttons',
      options = list(pageLength = 20,
                     scrollX='500px', 
                     dom = 'Bfrtip', 
                     buttons = c('excel', "csv")))
```




<!-- Session Info and License -->

<br>

# Session Info
```{r session_info, echo = FALSE, results = 'markup'}
sessionInfo()    
```

<!-- Footer -->
&nbsp;
<hr />
<p style="text-align: center;">A work by <a href="https://github.com/ClaudiuPapasteri/">Claudiu Papasteri</a></p>
<p style="text-align: center;"><span style="color: #808080;"><em>claudiu.papasteri@gmail.com</em></span></p>
&nbsp;
