-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy path05_calculate_effect_size_group.R
109 lines (91 loc) · 4.35 KB
/
05_calculate_effect_size_group.R
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
# Convert to effect sizes using metafor package
# 6.2.2020 KLS
# load required packages
library(here)
library(tidyverse)
library(metafor)
# load source functions
source(here::here('scr', 'reverse_es.R'))
# set hard-coded variables
file <- 'cleaned.csv'

# load the cleaned data from the project's output folder
dt <- read.csv(here::here('output', file))

# Calculation for two-group papers ####
# make interaction term for study + conditions, so that several conditions
# reported by the same study stay distinguishable
dt$conditionID <- interaction(dt$Study.Identifier, dt$condition)

# Calculate effect sizes for extreme group designs
dm <- dt[which(dt$Design == 'extreme group'), ] # pull out means
ds <- dm[is.na(dm$sd), ]  # rows without a reported sd, kept aside
dm <- dm[!is.na(dm$sd), ] # rows that can be converted to an effect size
# Positional column selection.
# NOTE(review): the indices assume the column layout of cleaned.csv plus the
# conditionID column appended above -- confirm if the input file changes.
dm <- dm[c(1:2, 6, 8:15, 17:18, 21)]

### Temporarily remove Garza 2016 and Liu 2016 because missing age group means
# Logical masks are used instead of dm[-grep(...), ]: when a pattern matches
# nothing, grep() returns integer(0) and a negative empty index would drop
# every row of dm rather than none.
is_garza <- grepl('Garza', dm$Study.Identifier)
is_liu <- grepl('Liu', dm$Study.Identifier)
garza <- dm[is_garza, ]
liu <- dm[is_liu, ]
dm <- dm[!(is_garza | is_liu), ]
rm(is_garza, is_liu)

## Calculate effect sizes
# One row per study/condition, with the Older and Younger values side by side
dm <- pivot_wider(
  dm,
  id_cols = colnames(dm[c(1:6, 14)]),
  names_from = 'Intervention',
  values_from = c('mean', 'sd', 'n', 'age_mean', 'age_range', 'age_sd')
)
# Standardized mean difference with Older as group 1 and Younger as group 2
dm <- escalc(
  measure = 'SMD',
  m1i = mean_Older, sd1i = sd_Older, n1i = n_Older,
  m2i = mean_Younger, sd2i = sd_Younger, n2i = n_Younger,
  data = dm,
  var.names = c('cohens_d', 'var_cohens_d')
)
# Calculate for multi-group papers ####
age_group_comparisons <- function(data, oldergrp, youngergrp, name) {
  # Effect size for one older-vs-younger contrast within a single study.
  #
  # data       = data frame with just data from this study
  # oldergrp   = row of `data` containing data from the older group
  # youngergrp = row of `data` containing data from the younger group
  # name       = label written to the conditionID column of the result
  #
  # Returns the widened two-group data with the columns cohens_d and
  # var_cohens_d added by escalc().

  # Keep only the two rows being contrasted and relabel them so the wide
  # column names match the two-group studies (*_Older / *_Younger)
  contrast <- data[c(oldergrp, youngergrp), ]
  contrast$Intervention <- c('Older', 'Younger')

  contrast_wide <- pivot_wider(
    contrast,
    id_cols = colnames(contrast[c(1:6, 14)]),
    names_from = 'Intervention',
    values_from = c('mean', 'sd', 'n', 'age_mean', 'age_range', 'age_sd')
  )

  effect <- escalc(
    measure = 'SMD',
    m1i = mean_Older, sd1i = sd_Older, n1i = n_Older,
    m2i = mean_Younger, sd2i = sd_Younger, n2i = n_Younger,
    data = contrast_wide,
    var.names = c('cohens_d', 'var_cohens_d')
  )

  effect$conditionID <- name
  effect
}
## Liu 2016 ####
# take the mean from paper and get rid of others.
liu <- liu[which(liu$conditionID == 'Liu 2016.Ln(k) mean'), ]
# Contrast adjacent age groups; per the labels, row 1 = OA, row 3 = MA,
# row 2 = YA
liu <- rbind(
  age_group_comparisons(liu, 1, 3, 'OAvMA'),
  age_group_comparisons(liu, 3, 2, 'MAvYA')
)
dm <- rbind(dm, liu)
rm(liu)

## Garza 2016 ####
# Contrast adjacent age groups; per the labels, row 4 = OA, row 3 = MA2,
# row 2 = MA1, row 1 = YA. The last contrast compares rows 2 and 1, so it is
# labelled MA1vYA (it was previously mislabelled MA2vYA).
garza <- rbind(
  age_group_comparisons(garza, 4, 3, 'OAvMA2'),
  age_group_comparisons(garza, 3, 2, 'MA2vMA1'),
  age_group_comparisons(garza, 2, 1, 'MA1vYA')
)
dm <- rbind(dm, garza)
rm(garza)
## average effect size across multiple values within the same study ####
average_within_study <- function(df, studyid) {
  # Collapse multiple estimates from one study into a single averaged row.
  #
  # df      = data frame with a Study.Identifier column and at least 20 columns
  # studyid = value of Study.Identifier whose rows should be averaged
  #
  # Returns df with the rows of `studyid` removed and one row appended at the
  # bottom: columns 1:18 are copied from the study's first row and columns
  # 19:20 hold the column means across the study's rows. If `studyid` does
  # not occur in df, df is returned unchanged and a warning is raised.
  #
  # NOTE(review): the positions 1:18 / 19:20 are hard-coded; presumably 19:20
  # are the effect size and its variance -- confirm against the column layout
  # produced upstream.
  study_rows <- which(df$Study.Identifier == studyid)

  if (length(study_rows) == 0) {
    # df[-integer(0), ] selects zero rows, so without this guard a missing
    # study would silently discard every other study in df
    warning("No rows found for study '", studyid, "'; data returned unchanged",
            call. = FALSE)
    return(df)
  }

  estimates <- df[study_rows, ] # pull out study of interest
  # average across estimates within same study
  averaged <- cbind(estimates[1, 1:18], t(colMeans(estimates[19:20])))
  remaining <- df[-study_rows, ] # remove multiple estimates from df
  rbind(remaining, averaged) # add new mean estimate to df
}
# Collapse every study that contributed several estimates into one row,
# applying average_within_study() to dm once per study, in this order
dm <- Reduce(
  average_within_study,
  c('Li 2013', 'Eppinger 2018', 'Whelan 2009', 'Liu 2016', 'Garza 2016'),
  dm
)

# convert cohen's d to fisher z ####
# a is the sample-size correction term used to turn d into r; r is then
# passed through the Fisher z-transformation
dm <- mutate(
  dm,
  a = ((n_Older + n_Younger)^2) / (n_Older * n_Younger),
  r = cohens_d / (sqrt(cohens_d^2 + a)),
  var_r = (a^2 * var_cohens_d) / (cohens_d^2 + a)^3,
  fishers_z = 0.5 * log((1 + r) / (1 - r)),
  var_fishers_z = 1 / ((n_Older + n_Younger) - 3)
)

# remove unnecessary columns (raw group statistics and intermediate values)
dm$mean_Older <- NULL
dm$mean_Younger <- NULL
dm$sd_Older <- NULL
dm$sd_Younger <- NULL
dm$conditionID <- NULL
dm$cohens_d <- NULL
dm$var_cohens_d <- NULL
dm$a <- NULL
dm$r <- NULL
dm$var_r <- NULL

## effect per decade ####
#dm$adj_effect_size <- dm$effect_size * 10 # calculate effect per year and then multiply by 10 for decade

# Reversals ####
# Apply reverse_es() to dm once per listed study, in this order
dm <- Reduce(
  reverse_es,
  c('Garza 2016', 'Li 2013', 'Sparrow 2019', 'Sparrow 2018 Study 1',
    'Sparrow 2018 Study 2'),
  dm
)

# Save the table and clear this script's objects from the workspace
write.csv(dm, here::here('output', 'extreme_group_table.csv'), row.names = FALSE)
rm(dm, ds, dt, file, average_within_study, reverse_es, age_group_comparisons)