nicebread
diff --git a/‎.gitignore‎
Lines changed: 6 additions & 1 deletion b/‎.gitignore‎
Lines changed: 6 additions & 1 deletion
diff --git a/‎1-simFramework.R‎
Lines changed: 7 additions & 8 deletions b/‎1-simFramework.R‎
Lines changed: 7 additions & 8 deletions
diff --git a/‎2-analysisFramework.R‎
Lines changed: 3 additions & 10 deletions b/‎2-analysisFramework.R‎
Lines changed: 3 additions & 10 deletions
diff --git a/‎3-resultsFramework.R‎
Lines changed: 8 additions & 11 deletions b/‎3-resultsFramework.R‎
Lines changed: 8 additions & 11 deletions
diff --git a/‎4-EstimationPlot.R‎
Lines changed: 1 addition & 1 deletion b/‎4-EstimationPlot.R‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎5-hypTestPlot.R‎
Lines changed: 2 additions & 2 deletions b/‎5-hypTestPlot.R‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎6-coveragePlot.R‎
Lines changed: 1 addition & 1 deletion b/‎6-coveragePlot.R‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎7-methodDominance.R‎
Lines changed: 139 additions & 0 deletions b/‎7-methodDominance.R‎
Lines changed: 139 additions & 0 deletions
diff --git a/‎Empirical n and ES distributions/fit_Fraley_2014.R‎
Lines changed: 0 additions & 3 deletions b/‎Empirical n and ES distributions/fit_Fraley_2014.R‎
Lines changed: 0 additions & 3 deletions
diff --git a/‎Empirical n and ES distributions/tau.R‎
Lines changed: 6 additions & 2 deletions b/‎Empirical n and ES distributions/tau.R‎
Lines changed: 6 additions & 2 deletions
@@ -14,7 +14,7 @@ vignettes/*.pdf
 
 analysisParts/*.RData
 
-# for the moment: do not upload simParts (1.2GB)
+# for the moment: do not upload simParts (1.2GB overall)
 simParts
 
 # shell script for automatically adding files > 50 MB:
@@ -23,3 +23,8 @@ simParts
 res.final.RData
 res.wide.RData
 res.wide.red.RData
+.git/objects/pack/pack-04e34f809f18eeb4d75e1cc330cb24b24fd26ce0.pack
+dataFiles/res.final.RData
+dataFiles/res.wide.RData
+dataFiles/res.wide.red.RData
+
@@ -1,3 +1,8 @@
+## ======================================================================
+## This file generates the simulated data sets, which are stored in separate
+## files in folder /simParts
+## ======================================================================
+
 # run this file:
 # source("1-simFramework.R", echo=TRUE)
 
@@ -19,7 +24,7 @@ k_set <- c(10, 30, 60, 100)							# number of studies in each MA
 delta_set <- c(0, .2, .5, .8)						# true mean of effect sizes
 qrpEnv_Set <- c("none", "med", "high")	# QRP environment
 selProp_set <- c(0, .6, .9)							# publication bias
-tau_set <- c(0, .2, .4)									# heterogeneity
+tau_set <- c(0, .2, .4)									# heterogeneity; assumed to follow a normal distribution
 
 # params stores all possible combinations of experimental factors
 params <- expand.grid(k=k_set, delta=delta_set, qrpEnv=qrpEnv_Set, selProp=selProp_set, tau=tau_set)
@@ -81,17 +86,14 @@ for (j in 1:nrow(param)) {
 			res0 <- cbind(
 	  			  batch		= batch, 
 	  			  replication	= i, 
-				  condition	= j,
+				  	condition	= j,
 
 	  			  # settings of the condition
 	  			  p,
 
 	  			  # results of the computation
 	  			  as.matrix(MA1))
 
-			  # collect results in the matrix
-			  #res[counter:(counter+nrow(MA1)-1), ] <- res0
-			  #counter <- counter+nrow(MA1)
 			  res <- rbind(res, res0)
 		} # of b-loop
 
@@ -102,9 +104,6 @@ for (j in 1:nrow(param)) {
 	sim <- sim %>% mutate(id=1000*(batch*10^(floor(log10(max(replication))+1)) + replication) + condition)	
 	save(sim, file=paste0("simPartsDemo/simData_condition_", j, ".RData"), compression="gzip")
 
-	# send a push notification after each finished condition:
-	# userkey <- "uY7zyarxM2HoNaTLeX8HXjWvpFA4Cp" #Define user key
-	# send_push(userkey, paste0("Condition ", j, "/", nrow(params), " finished"))
 } # of j (loop through parameter combinations)
 
 
 
@@ -21,7 +21,6 @@ simDatFiles <- list.files("simParts", pattern=".*\\.RData", full.names=TRUE)
 
 library(gtools)
 simDatFiles <- mixedsort(simDatFiles)
-# f <- simDatFiles[[33]]
 
 
 # loop through all simParts files
@@ -66,11 +65,11 @@ for (f in simDatFiles) {
 				pc_skew(t=MAdat$t, df=MAdat$N-2, long=TRUE),
 				pcurveEst(t=MAdat$t, df=MAdat$N-2, progress=FALSE, long=TRUE, CI=FALSE),
 				puniformEst(t.value=MAdat$t, n1=MAdat$n1, n2=MAdat$n2),
+				TPSM.est(t=MAdat$t, n1=MAdat$n1, n2=MAdat$n2, long=TRUE)#,
 				#topN(MAdat$d, MAdat$v, MAdat$n1, MAdat$n2, est="fixed", fixed.effect=0.3),
 				#topN(MAdat$d, MAdat$v, MAdat$n1, MAdat$n2, est="rma"),
-				#topN(MAdat$d, MAdat$v, MAdat$n1, MAdat$n2, est="PEESE"),
-				TPSM.est(t=MAdat$t, n1=MAdat$n1, n2=MAdat$n2, long=TRUE),
-				betaSM.est(d=MAdat$d, v=MAdat$v, long=TRUE)
+				#topN(MAdat$d, MAdat$v, MAdat$n1, MAdat$n2, est="PEESE"),				
+				#betaSM.est(d=MAdat$d, v=MAdat$v, long=TRUE)
 			)
 
 
@@ -92,10 +91,4 @@ for (f in simDatFiles) {
 	} # of dopar
 
 	save(res, file=paste0("analysisParts/analysis_", basename(f)), compress="gzip")
-	
-	# send a push notification after each 50 finished conditions:
-	if (which(simDatFiles == f) %% 50 == 0) {
-	  userkey <- "uY7zyarxM2HoNaTLeX8HXjWvpFA4Cp" #Define user key
-	  send_push(userkey, paste0("Condition ", which(simDatFiles == f), " finished"))
-	}
 } # of "f in simDatFiles"
@@ -26,8 +26,8 @@ res.final <- bind_rows(res_list)
 str(res.final)
 
 # final data set in long format:
-save(res.final, file="res.final.RData")
-#load(file="res.final.RData")
+save(res.final, file="dataFiles/res.final.RData")
+#load(file="dataFiles/res.final.RData")
 
 
 # Show conditions
@@ -58,8 +58,8 @@ print(tab2, n=54)
 
 res.wide <- inner_join(res.wide, tab2)
 
-save(res.wide, file="res.wide.RData", compress="gzip")
-#load(file="res.wide.RData")
+save(res.wide, file="dataFiles/res.wide.RData", compress="gzip")
+#load(file="dataFiles/res.wide.RData")
 
 # ---------------------------------------------------------------------
 #  save a reduced version that applies some selections
@@ -75,9 +75,6 @@ res.wide.red[res.wide.red$method == "3PSM" & is.na(res.wide.red$b0_p.value), c("
 ## RULE 3: Ignore p-uniform when it doesn't provide a lower CI (very rare cases)
 res.wide.red[res.wide.red$method == "puniform" & is.na(res.wide.red$b0_conf.low), c("b0_estimate", "b0_conf.low", "b0_conf.high", "b0_p.value")] <- NA
 
-# TODO: Skip this??
-# RULE X: set pcurve and puniform estimates to NA for all conditions which have less than 500/1000 successful meta-analyses
-#res.wide.red[res.wide.red$method %in% c("pcurve.evidence", "pcurve.hack", "pcurve.lack", "pcurve", "puniform") & res.wide.red$nMA.with.kSig.larger.3 < 500, c("b0_estimate", "b0_conf.low", "b0_conf.high", "b0_p.value", "skewtest_p.value")] <- NA
 
 # ---------------------------------------------------------------------
 # For hypothesis test: Add H0.rejection rule
@@ -97,8 +94,8 @@ res.wide.red$H0.reject[is.na(res.wide.red$p.value)] <- NA
 res.wide.red$H0.reject.wrongSign <- (res.wide.red$p.value < .05) & (is.na(res.wide.red$b0_estimate) | res.wide.red$b0_estimate < 0)
 res.wide.red$H0.reject.wrongSign[is.na(res.wide.red$p.value)] <- NA
 
-save(res.wide.red, file="res.wide.red.RData", compress="gzip")
-#load(file="res.wide.red.RData")
+save(res.wide.red, file="dataFiles/res.wide.red.RData", compress="gzip")
+#load(file="dataFiles/res.wide.red.RData")
 
 
 # ---------------------------------------------------------------------
@@ -135,8 +132,8 @@ print(summ, n=50)
 
 # summ contains the full summary of the simulations. This object can then be used to build tables, plots, etc.
 library(rio)
-export(summ, file="summ.csv")
-save(summ, file="summ.RData")
+export(summ, file="dataFiles/summ.csv")
+save(summ, file="dataFiles/summ.RData")
 
 # also export into Shiny app
 save(summ, file="Shiny/MAexplorer/summ.RData")
 
@@ -8,7 +8,7 @@ library(dplyr)
 library(grid)
 library(gridExtra)
 
-load("summ.RData")
+load("dataFiles/summ.RData")
 
 # ---------------------------------------------------------------------
 # Plot settings
 
@@ -8,7 +8,7 @@ library(grid)
 library(gridExtra)
 
 #setwd("C:/Users/evan.c.carter/Documents/Meta-analysis showdown")
-load(file="summ.RData")
+load(file="dataFiles/summ.RData")
 
 # ---------------------------------------------------------------------
 # SETTINGS
@@ -34,7 +34,7 @@ hyp.wide <- inner_join(hyp.H0, hyp.H1)
 hyp.wide$rejectionRatio <- hyp.wide$Power/hyp.wide$TypeI
 hyp.wide$errorSum <- (1-hyp.wide$Power) + hyp.wide$TypeI
 
-save(hyp.wide, file="hyp.wide.RData")
+save(hyp.wide, file="dataFiles/hyp.wide.RData")
 save(hyp.wide, file="Shiny/MAexplorer/hyp.wide.RData")
 
 
 
@@ -7,7 +7,7 @@ library(dplyr)
 library(grid)
 library(gridExtra)
 
-load(file="summ.RData")
+load(file="dataFiles/summ.RData")
 
 # ---------------------------------------------------------------------
 # SETTINGS
 
@@ -0,0 +1,139 @@
+library(ggplot2)
+library(dplyr)
+library(grid)
+library(gridExtra)
+
+load(file="dataFiles/summ.RData")
+head(summ)
+
+# Per-condition ME.pos and RMSE.pos of each method; the methods listed in the
+# filter below are excluded from the dominance comparison.
+s2  <- summ %>% 
+	ungroup() %>% 
+	select(condition, method, ME.pos, RMSE.pos) %>% 
+	filter(!method %in% c("pcurve.evidence", "pcurve.hack", "pcurve.lack", "PET.rma", "PEESE.rma", "PETPEESE.rma"))
+
+# get experimental factors
+# The factor columns are taken from summ by name: s2 only holds four columns
+# at this point, so a positional select(1:6) on s2 cannot return them.
+# Rows of a single method are used so that each condition shows up once
+# (presumably reMA has a row in every condition -- TODO confirm).
+conditions <- summ %>% 
+	ungroup() %>% 
+	filter(method=="reMA") %>% 
+	select(condition, k, delta, qrpEnv, selProp, tau)
+
+
+# ---------------------------------------------------------------------
+# pairwise dominance
+	
+# reshape results into a data set with binary comparisons:
+# one row per condition and per unordered pair of methods
+
+methods <- unique(s2$method)
+n.methods <- length(methods)
+
+# index pairs (i, j) with i > j; j varies fastest, i.e. the same order as a
+# nested loop with i outside and j inside
+pairs <- expand.grid(j = seq_len(n.methods), i = seq_len(n.methods))
+pairs <- pairs[pairs$i > pairs$j, ]
+
+# Build all comparisons of one condition C in a single step.
+# match() looks up the row of each method within the condition; a method
+# without a row yields NA values (such comparisons can be dropped later),
+# and if a method occurs more than once its first row is used.
+compare.condition <- function(C) {
+	sC <- s2[s2$condition == C, ]
+	pos <- match(methods, sC$method)
+	data.frame(
+		condition = rep(C, nrow(pairs)),
+		method1 = methods[pairs$i],
+		method2 = methods[pairs$j],
+		ME.pos1 = as.numeric(sC$ME.pos[pos[pairs$i]]),
+		ME.pos2 = as.numeric(sC$ME.pos[pos[pairs$j]]),
+		RMSE.pos1 = as.numeric(sC$RMSE.pos[pos[pairs$i]]),
+		RMSE.pos2 = as.numeric(sC$RMSE.pos[pos[pairs$j]])
+	)
+}
+
+# one data frame per condition, bound together once
+# (avoids growing res with rbind() inside nested loops)
+res <- do.call(rbind, lapply(unique(s2$condition), compare.condition))
+
+# do.call(rbind, list()) returns NULL when s2 has no conditions
+if (is.null(res)) {
+	res <- data.frame()
+}
+
+save(res, file="dataFiles/dominanceScore.RData")
+#load(file="dataFiles/dominanceScore.RData")
+
+# drop comparisons that contain any missing value
+res2 <- na.omit(res)
+
+# define points, winners and draws
+
+name1 <- as.character(res2$method1)
+name2 <- as.character(res2$method2)
+
+# strict comparisons on absolute ME and on RMSE
+lowerME1 <- abs(res2$ME.pos1) < abs(res2$ME.pos2)
+lowerME2 <- abs(res2$ME.pos1) > abs(res2$ME.pos2)
+lowerRMSE1 <- res2$RMSE.pos1 < res2$RMSE.pos2
+lowerRMSE2 <- res2$RMSE.pos1 > res2$RMSE.pos2
+
+# a method wins a comparison only if it is strictly better on both criteria
+firstWins <- lowerME1 & lowerRMSE1
+secondWins <- lowerME2 & lowerRMSE2
+
+# draw: each method is strictly better on exactly one of the two criteria
+tied <- (lowerME2 & lowerRMSE1) | (lowerME1 & lowerRMSE2)
+
+# "" marks "no winner" / "no draw" for a comparison
+res2$winner <- ""
+res2$draw1 <- ""
+res2$draw2 <- ""
+
+res2$winner[firstWins] <- name1[firstWins]
+res2$winner[secondWins] <- name2[secondWins]
+
+res2$draw1[tied] <- name1[tied]
+res2$draw2[tied] <- name2[tied]
+
+
+## give 1 point for "draw"
+# scores <- res2 %>% group_by(condition) %>% summarise(
+# 	RE = sum(winner=="reMA")*2 + sum(draw1=="reMA") + sum(draw2=="reMA"),
+# 	TF = sum(winner=="TF")*2 + sum(draw1=="TF") + sum(draw2=="TF"),
+# 	PET = sum(winner=="PET.lm")*2 + sum(draw1=="PET.lm") + sum(draw2=="PET.lm"),
+# 	PEESE = sum(winner=="PEESE.lm")*2 + sum(draw1=="PEESE.lm") + sum(draw2=="PEESE.lm"),
+# 	PETPEESE = sum(winner=="PETPEESE.lm")*2 + sum(draw1=="PETPEESE.lm") + sum(draw2=="PETPEESE.lm"),
+# 	pcurve = sum(winner=="pcurve")*2 + sum(draw1=="pcurve") + sum(draw2=="pcurve"),
+# 	puniform = sum(winner=="puniform")*2 + sum(draw1=="puniform") + sum(draw2=="puniform"),
+# 	TPSM = sum(winner=="3PSM")*2 + sum(draw1=="3PSM") + sum(draw2=="3PSM")
+# )
+
+# 2 points per won comparison, no points for draws; one row per condition
+scores <- res2 %>% group_by(condition) %>% summarise(
+	RE = sum(winner=="reMA")*2 ,
+	TF = sum(winner=="TF")*2 ,
+	PET = sum(winner=="PET.lm")*2,
+	PEESE = sum(winner=="PEESE.lm")*2,
+	PETPEESE = sum(winner=="PETPEESE.lm")*2,
+	pcurve = sum(winner=="pcurve")*2 ,
+	puniform = sum(winner=="puniform")*2 ,
+	TPSM = sum(winner=="3PSM")*2
+)
+
+# columns that hold the points of a method (everything except the key);
+# selected by name so that adding or removing a method needs no index change
+score.cols <- setdiff(colnames(scores), "condition")
+
+# long format with columns condition / variable / value, built with base R
+# because no package that provides melt() is loaded in this script
+scores.long <- data.frame(
+	condition = rep(scores$condition, times = length(score.cols)),
+	variable = factor(rep(score.cols, each = nrow(scores)), levels = score.cols),
+	value = unlist(lapply(score.cols, function(m) scores[[m]]), use.names = FALSE)
+)
+
+# method(s) with the highest score in each condition; ties are joined by ", "
+scores$winner <- vapply(seq_len(nrow(scores)), function(i) {
+	pts <- unlist(scores[i, score.cols], use.names = FALSE)
+	paste0(score.cols[pts == max(pts)], collapse = ", ")
+}, character(1))
+
+# attach the experimental factors to both the wide and the long score table
+scores <- merge(x=scores, y=conditions, by="condition")
+scores.long <- merge(x=scores.long, y=conditions, by="condition")
+
+# order the winner levels from most to least frequent
+winner.levels <- names(sort(table(scores$winner), decreasing=TRUE))
+scores$winner <- factor(scores$winner, levels=winner.levels)
+
+# how often does each method (or tie of methods) win?
+sort(table(scores$winner), decreasing=TRUE)
+
+# winner per condition
+ggplot(scores, aes(x=factor(delta), y=qrpEnv, shape=factor(winner))) +
+	geom_point(size=6) +
+	facet_grid(selProp~k+tau)
+
+# That looks ugly ...
+# alternative: score of every method along the delta:qrpEnv:tau combinations
+scores.long$loop <- paste(scores.long$delta, scores.long$qrpEnv, scores.long$tau, sep=":")
+ggplot(scores.long, aes(x=loop, y=value, color=factor(variable), group=factor(variable))) +
+	geom_line() +
+	facet_grid(k~selProp)
+
+# ---------------------------------------------------------------------
+# strong (absolute) dominance
+# A method dominates a condition if it is the best method in both ME and RMSE.
+
+s2  <- summ %>% 
+	ungroup() %>% 
+	select(condition, k, delta, qrpEnv, selProp, tau, method, ME.pos, RMSE.pos) %>% 
+	filter(!method %in% c("pcurve.evidence", "pcurve.hack", "pcurve.lack", "PET.rma", "PEESE.rma", "PETPEESE.rma"))
+
+# Name of the method with the smallest score.
+#   method: vector of method names
+#   score:  numeric vector of the same length; NA entries are ignored
+# Returns NA if no score is available (which.min() then returns integer(0)).
+best.method <- function(method, score) {
+	best <- which.min(score)
+	if (length(best) == 0) {
+		return(NA_character_)
+	}
+	as.character(method[best])
+}
+
+# which method is best in ME, and which is best in RMSE?
+# ME is compared by absolute value (as in the pairwise comparison), so that a
+# strongly negative ME does not count as "best". Working per condition on the
+# long data needs no dcast() and keeps the condition id out of the minimum.
+fullDominance <- s2 %>% 
+	group_by(condition) %>% 
+	summarise(
+		ME.winner = best.method(method, abs(ME.pos)),
+		RMSE.winner = best.method(method, RMSE.pos)
+	) %>% 
+	as.data.frame()
+
+# a condition has a dominant method only if both criteria agree;
+# "" marks conditions without one (including those with a missing winner)
+agree <- !is.na(fullDominance$ME.winner) & !is.na(fullDominance$RMSE.winner) &
+	fullDominance$ME.winner == fullDominance$RMSE.winner
+fullDominance$winner <- ""
+fullDominance$winner[agree] <- fullDominance$ME.winner[agree]
+
+sort(table(fullDominance$winner[fullDominance$winner != ""]), decreasing = TRUE)
+
+s3 <- merge(fullDominance, conditions, by="condition")
+
+
+ggplot(s3 %>% filter(winner != ""), aes(y=qrpEnv, x=factor(delta), shape=factor(winner))) + geom_point(size=6) + facet_grid(selProp~k+tau)
@@ -7,12 +7,9 @@ r <- rtrunc(1, spec="beta", a=.08, b=.14, 1.34, 5.03 )
 dtrue <- 2*r/sqrt(1-r^2) # this will select effect sizes that hit the social psych "sweet spot." it runs from 20th to 40th percentiles. This is roughly from the mode up a bit.
 
 
-
-
 #### Get sample sizes. ####
 # I pulled the raw data from Fraley & Vazire's n-pact factor paper, then selected the social psych journals (JESP, the first 2 sections of JPSP, and SPPS)
 # these were total N per study. To be generous, I assumed that they were all 2 group designs, then used this function to randomly sample a per-group n from that distribution
 
-
 rtrunc(n=1, spec="nbinom", a=10, b=Inf, size=2.3, mu=48)
 
@@ -16,8 +16,12 @@ prop.table(table(sel$tau < .2))
 prop.table(table(sel$tau < .4))
 
 
-# Investigate I^2 across all meta-analyses
+# ---------------------------------------------------------------------
+#  Investigate I^2 across all meta-analyses
+
+# Compute I^2 from Q
 dat$I2 <- (dat$Q - (dat[, "# of effect sizes"] - 1))/dat$Q
 dat$I2[dat$Q <= (dat[, "# of effect sizes"] - 1)] <- 0
 
-prop.table(table(dat$I2 > .25))
+prop.table(table(dat$I2 > .25))
+prop.table(table(dat$I2 > .75))