plot_simulation_results_model_sets_AICc.R



#read in all the sim data files- this was done in pieces to keep it computationally doable


#get a list of file names:
setwd("simresults/Best_model_AICc")
file_list<-list.files()

#loop through the files, merge 'em together
simulation.results <- do.call("rbind",lapply(file_list,
                                             FUN=function(files){read.csv(files, header=TRUE)}))

setwd("../..")

#Encoding results
#All scripted breaks found =1
#all breaks plus extra breaks found = 2
#missing breaks (when more than one break in sim data) =3
#right number of breaks but not all match =4
# total failure to find correct breaks =0 

#because our function was throwing an error about results as factors, we encoded 
#them numerically as above. But before we do any operations on it we should 
#at least convert the outcome integers to factors so we don't accidentally 
#do any numeric operations on them. 

#note the other columns of the data frame are also basically ordinal/catagorical, but
#we want to retain their order for plotting purposes, so we'll just proceed
#with caution there


simulation.results$victory<-as.factor(simulation.results$victory)
simulation.results$inSet<-as.factor(simulation.results$inSet)

#let's cull out the 15 year scenarios with 3 breaks- this usually violates the constraints of the 
#model and thus isn't an honest test- let's also get rid of it for 20, and 2 break scenarios for 20, as these often fail
simulation.results<-simulation.results[-which(simulation.results$Nyears=="15" & 
                                                simulation.results$nbreaksin=="3"),]
simulation.results<-simulation.results[-which(simulation.results$Nyears=="15" & 
                                                simulation.results$nbreaksin=="2"),]
#also, the nevative starting values for r don't work well...Ricker model works best for a population
#that is K limited, so this results in nonsensical output for this particular implimentation
simulation.results<-simulation.results[-which(simulation.results$startR=="-0.5"),]

#now we need to take th data produced and summarize it for plotting
library(plyr)


#count number of times a unique observation was recorded
summarize.results<-count(simulation.results,
                         c("Nyears", "startPop", "noise", "nbreaksin",
                           "startK", "startR", "changeK", "changeR", "victory"))

#count number of times a the model was in the equivalent model set
summarize.results.set<-count(simulation.results,
                         c("Nyears", "startPop", "noise", "nbreaksin",
                           "startK", "startR", "changeK", "changeR", "inSet"))

#for this we only care about the proportion of times we were right
summarize.results.right<-summarize.results[which(summarize.results$victory==1),]
summarize.results.set.right<-summarize.results.set[which(summarize.results.set$inSet==1),]
#get rid of columns with only one value
summarize.results.right$victory<-NULL
summarize.results.set.right$inSet<-NULL
#rename the freq column so we don't have naming issues with a merge
colnames(summarize.results.right)[colnames(summarize.results.right) == 'freq']<-'victory'
colnames(summarize.results.set.right)[colnames(summarize.results.set.right) == 'freq']<-'inSet'
summarize.results<-merge(summarize.results.right, summarize.results.set.right)

#count the number of times a unique scenario was attemped (should be pretty uniform but 
# there are someetimes cases where the fit failed) (for a denominator!)

tot.tests<-count(simulation.results,
                 c("Nyears", "startPop", "noise", "nbreaksin",
                   "startK", "startR", "changeK", "changeR"))
#rename the freq column so we don't have naming issues with a merge
colnames(tot.tests)[colnames(tot.tests) == 'freq']<-'total.tests'

summarize.results<-merge(summarize.results, tot.tests)

summarize.results$prop.top<-summarize.results$victory/summarize.results$total.tests
summarize.results$prop.set<-summarize.results$inSet/summarize.results$total.tests

#all right, let's get plotting!
library(ggplot2)


#choose a color palette
pal<-c("#ffffb2", "#fecc5c", "#fd8d3c", "#e31a1c")
pal.nozero<-c("#fecc5c", "#fd8d3c", "#e31a1c") #for cases where no zero break scenarios are plotted
pal.noone<-c("#fd8d3c", "#e31a1c")
pal.notwo<-c("#e31a1c")

#we need to subset the data by factor we're varying.

###############
# Noise experiment

#start with successes

noise.experiment.correct<-summarize.results[which(summarize.results$changeK==75 & 
                                                    summarize.results$changeR==25 & 
                                                    summarize.results$startR==2 &
                                                    summarize.results$Nyears==20),]
noiseplot.correct<-ggplot(noise.experiment.correct, aes(noise, prop.top, fill=as.factor(nbreaksin)))+
  scale_fill_manual(values=pal)+
  #geom_smooth(method="gam", se=F, color="grey", formula=y ~ poly(x, 3), span=0.1)+
  #geom_point(colour="black", pch=21, size=3)+
  geom_smooth(aes(noise, prop.set), method="gam", se=F, color="grey", formula=y ~ poly(x, 3), span=0.1, show.legend=F)+
  geom_point(aes(noise, prop.set), colour="black", pch=21, size=3)+
  theme_bw(base_size = 12)+
  guides(fill=guide_legend(title="Number\nof breaks"))+
  theme(legend.key=element_blank())+
  xlab("% noise")+
  ylab("proportion of outcomes")+
  xlim(0,15)+ylim(0.4,1.0)

noiseplot.correct


###############
# startR experiment

#start with successes

startr.experiment.correct<-summarize.results[which(summarize.results$changeK==75 & 
                                                    summarize.results$changeR==25 & 
                                                    summarize.results$noise==2 &
                                                    summarize.results$Nyears==20),]
startr.correct<-ggplot(startr.experiment.correct, aes(startR, prop.top, fill=as.factor(nbreaksin)))+
  scale_fill_manual(values=pal)+
  #geom_smooth(method="gam", se=F, color="grey", formula=y ~ poly(x, 3), span=0.1)+
  #geom_point(colour="black", pch=21, size=3)+
  geom_smooth(aes(startR, prop.set), method="gam", se=F, color="grey", formula=y ~ poly(x, 3), span=0.1, show.legend=F)+
  geom_point(aes(startR, prop.set), colour="black", pch=21, size=3)+
  theme_bw(base_size = 12)+
  guides(fill=guide_legend(title="Number\nof breaks"))+
  theme(legend.key=element_blank())+
  xlab("r starting value")+
  ylab("proportion of outcomes")+
  xlim(0.5, 2)+ylim(0.4,1.0)

startr.correct


###############
# K experiment

#start with successes

changeK.experiment.correct<-summarize.results[which(summarize.results$noise==5 & 
                                                      summarize.results$changeR==25 &
                                                      summarize.results$startR==2 &
                                                      summarize.results$Nyears==20),]
changeKplot.correct<-ggplot(changeK.experiment.correct, aes(changeK, prop.top, fill=as.factor(nbreaksin)))+
  scale_fill_manual(values=pal)+
  #geom_smooth(method="gam", se=F, color="grey", formula=y ~ poly(x, 3), span=0.1)+
  #geom_point(colour="black", pch=21, size=3)+
  geom_smooth(aes(changeK, prop.set), method="gam", se=F, color="grey", formula=y ~ poly(x, 3), span=0.1, show.legend=F)+
  geom_point(aes(changeK, prop.set), colour="black", pch=21, size=3)+
  theme_bw(base_size = 12)+
  guides(fill=guide_legend(title="Number\nof breaks"))+
  theme(legend.key=element_blank())+
  xlab("% change in K")+
  ylab("proportion of outcomes")+
  xlim(0,75)+ylim(0.4,1.0)

changeKplot.correct


###############
# r experiment

#start with successes

changeR.experiment.correct<-summarize.results[which(summarize.results$noise==5 & 
                                                      summarize.results$changeK==75 &
                                                      summarize.results$startR==2 &
                                                      summarize.results$Nyears==20),]
changeRplot.correct<-ggplot(changeR.experiment.correct, aes(changeR, prop.top, fill=as.factor(nbreaksin)))+
  scale_fill_manual(values=pal)+
  #geom_smooth(method="gam", se=F, color="grey", formula=y ~ poly(x, 3), span=0.1)+
  #geom_point(colour="black", pch=21, size=3)+
  geom_smooth(aes(changeR, prop.set), method="gam", se=F, color="grey", formula=y ~ poly(x, 3), span=0.1, show.legend=F)+
  geom_point(aes(changeR, prop.set), colour="black", pch=21, size=3)+
  theme_bw(base_size = 12)+
  guides(fill=guide_legend(title="Number\nof breaks"))+
  theme(legend.key=element_blank())+
  xlab("% change in r")+
  ylab("proportion of outcomes")+
  xlim(0,75)+ylim(0.4,1.0)

changeRplot.correct


###############
# Time series length experiment

#start with successes

Nyears.experiment.correct<-summarize.results[which(summarize.results$noise==2 & 
                                                     summarize.results$changeK==75 &
                                                     summarize.results$startR==2 &
                                                     summarize.results$changeR==25),]
Nyearsplot.correct<-ggplot(Nyears.experiment.correct, aes(Nyears, prop.top, fill=as.factor(nbreaksin)))+
  scale_fill_manual(values=pal)+
  #geom_smooth(method="lm", se=F, color="grey")+
  geom_smooth(aes(Nyears, prop.set), method="loess", se=F, color="grey", span=1.5, show.legend=F)+
  #geom_point(colour="black", pch=21, size=3)+
  geom_point(aes(Nyears, prop.set), colour="black", pch=21, size=3)+
  theme_bw(base_size = 12)+
  guides(fill=guide_legend(title="Number\nof breaks"))+
  theme(legend.key=element_blank())+
  xlab("Series length")+
  ylab("proportion of outcomes")+
  xlim(14,31)+ylim(0.4,1.0)

Nyearsplot.correct

# need to stack together noiseplot.correct, changeKplot.correct, changeRplot.correct, Nyearsplot.correct

#stack plots together
library(gridExtra)
library(grid)

noiseplot.correct.1<-noiseplot.correct+
  guides(fill=FALSE)+
  ylab(NULL)+
  #xlab(NULL)+
  coord_fixed(ratio=30)+
  ggtitle(label="A")+
  theme(plot.title = element_text(size = 12, margin = margin(t = 10, b = -1)))

startr.correct.1<-startr.correct+
  guides(fill=FALSE)+
  ylab(NULL)+
  #xlab(NULL)+
  coord_fixed(ratio=3)+
  ggtitle(label="B")+
  theme(plot.title = element_text(size = 12, margin = margin(t = 10, b = -1)))

changeKplot.correct.1<-changeKplot.correct+
  guides(fill=FALSE)+
  ylab(NULL)+
  #xlab(NULL)+
  coord_fixed(ratio=150)+
  ggtitle(label="C")+
  theme(plot.title = element_text(size = 12, margin = margin(t = 10, b = -1)))

changeRplot.correct.1<-changeRplot.correct+
  guides(fill=FALSE)+
  ylab(NULL)+
  #xlab(NULL)+
  coord_fixed(ratio=150)+
  ggtitle(label="D")+
  theme(plot.title = element_text(size = 12, margin = margin(t = 10, b = -1)))

Nyearsplot.correct.1<-Nyearsplot.correct+
  guides(fill=FALSE)+
  ylab(NULL)+
  #xlab(NULL)+
  coord_fixed(ratio=34)+
  ggtitle(label="E")+
  theme(plot.title = element_text(size = 12, margin = margin(t = 10, b = -1)))

#pull legend out of plot
g_legend <- function(a.gplot){
  tmp <- ggplot_gtable(ggplot_build(a.gplot))
  leg <- which(sapply(tmp$grobs, function(x) x$name) == "guide-box")
  legend <- tmp$grobs[[leg]]
  return(legend)}

leg<-g_legend(changeRplot.correct)

#create a blank grob to hold space where the legend would go next to D
blank <- grid.rect(gp=gpar(col="white"))

grid.arrange(arrangeGrob(noiseplot.correct.1, startr.correct.1, 
                         changeKplot.correct.1, changeRplot.correct.1,
                         Nyearsplot.correct.1, leg, 
                         ncol=6, widths=c(35,35,35,35,35,30)), 
             left=textGrob("\n                  Proportion of outcomes", rot=90,
                                       gp=gpar(fontsize=16, fontface="bold")))


pdf("figs/Figure_1_AICc_model_sets.pdf", height=3.4, width=11)
grid.arrange(arrangeGrob(noiseplot.correct.1, startr.correct.1, 
                         changeKplot.correct.1, changeRplot.correct.1,
                         Nyearsplot.correct.1, leg, 
                         ncol=6, widths=c(35,35,35,35,35,20)), 
             left=textGrob("        Proportion of outcomes in which top\n model(s) contain true scenario", rot=90,
                           gp=gpar(fontsize=12, fontface="bold")))

dev.off()