doc/Fig3.Rmd

---
title: "Figure 3 of the GERP paper"
output: pdf_document
---

```{r setup, include=TRUE}
#setwd("~/Documents/Github/pvpDiallel/")
knitr::opts_knit$set(root.dir=normalizePath('../'))
```

To reproduce the figures, we should set the current dir as your root path, i.e. `setwd("~/Documents/Github/GERP-diallel/")`. And then use `knitr` package to render the pdf file. Or simplely click `Knit PDF` icon in `RStudio`. To produce different figures into seperate pdf files, we should set `getpdf=TRUE` when calling the plotting functions.

First of all, determine fond size and set the getpdf option:
```{r}
#par(mar=c(5,4,4,2))
par(font=2, font.lab=2, font.axis=2)
fs = 1.6 # times bigger than default
fsize = 14 # absolute font size
getpdf = TRUE # get figures in seperated pdf [TRUE] or not [FALSE]
```

--------------------------

# Figure 3a and 3b
```{r, eval=TRUE, fig.width=10, fig.height=5}

library(ggplot2)
source("lib/multiplot.R")

plot_fig3ab <- function(outfile, getpdf){
  res <- read.csv("cache/var_explained_adk.csv")
  res1 <- subset(res, trait %in% "perse")
  res2 <- subset(res, trait %in% "MPH")

  res1$pheno <- toupper(res1$pheno)
  res2$pheno <- toupper(res2$pheno)
  
  t <- read.csv("data/hyb_heterosis.csv")
  bymed2 <- with(t, reorder(trait, abs(pMPH), median))
  #bymed2 <- with(trait, reorder(trait, pBPHmax, median))
  
  p1 <- ggplot(res1, aes(x=factor(pheno, levels=levels(bymed2)), y=h2,
                       fill=factor(type, levels=c("a2", "d2", "h2"), labels=c("A", "D", "k")))) + 
  geom_bar(position=position_dodge(), stat="identity") +
  xlab("") +
  ylim(c(0,1)) +
  ylab("Phenotypic Variance Explained") +
  ggtitle("") + theme_bw() +
  labs(fill="Effect") +
  theme(axis.text = element_text(size=fsize),
          axis.title=element_text(size=fsize, face="bold"),
          legend.title = element_text(size=fsize, face="bold"),
          legend.text = element_text(size=fsize))
  
  p2 <- ggplot(res2, aes(x=factor(pheno, levels=levels(bymed2)), y=h2, 
                       fill=factor(type, levels=c("a2", "d2", "h2"), labels=c("A", "D", "k")))) + 
  geom_bar(position=position_dodge(), stat="identity") +
  xlab("") +
  ylim(c(0,1)) +
  ylab("Phenotypic Variance Explained") +
  ggtitle("") + theme_bw() +
  labs(fill="Effect") +
  theme(axis.text = element_text(size=fsize),
          axis.title=element_text(size=fsize, face="bold"),
          legend.title = element_text(size=fsize, face="bold"),
          legend.text = element_text(size=fsize))

  multiplot(p1, p2, cols=2)
  if(getpdf){
    pdf(outfile, width=12, height=5)
    multiplot(p1, p2, cols=2)
    dev.off()
  }

}
######
plot_fig3ab(outfile="graphs/Fig_post_var.pdf", getpdf)
```

# Figure 3c and 3d

```{r, eval=TRUE, fig.width=10, fig.height=5}


library(beanplot)
library(ggplot2)
library(plyr)
#http://www.jstatsoft.org/v28/c01/paper
mybean <- function(inputdf, mymode="a2", ...){
  res1 <- ddply(inputdf, .(trait, mode, sp, type), summarise,
                r = mean(r),
                m = median(r))
  res1 <- subset(res1, type != "null")
  
  res1$mode <- as.character(res1$mode)
  res1 <- subset(res1, mode == mymode)
  res1$trait <- toupper(res1$trait)
  #print(nrow(res1))
  par(lend = 1, mai = c(0.8, 0.8, 0.5, 0.5))
  res1$type <- factor(res1$type, levels = c("real", "cs"))
  res1$trait <- factor(res1$trait, levels = toupper(c("TW",  "DTP", "DTS", "PHT", "EHT", "ASI", "GY")))
  beanplot(m ~ type + trait, data = res1, kernel="cosine", ll = 0.04, cex=1.5, side = "both", bw=0.02,
           border = NA, col = list(c("#d41243", "#d41243"), c("grey", "grey")), ...)
  #legend("bottomleft", fill = c("black", "grey"),
  #       legend = c("Group 2", "Group 1"))
  #return(res0)
  
  out <- data.frame()
  myt <- toupper(c("TW",  "DTP", "DTS", "PHT", "EHT", "ASI", "GY"))
  for(myti in myt){
    real <- subset(res1, type == "real" & trait == myti)
    rand <- subset(res1, type == "cs" & trait == myti)
    
    message(sprintf("###>>> real [ %s ] and random [ %s ]", nrow(real), nrow(rand)))
    test <- t.test(real$r, rand$r, alternative ="greater")
    
    tem <- data.frame(trait=myti, realmean=mean(real$r), csmean=mean(rand$r), pval=test$p.value)
    out <- rbind(out, tem)
  }

  return(out)
}

####
plot_fig3cd <- function(outfile, getpdf){
  res01 <- read.csv("largedata/res_realk_perse_42000.csv")
  res02 <- read.csv("largedata/res_realk_mph_42000.csv")
  
  par(mfrow=c(1,2))
  #par(mar=c(5,4,4,2))
  res1 <- mybean(inputdf=res01, mymode = "h2", ylim=c(0, 1), main="", ylab="Cross-validation Accuracy")
  res2 <- mybean(inputdf=res02, mymode = "h2", ylim=c(0, 1), main="", ylab="Cross-validation Accuracy")
  
  if(getpdf){
    pdf(outfile, height=5, width=12)
    par(mfrow=c(1,2))
    #par(mar=c(5,4,4,2))
    par(font=2, font.lab=2, font.axis=2)
    res1 <- mybean(inputdf=res01, mymode = "h2", ylim=c(0, 1), main="", ylab="Cross-validation Accuracy")
    res2 <- mybean(inputdf=res02, mymode = "h2", ylim=c(0, 1), main="", ylab="Cross-validation Accuracy")
    dev.off()
  }
  
  
}

###
plot_fig3cd(outfile="graphs/Fig3_perse_MPH_2plots.pdf", getpdf)


```