3.3 Fig 2E

nad = read.table('data/hNAD_B_gene_num')
inad = read.table('data/other_B_gene_num')
nad = nad[,4]/(nad[,3]-nad[,2])*1000000
inad = inad[,4]/(inad[,3]-inad[,2])*1000000
df = data.frame(variable=c(rep('hNAD',length(nad)),rep('non-hNAD',length(inad))),value=c(nad,inad))
ggplot(df, aes(variable, value))+ 
  geom_boxplot(width = 0.4,  notchwidth = 1, outlier.shape = NA,aes(fill=variable)) +
  labs(x=NULL,y="Gene count/Mb") +
  theme_classic() +
  theme(text = element_text(size = 20),legend.position = "none") +
  scale_fill_manual(values=c( "#2BA809","#00BFC4"))+ylim(0,25) 
## Warning: Removed 67 rows containing non-finite values (stat_boxplot).