diff --git a/rmd_analysis/expressionPC_covariate_r2.Rmd b/rmd_analysis/expressionPC_covariate_r2.Rmd deleted file mode 100644 index e0723e0..0000000 --- a/rmd_analysis/expressionPC_covariate_r2.Rmd +++ /dev/null @@ -1,112 +0,0 @@ ---- -title: "expressionPC_covariate_R2" -output: html_notebook ---- - - -```{r} -library(recount) -library(ggplot2) -library(RColorBrewer) -library(reshape2) - -load("../data/pc_loadings.Rdata") -load("../data/raw_protein_coding_withGC.Rdata") - -## none of the covariates have NA --> total sum of squares can be computed before hand -dat.cov <- lapply(gtex.rse, function(tiss) { - cov.dat <- tiss@colData[,c(10, 11, 21:80, 83)] - cov.dat <- cov.dat[,-which(sapply(cov.dat, function(x) length(unique(x))) == 1)] - cov.dat <- cov.dat[, -which(colnames(cov.dat) %in% c("smunpdrd","smpthnts", "smtstptref", "smnabtch", "smnabtchd", "smgebtch"))] ## not enought unique entries in more than one category, < 50 - cov.dat -}) - -pve.tissue <- mapply(function(x,y,z){ - pve.eachtiss <- matrix(ncol = z, nrow = ncol(y)) - for(i in 1:ncol(y)){ - pve.eachtiss[i,] <- sapply(summary(lm(x[,1:z]~y[,i])), function(p) p$r.squared) - } - colnames(pve.eachtiss) <- 1:z - rownames(pve.eachtiss) <- colnames(y) - pve.eachtiss -}, pc.loadings, dat.cov, num.pc.estimates, SIMPLIFY = FALSE) - -plot.r2 <- lapply(pve.tissue, melt) -``` - -```{r} -myPalette <- colorRampPalette(brewer.pal(9,'Blues'), space = "Lab") - -tiss<- "Subcutaneous" - -ggplot(plot.r2[[tiss]], aes(Var2, Var1)) + geom_tile(aes(fill = value), - colour = "white") + - # geom_text(size = 2, aes(label = prettyNum(value, digits=3, width=4, format="fg"))) + - scale_fill_gradientn(colours = myPalette(10)[1:6] - , limits = c(0,1) - , values = c(0, 0.1, 0.2, 0.3, 1) - ) + - xlab("") + ylab("Principal Components") + theme(axis.text.x=element_text(colour="black"), axis.text.y=element_text(colour="black"))+ - ggtitle(tiss) -``` -```{r} -tiss<- "Lung" - -ggplot(plot.r2[[tiss]], aes(Var2, Var1)) + geom_tile(aes(fill = value), - colour = "white") + - # geom_text(size = 2, aes(label = prettyNum(value, digits=3, width=4, format="fg"))) + - scale_fill_gradientn(colours = myPalette(10)[1:6] - , limits = c(0,1) - , values = c(0, 0.1, 0.2, 0.3, 1) - ) + - xlab("") + ylab("Principal Components") + theme(axis.text.x=element_text(colour="black"), axis.text.y=element_text(colour="black"))+ - ggtitle(tiss) -``` - -```{r} -tiss<- "Thyroid" - -ggplot(plot.r2[[tiss]], aes(Var2, Var1)) + geom_tile(aes(fill = value), - colour = "white") + - # geom_text(size = 2, aes(label = prettyNum(value, digits=3, width=4, format="fg"))) + - scale_fill_gradientn(colours = myPalette(10)[1:6] - , limits = c(0,1) - , values = c(0, 0.1, 0.2, 0.3, 1) - ) + - xlab("") + ylab("Principal Components") + theme(axis.text.x=element_text(colour="black"), axis.text.y=element_text(colour="black"))+ - ggtitle(tiss) -``` - -```{r} -tiss<- "Muscle" -ggplot(plot.r2[[tiss]], aes(Var2, Var1)) + geom_tile(aes(fill = value), - colour = "white") + - # geom_text(size = 2, aes(label = prettyNum(value, digits=3, width=4, format="fg"))) + - scale_fill_gradientn(colours = myPalette(10)[1:6] - , limits = c(0,1) - , values = c(0, 0.1, 0.2, 0.3, 1) - ) + - xlab("") + ylab("Principal Components") + theme(axis.text.x=element_text(colour="black"), axis.text.y=element_text(colour="black"))+ - ggtitle(tiss) -``` - -```{r} -tiss<- "Blood" - -ggplot(plot.r2[[tiss]], aes(Var2, Var1)) + geom_tile(aes(fill = value), - colour = "white") + - # geom_text(size = 2, aes(label = prettyNum(value, digits=3, width=4, format="fg"))) + - scale_fill_gradientn(colours = myPalette(10)[1:6] - , limits = c(0,1) - , values = c(0, 0.1, 0.2, 0.3, 1) - ) + - xlab("") + ylab("Principal Components") + theme(axis.text.x=element_text(colour="black"), axis.text.y=element_text(colour="black"))+ - ggtitle(tiss) -``` - -Add a new chunk by clicking the *Insert Chunk* button on the toolbar or by pressing *Cmd+Option+I*. - -When you save the notebook, an HTML file containing the code and output will be saved alongside it (click the *Preview* button or press *Cmd+Shift+K* to preview the HTML file). - -The preview shows you a rendered HTML copy of the contents of the editor. Consequently, unlike *Knit*, *Preview* does not run any R code chunks. Instead, the output of the chunk when it was last run in the editor is displayed. - diff --git a/rmd_analysis/expressionPC_covariate_r2.nb.html b/rmd_analysis/expressionPC_covariate_r2.nb.html deleted file mode 100644 index 6d7f92c..0000000 --- a/rmd_analysis/expressionPC_covariate_r2.nb.html +++ /dev/null @@ -1,345 +0,0 @@ - - - - - - - - - - - - - -expressionPC_covariate_R2 - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
- - - - - - - - - - - - - - - - - - - - -
library(recount)
-library(ggplot2)
-library(RColorBrewer)
-library(reshape2)
-load("../data/pc_loadings.Rdata")
-load("../data/raw_protein_coding_withGC.Rdata")
-## none of the covariates have NA --> total sum of squares can be computed before hand
-dat.cov <- lapply(gtex.rse, function(tiss) {
-  cov.dat <- tiss@colData[,c(10, 11, 21:80, 83)]
-  cov.dat <- cov.dat[,-which(sapply(cov.dat, function(x) length(unique(x))) == 1)]
-  cov.dat <- cov.dat[, -which(colnames(cov.dat) %in% c("smunpdrd","smpthnts", "smtstptref", "smnabtch", "smnabtchd", "smgebtch"))] ## not enought unique entries in more than one category, < 50
-  cov.dat
-})
-pve.tissue <- mapply(function(x,y,z){
-  pve.eachtiss <- matrix(ncol = z, nrow = ncol(y))
-  for(i in 1:ncol(y)){
-    pve.eachtiss[i,] <- sapply(summary(lm(x[,1:z]~y[,i])), function(p) p$r.squared)
-  }
-  colnames(pve.eachtiss) <- 1:z
-  rownames(pve.eachtiss) <- colnames(y)
-  pve.eachtiss
-}, pc.loadings, dat.cov, num.pc.estimates, SIMPLIFY = FALSE)
-plot.r2 <- lapply(pve.tissue, melt)
- - - - - - -
myPalette <- colorRampPalette(brewer.pal(9,'Blues'), space = "Lab")
-tiss<- "Subcutaneous"
-ggplot(plot.r2[[tiss]], aes(Var2, Var1)) + geom_tile(aes(fill = value),
-         colour = "white") + 
-        # geom_text(size = 2, aes(label = prettyNum(value, digits=3, width=4, format="fg"))) +
-        scale_fill_gradientn(colours = myPalette(10)[1:6]
-            , limits = c(0,1)
-        , values = c(0, 0.1, 0.2, 0.3, 1)
-        ) + 
-        xlab("") + ylab("Principal Components") + theme(axis.text.x=element_text(colour="black"), axis.text.y=element_text(colour="black"))+
-        ggtitle(tiss)
- - -

- - - - -
tiss<- "Lung"
-ggplot(plot.r2[[tiss]], aes(Var2, Var1)) + geom_tile(aes(fill = value),
-         colour = "white") + 
-        # geom_text(size = 2, aes(label = prettyNum(value, digits=3, width=4, format="fg"))) +
-        scale_fill_gradientn(colours = myPalette(10)[1:6]
-            , limits = c(0,1)
-        , values = c(0, 0.1, 0.2, 0.3, 1)
-        ) + 
-        xlab("") + ylab("Principal Components") + theme(axis.text.x=element_text(colour="black"), axis.text.y=element_text(colour="black"))+
-        ggtitle(tiss)
- - -

- - - - - - -
tiss<- "Thyroid"
-ggplot(plot.r2[[tiss]], aes(Var2, Var1)) + geom_tile(aes(fill = value),
-         colour = "white") + 
-        # geom_text(size = 2, aes(label = prettyNum(value, digits=3, width=4, format="fg"))) +
-        scale_fill_gradientn(colours = myPalette(10)[1:6]
-            , limits = c(0,1)
-        , values = c(0, 0.1, 0.2, 0.3, 1)
-        ) + 
-        xlab("") + ylab("Principal Components") + theme(axis.text.x=element_text(colour="black"), axis.text.y=element_text(colour="black"))+
-        ggtitle(tiss)
- - -

- - - - - - -
tiss<- "Muscle"
-ggplot(plot.r2[[tiss]], aes(Var2, Var1)) + geom_tile(aes(fill = value),
-         colour = "white") + 
-        # geom_text(size = 2, aes(label = prettyNum(value, digits=3, width=4, format="fg"))) +
-        scale_fill_gradientn(colours = myPalette(10)[1:6]
-            , limits = c(0,1)
-        , values = c(0, 0.1, 0.2, 0.3, 1)
-        ) + 
-        xlab("") + ylab("Principal Components") + theme(axis.text.x=element_text(colour="black"), axis.text.y=element_text(colour="black"))+
-        ggtitle(tiss)
- - -

- - - - - - -
tiss<- "Blood"
-ggplot(plot.r2[[tiss]], aes(Var2, Var1)) + geom_tile(aes(fill = value),
-         colour = "white") + 
-        # geom_text(size = 2, aes(label = prettyNum(value, digits=3, width=4, format="fg"))) +
-        scale_fill_gradientn(colours = myPalette(10)[1:6]
-            , limits = c(0,1)
-        , values = c(0, 0.1, 0.2, 0.3, 1)
-        ) + 
-        xlab("") + ylab("Principal Components") + theme(axis.text.x=element_text(colour="black"), axis.text.y=element_text(colour="black"))+
-        ggtitle(tiss)
- - -

- - - -

Add a new chunk by clicking the Insert Chunk button on the toolbar or by pressing Cmd+Option+I.

-

When you save the notebook, an HTML file containing the code and output will be saved alongside it (click the Preview button or press Cmd+Shift+K to preview the HTML file).

-

The preview shows you a rendered HTML copy of the contents of the editor. Consequently, unlike Knit, Preview does not run any R code chunks. Instead, the output of the chunk when it was last run in the editor is displayed.

- - -
LS0tCnRpdGxlOiAiZXhwcmVzc2lvblBDX2NvdmFyaWF0ZV9SMiIKb3V0cHV0OiBodG1sX25vdGVib29rCi0tLQoKCmBgYHtyfQpsaWJyYXJ5KHJlY291bnQpCmxpYnJhcnkoZ2dwbG90MikKbGlicmFyeShSQ29sb3JCcmV3ZXIpCmxpYnJhcnkocmVzaGFwZTIpCgpsb2FkKCIuLi9kYXRhL3BjX2xvYWRpbmdzLlJkYXRhIikKbG9hZCgiLi4vZGF0YS9yYXdfcHJvdGVpbl9jb2Rpbmdfd2l0aEdDLlJkYXRhIikKCiMjIG5vbmUgb2YgdGhlIGNvdmFyaWF0ZXMgaGF2ZSBOQSAtLT4gdG90YWwgc3VtIG9mIHNxdWFyZXMgY2FuIGJlIGNvbXB1dGVkIGJlZm9yZSBoYW5kCmRhdC5jb3YgPC0gbGFwcGx5KGd0ZXgucnNlLCBmdW5jdGlvbih0aXNzKSB7CiAgY292LmRhdCA8LSB0aXNzQGNvbERhdGFbLGMoMTAsIDExLCAyMTo4MCwgODMpXQogIGNvdi5kYXQgPC0gY292LmRhdFssLXdoaWNoKHNhcHBseShjb3YuZGF0LCBmdW5jdGlvbih4KSBsZW5ndGgodW5pcXVlKHgpKSkgPT0gMSldCiAgY292LmRhdCA8LSBjb3YuZGF0WywgLXdoaWNoKGNvbG5hbWVzKGNvdi5kYXQpICVpbiUgYygic211bnBkcmQiLCJzbXB0aG50cyIsICJzbXRzdHB0cmVmIiwgInNtbmFidGNoIiwgInNtbmFidGNoZCIsICJzbWdlYnRjaCIpKV0gIyMgbm90IGVub3VnaHQgdW5pcXVlIGVudHJpZXMgaW4gbW9yZSB0aGFuIG9uZSBjYXRlZ29yeSwgPCA1MAogIGNvdi5kYXQKfSkKCnB2ZS50aXNzdWUgPC0gbWFwcGx5KGZ1bmN0aW9uKHgseSx6KXsKICBwdmUuZWFjaHRpc3MgPC0gbWF0cml4KG5jb2wgPSB6LCBucm93ID0gbmNvbCh5KSkKICBmb3IoaSBpbiAxOm5jb2woeSkpewogICAgcHZlLmVhY2h0aXNzW2ksXSA8LSBzYXBwbHkoc3VtbWFyeShsbSh4WywxOnpdfnlbLGldKSksIGZ1bmN0aW9uKHApIHAkci5zcXVhcmVkKQogIH0KICBjb2xuYW1lcyhwdmUuZWFjaHRpc3MpIDwtIDE6egogIHJvd25hbWVzKHB2ZS5lYWNodGlzcykgPC0gY29sbmFtZXMoeSkKICBwdmUuZWFjaHRpc3MKfSwgcGMubG9hZGluZ3MsIGRhdC5jb3YsIG51bS5wYy5lc3RpbWF0ZXMsIFNJTVBMSUZZID0gRkFMU0UpCgpwbG90LnIyIDwtIGxhcHBseShwdmUudGlzc3VlLCBtZWx0KQpgYGAKCmBgYHtyfQpteVBhbGV0dGUgPC0gY29sb3JSYW1wUGFsZXR0ZShicmV3ZXIucGFsKDksJ0JsdWVzJyksIHNwYWNlID0gIkxhYiIpCgp0aXNzPC0gIlN1YmN1dGFuZW91cyIKCmdncGxvdChwbG90LnIyW1t0aXNzXV0sIGFlcyhWYXIyLCBWYXIxKSkgKyBnZW9tX3RpbGUoYWVzKGZpbGwgPSB2YWx1ZSksCgkgICAgIGNvbG91ciA9ICJ3aGl0ZSIpICsgCgkJIyBnZW9tX3RleHQoc2l6ZSA9IDIsIGFlcyhsYWJlbCA9IHByZXR0eU51bSh2YWx1ZSwgZGlnaXRzPTMsIHdpZHRoPTQsIGZvcm1hdD0iZmciKSkpICsKCQlzY2FsZV9maWxsX2dyYWRpZW50bihjb2xvdXJzID0gbXlQYWxldHRlKDEwKVsxOjZdCgkJCSwgbGltaXRzID0gYygwLDEpCgkJLCB2YWx1ZXMgPSBjKDAsIDAuMSwgMC4yLCAwLjMsIDEpCgkJKSArIAoJCXhsYWIoIiIpICsgeWxhYigiUHJpbmNpcGFsIENvbXBvbmVudHMiKSArIHRoZW1lKGF4aXMudGV4dC54PWVsZW1lbnRfdGV4dChjb2xvdXI9ImJsYWNrIiksIGF4aXMudGV4dC55PWVsZW1lbnRfdGV4dChjb2xvdXI9ImJsYWNrIikpKwoJCWdndGl0bGUodGlzcykKYGBgCmBgYHtyfQp0aXNzPC0gIkx1bmciCgpnZ3Bsb3QocGxvdC5yMltbdGlzc11dLCBhZXMoVmFyMiwgVmFyMSkpICsgZ2VvbV90aWxlKGFlcyhmaWxsID0gdmFsdWUpLAoJICAgICBjb2xvdXIgPSAid2hpdGUiKSArIAoJCSMgZ2VvbV90ZXh0KHNpemUgPSAyLCBhZXMobGFiZWwgPSBwcmV0dHlOdW0odmFsdWUsIGRpZ2l0cz0zLCB3aWR0aD00LCBmb3JtYXQ9ImZnIikpKSArCgkJc2NhbGVfZmlsbF9ncmFkaWVudG4oY29sb3VycyA9IG15UGFsZXR0ZSgxMClbMTo2XQoJCQksIGxpbWl0cyA9IGMoMCwxKQoJCSwgdmFsdWVzID0gYygwLCAwLjEsIDAuMiwgMC4zLCAxKQoJCSkgKyAKCQl4bGFiKCIiKSArIHlsYWIoIlByaW5jaXBhbCBDb21wb25lbnRzIikgKyB0aGVtZShheGlzLnRleHQueD1lbGVtZW50X3RleHQoY29sb3VyPSJibGFjayIpLCBheGlzLnRleHQueT1lbGVtZW50X3RleHQoY29sb3VyPSJibGFjayIpKSsKCQlnZ3RpdGxlKHRpc3MpCmBgYAoKYGBge3J9CnRpc3M8LSAiVGh5cm9pZCIKCmdncGxvdChwbG90LnIyW1t0aXNzXV0sIGFlcyhWYXIyLCBWYXIxKSkgKyBnZW9tX3RpbGUoYWVzKGZpbGwgPSB2YWx1ZSksCgkgICAgIGNvbG91ciA9ICJ3aGl0ZSIpICsgCgkJIyBnZW9tX3RleHQoc2l6ZSA9IDIsIGFlcyhsYWJlbCA9IHByZXR0eU51bSh2YWx1ZSwgZGlnaXRzPTMsIHdpZHRoPTQsIGZvcm1hdD0iZmciKSkpICsKCQlzY2FsZV9maWxsX2dyYWRpZW50bihjb2xvdXJzID0gbXlQYWxldHRlKDEwKVsxOjZdCgkJCSwgbGltaXRzID0gYygwLDEpCgkJLCB2YWx1ZXMgPSBjKDAsIDAuMSwgMC4yLCAwLjMsIDEpCgkJKSArIAoJCXhsYWIoIiIpICsgeWxhYigiUHJpbmNpcGFsIENvbXBvbmVudHMiKSArIHRoZW1lKGF4aXMudGV4dC54PWVsZW1lbnRfdGV4dChjb2xvdXI9ImJsYWNrIiksIGF4aXMudGV4dC55PWVsZW1lbnRfdGV4dChjb2xvdXI9ImJsYWNrIikpKwoJCWdndGl0bGUodGlzcykKYGBgCgpgYGB7cn0KdGlzczwtICJNdXNjbGUiCmdncGxvdChwbG90LnIyW1t0aXNzXV0sIGFlcyhWYXIyLCBWYXIxKSkgKyBnZW9tX3RpbGUoYWVzKGZpbGwgPSB2YWx1ZSksCgkgICAgIGNvbG91ciA9ICJ3aGl0ZSIpICsgCgkJIyBnZW9tX3RleHQoc2l6ZSA9IDIsIGFlcyhsYWJlbCA9IHByZXR0eU51bSh2YWx1ZSwgZGlnaXRzPTMsIHdpZHRoPTQsIGZvcm1hdD0iZmciKSkpICsKCQlzY2FsZV9maWxsX2dyYWRpZW50bihjb2xvdXJzID0gbXlQYWxldHRlKDEwKVsxOjZdCgkJCSwgbGltaXRzID0gYygwLDEpCgkJLCB2YWx1ZXMgPSBjKDAsIDAuMSwgMC4yLCAwLjMsIDEpCgkJKSArIAoJCXhsYWIoIiIpICsgeWxhYigiUHJpbmNpcGFsIENvbXBvbmVudHMiKSArIHRoZW1lKGF4aXMudGV4dC54PWVsZW1lbnRfdGV4dChjb2xvdXI9ImJsYWNrIiksIGF4aXMudGV4dC55PWVsZW1lbnRfdGV4dChjb2xvdXI9ImJsYWNrIikpKwoJCWdndGl0bGUodGlzcykKYGBgCgpgYGB7cn0KdGlzczwtICJCbG9vZCIKCmdncGxvdChwbG90LnIyW1t0aXNzXV0sIGFlcyhWYXIyLCBWYXIxKSkgKyBnZW9tX3RpbGUoYWVzKGZpbGwgPSB2YWx1ZSksCgkgICAgIGNvbG91ciA9ICJ3aGl0ZSIpICsgCgkJIyBnZW9tX3RleHQoc2l6ZSA9IDIsIGFlcyhsYWJlbCA9IHByZXR0eU51bSh2YWx1ZSwgZGlnaXRzPTMsIHdpZHRoPTQsIGZvcm1hdD0iZmciKSkpICsKCQlzY2FsZV9maWxsX2dyYWRpZW50bihjb2xvdXJzID0gbXlQYWxldHRlKDEwKVsxOjZdCgkJCSwgbGltaXRzID0gYygwLDEpCgkJLCB2YWx1ZXMgPSBjKDAsIDAuMSwgMC4yLCAwLjMsIDEpCgkJKSArIAoJCXhsYWIoIiIpICsgeWxhYigiUHJpbmNpcGFsIENvbXBvbmVudHMiKSArIHRoZW1lKGF4aXMudGV4dC54PWVsZW1lbnRfdGV4dChjb2xvdXI9ImJsYWNrIiksIGF4aXMudGV4dC55PWVsZW1lbnRfdGV4dChjb2xvdXI9ImJsYWNrIikpKwoJCWdndGl0bGUodGlzcykKYGBgCgpBZGQgYSBuZXcgY2h1bmsgYnkgY2xpY2tpbmcgdGhlICpJbnNlcnQgQ2h1bmsqIGJ1dHRvbiBvbiB0aGUgdG9vbGJhciBvciBieSBwcmVzc2luZyAqQ21kK09wdGlvbitJKi4KCldoZW4geW91IHNhdmUgdGhlIG5vdGVib29rLCBhbiBIVE1MIGZpbGUgY29udGFpbmluZyB0aGUgY29kZSBhbmQgb3V0cHV0IHdpbGwgYmUgc2F2ZWQgYWxvbmdzaWRlIGl0IChjbGljayB0aGUgKlByZXZpZXcqIGJ1dHRvbiBvciBwcmVzcyAqQ21kK1NoaWZ0K0sqIHRvIHByZXZpZXcgdGhlIEhUTUwgZmlsZSkuIAoKVGhlIHByZXZpZXcgc2hvd3MgeW91IGEgcmVuZGVyZWQgSFRNTCBjb3B5IG9mIHRoZSBjb250ZW50cyBvZiB0aGUgZWRpdG9yLiBDb25zZXF1ZW50bHksIHVubGlrZSAqS25pdCosICpQcmV2aWV3KiBkb2VzIG5vdCBydW4gYW55IFIgY29kZSBjaHVua3MuIEluc3RlYWQsIHRoZSBvdXRwdXQgb2YgdGhlIGNodW5rIHdoZW4gaXQgd2FzIGxhc3QgcnVuIGluIHRoZSBlZGl0b3IgaXMgZGlzcGxheWVkLgoK
- - - -
- - - - - - - - diff --git a/rmd_analysis/genes_assigned_plots.Rmd b/rmd_analysis/genes_assigned_plots.Rmd deleted file mode 100644 index b144950..0000000 --- a/rmd_analysis/genes_assigned_plots.Rmd +++ /dev/null @@ -1,52 +0,0 @@ ---- -title: "WGCNA - # genes assigned to a module (non-gray)" -output: html_notebook ---- - -```{r "setup", include=FALSE} -require("knitr") -opts_knit$set(root.dir = "/work-zfs/abattle4/parsana/networks_correction_v/networks/") -``` - -```{r} -rm(list = ls()) -library(reshape2) -library(ggplot2) -load("raw/wgcna_networks.Rdata") -plot.mod <- lapply(dat.net, function(y) sapply(y, function(x) length(which(x$colors!=0)))) -plot.mod <- melt(do.call(cbind, plot.mod)) -ggplot(plot.mod, aes(x = Var1, y = value, col = Var2)) + geom_point()+ggtitle("Raw")+ - xlab("cut-height") + ylab("# genes assigned to modules") -``` - -```{r} -load("rin/wgcna_networks.Rdata") -plot.mod <- lapply(dat.net, function(y) sapply(y, function(x) length(which(x$colors!=0)))) -plot.mod <- melt(do.call(cbind, plot.mod)) -ggplot(plot.mod, aes(x = Var1, y = value, col = Var2)) + geom_point()+ggtitle("RIN")+ - xlab("cut-height") + ylab("# genes assigned to modules") -``` - -```{r} -load("quarterpc/wgcna_networks.Rdata") -plot.mod <- lapply(dat.net, function(y) sapply(y, function(x) length(which(x$colors!=0)))) -plot.mod <- melt(do.call(cbind, plot.mod)) -ggplot(plot.mod, aes(x = Var1, y = value, col = Var2)) + geom_point()+ggtitle("quarter-PC")+ - xlab("cut-height") + ylab("# genes assigned to modules") -``` - -```{r} -load("halfpc//wgcna_networks.Rdata") -plot.mod <- lapply(dat.net, function(y) sapply(y, function(x) length(which(x$colors!=0)))) -plot.mod <- melt(do.call(cbind, plot.mod)) -ggplot(plot.mod, aes(x = Var1, y = value, col = Var2)) + geom_point()+ggtitle("halfPC")+ - xlab("cut-height") + ylab("# genes assigned to modules") -``` - -```{r} -load("pc//wgcna_networks.Rdata") -plot.mod <- lapply(dat.net, function(y) sapply(y, function(x) length(which(x$colors!=0)))) -plot.mod <- melt(do.call(cbind, plot.mod)) -ggplot(plot.mod, aes(x = Var1, y = value, col = Var2)) + geom_point()+ggtitle("PC")+ - xlab("cut-height") + ylab("# genes assigned to modules") -``` diff --git a/rmd_analysis/genes_assigned_plots.nb.html b/rmd_analysis/genes_assigned_plots.nb.html deleted file mode 100644 index 9efc696..0000000 --- a/rmd_analysis/genes_assigned_plots.nb.html +++ /dev/null @@ -1,292 +0,0 @@ - - - - - - - - - - - - - -WGCNA - # genes assigned to a module (non-gray) - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
- - - - - - - - - - - - - - - - - - - - - - -
rm(list = ls())
-library(reshape2)
-library(ggplot2)
-load("raw/wgcna_networks.Rdata")
-plot.mod <- lapply(dat.net, function(y) sapply(y, function(x) length(which(x$colors!=0))))
-plot.mod <- melt(do.call(cbind, plot.mod))
-ggplot(plot.mod, aes(x = Var1, y = value, col = Var2)) + geom_point()+ggtitle("Raw")+
-  xlab("cut-height") + ylab("# genes assigned to modules")
- - -

- - - - - - -
load("rin/wgcna_networks.Rdata")
-plot.mod <- lapply(dat.net, function(y) sapply(y, function(x) length(which(x$colors!=0))))
-plot.mod <- melt(do.call(cbind, plot.mod))
-ggplot(plot.mod, aes(x = Var1, y = value, col = Var2)) + geom_point()+ggtitle("RIN")+
-  xlab("cut-height") + ylab("# genes assigned to modules")
- - -

- - - - - - -
load("quarterpc/wgcna_networks.Rdata")
-plot.mod <- lapply(dat.net, function(y) sapply(y, function(x) length(which(x$colors!=0))))
-plot.mod <- melt(do.call(cbind, plot.mod))
-ggplot(plot.mod, aes(x = Var1, y = value, col = Var2)) + geom_point()+ggtitle("quarter-PC")+
-  xlab("cut-height") + ylab("# genes assigned to modules")
- - -

- - - - - - -
load("halfpc//wgcna_networks.Rdata")
-plot.mod <- lapply(dat.net, function(y) sapply(y, function(x) length(which(x$colors!=0))))
-plot.mod <- melt(do.call(cbind, plot.mod))
-ggplot(plot.mod, aes(x = Var1, y = value, col = Var2)) + geom_point()+ggtitle("halfPC")+
-  xlab("cut-height") + ylab("# genes assigned to modules")
- - -

- - - - - - -
load("pc//wgcna_networks.Rdata")
-plot.mod <- lapply(dat.net, function(y) sapply(y, function(x) length(which(x$colors!=0))))
-plot.mod <- melt(do.call(cbind, plot.mod))
-ggplot(plot.mod, aes(x = Var1, y = value, col = Var2)) + geom_point()+ggtitle("PC")+
-  xlab("cut-height") + ylab("# genes assigned to modules")
- - -

- - - -
LS0tCnRpdGxlOiAiV0dDTkEgLSAjIGdlbmVzIGFzc2lnbmVkIHRvIGEgbW9kdWxlIChub24tZ3JheSkiCm91dHB1dDogaHRtbF9ub3RlYm9vawotLS0KCmBgYHtyICJzZXR1cCIsIGluY2x1ZGU9RkFMU0V9CnJlcXVpcmUoImtuaXRyIikKb3B0c19rbml0JHNldChyb290LmRpciA9ICIvd29yay16ZnMvYWJhdHRsZTQvcGFyc2FuYS9uZXR3b3Jrc19jb3JyZWN0aW9uX3YvbmV0d29ya3MvIikKYGBgCgpgYGB7cn0Kcm0obGlzdCA9IGxzKCkpCmxpYnJhcnkocmVzaGFwZTIpCmxpYnJhcnkoZ2dwbG90MikKbG9hZCgicmF3L3dnY25hX25ldHdvcmtzLlJkYXRhIikKcGxvdC5tb2QgPC0gbGFwcGx5KGRhdC5uZXQsIGZ1bmN0aW9uKHkpIHNhcHBseSh5LCBmdW5jdGlvbih4KSBsZW5ndGgod2hpY2goeCRjb2xvcnMhPTApKSkpCnBsb3QubW9kIDwtIG1lbHQoZG8uY2FsbChjYmluZCwgcGxvdC5tb2QpKQpnZ3Bsb3QocGxvdC5tb2QsIGFlcyh4ID0gVmFyMSwgeSA9IHZhbHVlLCBjb2wgPSBWYXIyKSkgKyBnZW9tX3BvaW50KCkrZ2d0aXRsZSgiUmF3IikrCiAgeGxhYigiY3V0LWhlaWdodCIpICsgeWxhYigiIyBnZW5lcyBhc3NpZ25lZCB0byBtb2R1bGVzIikKYGBgCgpgYGB7cn0KbG9hZCgicmluL3dnY25hX25ldHdvcmtzLlJkYXRhIikKcGxvdC5tb2QgPC0gbGFwcGx5KGRhdC5uZXQsIGZ1bmN0aW9uKHkpIHNhcHBseSh5LCBmdW5jdGlvbih4KSBsZW5ndGgod2hpY2goeCRjb2xvcnMhPTApKSkpCnBsb3QubW9kIDwtIG1lbHQoZG8uY2FsbChjYmluZCwgcGxvdC5tb2QpKQpnZ3Bsb3QocGxvdC5tb2QsIGFlcyh4ID0gVmFyMSwgeSA9IHZhbHVlLCBjb2wgPSBWYXIyKSkgKyBnZW9tX3BvaW50KCkrZ2d0aXRsZSgiUklOIikrCiAgeGxhYigiY3V0LWhlaWdodCIpICsgeWxhYigiIyBnZW5lcyBhc3NpZ25lZCB0byBtb2R1bGVzIikKYGBgCgpgYGB7cn0KbG9hZCgicXVhcnRlcnBjL3dnY25hX25ldHdvcmtzLlJkYXRhIikKcGxvdC5tb2QgPC0gbGFwcGx5KGRhdC5uZXQsIGZ1bmN0aW9uKHkpIHNhcHBseSh5LCBmdW5jdGlvbih4KSBsZW5ndGgod2hpY2goeCRjb2xvcnMhPTApKSkpCnBsb3QubW9kIDwtIG1lbHQoZG8uY2FsbChjYmluZCwgcGxvdC5tb2QpKQpnZ3Bsb3QocGxvdC5tb2QsIGFlcyh4ID0gVmFyMSwgeSA9IHZhbHVlLCBjb2wgPSBWYXIyKSkgKyBnZW9tX3BvaW50KCkrZ2d0aXRsZSgicXVhcnRlci1QQyIpKwogIHhsYWIoImN1dC1oZWlnaHQiKSArIHlsYWIoIiMgZ2VuZXMgYXNzaWduZWQgdG8gbW9kdWxlcyIpCmBgYAoKYGBge3J9CmxvYWQoImhhbGZwYy8vd2djbmFfbmV0d29ya3MuUmRhdGEiKQpwbG90Lm1vZCA8LSBsYXBwbHkoZGF0Lm5ldCwgZnVuY3Rpb24oeSkgc2FwcGx5KHksIGZ1bmN0aW9uKHgpIGxlbmd0aCh3aGljaCh4JGNvbG9ycyE9MCkpKSkKcGxvdC5tb2QgPC0gbWVsdChkby5jYWxsKGNiaW5kLCBwbG90Lm1vZCkpCmdncGxvdChwbG90Lm1vZCwgYWVzKHggPSBWYXIxLCB5ID0gdmFsdWUsIGNvbCA9IFZhcjIpKSArIGdlb21fcG9pbnQoKStnZ3RpdGxlKCJoYWxmUEMiKSsKICB4bGFiKCJjdXQtaGVpZ2h0IikgKyB5bGFiKCIjIGdlbmVzIGFzc2lnbmVkIHRvIG1vZHVsZXMiKQpgYGAKCmBgYHtyfQpsb2FkKCJwYy8vd2djbmFfbmV0d29ya3MuUmRhdGEiKQpwbG90Lm1vZCA8LSBsYXBwbHkoZGF0Lm5ldCwgZnVuY3Rpb24oeSkgc2FwcGx5KHksIGZ1bmN0aW9uKHgpIGxlbmd0aCh3aGljaCh4JGNvbG9ycyE9MCkpKSkKcGxvdC5tb2QgPC0gbWVsdChkby5jYWxsKGNiaW5kLCBwbG90Lm1vZCkpCmdncGxvdChwbG90Lm1vZCwgYWVzKHggPSBWYXIxLCB5ID0gdmFsdWUsIGNvbCA9IFZhcjIpKSArIGdlb21fcG9pbnQoKStnZ3RpdGxlKCJQQyIpKwogIHhsYWIoImN1dC1oZWlnaHQiKSArIHlsYWIoIiMgZ2VuZXMgYXNzaWduZWQgdG8gbW9kdWxlcyIpCmBgYAo=
- - - -
- - - - - - - - diff --git a/rmd_analysis/module_count_bytissue.Rmd b/rmd_analysis/module_count_bytissue.Rmd deleted file mode 100644 index 0079a9e..0000000 --- a/rmd_analysis/module_count_bytissue.Rmd +++ /dev/null @@ -1,85 +0,0 @@ ---- -title: "WGCNA - # genes assigned to a module (non-gray) by tissue" -output: html_notebook ---- - -```{r "setup", include=FALSE} -require("knitr") -opts_knit$set(root.dir = "/work-zfs/abattle4/parsana/networks_correction/networks/") -``` - -```{r} -rm(list = ls()) -library(reshape2) -library(ggplot2) -load("raw/wgcna_networks.Rdata") -tiss <- "Thyroid" -raw <- sapply(dat.net[[tiss]], function(x) length(which(x$colors!=0))) - -load("rin/wgcna_networks.Rdata") -rin <- sapply(dat.net[[tiss]], function(x) length(which(x$colors!=0))) - -load("quarterpc/wgcna_networks.Rdata") -quarterPC <- sapply(dat.net[[tiss]], function(x) length(which(x$colors!=0))) - -load("halfpc//wgcna_networks.Rdata") -halfPC <- sapply(dat.net[[tiss]], function(x) length(which(x$colors!=0))) - -load("pc//wgcna_networks.Rdata") -pc <- sapply(dat.net[[tiss]], function(x) length(which(x$colors!=0))) - -plot.mod <- melt(cbind(raw, rin, quarterPC, halfPC, pc)) -plot.mod$Var2 <- factor(plot.mod$Var2, levels = c("pc", "halfPC", "quarterPC", "rin", "raw"), labels = c("PC", "half-PC", "quarter-PC", "RIN", "uncorrected")) - -ggplot(plot.mod, aes(x = Var1, y = value, col = Var2)) + geom_point()+ggtitle(tiss)+ - xlab("cut-height") + ylab("# genes assigned to modules") -``` - -```{r} -tiss <- "Subcutaneous" -load("raw/wgcna_networks.Rdata") -raw <- sapply(dat.net[[tiss]], function(x) length(which(x$colors!=0))) - -load("rin/wgcna_networks.Rdata") -rin <- sapply(dat.net[[tiss]], function(x) length(which(x$colors!=0))) - -load("quarterpc/wgcna_networks.Rdata") -quarterPC <- sapply(dat.net[[tiss]], function(x) length(which(x$colors!=0))) - -load("halfpc//wgcna_networks.Rdata") -halfPC <- sapply(dat.net[[tiss]], function(x) length(which(x$colors!=0))) - -load("pc//wgcna_networks.Rdata") -pc <- sapply(dat.net[[tiss]], function(x) length(which(x$colors!=0))) - -plot.mod <- melt(cbind(raw, rin, quarterPC, halfPC, pc)) -plot.mod$Var2 <- factor(plot.mod$Var2, levels = c("pc", "halfPC", "quarterPC", "rin", "raw"), labels = c("PC", "half-PC", "quarter-PC", "RIN", "uncorrected")) - -ggplot(plot.mod, aes(x = Var1, y = value, col = Var2)) + geom_point()+ggtitle(tiss)+ - xlab("cut-height") + ylab("# genes assigned to modules") -``` - -```{r} -tiss <- "Lung" -load("raw/wgcna_networks.Rdata") -raw <- sapply(dat.net[[tiss]], function(x) length(which(x$colors!=0))) - -load("rin/wgcna_networks.Rdata") -rin <- sapply(dat.net[[tiss]], function(x) length(which(x$colors!=0))) - -load("quarterpc/wgcna_networks.Rdata") -quarterPC <- sapply(dat.net[[tiss]], function(x) length(which(x$colors!=0))) - -load("halfpc//wgcna_networks.Rdata") -halfPC <- sapply(dat.net[[tiss]], function(x) length(which(x$colors!=0))) - -load("pc//wgcna_networks.Rdata") -pc <- sapply(dat.net[[tiss]], function(x) length(which(x$colors!=0))) - -plot.mod <- melt(cbind(raw, rin, quarterPC, halfPC, pc)) -plot.mod$Var2 <- factor(plot.mod$Var2, levels = c("pc", "halfPC", "quarterPC", "rin", "raw"), labels = c("PC", "half-PC", "quarter-PC", "RIN", "uncorrected")) - -ggplot(plot.mod, aes(x = Var1, y = value, col = Var2)) + geom_point()+ggtitle(tiss)+ - xlab("cut-height") + ylab("# genes assigned to modules") -``` - diff --git a/rmd_analysis/module_count_bytissue.nb.html b/rmd_analysis/module_count_bytissue.nb.html deleted file mode 100644 index 9f3f483..0000000 --- a/rmd_analysis/module_count_bytissue.nb.html +++ /dev/null @@ -1,296 +0,0 @@ - - - - - - - - - - - - - -WGCNA - # genes assigned to a module (non-gray) by tissue - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
- - - - - - - - - - - - - - - - - - - - - - -
rm(list = ls())
-library(reshape2)
-library(ggplot2)
-load("raw/wgcna_networks.Rdata")
-tiss <- "Thyroid"
-raw <- sapply(dat.net[[tiss]], function(x) length(which(x$colors!=0)))
-load("rin/wgcna_networks.Rdata")
-rin <- sapply(dat.net[[tiss]], function(x) length(which(x$colors!=0)))
-load("quarterpc/wgcna_networks.Rdata")
-quarterPC <- sapply(dat.net[[tiss]], function(x) length(which(x$colors!=0)))
-load("halfpc//wgcna_networks.Rdata")
-halfPC <- sapply(dat.net[[tiss]], function(x) length(which(x$colors!=0)))
-load("pc//wgcna_networks.Rdata")
-pc <- sapply(dat.net[[tiss]], function(x) length(which(x$colors!=0)))
-plot.mod <- melt(cbind(raw, rin, quarterPC, halfPC, pc))
-plot.mod$Var2 <- factor(plot.mod$Var2, levels = c("pc", "halfPC", "quarterPC", "rin", "raw"), labels = c("PC", "half-PC", "quarter-PC", "RIN", "uncorrected"))
-ggplot(plot.mod, aes(x = Var1, y = value, col = Var2)) + geom_point()+ggtitle(tiss)+
-  xlab("cut-height") + ylab("# genes assigned to modules")
- - -

- - - - - - -
tiss <- "Subcutaneous"
-load("raw/wgcna_networks.Rdata")
-raw <- sapply(dat.net[[tiss]], function(x) length(which(x$colors!=0)))
-load("rin/wgcna_networks.Rdata")
-rin <- sapply(dat.net[[tiss]], function(x) length(which(x$colors!=0)))
-load("quarterpc/wgcna_networks.Rdata")
-quarterPC <- sapply(dat.net[[tiss]], function(x) length(which(x$colors!=0)))
-load("halfpc//wgcna_networks.Rdata")
-halfPC <- sapply(dat.net[[tiss]], function(x) length(which(x$colors!=0)))
-load("pc//wgcna_networks.Rdata")
-pc <- sapply(dat.net[[tiss]], function(x) length(which(x$colors!=0)))
-plot.mod <- melt(cbind(raw, rin, quarterPC, halfPC, pc))
-plot.mod$Var2 <- factor(plot.mod$Var2, levels = c("pc", "halfPC", "quarterPC", "rin", "raw"), labels = c("PC", "half-PC", "quarter-PC", "RIN", "uncorrected"))
-ggplot(plot.mod, aes(x = Var1, y = value, col = Var2)) + geom_point()+ggtitle(tiss)+
-  xlab("cut-height") + ylab("# genes assigned to modules")
- - -

- - - - - - -
tiss <- "Lung"
-load("raw/wgcna_networks.Rdata")
-raw <- sapply(dat.net[[tiss]], function(x) length(which(x$colors!=0)))
-load("rin/wgcna_networks.Rdata")
-rin <- sapply(dat.net[[tiss]], function(x) length(which(x$colors!=0)))
-load("quarterpc/wgcna_networks.Rdata")
-quarterPC <- sapply(dat.net[[tiss]], function(x) length(which(x$colors!=0)))
-load("halfpc//wgcna_networks.Rdata")
-halfPC <- sapply(dat.net[[tiss]], function(x) length(which(x$colors!=0)))
-load("pc//wgcna_networks.Rdata")
-pc <- sapply(dat.net[[tiss]], function(x) length(which(x$colors!=0)))
-plot.mod <- melt(cbind(raw, rin, quarterPC, halfPC, pc))
-plot.mod$Var2 <- factor(plot.mod$Var2, levels = c("pc", "halfPC", "quarterPC", "rin", "raw"), labels = c("PC", "half-PC", "quarter-PC", "RIN", "uncorrected"))
-ggplot(plot.mod, aes(x = Var1, y = value, col = Var2)) + geom_point()+ggtitle(tiss)+
-  xlab("cut-height") + ylab("# genes assigned to modules")
- - -

- - - - - -
LS0tCnRpdGxlOiAiV0dDTkEgLSAjIGdlbmVzIGFzc2lnbmVkIHRvIGEgbW9kdWxlIChub24tZ3JheSkgYnkgdGlzc3VlIgpvdXRwdXQ6IGh0bWxfbm90ZWJvb2sKLS0tCgpgYGB7ciAic2V0dXAiLCBpbmNsdWRlPUZBTFNFfQpyZXF1aXJlKCJrbml0ciIpCm9wdHNfa25pdCRzZXQocm9vdC5kaXIgPSAiL3dvcmstemZzL2FiYXR0bGU0L3BhcnNhbmEvbmV0d29ya3NfY29ycmVjdGlvbi9uZXR3b3Jrcy8iKQpgYGAKCmBgYHtyfQpybShsaXN0ID0gbHMoKSkKbGlicmFyeShyZXNoYXBlMikKbGlicmFyeShnZ3Bsb3QyKQpsb2FkKCJyYXcvd2djbmFfbmV0d29ya3MuUmRhdGEiKQp0aXNzIDwtICJUaHlyb2lkIgpyYXcgPC0gc2FwcGx5KGRhdC5uZXRbW3Rpc3NdXSwgZnVuY3Rpb24oeCkgbGVuZ3RoKHdoaWNoKHgkY29sb3JzIT0wKSkpCgpsb2FkKCJyaW4vd2djbmFfbmV0d29ya3MuUmRhdGEiKQpyaW4gPC0gc2FwcGx5KGRhdC5uZXRbW3Rpc3NdXSwgZnVuY3Rpb24oeCkgbGVuZ3RoKHdoaWNoKHgkY29sb3JzIT0wKSkpCgpsb2FkKCJxdWFydGVycGMvd2djbmFfbmV0d29ya3MuUmRhdGEiKQpxdWFydGVyUEMgPC0gc2FwcGx5KGRhdC5uZXRbW3Rpc3NdXSwgZnVuY3Rpb24oeCkgbGVuZ3RoKHdoaWNoKHgkY29sb3JzIT0wKSkpCgpsb2FkKCJoYWxmcGMvL3dnY25hX25ldHdvcmtzLlJkYXRhIikKaGFsZlBDIDwtIHNhcHBseShkYXQubmV0W1t0aXNzXV0sIGZ1bmN0aW9uKHgpIGxlbmd0aCh3aGljaCh4JGNvbG9ycyE9MCkpKQoKbG9hZCgicGMvL3dnY25hX25ldHdvcmtzLlJkYXRhIikKcGMgPC0gc2FwcGx5KGRhdC5uZXRbW3Rpc3NdXSwgZnVuY3Rpb24oeCkgbGVuZ3RoKHdoaWNoKHgkY29sb3JzIT0wKSkpCgpwbG90Lm1vZCA8LSBtZWx0KGNiaW5kKHJhdywgcmluLCBxdWFydGVyUEMsIGhhbGZQQywgcGMpKQpwbG90Lm1vZCRWYXIyIDwtIGZhY3RvcihwbG90Lm1vZCRWYXIyLCBsZXZlbHMgPSBjKCJwYyIsICJoYWxmUEMiLCAicXVhcnRlclBDIiwgInJpbiIsICJyYXciKSwgbGFiZWxzID0gYygiUEMiLCAiaGFsZi1QQyIsICJxdWFydGVyLVBDIiwgIlJJTiIsICJ1bmNvcnJlY3RlZCIpKQoKZ2dwbG90KHBsb3QubW9kLCBhZXMoeCA9IFZhcjEsIHkgPSB2YWx1ZSwgY29sID0gVmFyMikpICsgZ2VvbV9wb2ludCgpK2dndGl0bGUodGlzcykrCiAgeGxhYigiY3V0LWhlaWdodCIpICsgeWxhYigiIyBnZW5lcyBhc3NpZ25lZCB0byBtb2R1bGVzIikKYGBgCgpgYGB7cn0KdGlzcyA8LSAiU3ViY3V0YW5lb3VzIgpsb2FkKCJyYXcvd2djbmFfbmV0d29ya3MuUmRhdGEiKQpyYXcgPC0gc2FwcGx5KGRhdC5uZXRbW3Rpc3NdXSwgZnVuY3Rpb24oeCkgbGVuZ3RoKHdoaWNoKHgkY29sb3JzIT0wKSkpCgpsb2FkKCJyaW4vd2djbmFfbmV0d29ya3MuUmRhdGEiKQpyaW4gPC0gc2FwcGx5KGRhdC5uZXRbW3Rpc3NdXSwgZnVuY3Rpb24oeCkgbGVuZ3RoKHdoaWNoKHgkY29sb3JzIT0wKSkpCgpsb2FkKCJxdWFydGVycGMvd2djbmFfbmV0d29ya3MuUmRhdGEiKQpxdWFydGVyUEMgPC0gc2FwcGx5KGRhdC5uZXRbW3Rpc3NdXSwgZnVuY3Rpb24oeCkgbGVuZ3RoKHdoaWNoKHgkY29sb3JzIT0wKSkpCgpsb2FkKCJoYWxmcGMvL3dnY25hX25ldHdvcmtzLlJkYXRhIikKaGFsZlBDIDwtIHNhcHBseShkYXQubmV0W1t0aXNzXV0sIGZ1bmN0aW9uKHgpIGxlbmd0aCh3aGljaCh4JGNvbG9ycyE9MCkpKQoKbG9hZCgicGMvL3dnY25hX25ldHdvcmtzLlJkYXRhIikKcGMgPC0gc2FwcGx5KGRhdC5uZXRbW3Rpc3NdXSwgZnVuY3Rpb24oeCkgbGVuZ3RoKHdoaWNoKHgkY29sb3JzIT0wKSkpCgpwbG90Lm1vZCA8LSBtZWx0KGNiaW5kKHJhdywgcmluLCBxdWFydGVyUEMsIGhhbGZQQywgcGMpKQpwbG90Lm1vZCRWYXIyIDwtIGZhY3RvcihwbG90Lm1vZCRWYXIyLCBsZXZlbHMgPSBjKCJwYyIsICJoYWxmUEMiLCAicXVhcnRlclBDIiwgInJpbiIsICJyYXciKSwgbGFiZWxzID0gYygiUEMiLCAiaGFsZi1QQyIsICJxdWFydGVyLVBDIiwgIlJJTiIsICJ1bmNvcnJlY3RlZCIpKQoKZ2dwbG90KHBsb3QubW9kLCBhZXMoeCA9IFZhcjEsIHkgPSB2YWx1ZSwgY29sID0gVmFyMikpICsgZ2VvbV9wb2ludCgpK2dndGl0bGUodGlzcykrCiAgeGxhYigiY3V0LWhlaWdodCIpICsgeWxhYigiIyBnZW5lcyBhc3NpZ25lZCB0byBtb2R1bGVzIikKYGBgCgpgYGB7cn0KdGlzcyA8LSAiTHVuZyIKbG9hZCgicmF3L3dnY25hX25ldHdvcmtzLlJkYXRhIikKcmF3IDwtIHNhcHBseShkYXQubmV0W1t0aXNzXV0sIGZ1bmN0aW9uKHgpIGxlbmd0aCh3aGljaCh4JGNvbG9ycyE9MCkpKQoKbG9hZCgicmluL3dnY25hX25ldHdvcmtzLlJkYXRhIikKcmluIDwtIHNhcHBseShkYXQubmV0W1t0aXNzXV0sIGZ1bmN0aW9uKHgpIGxlbmd0aCh3aGljaCh4JGNvbG9ycyE9MCkpKQoKbG9hZCgicXVhcnRlcnBjL3dnY25hX25ldHdvcmtzLlJkYXRhIikKcXVhcnRlclBDIDwtIHNhcHBseShkYXQubmV0W1t0aXNzXV0sIGZ1bmN0aW9uKHgpIGxlbmd0aCh3aGljaCh4JGNvbG9ycyE9MCkpKQoKbG9hZCgiaGFsZnBjLy93Z2NuYV9uZXR3b3Jrcy5SZGF0YSIpCmhhbGZQQyA8LSBzYXBwbHkoZGF0Lm5ldFtbdGlzc11dLCBmdW5jdGlvbih4KSBsZW5ndGgod2hpY2goeCRjb2xvcnMhPTApKSkKCmxvYWQoInBjLy93Z2NuYV9uZXR3b3Jrcy5SZGF0YSIpCnBjIDwtIHNhcHBseShkYXQubmV0W1t0aXNzXV0sIGZ1bmN0aW9uKHgpIGxlbmd0aCh3aGljaCh4JGNvbG9ycyE9MCkpKQoKcGxvdC5tb2QgPC0gbWVsdChjYmluZChyYXcsIHJpbiwgcXVhcnRlclBDLCBoYWxmUEMsIHBjKSkKcGxvdC5tb2QkVmFyMiA8LSBmYWN0b3IocGxvdC5tb2QkVmFyMiwgbGV2ZWxzID0gYygicGMiLCAiaGFsZlBDIiwgInF1YXJ0ZXJQQyIsICJyaW4iLCAicmF3IiksIGxhYmVscyA9IGMoIlBDIiwgImhhbGYtUEMiLCAicXVhcnRlci1QQyIsICJSSU4iLCAidW5jb3JyZWN0ZWQiKSkKCmdncGxvdChwbG90Lm1vZCwgYWVzKHggPSBWYXIxLCB5ID0gdmFsdWUsIGNvbCA9IFZhcjIpKSArIGdlb21fcG9pbnQoKStnZ3RpdGxlKHRpc3MpKwogIHhsYWIoImN1dC1oZWlnaHQiKSArIHlsYWIoIiMgZ2VuZXMgYXNzaWduZWQgdG8gbW9kdWxlcyIpCmBgYAoK
- - - -
- - - - - - - - diff --git a/rmd_analysis/module_count_plots.Rmd b/rmd_analysis/module_count_plots.Rmd deleted file mode 100644 index 1a88a22..0000000 --- a/rmd_analysis/module_count_plots.Rmd +++ /dev/null @@ -1,55 +0,0 @@ ---- -title: "WGCNA module distribution" -output: html_notebook ---- - -```{r "setup", include=FALSE} -require("knitr") -opts_knit$set(root.dir = "/work-zfs/abattle4/parsana/networks_correction_v/networks/") -``` - -```{r} -rm(list = ls()) -library(reshape2) -library(ggplot2) -load("raw/wgcna_networks.Rdata") -plot.mod <- lapply(dat.net, function(y) sapply(y, function(x) length(unique(x$colors))-1)) -plot.mod <- melt(do.call(cbind, plot.mod)) -ggplot(plot.mod, aes(x = Var1, y = value, col = Var2)) + geom_point()+ggtitle("Raw")+ - xlab("cut-height") + ylab("# modules") -``` - -```{r} -load("rin/wgcna_networks.Rdata") -plot.mod <- lapply(dat.net, function(y) sapply(y, function(x) length(unique(x$colors))-1)) -plot.mod <- melt(do.call(cbind, plot.mod)) -ggplot(plot.mod, aes(x = Var1, y = value, col = Var2)) + geom_point()+ggtitle("RIN")+ - xlab("cut-height") + ylab("# modules") -``` - -```{r} -load("quarterpc/wgcna_networks.Rdata") -plot.mod <- lapply(dat.net, function(y) sapply(y, function(x) length(unique(x$colors))-1)) -plot.mod <- lapply(dat.net, function(y) sapply(y, function(x) length(unique(x$colors))-1)) -plot.mod <- melt(do.call(cbind, plot.mod)) -ggplot(plot.mod, aes(x = Var1, y = value, col = Var2)) + geom_point()+ggtitle("quarter-PC")+ - xlab("cut-height") + ylab("# modules") -``` - -```{r} -load("halfpc//wgcna_networks.Rdata") -plot.mod <- lapply(dat.net, function(y) sapply(y, function(x) length(unique(x$colors))-1)) -plot.mod <- lapply(dat.net, function(y) sapply(y, function(x) length(unique(x$colors))-1)) -plot.mod <- melt(do.call(cbind, plot.mod)) -ggplot(plot.mod, aes(x = Var1, y = value, col = Var2)) + geom_point()+ggtitle("halfPC")+ - xlab("cut-height") + ylab("# modules") -``` - -```{r} -load("pc//wgcna_networks.Rdata") -plot.mod <- lapply(dat.net, function(y) sapply(y, function(x) length(unique(x$colors))-1)) -plot.mod <- lapply(dat.net, function(y) sapply(y, function(x) length(unique(x$colors))-1)) -plot.mod <- melt(do.call(cbind, plot.mod)) -ggplot(plot.mod, aes(x = Var1, y = value, col = Var2)) + geom_point()+ggtitle("PC")+ - xlab("cut-height") + ylab("# modules") -``` diff --git a/rmd_analysis/module_count_plots.nb.html b/rmd_analysis/module_count_plots.nb.html deleted file mode 100644 index 83ceb42..0000000 --- a/rmd_analysis/module_count_plots.nb.html +++ /dev/null @@ -1,285 +0,0 @@ - - - - - - - - - - - - - -WGCNA module distribution - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
- - - - - - - - - - - - - - - - - - - - - - -

- - - - - - -
load("rin/wgcna_networks.Rdata")
-plot.mod <- lapply(dat.net, function(y) sapply(y, function(x) length(unique(x$colors))-1))
-plot.mod <- melt(do.call(cbind, plot.mod))
-ggplot(plot.mod, aes(x = Var1, y = value, col = Var2)) + geom_point()+ggtitle("RIN")+
-  xlab("cut-height") + ylab("# modules")
- - -

- - - - - - -
load("quarterpc/wgcna_networks.Rdata")
-plot.mod <- lapply(dat.net, function(y) sapply(y, function(x) length(unique(x$colors))-1))
-plot.mod <- lapply(dat.net, function(y) sapply(y, function(x) length(unique(x$colors))-1))
-plot.mod <- melt(do.call(cbind, plot.mod))
-ggplot(plot.mod, aes(x = Var1, y = value, col = Var2)) + geom_point()+ggtitle("quarter-PC")+
-  xlab("cut-height") + ylab("# modules")
- - -

- - - - - - -
load("halfpc//wgcna_networks.Rdata")
-plot.mod <- lapply(dat.net, function(y) sapply(y, function(x) length(unique(x$colors))-1))
-plot.mod <- lapply(dat.net, function(y) sapply(y, function(x) length(unique(x$colors))-1))
-plot.mod <- melt(do.call(cbind, plot.mod))
-ggplot(plot.mod, aes(x = Var1, y = value, col = Var2)) + geom_point()+ggtitle("halfPC")+
-  xlab("cut-height") + ylab("# modules")
- - -

- - - - - - -
load("pc//wgcna_networks.Rdata")
-plot.mod <- lapply(dat.net, function(y) sapply(y, function(x) length(unique(x$colors))-1))
-plot.mod <- lapply(dat.net, function(y) sapply(y, function(x) length(unique(x$colors))-1))
-plot.mod <- melt(do.call(cbind, plot.mod))
-ggplot(plot.mod, aes(x = Var1, y = value, col = Var2)) + geom_point()+ggtitle("PC")+
-  xlab("cut-height") + ylab("# modules")
- - -

- - - -
LS0tCnRpdGxlOiAiV0dDTkEgbW9kdWxlIGRpc3RyaWJ1dGlvbiIKb3V0cHV0OiBodG1sX25vdGVib29rCi0tLQoKYGBge3IgInNldHVwIiwgaW5jbHVkZT1GQUxTRX0KcmVxdWlyZSgia25pdHIiKQpvcHRzX2tuaXQkc2V0KHJvb3QuZGlyID0gIi93b3JrLXpmcy9hYmF0dGxlNC9wYXJzYW5hL25ldHdvcmtzX2NvcnJlY3Rpb25fdi9uZXR3b3Jrcy8iKQpgYGAKCmBgYHtyfQpybShsaXN0ID0gbHMoKSkKbGlicmFyeShyZXNoYXBlMikKbGlicmFyeShnZ3Bsb3QyKQpsb2FkKCJyYXcvd2djbmFfbmV0d29ya3MuUmRhdGEiKQpwbG90Lm1vZCA8LSBsYXBwbHkoZGF0Lm5ldCwgZnVuY3Rpb24oeSkgc2FwcGx5KHksIGZ1bmN0aW9uKHgpIGxlbmd0aCh1bmlxdWUoeCRjb2xvcnMpKS0xKSkKcGxvdC5tb2QgPC0gbWVsdChkby5jYWxsKGNiaW5kLCBwbG90Lm1vZCkpCmdncGxvdChwbG90Lm1vZCwgYWVzKHggPSBWYXIxLCB5ID0gdmFsdWUsIGNvbCA9IFZhcjIpKSArIGdlb21fcG9pbnQoKStnZ3RpdGxlKCJSYXciKSsKICB4bGFiKCJjdXQtaGVpZ2h0IikgKyB5bGFiKCIjIG1vZHVsZXMiKQpgYGAKCmBgYHtyfQpsb2FkKCJyaW4vd2djbmFfbmV0d29ya3MuUmRhdGEiKQpwbG90Lm1vZCA8LSBsYXBwbHkoZGF0Lm5ldCwgZnVuY3Rpb24oeSkgc2FwcGx5KHksIGZ1bmN0aW9uKHgpIGxlbmd0aCh1bmlxdWUoeCRjb2xvcnMpKS0xKSkKcGxvdC5tb2QgPC0gbWVsdChkby5jYWxsKGNiaW5kLCBwbG90Lm1vZCkpCmdncGxvdChwbG90Lm1vZCwgYWVzKHggPSBWYXIxLCB5ID0gdmFsdWUsIGNvbCA9IFZhcjIpKSArIGdlb21fcG9pbnQoKStnZ3RpdGxlKCJSSU4iKSsKICB4bGFiKCJjdXQtaGVpZ2h0IikgKyB5bGFiKCIjIG1vZHVsZXMiKQpgYGAKCmBgYHtyfQpsb2FkKCJxdWFydGVycGMvd2djbmFfbmV0d29ya3MuUmRhdGEiKQpwbG90Lm1vZCA8LSBsYXBwbHkoZGF0Lm5ldCwgZnVuY3Rpb24oeSkgc2FwcGx5KHksIGZ1bmN0aW9uKHgpIGxlbmd0aCh1bmlxdWUoeCRjb2xvcnMpKS0xKSkKcGxvdC5tb2QgPC0gbGFwcGx5KGRhdC5uZXQsIGZ1bmN0aW9uKHkpIHNhcHBseSh5LCBmdW5jdGlvbih4KSBsZW5ndGgodW5pcXVlKHgkY29sb3JzKSktMSkpCnBsb3QubW9kIDwtIG1lbHQoZG8uY2FsbChjYmluZCwgcGxvdC5tb2QpKQpnZ3Bsb3QocGxvdC5tb2QsIGFlcyh4ID0gVmFyMSwgeSA9IHZhbHVlLCBjb2wgPSBWYXIyKSkgKyBnZW9tX3BvaW50KCkrZ2d0aXRsZSgicXVhcnRlci1QQyIpKwogIHhsYWIoImN1dC1oZWlnaHQiKSArIHlsYWIoIiMgbW9kdWxlcyIpCmBgYAoKYGBge3J9CmxvYWQoImhhbGZwYy8vd2djbmFfbmV0d29ya3MuUmRhdGEiKQpwbG90Lm1vZCA8LSBsYXBwbHkoZGF0Lm5ldCwgZnVuY3Rpb24oeSkgc2FwcGx5KHksIGZ1bmN0aW9uKHgpIGxlbmd0aCh1bmlxdWUoeCRjb2xvcnMpKS0xKSkKcGxvdC5tb2QgPC0gbGFwcGx5KGRhdC5uZXQsIGZ1bmN0aW9uKHkpIHNhcHBseSh5LCBmdW5jdGlvbih4KSBsZW5ndGgodW5pcXVlKHgkY29sb3JzKSktMSkpCnBsb3QubW9kIDwtIG1lbHQoZG8uY2FsbChjYmluZCwgcGxvdC5tb2QpKQpnZ3Bsb3QocGxvdC5tb2QsIGFlcyh4ID0gVmFyMSwgeSA9IHZhbHVlLCBjb2wgPSBWYXIyKSkgKyBnZW9tX3BvaW50KCkrZ2d0aXRsZSgiaGFsZlBDIikrCiAgeGxhYigiY3V0LWhlaWdodCIpICsgeWxhYigiIyBtb2R1bGVzIikKYGBgCgpgYGB7cn0KbG9hZCgicGMvL3dnY25hX25ldHdvcmtzLlJkYXRhIikKcGxvdC5tb2QgPC0gbGFwcGx5KGRhdC5uZXQsIGZ1bmN0aW9uKHkpIHNhcHBseSh5LCBmdW5jdGlvbih4KSBsZW5ndGgodW5pcXVlKHgkY29sb3JzKSktMSkpCnBsb3QubW9kIDwtIGxhcHBseShkYXQubmV0LCBmdW5jdGlvbih5KSBzYXBwbHkoeSwgZnVuY3Rpb24oeCkgbGVuZ3RoKHVuaXF1ZSh4JGNvbG9ycykpLTEpKQpwbG90Lm1vZCA8LSBtZWx0KGRvLmNhbGwoY2JpbmQsIHBsb3QubW9kKSkKZ2dwbG90KHBsb3QubW9kLCBhZXMoeCA9IFZhcjEsIHkgPSB2YWx1ZSwgY29sID0gVmFyMikpICsgZ2VvbV9wb2ludCgpK2dndGl0bGUoIlBDIikrCiAgeGxhYigiY3V0LWhlaWdodCIpICsgeWxhYigiIyBtb2R1bGVzIikKYGBgCg==
- - - -
- - - - - - - - diff --git a/rmd_analysis/plots/correlation_networks_Blood.pdf b/rmd_analysis/plots/correlation_networks_Blood.pdf deleted file mode 100644 index 718c8aa..0000000 Binary files a/rmd_analysis/plots/correlation_networks_Blood.pdf and /dev/null differ diff --git a/rmd_analysis/plots/correlation_networks_Blood.png b/rmd_analysis/plots/correlation_networks_Blood.png deleted file mode 100644 index 60bcde7..0000000 Binary files a/rmd_analysis/plots/correlation_networks_Blood.png and /dev/null differ diff --git a/rmd_analysis/plots/correlation_networks_Lung.pdf b/rmd_analysis/plots/correlation_networks_Lung.pdf deleted file mode 100644 index b822617..0000000 Binary files a/rmd_analysis/plots/correlation_networks_Lung.pdf and /dev/null differ diff --git a/rmd_analysis/plots/correlation_networks_Lung.png b/rmd_analysis/plots/correlation_networks_Lung.png deleted file mode 100644 index 003c42a..0000000 Binary files a/rmd_analysis/plots/correlation_networks_Lung.png and /dev/null differ diff --git a/rmd_analysis/plots/correlation_networks_Muscle.pdf b/rmd_analysis/plots/correlation_networks_Muscle.pdf deleted file mode 100644 index 156682a..0000000 Binary files a/rmd_analysis/plots/correlation_networks_Muscle.pdf and /dev/null differ diff --git a/rmd_analysis/plots/correlation_networks_Muscle.png b/rmd_analysis/plots/correlation_networks_Muscle.png deleted file mode 100644 index 5489944..0000000 Binary files a/rmd_analysis/plots/correlation_networks_Muscle.png and /dev/null differ diff --git a/rmd_analysis/plots/correlation_networks_Subcutaneous.pdf b/rmd_analysis/plots/correlation_networks_Subcutaneous.pdf deleted file mode 100644 index da1939c..0000000 Binary files a/rmd_analysis/plots/correlation_networks_Subcutaneous.pdf and /dev/null differ diff --git a/rmd_analysis/plots/correlation_networks_Subcutaneous.png b/rmd_analysis/plots/correlation_networks_Subcutaneous.png deleted file mode 100644 index a118a68..0000000 Binary files a/rmd_analysis/plots/correlation_networks_Subcutaneous.png and /dev/null differ diff --git a/rmd_analysis/plots/correlation_networks_Thyroid.pdf b/rmd_analysis/plots/correlation_networks_Thyroid.pdf deleted file mode 100644 index 4b4af5a..0000000 Binary files a/rmd_analysis/plots/correlation_networks_Thyroid.pdf and /dev/null differ diff --git a/rmd_analysis/plots/correlation_networks_Thyroid.png b/rmd_analysis/plots/correlation_networks_Thyroid.png deleted file mode 100644 index 2b1e912..0000000 Binary files a/rmd_analysis/plots/correlation_networks_Thyroid.png and /dev/null differ diff --git a/rmd_analysis/plots/wgcna_networks_Blood.pdf b/rmd_analysis/plots/wgcna_networks_Blood.pdf deleted file mode 100644 index ee447ec..0000000 Binary files a/rmd_analysis/plots/wgcna_networks_Blood.pdf and /dev/null differ diff --git a/rmd_analysis/plots/wgcna_networks_Blood.png b/rmd_analysis/plots/wgcna_networks_Blood.png deleted file mode 100644 index 3e8b644..0000000 Binary files a/rmd_analysis/plots/wgcna_networks_Blood.png and /dev/null differ diff --git a/rmd_analysis/plots/wgcna_networks_Lung.pdf b/rmd_analysis/plots/wgcna_networks_Lung.pdf deleted file mode 100644 index fa07e37..0000000 Binary files a/rmd_analysis/plots/wgcna_networks_Lung.pdf and /dev/null differ diff --git a/rmd_analysis/plots/wgcna_networks_Lung.png b/rmd_analysis/plots/wgcna_networks_Lung.png deleted file mode 100644 index adf88f1..0000000 Binary files a/rmd_analysis/plots/wgcna_networks_Lung.png and /dev/null differ diff --git a/rmd_analysis/plots/wgcna_networks_Muscle.pdf b/rmd_analysis/plots/wgcna_networks_Muscle.pdf deleted file mode 100644 index 2e4b60b..0000000 Binary files a/rmd_analysis/plots/wgcna_networks_Muscle.pdf and /dev/null differ diff --git a/rmd_analysis/plots/wgcna_networks_Muscle.png b/rmd_analysis/plots/wgcna_networks_Muscle.png deleted file mode 100644 index 43c657c..0000000 Binary files a/rmd_analysis/plots/wgcna_networks_Muscle.png and /dev/null differ diff --git a/rmd_analysis/plots/wgcna_networks_Subcutaneous.pdf b/rmd_analysis/plots/wgcna_networks_Subcutaneous.pdf deleted file mode 100644 index 446d05b..0000000 Binary files a/rmd_analysis/plots/wgcna_networks_Subcutaneous.pdf and /dev/null differ diff --git a/rmd_analysis/plots/wgcna_networks_Subcutaneous.png b/rmd_analysis/plots/wgcna_networks_Subcutaneous.png deleted file mode 100644 index 27f1a4b..0000000 Binary files a/rmd_analysis/plots/wgcna_networks_Subcutaneous.png and /dev/null differ diff --git a/rmd_analysis/plots/wgcna_networks_Thyroid.pdf b/rmd_analysis/plots/wgcna_networks_Thyroid.pdf deleted file mode 100644 index c3de11a..0000000 Binary files a/rmd_analysis/plots/wgcna_networks_Thyroid.pdf and /dev/null differ diff --git a/rmd_analysis/plots/wgcna_networks_Thyroid.png b/rmd_analysis/plots/wgcna_networks_Thyroid.png deleted file mode 100644 index 582e59c..0000000 Binary files a/rmd_analysis/plots/wgcna_networks_Thyroid.png and /dev/null differ diff --git a/rmd_analysis/plots/zoomed_correlation_networks_Blood.png b/rmd_analysis/plots/zoomed_correlation_networks_Blood.png deleted file mode 100644 index 4976151..0000000 Binary files a/rmd_analysis/plots/zoomed_correlation_networks_Blood.png and /dev/null differ diff --git a/rmd_analysis/plots/zoomed_correlation_networks_Lung.png b/rmd_analysis/plots/zoomed_correlation_networks_Lung.png deleted file mode 100644 index 6163e10..0000000 Binary files a/rmd_analysis/plots/zoomed_correlation_networks_Lung.png and /dev/null differ diff --git a/rmd_analysis/plots/zoomed_correlation_networks_Muscle.png b/rmd_analysis/plots/zoomed_correlation_networks_Muscle.png deleted file mode 100644 index 8d75a65..0000000 Binary files a/rmd_analysis/plots/zoomed_correlation_networks_Muscle.png and /dev/null differ diff --git a/rmd_analysis/plots/zoomed_correlation_networks_Subcutaneous.png b/rmd_analysis/plots/zoomed_correlation_networks_Subcutaneous.png deleted file mode 100644 index 597e7e8..0000000 Binary files a/rmd_analysis/plots/zoomed_correlation_networks_Subcutaneous.png and /dev/null differ diff --git a/rmd_analysis/plots/zoomed_correlation_networks_Thyroid.png b/rmd_analysis/plots/zoomed_correlation_networks_Thyroid.png deleted file mode 100644 index 4ab904b..0000000 Binary files a/rmd_analysis/plots/zoomed_correlation_networks_Thyroid.png and /dev/null differ diff --git a/rmd_analysis/thyroid_pc_foxe1.Rmd b/rmd_analysis/thyroid_pc_foxe1.Rmd deleted file mode 100644 index 091a558..0000000 --- a/rmd_analysis/thyroid_pc_foxe1.Rmd +++ /dev/null @@ -1,56 +0,0 @@ ---- -title: "Thyroid" -output: - pdf_document: default - html_notebook: default ---- - -Association of PC with FOXE1. Ensembl ID for FOXE1 = ENSG00000178919 -```{r} -rm(list = ls()) -tiss <- "Thyroid" -ensid <- "ENSG00000178919" -## load subsetted raw expression data for thyroid -load("../data/raw_subset.Rdata") - -## we only care about thyroid for this analysis - set dat.expr to thyroid -dat.tiss.raw <- dat.expr[[tiss]] - -## which row is FOXE1? -grep(ensid, rownames(dat.tiss.raw)) -ensid.dat <- rownames(dat.tiss.raw)[grep(ensid, rownames(dat.tiss.raw))] - -## load pc corrected data -load("../data/pc_corrected.Rdata") -## we only care about thyroid for this analysis - set dat.expr to thyroid -dat.tiss.pc <- dat.expr[[tiss]] - -## which row is FOXE1? -grep(ensid, rownames(dat.tiss.pc)) -print(ensid) -print(rownames(dat.tiss.pc)[grep(ensid, rownames(dat.tiss.pc))]) -print(ensid.dat) -``` - -```{r} -foxe.raw <- dat.tiss.raw[ensid.dat,]@assays$data$counts -foxe.pc <- dat.tiss.pc[ensid.dat, ]@assays$data$counts -``` -Association between raw foxe expression and PC -```{r} -# load PC loadings -load("../data/pc_loadings.Rdata") -raw.pve <- sapply(summary(lm(pc.loadings[[tiss]][,1:num.pc.estimates[[tiss]]]~t(foxe.raw))), function(x) x$r.squared) -plot(c(1:num.pc.estimates[[tiss]]), raw.pve, col = "blue", pch = "*", xlab = "PC") -``` -```{r} -pc.pve <- sapply(summary(lm(pc.loadings[[tiss]][,1:num.pc.estimates[[tiss]]]~t(foxe.pc))), function(x) x$r.squared)*100 -plot(c(1:num.pc.estimates[[tiss]]), pc.pve, col = "red", pch = "*", xlab = "PC") -``` - -Add a new chunk by clicking the *Insert Chunk* button on the toolbar or by pressing *Cmd+Option+I*. - -When you save the notebook, an HTML file containing the code and output will be saved alongside it (click the *Preview* button or press *Cmd+Shift+K* to preview the HTML file). - -The preview shows you a rendered HTML copy of the contents of the editor. Consequently, unlike *Knit*, *Preview* does not run any R code chunks. Instead, the output of the chunk when it was last run in the editor is displayed. - diff --git a/rmd_analysis/thyroid_pc_foxe1.nb.html b/rmd_analysis/thyroid_pc_foxe1.nb.html deleted file mode 100644 index f7d69f0..0000000 --- a/rmd_analysis/thyroid_pc_foxe1.nb.html +++ /dev/null @@ -1,292 +0,0 @@ - - - - - - - - - - - - - -Thyroid - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
- - - - - - - - - - - - - - - - - -

Association of PC with FOXE1. Ensembl ID for FOXE1 = ENSG00000178919

- - - -
rm(list = ls())
-tiss <- "Thyroid"
-ensid <- "ENSG00000178919"
-## load subsetted raw expression data for thyroid
-load("../data/raw_subset.Rdata")
-## we only care about thyroid for this analysis - set dat.expr to thyroid
-dat.tiss.raw <- dat.expr[[tiss]]
-## which row is FOXE1?
-grep(ensid, rownames(dat.tiss.raw))
- - -
[1] 3000
- - -
ensid.dat <- rownames(dat.tiss.raw)[grep(ensid, rownames(dat.tiss.raw))]
-## load pc corrected data
-load("../data/pc_corrected.Rdata")
-## we only care about thyroid for this analysis - set dat.expr to thyroid
-dat.tiss.pc <- dat.expr[[tiss]]
-## which row is FOXE1?
-grep(ensid, rownames(dat.tiss.pc))
- - -
[1] 3000
- - -
print(ensid)
- - -
[1] "ENSG00000178919"
- - -
print(rownames(dat.tiss.pc)[grep(ensid, rownames(dat.tiss.pc))])
- - -
[1] "ENSG00000178919.8"
- - -
print(ensid.dat)
- - -
[1] "ENSG00000178919.8"
- - - - - - -
foxe.raw <- dat.tiss.raw[ensid.dat,]@assays$data$counts
-foxe.pc <- dat.tiss.pc[ensid.dat, ]@assays$data$counts
- - - -

Association between raw foxe expression and PC

- - - -

- - - - -

- - - -

Add a new chunk by clicking the Insert Chunk button on the toolbar or by pressing Cmd+Option+I.

-

When you save the notebook, an HTML file containing the code and output will be saved alongside it (click the Preview button or press Cmd+Shift+K to preview the HTML file).

-

The preview shows you a rendered HTML copy of the contents of the editor. Consequently, unlike Knit, Preview does not run any R code chunks. Instead, the output of the chunk when it was last run in the editor is displayed.

- - -
LS0tCnRpdGxlOiAiVGh5cm9pZCIKb3V0cHV0OgogIHBkZl9kb2N1bWVudDogZGVmYXVsdAogIGh0bWxfbm90ZWJvb2s6IGRlZmF1bHQKLS0tCgpBc3NvY2lhdGlvbiBvZiBQQyB3aXRoIEZPWEUxLiBFbnNlbWJsIElEIGZvciBGT1hFMSA9IEVOU0cwMDAwMDE3ODkxOQpgYGB7cn0Kcm0obGlzdCA9IGxzKCkpCnRpc3MgPC0gIlRoeXJvaWQiCmVuc2lkIDwtICJFTlNHMDAwMDAxNzg5MTkiCiMjIGxvYWQgc3Vic2V0dGVkIHJhdyBleHByZXNzaW9uIGRhdGEgZm9yIHRoeXJvaWQKbG9hZCgiLi4vZGF0YS9yYXdfc3Vic2V0LlJkYXRhIikKCiMjIHdlIG9ubHkgY2FyZSBhYm91dCB0aHlyb2lkIGZvciB0aGlzIGFuYWx5c2lzIC0gc2V0IGRhdC5leHByIHRvIHRoeXJvaWQKZGF0LnRpc3MucmF3IDwtIGRhdC5leHByW1t0aXNzXV0KCiMjIHdoaWNoIHJvdyBpcyBGT1hFMT8KZ3JlcChlbnNpZCwgcm93bmFtZXMoZGF0LnRpc3MucmF3KSkKZW5zaWQuZGF0IDwtIHJvd25hbWVzKGRhdC50aXNzLnJhdylbZ3JlcChlbnNpZCwgcm93bmFtZXMoZGF0LnRpc3MucmF3KSldCgojIyBsb2FkIHBjIGNvcnJlY3RlZCBkYXRhCmxvYWQoIi4uL2RhdGEvcGNfY29ycmVjdGVkLlJkYXRhIikKIyMgd2Ugb25seSBjYXJlIGFib3V0IHRoeXJvaWQgZm9yIHRoaXMgYW5hbHlzaXMgLSBzZXQgZGF0LmV4cHIgdG8gdGh5cm9pZApkYXQudGlzcy5wYyA8LSBkYXQuZXhwcltbdGlzc11dCgojIyB3aGljaCByb3cgaXMgRk9YRTE/CmdyZXAoZW5zaWQsIHJvd25hbWVzKGRhdC50aXNzLnBjKSkKcHJpbnQoZW5zaWQpCnByaW50KHJvd25hbWVzKGRhdC50aXNzLnBjKVtncmVwKGVuc2lkLCByb3duYW1lcyhkYXQudGlzcy5wYykpXSkKcHJpbnQoZW5zaWQuZGF0KQpgYGAKCmBgYHtyfQpmb3hlLnJhdyA8LSBkYXQudGlzcy5yYXdbZW5zaWQuZGF0LF1AYXNzYXlzJGRhdGEkY291bnRzCmZveGUucGMgPC0gZGF0LnRpc3MucGNbZW5zaWQuZGF0LCBdQGFzc2F5cyRkYXRhJGNvdW50cwpgYGAKQXNzb2NpYXRpb24gYmV0d2VlbiByYXcgZm94ZSBleHByZXNzaW9uIGFuZCBQQwpgYGB7cn0KIyBsb2FkIFBDIGxvYWRpbmdzCmxvYWQoIi4uL2RhdGEvcGNfbG9hZGluZ3MuUmRhdGEiKQpyYXcucHZlIDwtIHNhcHBseShzdW1tYXJ5KGxtKHBjLmxvYWRpbmdzW1t0aXNzXV1bLDE6bnVtLnBjLmVzdGltYXRlc1tbdGlzc11dXX50KGZveGUucmF3KSkpLCBmdW5jdGlvbih4KSB4JHIuc3F1YXJlZCkKcGxvdChjKDE6bnVtLnBjLmVzdGltYXRlc1tbdGlzc11dKSwgcmF3LnB2ZSwgY29sID0gImJsdWUiLCBwY2ggPSAiKiIsIHhsYWIgPSAiUEMiKQpgYGAKYGBge3J9CnBjLnB2ZSA8LSBzYXBwbHkoc3VtbWFyeShsbShwYy5sb2FkaW5nc1tbdGlzc11dWywxOm51bS5wYy5lc3RpbWF0ZXNbW3Rpc3NdXV1+dChmb3hlLnBjKSkpLCBmdW5jdGlvbih4KSB4JHIuc3F1YXJlZCkqMTAwCnBsb3QoYygxOm51bS5wYy5lc3RpbWF0ZXNbW3Rpc3NdXSksIHBjLnB2ZSwgY29sID0gInJlZCIsIHBjaCA9ICIqIiwgeGxhYiA9ICJQQyIpCmBgYAoKQWRkIGEgbmV3IGNodW5rIGJ5IGNsaWNraW5nIHRoZSAqSW5zZXJ0IENodW5rKiBidXR0b24gb24gdGhlIHRvb2xiYXIgb3IgYnkgcHJlc3NpbmcgKkNtZCtPcHRpb24rSSouCgpXaGVuIHlvdSBzYXZlIHRoZSBub3RlYm9vaywgYW4gSFRNTCBmaWxlIGNvbnRhaW5pbmcgdGhlIGNvZGUgYW5kIG91dHB1dCB3aWxsIGJlIHNhdmVkIGFsb25nc2lkZSBpdCAoY2xpY2sgdGhlICpQcmV2aWV3KiBidXR0b24gb3IgcHJlc3MgKkNtZCtTaGlmdCtLKiB0byBwcmV2aWV3IHRoZSBIVE1MIGZpbGUpLiAKClRoZSBwcmV2aWV3IHNob3dzIHlvdSBhIHJlbmRlcmVkIEhUTUwgY29weSBvZiB0aGUgY29udGVudHMgb2YgdGhlIGVkaXRvci4gQ29uc2VxdWVudGx5LCB1bmxpa2UgKktuaXQqLCAqUHJldmlldyogZG9lcyBub3QgcnVuIGFueSBSIGNvZGUgY2h1bmtzLiBJbnN0ZWFkLCB0aGUgb3V0cHV0IG9mIHRoZSBjaHVuayB3aGVuIGl0IHdhcyBsYXN0IHJ1biBpbiB0aGUgZWRpdG9yIGlzIGRpc3BsYXllZC4KCg==
- - - -
- - - - - - - - diff --git a/rmd_analysis/total_expressionPVE_allcovariates.Rmd b/rmd_analysis/total_expressionPVE_allcovariates.Rmd deleted file mode 100644 index d6bf381..0000000 --- a/rmd_analysis/total_expressionPVE_allcovariates.Rmd +++ /dev/null @@ -1,53 +0,0 @@ ---- -title: "Total PVE by all covariates" -output: - html_notebook: default - pdf_document: default ---- - - -```{r} -rm(list = ls()) -library(RcppEigen) -load("../data/raw_protein_coding_withGC.Rdata") - -## none of the covariates have NA --> total sum of squares can be computed before hand -dat.cov <- lapply(gtex.rse, function(tiss) { - cov.dat <- tiss@colData[,c(10, 11, 21:80, 83)] - cov.dat <- cov.dat[,-which(sapply(cov.dat, function(x) length(unique(x))) == 1)] - cov.dat <- cov.dat[, -which(colnames(cov.dat) %in% c("smunpdrd","smpthnts", "smtstptref", "smnabtch", "smnabtchd", "smgebtch"))] ## not enought unique entries in more than one category, < 50 - cov.dat - }) -dat.expr <- lapply(gtex.rse, function(tiss) tiss@assays$data$counts) - -## compute the residuals -residual.expr.dof <- mapply(function(x,y){ - x <- t(x) - res.expr <- matrix(ncol = ncol(x), nrow = nrow(x)) - print(paste("begin")) - for(i in 1:ncol(x)){ - lm.out <- fastLm(x[,i]~1+. , data = y) - res.expr[,i] <- lm.out$residuals - } - list(residual_expression = res.expr, dof = lm.out$df.residual) -}, dat.expr, dat.cov) - -residual.expr <- lapply(residual.expr.dof[1,], function(x) x) -model.dof <- lapply(residual.expr.dof[2,], function(x) x) - -``` -Now that we have the expression data, residuals from the regression and dof - we can compute the adjusted r^2. -```{r} -tss <- lapply(dat.expr, function(x) (norm(x - rowMeans(x), type = "F"))^2) -rss <- lapply(residual.expr, function(x) (norm(x, type = "F"))^2) - -total.covariate.pve <- vector("numeric", length = length(dat.expr)) -names(total.covariate.pve) <- names(dat.expr) -for(i in 1:length(total.covariate.pve)){ - n <- ncol(dat.expr[[i]]) - r2 <- (tss[[i]] - rss[[i]])/tss[[i]] - total.covariate.pve[i] <- 1 - ((1-r2) * ((n - 1) / model.dof[[i]])) -} - -total.covariate.pve -``` diff --git a/rmd_analysis/total_expressionPVE_allcovariates.nb.html b/rmd_analysis/total_expressionPVE_allcovariates.nb.html deleted file mode 100644 index 643a398..0000000 --- a/rmd_analysis/total_expressionPVE_allcovariates.nb.html +++ /dev/null @@ -1,264 +0,0 @@ - - - - - - - - - - - - - -Total PVE by all covariates - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
- - - - - - - - - - - - - - - - - - - - -
rm(list = ls())
-library(RcppEigen)
-load("../data/raw_protein_coding_withGC.Rdata")
-
-## none of the covariates have NA --> total sum of squares can be computed before hand
-dat.cov <- lapply(gtex.rse, function(tiss) {
-  cov.dat <- tiss@colData[,c(10, 11, 21:80, 83)]
-  cov.dat <- cov.dat[,-which(sapply(cov.dat, function(x) length(unique(x))) == 1)]
-  cov.dat <- cov.dat[, -which(colnames(cov.dat) %in% c("smunpdrd","smpthnts", "smtstptref", "smnabtch", "smnabtchd", "smgebtch"))] ## not enought unique entries in more than one category, < 50
-  cov.dat
-  })
-dat.expr <- lapply(gtex.rse, function(tiss) tiss@assays$data$counts)
-
-## compute the residuals
-residual.expr.dof <- mapply(function(x,y){
-  x <- t(x)
-  res.expr <- matrix(ncol = ncol(x), nrow = nrow(x))
-  print(paste("begin"))
-  for(i in 1:ncol(x)){
-    lm.out <- fastLm(x[,i]~1+. , data = y)
-    res.expr[,i] <- lm.out$residuals
-  }
-  list(residual_expression = res.expr, dof = lm.out$df.residual)
-}, dat.expr, dat.cov)
-
-residual.expr <- lapply(residual.expr.dof[1,], function(x) x)
-model.dof <- lapply(residual.expr.dof[2,], function(x) x)
-
- - - -

Now that we have the expression data, residuals from the regression and dof - we can compute the adjusted r^2.

- - - -
total.covariate.pve
-
- - -
Subcutaneous         Lung      Thyroid       Muscle        Blood 
-   0.2675448    0.3670305    0.2696517    0.3518515    0.6266195 
- - - -
LS0tCnRpdGxlOiAiVG90YWwgUFZFIGJ5IGFsbCBjb3ZhcmlhdGVzIgpvdXRwdXQ6CiAgaHRtbF9ub3RlYm9vazogZGVmYXVsdAogIHBkZl9kb2N1bWVudDogZGVmYXVsdAotLS0KCgpgYGB7cn0Kcm0obGlzdCA9IGxzKCkpCmxpYnJhcnkoUmNwcEVpZ2VuKQpsb2FkKCIuLi9kYXRhL3Jhd19wcm90ZWluX2NvZGluZ193aXRoR0MuUmRhdGEiKQoKIyMgbm9uZSBvZiB0aGUgY292YXJpYXRlcyBoYXZlIE5BIC0tPiB0b3RhbCBzdW0gb2Ygc3F1YXJlcyBjYW4gYmUgY29tcHV0ZWQgYmVmb3JlIGhhbmQKZGF0LmNvdiA8LSBsYXBwbHkoZ3RleC5yc2UsIGZ1bmN0aW9uKHRpc3MpIHsKICBjb3YuZGF0IDwtIHRpc3NAY29sRGF0YVssYygxMCwgMTEsIDIxOjgwLCA4MyldCiAgY292LmRhdCA8LSBjb3YuZGF0Wywtd2hpY2goc2FwcGx5KGNvdi5kYXQsIGZ1bmN0aW9uKHgpIGxlbmd0aCh1bmlxdWUoeCkpKSA9PSAxKV0KICBjb3YuZGF0IDwtIGNvdi5kYXRbLCAtd2hpY2goY29sbmFtZXMoY292LmRhdCkgJWluJSBjKCJzbXVucGRyZCIsInNtcHRobnRzIiwgInNtdHN0cHRyZWYiLCAic21uYWJ0Y2giLCAic21uYWJ0Y2hkIiwgInNtZ2VidGNoIikpXSAjIyBub3QgZW5vdWdodCB1bmlxdWUgZW50cmllcyBpbiBtb3JlIHRoYW4gb25lIGNhdGVnb3J5LCA8IDUwCiAgY292LmRhdAogIH0pCmRhdC5leHByIDwtIGxhcHBseShndGV4LnJzZSwgZnVuY3Rpb24odGlzcykgdGlzc0Bhc3NheXMkZGF0YSRjb3VudHMpCgojIyBjb21wdXRlIHRoZSByZXNpZHVhbHMKcmVzaWR1YWwuZXhwci5kb2YgPC0gbWFwcGx5KGZ1bmN0aW9uKHgseSl7CiAgeCA8LSB0KHgpCiAgcmVzLmV4cHIgPC0gbWF0cml4KG5jb2wgPSBuY29sKHgpLCBucm93ID0gbnJvdyh4KSkKICBwcmludChwYXN0ZSgiYmVnaW4iKSkKICBmb3IoaSBpbiAxOm5jb2woeCkpewogICAgbG0ub3V0IDwtIGZhc3RMbSh4WyxpXX4xKy4gLCBkYXRhID0geSkKICAgIHJlcy5leHByWyxpXSA8LSBsbS5vdXQkcmVzaWR1YWxzCiAgfQogIGxpc3QocmVzaWR1YWxfZXhwcmVzc2lvbiA9IHJlcy5leHByLCBkb2YgPSBsbS5vdXQkZGYucmVzaWR1YWwpCn0sIGRhdC5leHByLCBkYXQuY292KQoKcmVzaWR1YWwuZXhwciA8LSBsYXBwbHkocmVzaWR1YWwuZXhwci5kb2ZbMSxdLCBmdW5jdGlvbih4KSB4KQptb2RlbC5kb2YgPC0gbGFwcGx5KHJlc2lkdWFsLmV4cHIuZG9mWzIsXSwgZnVuY3Rpb24oeCkgeCkKCmBgYApOb3cgdGhhdCB3ZSBoYXZlIHRoZSBleHByZXNzaW9uIGRhdGEsIHJlc2lkdWFscyBmcm9tIHRoZSByZWdyZXNzaW9uIGFuZCBkb2YgLSB3ZSBjYW4gY29tcHV0ZSB0aGUgYWRqdXN0ZWQgcl4yLgpgYGB7cn0KdHNzIDwtIGxhcHBseShkYXQuZXhwciwgZnVuY3Rpb24oeCkgKG5vcm0oeCAtIHJvd01lYW5zKHgpLCB0eXBlID0gIkYiKSleMikKcnNzIDwtIGxhcHBseShyZXNpZHVhbC5leHByLCBmdW5jdGlvbih4KSAobm9ybSh4LCB0eXBlID0gIkYiKSleMikKCnRvdGFsLmNvdmFyaWF0ZS5wdmUgPC0gdmVjdG9yKCJudW1lcmljIiwgbGVuZ3RoID0gbGVuZ3RoKGRhdC5leHByKSkKbmFtZXModG90YWwuY292YXJpYXRlLnB2ZSkgPC0gbmFtZXMoZGF0LmV4cHIpCmZvcihpIGluIDE6bGVuZ3RoKHRvdGFsLmNvdmFyaWF0ZS5wdmUpKXsKICBuIDwtIG5jb2woZGF0LmV4cHJbW2ldXSkKICByMiA8LSAodHNzW1tpXV0gLSByc3NbW2ldXSkvdHNzW1tpXV0KICB0b3RhbC5jb3ZhcmlhdGUucHZlW2ldIDwtIDEgLSAoKDEtcjIpICogKChuIC0gMSkgLyBtb2RlbC5kb2ZbW2ldXSkpCn0KCnRvdGFsLmNvdmFyaWF0ZS5wdmUKYGBgCg==
- - - -
- - - - - - - -