Skip to content

Latest commit

 

History

History
114 lines (99 loc) · 2.88 KB

Fig_S8_Stem_cell_signature.md

File metadata and controls

114 lines (99 loc) · 2.88 KB
title author date output
stem cell signature
Laura Wolbeck
2024-07-02
html_document

setup

library(magrittr)
library(clusterProfiler)
library(ggplot2)

prepare TERM2GENE data.frame

using genes from Cheung and Rando

quiescent_genes <- c("Ccnd3", "Pdk1","Smarca2", "Foxo3", "Ezh1", "Prdm5","Ptov1", "Zfp30", "Zbtb20","Phf1", "Ctdsp1", "Thra", "Tef", "Dicer1", "Crebrf", "Bcas3", "Ddx3y", "Gabarapl1", "Nop53", "Itm2a", "Il18", "Zyx", "Ephx1", "Clstn1", "Gstk1", "Cdip1", "Ddt", "Ivd", "Fhl1", "Ndrg2", "Grina","Pik3r1", "Fyn", "Chkb", "Pink1", "Ulk2", "Dnajb9", "Pfdn5", "Ctsf", "Crim1", "Selenop", "Gabbr1", "Grb10", "Bbs2", "Rps14", "Igf2r", "Selenbp1", "Rnf167", "Map1lc3a")
active_genes <- c("Anln", "Birc5", "Ccna2","Ccnb1", "Ccne2", "Sgo1", "Mcm4", "Pcna", "Rrm2", "Top2a", "Cycs", "Mtch2", "Slc25a5", 	"H2afz", "Hat1", "Ddx39", 	"Pclaf", "Capza1", "Hadhb", "Idh3a", "Kpna2", "Pgk1")

TERM2GENE is a data.frame with first column of term ID and second column of corresponding mapped gene

term2gene <- data.frame(Term = replicate(49, "Quiescent stem cell signature"), Gene = quiescent_genes)
term2gene <- rbind(term2gene, data.frame(Term = replicate(22, "Active stem cell signature"), Gene = active_genes))
saveRDS(term2gene, "term2gene.rds")

Fig S8B: fullterm samples

cao <- readRDS("cao_fullterm_DEG2.rds")

taking all DEG (also non-significant) of RG

RG_DEG <-  cao$test.results$de$RG$res
RG_DEG <- RG_DEG$log2FoldChange
names(RG_DEG) <- cao$test.results$de$RG$res$Gene

sort genes by log2fold change

RG_DEG %<>% sort(decreasing = TRUE)
set.seed(123)
res <- clusterProfiler::GSEA(RG_DEG, TERM2GENE = term2gene, pvalueCutoff = 1)
summary(res)
clusterProfiler::dotplot(res)+ facet_grid(.~.sign) + ggtitle("Fullterm")
ggsave("Signature_fullterm.pdf", height=4)

late timepoints

cao <- readRDS("cao_late_DEG2.rds")

taking only DEG of RG

RG_DEG <-  cao$test.results$de$RG$res
RG_DEG <- RG_DEG$log2FoldChange
names(RG_DEG) <- cao$test.results$de$RG$res$Gene
RG_DEG %<>% sort(decreasing = TRUE)
set.seed(123)
res <- clusterProfiler::GSEA(RG_DEG, TERM2GENE = term2gene, pvalueCutoff = 1)
summary(res)
clusterProfiler::dotplot(res)+ facet_grid(.~.sign) + ggtitle("Late timepoints")
ggsave("Signature_late.pdf", height=4)

early timepoints

cao <- readRDS("cao_early_DEG2.rds")

taking only DEG of RG

RG_DEG <-  cao$test.results$de$RG$res
RG_DEG <- RG_DEG$log2FoldChange
names(RG_DEG) <- cao$test.results$de$RG$res$Gene
RG_DEG %<>% sort(decreasing = TRUE)
set.seed(123)
res <- clusterProfiler::GSEA(RG_DEG, TERM2GENE = term2gene, pvalueCutoff = 1)
summary(res)
clusterProfiler::dotplot(res)+ facet_grid(.~.sign) + ggtitle("Early timepoints")
ggsave("Signature_early.pdf", height=4)