--- title: "09.GSEA" output: html_document date: '2022-07-18' --- #### GSEA analysis #### ```{r} options(stringsAsFactors = F) library(org.Hs.eg.db) library(clusterProfiler) library(enrichplot) library(tidyverse) library(ggstatsplot) library(dplyr) library(plyr) ``` ```{r,create genelist for GSEA} organism = 'hsa' OrgDb = 'org.Hs.eg.db' need_DEG <- res_tbl[,c(1,3,6)] colnames(need_DEG) <- c('gene','log2FoldChange','pvalue') need_DEG$SYMBOL <- need_DEG$gene #convert id df <- bitr(need_DEG$SYMBOL, fromType = "SYMBOL", toType = "ENTREZID", OrgDb = OrgDb) need_DEG <- merge(need_DEG, df, by='SYMBOL') #write.csv(need_DEG,'need_DEG.csv') geneList <- need_DEG$log2FoldChange names(geneList) <- need_DEG$ENTREZID geneList <- sort(geneList, decreasing = T) #descending order ``` ```{r, enrichement by clusterprofiler} KEGG_kk_entrez <- gseKEGG(geneList = geneList, organism = organism, pvalueCutoff = 0.05) KEGG_kk <- DOSE::setReadable(KEGG_kk_entrez, OrgDb=OrgDb, keyType='ENTREZID')#convert id #save(KEGG_kk_entrez, file = "./data/epithelium/by_cancer_by_pheno/BC/GSEA_KEGG_results.RData") #GSEA Hall markers ##define the TERM2GENE list from msigdb. #Homo sapiens or Mus musculus library(msigdbr) library(ExperimentHub) library(GSEABase) C2_t2g <- msigdbr(species = "Homo sapiens",#Homo sapiens or Mus musculus category = "C5"#, subcategory = "BP" ) %>% dplyr::select(gs_name, entrez_gene) head(C2_t2g) C2_kk_entrez <- GSEA(geneList, TERM2GENE = C2_t2g, pAdjustMethod = "BH", pvalueCutoff = 0.05 ) C2_kk <- DOSE::setReadable(C2_kk_entrez, OrgDb=OrgDb, keyType='ENTREZID') head(C2_kk) head(C2_kk@result) #write.csv(C2_kk@result, '~/Desktop/C5_0.05_GSEA.csv') ```