##根據DAVID結果做圖GOterm分析,數(shù)據格式從DAVID中下載检碗,先保存至txt,后用excel打開平窘,再保存為CSV格式
x<-read.csv(file = "C:\\Users\\zhouwenqing789\\Desktop\\乳腺癌TCGA數(shù)據庫20191226\\test\\GOTerm.csv",stringsAsFactor=F,header=T)
head(x)
x<-x[x$PValue<0.05,]
x_go<-x[,1:5]
xbp<-x_go[grep("BP",x_go$Category),]
xcc<-x_go[grep("CC",x_go$Category),]
xmf<-x_go[grep("MF",x_go$Category),]
xkegg<-x_go[grep("KEGG",x_go$Category),]
##通過正則表達式將Term格式整理一下
xbp$Term<-gsub(".*\\~","",xbp$Term)
xcc$Term<-gsub(".*\\~","",xcc$Term)
xmf$Term<-gsub(".*\\~","",xmf$Term)
xkegg$Term<-gsub(".*\\:","",xkegg$Term)
library(ggplot2)
make_GO_bubble<-function(go_data,term_name){
? #選擇TOP10的數(shù)據(count)
? GO_DATA<-go_data[order(go_data$Count,decreasing = T),]
? GO_DATA<-head(GO_DATA,10)
? #思維數(shù)據的展示
? p<-ggplot(GO_DATA,aes(X.,Term))
? bubble<-p+geom_point(aes(size=Count,color=-log(PValue)))
? #自定義漸變顏色
? bubble<-bubble+scale_color_gradient(low = "green",high = "red")
? #改變圖片的樣式(主題)
? pr<-bubble+theme_test(base_size = 16,base_rect_size = 1)
? pr<-pr+labs(x="Rich factor",y=term_name,title = "Enrichment of DEGS")
? return(pr)
}
#BP
make_GO_bubble(xbp,term_name = "Biological Process")
make_GO_bubble(xcc,term_name = "Cell Component")
make_GO_bubble(xmf,term_name = "Molecular Function")
make_GO_bubble(xkegg,term_name = "KEGG pathway")