管理系统开发资讯 Bulk RNA(庸俗转录组)多组各异基因分析函数(视频教程)
发布日期:2024-09-28 13:24 点击次数:182
图片管理系统开发资讯
然后咱们测试一下:领先是两组等相通样本,很节略!
setwd('D:\\KS步地\\公众号著述\\Bulk多组各异基因分析函数')#一、两组分析(样本数卓越)-------------------------------------------------------------------df1 <- read.csv("Two_group.csv", header = T, row.names = 1)colnames(df1)# [1] "Cancer1" "Cancer2" "Cancer3" "Health1" "Health2" "Health3"meta1 <- data.frame(Cancer=c("Cancer1" ,"Cancer2" ,"Cancer3"), Health=c("Health1", "Health2", "Health3"))deg1_Deseq2 <- KS_bulkRNA_MultiGroup_DEGs(exprSet = df1, meta = meta1, methods = "DESeq2", test = "Cancer", control = "Health", repNum1 = 3, repNum2 = 3)deg1_edgeR <- KS_bulkRNA_MultiGroup_DEGs(exprSet = df1, meta = meta1, methods = "edgeR", test = "Cancer", control = "Health", repNum1 = 3, repNum2 = 3)deg1_limma <- KS_bulkRNA_MultiGroup_DEGs(exprSet = df1, meta = meta1, methods = "limma", test = "Cancer", control = "Health", repNum1 = 3, repNum2 = 3)
相通数不等的两组样天职析亦然如斯,独一诞生好test和control即可:
#二、两组分析(样本数不同)-------------------------------------------------------------------df4 <- read.csv("two_diff_group.csv", header = T, row.names = 1)colnames(df4)# [1] "HC_1" "HC_2" "HC_3" "HC_4" "PPC_1" "PPC_2" "PPC_3" "PPC_4" "PPC_5" "PPC_6"meta4 <- data.frame(HC=c("HC_1","HC_2","HC_3","HC_4","",""), PPC=c("PPC_1","PPC_2","PPC_3","PPC_4","PPC_5","PPC_6"))deg4_Deseq2 <- KS_bulkRNA_MultiGroup_DEGs(exprSet = df4, meta = meta4, methods = "DESeq2", test = "PPC", control = "HC", repNum1 = 6, repNum2 = 4)deg4_edgeR <- KS_bulkRNA_MultiGroup_DEGs(exprSet = df4, meta = meta4, methods = "edgeR", test = "PPC", control = "HC", repNum1 = 6, repNum2 = 4)deg4_limma <- KS_bulkRNA_MultiGroup_DEGs(exprSet = df4, meta = meta4, methods = "limma", test = "PPC", control = "HC", repNum1 = 6, repNum2 = 4)
咱们不错对比下三种圭臬各异基因后果,发现细目不是透顶通常,管理系统开发资讯那是因为算法不通常,无用纠结。在咱们这个数据内部不错看出,DEseq2和edgeR的后果重合照旧挺多的。
#韦恩图deg4_Deseq2_sig <- deg4_Deseq2[which(abs(deg4_Deseq2$log2FoldChange)>0 & deg4_Deseq2$pvalue <=0.05),]deg4_edgeR_sig <- deg4_edgeR[which(abs(deg4_edgeR$logFC)>0 & deg4_edgeR$PValue <=0.05),]deg4_limma_sig <- deg4_limma[which(abs(deg4_limma$logFC)>0 & deg4_limma$P.Value <=0.05),]library(ggvenn)library(tidyverse)Venn_list <- list(deg4_Deseq2_sig=rownames(deg4_Deseq2_sig), deg4_edgeR_sig=rownames(deg4_edgeR_sig), deg4_limma_sig=rownames(deg4_limma_sig))#使用list_to_data_frame将list挪动为data.framedata_veen = list_to_data_frame(Venn_list)ggvenn(Venn_list, show_percentage = T, show_elements = F, text_size=3, digits = 1, set_name_size=4, stroke_color = "grey30", fill_color = c("#FF8C00","#4DAF4A","#B64E89"), set_name_color = c("#FF8C00","#4DAF4A","#B64E89"))
图片
奇偶比分析:近十期奇偶比为26:24,奇数码出现概率较热。本期看好奇数号码出现概率走高,参考奇偶比4:1。
1 三区分析(三区划分:一区01-12段12码,二区13-24段12码,三区25-35段11码)
多组样本的分析就更节略了:大多诞生皆诞生好了。这里需要强调少量,那即是关于多组样本,在进行meta诞生的时分,test组靠前,control靠后!
小程序开发#四、多组test------------------------------------------------------------------df3 <- read.csv("count_gene.csv", header = T, row.names = 1, check.names = F)colnames(df3)# [1] "Fbrain 1" "Fbrain 2" "Fbrain 3" "Fbrain 4" "Fhom 1" "Fhom 2" "Fhom 3" # [8] "Mbrain 1" "Mbrain 2" "Mbrain 3" "Mbrain 4" "Mbrain 5" "Mhom 1" "Mhom 2" # [15] "Mhom 3" "Mhom 4" meta3 <- data.frame(Mhom = c("Mhom 1","Mhom 2", "Mhom 3","Mhom 4",""), Fhom = c("Fhom 1","Fhom 2","Fhom 3","",""), Mbrain=c("Mbrain 1","Mbrain 2","Mbrain 3","Mbrain 4","Mbrain 5"), Fbrain=c("Fbrain 1","Fbrain 2","Fbrain 3","Fbrain 4",""))deg3_Deseq2 <- KS_bulkRNA_MultiGroup_DEGs(exprSet = df3, meta = meta3, methods = "DESeq2", separator=" ")deg3_edgeR <- KS_bulkRNA_MultiGroup_DEGs(exprSet = df3, meta = meta3, methods = "edgeR", separator=" ")deg3_limma <- KS_bulkRNA_MultiGroup_DEGs(exprSet = df3, meta = meta3, methods = "limma", separator=" ")
图片
本站仅提供存储就业,扫数践诺均由用户发布,如发现存害或侵权践诺,请点击举报。