#only PCG #ENSMUSG00000079102 Dab2 1797 protein_coding #ENSMUSG00000022150 Dab2 2776.27 protein_coding setwd("~/bak/doc/fleming/kafasla/DKlab/mr/rnaseq-vs-polysomeseq/") require(edgeR) bt=read.table("/data/results/reference/mmu/Mus_musculus.NCBIM37.64-toMM9.transcript-gene_name.txt",sep="\t") rownames(bt)=bt$V2; %bt=bt[,(names(x) %in% c("V2","V4")] bt2=cbind(substring(bt[,2],2),as.character(bt[,4])) colnames(bt2)=c("EnsemblID","biotype") rownames(bt2)=bt2[,1] bt4=bt2[bt2[,2]=="protein_coding",] #bt4=bt2[bt2$biotype=="protein_coding",] bt3=bt2[!duplicated(rownames(bt2)),] rownames(bt3)=bt3[,1] gl=read.table("~/bak/doc/fleming/kafasla/DKlab/mr/rnaseq/deg/Mus_musculus.NCBIM37.64-toMM9.gene-lenghts.txt",sep="\t") gl.names=gl$V1; rownames(gl)=gl$V1 colnames(gl)=c("ID","geneID","genelength"); #poly1= read.table("gene_counts_merged_k20_NCBIM37.64.txt",header=T,sep="\t",skip=1) poly1= read.table("~/bak/doc/fleming/kafasla/DKlab/mr/Polysomes/deg/gene_counts_merged_NCBIM37.64_id.txt",header=T,sep="\t",skip=1) poly0 =poly1[,7:dim(poly1)[2]]; rownames(poly0)=poly1$Geneid; col_ordering = c(1,2,11,12)#0h poly =poly0[,col_ordering]; poly = poly[(rowSums(poly[,1:2])>=2)&(rowSums(poly[,3:4])>=2),] #poly2=merge(x=poly,y=bt3,by="row.names",all.x=TRUE) poly=poly[rownames(poly) %in% bt4[,1],] conditions = factor(c("KO","KO","WT","WT")); exp_study = DGEList(counts=poly, group=conditions);exp_study = calcNormFactors(exp_study);exp_study = estimateCommonDisp(exp_study);exp_study = estimateTagwiseDisp(exp_study);et = exactTest(exp_study,pair=c("WT","KO")) tTags = topTags(et,n=NULL,adjust.method = "fdr") #r <- rownames(topTags(et)$table) r <- rownames(tTags) c=cpm(exp_study)[r, order(exp_study$samples$group)] #x=cbind(as.data.frame(tTags),r) #x=cbind(as.data.frame(tTags), gl[r,2],gl[r,3]) x=merge(x=as.data.frame(tTags),y=gl,by="row.names",all.x=TRUE) rownames(x)=x$Row.names x=x[,!(names(x) %in% c("Row.names","ID"))] i=as.data.frame(c) x1=merge(x=x,y=i,by="row.names",all.x=TRUE) x=cbind(x1,1000*x1[,8]/x$genelength,1000*x1[,9]/x$genelength,1000*x1[,10]/x$genelength,1000*x1[,11]/x$genelength) x=cbind(x,0.5*(x[,12]+x[,13]),0.5*(x[,14]+x[,15])) colnames(x)=c("EnsemblID", "logFC", "logCPM", "PValue", "FDR", "geneID", "genelength", "CPM_KO_0h_replicate_I", "CPM_KO_0h_replicate_II", "CPM_WT_0h_replicate_I", "CPM_WT_0h_replicate_II", "RPKM_KO_0h_replicate_I", "RPKM_KO_0h_replicate_II", "RPKM_WT_0h_replicate_I", "RPKM_WT_0h_replicate_II", "RPKM_KO_0h", "RPKM_WT_0h") #x1=merge(x=x,y=bt2,by="EnsemblID",all.x=TRUE) write.table(x, file="edgeRgenesPolyExpr-0h_pcg.csv",quote=FALSE,row.names=FALSE,sep="\t") x_m0=x print ("P-m0") #-1 means WT > KO # 1 means KO > WT summary(de <- decideTestsDGE(et, p=0.05,adjust.method="none")) summary(de <- decideTestsDGE(et, p=0.05,adjust.method="BH")) summary(de <- decideTestsDGE(et, p=0.1,adjust.method="BH")) for (i in 8:11){ print (colnames(x)[i]) tt=summary(x[,i]>0) print(tt) } for (i in 12:15){ print (colnames(x)[i]) tt=summary(x[,i]>1) print(tt) } col_ordering = c(3,4,13,14)#2h poly =poly0[,col_ordering]; poly = poly[(rowSums(poly[,1:2])>=2)&(rowSums(poly[,3:4])>=2),] poly=poly[rownames(poly) %in% bt4[,1],] conditions = factor(c("KO","KO","WT","WT")); exp_study = DGEList(counts=poly, group=conditions);exp_study = calcNormFactors(exp_study);exp_study = estimateCommonDisp(exp_study);exp_study = estimateTagwiseDisp(exp_study);et = exactTest(exp_study,pair=c("WT","KO")) tTags = topTags(et,n=NULL,adjust.method = "fdr") #r <- rownames(topTags(et)$table) r <- rownames(tTags) c=cpm(exp_study)[r, order(exp_study$samples$group)] #x=cbind(as.data.frame(tTags),r) #x=cbind(as.data.frame(tTags), gl[r,2],gl[r,3]) x=merge(x=as.data.frame(tTags),y=gl,by="row.names",all.x=TRUE) rownames(x)=x$Row.names x=x[,!(names(x) %in% c("Row.names","ID"))] i=as.data.frame(c) x1=merge(x=x,y=i,by="row.names",all.x=TRUE) x=cbind(x1,1000*x1[,8]/x$genelength,1000*x1[,9]/x$genelength,1000*x1[,10]/x$genelength,1000*x1[,11]/x$genelength) x=cbind(x,0.5*(x[,12]+x[,13]),0.5*(x[,14]+x[,15])) colnames(x)=c("EnsemblID", "logFC", "logCPM", "PValue", "FDR", "geneID", "genelength", "CPM_KO_2h_replicate_I", "CPM_KO_2h_replicate_II", "CPM_WT_2h_replicate_I", "CPM_WT_2h_replicate_II", "RPKM_KO_2h_replicate_I", "RPKM_KO_2h_replicate_II", "RPKM_WT_2h_replicate_I", "RPKM_WT_2h_replicate_II", "RPKM_KO_2h", "RPKM_WT_2h")#2h #x=merge(x=x,y=bt2,by="EnsemblID",all.x=TRUE) write.table(x, file="edgeRgenesPolyExpr-2h_pcg.csv",quote=FALSE,row.names=FALSE) x_2h=x print ("P-2h") summary(de <- decideTestsDGE(et, p=0.05,adjust.method="none")) summary(de <- decideTestsDGE(et, p=0.05,adjust.method="BH")) summary(de <- decideTestsDGE(et, p=0.1,adjust.method="BH")) for (i in 8:11){ print (colnames(x)[i]) tt=summary(x[,i]>0) print(tt) } for (i in 12:15){ print (colnames(x)[i]) tt=summary(x[,i]>1) print(tt) } col_ordering = c(5,6,15,16)#6h poly =poly0[,col_ordering]; poly = poly[(rowSums(poly[,1:2])>=2)&(rowSums(poly[,3:4])>=2),] poly=poly[rownames(poly) %in% bt4[,1],] conditions = factor(c("KO","KO","WT","WT")); exp_study = DGEList(counts=poly, group=conditions);exp_study = calcNormFactors(exp_study);exp_study = estimateCommonDisp(exp_study);exp_study = estimateTagwiseDisp(exp_study);et = exactTest(exp_study,pair=c("WT","KO")) tTags = topTags(et,n=NULL,adjust.method = "fdr") #r <- rownames(topTags(et)$table) r <- rownames(tTags) c=cpm(exp_study)[r, order(exp_study$samples$group)] #x=cbind(as.data.frame(tTags),r) #x=cbind(as.data.frame(tTags), gl[r,2],gl[r,3]) x=merge(x=as.data.frame(tTags),y=gl,by="row.names",all.x=TRUE) rownames(x)=x$Row.names x=x[,!(names(x) %in% c("Row.names","ID"))] i=as.data.frame(c) x1=merge(x=x,y=i,by="row.names",all.x=TRUE) x=cbind(x1,1000*x1[,8]/x$genelength,1000*x1[,9]/x$genelength,1000*x1[,10]/x$genelength,1000*x1[,11]/x$genelength) x=cbind(x,0.5*(x[,12]+x[,13]),0.5*(x[,14]+x[,15])) colnames(x)=c("EnsemblID", "logFC", "logCPM", "PValue", "FDR", "geneID", "genelength", "CPM_KO_6h_replicate_I", "CPM_KO_6h_replicate_II", "CPM_WT_6h_replicate_I", "CPM_WT_6h_replicate_II", "RPKM_KO_6h_replicate_I", "RPKM_KO_6h_replicate_II", "RPKM_WT_6h_replicate_I", "RPKM_WT_6h_replicate_II", "RPKM_KO_6h", "RPKM_WT_6h")#6h #x=merge(x=x,y=bt2,by="EnsemblID",all.x=TRUE) write.table(x, file="edgeRgenesPolyExpr-6h_pcg.csv",quote=FALSE,row.names=FALSE) x_6h=x print ("P-6h") summary(de <- decideTestsDGE(et, p=0.05,adjust.method="none")) summary(de <- decideTestsDGE(et, p=0.05,adjust.method="BH")) summary(de <- decideTestsDGE(et, p=0.1,adjust.method="BH")) for (i in 8:11){ print (colnames(x)[i]) tt=summary(x[,i]>0) print(tt) } for (i in 12:15){ print (colnames(x)[i]) tt=summary(x[,i]>1) print(tt) } col_ordering = c(7,8,17,18)#IFN poly =poly0[,col_ordering]; poly = poly[(rowSums(poly[,1:2])>=2)&(rowSums(poly[,3:4])>=2),] poly=poly[rownames(poly) %in% bt4[,1],] conditions = factor(c("KO","KO","WT","WT")); exp_study = DGEList(counts=poly, group=conditions);exp_study = calcNormFactors(exp_study);exp_study = estimateCommonDisp(exp_study);exp_study = estimateTagwiseDisp(exp_study);et = exactTest(exp_study,pair=c("WT","KO")) tTags = topTags(et,n=NULL,adjust.method = "fdr") #r <- rownames(topTags(et)$table) r <- rownames(tTags) c=cpm(exp_study)[r, order(exp_study$samples$group)] #x=cbind(as.data.frame(tTags),r) #x=cbind(as.data.frame(tTags), gl[r,2],gl[r,3]) x=merge(x=as.data.frame(tTags),y=gl,by="row.names",all.x=TRUE) rownames(x)=x$Row.names x=x[,!(names(x) %in% c("Row.names","ID"))] i=as.data.frame(c) x1=merge(x=x,y=i,by="row.names",all.x=TRUE) x=cbind(x1,1000*x1[,8]/x$genelength,1000*x1[,9]/x$genelength,1000*x1[,10]/x$genelength,1000*x1[,11]/x$genelength) x=cbind(x,0.5*(x[,12]+x[,13]),0.5*(x[,14]+x[,15])) colnames(x)=c("EnsemblID", "logFC", "logCPM", "PValue", "FDR", "geneID", "genelength", "CPM_KO_m1_replicate_I", "CPM_KO_m1_replicate_II", "CPM_WT_m1_replicate_I", "CPM_WT_m1_replicate_II", "RPKM_KO_m1_replicate_I", "RPKM_KO_m1_replicate_II", "RPKM_WT_m1_replicate_I", "RPKM_WT_m1_replicate_II", "RPKM_KO_m1", "RPKM_WT_m1")#m1 #x=merge(x=x,y=bt2,by="EnsemblID",all.x=TRUE) write.table(x, file="edgeRgenesPolyExpr-IFN_pcg.csv") print ("P-m1") summary(de <- decideTestsDGE(et, p=0.05,adjust.method="none")) summary(de <- decideTestsDGE(et, p=0.05,adjust.method="BH")) summary(de <- decideTestsDGE(et, p=0.1,adjust.method="BH")) x_m1=x for (i in 8:11){ print (colnames(x)[i]) tt=summary(x[,i]>0) print(tt) } for (i in 12:15){ print (colnames(x)[i]) tt=summary(x[,i]>1) print(tt) } summary(de <- decideTestsDGE(et, p=0.05)) #-1 24 #0 19748 #1 34 col_ordering = c(9,10,19,20)#IL4 poly =poly0[,col_ordering]; poly = poly[(rowSums(poly[,1:2])>=2)&(rowSums(poly[,3:4])>=2),] poly=poly[rownames(poly) %in% bt4[,1],] conditions = factor(c("KO","KO","WT","WT")); exp_study = DGEList(counts=poly, group=conditions);exp_study = calcNormFactors(exp_study);exp_study = estimateCommonDisp(exp_study);exp_study = estimateTagwiseDisp(exp_study);et = exactTest(exp_study,pair=c("WT","KO")) tTags = topTags(et,n=NULL,adjust.method = "fdr") #r <- rownames(topTags(et)$table) r <- rownames(tTags) c=cpm(exp_study)[r, order(exp_study$samples$group)] #x=cbind(as.data.frame(tTags),r) #x=cbind(as.data.frame(tTags), gl[r,2],gl[r,3]) x=merge(x=as.data.frame(tTags),y=gl,by="row.names",all.x=TRUE) rownames(x)=x$Row.names x=x[,!(names(x) %in% c("Row.names","ID"))] i=as.data.frame(c) x1=merge(x=x,y=i,by="row.names",all.x=TRUE) x=cbind(x1,1000*x1[,8]/x$genelength,1000*x1[,9]/x$genelength,1000*x1[,10]/x$genelength,1000*x1[,11]/x$genelength) x=cbind(x,0.5*(x[,12]+x[,13]),0.5*(x[,14]+x[,15])) colnames(x)=c("EnsemblID", "logFC", "logCPM", "PValue", "FDR", "geneID", "genelength", "CPM_KO_m2_replicate_I", "CPM_KO_m2_replicate_II", "CPM_WT_m2_replicate_I", "CPM_WT_m2_replicate_II", "RPKM_KO_m2_replicate_I", "RPKM_KO_m2_replicate_II", "RPKM_WT_m2_replicate_I", "RPKM_WT_m2_replicate_II", "RPKM_KO_m2", "RPKM_WT_m2")#m2 #x=merge(x=x,y=bt2,by="EnsemblID",all.x=TRUE) #x=x[!duplicated(x),] write.table(x, file="edgeRgenesPolyExpr-IL4_pcg.csv") x_m2=x print ("P-m2") summary(de <- decideTestsDGE(et, p=0.05,adjust.method="none")) summary(de <- decideTestsDGE(et, p=0.05,adjust.method="BH")) summary(de <- decideTestsDGE(et, p=0.1,adjust.method="BH")) #dim(x_m2) for (i in 8:11){ print (colnames(x)[i]) tt=summary(x[,i]>0) print(tt) } for (i in 12:15){ print (colnames(x)[i]) tt=summary(x[,i]>1) print(tt) } #write.table(x, file="edgeRgenesExpr-IL4_pcg.csv") summary(de <- decideTestsDGE(et, p=0.05)) #-1 215 #0 18093 #1 106 #summary(de <- decideTestsDGE(et, p=0.05,adjust.method="none")) #rnaseq data rnaseqMatrix1= read.table("~/bak/doc/fleming/kafasla/DKlab/mr/rnaseq/stringtie2/gene_counts_merged_k20_NCBIM37.64_id.txt",header=T,sep="\t",skip=1) rnaseqMatrix0 =rnaseqMatrix1[,7:dim(rnaseqMatrix1)[2]]; rownames(rnaseqMatrix0)=rnaseqMatrix1$Geneid; col_ordering = c(11,12,1,2)#0h rnaseqMatrix =rnaseqMatrix0[,col_ordering]; rnaseqMatrix = rnaseqMatrix[(rowSums(rnaseqMatrix[,1:2])>=2)&(rowSums(rnaseqMatrix[,3:4])>=2),] #rnaseqMatrix = rnaseqMatrix[rowSums(rnaseqMatrix)>=2,] rnaseqMatrix=rnaseqMatrix[rownames(poly) %in% bt4[,1],] conditions = factor(c("KO","KO","WT","WT")); exp_study = DGEList(counts=rnaseqMatrix, group=conditions);exp_study = calcNormFactors(exp_study);exp_study = estimateCommonDisp(exp_study);exp_study = estimateTagwiseDisp(exp_study);et = exactTest(exp_study,pair=c("WT","KO")) #exp2=vst(exp_study) tTags = topTags(et,n=NULL,adjust.method = "fdr") #r <- rownames(topTags(et)$table) r <- rownames(tTags) c=cpm(exp_study)[r, order(exp_study$samples$group)] #rx=cbind(as.data.frame(tTags), gl[rownames(tTags),2],gl[rownames(tTags),3],c,1000*c/gl[rownames(tTags),3]) rx=merge(x=as.data.frame(tTags),y=gl,by="row.names",all.x=TRUE) rownames(rx)=rx$Row.names rx=rx[,!(names(rx) %in% c("Row.names","ID"))] i=as.data.frame(c) x1=merge(x=rx,y=i,by="row.names",all.x=TRUE) rx=cbind(x1,1000*x1[,8]/rx$genelength,1000*x1[,9]/rx$genelength,1000*x1[,10]/rx$genelength,1000*x1[,11]/rx$genelength) rx=cbind(rx,0.5*(rx[,12]+rx[,13]),0.5*(rx[,14]+rx[,15])) colnames(rx)=c("EnsemblID", "logFC", "logCPM", "PValue", "FDR", "geneID", "genelength", "CPM_KO_0h_replicate_I", "CPM_KO_0h_replicate_II", "CPM_WT_0h_replicate_I", "CPM_WT_0h_replicate_II", "RPKM_KO_0h_replicate_I", "RPKM_KO_0h_replicate_II", "RPKM_WT_0h_replicate_I", "RPKM_WT_0h_replicate_II", "RPKM_KO_0h", "RPKM_WT_0h") #rx=merge(x=rx,y=bt2,by="EnsemblID",all.x=TRUE) write.table(rx, file="edgeRgenesExpr-0h_pcg.csv",quote=FALSE,row.names=FALSE) rx_m0=rx print ("R-m0") summary(de <- decideTestsDGE(et, p=0.05,adjust.method="none")) summary(de <- decideTestsDGE(et, p=0.05,adjust.method="BH")) summary(de <- decideTestsDGE(et, p=0.1,adjust.method="BH")) for (i in 8:11){ print (colnames(rx)[i]) tt=summary(rx[,i]>0) print(tt) } for (i in 12:15){ print (colnames(rx)[i]) tt=summary(rx[,i]>1) print(tt) } col_ordering = c(13,14,3,4)#2h rnaseqMatrix =rnaseqMatrix0[,col_ordering]; rnaseqMatrix = rnaseqMatrix[(rowSums(rnaseqMatrix[,1:2])>=2)&(rowSums(rnaseqMatrix[,3:4])>=2),] #rnaseqMatrix = rnaseqMatrix[rowSums(rnaseqMatrix)>=2,] rnaseqMatrix=rnaseqMatrix[rownames(poly) %in% bt4[,1],] conditions = factor(c("KO","KO","WT","WT")); exp_study = DGEList(counts=rnaseqMatrix, group=conditions);exp_study = calcNormFactors(exp_study);exp_study = estimateCommonDisp(exp_study);exp_study = estimateTagwiseDisp(exp_study);et = exactTest(exp_study,pair=c("WT","KO")) tTags = topTags(et,n=NULL,adjust.method = "fdr") r <- rownames(tTags) c=cpm(exp_study)[r, order(exp_study$samples$group)] rx=merge(x=as.data.frame(tTags),y=gl,by="row.names",all.x=TRUE) rownames(rx)=rx$Row.names rx=rx[,!(names(rx) %in% c("Row.names","ID"))] i=as.data.frame(c) x1=merge(x=rx,y=i,by="row.names",all.x=TRUE) rx=cbind(x1,1000*x1[,8]/rx$genelength,1000*x1[,9]/rx$genelength,1000*x1[,10]/rx$genelength,1000*x1[,11]/rx$genelength) rx=cbind(rx,0.5*(rx[,12]+rx[,13]),0.5*(rx[,14]+rx[,15])) colnames(rx)=c("EnsemblID", "logFC", "logCPM", "PValue", "FDR", "geneID", "genelength", "CPM_KO_2h_replicate_I", "CPM_KO_2h_replicate_II", "CPM_WT_2h_replicate_I", "CPM_WT_2h_replicate_II", "RPKM_KO_2h_replicate_I", "RPKM_KO_2h_replicate_II", "RPKM_WT_2h_replicate_I", "RPKM_WT_2h_replicate_II", "RPKM_KO_2h", "RPKM_WT_2h")#2h #rx=merge(x=rx,y=bt2,by="EnsemblID",all.x=TRUE) write.table(rx, file="edgeRgenesExpr-2h_pcg.csv",quote=FALSE,row.names=FALSE) rx_2h=rx print ("R-2h") summary(de <- decideTestsDGE(et, p=0.05,adjust.method="none")) summary(de <- decideTestsDGE(et, p=0.05,adjust.method="BH")) summary(de <- decideTestsDGE(et, p=0.1,adjust.method="BH")) for (i in 8:11){ print (colnames(rx)[i]) tt=summary(rx[,i]>0) print(tt) } for (i in 12:15){ print (colnames(rx)[i]) tt=summary(rx[,i]>1) print(tt) } col_ordering = c(15,16,5,6)#6h rnaseqMatrix =rnaseqMatrix0[,col_ordering]; rnaseqMatrix = rnaseqMatrix[(rowSums(rnaseqMatrix[,1:2])>=2)&(rowSums(rnaseqMatrix[,3:4])>=2),] #rnaseqMatrix = rnaseqMatrix[rowSums(rnaseqMatrix)>=2,] rnaseqMatrix=rnaseqMatrix[rownames(poly) %in% bt4[,1],] conditions = factor(c("KO","KO","WT","WT")); exp_study = DGEList(counts=rnaseqMatrix, group=conditions);exp_study = calcNormFactors(exp_study);exp_study = estimateCommonDisp(exp_study);exp_study = estimateTagwiseDisp(exp_study);et = exactTest(exp_study,pair=c("WT","KO")) tTags = topTags(et,n=NULL,adjust.method = "fdr") r <- rownames(tTags) c=cpm(exp_study)[r, order(exp_study$samples$group)] rx=merge(x=as.data.frame(tTags),y=gl,by="row.names",all.x=TRUE) rownames(rx)=rx$Row.names rx=rx[,!(names(rx) %in% c("Row.names","ID"))] i=as.data.frame(c) x1=merge(x=rx,y=i,by="row.names",all.x=TRUE) rx=cbind(x1,1000*x1[,8]/rx$genelength,1000*x1[,9]/rx$genelength,1000*x1[,10]/rx$genelength,1000*x1[,11]/rx$genelength) rx=cbind(rx,0.5*(rx[,12]+rx[,13]),0.5*(rx[,14]+rx[,15])) colnames(rx)=c("EnsemblID", "logFC", "logCPM", "PValue", "FDR", "geneID", "genelength", "CPM_KO_6h_replicate_I", "CPM_KO_6h_replicate_II", "CPM_WT_6h_replicate_I", "CPM_WT_6h_replicate_II", "RPKM_KO_6h_replicate_I", "RPKM_KO_6h_replicate_II", "RPKM_WT_6h_replicate_I", "RPKM_WT_6h_replicate_II", "RPKM_KO_6h", "RPKM_WT_6h")#6h #rx=merge(x=rx,y=bt2,by="EnsemblID",all.x=TRUE) write.table(rx, file="edgeRgenesExpr-6h_pcg.csv",quote=FALSE,row.names=FALSE) rx_6h=rx print ("R-6h") summary(de <- decideTestsDGE(et, p=0.05,adjust.method="none")) summary(de <- decideTestsDGE(et, p=0.05,adjust.method="BH")) summary(de <- decideTestsDGE(et, p=0.1,adjust.method="BH")) for (i in 8:11){ print (colnames(rx)[i]) tt=summary(rx[,i]>0) print(tt) } for (i in 12:15){ print (colnames(rx)[i]) tt=summary(rx[,i]>1) print(tt) } col_ordering = c(17,18,7,8)#IFN rnaseqMatrix =rnaseqMatrix0[,col_ordering]; rnaseqMatrix = rnaseqMatrix[(rowSums(rnaseqMatrix[,1:2])>=2)&(rowSums(rnaseqMatrix[,3:4])>=2),] #rnaseqMatrix = rnaseqMatrix[rowSums(rnaseqMatrix)>=2,] rnaseqMatrix=rnaseqMatrix[rownames(poly) %in% bt4[,1],] conditions = factor(c("KO","KO","WT","WT")); exp_study = DGEList(counts=rnaseqMatrix, group=conditions);exp_study = calcNormFactors(exp_study);exp_study = estimateCommonDisp(exp_study);exp_study = estimateTagwiseDisp(exp_study);et = exactTest(exp_study,pair=c("WT","KO")) tTags = topTags(et,n=NULL,adjust.method = "fdr") r <- rownames(tTags) c=cpm(exp_study)[r, order(exp_study$samples$group)] rx=merge(x=as.data.frame(tTags),y=gl,by="row.names",all.x=TRUE) rownames(rx)=rx$Row.names rx=rx[,!(names(rx) %in% c("Row.names","ID"))] i=as.data.frame(c) x1=merge(x=rx,y=i,by="row.names",all.x=TRUE) rx=cbind(x1,1000*x1[,8]/rx$genelength,1000*x1[,9]/rx$genelength,1000*x1[,10]/rx$genelength,1000*x1[,11]/rx$genelength) rx=cbind(rx,0.5*(rx[,12]+rx[,13]),0.5*(rx[,14]+rx[,15])) colnames(rx)=c("EnsemblID", "logFC", "logCPM", "PValue", "FDR", "geneID", "genelength", "CPM_KO_m1_replicate_I", "CPM_KO_m1_replicate_II", "CPM_WT_m1_replicate_I", "CPM_WT_m1_replicate_II", "RPKM_KO_m1_replicate_I", "RPKM_KO_m1_replicate_II", "RPKM_WT_m1_replicate_I", "RPKM_WT_m1_replicate_II", "RPKM_KO_m1", "RPKM_WT_m1")#m1 #rx=merge(x=rx,y=bt2,by="EnsemblID",all.x=TRUE) write.table(rx, file="edgeRgenesExpr-IFN_pcg.csv",quote=FALSE,row.names=FALSE) rx_m1=rx print ("R-m1") summary(de <- decideTestsDGE(et, p=0.05,adjust.method="none")) summary(de <- decideTestsDGE(et, p=0.05,adjust.method="BH")) summary(de <- decideTestsDGE(et, p=0.1,adjust.method="BH")) for (i in 8:11){ print (colnames(rx)[i]) tt=summary(rx[,i]>0) print(tt) } for (i in 12:15){ print (colnames(rx)[i]) tt=summary(rx[,i]>1) print(tt) } col_ordering = c(19,20,9,10)#IL4 rnaseqMatrix =rnaseqMatrix0[,col_ordering]; rnaseqMatrix = rnaseqMatrix[(rowSums(rnaseqMatrix[,1:2])>=2)&(rowSums(rnaseqMatrix[,3:4])>=2),] #rnaseqMatrix = rnaseqMatrix[rowSums(rnaseqMatrix)>=2,] rnaseqMatrix=rnaseqMatrix[rownames(poly) %in% bt4[,1],] conditions = factor(c("KO","KO","WT","WT")); exp_study = DGEList(counts=rnaseqMatrix, group=conditions);exp_study = calcNormFactors(exp_study);exp_study = estimateCommonDisp(exp_study);exp_study = estimateTagwiseDisp(exp_study);et = exactTest(exp_study,pair=c("WT","KO")) tTags = topTags(et,n=NULL,adjust.method = "fdr") r <- rownames(tTags) c=cpm(exp_study)[r, order(exp_study$samples$group)] rx=merge(x=as.data.frame(tTags),y=gl,by="row.names",all.x=TRUE) rownames(rx)=rx$Row.names rx=rx[,!(names(rx) %in% c("Row.names","ID"))] i=as.data.frame(c) x1=merge(x=rx,y=i,by="row.names",all.x=TRUE) rx=cbind(x1,1000*x1[,8]/rx$genelength,1000*x1[,9]/rx$genelength,1000*x1[,10]/rx$genelength,1000*x1[,11]/rx$genelength) rx=cbind(rx,0.5*(rx[,12]+rx[,13]),0.5*(rx[,14]+rx[,15])) colnames(rx)=c("EnsemblID", "logFC", "logCPM", "PValue", "FDR", "geneID", "genelength", "CPM_KO_m2_replicate_I", "CPM_KO_m2_replicate_II", "CPM_WT_m2_replicate_I", "CPM_WT_m2_replicate_II", "RPKM_KO_m2_replicate_I", "RPKM_KO_m2_replicate_II", "RPKM_WT_m2_replicate_I", "RPKM_WT_m2_replicate_II", "RPKM_KO_m2", "RPKM_WT_m2")#m2 #rx=merge(x=rx,y=bt2,by="EnsemblID",all.x=TRUE) write.table(rx, file="edgeRgenesExpr-IL4_pcg.csv",quote=FALSE,row.names=FALSE) rx_m2=rx print ("R-m2") summary(de <- decideTestsDGE(et, p=0.05,adjust.method="none")) summary(de <- decideTestsDGE(et, p=0.05,adjust.method="BH")) summary(de <- decideTestsDGE(et, p=0.1,adjust.method="BH")) all_m0=merge(x=rx_m0,y=x_m0,by="EnsemblID",all.x=T,all.y=T) write.table(all_m0, file="rna_poly_m0_pcg.csv",quote=FALSE,row.names=FALSE) all_m1=merge(x=rx_m1,y=x_m1,by="EnsemblID",all.x=T,all.y=T) write.table(all_m1, file="rna_poly_m1_pcg.csv",quote=FALSE,row.names=FALSE) all_m2=merge(x=rx_m2,y=x_m2,by="EnsemblID",all.x=T,all.y=T) write.table(all_m2, file="rna_poly_m2_pcg.csv",quote=FALSE,row.names=FALSE) all_2h=merge(x=rx_2h,y=x_2h,by="EnsemblID",all.x=T,all.y=T) write.table(all_2h, file="rna_poly_2h_pcg.csv",quote=FALSE,row.names=FALSE) all_6h=merge(x=rx_6h,y=x_6h,by="EnsemblID",all.x=T,all.y=T) write.table(all_6h, file="rna_poly_6h_pcg.csv",quote=FALSE,row.names=FALSE) #write DEG tables deg=all_m0[(all_m0$PValue.x<=0.05)&(!is.na(all_m0$PValue.x)),] write.table(deg, file="rna_poly_m0_rna_deg_pval_pcg.csv",quote=FALSE,row.names=FALSE) deg=all_m0[(all_m0$PValue.y<=0.05)&(!is.na(all_m0$PValue.y)),] write.table(deg, file="rna_poly_m0_poly_deg_pval_pcg.csv",quote=FALSE,row.names=FALSE) deg=all_m0[(all_m0$FDR.x<=0.05)&(!is.na(all_m0$FDR.x)),] write.table(deg, file="rna_poly_m0_rna_deg_fdr_0.05_pcg.csv",quote=FALSE,row.names=FALSE) deg=all_m0[(all_m0$FDR.y<=0.05)&(!is.na(all_m0$FDR.y)),] write.table(deg, file="rna_poly_m0_poly_deg_fdr_0.05_pcg.csv",quote=FALSE,row.names=FALSE) deg=all_m0[(all_m0$FDR.x<=0.1)&(!is.na(all_m0$FDR.x)),] write.table(deg, file="rna_poly_m0_rna_deg_fdr_0.1_pcg.csv",quote=FALSE,row.names=FALSE) deg=all_m0[(all_m0$FDR.y<=0.1)&(!is.na(all_m0$FDR.y)),] write.table(deg, file="rna_poly_m0_poly_deg_fdr_0.1_pcg.csv",quote=FALSE,row.names=FALSE) deg=all_m1[(all_m1$PValue.x<=0.05)&(!is.na(all_m1$PValue.x)),] write.table(deg, file="rna_poly_m1_rna_deg_pval_pcg.csv",quote=FALSE,row.names=FALSE) deg=all_m1[(all_m1$PValue.y<=0.05)&(!is.na(all_m1$PValue.y)),] write.table(deg, file="rna_poly_m1_poly_deg_pval_pcg.csv",quote=FALSE,row.names=FALSE) deg=all_m1[(all_m1$FDR.x<=0.05)&(!is.na(all_m1$FDR.x)),] write.table(deg, file="rna_poly_m1_rna_deg_fdr_0.05_pcg.csv",quote=FALSE,row.names=FALSE) deg=all_m1[(all_m1$FDR.y<=0.05)&(!is.na(all_m1$FDR.y)),] write.table(deg, file="rna_poly_m1_poly_deg_fdr_0.05_pcg.csv",quote=FALSE,row.names=FALSE) deg=all_m1[(all_m1$FDR.x<=0.1)&(!is.na(all_m1$FDR.x)),] write.table(deg, file="rna_poly_m1_rna_deg_fdr_0.1_pcg.csv",quote=FALSE,row.names=FALSE) deg=all_m1[(all_m1$FDR.y<=0.1)&(!is.na(all_m1$FDR.y)),] write.table(deg, file="rna_poly_m1_poly_deg_fdr_0.1_pcg.csv",quote=FALSE,row.names=FALSE) deg=all_m2[(all_m2$PValue.x<=0.05)&(!is.na(all_m2$PValue.x)),] write.table(deg, file="rna_poly_m2_rna_deg_pval_pcg.csv",quote=FALSE,row.names=FALSE) deg=all_m2[(all_m2$PValue.y<=0.05)&(!is.na(all_m2$PValue.y)),] write.table(deg, file="rna_poly_m2_poly_deg_pval_pcg.csv",quote=FALSE,row.names=FALSE) deg=all_m2[(all_m2$FDR.x<=0.05)&(!is.na(all_m2$FDR.x)),] write.table(deg, file="rna_poly_m2_rna_deg_fdr_0.05_pcg.csv",quote=FALSE,row.names=FALSE) deg=all_m2[(all_m2$FDR.y<=0.05)&(!is.na(all_m2$FDR.y)),] write.table(deg, file="rna_poly_m2_poly_deg_fdr_0.05_pcg.csv",quote=FALSE,row.names=FALSE) deg=all_m2[(all_m2$FDR.x<=0.1)&(!is.na(all_m2$FDR.x)),] write.table(deg, file="rna_poly_m2_rna_deg_fdr_0.1_pcg.csv",quote=FALSE,row.names=FALSE) deg=all_m2[(all_m2$FDR.y<=0.1)&(!is.na(all_m2$FDR.y)),] write.table(deg, file="rna_poly_m2_poly_deg_fdr_0.1_pcg.csv",quote=FALSE,row.names=FALSE) deg=all_2h[(all_2h$PValue.x<=0.05)&(!is.na(all_2h$PValue.x)),] write.table(deg, file="rna_poly_2h_rna_deg_pval_pcg.csv",quote=FALSE,row.names=FALSE) deg=all_2h[(all_2h$PValue.y<=0.05)&(!is.na(all_2h$PValue.y)),] write.table(deg, file="rna_poly_2h_poly_deg_pval_pcg.csv",quote=FALSE,row.names=FALSE) deg=all_2h[(all_2h$FDR.x<=0.05)&(!is.na(all_2h$FDR.x)),] write.table(deg, file="rna_poly_2h_rna_deg_fdr_0.05_pcg.csv",quote=FALSE,row.names=FALSE) deg=all_2h[(all_2h$FDR.y<=0.05)&(!is.na(all_2h$FDR.y)),] write.table(deg, file="rna_poly_2h_poly_deg_fdr_0.05_pcg.csv",quote=FALSE,row.names=FALSE) deg=all_2h[(all_2h$FDR.x<=0.1)&(!is.na(all_2h$FDR.x)),] write.table(deg, file="rna_poly_2h_rna_deg_fdr_0.1_pcg.csv",quote=FALSE,row.names=FALSE) deg=all_2h[(all_2h$FDR.y<=0.1)&(!is.na(all_2h$FDR.y)),] write.table(deg, file="rna_poly_2h_poly_deg_fdr_0.1_pcg.csv",quote=FALSE,row.names=FALSE) deg=all_6h[(all_6h$PValue.x<=0.05)&(!is.na(all_6h$PValue.x)),] write.table(deg, file="rna_poly_6h_rna_deg_pval_pcg.csv",quote=FALSE,row.names=FALSE) deg=all_6h[(all_6h$PValue.y<=0.05)&(!is.na(all_6h$PValue.y)),] write.table(deg, file="rna_poly_6h_poly_deg_pval_pcg.csv",quote=FALSE,row.names=FALSE) deg=all_6h[(all_6h$FDR.x<=0.05)&(!is.na(all_6h$FDR.x)),] write.table(deg, file="rna_poly_6h_rna_deg_fdr_0.05_pcg.csv",quote=FALSE,row.names=FALSE) deg=all_6h[(all_6h$FDR.y<=0.05)&(!is.na(all_6h$FDR.y)),] write.table(deg, file="rna_poly_6h_poly_deg_fdr_0.05_pcg.csv",quote=FALSE,row.names=FALSE) deg=all_6h[(all_6h$FDR.x<=0.1)&(!is.na(all_6h$FDR.x)),] write.table(deg, file="rna_poly_6h_rna_deg_fdr_0.1_pcg.csv",quote=FALSE,row.names=FALSE) deg=all_6h[(all_6h$FDR.y<=0.1)&(!is.na(all_6h$FDR.y)),] write.table(deg, file="rna_poly_6h_poly_deg_fdr_0.1_pcg.csv",quote=FALSE,row.names=FALSE) # t-tests th=2 lpWT_m2=all_m2[ abs(all_m2$logFC.x)