-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathPancancer_1C_IFNG_CD8.R
207 lines (197 loc) · 12.5 KB
/
Pancancer_1C_IFNG_CD8.R
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
library(dplyr)
library(Seurat)
library(patchwork)
BC_CD4.data <- read.table("D:/GSE156728/GSE156728_BC_10X.CD4.counts.txt",sep = "\t",header = TRUE,row.names = 1)
BCL_CD4.data <- read.table("D:/GSE156728/GSE156728_BCL_10X.CD4.counts.txt",sep = "\t",header = TRUE,row.names = 1)
ESCA_CD4.data <- read.table("D:/GSE156728/GSE156728_ESCA_10X.CD4.counts.txt",sep = "\t",header = TRUE,row.names = 1)
MM_CD4.data <- read.table("D:/GSE156728/GSE156728_MM_10X.CD4.counts.txt",sep = "\t",header = TRUE,row.names = 1)
PACA_CD4.data <- read.table("D:/GSE156728/GSE156728_PACA_10X.CD4.counts.txt",sep = "\t",header = TRUE,row.names = 1)
RC_CD4.data <- read.table("D:/GSE156728/GSE156728_RC_10X.CD4.counts.txt",sep = "\t",header = TRUE,row.names = 1)
THCA_CD4.data <- read.table("D:/GSE156728/GSE156728_THCA_10X.CD4.counts.txt",sep = "\t",header = TRUE,row.names = 1)
UCEC_CD4.data <- read.table("D:/GSE156728/GSE156728_UCEC_10X.CD4.counts.txt",sep = "\t",header = TRUE,row.names = 1)
OV_CD4.data <- read.table("D:/GSE156728/GSM4743199_OV_10X.CD4.counts.txt",sep = "\t",header = TRUE,row.names = 1)
FTC_CD4.data <- read.table("D:/GSE156728/GSM4743231_FTC_10X.CD4.counts.txt",sep = "\t",header = TRUE,row.names = 1)
CHOL_CD4.data <- read.table("D:/GSE156728/GSM4743237_CHOL_SS2.CD4.counts.txt",sep = "\t",header = TRUE,row.names = 1)
BC_CD8.data <- read.table("D:/GSE156728/GSE156728_BC_10X.CD8.counts.txt",sep = "\t",header = TRUE,row.names = 1)
BCL_CD8.data <- read.table("D:/GSE156728/GSE156728_BCL_10X.CD8.counts.txt",sep = "\t",header = TRUE,row.names = 1)
ESCA_CD8.data <- read.table("D:/GSE156728/GSE156728_ESCA_10X.CD8.counts.txt",sep = "\t",header = TRUE,row.names = 1)
MM_CD8.data <- read.table("D:/GSE156728/GSE156728_MM_10X.CD8.counts.txt",sep = "\t",header = TRUE,row.names = 1)
PACA_CD8.data <- read.table("D:/GSE156728/GSE156728_PACA_10X.CD8.counts.txt",sep = "\t",header = TRUE,row.names = 1)
RC_CD8.data <- read.table("D:/GSE156728/GSE156728_RC_10X.CD8.counts.txt",sep = "\t",header = TRUE,row.names = 1)
THCA_CD8.data <- read.table("D:/GSE156728/GSE156728_THCA_10X.CD8.counts.txt",sep = "\t",header = TRUE,row.names = 1)
UCEC_CD8.data <- read.table("D:/GSE156728/GSE156728_UCEC_10X.CD8.counts.txt",sep = "\t",header = TRUE,row.names = 1)
OV_CD8.data <- read.table("D:/GSE156728/GSM4743199_OV_10X.CD8.counts.txt",sep = "\t",header = TRUE,row.names = 1)
FTC_CD8.data <- read.table("D:/GSE156728/GSM4743231_FTC_10X.CD8.counts.txt",sep = "\t",header = TRUE,row.names = 1)
CHOL_CD8.data <- read.table("D:/GSE156728/GSM4743237_CHOL_SS2.CD8.counts.txt",sep = "\t",header = TRUE,row.names = 1)
for (i in 1:length(colnames(BC_CD4.data))) {
colnames(BC_CD4.data)[i] <- paste(colnames(BC_CD4.data)[i],"BC_CD4",i,sep = "-")
}
for (i in 1:length(colnames(BCL_CD4.data))) {
colnames(BCL_CD4.data)[i] <- paste(colnames(BCL_CD4.data)[i],"BCL_CD4",i,sep = "-")
}
for (i in 1:length(colnames(ESCA_CD4.data))) {
colnames(ESCA_CD4.data)[i] <- paste(colnames(ESCA_CD4.data)[i],"ESCA_CD4",i,sep = "-")
}
for (i in 1:length(colnames(MM_CD4.data))) {
colnames(MM_CD4.data)[i] <- paste(colnames(MM_CD4.data)[i],"MM_CD4",i,sep = "-")
}
for (i in 1:length(colnames(PACA_CD4.data))) {
colnames(PACA_CD4.data)[i] <- paste(colnames(PACA_CD4.data)[i],"PACA_CD4",i,sep = "-")
}
for (i in 1:length(colnames(RC_CD4.data))) {
colnames(RC_CD4.data)[i] <- paste(colnames(RC_CD4.data)[i],"RC_CD4",i,sep = "-")
}
for (i in 1:length(colnames(THCA_CD4.data))) {
colnames(THCA_CD4.data)[i] <- paste(colnames(THCA_CD4.data)[i],"THCA_CD4",i,sep = "-")
}
for (i in 1:length(colnames(UCEC_CD4.data))) {
colnames(UCEC_CD4.data)[i] <- paste(colnames(UCEC_CD4.data)[i],"UCEC_CD4",i,sep = "-")
}
for (i in 1:length(colnames(OV_CD4.data))) {
colnames(OV_CD4.data)[i] <- paste(colnames(OV_CD4.data)[i],"OV_CD4",i,sep = "-")
}
for (i in 1:length(colnames(FTC_CD4.data))) {
colnames(FTC_CD4.data)[i] <- paste(colnames(FTC_CD4.data)[i],"FTC_CD4",i,sep = "-")
}
for (i in 1:length(colnames(CHOL_CD4.data))) {
colnames(CHOL_CD4.data)[i] <- paste(colnames(CHOL_CD4.data)[i],"CHOL_CD4",i,sep = "-")
}
for (i in 1:length(colnames(BC_CD8.data))) {
colnames(BC_CD8.data)[i] <- paste(colnames(BC_CD8.data)[i],"BC_CD8",i,sep = "-")
}
for (i in 1:length(colnames(BCL_CD8.data))) {
colnames(BCL_CD8.data)[i] <- paste(colnames(BCL_CD8.data)[i],"BCL_CD8",i,sep = "-")
}
for (i in 1:length(colnames(ESCA_CD8.data))) {
colnames(ESCA_CD8.data)[i] <- paste(colnames(ESCA_CD8.data)[i],"ESCA_CD8",i,sep = "-")
}
for (i in 1:length(colnames(MM_CD8.data))) {
colnames(MM_CD8.data)[i] <- paste(colnames(MM_CD8.data)[i],"MM_CD8",i,sep = "-")
}
for (i in 1:length(colnames(PACA_CD8.data))) {
colnames(PACA_CD8.data)[i] <- paste(colnames(PACA_CD8.data)[i],"PACA_CD8",i,sep = "-")
}
for (i in 1:length(colnames(RC_CD8.data))) {
colnames(RC_CD8.data)[i] <- paste(colnames(RC_CD8.data)[i],"RC_CD8",i,sep = "-")
}
for (i in 1:length(colnames(THCA_CD8.data))) {
colnames(THCA_CD8.data)[i] <- paste(colnames(THCA_CD8.data)[i],"THCA_CD8",i,sep = "-")
}
for (i in 1:length(colnames(UCEC_CD8.data))) {
colnames(UCEC_CD8.data)[i] <- paste(colnames(UCEC_CD8.data)[i],"UCEC_CD8",i,sep = "-")
}
for (i in 1:length(colnames(OV_CD8.data))) {
colnames(OV_CD8.data)[i] <- paste(colnames(OV_CD8.data)[i],"OV_CD8",i,sep = "-")
}
for (i in 1:length(colnames(FTC_CD8.data))) {
colnames(FTC_CD8.data)[i] <- paste(colnames(FTC_CD8.data)[i],"FTC_CD8",i,sep = "-")
}
for (i in 1:length(colnames(CHOL_CD8.data))) {
colnames(CHOL_CD8.data)[i] <- paste(colnames(CHOL_CD8.data)[i],"CHOL_CD8",i,sep = "-")
}
A<-cbind(BC_CD4.data,ESCA_CD4.data,FTC_CD4.data,OV_CD4.data,PACA_CD4.data,RC_CD4.data,THCA_CD4.data,UCEC_CD4.data,
BC_CD8.data,ESCA_CD8.data,FTC_CD8.data,OV_CD8.data,PACA_CD8.data,RC_CD8.data,THCA_CD8.data,UCEC_CD8.data)
B<-cbind(BCL_CD4.data,MM_CD4.data,
BCL_CD8.data,MM_CD8.data)
remove(BC_CD4.data,ESCA_CD4.data,FTC_CD4.data,OV_CD4.data,PACA_CD4.data,RC_CD4.data,THCA_CD4.data,UCEC_CD4.data,
BC_CD8.data,ESCA_CD8.data,FTC_CD8.data,OV_CD8.data,PACA_CD8.data,RC_CD8.data,THCA_CD8.data,UCEC_CD8.data,
BCL_CD4.data,MM_CD4.data,
BCL_CD8.data,MM_CD8.data)
#C<-intersect(rownames(A),rownames(B))
#B_new<-B[C,]
#D<-cbind(A,B_new)
#E<-intersect(rownames(D),rownames(CHOL_CD4.data))
#D_new<-D[E,]
#CHOL_CD4.data_new<-CHOL_CD4.data[E,]
#F<-cbind(D_new,CHOL_CD4.data_new)
#remove(BC_CD4.data,BCL_CD4.data,CHOL_CD4.data,CHOL_CD4.data_new,ESCA_CD4.data,FTC_CD4.data,MM_CD4.data,OV_CD4.data,PACA_CD4.data,RC_CD4.data,THCA_CD4.data,UCEC_CD4.data,C,E,i,B_new,D_new)
metadata<-read.table("D:/GSE156728/GSE156728_metadata.txt",sep = "\t",header = TRUE,row.names = 1)
G<-as.data.frame(colnames(A))
colnames(G)<-"A"
library(tidyr)
H<-separate(G,A,into = c("A","B","C"),sep = "-")
K<-separate(H,B,into = c("B","D"),sep = "_")
I<-intersect(K$A,rownames(metadata))
metadata_new<-metadata[I,]
rownames(K)<-K$A
K_new<-K[rownames(metadata_new),]
J<-cbind(metadata_new,K_new)
rownames(J)<-colnames(A)
remove(metadata,metadata_new,G,H,K,K_new)
remove(I)
pbmc <- CreateSeuratObject(counts = A, project = "pbmc3k", min.cells = 3, min.features = 200,meta.data = J )
remove(A,J)
pbmc[["percent.mt"]] <- PercentageFeatureSet(pbmc, pattern = "^MT-")
pbmc <- NormalizeData(pbmc)
pbmc <- FindVariableFeatures(pbmc, selection.method = "vst", nfeatures = 2000)
all.genes <- rownames(pbmc)
pbmc <- ScaleData(pbmc, features = all.genes)
pbmc <- RunPCA(pbmc, features = VariableFeatures(object = pbmc))
ElbowPlot(pbmc)
pbmc <- FindNeighbors(pbmc, dims = 1:31)
pbmc <- FindClusters(pbmc, resolution = 1)
pbmc <- RunUMAP(pbmc, dims = 1:31)
DimPlot(pbmc, reduction = "umap",label = TRUE)
Idents(pbmc)<[email protected]$D
pbmc_CD8<-subset(pbmc,idents = "CD8")
pbmc_CD4<-subset(pbmc,idents = "CD4")
pbmc_CD4 <- RunPCA(pbmc_CD4, features = VariableFeatures(object = pbmc_CD4))
ElbowPlot(pbmc_CD4)
pbmc_CD4 <- FindNeighbors(pbmc_CD4, dims = 1:31)
pbmc_CD4 <- FindClusters(pbmc_CD4, resolution = 1)
pbmc_CD4 <- RunUMAP(pbmc_CD4, dims = 1:31)
DimPlot(pbmc_CD4, reduction = "umap",label = TRUE)
VlnPlot(pbmc_CD4,features = "FOXP3",sort = TRUE,pt.size = 0)
FeaturePlot(pbmc_CD4,features = "FOXP3",label = TRUE)
Idents(pbmc_CD4)<[email protected]$meta.cluster
DimPlot(pbmc_CD4)
VlnPlot(pbmc_CD4,features = "FOXP3",sort = TRUE,pt.size = 0)
FeaturePlot(pbmc_CD4,features = "FOXP3",label = TRUE)
Idents(pbmc)<[email protected]$meta.cluster
VlnPlot(pbmc,features = "FOXP3",sort = TRUE,pt.size = 0)
FeaturePlot(pbmc,features = "FOXP3",label = TRUE)
remove(B,CHOL_CD4.data,CHOL_CD8.data,i,all.genes)
#Treg<-subset(pbmc_CD4,idents = c("CD4.c21.Treg.OAS1","CD4.c20.Treg.TNFRSF9","CD4.c19.Treg.S1PR1","CD4.c18.Treg.RTKN2","CD4.c23.Mix.NME1","CD4.c24.Mix.NME2"))
Treg<-subset(pbmc_CD4,idents = c("CD4.c21.Treg.OAS1","CD4.c20.Treg.TNFRSF9","CD4.c19.Treg.S1PR1","CD4.c18.Treg.RTKN2"))
Idents(pbmc_CD8)<[email protected]$meta.cluster
VlnPlot(pbmc_CD8,features = "IFNG",sort = TRUE,pt.size = 0)
#pbmc_CD8_IFNG<-subset(pbmc_CD8,idents = c("CD8.c11.Tex.PDCD1","CD8.c13.Tex.myl12a","CD8.c12.Tex.CXCL13"))
pbmc_CD8_IFNG<-subset(pbmc_CD8,idents = c("CD8.c11.Tex.PDCD1","CD8.c13.Tex.myl12a"))
Idents(pbmc_CD8_IFNG)<[email protected]$loc
pbmc_CD8_T<-subset(pbmc_CD8_IFNG,idents = "T")
remove(pbmc,pbmc_CD4)
Idents(Treg)<[email protected]$loc
Treg_T<-subset(Treg,idents = "T")
#remove(Treg)
Idents(pbmc_CD8_T)<[email protected]$patient
Idents(Treg_T)<[email protected]$patient
patient<-unique([email protected]$patient)
for (i in 1:length(patient)) {
assign(paste("Treg_",i,"_TIL",sep = ""),subset(Treg_T,idents = patient[i]))
assign("a",slot(get(paste("Treg_",i,"_TIL",sep = "")),"assays"))
assign("b",as.data.frame(t(as.data.frame([email protected]))))
assign("c",select(b,one_of("JMJD1C")))
assign(paste("pbmc_CD8T_",i,"_TIL",sep = ""),subset(pbmc_CD8_T,idents = patient[i]))
assign("d",slot(get(paste("pbmc_CD8T_",i,"_TIL",sep = "")),"assays"))
assign("e",as.data.frame(t(as.data.frame([email protected]))))
assign("f",select(e,one_of("IFNG")))
assign(paste("scaldata_",i,"_TIL",sep = ""),data.frame(mean(c$JMJD1C),mean(f$IFNG)))
}
scaldata<-scaldata_1_TIL
for (i in 2:length(patient)) {
scaldata<-rbind(scaldata,get(paste("scaldata_",i,"_TIL",sep = "")))
}
colnames(scaldata)<-c("JMJD1C","IFNG_CD8")
library(ggplot2)
library(ggpubr)
ggplot(data = scaldata,aes(x=JMJD1C,y=IFNG_CD8)) + geom_point(color="blue",size=3.4) + stat_smooth(method = "lm",se=TRUE,size=1.5,color="red")+stat_cor(data = scaldata,method = "spearman") + theme_set(theme_bw()) + theme_set(theme_bw())
remove(pbmc_CD8T_1_TIL,pbmc_CD8T_10_TIL,pbmc_CD8T_11_TIL,pbmc_CD8T_12_TIL,pbmc_CD8T_13_TIL,pbmc_CD8T_14_TIL,pbmc_CD8T_15_TIL,pbmc_CD8T_16_TIL,pbmc_CD8T_17_TIL,pbmc_CD8T_18_TIL,pbmc_CD8T_19_TIL,pbmc_CD8T_2_TIL,
pbmc_CD8T_20_TIL,pbmc_CD8T_21_TIL,pbmc_CD8T_22_TIL,pbmc_CD8T_23_TIL,pbmc_CD8T_24_TIL,pbmc_CD8T_25_TIL,pbmc_CD8T_26_TIL,pbmc_CD8T_27_TIL,pbmc_CD8T_28_TIL,pbmc_CD8T_29_TIL,pbmc_CD8T_3_TIL,pbmc_CD8T_30_TIL,pbmc_CD8T_31_TIL,pbmc_CD8T_32_TIL,pbmc_CD8T_33_TIL,pbmc_CD8T_34_TIL,pbmc_CD8T_35_TIL,pbmc_CD8T_36_TIL,pbmc_CD8T_37_TIL,pbmc_CD8T_38_TIL,pbmc_CD8T_39_TIL,
pbmc_CD8T_4_TIL,pbmc_CD8T_40_TIL,pbmc_CD8T_41_TIL,pbmc_CD8T_42_TIL,pbmc_CD8T_5_TIL,pbmc_CD8T_6_TIL,pbmc_CD8T_7_TIL,pbmc_CD8T_8_TIL,pbmc_CD8T_9_TIL)
remove(Treg_1_TIL,Treg_10_TIL,Treg_11_TIL,Treg_12_TIL,Treg_13_TIL,Treg_14_TIL,Treg_15_TIL,Treg_16_TIL,Treg_17_TIL,Treg_18_TIL,Treg_19_TIL,Treg_2_TIL,
Treg_20_TIL,Treg_21_TIL,Treg_22_TIL,Treg_23_TIL,Treg_24_TIL,Treg_25_TIL,Treg_26_TIL,Treg_27_TIL,Treg_28_TIL,Treg_29_TIL,Treg_3_TIL,Treg_30_TIL,Treg_31_TIL,Treg_32_TIL,Treg_33_TIL,Treg_34_TIL,Treg_35_TIL,Treg_36_TIL,Treg_37_TIL,Treg_38_TIL,Treg_39_TIL,
Treg_4_TIL,Treg_40_TIL,Treg_41_TIL,Treg_42_TIL,Treg_5_TIL,Treg_6_TIL,Treg_7_TIL,Treg_8_TIL,Treg_9_TIL)
remove(scaldata_1_TIL,scaldata_10_TIL,scaldata_11_TIL,scaldata_12_TIL,scaldata_13_TIL,scaldata_14_TIL,scaldata_15_TIL,scaldata_16_TIL,scaldata_17_TIL,scaldata_18_TIL,scaldata_19_TIL,scaldata_2_TIL,
scaldata_20_TIL,scaldata_21_TIL,scaldata_22_TIL,scaldata_23_TIL,scaldata_24_TIL,scaldata_25_TIL,scaldata_26_TIL,scaldata_27_TIL,scaldata_28_TIL,scaldata_29_TIL,scaldata_3_TIL,scaldata_30_TIL,scaldata_31_TIL,scaldata_32_TIL,scaldata_33_TIL,scaldata_34_TIL,scaldata_35_TIL,scaldata_36_TIL,scaldata_37_TIL,scaldata_38_TIL,scaldata_39_TIL,
scaldata_4_TIL,scaldata_40_TIL,scaldata_41_TIL,scaldata_42_TIL,scaldata_5_TIL,scaldata_6_TIL,scaldata_7_TIL,scaldata_8_TIL,scaldata_9_TIL)
#write.table(scaldata,file = "D:/GSE156728/1C_TregIFNG.txt",sep = "\t")