# LUAD: sample IDs of the patients that carry an ALK mutation.
# NOTE(review): rm(list = ls()) wipes the global environment of whoever
# sources this script; it is kept only so the script behaves as before.
rm(list = ls())
# Load the prepared TCGA lung objects; this section expects the file to
# provide luad_mc3 and LUNG_survival_data.
load(file = "./Rawdata/TCGA_LUNG_id_exp_sur.RData")
library(stringr)

# Keep only the gene symbol and the tumour barcode of each mutation record.
luad_mut <- as.data.frame(luad_mc3@data)
luad_mut <- luad_mut[, c("Hugo_Symbol", "Tumor_Sample_Barcode")]

# Unique barcodes (first-occurrence order) with a mutation in the gene(s)
# of interest.
luad_genes <- c("ALK")
luad_hit <- luad_mut$Hugo_Symbol %in% luad_genes
luad_barcode <- unique(as.character(luad_mut$Tumor_Sample_Barcode[luad_hit]))

# Rebuild every ID as "<field1>-<field2>-<field3>-01" from the first three
# "-"-separated barcode fields. drop = FALSE keeps a matrix when only one
# barcode matched, and the length check covers the case of no match at all;
# the ID vector is built in one vectorised paste() so it never contains
# placeholder values.
if (length(luad_barcode) > 0) {
  luad_field <- str_split(luad_barcode, "-", simplify = TRUE)
  luad_field <- luad_field[, 1:3, drop = FALSE]
  luad_id <- paste(
    luad_field[, 1], luad_field[, 2], luad_field[, 3], "01",
    sep = "-"
  )
} else {
  luad_id <- character(0)
}

# Manual correction carried over from the original script: the 14th ID is
# stored with the "-02" suffix instead of "-01".
# NOTE(review): presumably the 14th ALK-mutated barcode belongs to patient
# TCGA-50-5946 and its sample type is 02 -- confirm against the MAF. Reading
# the sample type from the 4th barcode field would remove the need for this
# positional fix.
# The guard stops the override from overwriting a different patient, or from
# adding a sample without an ALK mutation, when the input order or size
# differs from what the original script assumed.
luad_fix_pos <- 14L
luad_fix_id <- "TCGA-50-5946-02"
if (length(luad_id) >= luad_fix_pos &&
    startsWith(luad_id[luad_fix_pos], "TCGA-50-5946-")) {
  luad_id[luad_fix_pos] <- luad_fix_id
} else {
  warning(
    "Entry ", luad_fix_pos, " is not patient TCGA-50-5946; ",
    "the manual '", luad_fix_id, "' correction was not applied.",
    call. = FALSE
  )
}

# Keep only the samples that also appear in the survival table.
luad.alk.mu.id <- luad_id[luad_id %in% LUNG_survival_data$sample]
## LUSC: sample IDs of the patients that carry an ALK mutation.
# Same file as loaded for the LUAD section; the reload is redundant when the
# script runs top to bottom. This section expects the file to provide
# lusc_mc3 and LUNG_survival_data.
load(file = "./Rawdata/TCGA_LUNG_id_exp_sur.RData")
library(stringr)

# Keep only the gene symbol and the tumour barcode of each mutation record.
lusc_mut <- as.data.frame(lusc_mc3@data)
lusc_mut <- lusc_mut[, c("Hugo_Symbol", "Tumor_Sample_Barcode")]

# Unique barcodes (first-occurrence order) with a mutation in the gene(s)
# of interest.
lusc_genes <- c("ALK")
lusc_hit <- lusc_mut$Hugo_Symbol %in% lusc_genes
lusc_barcode <- unique(as.character(lusc_mut$Tumor_Sample_Barcode[lusc_hit]))

# Rebuild every ID as "<field1>-<field2>-<field3>-01" from the first three
# "-"-separated barcode fields. drop = FALSE keeps a matrix when only one
# barcode matched, and the length check covers the case of no match at all;
# the ID vector is built in one vectorised paste() so it never contains
# placeholder values.
if (length(lusc_barcode) > 0) {
  lusc_field <- str_split(lusc_barcode, "-", simplify = TRUE)
  lusc_field <- lusc_field[, 1:3, drop = FALSE]
  lusc_id <- paste(
    lusc_field[, 1], lusc_field[, 2], lusc_field[, 3], "01",
    sep = "-"
  )
} else {
  lusc_id <- character(0)
}

# Keep only the samples that also appear in the survival table.
lusc.alk.mu.id <- lusc_id[lusc_id %in% LUNG_survival_data$sample]

# Store both ID vectors together for later steps of the analysis.
save(luad.alk.mu.id, lusc.alk.mu.id, file = "./Rdata/luad.lusc.alk.muid.Rdata")