# Collect the sample IDs of ALK-mutated tumors in the LUAD and LUSC cohorts,
# keep only those present in the survival table, and save both ID vectors.

library(stringr)

# Input data ----
# The RData file is expected to provide `luad_mc3`, `lusc_mc3` and
# `LUNG_survival_data`, which are used below.
load(file = "./Rawdata/TCGA_LUNG_id_exp_sur.RData")

# Helpers ----

#' Convert tumor sample barcodes to "<field1>-<field2>-<field3>-01" IDs
#'
#' Duplicated barcodes are dropped first (first occurrence wins), then the
#' first three "-"-separated fields of each barcode are kept and the suffix
#' "01" is appended.
#'
#' @param barcodes Character vector or factor of "-"-separated barcodes.
#' @return Character vector with one ID per distinct barcode, in order of
#'   first appearance; `character(0)` when `barcodes` is empty.
barcode_to_sample_id <- function(barcodes) {
  barcodes <- unique(as.character(barcodes))
  if (length(barcodes) == 0L) {
    return(character(0))
  }
  # drop = FALSE keeps a matrix even when there is a single barcode.
  fields <- str_split(barcodes, "-", simplify = TRUE)[, 1:3, drop = FALSE]
  paste(fields[, 1], fields[, 2], fields[, 3], "01", sep = "-")
}

#' Sample IDs of tumors carrying a mutation in any of `genes`
#'
#' @param maf S4 object whose `data` slot is a table with the columns
#'   `Hugo_Symbol` and `Tumor_Sample_Barcode` (presumably a maftools MAF
#'   object -- confirm).
#' @param genes Character vector of gene symbols to look for.
#' @param known_samples Sample IDs to keep; everything else is discarded.
#' @param overrides Named character vector mapping a generated ID (name) to
#'   the ID that should replace it (value). Defaults to no replacement.
#' @return Character vector of sample IDs found in `known_samples`.
mutated_sample_ids <- function(maf, genes, known_samples,
                               overrides = character(0)) {
  calls <- as.data.frame(maf@data)
  carries_mutation <- calls$Hugo_Symbol %in% genes
  ids <- barcode_to_sample_id(calls$Tumor_Sample_Barcode[carries_mutation])

  # Apply manual corrections by ID rather than by position, so they do not
  # depend on the row order of the mutation table.
  to_fix <- ids %in% names(overrides)
  ids[to_fix] <- unname(overrides[ids[to_fix]])

  ids[ids %in% known_samples]
}

# Mutated sample IDs ----
target_genes <- c("ALK")

# NOTE(review): the previous version overwrote element 14 of the LUAD ID
# vector with "TCGA-50-5946-02". This assumes that position held patient
# TCGA-50-5946 (i.e. that patient's sample carries the "-02" suffix instead
# of "-01") -- confirm against the data.
luad_overrides <- c("TCGA-50-5946-01" = "TCGA-50-5946-02")

## LUAD
luad.alk.mu.id <- mutated_sample_ids(
  luad_mc3,
  genes = target_genes,
  known_samples = LUNG_survival_data$sample,
  overrides = luad_overrides
)

## LUSC
lusc.alk.mu.id <- mutated_sample_ids(
  lusc_mc3,
  genes = target_genes,
  known_samples = LUNG_survival_data$sample
)

# Output ----
save(
  luad.alk.mu.id, lusc.alk.mu.id,
  file = "./Rdata/luad.lusc.alk.muid.Rdata"
)