点图

  1. GOinfo <- read_tsv("go.tb")
  2. emapper <- read_tsv("pep.diamond.emapper.annotations", comment = "##") %>% rename(query = "#query")
  3. # 读取时去掉`##`开头的行,而`#query`开头的行作为表头
  4. GOannotation <- emapper %>%
  5. dplyr::select(GID = query, GO = GOs) %>%
  6. dplyr::filter(GO != "-") %>%
  7. separate_rows(GO, sep = ",") %>%
  8. left_join(GOinfo, by = "GO") %>%
  9. dplyr::select(-Description)
  10. # genelist 赋值自己的基因集向量
  11. enrich <- enricher(genelist,
  12. TERM2GENE = GOannotation[c(2,1)],
  13. TERM2NAME = GOinfo[1:2])
  14. enrich2 <- as_tibble(enrich) %>%
  15. left_join(distinct(select(GOannotation, GO, level)), by = c("ID" = "GO")) %>%
  16. mutate(GeneRatio = as.numeric(str_replace(GeneRatio, "/.*", "")) / as.numeric(str_replace(GeneRatio, ".*/", ""))) %>%
  17. filter(!is.na(level)) %>%
  18. mutate(DescriptionLevel = str_c(Description, " | ", level))
  19. DescriptionOrder <- enrich2 %>%
  20. arrange(desc(level), GeneRatio) %>%
  21. .$DescriptionLevel
  22. # 排序
  23. enrich2$DescriptionLevel <- factor(enrich2$DescriptionLevel, levels = DescriptionOrder)
  24. p <- enrich2 %>%
  25. filter(GeneRatio > 0.03) %>%
  26. ggplot() +
  27. geom_point(aes(GeneRatio, DescriptionLevel, color = pvalue, size = -pvalue)) +
  28. scale_color_gradient(low = "red", high = "blue") +
  29. theme_bw()
  30. pdf(gofile, width = 8, height = 9)
  31. print(p)
  32. dev.off()