-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathconsensus_pathway_db.R
31 lines (24 loc) · 1.24 KB
/
consensus_pathway_db.R
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
library(data.table)
library(stringr)
read.data <- function(gene.set){
dt <- fread(paste0("/project_data/overlap_T2D_OA/pathway_analysis/ConsensusPathDb/", gene.set, "_ORA_results.tab")) %>%
.[, .(`p-value`, `q-value`, pathway, source, external_id, members_input_overlap, size, effective_size)]
dt.GO <- fread(paste0("/project_data/overlap_T2D_OA/pathway_analysis/ConsensusPathDb/", gene.set, "_GO_ORA_results.tab")) %>%
.[, source:="GO"] %>%
.[, .(`p-value`, `q-value`, pathway=term_name, source, external_id=term_goid, members_input_overlap=members_input_overlap_geneids, size, effective_size)]
dt <- rbind(dt, dt.GO) %>%
.[, `:=`(GeneSet=gene.set, N_genes=str_count(members_input_overlap, ";")+1)] %>%
dplyr::arrange(log(`q-value`))
setcolorder(dt, c(colnames(dt)[9], colnames(dt)[1:8]))
return(dt)
}
dt <- data.table()
for (gene.set in c("hc", "hc_knee", "hc_hip")) {
dt <- rbind(dt, read.data(gene.set))
fwrite(dt, "/project_data/overlap_T2D_OA/pathway_analysis/ConsensusPathDb/high_conf_genes.csv")
}
dt <- data.table()
for (gene.set in c("likely", "likely_knee", "likely_hip")){
dt <- rbind(dt, read.data(gene.set))
fwrite(dt, "/project_data/overlap_T2D_OA/pathway_analysis/ConsensusPathDb/likely_genes.csv")
}