Open files

Note: due to pairwise ordering from another file (tissue_specific_tDMRs), tDMRs labeled as "hypermethylated" are actually hypomethylated in the lung and kidney.

# Library
# Tissue-specific tDMR / H3K27ac overlap tables. The files are read without a
# header row, so columns are addressed as V1, V2, ... further down.
# NOTE(review): every object keeps the "heart_specific" prefix, but only the
# first one reads the heart file; the trailing HEART/KIDNEY/LIVER/LUNG suffix
# is what matches the tissue of the file that is actually loaded.
human_chimp_heart_specific_25_conserved_H3K27_HEART <- read.delim(
  file = "~/Desktop/Regulatory_Evol/ashlar-trial/data/overlap_reg/overlap_25/human_chimp_heart_specific_25_conserved_H3K27_HEART.bed",
  header = FALSE,
  stringsAsFactors = FALSE
)

human_chimp_heart_specific_25_conserved_H3K27_KIDNEY <- read.delim(
  file = "~/Desktop/Regulatory_Evol/ashlar-trial/data/overlap_reg/overlap_25/human_chimp_kidney_specific_25_conserved_H3K27_KIDNEY.bed",
  header = FALSE,
  stringsAsFactors = FALSE
)

human_chimp_heart_specific_25_conserved_H3K27_LIVER <- read.delim(
  file = "~/Desktop/Regulatory_Evol/ashlar-trial/data/overlap_reg/overlap_25/human_chimp_liver_specific_25_conserved_H3K27_LIVER.bed",
  header = FALSE,
  stringsAsFactors = FALSE
)

human_chimp_heart_specific_25_conserved_H3K27_LUNG <- read.delim(
  file = "~/Desktop/Regulatory_Evol/ashlar-trial/data/overlap_reg/overlap_25/human_chimp_lung_specific_25_conserved_H3K27_LUNG.bed",
  header = FALSE,
  stringsAsFactors = FALSE
)

# TSS table (the file carries an .R extension but is parsed as delimited text).
refGene_hg19_TSS <- read.delim(
  file = "~/Desktop/Regulatory_Evol/ashlar-trial/data/overlap_reg/overlap_25/refGene_hg19_TSS.R",
  header = FALSE,
  stringsAsFactors = FALSE
)

# Adjust so that bedtools will accept it: shift the third column up by one.
refGene_hg19_TSS[[3]] <- refGene_hg19_TSS[[3]] + 1

# Now sort

##    bedtools closest -a /var/folders/rf/qrcw6ncj05z1pc_pq9xzw3540000gn/T//RtmpXK3I56/a_bc557225e1f3.bed -b /var/folders/rf/qrcw6ncj05z1pc_pq9xzw3540000gn/T//RtmpXK3I56/b_bc5530e100bf.bed
# Sort based on upstream/downstream
# Rows whose V9 is "+" are labelled upstream, rows whose V9 is "-" downstream
# (V9 is presumably the strand column -- TODO confirm). which() keeps rows with
# a missing V9 out of both tables.

closest_heart_upstream <- local({
  plus_rows <- which(closest_heart$V9 == "+")
  closest_heart[plus_rows, ]
})
closest_heart_downstream <- local({
  minus_rows <- which(closest_heart$V9 == "-")
  closest_heart[minus_rows, ]
})

# Signed distance between V3 and V5; the operand order is flipped for the
# "-" rows.
distance_heart_upstream <- local({
  up <- closest_heart_upstream
  as.numeric(up$V3) - as.numeric(up$V5)
})
distance_heart_downstream <- local({
  down <- closest_heart_downstream
  as.numeric(down$V5) - as.numeric(down$V3)
})

# Now sort

# Now sort

# Sort based on upstream/downstream
# NOTE(review): the liver tables are sliced from `closest_heart`, not from a
# liver-named object -- confirm that `closest_heart` holds the liver
# closest-gene result at this point in the script.

closest_liver_upstream <- local({
  plus_rows <- which(closest_heart$V9 == "+")
  closest_heart[plus_rows, ]
})
closest_liver_downstream <- local({
  minus_rows <- which(closest_heart$V9 == "-")
  closest_heart[minus_rows, ]
})

# Signed distance between V3 and V5; the operand order is flipped for the
# "-" rows.
distance_liver_upstream <- local({
  up <- closest_liver_upstream
  as.numeric(up$V3) - as.numeric(up$V5)
})
distance_liver_downstream <- local({
  down <- closest_liver_downstream
  as.numeric(down$V5) - as.numeric(down$V3)
})

# Share of distances that are strictly positive (NA distances are never
# counted as positive but still count in the denominator).
sum(distance_liver_upstream > 0, na.rm = TRUE) / length(distance_liver_upstream)
## [1] 0.6512043
sum(distance_liver_downstream > 0, na.rm = TRUE) / length(distance_liver_downstream)
## [1] 0.6230032

# Pool the heart and liver distances into one vector.
all_distance <- c(
  distance_heart_upstream,
  distance_heart_downstream,
  distance_liver_upstream,
  distance_liver_downstream
)
##    Min. 1st Qu.  Median    Mean 3rd Qu.    Max. 
## -805181   -7548    1690   13079   31168  999526


# Now sort

# Sort based on upstream/downstream
# Rows whose V9 is "+" are labelled upstream, rows whose V9 is "-" downstream.

closest_heart_upstream <- local({
  plus_rows <- which(closest_heart$V9 == "+")
  closest_heart[plus_rows, ]
})
closest_heart_downstream <- local({
  minus_rows <- which(closest_heart$V9 == "-")
  closest_heart[minus_rows, ]
})

# Signed distance between V3 and V5; the operand order is flipped for the
# "-" rows.
distance_heart_upstream <- local({
  up <- closest_heart_upstream
  as.numeric(up$V3) - as.numeric(up$V5)
})
distance_heart_downstream <- local({
  down <- closest_heart_downstream
  as.numeric(down$V5) - as.numeric(down$V3)
})

# Share of distances that are strictly positive (NA distances are never
# counted as positive but still count in the denominator).
sum(distance_heart_upstream > 0, na.rm = TRUE) / length(distance_heart_upstream)
## [1] 0.673913
sum(distance_heart_downstream > 0, na.rm = TRUE) / length(distance_heart_downstream)
## [1] 0.5714286

Separate into hypermethylated and overlapping H3K27ac


# Find the heart hypo
# Keep rows of the HEART table whose V4 label is "hyper" and whose V6 is not
# "-1" (presumably the no-overlap marker -- TODO confirm).
# The row filter has to be computed on the same table that is being subset;
# it was previously computed on the LIVER table, which selected heart rows by
# the row positions of unrelated liver records.
# NOTE(review): the liver section filters on "hypo" while this one filters on
# "hyper"; per the note at the top of the file the label is inverted only for
# lung and kidney -- confirm "hyper" is the intended label for heart.
heart_hypo <- local({
  heart_tdmr <- human_chimp_heart_specific_25_conserved_H3K27_HEART
  heart_tdmr[which(heart_tdmr$V4 == "hyper" & heart_tdmr$V6 != "-1"), ]
})

# Drop any record that has a missing value in any column.
heart_hypo <- heart_hypo[complete.cases(heart_hypo), ]

# Find the closest gene

# Convert the gene name to ensg
# gene_id is a comma-separated lookup table with a header row; it is joined on
# its `Gene` column and supplies the `ensg` column used further down.

gene_id <- read.table(
  file = "../../../Reg_Evo_Primates/data/ENSG_GENE_HG19.csv",
  header = TRUE,
  sep = ",",
  stringsAsFactors = FALSE
)

# Inner join of the closest-gene table (key V8) with the lookup (key Gene);
# closest-gene rows without a match in gene_id are dropped.
# NOTE(review): the result is called comb_kidney even in this heart section.
comb_kidney <- merge(
  x = closest_heart,
  y = gene_id,
  by.x = "V8",
  by.y = "Gene"
)

##  [1] "ENSG00000196839" "ENSG00000163050" "ENSG00000178878"
##  [4] "ENSG00000130762" "ENSG00000168646" "ENSG00000110092"
##  [7] "ENSG00000106554" "ENSG00000134871" "ENSG00000244274"
## [10] "ENSG00000244274" "ENSG00000135636" "ENSG00000135636"
## [13] "ENSG00000135636" "ENSG00000135636" "ENSG00000135636"
## [16] "ENSG00000135636" "ENSG00000135636" "ENSG00000108001"
## [19] "ENSG00000187773" "ENSG00000139132" "ENSG00000153303"
## [22] "ENSG00000143641" "ENSG00000144596" "ENSG00000115756"
## [25] "ENSG00000197081" "ENSG00000185507" "ENSG00000123104"
## [28] "ENSG00000127528" "ENSG00000106003" "ENSG00000107902"
## [31] "ENSG00000107902" "ENSG00000183060" "ENSG00000068305"
## [34] "ENSG00000068305" "ENSG00000068305" "ENSG00000068305"
## [37] "ENSG00000120254" "ENSG00000120254" "ENSG00000120254"
## [40] "ENSG00000133454" "ENSG00000124785" "ENSG00000162407"
## [43] "ENSG00000107263" "ENSG00000159788" "ENSG00000138835"
## [46] "ENSG00000064932" "ENSG00000104969" "ENSG00000130147"
## [49] "ENSG00000156222" "ENSG00000156222" "ENSG00000156222"
## [52] "ENSG00000156222" "ENSG00000095637" "ENSG00000095637"
## [55] "ENSG00000185594" "ENSG00000065882" "ENSG00000109927"
## [58] "ENSG00000100726" "ENSG00000185361" "ENSG00000198795"
## [61] "ENSG00000198597" "ENSG00000141579" "ENSG00000070476"
## [64] "ENSG00000070476"
# Convert the TSS to ensg as well

# Inner join of the TSS table (key V5) with the gene lookup (key Gene).
ref_gene_hg19_ensg <- merge(
  x = refGene_hg19_TSS,
  y = gene_id,
  by.x = "V5",
  by.y = "Gene"
)

# Background set: each distinct ENSG id present in the joined TSS table.
all_ref_gene_hg19_ensg <- unique(ref_gene_hg19_ensg$ensg)

# TRUE for every background gene that also appears in the closest-gene table.
heart_ref_gene <- all_ref_gene_hg19_ensg %in% comb_kidney$ensg

# Revisions- run GO
# Merge ENSG with true/false: a 0/1 vector named by ENSG id, in the shape
# passed to topGO as allGenes below.

test_gene <- setNames(as.numeric(heart_ref_gene), all_ref_gene_hg19_ensg)

# Run topGO
# Build the topGOdata object for Biological Process terms. `test_gene` is a
# named 0/1 vector; geneSel flags the genes with a score above 0 as the genes
# of interest. The call previously did not parse: the geneSel function was
# never closed and the annotationFun / mapping values were blank.
go_data <- new("topGOdata",
  ontology = "BP",
  allGenes = test_gene,
  geneSel = function(allScore) {
    allScore > 0
  },
  nodeSize = 5,
  # The gene names are human Ensembl (ENSG) ids, so annotate through the
  # org.Hs.eg.db mapping.
  # NOTE(review): these two values were restored from the topGO annFUN.org
  # interface -- confirm they match the original analysis.
  annotationFun = annFUN.org,
  mapping = "org.Hs.eg.db",
  ID = "ensembl"
)

# Enrichment test: weight01 algorithm with the Fisher statistic.
go_test <- runTest(go_data, algorithm = "weight01", statistic = "fisher")

# Report every term whose weight01 score is below 0.05, ordered by that score.
go_table <- GenTable(go_data,
  weightFisher = go_test,
  orderBy = "weightFisher", ranksOf = "weightFisher",
  topNodes = sum(score(go_test) < .05)
)

##          GO.ID                                        Term Annotated
## 1   GO:0009113      purine nucleobase biosynthetic process        12
## 2   GO:0033197                       response to vitamin E        12
## 3   GO:0006351                transcription, DNA-templated      3277
## 4   GO:0032007        negative regulation of TOR signaling        40
## 5   GO:0043547      positive regulation of GTPase activity       354
## 6   GO:0060070             canonical Wnt signaling pathway       274
## 7   GO:1903078 positive regulation of protein localizat...        46
## 8   GO:0071320                   cellular response to cAMP        47
## 9   GO:0006501               C-terminal protein lipidation        62
## 10  GO:0007386           compartment pattern specification         5
## 11  GO:0070375                                ERK5 cascade         5
## 12  GO:0042321 negative regulation of circadian sleep/w...         5
## 13  GO:0009146 purine nucleoside triphosphate catabolic...         5
## 14  GO:0060509           Type I pneumocyte differentiation         5
## 15  GO:0046060                      dATP metabolic process         5
## 16  GO:0009256 10-formyltetrahydrofolate metabolic proc...         5
## 17  GO:0048541                   Peyer's patch development         5
## 18  GO:0009168 purine ribonucleoside monophosphate bios...        66
## 19  GO:0006863                 purine nucleobase transport         6
## 20  GO:0015942                   formate metabolic process         6
## 21  GO:0018242 protein O-linked glycosylation via serin...         6
## 22  GO:0001957                intramembranous ossification         6
## 23  GO:0060368 regulation of Fc receptor mediated stimu...         6
## 24  GO:0070141                            response to UV-A         6
## 25  GO:0038203                             TORC2 signaling         6
## 26  GO:0033632 regulation of cell-cell adhesion mediate...         6
## 27  GO:0060405               regulation of penile erection         6
## 28  GO:0009204 deoxyribonucleoside triphosphate catabol...         6
## 29  GO:0070244 negative regulation of thymocyte apoptot...         6
## 30  GO:0090630               activation of GTPase activity        76
## 31  GO:0002819      regulation of adaptive immune response       127
## 32  GO:0032261                   purine nucleotide salvage         7
## 33  GO:0018243 protein O-linked glycosylation via threo...         7
## 34  GO:0001778                      plasma membrane repair         7
## 35  GO:1903071 positive regulation of ER-associated ubi...         7
## 36  GO:0046654       tetrahydrofolate biosynthetic process         7
## 37  GO:0009120       deoxyribonucleoside metabolic process         7
## 38  GO:0019043              establishment of viral latency         7
## 39  GO:0048702        embryonic neurocranium morphogenesis         7
## 40  GO:1901642          nucleoside transmembrane transport         7
## 41  GO:2000109 regulation of macrophage apoptotic proce...         7
## 42  GO:0046130     purine ribonucleoside catabolic process         7
## 43  GO:0033601 positive regulation of mammary gland epi...         7
## 44  GO:0071499 cellular response to laminar fluid shear...         7
## 45  GO:0008277 regulation of G-protein coupled receptor...       120
## 46  GO:1904263      positive regulation of TORC1 signaling         8
## 47  GO:0038180       nerve growth factor signaling pathway         8
## 48  GO:0038063 collagen-activated tyrosine kinase recep...         8
## 49  GO:0060340 positive regulation of type I interferon...         8
## 50  GO:0072530 purine-containing compound transmembrane...         8
## 51  GO:0048703      embryonic viscerocranium morphogenesis         8
## 52  GO:0034127 regulation of MyD88-independent toll-lik...         8
## 53  GO:0008354                         germ cell migration         8
## 54  GO:0014807                 regulation of somitogenesis         8
## 55  GO:0045188 regulation of circadian sleep/wake cycle...         8
## 56  GO:0048387 negative regulation of retinoic acid rec...         8
## 57  GO:0002313 mature B cell differentiation involved i...        18
## 58  GO:0033089 positive regulation of T cell differenti...         9
## 59  GO:0002315        marginal zone B cell differentiation         9
## 60  GO:0035999            tetrahydrofolate interconversion         9
## 61  GO:0001821                         histamine secretion         9
## 62  GO:0003139         secondary heart field specification         9
## 63  GO:0039530                     MDA-5 signaling pathway         9
## 64  GO:0002634     regulation of germinal center formation         9
## 65  GO:0070255               regulation of mucus secretion         9
## 66  GO:0001889                           liver development       124
## 67  GO:0030282                         bone mineralization        93
## 68  GO:0002903 negative regulation of B cell apoptotic ...        10
## 69  GO:0070601       centromeric sister chromatid cohesion        10
## 70  GO:0046085                 adenosine metabolic process        10
## 71  GO:0042118                 endothelial cell activation        10
## 72  GO:0035414 negative regulation of catenin import in...        10
## 73  GO:0033033 negative regulation of myeloid cell apop...        11
## 74  GO:0001973        adenosine receptor signaling pathway        11
## 75  GO:0003413 chondrocyte differentiation involved in ...        11
## 76  GO:0033327                 Leydig cell differentiation        11
## 77  GO:0043249                      erythrocyte maturation        11
## 78  GO:1904293         negative regulation of ERAD pathway        12
## 79  GO:0045351      type I interferon biosynthetic process        12
## 80  GO:0055015 ventricular cardiac muscle cell developm...        12
## 81  GO:2000059 negative regulation of protein ubiquitin...        12
## 82  GO:0050862 positive regulation of T cell receptor s...        12
## 83  GO:0048311                  mitochondrion distribution        12
## 84  GO:0002281 macrophage activation involved in immune...        12
## 85  GO:0061430                bone trabecula morphogenesis        13
## 86  GO:0043650      dicarboxylic acid biosynthetic process        13
## 87  GO:0071361                cellular response to ethanol        13
## 88  GO:0032486             Rap protein signal transduction        13
## 89  GO:2000107 negative regulation of leukocyte apoptot...        39
## 90  GO:0036066               protein O-linked fucosylation        14
## 91  GO:0045725 positive regulation of glycogen biosynth...        15
## 92  GO:0060749          mammary gland alveolus development        15
## 93  GO:0001829        trophectodermal cell differentiation        15
## 94  GO:0006744             ubiquinone biosynthetic process        15
## 95  GO:0035023 regulation of Rho protein signal transdu...       118
## 96  GO:0051412                  response to corticosterone        16
## 97  GO:0051446 positive regulation of meiotic cell cycl...        16
## 98  GO:0072531 pyrimidine-containing compound transmemb...        16
## 99  GO:0055003                  cardiac myofibril assembly        16
## 100 GO:0009264       deoxyribonucleotide catabolic process        16
## 101 GO:0000122 negative regulation of transcription fro...       727
## 102 GO:0030111         regulation of Wnt signaling pathway       295
## 103 GO:0046386     deoxyribose phosphate catabolic process        17
## 104 GO:0045655      regulation of monocyte differentiation        17
## 105 GO:0071157    negative regulation of cell cycle arrest        18
## 106 GO:0032026                   response to magnesium ion        18
## 107 GO:0046655                folic acid metabolic process        18
## 108 GO:0007063     regulation of sister chromatid cohesion        19
## 109 GO:2000178 negative regulation of neural precursor ...        19
## 110 GO:0006139 nucleobase-containing compound metabolic...      5072
# Two-column table (GO id, weight01 Fisher score) taken from go_table. The
# right-hand side of this assignment was garbled and did not parse.
# NOTE(review): reconstructed from the two surviving arguments -- confirm.
go_table_heart <- data.frame(
  go_table$GO.ID,
  go_table$weightFisher,
  stringsAsFactors = FALSE
)

# Written without header, row names or quoting: one "GO.ID score" pair per line.
write.table(go_table_heart, "../data/go_table_heart.txt", quote = FALSE, row.names = FALSE, col.names = FALSE)

# Get names of the significant genes annotated to each reported GO term
# (the anonymous function had lost its braces and the sapply() call was never
# closed, so this statement did not parse).
sig.genes <- sigGenes(go_data)
goresults <- sapply(go_table$GO.ID, function(x) {
  # genesInTerm() returns a list with one element per requested term; only one
  # term is requested per call, so the first element is used.
  genes <- genesInTerm(go_data, x)
  genes[[1]][genes[[1]] %in% sig.genes]
})

# cardiac myofibril assembly, positive regulation of heart rate, regulation of monocyte differentiation
## $`GO:0055003`
## [1] "ENSG00000068305"
## $<NA>
## $`GO:0045655`
## [1] "ENSG00000185507"


# Find the kidney hypo tDMRs (the result is still stored in heart_hypo)
# Rows labelled "hyper" in V4 are kept because, per the note at the top of the
# file, that label marks hypomethylated tDMRs in kidney. Rows whose V6 is "-1"
# are excluded (presumably the no-overlap marker -- TODO confirm).
heart_hypo <- local({
  kidney_tdmr <- human_chimp_heart_specific_25_conserved_H3K27_KIDNEY
  kidney_tdmr[which(kidney_tdmr$V4 == "hyper" & kidney_tdmr$V6 != "-1"), ]
})

# Drop any record that has a missing value in any column.
heart_hypo <- heart_hypo[complete.cases(heart_hypo), ]
# Find the closest gene

# Convert the gene name to ensg
# gene_id is a comma-separated lookup table with a header row, joined on its
# `Gene` column.

gene_id <- read.table(
  file = "../../../Reg_Evo_Primates/data/ENSG_GENE_HG19.csv",
  header = TRUE,
  sep = ",",
  stringsAsFactors = FALSE
)

# Inner join of the closest-gene table (key V8) with the lookup (key Gene).
# NOTE(review): the closest-gene table is still called closest_heart in this
# kidney section -- confirm it holds the kidney result here.
comb_kidney <- merge(
  x = closest_heart,
  y = gene_id,
  by.x = "V8",
  by.y = "Gene"
)

##   [1] "ENSG00000081760" "ENSG00000198691" "ENSG00000100997"
##   [4] "ENSG00000100997" "ENSG00000117148" "ENSG00000169717"
##   [7] "ENSG00000169717" "ENSG00000139567" "ENSG00000145536"
##  [10] "ENSG00000134917" "ENSG00000105963" "ENSG00000162104"
##  [13] "ENSG00000164252" "ENSG00000063438" "ENSG00000063438"
##  [16] "ENSG00000110711" "ENSG00000196581" "ENSG00000196581"
##  [19] "ENSG00000179841" "ENSG00000053371" "ENSG00000151360"
##  [22] "ENSG00000178038" "ENSG00000178038" "ENSG00000106927"
##  [25] "ENSG00000159461" "ENSG00000089053" "ENSG00000138613"
##  [28] "ENSG00000138613" "ENSG00000198576" "ENSG00000147799"
##  [31] "ENSG00000116017" "ENSG00000029153" "ENSG00000029153"
##  [34] "ENSG00000029153" "ENSG00000029153" "ENSG00000029153"
##  [37] "ENSG00000117407" "ENSG00000117407" "ENSG00000117407"
##  [40] "ENSG00000126775" "ENSG00000126775" "ENSG00000068650"
##  [43] "ENSG00000068650" "ENSG00000068650" "ENSG00000068650"
##  [46] "ENSG00000241837" "ENSG00000241837" "ENSG00000158321"
##  [49] "ENSG00000158321" "ENSG00000183778" "ENSG00000183778"
##  [52] "ENSG00000183778" "ENSG00000183778" "ENSG00000183778"
##  [55] "ENSG00000128298" "ENSG00000125492" "ENSG00000125492"
##  [58] "ENSG00000125124" "ENSG00000050820" "ENSG00000127152"
##  [61] "ENSG00000127152" "ENSG00000110987" "ENSG00000110987"
##  [64] "ENSG00000116128" "ENSG00000162373" "ENSG00000165626"
##  [67] "ENSG00000165626" "ENSG00000122870" "ENSG00000122870"
##  [70] "ENSG00000136717" "ENSG00000136717" "ENSG00000136717"
##  [73] "ENSG00000136717" "ENSG00000136717" "ENSG00000136717"
##  [76] "ENSG00000136717" "ENSG00000136717" "ENSG00000136717"
##  [79] "ENSG00000136717" "ENSG00000136717" "ENSG00000136717"
##  [82] "ENSG00000136717" "ENSG00000136717" "ENSG00000136717"
##  [85] "ENSG00000136717" "ENSG00000136717" "ENSG00000136717"
##  [88] "ENSG00000136717" "ENSG00000136717" "ENSG00000125845"
##  [91] "ENSG00000101144" "ENSG00000104221" "ENSG00000165863"
##  [94] "ENSG00000109944" "ENSG00000109944" "ENSG00000173064"
##  [97] "ENSG00000235162" "ENSG00000089916" "ENSG00000089916"
## [100] "ENSG00000184601" "ENSG00000180336" "ENSG00000131943"
## [103] "ENSG00000175262" "ENSG00000128346" "ENSG00000185056"
## [106] "ENSG00000146521" "ENSG00000074410" "ENSG00000074410"
## [109] "ENSG00000158966" "ENSG00000198286" "ENSG00000130940"
## [112] "ENSG00000130940" "ENSG00000160200" "ENSG00000135736"
## [115] "ENSG00000168491" "ENSG00000168491" "ENSG00000109881"
## [118] "ENSG00000109881" "ENSG00000135127" "ENSG00000135127"
## [121] "ENSG00000135127" "ENSG00000110092" "ENSG00000138764"
## [124] "ENSG00000126353" "ENSG00000146731" "ENSG00000146731"
## [127] "ENSG00000112149" "ENSG00000112149" "ENSG00000198752"
## [130] "ENSG00000184661" "ENSG00000166589" "ENSG00000166589"
## [133] "ENSG00000166589" "ENSG00000166589" "ENSG00000179242"
## [136] "ENSG00000179242" "ENSG00000113100" "ENSG00000227767"
## [139] "ENSG00000153046" "ENSG00000101489" "ENSG00000101489"
## [142] "ENSG00000101489" "ENSG00000101489" "ENSG00000134873"
## [145] "ENSG00000134873" "ENSG00000159261" "ENSG00000169583"
## [148] "ENSG00000120885" "ENSG00000148842" "ENSG00000148842"
## [151] "ENSG00000148842" "ENSG00000149972" "ENSG00000149972"
## [154] "ENSG00000149972" "ENSG00000134871" "ENSG00000130635"
## [157] "ENSG00000165644" "ENSG00000198612" "ENSG00000198612"
## [160] "ENSG00000091704" "ENSG00000091704" "ENSG00000169372"
## [163] "ENSG00000146592" "ENSG00000146592" "ENSG00000160202"
## [166] "ENSG00000060069" "ENSG00000060069" "ENSG00000134030"
## [169] "ENSG00000134030" "ENSG00000153015" "ENSG00000153015"
## [172] "ENSG00000153015" "ENSG00000019186" "ENSG00000019186"
## [175] "ENSG00000132437" "ENSG00000079785" "ENSG00000141141"
## [178] "ENSG00000160049" "ENSG00000160049" "ENSG00000109016"
## [181] "ENSG00000100697" "ENSG00000151240" "ENSG00000150672"
## [184] "ENSG00000151208" "ENSG00000080845" "ENSG00000119689"
## [187] "ENSG00000119689" "ENSG00000119689" "ENSG00000119689"
## [190] "ENSG00000143006" "ENSG00000079805" "ENSG00000079805"
## [193] "ENSG00000079805" "ENSG00000079805" "ENSG00000079805"
## [196] "ENSG00000130226" "ENSG00000156162" "ENSG00000149636"
## [199] "ENSG00000149636" "ENSG00000149636" "ENSG00000047579"
## [202] "ENSG00000047579" "ENSG00000047579" "ENSG00000143507"
## [205] "ENSG00000143507" "ENSG00000229847" "ENSG00000229847"
## [208] "ENSG00000229847" "ENSG00000164778" "ENSG00000167280"
## [211] "ENSG00000104714" "ENSG00000119715" "ENSG00000119715"
## [214] "ENSG00000072840" "ENSG00000064655" "ENSG00000064655"
## [217] "ENSG00000088926" "ENSG00000168309" "ENSG00000168309"
## [220] "ENSG00000184731" "ENSG00000196814" "ENSG00000196814"
## [223] "ENSG00000154153" "ENSG00000189292" "ENSG00000182183"
## [226] "ENSG00000115363" "ENSG00000047662" "ENSG00000219438"
## [229] "ENSG00000168672" "ENSG00000083857" "ENSG00000083857"
## [232] "ENSG00000165140" "ENSG00000112787" "ENSG00000112787"
## [235] "ENSG00000085265" "ENSG00000126266" "ENSG00000066468"
## [238] "ENSG00000066468" "ENSG00000066468" "ENSG00000126500"
## [241] "ENSG00000075426" "ENSG00000164916" "ENSG00000114861"
## [244] "ENSG00000150893" "ENSG00000033170" "ENSG00000166206"
## [247] "ENSG00000116717" "ENSG00000116717" "ENSG00000116717"
## [250] "ENSG00000116717" "ENSG00000116717" "ENSG00000116717"
## [253] "ENSG00000143641" "ENSG00000182870" "ENSG00000130700"
## [256] "ENSG00000168505" "ENSG00000165702" "ENSG00000165702"
## [259] "ENSG00000167741" "ENSG00000167741" "ENSG00000074047"
## [262] "ENSG00000107249" "ENSG00000151948" "ENSG00000151948"
## [265] "ENSG00000137198" "ENSG00000156049" "ENSG00000197177"
## [268] "ENSG00000077585" "ENSG00000158292" "ENSG00000119714"
## [271] "ENSG00000178075" "ENSG00000125651" "ENSG00000077235"
## [274] "ENSG00000069812" "ENSG00000166135" "ENSG00000180448"
## [277] "ENSG00000108753" "ENSG00000108753" "ENSG00000108753"
## [280] "ENSG00000108753" "ENSG00000136720" "ENSG00000165868"
## [283] "ENSG00000165868" "ENSG00000003147" "ENSG00000003147"
## [286] "ENSG00000003147" "ENSG00000160223" "ENSG00000172201"
## [289] "ENSG00000172201" "ENSG00000134049" "ENSG00000117154"
## [292] "ENSG00000117154" "ENSG00000185950" "ENSG00000113430"
## [295] "ENSG00000113430" "ENSG00000105655" "ENSG00000105655"
## [298] "ENSG00000105655" "ENSG00000188385" "ENSG00000154118"
## [301] "ENSG00000107104" "ENSG00000102781" "ENSG00000189337"
## [304] "ENSG00000115041" "ENSG00000169427" "ENSG00000053918"
## [307] "ENSG00000134504" "ENSG00000167977" "ENSG00000127663"
## [310] "ENSG00000127663" "ENSG00000119537" "ENSG00000131149"
## [313] "ENSG00000136051" "ENSG00000257093" "ENSG00000122778"
## [316] "ENSG00000122778" "ENSG00000140950" "ENSG00000173214"
## [319] "ENSG00000130294" "ENSG00000066735" "ENSG00000066735"
## [322] "ENSG00000067082" "ENSG00000067082" "ENSG00000067082"
## [325] "ENSG00000067082" "ENSG00000150361" "ENSG00000197705"
## [328] "ENSG00000053747" "ENSG00000053747" "ENSG00000091136"
## [331] "ENSG00000168961" "ENSG00000168961" "ENSG00000168961"
## [334] "ENSG00000132130" "ENSG00000073350" "ENSG00000073350"
## [337] "ENSG00000073350" "ENSG00000103227" "ENSG00000103227"
## [340] "ENSG00000113368" "ENSG00000163380" "ENSG00000136944"
## [343] "ENSG00000136944" "ENSG00000136944" "ENSG00000167210"
## [346] "ENSG00000153395" "ENSG00000136141" "ENSG00000136141"
## [349] "ENSG00000136141" "ENSG00000146006" "ENSG00000146006"
## [352] "ENSG00000166159" "ENSG00000166159" "ENSG00000166159"
## [355] "ENSG00000166159" "ENSG00000166159" "ENSG00000166159"
## [358] "ENSG00000119681" "ENSG00000002822" "ENSG00000002822"
## [361] "ENSG00000002822" "ENSG00000178573" "ENSG00000178573"
## [364] "ENSG00000185022" "ENSG00000172469" "ENSG00000135525"
## [367] "ENSG00000135525" "ENSG00000135525" "ENSG00000138834"
## [370] "ENSG00000138834" "ENSG00000137337" "ENSG00000085871"
## [373] "ENSG00000085871" "ENSG00000085871" "ENSG00000085871"
## [376] "ENSG00000249567" "ENSG00000221323" "ENSG00000207588"
## [379] "ENSG00000105926" "ENSG00000158186" "ENSG00000182170"
## [382] "ENSG00000153944" "ENSG00000138823" "ENSG00000129422"
## [385] "ENSG00000129422" "ENSG00000132938" "ENSG00000133055"
## [388] "ENSG00000169994" "ENSG00000187556" "ENSG00000196498"
## [391] "ENSG00000196498" "ENSG00000196498" "ENSG00000196498"
## [394] "ENSG00000196498" "ENSG00000196498" "ENSG00000104419"
## [397] "ENSG00000104419" "ENSG00000104419" "ENSG00000104419"
## [400] "ENSG00000115286" "ENSG00000103154" "ENSG00000109320"
## [403] "ENSG00000109320" "ENSG00000148826" "ENSG00000148826"
## [406] "ENSG00000106410" "ENSG00000106410" "ENSG00000074771"
## [409] "ENSG00000170485" "ENSG00000214285" "ENSG00000105954"
## [412] "ENSG00000182667" "ENSG00000182667" "ENSG00000182667"
## [415] "ENSG00000115758" "ENSG00000205927" "ENSG00000183715"
## [418] "ENSG00000115947" "ENSG00000178602" "ENSG00000172818"
## [421] "ENSG00000125850" "ENSG00000099864" "ENSG00000099864"
## [424] "ENSG00000116183" "ENSG00000116183" "ENSG00000137819"
## [427] "ENSG00000102699" "ENSG00000242265" "ENSG00000242265"
## [430] "ENSG00000142655" "ENSG00000142655" "ENSG00000067057"
## [433] "ENSG00000144824" "ENSG00000165443" "ENSG00000105229"
## [436] "ENSG00000126822" "ENSG00000171680" "ENSG00000114554"
## [439] "ENSG00000114554" "ENSG00000114554" "ENSG00000141682"
## [442] "ENSG00000124225" "ENSG00000122512" "ENSG00000122512"
## [445] "ENSG00000168081" "ENSG00000014138" "ENSG00000166169"
## [448] "ENSG00000166169" "ENSG00000166169" "ENSG00000166169"
## [451] "ENSG00000106536" "ENSG00000106536" "ENSG00000162407"
## [454] "ENSG00000147535" "ENSG00000147535" "ENSG00000147535"
## [457] "ENSG00000154001" "ENSG00000170325" "ENSG00000170325"
## [460] "ENSG00000110851" "ENSG00000175785" "ENSG00000111725"
## [463] "ENSG00000106617" "ENSG00000065675" "ENSG00000065675"
## [466] "ENSG00000111218" "ENSG00000111218" "ENSG00000155066"
## [469] "ENSG00000155066" "ENSG00000155066" "ENSG00000205352"
## [472] "ENSG00000205352" "ENSG00000205352" "ENSG00000205352"
## [475] "ENSG00000167157" "ENSG00000163636" "ENSG00000169398"
## [478] "ENSG00000169398" "ENSG00000169398" "ENSG00000134644"
## [481] "ENSG00000134644" "ENSG00000112531" "ENSG00000112531"
## [484] "ENSG00000112531" "ENSG00000112531" "ENSG00000107560"
## [487] "ENSG00000168461" "ENSG00000141542" "ENSG00000017797"
## [490] "ENSG00000136828" "ENSG00000136828" "ENSG00000136828"
## [493] "ENSG00000185989" "ENSG00000165105" "ENSG00000122035"
## [496] "ENSG00000122965" "ENSG00000122965" "ENSG00000122965"
## [499] "ENSG00000160957" "ENSG00000143954" "ENSG00000143954"
## [502] "ENSG00000143954" "ENSG00000159788" "ENSG00000091844"
## [505] "ENSG00000158106" "ENSG00000183421" "ENSG00000139797"
## [508] "ENSG00000113269" "ENSG00000069667" "ENSG00000100784"
## [511] "ENSG00000100784" "ENSG00000141564" "ENSG00000141564"
## [514] "ENSG00000165526" "ENSG00000165526" "ENSG00000182010"
## [517] "ENSG00000198838" "ENSG00000198838" "ENSG00000256463"
## [520] "ENSG00000256463" "ENSG00000256463" "ENSG00000149021"
## [523] "ENSG00000136546" "ENSG00000136546" "ENSG00000146555"
## [526] "ENSG00000146555" "ENSG00000187764" "ENSG00000187764"
## [529] "ENSG00000163904" "ENSG00000152217" "ENSG00000183576"
## [532] "ENSG00000183576" "ENSG00000225383" "ENSG00000164690"
## [535] "ENSG00000142178" "ENSG00000159263" "ENSG00000159263"
## [538] "ENSG00000159263" "ENSG00000159263" "ENSG00000113504"
## [541] "ENSG00000152779" "ENSG00000162241" "ENSG00000162241"
## [544] "ENSG00000173262" "ENSG00000157765" "ENSG00000157765"
## [547] "ENSG00000160190" "ENSG00000143036" "ENSG00000143036"
## [550] "ENSG00000143036" "ENSG00000162426" "ENSG00000066230"
## [553] "ENSG00000173930" "ENSG00000166949" "ENSG00000127616"
## [556] "ENSG00000127616" "ENSG00000127616" "ENSG00000127616"
## [559] "ENSG00000188176" "ENSG00000048471" "ENSG00000172803"
## [562] "ENSG00000184557" "ENSG00000125398" "ENSG00000125398"
## [565] "ENSG00000185594" "ENSG00000187678" "ENSG00000187678"
## [568] "ENSG00000124783" "ENSG00000149418" "ENSG00000133121"
## [571] "ENSG00000133121" "ENSG00000102572" "ENSG00000152953"
## [574] "ENSG00000015592" "ENSG00000165730" "ENSG00000165730"
## [577] "ENSG00000165730" "ENSG00000165730" "ENSG00000198203"
## [580] "ENSG00000198203" "ENSG00000117614" "ENSG00000117614"
## [583] "ENSG00000131018" "ENSG00000131018" "ENSG00000078269"
## [586] "ENSG00000143028" "ENSG00000130699" "ENSG00000164691"
## [589] "ENSG00000164691" "ENSG00000164691" "ENSG00000167291"
## [592] "ENSG00000095383" "ENSG00000095383" "ENSG00000095383"
## [595] "ENSG00000095383" "ENSG00000095383" "ENSG00000095383"
## [598] "ENSG00000006638" "ENSG00000006638" "ENSG00000187621"
## [601] "ENSG00000160180" "ENSG00000163235" "ENSG00000163235"
## [604] "ENSG00000041988" "ENSG00000041988" "ENSG00000146426"
## [607] "ENSG00000106829" "ENSG00000155957" "ENSG00000144120"
## [610] "ENSG00000144120" "ENSG00000144120" "ENSG00000151353"
## [613] "ENSG00000151353" "ENSG00000214128" "ENSG00000160055"
## [616] "ENSG00000136205" "ENSG00000162341" "ENSG00000115705"
## [619] "ENSG00000115705" "ENSG00000126602" "ENSG00000167632"
## [622] "ENSG00000071575" "ENSG00000071575" "ENSG00000137699"
## [625] "ENSG00000100815" "ENSG00000103671" "ENSG00000119121"
## [628] "ENSG00000154743" "ENSG00000154743" "ENSG00000179981"
## [631] "ENSG00000182463" "ENSG00000121297" "ENSG00000214063"
## [634] "ENSG00000032389" "ENSG00000123607" "ENSG00000105948"
## [637] "ENSG00000105948" "ENSG00000105948" "ENSG00000100154"
## [640] "ENSG00000143367" "ENSG00000143367" "ENSG00000233608"
## [643] "ENSG00000184787" "ENSG00000184787" "ENSG00000184787"
## [646] "ENSG00000178473" "ENSG00000115446" "ENSG00000113763"
## [649] "ENSG00000101558" "ENSG00000101558" "ENSG00000129003"
## [652] "ENSG00000129003" "ENSG00000129003" "ENSG00000129003"
## [655] "ENSG00000176428" "ENSG00000185274" "ENSG00000185274"
## [658] "ENSG00000185274" "ENSG00000065268" "ENSG00000160193"
## [661] "ENSG00000103175" "ENSG00000198373" "ENSG00000076924"
## [664] "ENSG00000196584" "ENSG00000130733" "ENSG00000184828"
## [667] "ENSG00000213588" "ENSG00000014164" "ENSG00000175048"
## [670] "ENSG00000175048" "ENSG00000153786" "ENSG00000153786"
## [673] "ENSG00000156639" "ENSG00000156639" "ENSG00000133858"
## [676] "ENSG00000139800" "ENSG00000015171" "ENSG00000015171"
## [679] "ENSG00000102935" "ENSG00000102935" "ENSG00000183621"
## [682] "ENSG00000183621" "ENSG00000183621" "ENSG00000183621"
## [685] "ENSG00000183621" "ENSG00000183621" "ENSG00000183621"
## [688] "ENSG00000197857" "ENSG00000197857" "ENSG00000225614"
## [691] "ENSG00000225614" "ENSG00000171425" "ENSG00000157657"
## [694] "ENSG00000157657" "ENSG00000183779" "ENSG00000183779"
# Convert the TSS to ensg as well

# Inner join of the TSS table (key V5) with the gene lookup (key Gene).
ref_gene_hg19_ensg <- merge(refGene_hg19_TSS, gene_id, by.x = c("V5"), by.y = c("Gene"))

# Background set: each distinct ENSG id present in the joined TSS table.
all_ref_gene_hg19_ensg <- unique(ref_gene_hg19_ensg$ensg)

# TRUE for every background gene that also appears in the closest-gene table.
kidney_ref_gene <- all_ref_gene_hg19_ensg %in% comb_kidney$ensg

# Revisions- run GO
# Merge ENSG with true/false

# Build the 0/1 score vector from the membership vector computed just above.
# It was previously built from heart_ref_gene, so this section re-tested the
# heart gene set instead of the one derived here.
# NOTE(review): any rendered output captured before this fix needs to be
# regenerated.
test_gene <- as.numeric(kidney_ref_gene)
names(test_gene) <- all_ref_gene_hg19_ensg

# Run topGO
# Build the topGOdata object for Biological Process terms. `test_gene` is a
# named 0/1 vector; geneSel flags the genes with a score above 0 as the genes
# of interest. The call previously did not parse: the geneSel function was
# never closed and the annotationFun / mapping values were blank.
go_data <- new("topGOdata",
  ontology = "BP",
  allGenes = test_gene,
  geneSel = function(allScore) {
    allScore > 0
  },
  nodeSize = 5,
  # The gene names are human Ensembl (ENSG) ids, so annotate through the
  # org.Hs.eg.db mapping.
  # NOTE(review): these two values were restored from the topGO annFUN.org
  # interface -- confirm they match the original analysis.
  annotationFun = annFUN.org,
  mapping = "org.Hs.eg.db",
  ID = "ensembl"
)

# Perform enrichment test
# The test has to be re-run on the go_data built above; without this line
# go_test would still be the result left over from the previous section.
go_test <- runTest(go_data, algorithm = "weight01", statistic = "fisher")

# Report every term whose weight01 score is below 0.01, ordered by that score.
go_table <- GenTable(go_data,
  weightFisher = go_test,
  orderBy = "weightFisher", ranksOf = "weightFisher",
  topNodes = sum(score(go_test) < .01)
)

##        GO.ID                                        Term Annotated
## 1 GO:0009113      purine nucleobase biosynthetic process        12
## 2 GO:0033197                       response to vitamin E        12
## 3 GO:0006351                transcription, DNA-templated      3277
## 4 GO:0032007        negative regulation of TOR signaling        40
## 5 GO:0043547      positive regulation of GTPase activity       354
## 6 GO:0060070             canonical Wnt signaling pathway       274
## 7 GO:1903078 positive regulation of protein localizat...        46
## 8 GO:0071320                   cellular response to cAMP        47
##   Significant Expected weightFisher
## 1           2     0.03      0.00046
## 2           2     0.03      0.00046
## 3          14     8.81      0.00408
## 4           2     0.11      0.00515
## 5           6     0.95      0.00540
## 6           4     0.74      0.00656
## 7           2     0.12      0.00677
## 8           2     0.13      0.00706
## $<NA>


# Find the liver hypo tDMRs (the result is still stored in heart_hypo)
# Keep rows of the LIVER table labelled "hypo" in V4 whose V6 is not "-1"
# (presumably the no-overlap marker -- TODO confirm).
heart_hypo <- local({
  liver_tdmr <- human_chimp_heart_specific_25_conserved_H3K27_LIVER
  liver_tdmr[which(liver_tdmr$V4 == "hypo" & liver_tdmr$V6 != "-1"), ]
})

# Drop any record that has a missing value in any column.
heart_hypo <- heart_hypo[complete.cases(heart_hypo), ]

# Find the closest gene
# Fix: this step had no code, so the merge below reused closest_heart from the
# previous tissue. Recompute the nearest refGene TSS for the regions currently
# held in heart_hypo, using the same call as the lung section.
closest_heart <- bedr(input = list(a = heart_hypo[, 1:3], b = refGene_hg19_TSS),
                      method = "closest", check.chr = FALSE)

# Convert the gene name to ensg
# Lookup table read from CSV; the merges rely on its Gene and ensg columns.
gene_id <- read.table("../../../Reg_Evo_Primates/data/ENSG_GENE_HG19.csv", stringsAsFactors = FALSE, header = TRUE, sep = ",")

# Attach ENSG IDs to the closest-gene table (column V8 matched against Gene).
comb_kidney <- merge(closest_heart, gene_id, by.x = "V8", by.y = "Gene")

##    [1] "ENSG00000121410" "ENSG00000114771" "ENSG00000114771"
##    [4] "ENSG00000141338" "ENSG00000121270" "ENSG00000108846"
##    [7] "ENSG00000108846" "ENSG00000108846" "ENSG00000108846"
##   [10] "ENSG00000138075" "ENSG00000076555" "ENSG00000076555"
##   [13] "ENSG00000181513" "ENSG00000181513" "ENSG00000181513"
##   [16] "ENSG00000181513" "ENSG00000122729" "ENSG00000197142"
##   [19] "ENSG00000183549" "ENSG00000143199" "ENSG00000143199"
##   [22] "ENSG00000143199" "ENSG00000143199" "ENSG00000162104"
##   [25] "ENSG00000183077" "ENSG00000183077" "ENSG00000183077"
##   [28] "ENSG00000157985" "ENSG00000157985" "ENSG00000157985"
##   [31] "ENSG00000165923" "ENSG00000165923" "ENSG00000165923"
##   [34] "ENSG00000144891" "ENSG00000144891" "ENSG00000144891"
##   [37] "ENSG00000144891" "ENSG00000172482" "ENSG00000113492"
##   [40] "ENSG00000042286" "ENSG00000042286" "ENSG00000011243"
##   [43] "ENSG00000106948" "ENSG00000198610" "ENSG00000198610"
##   [46] "ENSG00000142208" "ENSG00000023330" "ENSG00000023330"
##   [49] "ENSG00000170017" "ENSG00000170017" "ENSG00000170017"
##   [52] "ENSG00000170017" "ENSG00000170017" "ENSG00000170017"
##   [55] "ENSG00000170017" "ENSG00000170017" "ENSG00000033011"
##   [58] "ENSG00000198796" "ENSG00000136383" "ENSG00000136383"
##   [61] "ENSG00000162551" "ENSG00000162551" "ENSG00000162551"
##   [64] "ENSG00000106927" "ENSG00000139344" "ENSG00000166126"
##   [67] "ENSG00000166025" "ENSG00000166025" "ENSG00000116337"
##   [70] "ENSG00000116337" "ENSG00000174945" "ENSG00000116194"
##   [73] "ENSG00000116194" "ENSG00000198483" "ENSG00000154945"
##   [76] "ENSG00000131620" "ENSG00000131620" "ENSG00000074855"
##   [79] "ENSG00000042753" "ENSG00000042753" "ENSG00000132703"
##   [82] "ENSG00000110243" "ENSG00000110243" "ENSG00000084674"
##   [85] "ENSG00000175336" "ENSG00000118520" "ENSG00000118520"
##   [88] "ENSG00000118520" "ENSG00000118520" "ENSG00000196843"
##   [91] "ENSG00000133794" "ENSG00000133794" "ENSG00000133794"
##   [94] "ENSG00000136950" "ENSG00000111339" "ENSG00000111339"
##   [97] "ENSG00000100325" "ENSG00000100325" "ENSG00000141505"
##  [100] "ENSG00000141505" "ENSG00000141505" "ENSG00000141505"
##  [103] "ENSG00000161944" "ENSG00000161944" "ENSG00000161944"
##  [106] "ENSG00000161944" "ENSG00000161944" "ENSG00000126522"
##  [109] "ENSG00000126522" "ENSG00000126522" "ENSG00000169696"
##  [112] "ENSG00000169696" "ENSG00000169696" "ENSG00000169136"
##  [115] "ENSG00000169136" "ENSG00000157087" "ENSG00000157087"
##  [118] "ENSG00000186009" "ENSG00000107518" "ENSG00000204842"
##  [121] "ENSG00000158321" "ENSG00000119986" "ENSG00000109956"
##  [124] "ENSG00000109956" "ENSG00000182272" "ENSG00000117411"
##  [127] "ENSG00000156273" "ENSG00000175866" "ENSG00000175866"
##  [130] "ENSG00000175866" "ENSG00000175866" "ENSG00000255056"
##  [133] "ENSG00000172530" "ENSG00000172530" "ENSG00000172530"
##  [136] "ENSG00000172530" "ENSG00000172530" "ENSG00000114200"
##  [139] "ENSG00000153094" "ENSG00000153094" "ENSG00000153094"
##  [142] "ENSG00000153094" "ENSG00000153094" "ENSG00000153094"
##  [145] "ENSG00000153094" "ENSG00000153094" "ENSG00000153094"
##  [148] "ENSG00000153094" "ENSG00000153094" "ENSG00000153094"
##  [151] "ENSG00000153094" "ENSG00000153094" "ENSG00000153094"
##  [154] "ENSG00000153094" "ENSG00000153094" "ENSG00000153094"
##  [157] "ENSG00000121380" "ENSG00000121380" "ENSG00000100739"
##  [160] "ENSG00000015475" "ENSG00000015475" "ENSG00000136717"
##  [163] "ENSG00000136717" "ENSG00000136717" "ENSG00000136717"
##  [166] "ENSG00000136717" "ENSG00000136717" "ENSG00000136717"
##  [169] "ENSG00000136717" "ENSG00000136717" "ENSG00000136717"
##  [172] "ENSG00000115760" "ENSG00000197299" "ENSG00000168487"
##  [175] "ENSG00000168487" "ENSG00000168487" "ENSG00000168487"
##  [178] "ENSG00000140299" "ENSG00000145919" "ENSG00000145919"
##  [181] "ENSG00000176720" "ENSG00000234235" "ENSG00000214688"
##  [184] "ENSG00000110696" "ENSG00000111412" "ENSG00000173064"
##  [187] "ENSG00000214900" "ENSG00000128944" "ENSG00000128944"
##  [190] "ENSG00000128944" "ENSG00000166780" "ENSG00000125149"
##  [193] "ENSG00000125149" "ENSG00000174109" "ENSG00000185504"
##  [196] "ENSG00000185504" "ENSG00000168675" "ENSG00000168675"
##  [199] "ENSG00000168675" "ENSG00000168675" "ENSG00000168675"
##  [202] "ENSG00000168675" "ENSG00000130813" "ENSG00000130813"
##  [205] "ENSG00000130173" "ENSG00000168275" "ENSG00000159403"
##  [208] "ENSG00000159403" "ENSG00000182326" "ENSG00000182326"
##  [211] "ENSG00000166278" "ENSG00000166278" "ENSG00000166278"
##  [214] "ENSG00000166278" "ENSG00000101474" "ENSG00000128254"
##  [217] "ENSG00000215012" "ENSG00000100249" "ENSG00000115998"
##  [220] "ENSG00000204128" "ENSG00000215217" "ENSG00000039537"
##  [223] "ENSG00000146521" "ENSG00000244291" "ENSG00000170279"
##  [226] "ENSG00000157131" "ENSG00000021852" "ENSG00000021852"
##  [229] "ENSG00000021852" "ENSG00000176919" "ENSG00000113600"
##  [232] "ENSG00000134508" "ENSG00000134508" "ENSG00000154040"
##  [235] "ENSG00000154040" "ENSG00000154040" "ENSG00000154040"
##  [238] "ENSG00000154040" "ENSG00000171735" "ENSG00000171735"
##  [241] "ENSG00000171735" "ENSG00000171735" "ENSG00000042493"
##  [244] "ENSG00000110888" "ENSG00000110888" "ENSG00000110888"
##  [247] "ENSG00000110888" "ENSG00000110888" "ENSG00000213995"
##  [250] "ENSG00000213995" "ENSG00000142273" "ENSG00000142273"
##  [253] "ENSG00000139899" "ENSG00000139899" "ENSG00000160200"
##  [256] "ENSG00000160200" "ENSG00000144648" "ENSG00000005059"
##  [259] "ENSG00000160799" "ENSG00000144395" "ENSG00000165972"
##  [262] "ENSG00000161573" "ENSG00000110092" "ENSG00000110092"
##  [265] "ENSG00000177575" "ENSG00000177575" "ENSG00000177575"
##  [268] "ENSG00000177575" "ENSG00000134061" "ENSG00000178562"
##  [271] "ENSG00000178562" "ENSG00000178562" "ENSG00000110651"
##  [274] "ENSG00000151465" "ENSG00000099804" "ENSG00000198752"
##  [277] "ENSG00000149798" "ENSG00000170779" "ENSG00000170779"
##  [280] "ENSG00000136807" "ENSG00000166446" "ENSG00000153879"
##  [283] "ENSG00000153879" "ENSG00000241832" "ENSG00000149187"
##  [286] "ENSG00000011523" "ENSG00000011523" "ENSG00000159398"
##  [289] "ENSG00000159398" "ENSG00000087237" "ENSG00000243649"
##  [292] "ENSG00000165410" "ENSG00000165410" "ENSG00000165410"
##  [295] "ENSG00000016391" "ENSG00000016391" "ENSG00000085872"
##  [298] "ENSG00000177830" "ENSG00000177830" "ENSG00000177830"
##  [301] "ENSG00000177830" "ENSG00000177830" "ENSG00000110721"
##  [304] "ENSG00000110721" "ENSG00000104879" "ENSG00000159261"
##  [307] "ENSG00000159261" "ENSG00000125246" "ENSG00000091317"
##  [310] "ENSG00000091317" "ENSG00000170293" "ENSG00000150656"
##  [313] "ENSG00000133313" "ENSG00000168763" "ENSG00000168763"
##  [316] "ENSG00000158158" "ENSG00000184144" "ENSG00000106078"
##  [319] "ENSG00000196739" "ENSG00000118004" "ENSG00000118004"
##  [322] "ENSG00000118004" "ENSG00000118004" "ENSG00000118004"
##  [325] "ENSG00000118004" "ENSG00000131143" "ENSG00000178772"
##  [328] "ENSG00000178772" "ENSG00000178772" "ENSG00000100884"
##  [331] "ENSG00000157184" "ENSG00000167193" "ENSG00000167193"
##  [334] "ENSG00000178585" "ENSG00000178585" "ENSG00000040531"
##  [337] "ENSG00000040531" "ENSG00000111249" "ENSG00000111249"
##  [340] "ENSG00000154639" "ENSG00000154639" "ENSG00000154639"
##  [343] "ENSG00000154639" "ENSG00000154639" "ENSG00000166347"
##  [346] "ENSG00000166347" "ENSG00000166347" "ENSG00000166347"
##  [349] "ENSG00000166347" "ENSG00000166347" "ENSG00000166394"
##  [352] "ENSG00000140505" "ENSG00000135929" "ENSG00000135929"
##  [355] "ENSG00000135929" "ENSG00000138115" "ENSG00000138115"
##  [358] "ENSG00000138115" "ENSG00000138115" "ENSG00000106258"
##  [361] "ENSG00000106258" "ENSG00000106258" "ENSG00000106258"
##  [364] "ENSG00000106258" "ENSG00000106258" "ENSG00000106258"
##  [367] "ENSG00000106258" "ENSG00000106258" "ENSG00000106258"
##  [370] "ENSG00000106258" "ENSG00000106258" "ENSG00000106258"
##  [373] "ENSG00000106258" "ENSG00000106258" "ENSG00000106258"
##  [376] "ENSG00000186115" "ENSG00000171954" "ENSG00000171954"
##  [379] "ENSG00000186529" "ENSG00000186529" "ENSG00000186529"
##  [382] "ENSG00000164488" "ENSG00000112977" "ENSG00000172992"
##  [385] "ENSG00000043093" "ENSG00000132437" "ENSG00000100201"
##  [388] "ENSG00000100201" "ENSG00000141141" "ENSG00000100150"
##  [391] "ENSG00000100150" "ENSG00000077044" "ENSG00000102967"
##  [394] "ENSG00000181192" "ENSG00000181192" "ENSG00000067596"
##  [397] "ENSG00000184047" "ENSG00000184047" "ENSG00000184047"
##  [400] "ENSG00000184047" "ENSG00000258498" "ENSG00000258498"
##  [403] "ENSG00000258498" "ENSG00000066084" "ENSG00000108176"
##  [406] "ENSG00000108176" "ENSG00000163687" "ENSG00000163687"
##  [409] "ENSG00000167130" "ENSG00000167130" "ENSG00000167130"
##  [412] "ENSG00000184845" "ENSG00000143507" "ENSG00000161326"
##  [415] "ENSG00000108861" "ENSG00000107404" "ENSG00000105204"
##  [418] "ENSG00000105204" "ENSG00000105204" "ENSG00000123179"
##  [421] "ENSG00000134463" "ENSG00000229715" "ENSG00000229715"
##  [424] "ENSG00000142634" "ENSG00000169242" "ENSG00000169242"
##  [427] "ENSG00000099617" "ENSG00000172889" "ENSG00000172889"
##  [430] "ENSG00000146648" "ENSG00000146648" "ENSG00000146648"
##  [433] "ENSG00000146648" "ENSG00000171570" "ENSG00000173812"
##  [436] "ENSG00000106263" "ENSG00000106263" "ENSG00000066044"
##  [439] "ENSG00000196361" "ENSG00000196361" "ENSG00000155849"
##  [442] "ENSG00000155849" "ENSG00000155849" "ENSG00000134759"
##  [445] "ENSG00000134759" "ENSG00000134759" "ENSG00000134759"
##  [448] "ENSG00000134759" "ENSG00000134759" "ENSG00000134759"
##  [451] "ENSG00000160963" "ENSG00000167136" "ENSG00000116016"
##  [454] "ENSG00000182580" "ENSG00000196411" "ENSG00000196411"
##  [457] "ENSG00000130427" "ENSG00000113719" "ENSG00000086619"
##  [460] "ENSG00000139684" "ENSG00000196405" "ENSG00000205436"
##  [463] "ENSG00000107371" "ENSG00000107371" "ENSG00000182197"
##  [466] "ENSG00000092820" "ENSG00000126218" "ENSG00000180210"
##  [469] "ENSG00000159784" "ENSG00000109794" "ENSG00000152102"
##  [472] "ENSG00000185442" "ENSG00000188916" "ENSG00000189319"
##  [475] "ENSG00000133477" "ENSG00000188522" "ENSG00000176853"
##  [478] "ENSG00000169710" "ENSG00000177294" "ENSG00000100225"
##  [481] "ENSG00000100225" "ENSG00000171557" "ENSG00000171557"
##  [484] "ENSG00000115226" "ENSG00000160097" "ENSG00000160097"
##  [487] "ENSG00000170802" "ENSG00000106701" "ENSG00000106701"
##  [490] "ENSG00000070404" "ENSG00000160282" "ENSG00000160282"
##  [493] "ENSG00000107164" "ENSG00000165060" "ENSG00000165060"
##  [496] "ENSG00000165060" "ENSG00000163251" "ENSG00000131482"
##  [499] "ENSG00000131482" "ENSG00000154252" "ENSG00000108479"
##  [502] "ENSG00000106648" "ENSG00000106648" "ENSG00000128310"
##  [505] "ENSG00000130005" "ENSG00000130005" "ENSG00000111640"
##  [508] "ENSG00000213512" "ENSG00000213512" "ENSG00000106633"
##  [511] "ENSG00000106633" "ENSG00000084734" "ENSG00000023909"
##  [514] "ENSG00000178795" "ENSG00000141098" "ENSG00000141098"
##  [517] "ENSG00000141098" "ENSG00000151892" "ENSG00000115486"
##  [520] "ENSG00000115486" "ENSG00000157017" "ENSG00000157017"
##  [523] "ENSG00000157017" "ENSG00000157017" "ENSG00000157017"
##  [526] "ENSG00000157017" "ENSG00000157017" "ENSG00000157017"
##  [529] "ENSG00000157017" "ENSG00000157017" "ENSG00000137960"
##  [532] "ENSG00000151948" "ENSG00000016864" "ENSG00000016864"
##  [535] "ENSG00000203972" "ENSG00000196743" "ENSG00000196743"
##  [538] "ENSG00000112699" "ENSG00000114349" "ENSG00000114349"
##  [541] "ENSG00000100522" "ENSG00000185245" "ENSG00000119927"
##  [544] "ENSG00000119927" "ENSG00000119927" "ENSG00000119927"
##  [547] "ENSG00000112293" "ENSG00000132975" "ENSG00000180758"
##  [550] "ENSG00000166123" "ENSG00000176153" "ENSG00000176153"
##  [553] "ENSG00000176153" "ENSG00000075240" "ENSG00000083307"
##  [556] "ENSG00000139835" "ENSG00000100577" "ENSG00000077809"
##  [559] "ENSG00000077809" "ENSG00000077809" "ENSG00000077809"
##  [562] "ENSG00000077809" "ENSG00000101181" "ENSG00000169919"
##  [565] "ENSG00000130600" "ENSG00000148702" "ENSG00000148702"
##  [568] "ENSG00000148702" "ENSG00000130956" "ENSG00000084110"
##  [571] "ENSG00000084110" "ENSG00000084110" "ENSG00000115677"
##  [574] "ENSG00000115677" "ENSG00000122557" "ENSG00000114315"
##  [577] "ENSG00000114315" "ENSG00000168509" "ENSG00000168509"
##  [580] "ENSG00000168509" "ENSG00000168509" "ENSG00000109758"
##  [583] "ENSG00000137133" "ENSG00000100084" "ENSG00000108924"
##  [586] "ENSG00000117305" "ENSG00000117305" "ENSG00000115756"
##  [589] "ENSG00000158104" "ENSG00000110169" "ENSG00000110169"
##  [592] "ENSG00000113905" "ENSG00000113905" "ENSG00000005700"
##  [595] "ENSG00000115738" "ENSG00000142166" "ENSG00000142166"
##  [598] "ENSG00000115457" "ENSG00000243646" "ENSG00000115590"
##  [601] "ENSG00000115590" "ENSG00000196083" "ENSG00000196083"
##  [604] "ENSG00000196083" "ENSG00000196083" "ENSG00000196083"
##  [607] "ENSG00000196083" "ENSG00000196083" "ENSG00000196083"
##  [610] "ENSG00000196083" "ENSG00000196083" "ENSG00000196083"
##  [613] "ENSG00000196083" "ENSG00000196083" "ENSG00000196083"
##  [616] "ENSG00000196083" "ENSG00000196083" "ENSG00000196083"
##  [619] "ENSG00000196083" "ENSG00000196083" "ENSG00000196083"
##  [622] "ENSG00000196083" "ENSG00000196083" "ENSG00000196083"
##  [625] "ENSG00000196083" "ENSG00000136689" "ENSG00000103522"
##  [628] "ENSG00000103522" "ENSG00000100385" "ENSG00000203485"
##  [631] "ENSG00000203485" "ENSG00000203485" "ENSG00000122641"
##  [634] "ENSG00000148384" "ENSG00000254647" "ENSG00000254647"
##  [637] "ENSG00000254647" "ENSG00000129965" "ENSG00000129965"
##  [640] "ENSG00000186480" "ENSG00000186480" "ENSG00000186480"
##  [643] "ENSG00000186480" "ENSG00000186480" "ENSG00000186480"
##  [646] "ENSG00000125629" "ENSG00000134070" "ENSG00000134070"
##  [649] "ENSG00000172183" "ENSG00000078747" "ENSG00000078747"
##  [652] "ENSG00000078747" "ENSG00000083457" "ENSG00000083457"
##  [655] "ENSG00000162267" "ENSG00000055955" "ENSG00000055955"
##  [658] "ENSG00000100605" "ENSG00000100605" "ENSG00000100605"
##  [661] "ENSG00000205726" "ENSG00000205726" "ENSG00000163166"
##  [664] "ENSG00000009765" "ENSG00000009765" "ENSG00000009765"
##  [667] "ENSG00000140044" "ENSG00000154118" "ENSG00000102781"
##  [670] "ENSG00000176407" "ENSG00000069424" "ENSG00000158445"
##  [673] "ENSG00000124780" "ENSG00000169427" "ENSG00000188997"
##  [676] "ENSG00000089094" "ENSG00000089094" "ENSG00000107077"
##  [679] "ENSG00000107077" "ENSG00000166783" "ENSG00000166783"
##  [682] "ENSG00000166783" "ENSG00000176542" "ENSG00000125337"
##  [685] "ENSG00000125337" "ENSG00000118922" "ENSG00000129911"
##  [688] "ENSG00000128607" "ENSG00000128607" "ENSG00000025800"
##  [691] "ENSG00000185896" "ENSG00000002549" "ENSG00000107929"
##  [694] "ENSG00000086730" "ENSG00000086730" "ENSG00000086730"
##  [697] "ENSG00000213398" "ENSG00000164406" "ENSG00000164406"
##  [700] "ENSG00000145826" "ENSG00000116977" "ENSG00000072163"
##  [703] "ENSG00000166035" "ENSG00000166035" "ENSG00000166035"
##  [706] "ENSG00000101670" "ENSG00000189067" "ENSG00000189067"
##  [709] "ENSG00000162761" "ENSG00000102910" "ENSG00000134324"
##  [712] "ENSG00000134324" "ENSG00000070018" "ENSG00000175489"
##  [715] "ENSG00000160233" "ENSG00000124831" "ENSG00000124831"
##  [718] "ENSG00000124831" "ENSG00000124831" "ENSG00000143669"
##  [721] "ENSG00000197063" "ENSG00000145050" "ENSG00000101460"
##  [724] "ENSG00000076984" "ENSG00000119487" "ENSG00000119487"
##  [727] "ENSG00000119487" "ENSG00000119487" "ENSG00000119487"
##  [730] "ENSG00000119487" "ENSG00000099785" "ENSG00000099785"
##  [733] "ENSG00000099785" "ENSG00000009724" "ENSG00000009724"
##  [736] "ENSG00000197971" "ENSG00000197971" "ENSG00000197971"
##  [739] "ENSG00000197971" "ENSG00000126217" "ENSG00000180398"
##  [742] "ENSG00000180398" "ENSG00000128285" "ENSG00000090674"
##  [745] "ENSG00000135679" "ENSG00000135679" "ENSG00000135679"
##  [748] "ENSG00000135679" "ENSG00000108510" "ENSG00000152127"
##  [751] "ENSG00000170430" "ENSG00000199065" "ENSG00000199065"
##  [754] "ENSG00000199065" "ENSG00000221039" "ENSG00000221063"
##  [757] "ENSG00000208017" "ENSG00000199075" "ENSG00000207727"
##  [760] "ENSG00000207875" "ENSG00000207875" "ENSG00000130382"
##  [763] "ENSG00000115648" "ENSG00000115648" "ENSG00000009950"
##  [766] "ENSG00000009950" "ENSG00000009950" "ENSG00000009950"
##  [769] "ENSG00000108960" "ENSG00000173269" "ENSG00000075643"
##  [772] "ENSG00000166391" "ENSG00000166391" "ENSG00000107186"
##  [775] "ENSG00000107186" "ENSG00000107186" "ENSG00000214026"
##  [778] "ENSG00000173867" "ENSG00000173531" "ENSG00000149480"
##  [781] "ENSG00000122085" "ENSG00000122085" "ENSG00000122085"
##  [784] "ENSG00000122085" "ENSG00000132613" "ENSG00000110921"
##  [787] "ENSG00000110921" "ENSG00000172927" "ENSG00000172927"
##  [790] "ENSG00000106436" "ENSG00000065534" "ENSG00000065534"
##  [793] "ENSG00000065534" "ENSG00000065534" "ENSG00000091536"
##  [796] "ENSG00000091536" "ENSG00000236242" "ENSG00000139597"
##  [799] "ENSG00000139597" "ENSG00000008130" "ENSG00000008130"
##  [802] "ENSG00000152620" "ENSG00000141562" "ENSG00000141562"
##  [805] "ENSG00000141562" "ENSG00000166833" "ENSG00000255043"
##  [808] "ENSG00000255043" "ENSG00000255043" "ENSG00000196498"
##  [811] "ENSG00000196498" "ENSG00000196498" "ENSG00000166579"
##  [814] "ENSG00000166579" "ENSG00000151366" "ENSG00000151366"
##  [817] "ENSG00000151366" "ENSG00000165802" "ENSG00000165802"
##  [820] "ENSG00000165802" "ENSG00000165802" "ENSG00000165802"
##  [823] "ENSG00000173848" "ENSG00000107954" "ENSG00000100906"
##  [826] "ENSG00000104825" "ENSG00000104825" "ENSG00000101004"
##  [829] "ENSG00000163293" "ENSG00000172548" "ENSG00000172548"
##  [832] "ENSG00000136783" "ENSG00000169251" "ENSG00000169251"
##  [835] "ENSG00000166741" "ENSG00000015520" "ENSG00000015520"
##  [838] "ENSG00000015520" "ENSG00000015520" "ENSG00000148734"
##  [841] "ENSG00000242349" "ENSG00000131910" "ENSG00000012504"
##  [844] "ENSG00000012504" "ENSG00000012504" "ENSG00000012504"
##  [847] "ENSG00000012504" "ENSG00000012504" "ENSG00000012504"
##  [850] "ENSG00000012504" "ENSG00000144852" "ENSG00000144852"
##  [853] "ENSG00000144852" "ENSG00000143257" "ENSG00000143257"
##  [856] "ENSG00000143257" "ENSG00000143257" "ENSG00000143257"
##  [859] "ENSG00000143257" "ENSG00000143257" "ENSG00000143257"
##  [862] "ENSG00000143257" "ENSG00000143257" "ENSG00000143257"
##  [865] "ENSG00000143257" "ENSG00000143257" "ENSG00000143257"
##  [868] "ENSG00000143257" "ENSG00000143257" "ENSG00000143257"
##  [871] "ENSG00000143257" "ENSG00000143257" "ENSG00000143257"
##  [874] "ENSG00000143257" "ENSG00000143257" "ENSG00000143257"
##  [877] "ENSG00000143257" "ENSG00000143257" "ENSG00000143257"
##  [880] "ENSG00000143257" "ENSG00000143257" "ENSG00000143257"
##  [883] "ENSG00000143257" "ENSG00000113580" "ENSG00000113580"
##  [886] "ENSG00000113580" "ENSG00000113580" "ENSG00000113580"
##  [889] "ENSG00000113580" "ENSG00000113580" "ENSG00000113580"
##  [892] "ENSG00000113580" "ENSG00000113580" "ENSG00000113580"
##  [895] "ENSG00000113580" "ENSG00000113580" "ENSG00000113580"
##  [898] "ENSG00000113580" "ENSG00000113580" "ENSG00000113580"
##  [901] "ENSG00000113580" "ENSG00000113580" "ENSG00000113580"
##  [904] "ENSG00000113580" "ENSG00000113580" "ENSG00000116833"
##  [907] "ENSG00000116833" "ENSG00000116833" "ENSG00000116833"
##  [910] "ENSG00000116833" "ENSG00000116833" "ENSG00000180530"
##  [913] "ENSG00000171119" "ENSG00000151413" "ENSG00000090273"
##  [916] "ENSG00000168101" "ENSG00000168101" "ENSG00000168101"
##  [919] "ENSG00000168101" "ENSG00000132182" "ENSG00000125450"
##  [922] "ENSG00000176046" "ENSG00000176046" "ENSG00000065154"
##  [925] "ENSG00000065154" "ENSG00000180304" "ENSG00000111325"
##  [928] "ENSG00000060491" "ENSG00000119547" "ENSG00000119547"
##  [931] "ENSG00000224855" "ENSG00000175619" "ENSG00000140961"
##  [934] "ENSG00000185624" "ENSG00000179364" "ENSG00000100266"
##  [937] "ENSG00000006712" "ENSG00000006712" "ENSG00000006712"
##  [940] "ENSG00000140694" "ENSG00000140694" "ENSG00000140694"
##  [943] "ENSG00000140694" "ENSG00000140694" "ENSG00000140694"
# Convert the TSS table to ENSG IDs as well: join refGene_hg19_TSS to the
# gene_id lookup, matching TSS column V5 against the lookup's Gene column.
ref_gene_hg19_ensg <- merge(
  x = refGene_hg19_TSS,
  y = gene_id,
  by.x = "V5",
  by.y = "Gene"
)

# Background universe: every ENSG ID from the joined table, listed once.
all_ref_gene_hg19_ensg <- unique(ref_gene_hg19_ensg$ensg)

# One logical per universe gene: TRUE when the ID also occurs in
# comb_kidney$ensg.
liver_ref_gene <- match(all_ref_gene_hg19_ensg, comb_kidney$ensg,
                        nomatch = 0L) > 0L

# Revisions- run GO
# Merge ENSG with true/false
# topGO takes a named numeric vector: names are the universe ENSG IDs, values
# are 1 for genes flagged in liver_ref_gene and 0 otherwise.
test_gene <- as.numeric(as.vector(liver_ref_gene))
names(test_gene) <- all_ref_gene_hg19_ensg

# Run topGO
# Fix: the geneSel closure is now closed, and the annotation function and its
# mapping database are supplied (annFUN.org with the human OrgDb, keyed by
# Ensembl IDs to match ID = "ensembl").
go_data <- new("topGOdata",
               ontology = "BP",
               allGenes = test_gene,
               geneSel = function(allScore) {
                 allScore > 0
               },
               nodeSize = 5,
               annotationFun = annFUN.org,
               mapping = "org.Hs.eg.db",
               ID = "ensembl")

# Perform enrichment test
go_test <- runTest(go_data, algorithm = "weight01", statistic = "fisher")
go_table <- GenTable(go_data, weightFisher = go_test,
                     orderBy = "weightFisher", ranksOf = "weightFisher",
                     topNodes = sum(score(go_test) < .05))

# Fix: restore the missing constructor so this is a valid assignment.
# Two-column table (GO ID, weightFisher p-value) written without a header.
go_table_liver <- as.data.frame(cbind(go_table$GO.ID, go_table$weightFisher))

write.table(go_table_liver, "../data/go_table_liver.txt", quote = FALSE, row.names = FALSE, col.names = FALSE)


# Lung table: keep the rows whose V4 is "hyper" and whose V6 is not "-1",
# then drop any row containing an NA. The result is stored as heart_hypo,
# the name the following steps read.
heart_hypo <- local({
  lung_tdmrs <- human_chimp_heart_specific_25_conserved_H3K27_LUNG
  keep <- which(lung_tdmrs$V4 == "hyper" & lung_tdmrs$V6 != "-1")
  hits <- lung_tdmrs[keep, ]
  hits[complete.cases(hits), ]
})

# Find the closest gene: bedtools "closest" (via bedr) between the first three
# columns of the selected regions and the refGene TSS table.
closest_heart <- bedr(
  input = list(
    a = heart_hypo[, 1:3],
    b = refGene_hg19_TSS
  ),
  method = "closest",
  check.chr = FALSE
)
##  * Processing input (1): a
##  * Checking input type... PASS
##    Input seems to be in bed format but chr/start/end column names are missing
##  * Check if index is a string... PASS
##  * Check index pattern... PASS
##  * Check for missing values... PASS
##  * Check for larger start position... PASS.
##  * Check if zero based... PASS
##  * Checking sort order... PASS
##  * Checking for overlapping 'contiguous' regions... PASS
##  * Processing input (2): b
##  * Checking input type... PASS
##    Input seems to be in bed format but chr/start/end column names are missing
##  * Check if index is a string... PASS
##  * Check index pattern... PASS
##  * Check for missing values... PASS
##  * Check for larger start position... PASS.
##  * Check if zero based... PASS
##  * Checking sort order... FAIL
##    The input for object is not *lexographically* ordered!
##    This can cause unexpected results for some set operations.
##    try: x <- bedr.sort.region(x)
##  * Checking for overlapping 'contiguous' regions... FAIL
##    The input for object has overlapping features!
##    This can cause unexpected results for some set operations.
##    i.e. x <- bedr.merge.region(x)
##    bedtools closest -a /var/folders/rf/qrcw6ncj05z1pc_pq9xzw3540000gn/T//RtmpXK3I56/a_bc552850ec24.bed -b /var/folders/rf/qrcw6ncj05z1pc_pq9xzw3540000gn/T//RtmpXK3I56/b_bc557772e5c1.bed
# Convert the gene name to ensg
# Lookup table read from CSV; the merges rely on its Gene and ensg columns.
gene_id <- read.table(
  "../../../Reg_Evo_Primates/data/ENSG_GENE_HG19.csv",
  header = TRUE,
  sep = ",",
  stringsAsFactors = FALSE
)

# Attach ENSG IDs to the closest-gene table (column V8 matched against Gene).
comb_kidney <- merge(x = closest_heart, y = gene_id, by.x = "V8", by.y = "Gene")

##  [1] "ENSG00000177674" "ENSG00000177674" "ENSG00000177674"
##  [4] "ENSG00000177674" "ENSG00000177674" "ENSG00000130762"
##  [7] "ENSG00000117411" "ENSG00000026508" "ENSG00000026508"
## [10] "ENSG00000026508" "ENSG00000026508" "ENSG00000026508"
## [13] "ENSG00000026508" "ENSG00000026508" "ENSG00000026508"
## [16] "ENSG00000114861" "ENSG00000114315" "ENSG00000131149"
## [19] "ENSG00000198951" "ENSG00000196498" "ENSG00000196498"
## [22] "ENSG00000196498" "ENSG00000170322" "ENSG00000100100"
## [25] "ENSG00000100100" "ENSG00000185917" "ENSG00000185917"
## [28] "ENSG00000167323" "ENSG00000143643" "ENSG00000143643"
## [31] "ENSG00000153786" "ENSG00000153786" "ENSG00000171940"
## [34] "ENSG00000183621" "ENSG00000183621" "ENSG00000183621"
## [37] "ENSG00000183621" "ENSG00000183621" "ENSG00000183621"
## [40] "ENSG00000183621"
# Convert the TSS table to ENSG IDs as well: join refGene_hg19_TSS to the
# gene_id lookup, matching TSS column V5 against the lookup's Gene column.
ref_gene_hg19_ensg <- merge(
  x = refGene_hg19_TSS,
  y = gene_id,
  by.x = "V5",
  by.y = "Gene"
)

# Background universe: every ENSG ID from the joined table, listed once.
all_ref_gene_hg19_ensg <- unique(ref_gene_hg19_ensg$ensg)

# One logical per universe gene: TRUE when the ID also occurs in
# comb_kidney$ensg.
# NOTE(review): this section selects regions from the LUNG table, yet the flag
# vector is stored as heart_ref_gene and replaces any earlier value of that
# name -- confirm whether a lung-specific name was intended.
heart_ref_gene <- match(all_ref_gene_hg19_ensg, comb_kidney$ensg,
                        nomatch = 0L) > 0L

# Revisions- run GO
# Merge ENSG with true/false
# topGO takes a named numeric vector: names are the universe ENSG IDs, values
# are 1 for genes flagged in heart_ref_gene (assigned just above in this
# section) and 0 otherwise.
test_gene <- as.numeric(as.vector(heart_ref_gene))
names(test_gene) <- all_ref_gene_hg19_ensg

# Run topGO
# Fix: the geneSel closure is now closed, and the annotation function and its
# mapping database are supplied (annFUN.org with the human OrgDb, keyed by
# Ensembl IDs to match ID = "ensembl").
go_data <- new("topGOdata",
               ontology = "BP",
               allGenes = test_gene,
               geneSel = function(allScore) {
                 allScore > 0
               },
               nodeSize = 5,
               annotationFun = annFUN.org,
               mapping = "org.Hs.eg.db",
               ID = "ensembl")

# Perform enrichment test
go_test <- runTest(go_data, algorithm = "weight01", statistic = "fisher")
go_table <- GenTable(go_data, weightFisher = go_test,
                     orderBy = "weightFisher", ranksOf = "weightFisher",
                     topNodes = sum(score(go_test) < .01))

# Run clusterProfiler


#mydf <- data.frame(cbind(all_ref_gene_hg19_ensg, heart_ref_gene, liver_ref_gene))

#colnames(mydf) <- c("ensg", "heart", "liver")

#xx.formula.twogroups <- compareCluster(mydf$heart, data = mydf, fun="enrichGO", universe = df$ensg,
#                OrgDb         =

#dotplot(xx.formula.twogroups, showCategory=5, includeAll=FALSE)
# REVIGO scatterplot for the heart GO-enrichment results.
#
# The script (1) stores the REVIGO export as a character matrix, (2) converts
# it to a data frame with numeric plotting columns, (3) builds a small table of
# terms that should receive a text label, and (4) draws the semantic-space
# scatterplot with those labels.
#
# NOTE(review): several identifiers were missing from this section of the
# source (assignment targets and the head of the theme() call). They are
# restored here following the layout of the standard REVIGO R export
# (`revigo.data`, `one.data`); confirm against the original script.
library(ggplot2)

# Column names of the REVIGO table, in the order used by every row below.
revigo.names <- c(
  "term_ID", "description", "frequency_%", "plot_X", "plot_Y",
  "plot_size", "value", "uniqueness", "dispensability"
)

# One row per GO term. Each c() mixes strings and numbers, so every field is
# coerced to character and rbind() yields a character matrix.
revigo.data <- rbind(
  c("GO:0009113","purine nucleobase biosynthetic process", 0.124,-4.742,-3.192, 4.202, 0.0005,0.769,0.000),
  c("GO:0033197","response to vitamin E", 0.000, 7.179,-3.273, 1.740, 0.0005,0.849,0.000),
  c("GO:0019043","establishment of viral latency", 0.001,-5.135, 5.016, 1.959, 0.0187,0.945,0.018),
  c("GO:0006501","C-terminal protein lipidation", 0.004, 0.003,-5.207, 2.693, 0.0120,0.913,0.100),
  c("GO:0060509","Type I pneumocyte differentiation", 0.001,-0.420, 6.928, 2.121, 0.0134,0.698,0.103),
  c("GO:1903078","positive regulation of protein localization to plasma membrane", 0.010, 1.621, 0.720, 3.123, 0.0068,0.688,0.118),
  c("GO:0033632","regulation of cell-cell adhesion mediated by integrin", 0.002, 2.909, 0.449, 2.378, 0.0160,0.835,0.132),
  c("GO:2000109","regulation of macrophage apoptotic process", 0.001, 2.079,-2.113, 2.188, 0.0187,0.768,0.132),
  c("GO:0032007","negative regulation of TOR signaling", 0.016, 5.974, 0.117, 3.325, 0.0052,0.640,0.175),
  c("GO:0043547","positive regulation of GTPase activity", 0.470, 4.687, 1.488, 4.780, 0.0054,0.838,0.179),
  c("GO:0009256","10-formyltetrahydrofolate metabolic process", 0.002,-6.344,-1.530, 2.474, 0.0134,0.809,0.185),
  c("GO:0070141","response to UV-A", 0.002, 6.586,-3.433, 2.369, 0.0160,0.883,0.188),
  c("GO:0071499","cellular response to laminar fluid shear stress", 0.001, 6.586,-2.544, 2.143, 0.0187,0.852,0.211),
  c("GO:0006139","nucleobase-containing compound metabolic process",26.547,-4.434,-2.184, 6.532, 0.0499,0.889,0.214),
  c("GO:0018242","protein O-linked glycosylation via serine", 0.001,-1.029,-5.988, 2.117, 0.0160,0.818,0.218),
  c("GO:0015942","formate metabolic process", 0.065,-5.564,-1.813, 3.921, 0.0160,0.815,0.246),
  c("GO:0070601","centromeric sister chromatid cohesion", 0.004,-1.575,-1.033, 2.749, 0.0266,0.829,0.253),
  c("GO:0006863","purine nucleobase transport", 0.002,-4.632, 3.161, 2.464, 0.0160,0.877,0.268),
  c("GO:0032026","response to magnesium ion", 0.002, 6.932,-3.864, 2.389, 0.0473,0.863,0.290),
  c("GO:0070375","ERK5 cascade", 0.001, 3.865,-3.823, 2.041, 0.0134,0.729,0.303),
  c("GO:0060070","canonical Wnt signaling pathway", 0.061, 4.991,-1.442, 3.893, 0.0066,0.678,0.315),
  c("GO:0032486","Rap protein signal transduction", 0.002, 6.347,-0.924, 2.458, 0.0344,0.763,0.318),
  c("GO:0061430","bone trabecula morphogenesis", 0.003,-2.302, 6.815, 2.553, 0.0344,0.798,0.326),
  c("GO:0001957","intramembranous ossification", 0.001, 0.332, 7.419, 2.167, 0.0160,0.766,0.343),
  c("GO:0009120","deoxyribonucleoside metabolic process", 0.006,-4.177,-4.617, 2.908, 0.0187,0.800,0.350),
  c("GO:0007386","compartment pattern specification", 0.001, 0.048, 7.245, 2.111, 0.0134,0.749,0.356),
  c("GO:0045351","type I interferon biosynthetic process", 0.002, 0.347, 6.406, 2.505, 0.0318,0.743,0.357),
  c("GO:0001821","histamine secretion", 0.001,-3.314, 2.812, 2.143, 0.0240,0.877,0.358),
  c("GO:0042321","negative regulation of circadian sleep/wake cycle, sleep", 0.001, 2.446, 5.266, 1.845, 0.0134,0.663,0.369),
  c("GO:0006744","ubiquinone biosynthetic process", 0.136,-5.223,-2.418, 4.242, 0.0396,0.786,0.389),
  c("GO:0009146","purine nucleoside triphosphate catabolic process", 0.035,-3.242,-4.729, 3.647, 0.0134,0.749,0.391),
  c("GO:0046085","adenosine metabolic process", 0.003,-4.584,-4.405, 2.524, 0.0266,0.804,0.409),
  c("GO:0060405","regulation of penile erection", 0.000, 1.798, 6.090, 1.716, 0.0160,0.701,0.410),
  c("GO:0045725","positive regulation of glycogen biosynthetic process", 0.003, 0.849,-3.136, 2.547, 0.0396,0.723,0.414),
  c("GO:1901642","nucleoside transmembrane transport", 0.047,-3.483, 2.842, 3.781, 0.0187,0.860,0.432),
  c("GO:0048702","embryonic neurocranium morphogenesis", 0.002, 0.142, 6.947, 2.444, 0.0187,0.711,0.433),
  c("GO:0048311","mitochondrion distribution", 0.025,-3.646, 1.645, 3.502, 0.0318,0.901,0.436),
  c("GO:0046060","dATP metabolic process", 0.001,-3.497,-5.142, 2.207, 0.0134,0.789,0.437),
  c("GO:1903071","positive regulation of ER-associated ubiquitin-dependent protein catabolic process", 0.001, 4.542,-2.446, 2.137, 0.0187,0.618,0.440),
  c("GO:0033327","Leydig cell differentiation", 0.002,-0.252, 6.634, 2.407, 0.0292,0.686,0.450),
  c("GO:0048541","Peyer's patch development", 0.002, 1.607, 6.672, 2.316, 0.0134,0.674,0.470),
  c("GO:0060368","regulation of Fc receptor mediated stimulatory signaling pathway", 0.001, 6.210, 1.102, 1.919, 0.0160,0.646,0.480),
  c("GO:0006351","transcription, DNA-templated",10.659,-3.806,-3.709, 6.136, 0.0041,0.852,0.480),
  c("GO:0072530","purine-containing compound transmembrane transport", 0.016,-4.166, 2.833, 3.304, 0.0213,0.934,0.483),
  c("GO:0072531","pyrimidine-containing compound transmembrane transport", 0.019,-4.073, 2.881, 3.391, 0.0422,0.934,0.489),
  c("GO:0070255","regulation of mucus secretion", 0.002, 1.155, 4.966, 2.504, 0.0240,0.662,0.494),
  c("GO:0038180","nerve growth factor signaling pathway", 0.001, 6.875,-1.582, 2.190, 0.0213,0.729,0.496),
  c("GO:0009168","purine ribonucleoside monophosphate biosynthetic process", 1.043,-3.650,-3.225, 5.127, 0.0136,0.734,0.509),
  c("GO:0033601","positive regulation of mammary gland epithelial cell proliferation", 0.002, 2.665, 4.905, 2.398, 0.0187,0.604,0.519),
  c("GO:0000122","negative regulation of transcription from RNA polymerase II promoter", 0.199, 1.681,-2.816, 4.408, 0.0439,0.725,0.526),
  c("GO:0001973","adenosine receptor signaling pathway", 0.005, 7.122,-0.404, 2.792, 0.0292,0.738,0.536),
  c("GO:0038063","collagen-activated tyrosine kinase receptor signaling pathway", 0.005, 6.816,-0.631, 2.810, 0.0213,0.742,0.537),
  c("GO:0008354","germ cell migration", 0.004,-0.730, 5.666, 2.729, 0.0213,0.700,0.552),
  c("GO:0071320","cellular response to cAMP", 0.007, 7.142,-2.642, 2.937, 0.0071,0.810,0.553),
  c("GO:0008277","regulation of G-protein coupled receptor protein signaling pathway", 0.024, 6.792, 0.170, 3.494, 0.0209,0.691,0.554),
  c("GO:2000178","negative regulation of neural precursor cell proliferation", 0.005, 4.025, 1.444, 2.838, 0.0499,0.775,0.556),
  c("GO:0071361","cellular response to ethanol", 0.003, 7.311,-2.794, 2.550, 0.0344,0.820,0.562),
  c("GO:0043650","dicarboxylic acid biosynthetic process", 0.530,-5.261,-1.661, 4.833, 0.0344,0.767,0.571),
  c("GO:0051412","response to corticosterone", 0.001, 6.485,-3.908, 2.053, 0.0422,0.848,0.572),
  c("GO:0034127","regulation of MyD88-independent toll-like receptor signaling pathway", 0.000, 6.487, 1.509, 1.531, 0.0213,0.663,0.590),
  c("GO:0002313","mature B cell differentiation involved in immune response", 0.003, 3.280, 4.691, 2.642, 0.0234,0.567,0.592),
  c("GO:0032261","purine nucleotide salvage", 0.059,-4.165,-4.110, 3.878, 0.0187,0.768,0.593),
  c("GO:0042118","endothelial cell activation", 0.002,-3.033, 0.342, 2.367, 0.0266,0.837,0.600),
  c("GO:0003139","secondary heart field specification", 0.002, 0.004, 7.063, 2.358, 0.0240,0.711,0.600),
  c("GO:0048387","negative regulation of retinoic acid receptor signaling pathway", 0.002, 6.096, 0.051, 2.394, 0.0213,0.681,0.601),
  c("GO:0043249","erythrocyte maturation", 0.002, 2.358, 5.650, 2.461, 0.0292,0.610,0.607),
  c("GO:0046130","purine ribonucleoside catabolic process", 0.036,-3.056,-4.878, 3.660, 0.0187,0.745,0.609),
  c("GO:0001829","trophectodermal cell differentiation", 0.003,-0.657, 6.646, 2.521, 0.0396,0.689,0.620),
  c("GO:0055015","ventricular cardiac muscle cell development", 0.003,-0.775, 6.758, 2.553, 0.0318,0.678,0.622),
  c("GO:0002819","regulation of adaptive immune response", 0.025, 6.335, 1.438, 3.513, 0.0184,0.673,0.642),
  c("GO:0051446","positive regulation of meiotic cell cycle", 0.007, 3.995, 2.576, 2.925, 0.0422,0.712,0.643),
  c("GO:0014807","regulation of somitogenesis", 0.002, 1.564, 6.051, 2.342, 0.0213,0.651,0.660),
  c("GO:0035414","negative regulation of catenin import into nucleus", 0.002, 1.162, 1.277, 2.497, 0.0266,0.750,0.669),
  c("GO:0018243","protein O-linked glycosylation via threonine", 0.001,-1.054,-6.012, 2.201, 0.0187,0.817,0.676),
  c("GO:0046654","tetrahydrofolate biosynthetic process", 0.101,-5.448,-2.197, 4.113, 0.0187,0.765,0.680),
  c("GO:0060340","positive regulation of type I interferon-mediated signaling pathway", 0.002, 6.123, 0.385, 2.412, 0.0213,0.608,0.680),
  c("GO:0046386","deoxyribose phosphate catabolic process", 0.023,-1.891,-6.345, 3.469, 0.0448,0.843,0.684),
  c("GO:2000059","negative regulation of protein ubiquitination involved in ubiquitin-dependent protein catabolic process", 0.003, 2.146,-4.195, 2.603, 0.0318,0.743,0.686),
  c("GO:0036066","protein O-linked fucosylation", 0.002,-0.988,-6.193, 2.307, 0.0370,0.815,0.689),
  c("GO:0039530","MDA-5 signaling pathway", 0.002, 4.143, 3.197, 2.346, 0.0240,0.527,0.698),
  c("GO:0071157","negative regulation of cell cycle arrest", 0.005, 3.360,-0.231, 2.804, 0.0473,0.687,0.699),
  c("GO:0035023","regulation of Rho protein signal transduction", 0.125, 6.365, 0.101, 4.206, 0.0400,0.660,0.699)
)

# Bold-text / black-border theme settings.
# NOTE(review): the name this theme was assigned to was lost from the source,
# so `revigo_theme` is a placeholder; rename it if other chunks refer to the
# original name. The plot below does not apply it (it uses theme_bw()).
revigo_theme <- theme(
  panel.border = element_rect(colour = "black", fill = NA, size = 2),
  plot.title = element_text(size = 16, face = "bold"),
  axis.text.y = element_text(size = 14, face = "bold", color = "black"),
  axis.text.x = element_text(size = 14, face = "bold", color = "black"),
  axis.title.y = element_text(size = 14, face = "bold"),
  axis.title.x = element_text(size = 14, face = "bold"),
  legend.text = element_text(size = 14, face = "bold"),
  legend.title = element_text(size = 14, face = "bold"),
  strip.text.x = element_text(size = 14, face = "bold"),
  strip.text.y = element_text(size = 14, face = "bold"),
  strip.background = element_rect(colour = "black", size = 2)
)

# Convert the character matrix to a data frame and drop terms that REVIGO
# exported without coordinates (marked with the literal string "null").
one.data <- data.frame(revigo.data, stringsAsFactors = FALSE)
names(one.data) <- revigo.names
one.data <- one.data[one.data$plot_X != "null" & one.data$plot_Y != "null", ]

# Every field is still character at this point; make the plotted ones numeric.
numeric_cols <- c("plot_X", "plot_Y", "plot_size", "uniqueness", "dispensability")
one.data[numeric_cols] <- lapply(one.data[numeric_cols], as.numeric)
# The REVIGO template names this column log10_p_value; it is a straight copy of
# `value`, which here ranges from 0 to 0.05 and is shown under the legend
# title "P value" (i.e. it appears to be untransformed - verify).
one.data$log10_p_value <- as.numeric(one.data$value)
# Numeric copy of "frequency_%" under a syntactic column name.
one.data$frequency <- as.numeric(one.data[["frequency_%"]])
# --------------------------------------------------------------------------

# This is a table indicating which labels you would like to plot (all data
# will be plotted, but you need to indicate whether the label should be
# displayed); make this table manually.

label1 <- c("GO:0070375","ERK5 cascade", 0.001, 3.865,-3.823, 2.041, 0.0134,0.729,0.303)

label2 <- c("GO:0060070","canonical Wnt signaling pathway", 0.061, 4.991,-1.442, 3.893, 0.0066,0.678,0.315)

label3 <- c("GO:0055015","ventricular cardiac muscle cell development", 0.003,-0.775, 6.758, 2.553, 0.0318,0.678,0.622)

# label4 is defined but was not part of the label table in the source.
label4 <- c("GO:0003139","secondary heart field specification", 0.002, 0.004, 7.063, 2.358, 0.0240,0.711,0.600)

ex <- data.frame(rbind(label1, label2, label3), stringsAsFactors = FALSE)
colnames(ex) <- c("term_ID","description","frequency_%","plot_X","plot_Y","plot_size","value","uniqueness","dispensability")
# Coordinates arrive as character (see the c() coercion above); convert once
# here instead of calling as.numeric(ex$...) inside aes().
ex$plot_X <- as.numeric(ex$plot_X)
ex$plot_Y <- as.numeric(ex$plot_Y)

# Scatterplot in REVIGO semantic space: fill encodes the p-value column and
# point size encodes plot_size; only the terms listed in `ex` get a label.
ggplot(data = one.data) +
  geom_point(
    aes(plot_X, plot_Y, fill = log10_p_value, size = plot_size),
    shape = 21, color = "black", stroke = 0.7, alpha = 0.8
  ) +
  scale_fill_gradient2(
    low = scales::muted("red"), mid = "white", high = scales::muted("blue")
  ) +
  guides(
    fill = guide_legend(title = "P value"),
    size = guide_legend(title = "No. of genes")
  ) +
  # scale_size(range = c(5, 20)) +
  # plot_X is mapped to the x axis and plot_Y to the y axis, so the axis titles
  # follow that mapping (the source had the two titles swapped).
  labs(x = "Semantic space x", y = "Semantic space y") +
  theme_bw() +
  ggrepel::geom_label_repel(
    data = ex,
    mapping = aes(plot_X, plot_Y, label = description),
    fontface = "bold", color = "black",
    box.padding = 0.6, point.padding = 1.6,
    size = 3,
    # Width of the line segments.
    segment.size = 0,
    # Strength of the repulsion force.
    force = 1
  )

## Revigo liver

# REVIGO scatterplot for the liver GO-enrichment results.
#
# Same four steps as the other REVIGO plot in this file: store the export as a
# character matrix, convert it to a data frame with numeric plotting columns,
# build the table of terms to label, and draw the scatterplot.
#
# NOTE(review): the assignment targets in this section were missing from the
# source; `revigo.data` / `one.data` follow the standard REVIGO R export and
# should be confirmed against the original script. ggplot2 must already be
# attached when this runs.

# Column names of the REVIGO table, in the order used by every row below.
revigo.names <- c(
  "term_ID", "description", "frequency_%", "plot_X", "plot_Y",
  "plot_size", "value", "uniqueness", "dispensability"
)

# One row per GO term. Each c() mixes strings and numbers, so every field is
# coerced to character and rbind() yields a character matrix.
revigo.data <- rbind(
  c("GO:0002576","platelet degranulation", 0.003, 0.496,-3.539, 2.519, 0.0000,0.842,0.000),
  c("GO:0008152","metabolic process",75.387, 0.813,-0.564, 6.986, 0.0308,0.998,0.000),
  c("GO:0009820","alkaloid metabolic process", 0.006, 4.043, 1.159, 2.869, 0.0000,0.947,0.000),
  c("GO:0042632","cholesterol homeostasis", 0.019,-3.975, 2.639, 3.381, 0.0000,0.818,0.000),
  c("GO:0019835","cytolysis", 0.044, 0.583,-0.452, 3.749, 0.0007,0.971,0.018),
  c("GO:0001887","selenium compound metabolic process", 0.008, 0.543,-0.357, 2.990, 0.0189,0.963,0.019),
  c("GO:0042157","lipoprotein metabolic process", 0.210, 0.683,-0.584, 4.431, 0.0116,0.957,0.028),
  c("GO:0017144","drug metabolic process", 0.058, 0.564,-0.386, 3.868, 0.0392,0.959,0.035),
  c("GO:0070989","oxidative demethylation", 0.011, 1.605, 0.368, 3.133, 0.0064,0.912,0.041),
  c("GO:0019740","nitrogen utilization", 0.085, 0.842,-0.775, 4.038, 0.0189,0.932,0.050),
  c("GO:0019695","choline metabolic process", 0.016, 0.978, 0.110, 3.301, 0.0060,0.962,0.063),
  c("GO:0048625","myoblast fate commitment", 0.001, 0.704,-6.082, 2.100, 0.0189,0.822,0.085),
  c("GO:0006368","transcription elongation from RNA polymerase II promoter", 0.082, 1.989, 1.876, 4.021, 0.0139,0.890,0.085),
  c("GO:0051081","nuclear envelope disassembly", 0.002, 0.688,-0.443, 2.338, 0.0116,0.883,0.087),
  c("GO:0006957","complement activation, alternative pathway", 0.000,-6.310, 2.907, 1.771, 0.0003,0.689,0.121),
  c("GO:0017187","peptidyl-glutamic acid carboxylation", 0.006,-0.167, 1.374, 2.865, 0.0011,0.918,0.125),
  c("GO:0006629","lipid metabolic process", 3.522, 3.786, 1.634, 5.655, 0.0144,0.876,0.126),
  c("GO:0034384","high-density lipoprotein particle clearance", 0.002,-3.947,-4.331, 2.294, 0.0001,0.733,0.128),
  c("GO:1904683","regulation of metalloendopeptidase activity", 0.001,-3.073, 3.701, 2.210, 0.0017,0.790,0.131),
  c("GO:0006641","triglyceride metabolic process", 0.038, 3.327, 1.871, 3.687, 0.0001,0.832,0.140),
  c("GO:0051647","nucleus localization", 0.012,-0.140,-3.521, 3.198, 0.0117,0.927,0.141),
  c("GO:0042738","exogenous drug catabolic process", 0.001,-1.097, 3.996, 2.193, 0.0009,0.834,0.156),
  c("GO:0070141","response to UV-A", 0.002,-3.392, 1.485, 2.369, 0.0017,0.918,0.166),
  c("GO:0006768","biotin metabolic process", 0.081, 5.718, 3.455, 4.018, 0.0007,0.805,0.167),
  c("GO:1901160","primary amino compound metabolic process", 0.015, 4.703, 1.279, 3.290, 0.0455,0.944,0.178),
  c("GO:0043627","response to estrogen", 0.010,-3.637, 1.577, 3.128, 0.0379,0.912,0.184),
  c("GO:0099133","ATP hydrolysis coupled anion transmembrane transport", 0.271,-0.029,-4.342, 4.541, 0.0152,0.919,0.184),
  c("GO:0010646","regulation of cell communication", 0.929,-6.450, 3.995, 5.076, 0.0173,0.784,0.190),
  c("GO:0007041","lysosomal transport", 0.017, 0.052,-3.377, 3.341, 0.0395,0.947,0.196),
  c("GO:0042158","lipoprotein biosynthetic process", 0.192, 0.957, 0.864, 4.391, 0.0189,0.919,0.199),
  c("GO:1990535","neuron projection maintenance", 0.000, 0.267,-0.657, 1.301, 0.0275,0.897,0.200),
  c("GO:0052652","cyclic purine nucleotide metabolic process", 0.094, 4.152, 4.182, 4.082, 0.0457,0.804,0.234),
  c("GO:0006390","transcription from mitochondrial promoter", 0.005, 0.802, 1.042, 2.794, 0.0484,0.915,0.235),
  c("GO:0006600","creatine metabolic process", 0.002, 5.427, 2.495, 2.328, 0.0374,0.857,0.244),
  c("GO:0042127","regulation of cell proliferation", 0.313,-5.699, 3.430, 4.603, 0.0229,0.785,0.259),
  c("GO:0016540","protein autoprocessing", 0.011,-0.432, 1.323, 3.147, 0.0191,0.924,0.274),
  c("GO:0006476","protein deacetylation", 0.072,-0.361, 1.247, 3.967, 0.0455,0.913,0.278),
  c("GO:0055114","oxidation-reduction process",15.060, 4.858, 2.263, 6.286, 0.0206,0.872,0.300),
  c("GO:0015886","heme transport", 0.066,-0.143,-4.692, 3.927, 0.0044,0.860,0.302),
  c("GO:0006461","protein complex assembly", 0.960, 0.086,-0.705, 5.091, 0.0285,0.920,0.312),
  c("GO:0060052","neurofilament cytoskeleton organization", 0.002, 1.098,-0.364, 2.501, 0.0374,0.883,0.319),
  c("GO:0010918","positive regulation of mitochondrial membrane potential", 0.001,-2.305, 1.655, 2.164, 0.0044,0.851,0.327),
  c("GO:0033572","transferrin transport", 0.002,-0.385,-3.961, 2.449, 0.0180,0.915,0.333),
  c("GO:0006524","alanine catabolic process", 0.025, 5.584, 3.621, 3.509, 0.0009,0.800,0.338),
  c("GO:0097267","omega-hydroxylase P450 pathway", 0.000, 4.727, 2.654, 1.000, 0.0017,0.851,0.339),
  c("GO:0019627","urea metabolic process", 0.051, 4.765, 2.756, 3.820, 0.0455,0.846,0.339),
  c("GO:1903830","magnesium ion transmembrane transport", 0.088, 0.021,-4.086, 4.053, 0.0339,0.938,0.340),
  c("GO:1904179","positive regulation of adipose tissue development", 0.001,-5.562,-3.251, 1.996, 0.0009,0.657,0.344),
  c("GO:0007584","response to nutrient", 0.026,-3.941, 1.599, 3.530, 0.0010,0.865,0.345),
  c("GO:0090400","stress-induced premature senescence", 0.002,-4.185,-2.548, 2.350, 0.0484,0.752,0.346),
  c("GO:0042908","xenobiotic transport", 0.028,-0.145,-4.010, 3.556, 0.0064,0.876,0.348),
  c("GO:0060021","palate development", 0.018,-0.008,-5.732, 3.363, 0.0445,0.883,0.355),
  c("GO:0033860","regulation of NAD(P)H oxidase activity", 0.001,-3.702, 4.403, 2.057, 0.0275,0.831,0.356),
  c("GO:0045725","positive regulation of glycogen biosynthetic process", 0.003,-0.905, 5.340, 2.547, 0.0039,0.686,0.357),
  c("GO:0001907","killing by symbiont of host cells", 0.008,-3.276, 2.257, 3.001, 0.0009,0.818,0.362),
  c("GO:0016310","phosphorylation", 7.764, 2.492, 2.058, 5.998, 0.0064,0.912,0.371),
  c("GO:0050892","intestinal absorption", 0.006,-0.941,-7.157, 2.913, 0.0016,0.782,0.379),
  c("GO:1900107","regulation of nodal signaling pathway", 0.002,-6.525, 3.443, 2.316, 0.0275,0.740,0.380),
  c("GO:0008090","retrograde axonal transport", 0.003, 0.413,-4.290, 2.521, 0.0374,0.827,0.390),
  c("GO:0008203","cholesterol metabolic process", 0.028, 5.004, 2.844, 3.554, 0.0004,0.835,0.402),
  c("GO:0070301","cellular response to hydrogen peroxide", 0.019,-5.078, 2.109, 3.397, 0.0023,0.823,0.402),
  c("GO:0007628","adult walking behavior", 0.008,-0.864,-5.875, 3.000, 0.0288,0.814,0.411),
  c("GO:0043433","negative regulation of sequence-specific DNA binding transcription factor activity", 0.031,-3.638, 4.535, 3.600, 0.0023,0.715,0.412),
  c("GO:0051340","regulation of ligase activity", 0.002,-2.775, 3.103, 2.391, 0.0455,0.849,0.421),
  c("GO:0097190","apoptotic signaling pathway", 0.117,-4.388, 4.477, 4.177, 0.0357,0.702,0.427),
  c("GO:0006869","lipid transport", 0.270,-0.359,-4.931, 4.539, 0.0084,0.825,0.430),
  c("GO:0045717","negative regulation of fatty acid biosynthetic process", 0.007, 0.731, 5.462, 2.935, 0.0030,0.667,0.434),
  c("GO:0051004","regulation of lipoprotein lipase activity", 0.003,-2.788, 2.773, 2.587, 0.0089,0.840,0.435),
  c("GO:0006536","glutamate metabolic process", 0.201, 5.539, 3.254, 4.412, 0.0020,0.816,0.441),
  c("GO:0018279","protein N-linked glycosylation via asparagine", 0.015, 1.838, 3.560, 3.284, 0.0410,0.833,0.446),
  c("GO:0046185","aldehyde catabolic process", 0.048, 4.214, 2.777, 3.790, 0.0064,0.832,0.451),
  c("GO:0032071","regulation of endodeoxyribonuclease activity", 0.003,-3.421, 4.017, 2.537, 0.0374,0.791,0.451),
  c("GO:0008202","steroid metabolic process", 0.161, 3.336, 1.762, 4.315, 0.0005,0.851,0.451),
  c("GO:0071156","regulation of cell cycle arrest", 0.013,-2.547, 3.556, 3.230, 0.0275,0.745,0.452),
  c("GO:0071372","cellular response to follicle-stimulating hormone stimulus", 0.001,-4.403, 1.848, 2.220, 0.0118,0.859,0.460),
  c("GO:0042940","D-amino acid transport", 0.003,-0.063,-4.288, 2.562, 0.0275,0.873,0.471),
  c("GO:1903427","negative regulation of reactive oxygen species biosynthetic process", 0.002,-3.996, 3.252, 2.486, 0.0044,0.777,0.477),
  c("GO:0042493","response to drug", 0.266,-5.108, 2.172, 4.534, 0.0449,0.863,0.477),
  c("GO:0001889","liver development", 0.023,-1.101,-6.479, 3.471, 0.0009,0.766,0.478),
  c("GO:0006545","glycine biosynthetic process", 0.079, 5.573, 3.375, 4.005, 0.0275,0.814,0.479),
  c("GO:0019216","regulation of lipid metabolic process", 0.095,-2.218, 5.684, 4.086, 0.0052,0.745,0.482),
  c("GO:0006591","ornithine metabolic process", 0.088, 5.478, 3.118, 4.052, 0.0484,0.825,0.483),
  c("GO:0046838","phosphorylated carbohydrate dephosphorylation", 0.064, 1.908, 2.032, 3.915, 0.0455,0.926,0.484),
  c("GO:0006739","NADP metabolic process", 0.357, 4.701, 4.332, 4.661, 0.0063,0.793,0.485),
  c("GO:0006520","cellular amino acid metabolic process", 5.591, 5.069, 3.403, 5.856, 0.0148,0.779,0.487),
  c("GO:2000343","positive regulation of chemokine (C-X-C motif) ligand 2 production", 0.001,-5.534,-2.610, 1.959, 0.0275,0.680,0.489),
  c("GO:0021814","cell motility involved in cerebral cortex radial glia guided migration", 0.001,-0.848,-6.605, 2.238, 0.0189,0.729,0.492),
  c("GO:0022900","electron transport chain", 0.564, 3.324, 2.185, 4.860, 0.0186,0.848,0.493),
  c("GO:0090277","positive regulation of peptide hormone secretion", 0.013,-4.678, 0.230, 3.226, 0.0004,0.601,0.496),
  c("GO:0015942","formate metabolic process", 0.065, 5.321, 3.235, 3.921, 0.0017,0.832,0.499),
  c("GO:0046329","negative regulation of JNK cascade", 0.007,-4.599, 5.445, 2.940, 0.0063,0.605,0.500),
  c("GO:0001503","ossification", 0.074,-0.710,-6.573, 3.979, 0.0413,0.791,0.504),
  c("GO:0006898","receptor-mediated endocytosis", 0.095, 0.278,-4.169, 4.086, 0.0004,0.935,0.511),
  c("GO:0090239","regulation of histone H4 acetylation", 0.003,-3.175, 3.088, 2.531, 0.0455,0.769,0.511),
  c("GO:0060059","embryonic retina morphogenesis in camera-type eye", 0.003,-0.909,-6.515, 2.573, 0.0029,0.790,0.512),
  c("GO:1902459","positive regulation of stem cell population maintenance", 0.001,-4.906,-2.513, 2.236, 0.0275,0.663,0.517),
  c("GO:1902959","regulation of aspartic-type endopeptidase activity involved in amyloid precursor protein catabolic process", 0.000,-2.854, 3.852, 1.756, 0.0455,0.802,0.517),
  c("GO:0031100","animal organ regeneration", 0.005,-1.364,-6.064, 2.792, 0.0402,0.788,0.526),
  c("GO:0061620","glycolytic process through glucose-6-phosphate", 0.002, 5.004, 4.281, 2.290, 0.0455,0.798,0.529),
  c("GO:0002679","respiratory burst involved in defense response", 0.001,-3.703, 1.450, 2.258, 0.0374,0.816,0.535),
  c("GO:0034504","protein localization to nucleus", 0.129,-0.313,-4.647, 4.218, 0.0210,0.899,0.539),
  c("GO:0014911","positive regulation of smooth muscle cell migration", 0.003,-5.348,-0.209, 2.620, 0.0461,0.695,0.540),
  c("GO:0061138","morphogenesis of a branching epithelium", 0.042,-1.117,-6.445, 3.730, 0.0021,0.775,0.541),
  c("GO:0010793","regulation of mRNA export from nucleus", 0.003,-3.669,-1.160, 2.625, 0.0275,0.749,0.541),
  c("GO:0072049","comma-shaped body morphogenesis", 0.001,-1.363,-5.960, 2.173, 0.0189,0.801,0.543),
  c("GO:0046498","S-adenosylhomocysteine metabolic process", 0.066, 5.725, 3.823, 3.925, 0.0275,0.808,0.544),
  c("GO:0045620","negative regulation of lymphocyte differentiation", 0.008,-3.807,-2.279, 3.018, 0.0029,0.590,0.549),
  c("GO:0019626","short-chain fatty acid catabolic process", 0.024, 5.002, 3.731, 3.490, 0.0189,0.779,0.556),
  c("GO:0034356","NAD biosynthesis via nicotinamide riboside salvage pathway", 0.004, 4.983, 4.281, 2.691, 0.0235,0.828,0.560),
  c("GO:0046620","regulation of organ growth", 0.020,-4.335,-3.406, 3.403, 0.0044,0.688,0.561),
  c("GO:0006778","porphyrin-containing compound metabolic process", 0.457, 5.545, 2.444, 4.768, 0.0453,0.896,0.561),
  c("GO:0010269","response to selenium ion", 0.001,-3.417, 1.446, 1.991, 0.0189,0.892,0.564),
  c("GO:0090335","regulation of brown fat cell differentiation", 0.003,-3.134,-2.585, 2.531, 0.0274,0.735,0.566),
  c("GO:0000098","sulfur amino acid catabolic process", 0.008, 5.398, 3.462, 3.030, 0.0064,0.815,0.566),
  c("GO:1905668","positive regulation of protein localization to endosome", 0.001,-4.713,-0.861, 2.079, 0.0275,0.732,0.569),
  c("GO:0031016","pancreas development", 0.021,-1.275,-6.229, 3.438, 0.0453,0.774,0.573),
  c("GO:0071397","cellular response to cholesterol", 0.001,-4.311, 1.853, 2.272, 0.0191,0.857,0.574),
  c("GO:0060712","spongiotrophoblast layer development", 0.003,-1.057,-6.380, 2.533, 0.0191,0.790,0.578),
  c("GO:0031659","positive regulation of cyclin-dependent protein serine/threonine kinase activity involved in G1/S transition of mitotic cell cycle", 0.002,-3.538, 4.926, 2.350, 0.0275,0.670,0.578),
  c("GO:1903896","positive regulation of IRE1-mediated unfolded protein response", 0.001,-6.708, 3.143, 1.857, 0.0275,0.671,0.580),
  c("GO:0071560","cellular response to transforming growth factor beta stimulus", 0.050,-4.466, 1.856, 3.804, 0.0127,0.832,0.582),
  c("GO:0035733","hepatic stellate cell activation", 0.000, 0.492,-0.383, 1.748, 0.0455,0.898,0.584),
  c("GO:0034763","negative regulation of transmembrane transport", 0.014,-4.429,-0.887, 3.251, 0.0274,0.743,0.585),
  c("GO:0042167","heme catabolic process", 0.002, 5.014, 2.712, 2.408, 0.0374,0.834,0.586),
  c("GO:0006853","carnitine shuttle", 0.000,-0.241,-4.610, 1.114, 0.0089,0.860,0.587),
  c("GO:0007411","axon guidance", 0.066,-3.249,-3.116, 3.930, 0.0223,0.617,0.587),
  c("GO:0048013","ephrin receptor signaling pathway", 0.016,-6.783, 3.560, 3.308, 0.0309,0.752,0.593),
  c("GO:0034340","response to type I interferon", 0.008,-5.227, 1.865, 3.007, 0.0117,0.821,0.598),
  c("GO:0031325","positive regulation of cellular metabolic process", 1.004,-6.818, 4.034, 5.110, 0.0233,0.668,0.602),
  c("GO:0042177","negative regulation of protein catabolic process", 0.025,-2.311, 5.307, 3.513, 0.0177,0.698,0.606),
  c("GO:1900016","negative regulation of cytokine production involved in inflammatory response", 0.002,-5.942,-1.181, 2.391, 0.0191,0.603,0.606),
  c("GO:2000463","positive regulation of excitatory postsynaptic potential", 0.003,-6.002, 3.548, 2.606, 0.0220,0.638,0.607),
  c("GO:0098902","regulation of membrane depolarization during action potential", 0.001,-3.098, 2.354, 2.188, 0.0455,0.827,0.608),
  c("GO:1902237","positive regulation of endoplasmic reticulum stress-induced intrinsic apoptotic signaling pathway", 0.002,-6.892, 3.889, 2.324, 0.0089,0.647,0.617),
  c("GO:0008635","activation of cysteine-type endopeptidase activity involved in apoptotic process by cytochrome c", 0.001,-5.340, 4.602, 2.279, 0.0484,0.665,0.619),
  c("GO:2000271","positive regulation of fibroblast apoptotic process", 0.002,-6.128, 4.110, 2.320, 0.0374,0.726,0.621),
  c("GO:0050730","regulation of peptidyl-tyrosine phosphorylation", 0.045,-2.927, 5.206, 3.759, 0.0115,0.746,0.627),
  c("GO:0014068","positive regulation of phosphatidylinositol 3-kinase signaling", 0.013,-6.835, 3.378, 3.216, 0.0477,0.656,0.627),
  c("GO:0032148","activation of protein kinase B activity", 0.004,-3.889, 4.818, 2.738, 0.0411,0.689,0.628),
  c("GO:0000122","negative regulation of transcription from RNA polymerase II promoter", 0.199,-3.286, 4.570, 4.408, 0.0343,0.704,0.628),
  c("GO:2000659","regulation of interleukin-1-mediated signaling pathway", 0.001,-6.610, 3.398, 2.117, 0.0275,0.727,0.629),
  c("GO:0043392","negative regulation of DNA binding", 0.014,-3.451, 2.990, 3.256, 0.0324,0.830,0.631),
  c("GO:0042426","choline catabolic process", 0.001, 4.091, 2.217, 2.230, 0.0275,0.898,0.632),
  c("GO:1900119","positive regulation of execution phase of apoptosis", 0.003,-5.254, 3.939, 2.528, 0.0152,0.720,0.635),
  c("GO:0046487","glyoxylate metabolic process", 0.049, 5.512, 3.224, 3.794, 0.0484,0.832,0.635),
  c("GO:0030917","midbrain-hindbrain boundary development", 0.003,-0.916,-6.603, 2.576, 0.0064,0.776,0.636),
  c("GO:0031663","lipopolysaccharide-mediated signaling pathway", 0.010,-6.114, 3.001, 3.128, 0.0363,0.713,0.638),
  c("GO:1901679","nucleotide transmembrane transport", 0.011,-0.193,-4.465, 3.131, 0.0374,0.862,0.638),
  c("GO:0032933","SREBP signaling pathway", 0.008,-6.008, 4.192, 2.989, 0.0484,0.656,0.640),
  c("GO:2000646","positive regulation of receptor catabolic process", 0.001,-2.717, 5.596, 1.881, 0.0189,0.731,0.642),
  c("GO:0071276","cellular response to cadmium ion", 0.009,-4.925, 2.123, 3.077, 0.0040,0.848,0.644),
  c("GO:0000060","protein import into nucleus, translocation", 0.012,-0.358,-4.229, 3.175, 0.0286,0.853,0.645),
  c("GO:0006548","histidine catabolic process", 0.052, 5.484, 3.853, 3.828, 0.0044,0.789,0.649),
  c("GO:0034638","phosphatidylcholine catabolic process", 0.002, 4.403, 3.693, 2.328, 0.0374,0.793,0.652),
  c("GO:1901523","icosanoid catabolic process", 0.000, 5.088, 3.154, 1.732, 0.0189,0.841,0.653),
  c("GO:0006559","L-phenylalanine catabolic process", 0.031, 5.469, 3.690, 3.596, 0.0118,0.794,0.657),
  c("GO:0051642","centrosome localization", 0.007,-0.128,-3.483, 2.973, 0.0190,0.928,0.658),
  c("GO:0010040","response to iron(II) ion", 0.002,-4.034, 1.687, 2.407, 0.0189,0.886,0.658),
  c("GO:0000042","protein targeting to Golgi", 0.021,-0.296,-4.424, 3.422, 0.0374,0.900,0.670),
  c("GO:0090201","negative regulation of release of cytochrome c from mitochondria", 0.003,-5.536, 3.408, 2.591, 0.0285,0.651,0.672),
  c("GO:0006855","drug transmembrane transport", 0.189,-4.897,-2.034, 4.384, 0.0138,0.752,0.672),
  c("GO:0009887","animal organ morphogenesis", 0.264,-1.342,-6.260, 4.530, 0.0333,0.742,0.673),
  c("GO:0006879","cellular iron ion homeostasis", 0.110,-1.935, 4.780, 4.148, 0.0002,0.750,0.674),
  c("GO:0030178","negative regulation of Wnt signaling pathway", 0.037,-5.011, 4.290, 3.681, 0.0367,0.636,0.676),
  c("GO:0007262","STAT protein import into nucleus", 0.001,-5.800,-0.845, 2.223, 0.0484,0.729,0.677),
  c("GO:0045739","positive regulation of DNA repair", 0.013,-5.991, 3.701, 3.205, 0.0123,0.635,0.678),
  c("GO:0034142","toll-like receptor 4 signaling pathway", 0.006,-6.777, 3.183, 2.892, 0.0191,0.642,0.679),
  c("GO:0046326","positive regulation of glucose import", 0.007,-6.120,-0.943, 2.979, 0.0287,0.694,0.680),
  c("GO:0042773","ATP synthesis coupled electron transport", 0.221, 4.104, 4.074, 4.452, 0.0456,0.794,0.685),
  c("GO:0010886","positive regulation of cholesterol storage", 0.002,-5.084,-0.414, 2.320, 0.0374,0.711,0.685),
  c("GO:0001568","blood vessel development", 0.136,-1.287,-6.290, 4.243, 0.0452,0.758,0.689),
  c("GO:0006505","GPI anchor metabolic process", 0.102, 3.442, 3.385, 4.115, 0.0456,0.805,0.690),
  c("GO:0046439","L-cysteine metabolic process", 0.039, 6.129, 3.195, 3.699, 0.0374,0.827,0.692),
  c("GO:0051897","positive regulation of protein kinase B signaling", 0.016,-6.848, 3.394, 3.304, 0.0485,0.653,0.692),
  c("GO:0032287","peripheral nervous system myelin maintenance", 0.002,-0.055,-6.738, 2.468, 0.0374,0.750,0.693),
  c("GO:1904468","negative regulation of tumor necrosis factor secretion", 0.001,-3.544,-4.697, 1.982, 0.0374,0.625,0.695),
  c("GO:1903874","ferrous iron transmembrane transport", 0.028, 0.089,-4.022, 3.563, 0.0374,0.931,0.700)
)

# Convert the character matrix to a data frame and drop terms that REVIGO
# exported without coordinates (marked with the literal string "null").
one.data <- data.frame(revigo.data, stringsAsFactors = FALSE)
names(one.data) <- revigo.names
one.data <- one.data[one.data$plot_X != "null" & one.data$plot_Y != "null", ]

# Every field is still character at this point; make the plotted ones numeric.
numeric_cols <- c("plot_X", "plot_Y", "plot_size", "uniqueness", "dispensability")
one.data[numeric_cols] <- lapply(one.data[numeric_cols], as.numeric)
# The REVIGO template names this column log10_p_value; it is a straight copy of
# `value`, which here ranges from 0 to 0.05 and is shown under the legend
# title "P value" (i.e. it appears to be untransformed - verify).
one.data$log10_p_value <- as.numeric(one.data$value)
# Numeric copy of "frequency_%" under a syntactic column name.
one.data$frequency <- as.numeric(one.data[["frequency_%"]])
# --------------------------------------------------------------------------

# This is a table indicating which labels you would like to plot (all data
# will be plotted, but you need to indicate whether the label should be
# displayed); make this table manually.

label1 <- c("GO:0042632","cholesterol homeostasis", 0.019,-3.975, 2.639, 3.381, 0.0000,0.818,0.000)

label2 <- c("GO:0017144","drug metabolic process", 0.058, 0.564,-0.386, 3.868, 0.0392,0.959,0.035)

label3 <- c("GO:0006629","lipid metabolic process", 3.522, 3.786, 1.634, 5.655, 0.0144,0.876,0.126)

ex <- data.frame(rbind(label1, label2, label3), stringsAsFactors = FALSE)
colnames(ex) <- c("term_ID","description","frequency_%","plot_X","plot_Y","plot_size","value","uniqueness","dispensability")
# Coordinates arrive as character (see the c() coercion above); convert once
# here instead of calling as.numeric(ex$...) inside aes().
ex$plot_X <- as.numeric(ex$plot_X)
ex$plot_Y <- as.numeric(ex$plot_Y)

# Scatterplot in REVIGO semantic space: fill encodes the p-value column and
# point size encodes plot_size; only the terms listed in `ex` get a label.
ggplot(data = one.data) +
  geom_point(
    aes(plot_X, plot_Y, fill = log10_p_value, size = plot_size),
    shape = 21, color = "black", stroke = 0.7, alpha = 0.8
  ) +
  scale_fill_gradient2(
    low = scales::muted("red"), mid = "white", high = scales::muted("blue")
  ) +
  guides(
    fill = guide_legend(title = "P value"),
    size = guide_legend(title = "No. of genes")
  ) +
  # scale_size(range = c(5, 20)) +
  # plot_X is mapped to the x axis and plot_Y to the y axis, so the axis titles
  # follow that mapping (the source had the two titles swapped).
  labs(x = "Semantic space x", y = "Semantic space y") +
  theme_bw() +
  ggrepel::geom_label_repel(
    data = ex,
    mapping = aes(plot_X, plot_Y, label = description),
    fontface = "bold", color = "black",
    box.padding = 0.6, point.padding = 1.6,
    size = 3,
    # Width of the line segments.
    segment.size = 0,
    # Strength of the repulsion force.
    force = 1
  )