5
5
none :
6
6
7
7
# make all sets of annotations
8
- all : gencode ensembl gencode-hg38 ensembl-hg38
8
+ all : gencode-hg19 ensembl-hg19 gencode-hg38 ensembl-hg38
9
9
10
10
11
11
# ~~~~~ GENCODE hg19 ~~~~~ #
12
12
# generate the Gencode hg19 annotations .bed file
13
- gencode : gencode.v19.annotation.genes.bed
13
+ gencode-hg19 : gencode.v19.annotation.genes.bed
14
14
15
15
gencode.v19.annotation.gtf.gz :
16
16
wget ftp://ftp.sanger.ac.uk/pub/gencode/Gencode_human/release_19/gencode.v19.annotation.gtf.gz
@@ -36,27 +36,20 @@ gencode.v27.annotation.genes.bed: gencode.v27.annotation.gtf.gz
36
36
37
37
# ~~~~~ ENSEMBL hg19 ~~~~~ #
38
38
# generate the Ensembl hg19 annotations .bed file
39
- ensembl : Homo_sapiens.GRCh37.82.noGLMT.chr.genes.bed
39
+ ensembl-hg19 : Homo_sapiens.GRCh37.82.chr.bed
40
40
41
- Homo_sapiens.GRCh37.82.gtf.gz :
42
- wget ftp://ftp.ensembl.org/pub/grch37/release-84/gtf/homo_sapiens/Homo_sapiens.GRCh37.82.gtf.gz
41
+ Homo_sapiens.GRCh37.82.chr.gtf.gz :
42
+ wget ftp://ftp.ensembl.org/pub/grch37/release-84/gtf/homo_sapiens/Homo_sapiens.GRCh37.82.chr.gtf.gz
43
43
44
- # Need to filter out the GL, MT entries
45
- Homo_sapiens.GRCh37.82.noGLMT.gtf : Homo_sapiens.GRCh37.82.gtf.gz
46
- zcat Homo_sapiens.GRCh37.82.gtf.gz | grep -Ev "^#|^GL|^M" > Homo_sapiens.GRCh37.82.noGLMT.gtf
47
-
48
- # need to add 'chr' to the start of each 1st entry
49
- Homo_sapiens.GRCh37.82.noGLMT.chr.gtf : Homo_sapiens.GRCh37.82.noGLMT.gtf
50
- cat Homo_sapiens.GRCh37.82.noGLMT.gtf | sed 's/^/chr/' > Homo_sapiens.GRCh37.82.noGLMT.chr.gtf
44
+ # remove comment lines
45
+ # extract only 'gene' entries
46
+ # add 'chr' to first entry, change 'chrMT' to 'chrM'
47
+ Homo_sapiens.GRCh37.82.chr.gtf : Homo_sapiens.GRCh37.82.chr.gtf.gz
48
+ zcat Homo_sapiens.GRCh37.82.chr.gtf.gz | grep -Ev '^#' | grep -w 'gene' | sed -e 's/^/chr/' -e 's/^chrMT/chrM/' > Homo_sapiens.GRCh37.82.chr.gtf
51
49
52
50
# convert to .bed
53
- Homo_sapiens.GRCh37.82.noGLMT.chr.bed : Homo_sapiens.GRCh37.82.noGLMT.chr.gtf
54
- gtf2bed < Homo_sapiens.GRCh37.82.noGLMT.chr.gtf > Homo_sapiens.GRCh37.82.noGLMT.chr.bed
55
-
56
- # extract genes
57
- Homo_sapiens.GRCh37.82.noGLMT.chr.genes.bed : Homo_sapiens.GRCh37.82.noGLMT.chr.bed
58
- grep -w gene Homo_sapiens.GRCh37.82.noGLMT.chr.bed > Homo_sapiens.GRCh37.82.noGLMT.chr.genes.bed
59
-
51
+ Homo_sapiens.GRCh37.82.chr.bed : Homo_sapiens.GRCh37.82.chr.gtf
52
+ gtf2bed < Homo_sapiens.GRCh37.82.chr.gtf > Homo_sapiens.GRCh37.82.chr.bed
60
53
61
54
62
55
@@ -86,6 +79,8 @@ Homo_sapiens.GRCh38.91.chr.bed: Homo_sapiens.GRCh38.91.chr.gtf
86
79
Homo_sapiens.GRCh37.82.noGLMT.chr.gtf \
87
80
gencode.v27.annotation.gtf.gz \
88
81
Homo_sapiens.GRCh38.91.chr.gtf \
89
- Homo_sapiens.GRCh38.91.chr.gtf.gz
82
+ Homo_sapiens.GRCh38.91.chr.gtf.gz \
83
+ Homo_sapiens.GRCh37.82.chr.gtf \
84
+ Homo_sapiens.GRCh37.82.chr.gtf.gz
90
85
91
86
0 commit comments