@@ -12,6 +12,8 @@ gencode-hg19: gencode.v19.annotation.genes.id4.bed
1212
1313gencode-hg38 : gencode.v27.annotation.genes.bed
1414
15+ gencode-hg38v41 : gencode.v41.annotation.genes.bed
16+
1517ensembl-hg19 : Homo_sapiens.GRCh37.82.chr.bed
1618
1719ensembl-hg38 : Homo_sapiens.GRCh38.91.chr.bed
@@ -35,11 +37,16 @@ gencode.v19.annotation.genes.id4.bed: gencode.v19.annotation.genes.bed
3537# ~~~~~ GENCODE hg38 ~~~~~ #
3638# generate the Gencode hg38 annotations .bed file
3739gencode.v27.annotation.gtf.gz :
38- wget ftp://ftp.sanger.ac.uk/pub/gencode/Gencode_human/release_27/gencode.v27.annotation.gtf.gz
40+ wget ftp://ftp.ebi.ac.uk/pub/databases/gencode/Gencode_human/release_27/gencode.v27.annotation.gtf.gz
3941
4042gencode.v27.annotation.genes.bed : gencode.v27.annotation.gtf.gz
41- zcat gencode.v27.annotation.gtf.gz | grep -w gene | convert2bed --input=gtf - > gencode.v27.annotation.genes.bed
43+ zcat gencode.v27.annotation.gtf.gz | grep -w gene | awk ' { if ($$0 ~ "transcript_id") print $$0; else print $$0" transcript_id \"\";"; }' | convert2bed --input=gtf - > gencode.v27.annotation.genes.bed
44+
45+ gencode.v41.annotation.gtf.gz :
46+ wget ftp://ftp.ebi.ac.uk/pub/databases/gencode/Gencode_human/release_41/gencode.v41.annotation.gtf.gz
4247
48+ gencode.v41.annotation.genes.bed : gencode.v41.annotation.gtf.gz
49+ zcat gencode.v41.annotation.gtf.gz | grep -w gene | awk ' { if ($$0 ~ "transcript_id") print $$0; else print $$0" transcript_id \"\";"; }' | convert2bed --input=gtf - > gencode.v41.annotation.genes.bed
4350
4451
4552# ~~~~~ ENSEMBL hg19 ~~~~~ #
@@ -102,6 +109,7 @@ Mus_musculus.GRCm38.91.chr.bed: Mus_musculus.GRCm38.91.chr.gtf
102109 Homo_sapiens.GRCh37.82.noGLMT.chr.bed \
103110 Homo_sapiens.GRCh37.82.noGLMT.chr.gtf \
104111 gencode.v27.annotation.gtf.gz \
112+ gencode.v41.annotation.gtf.gz \
105113 Homo_sapiens.GRCh38.91.chr.gtf \
106114 Homo_sapiens.GRCh38.91.chr.gtf.gz \
107115 Homo_sapiens.GRCh37.82.chr.gtf \
0 commit comments