-
Notifications
You must be signed in to change notification settings - Fork 155
Expand file tree
/
Copy pathgtf.yaml
More file actions
20 lines (20 loc) · 824 Bytes
/
gtf.yaml
File metadata and controls
20 lines (20 loc) · 824 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
# Ensembl release 78 GTF annotation for hg38 (GRCh38)
# Cleans the GTF file by converting Ensembl chromosome names to UCSC-style names
# Uses https://github.com/dpryan79/ChromosomeMappings to remap the chromosome names
---
attributes:
  name: gtf
  version: 78
recipe:
  full:
    recipe_type: bash
    # Downloads the Ensembl release-78 GTF, rewrites the sequence names in
    # column 1 using the Ensembl-to-UCSC mapping table, drops records whose
    # (remapped) sequence name ends in "_alt", and writes rnaseq/hg38.gtf.
    recipe_cmds:
      - |
        url=http://ftp.ensembl.org/pub/release-78/gtf/homo_sapiens/Homo_sapiens.GRCh38.78.gtf.gz
        remap_url=http://raw.githubusercontent.com/dpryan79/ChromosomeMappings/master/GRCh38_ensembl2UCSC.txt
        mkdir -p rnaseq
        # Turn every "ensembl_name ucsc_name" pair that differs into a sed rule.
        # Each rule is anchored to the whole first field (line start up to the
        # tab; awk expands "\t" to a literal tab) and dots in the name are
        # matched literally, so a name can never rewrite a longer name that
        # merely starts with it.
        wget --no-check-certificate -qO- "$remap_url" \
          | awk '$1 != $2 { from = $1; gsub(/\./, "[.]", from); print "s/^" from "\t/" $2 "\t/" }' \
          > remap.sed
        # Filter on column 1 only. The previous grep pattern "*_*_alt" was a
        # shell glob, not a regex: grep treated the leading "*" as a literal
        # asterisk, so no alt-contig record was ever removed. Header lines
        # ("#!...") have no tab and do not end in "_alt", so they are kept.
        wget --no-check-certificate -qO- "$url" \
          | gunzip \
          | sed -f remap.sed \
          | awk -F '\t' '$1 !~ /_alt$/' \
          > rnaseq/hg38.gtf
        rm remap.sed
    recipe_outfiles:
      - rnaseq/hg38.gtf