File tree 32 files changed +45
-45
lines changed
32 files changed +45
-45
lines changed Original file line number Diff line number Diff line change @@ -11,7 +11,7 @@ recipe:
11
11
recipe_cmds :
12
12
- |
13
13
release=20170905
14
- baseurl=ftp ://ftp.ncbi.nlm.nih.gov/pub/clinvar/vcf_GRCh37/archive_2.0/2017/clinvar_${release}.vcf.gz
14
+ baseurl=http ://ftp.ncbi.nlm.nih.gov/pub/clinvar/vcf_GRCh37/archive_2.0/2017/clinvar_${release}.vcf.gz
15
15
mkdir -p variation
16
16
wget -c -O variation/clinvar-orig.vcf.gz $baseurl
17
17
[[ -f variation/clinvar.vcf.gz ]] || zcat variation/clinvar-orig.vcf.gz | bgzip -c > variation/clinvar.vcf.gz
Original file line number Diff line number Diff line change @@ -11,7 +11,7 @@ recipe:
11
11
version=150
12
12
org=human_9606_b${version}_GRCh37p13
13
13
release=20170710
14
- url=ftp ://ftp.ncbi.nih.gov/snp/organisms/$org/VCF/GATK/All_${release}.vcf.gz
14
+ url=http ://ftp.ncbi.nih.gov/snp/organisms/$org/VCF/GATK/All_${release}.vcf.gz
15
15
mkdir -p variation
16
16
wget -c -O variation/dbsnp-$version-orig.vcf.gz $url
17
17
[[ -f variation/dbsnp-$version.vcf.gz ]] || zcat variation/dbsnp-$version-orig.vcf.gz | sed "s/^chrM/MT/g" | sed "s/^chr//g" | bgzip -c > variation/dbsnp-$version.vcf.gz
Original file line number Diff line number Diff line change 1
1
# Truth set for NA12878/NA24385 somatic mixture
2
- # ftp://ftp-trace.ncbi.nlm.nih.gov/giab/ftp/use_cases/mixtures/UMCUTRECHT_NA12878_NA24385_mixture_10052016/
2
+ # http://ftp-trace.ncbi.nlm.nih.gov/giab/ftp/use_cases/mixtures/UMCUTRECHT_NA12878_NA24385_mixture_10052016/
3
3
---
4
4
attributes :
5
5
name : giab-NA12878-NA24385-somatic
@@ -10,7 +10,7 @@ recipe:
10
10
recipe_cmds :
11
11
- |
12
12
dir=validation/giab-NA12878-NA24385-somatic
13
- url=ftp ://ftp-trace.ncbi.nlm.nih.gov/giab/ftp/use_cases/mixtures/UMCUTRECHT_NA12878_NA24385_mixture_10052016/
13
+ url=http ://ftp-trace.ncbi.nlm.nih.gov/giab/ftp/use_cases/mixtures/UMCUTRECHT_NA12878_NA24385_mixture_10052016/
14
14
calls=na12878-na24385-somatic-truth.vcf.gz
15
15
regions=na12878-na24385-somatic-truth-regions.bed
16
16
mkdir -p $dir
Original file line number Diff line number Diff line change @@ -9,15 +9,15 @@ recipe:
9
9
recipe_cmds :
10
10
- |
11
11
dir=validation/giab-NA12878
12
- url=ftp ://ftp-trace.ncbi.nlm.nih.gov/giab/ftp/release/NA12878_HG001/NISTv3.3.2/GRCh37/
12
+ url=http ://ftp-trace.ncbi.nlm.nih.gov/giab/ftp/release/NA12878_HG001/NISTv3.3.2/GRCh37/
13
13
calls=HG001_GRCh37_GIAB_highconf_CG-IllFB-IllGATKHC-Ion-10X-SOLID_CHROM1-X_v.3.3.2_highconf_PGandRTGphasetransfer.vcf.gz
14
14
regions=HG001_GRCh37_GIAB_highconf_CG-IllFB-IllGATKHC-Ion-10X-SOLID_CHROM1-X_v.3.3.2_highconf_nosomaticdel.bed
15
15
mkdir -p $dir
16
16
wget -c -O $dir/truth_small_variants.vcf.gz $url/$calls
17
17
tabix -f -p vcf $dir/truth_small_variants.vcf.gz
18
- wget -c -O $dir/truth_regions.bed $url/$regions
19
- wget -O - ftp ://ftp.ncbi.nih.gov/giab/ftp/technical/svclassify_Manuscript/Supplementary_Information/Personalis_1000_Genomes_deduplicated_deletions.bed | grep -v ^Chr > $dir/truth_DEL.bed
20
- wget -O - ftp ://ftp.ncbi.nih.gov/giab/ftp/technical/svclassify_Manuscript/Supplementary_Information/Spiral_Genetics_insertions.bed | grep -v ^Chr > $dir/truth_INS.bed
18
+ wget -c -O $dir/truth_regions.bed $url/$regions
19
+ wget -O - http ://ftp.ncbi.nih.gov/giab/ftp/technical/svclassify_Manuscript/Supplementary_Information/Personalis_1000_Genomes_deduplicated_deletions.bed | grep -v ^Chr > $dir/truth_DEL.bed
20
+ wget -O - http ://ftp.ncbi.nih.gov/giab/ftp/technical/svclassify_Manuscript/Supplementary_Information/Spiral_Genetics_insertions.bed | grep -v ^Chr > $dir/truth_INS.bed
21
21
recipe_outfiles :
22
22
- validation/giab-NA12878/truth_small_variants.vcf.gz
23
23
- validation/giab-NA12878/truth_small_variants.vcf.gz.tbi
Original file line number Diff line number Diff line change @@ -11,20 +11,20 @@ recipe:
11
11
recipe_cmds :
12
12
- |
13
13
dir=validation/giab-NA24385
14
- url=ftp ://ftp-trace.ncbi.nlm.nih.gov/giab/ftp/release/AshkenazimTrio/HG002_NA24385_son/NISTv3.3.2/GRCh37/
14
+ url=http ://ftp-trace.ncbi.nlm.nih.gov/giab/ftp/release/AshkenazimTrio/HG002_NA24385_son/NISTv3.3.2/GRCh37/
15
15
calls=HG002_GRCh37_GIAB_highconf_CG-IllFB-IllGATKHC-Ion-10X-SOLID_CHROM1-22_v.3.3.2_highconf_triophased.vcf.gz
16
16
regions=HG002_GRCh37_GIAB_highconf_CG-IllFB-IllGATKHC-Ion-10X-SOLID_CHROM1-22_v.3.3.2_highconf_noinconsistent.bed
17
17
mkdir -p $dir
18
18
wget -c -O $dir/truth_small_variants.vcf.gz $url/$calls
19
19
tabix -f -p vcf $dir/truth_small_variants.vcf.gz
20
- wget -c -O $dir/truth_regions.bed $url/$regions
20
+ wget -c -O $dir/truth_regions.bed $url/$regions
21
21
delurl=https://s3.amazonaws.com/bcbio/giab/NA24385/NA24385-GIAB-2tech-dels-v0_1_8-GRCh37.bed.gz
22
22
wget -c -O $dir/truth_DEL_giab.bed.gz $delurl
23
23
wget -c -O $dir/truth_DEL_giab.bed.gz.tbi $delurl.tbi
24
24
cnvurl=https://s3.amazonaws.com/bcbio/giab/NA24385/NA24385-crowd-dels-GRCh37.bed.gz
25
25
wget -c -O $dir/truth_DEL_crowd.bed.gz $cnvurl
26
26
wget -c -O $dir/truth_DEL_crowd.bed.gz.tbi $cnvurl.tbi
27
- svurl=ftp ://ftp-trace.ncbi.nlm.nih.gov/giab/ftp/data/AshkenazimTrio/analysis/NIST_UnionSVs_12122017/svanalyzer_union_171212_v0.5.0_annotated.vcf.gz
27
+ svurl=http ://ftp-trace.ncbi.nlm.nih.gov/giab/ftp/data/AshkenazimTrio/analysis/NIST_UnionSVs_12122017/svanalyzer_union_171212_v0.5.0_annotated.vcf.gz
28
28
wget -c -O $dir/truth_sv.vcf.gz $svurl
29
29
wget -c -O $dir/truth_sv.vcf.gz.tbi $svurl.tbi
30
30
recipe_outfiles :
Original file line number Diff line number Diff line change @@ -9,13 +9,13 @@ recipe:
9
9
recipe_cmds :
10
10
- |
11
11
dir=validation/giab-NA24631
12
- url=ftp ://ftp-trace.ncbi.nlm.nih.gov/giab/ftp/release/ChineseTrio/HG005_NA24631_son/NISTv3.3.2/GRCh37/
12
+ url=http ://ftp-trace.ncbi.nlm.nih.gov/giab/ftp/release/ChineseTrio/HG005_NA24631_son/NISTv3.3.2/GRCh37/
13
13
calls=HG005_GRCh37_highconf_CG-IllFB-IllGATKHC-Ion-SOLID_CHROM1-22_v.3.3.2_highconf.vcf.gz
14
14
regions=HG005_GRCh37_highconf_CG-IllFB-IllGATKHC-Ion-SOLID_CHROM1-22_v.3.3.2_highconf_noMetaSV.bed
15
15
mkdir -p $dir
16
16
wget -c -O $dir/truth_small_variants.vcf.gz $url/$calls
17
17
tabix -f -p vcf $dir/truth_small_variants.vcf.gz
18
- wget -c -O $dir/truth_regions.bed $url/$regions
18
+ wget -c -O $dir/truth_regions.bed $url/$regions
19
19
recipe_outfiles :
20
20
- validation/giab-NA24631/truth_small_variants.vcf.gz
21
21
- validation/giab-NA24631/truth_small_variants.vcf.gz.tbi
Original file line number Diff line number Diff line change 8
8
recipe_type : bash
9
9
recipe_cmds :
10
10
- |
11
- url=ftp ://ftp.ensembl.org/pub/data_files/homo_sapiens/GRCh37/variation_genotype/gnomad.genomes.r2.0.1.sites.noVEP.vcf.gz
11
+ url=http ://ftp.ensembl.org/pub/data_files/homo_sapiens/GRCh37/variation_genotype/gnomad.genomes.r2.0.1.sites.noVEP.vcf.gz
12
12
ref=../seq/GRCh37.fa
13
13
mkdir -p variation
14
14
export TMPDIR=`pwd`
Original file line number Diff line number Diff line change 8
8
recipe_cmds :
9
9
- |
10
10
BUILD=GRCz11
11
- url=ftp ://ftp.ensembl.org/pub/release-92/fasta/danio_rerio/dna/Danio_rerio.GRCz11.dna.toplevel.fa.gz
11
+ url=http ://ftp.ensembl.org/pub/release-92/fasta/danio_rerio/dna/Danio_rerio.GRCz11.dna.toplevel.fa.gz
12
12
mkdir -p seq
13
13
wget --no-check-certificate -O - $url | gunzip -c > seq/$BUILD.fa
14
14
samtools faidx seq/$BUILD.fa
Original file line number Diff line number Diff line change 8
8
recipe_cmds :
9
9
- |
10
10
BUILD=Sscrofa11.1
11
- url=ftp ://ftp.ensembl.org/pub/release-92/fasta/sus_scrofa/dna/Sus_scrofa.Sscrofa11.1.dna_rm.toplevel.fa.gz
11
+ url=http ://ftp.ensembl.org/pub/release-92/fasta/sus_scrofa/dna/Sus_scrofa.Sscrofa11.1.dna_rm.toplevel.fa.gz
12
12
mkdir -p seq
13
13
wget --no-check-certificate -O - $url | gunzip -c > seq/$BUILD.fa
14
14
samtools faidx seq/$BUILD.fa
Original file line number Diff line number Diff line change @@ -11,7 +11,7 @@ recipe:
11
11
recipe_cmds :
12
12
- |
13
13
release=20170905
14
- baseurl=ftp ://ftp.ncbi.nlm.nih.gov/pub/clinvar/vcf_GRCh37/archive_2.0/2017/clinvar_${release}.vcf.gz
14
+ baseurl=http ://ftp.ncbi.nlm.nih.gov/pub/clinvar/vcf_GRCh37/archive_2.0/2017/clinvar_${release}.vcf.gz
15
15
mkdir -p variation
16
16
wget -c -O variation/clinvar-orig.vcf.gz $baseurl
17
17
[[ -f variation/clinvar.vcf.gz ]] || zcat variation/clinvar-orig.vcf.gz | sed "s/^\([0-9]\+\)\t/chr\1\t/g" | sed "s/^MT/chrM/g" | sed "s/^X/chrX/g" | sed "s/^Y/chrY/g" | bgzip -c > variation/clinvar.vcf.gz
Original file line number Diff line number Diff line change @@ -11,7 +11,7 @@ recipe:
11
11
version=150
12
12
org=human_9606_b${version}_GRCh37p13
13
13
release=20170710
14
- url=ftp ://ftp.ncbi.nih.gov/snp/organisms/$org/VCF/GATK/All_${release}.vcf.gz
14
+ url=http ://ftp.ncbi.nih.gov/snp/organisms/$org/VCF/GATK/All_${release}.vcf.gz
15
15
mkdir -p variation
16
16
wget -c -O variation/dbsnp-$version-orig.vcf.gz $url
17
17
[[ -f variation/dbsnp-$version.vcf.gz ]] || zcat variation/dbsnp-$version-orig.vcf.gz | bgzip -c > variation/dbsnp-$version.vcf.gz
Original file line number Diff line number Diff line change @@ -12,16 +12,16 @@ recipe:
12
12
- |
13
13
dir=validation/giab-NA12878
14
14
remapurl=https://raw.githubusercontent.com/dpryan79/ChromosomeMappings/master/GRCh37_ensembl2UCSC.txt
15
- url=ftp ://ftp-trace.ncbi.nlm.nih.gov/giab/ftp/release/NA12878_HG001/NISTv3.3.2/GRCh37/
15
+ url=http ://ftp-trace.ncbi.nlm.nih.gov/giab/ftp/release/NA12878_HG001/NISTv3.3.2/GRCh37/
16
16
calls=HG001_GRCh37_GIAB_highconf_CG-IllFB-IllGATKHC-Ion-10X-SOLID_CHROM1-X_v.3.3.2_highconf_PGandRTGphasetransfer.vcf.gz
17
17
regions=HG001_GRCh37_GIAB_highconf_CG-IllFB-IllGATKHC-Ion-10X-SOLID_CHROM1-X_v.3.3.2_highconf_nosomaticdel.bed
18
18
mkdir -p $dir
19
19
wget -qO- $remapurl | awk '{if($1!=$2) print "s/^"$1"/"$2"/g"}' > remap.sed
20
20
wget -c -O - $url/$calls | gunzip -c | sed -f remap.sed | grep -v "##contig=" | bgzip -c > $dir/truth_small_variants.vcf.gz
21
21
tabix -f -p vcf $dir/truth_small_variants.vcf.gz
22
22
wget -c -O - $url/$regions | sed -f remap.sed > $dir/truth_regions.bed
23
- wget -O - ftp ://ftp.ncbi.nih.gov/giab/ftp/technical/svclassify_Manuscript/Supplementary_Information/Personalis_1000_Genomes_deduplicated_deletions.bed | grep -v ^Chr | sed "s/^\([0-9]\+\)\t/chr\1\t/g" | sed "s/^MT/chrM/g" | sed "s/^X/chrX/g" | sed "s/^Y/chrY/g" > $dir/truth_DEL.bed
24
- wget -O - ftp ://ftp.ncbi.nih.gov/giab/ftp/technical/svclassify_Manuscript/Supplementary_Information/Spiral_Genetics_insertions.bed | grep -v ^Chr | sed "s/^\([0-9]\+\)\t/chr\1\t/g" | sed "s/^MT/chrM/g" | sed "s/^X/chrX/g" | sed "s/^Y/chrY/g" > $dir/truth_INS.bed
23
+ wget -O - http ://ftp.ncbi.nih.gov/giab/ftp/technical/svclassify_Manuscript/Supplementary_Information/Personalis_1000_Genomes_deduplicated_deletions.bed | grep -v ^Chr | sed "s/^\([0-9]\+\)\t/chr\1\t/g" | sed "s/^MT/chrM/g" | sed "s/^X/chrX/g" | sed "s/^Y/chrY/g" > $dir/truth_DEL.bed
24
+ wget -O - http ://ftp.ncbi.nih.gov/giab/ftp/technical/svclassify_Manuscript/Supplementary_Information/Spiral_Genetics_insertions.bed | grep -v ^Chr | sed "s/^\([0-9]\+\)\t/chr\1\t/g" | sed "s/^MT/chrM/g" | sed "s/^X/chrX/g" | sed "s/^Y/chrY/g" > $dir/truth_INS.bed
25
25
recipe_outfiles :
26
26
- validation/giab-NA12878/truth_small_variants.vcf.gz
27
27
- validation/giab-NA12878/truth_small_variants.vcf.gz.tbi
Original file line number Diff line number Diff line change 9
9
recipe_cmds :
10
10
- |
11
11
dir=validation/giab-NA24385
12
- url=ftp ://ftp-trace.ncbi.nlm.nih.gov/giab/ftp/release/AshkenazimTrio/HG002_NA24385_son/NISTv3.3.2/GRCh37/
12
+ url=http ://ftp-trace.ncbi.nlm.nih.gov/giab/ftp/release/AshkenazimTrio/HG002_NA24385_son/NISTv3.3.2/GRCh37/
13
13
calls=HG002_GRCh37_GIAB_highconf_CG-IllFB-IllGATKHC-Ion-10X-SOLID_CHROM1-22_v.3.3.2_highconf_triophased.vcf.gz
14
14
regions=HG002_GRCh37_GIAB_highconf_CG-IllFB-IllGATKHC-Ion-10X-SOLID_CHROM1-22_v.3.3.2_highconf_noinconsistent.bed
15
15
remapurl=https://raw.githubusercontent.com/dpryan79/ChromosomeMappings/master/GRCh37_ensembl2UCSC.txt
@@ -24,7 +24,7 @@ recipe:
24
24
cnvurl=https://s3.amazonaws.com/bcbio/giab/NA24385/NA24385-crowd-dels-hg19.bed.gz
25
25
wget -c -O $dir/truth_DEL_crowd.bed.gz $cnvurl
26
26
wget -c -O $dir/truth_DEL_crowd.bed.gz.tbi $cnvurl.tbi
27
- svurl=ftp ://ftp-trace.ncbi.nlm.nih.gov/giab/ftp/data/AshkenazimTrio/analysis/NIST_UnionSVs_12122017/svanalyzer_union_171212_v0.5.0_annotated.vcf.gz
27
+ svurl=http ://ftp-trace.ncbi.nlm.nih.gov/giab/ftp/data/AshkenazimTrio/analysis/NIST_UnionSVs_12122017/svanalyzer_union_171212_v0.5.0_annotated.vcf.gz
28
28
wget -c -O - $svurl | gunzip -c | sed -f remap.sed | grep -v "##contig=" | bgzip -c > $dir/truth_sv.vcf.gz
29
29
tabix -f -p vcf $dir/truth_sv.vcf.gz
30
30
recipe_outfiles :
Original file line number Diff line number Diff line change 9
9
recipe_cmds :
10
10
- |
11
11
dir=validation/giab-NA24631
12
- url=ftp ://ftp-trace.ncbi.nlm.nih.gov/giab/ftp/release/ChineseTrio/HG005_NA24631_son/NISTv3.3.2/GRCh37/
12
+ url=http ://ftp-trace.ncbi.nlm.nih.gov/giab/ftp/release/ChineseTrio/HG005_NA24631_son/NISTv3.3.2/GRCh37/
13
13
calls=HG005_GRCh37_highconf_CG-IllFB-IllGATKHC-Ion-SOLID_CHROM1-22_v.3.3.2_highconf.vcf.gz
14
14
regions=HG005_GRCh37_highconf_CG-IllFB-IllGATKHC-Ion-SOLID_CHROM1-22_v.3.3.2_highconf_noMetaSV.bed
15
15
remapurl=https://raw.githubusercontent.com/dpryan79/ChromosomeMappings/master/GRCh37_ensembl2UCSC.txt
Original file line number Diff line number Diff line change 9
9
recipe_type : bash
10
10
recipe_cmds :
11
11
- |
12
- url=ftp ://ftp.ensembl.org/pub/data_files/homo_sapiens/GRCh37/variation_genotype/gnomad.genomes.r2.0.1.sites.noVEP.vcf.gz
12
+ url=http ://ftp.ensembl.org/pub/data_files/homo_sapiens/GRCh37/variation_genotype/gnomad.genomes.r2.0.1.sites.noVEP.vcf.gz
13
13
remap_url=https://raw.githubusercontent.com/dpryan79/ChromosomeMappings/master/GRCh37_ensembl2UCSC.txt
14
14
ref=../seq/hg19.fa
15
15
mkdir -p variation
Original file line number Diff line number Diff line change 1
1
Human reference genome: GRCh38/hg38 without any alternative reference contigs
2
2
3
- ftp://ftp.ncbi.nlm.nih.gov/genomes/genbank/vertebrate_mammalian/Homo_sapiens/all_assembly_versions/GCA_000001405.15_GRCh38/seqs_for_alignment_pipelines.ucsc_ids/
3
+ http://ftp.ncbi.nlm.nih.gov/genomes/genbank/vertebrate_mammalian/Homo_sapiens/all_assembly_versions/GCA_000001405.15_GRCh38/seqs_for_alignment_pipelines.ucsc_ids/
Original file line number Diff line number Diff line change @@ -10,7 +10,7 @@ recipe:
10
10
- |
11
11
base=GCA_000001405.15_GRCh38_no_alt_analysis_set.fna.bowtie_index
12
12
new=hg38-noalt.fa
13
- ncbiurl=ftp ://ftp.ncbi.nlm.nih.gov/genomes/genbank/vertebrate_mammalian/Homo_sapiens/all_assembly_versions/GCA_000001405.15_GRCh38/seqs_for_alignment_pipelines.ucsc_ids
13
+ ncbiurl=http ://ftp.ncbi.nlm.nih.gov/genomes/genbank/vertebrate_mammalian/Homo_sapiens/all_assembly_versions/GCA_000001405.15_GRCh38/seqs_for_alignment_pipelines.ucsc_ids
14
14
wget -c $ncbiurl/$base.tar.gz
15
15
[[ -f $base.1.bt2 ]] || tar -xzvpf $base.tar.gz
16
16
mkdir -p bowtie2
Original file line number Diff line number Diff line change @@ -10,7 +10,7 @@ recipe:
10
10
- |
11
11
base=GCA_000001405.15_GRCh38_no_alt_analysis_set.fna
12
12
new=hg38-noalt.fa
13
- ncbiurl=ftp ://ftp.ncbi.nlm.nih.gov/genomes/genbank/vertebrate_mammalian/Homo_sapiens/all_assembly_versions/GCA_000001405.15_GRCh38/seqs_for_alignment_pipelines.ucsc_ids
13
+ ncbiurl=http ://ftp.ncbi.nlm.nih.gov/genomes/genbank/vertebrate_mammalian/Homo_sapiens/all_assembly_versions/GCA_000001405.15_GRCh38/seqs_for_alignment_pipelines.ucsc_ids
14
14
wget -c $ncbiurl/$base.bwa_index.tar.gz
15
15
[[ -f $base.fna.bwt ]] || tar -xzvpf $base.bwa_index.tar.gz
16
16
mkdir -p bwa
Original file line number Diff line number Diff line change @@ -10,7 +10,7 @@ recipe:
10
10
recipe_type : bash
11
11
recipe_cmds :
12
12
- |
13
- url=ftp ://ftp.ensembl.org/pub/release-78/gtf/homo_sapiens/Homo_sapiens.GRCh38.78.gtf.gz
13
+ url=http ://ftp.ensembl.org/pub/release-78/gtf/homo_sapiens/Homo_sapiens.GRCh38.78.gtf.gz
14
14
mkdir -p rnaseq
15
15
remap_url=http://raw.githubusercontent.com/dpryan79/ChromosomeMappings/master/GRCh38_ensembl2UCSC.txt
16
16
wget -qO- $remap_url | awk '{if($1!=$2) print "s/^"$1"/"$2"/g"}' > remap.sed
Original file line number Diff line number Diff line change 1
1
Full hg38/GRCh38 reference genome distributed by 1000 genomes
2
2
Derived from NCBI set with HLA and decoy alternative alleles
3
- ftp://ftp.1000genomes.ebi.ac.uk/vol1/ftp/technical/reference/GRCh38_reference_genome/
3
+ http://ftp.1000genomes.ebi.ac.uk/vol1/ftp/technical/reference/GRCh38_reference_genome/
Original file line number Diff line number Diff line change 1
1
# Full hg38/GRCh38 reference genome distributed by 1000 genomes
2
2
# Derived from NCBI set with HLA and decoy alternative alleles
3
- # ftp://ftp.1000genomes.ebi.ac.uk/vol1/ftp/technical/reference/GRCh38_reference_genome/
3
+ # http://ftp.1000genomes.ebi.ac.uk/vol1/ftp/technical/reference/GRCh38_reference_genome/
4
4
# Pre-build bwa indices
5
5
---
6
6
attributes :
@@ -11,7 +11,7 @@ recipe:
11
11
recipe_type : bash
12
12
recipe_cmds :
13
13
- |
14
- url=ftp ://ftp.1000genomes.ebi.ac.uk/vol1/ftp/technical/reference/GRCh38_reference_genome
14
+ url=http ://ftp.1000genomes.ebi.ac.uk/vol1/ftp/technical/reference/GRCh38_reference_genome
15
15
base=GRCh38_full_analysis_set_plus_decoy_hla.fa
16
16
new=hg38.fa
17
17
mkdir -p bwa
Original file line number Diff line number Diff line change @@ -11,7 +11,7 @@ recipe:
11
11
recipe_cmds :
12
12
- |
13
13
release=20170905
14
- baseurl=ftp ://ftp.ncbi.nlm.nih.gov/pub/clinvar/vcf_GRCh38/archive_2.0/2017/clinvar_${release}.vcf.gz
14
+ baseurl=http ://ftp.ncbi.nlm.nih.gov/pub/clinvar/vcf_GRCh38/archive_2.0/2017/clinvar_${release}.vcf.gz
15
15
mkdir -p variation
16
16
wget -c -O variation/clinvar-orig.vcf.gz $baseurl
17
17
[[ -f variation/clinvar.vcf.gz ]] || zcat variation/clinvar-orig.vcf.gz | sed "s/^\([0-9]\+\)\t/chr\1\t/g" | sed "s/^MT/chrM/g" | sed "s/^X/chrX/g" | sed "s/^Y/chrY/g" | bgzip -c > variation/clinvar.vcf.gz
Original file line number Diff line number Diff line change @@ -13,7 +13,7 @@ recipe:
13
13
version=150
14
14
org=human_9606_b${version}_GRCh38p7
15
15
release=20170710
16
- url=ftp ://ftp.ncbi.nih.gov/snp/organisms/$org/VCF/GATK/All_${release}.vcf.gz
16
+ url=http ://ftp.ncbi.nih.gov/snp/organisms/$org/VCF/GATK/All_${release}.vcf.gz
17
17
mkdir -p variation
18
18
wget -c -O variation/dbsnp-$version-orig.vcf.gz $url
19
19
[[ -f variation/dbsnp-$version.vcf.gz ]] || zcat variation/dbsnp-$version-orig.vcf.gz | sed "s/^\([0-9]\+\)\t/chr\1\t/g" | sed "s/^MT/chrM/g" | sed "s/^X/chrX/g" | sed "s/^Y/chrY/g" | bgzip -c > variation/dbsnp-$version.vcf.gz
Original file line number Diff line number Diff line change 1
1
# Truth set for NA12878/NA24385 somatic mixture
2
- # ftp://ftp-trace.ncbi.nlm.nih.gov/giab/ftp/use_cases/mixtures/UMCUTRECHT_NA12878_NA24385_mixture_10052016/
2
+ # http://ftp-trace.ncbi.nlm.nih.gov/giab/ftp/use_cases/mixtures/UMCUTRECHT_NA12878_NA24385_mixture_10052016/
3
3
---
4
4
attributes :
5
5
name : giab-NA12878-NA24385-somatic
Original file line number Diff line number Diff line change 9
9
recipe_cmds :
10
10
- |
11
11
dir=validation/giab-NA12878
12
- url=ftp ://ftp-trace.ncbi.nlm.nih.gov/giab/ftp/release/NA12878_HG001/NISTv3.3.2/GRCh38/
12
+ url=http ://ftp-trace.ncbi.nlm.nih.gov/giab/ftp/release/NA12878_HG001/NISTv3.3.2/GRCh38/
13
13
calls=HG001_GRCh38_GIAB_highconf_CG-IllFB-IllGATKHC-Ion-10X-SOLID_CHROM1-X_v.3.3.2_highconf_PGandRTGphasetransfer.vcf.gz
14
14
regions=HG001_GRCh38_GIAB_highconf_CG-IllFB-IllGATKHC-Ion-10X-SOLID_CHROM1-X_v.3.3.2_highconf_nosomaticdel_noCENorHET7.bed
15
15
mkdir -p $dir
Original file line number Diff line number Diff line change 9
9
recipe_cmds :
10
10
- |
11
11
dir=validation/giab-NA24385
12
- url=ftp ://ftp-trace.ncbi.nlm.nih.gov/giab/ftp/release/AshkenazimTrio/HG002_NA24385_son/NISTv3.3.2/GRCh38/
12
+ url=http ://ftp-trace.ncbi.nlm.nih.gov/giab/ftp/release/AshkenazimTrio/HG002_NA24385_son/NISTv3.3.2/GRCh38/
13
13
calls=HG002_GRCh38_GIAB_highconf_CG-Illfb-IllsentieonHC-Ion-10XsentieonHC-SOLIDgatkHC_CHROM1-22_v.3.3.2_highconf_triophased.vcf.gz
14
14
regions=HG002_GRCh38_GIAB_highconf_CG-Illfb-IllsentieonHC-Ion-10XsentieonHC-SOLIDgatkHC_CHROM1-22_v.3.3.2_highconf_noinconsistent.bed
15
15
mkdir -p $dir
Original file line number Diff line number Diff line change 9
9
recipe_cmds :
10
10
- |
11
11
dir=validation/giab-NA24631
12
- url=ftp ://ftp-trace.ncbi.nlm.nih.gov/giab/ftp/release/ChineseTrio/HG005_NA24631_son/NISTv3.3.2/GRCh38/
12
+ url=http ://ftp-trace.ncbi.nlm.nih.gov/giab/ftp/release/ChineseTrio/HG005_NA24631_son/NISTv3.3.2/GRCh38/
13
13
calls=HG005_GRCh38_GIAB_highconf_CG-Illfb-IllsentieonHC-Ion-10XsentieonHC-SOLIDgatkHC_CHROM1-22_v.3.3.2_highconf.vcf.gz
14
14
regions=HG005_GRCh38_GIAB_highconf_CG-Illfb-IllsentieonHC-Ion-10XsentieonHC-SOLIDgatkHC_CHROM1-22_v.3.3.2_highconf.bed
15
15
mkdir -p $dir
You can’t perform that action at this time.
0 commit comments