-
Notifications
You must be signed in to change notification settings - Fork 9
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Merge pull request #233 from dib-lab/microtrios
New microtrios for reduced (?) test/CI build times
- Loading branch information
Showing
23 changed files
with
102 additions
and
48 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,3 +1,4 @@ | ||
pico-trio-refr.fa.gz.* | ||
fiveparts-refr.fa.gz.* | ||
inf-mate-dist/*.genome.fa.gz.* | ||
calls-*.vcf |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,4 @@ | ||
*.fa | ||
*.fasta | ||
*.fastq | ||
refr-*.fa.gz.* |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,27 @@ | ||
#!/usr/bin/env bash
#
# Regenerate the "microtrios" test data: three small simulated trios
# (labels: li, na, k), each consisting of a 20 kb reference, a variant
# VCF, and gzipped interleaved paired-end reads for father, mother and
# proband.
#
# Usage: run from the repository root; every path below is relative to it.
# Requires on PATH: nuclmm, kevlar, wgsim, interleave-reads.py, gzip.
#
# All seeds are fixed so that reruns use identical simulation parameters.

# Abort on the first failing command, on use of an unset variable, and when
# any stage of a pipeline fails (otherwise gzip would mask a failure of
# interleave-reads.py and leave a valid-looking but empty .fq.gz behind).
set -euo pipefail

readonly DATA_DIR=kevlar/tests/data/microtrios
readonly MODEL=notebook/human-sim-pico/human.order6.mm

die() {
  printf 'error: %s\n' "$*" >&2
  exit 1
}

# Simulate one reference sequence for a trio.
# Arguments: $1 - trio label, $2 - random seed
simulate_reference() {
  local label=$1 seed=$2
  nuclmm simulate --order 6 --numseqs 1 --seqlen 20000 --seed "$seed" \
    --out "${DATA_DIR}/refr-${label}.fa" "$MODEL"
}

# Simulate a trio (2 inherited + 1 de novo variant, SNVs only) from the
# reference with the same label.
# Arguments: $1 - trio label, $2 - random seed
simulate_trio() {
  local label=$1 seed=$2
  kevlar gentrio --inherited 2 --de-novo 1 \
    --vcf "${DATA_DIR}/variants-${label}.vcf" \
    --prefix "${DATA_DIR}/trio-${label}" \
    --weights snv=1.0 --seed "$seed" \
    "${DATA_DIR}/refr-${label}.fa"
}

# Simulate 3000 paired-end 100 bp reads for one individual, reading the
# <prefix>-<individual>.fasta file produced by the gentrio stage.
# Arguments: $1 - trio label, $2 - individual, $3 - random seed
simulate_reads() {
  local label=$1 ind=$2 seed=$3
  local prefix="${DATA_DIR}/trio-${label}-${ind}"
  wgsim -e 0.005 -r 0.0 -d 450 -s 50 -N 3000 -1 100 -2 100 -S "$seed" \
    "${prefix}.fasta" "${prefix}-1.fastq" "${prefix}-2.fastq"
}

# Interleave the two read files of one individual and gzip the result.
# Arguments: $1 - trio label, $2 - individual
interleave_reads() {
  local label=$1 ind=$2
  local prefix="${DATA_DIR}/trio-${label}-${ind}"
  interleave-reads.py "${prefix}-1.fastq" "${prefix}-2.fastq" \
    | gzip -c > "${prefix}.fq.gz"
}

main() {
  local tool trio ind

  # Fail early with a clear message instead of part-way through the run.
  for tool in nuclmm kevlar wgsim interleave-reads.py gzip; do
    command -v "$tool" > /dev/null || die "required tool not found on PATH: $tool"
  done
  [[ -f "$MODEL" ]] || die "model file not found: $MODEL (run from the repository root)"
  mkdir -p -- "$DATA_DIR"

  simulate_reference li 2468
  simulate_reference na 1357
  simulate_reference k 1235

  simulate_trio li 102938
  simulate_trio na 475656
  simulate_trio k 928374

  simulate_reads li father 111111
  simulate_reads li mother 222222
  simulate_reads li proband 333333
  simulate_reads na father 444444
  simulate_reads na mother 555555
  simulate_reads na proband 666666
  simulate_reads k father 777777
  simulate_reads k mother 888888
  simulate_reads k proband 999999

  for trio in li na k; do
    for ind in father mother proband; do
      interleave_reads "$trio" "$ind"
    done
  done
}

main "$@"
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,9 @@ | ||
##fileformat=VCFv4.2 | ||
##source=kevlar::gentrio | ||
##INFO=<GT,Number=3,Type=String,Description="Genotypes of each individual in the trio (proband, mother, father)"> | ||
##INFO=<VW,Number=1,Type=String,Description="Genomic interval bounding all k-mers that contain the alternate allele"> | ||
##INFO=<RW,Number=1,Type=String,Description="Genomic interval bounding all k-mers that contain the reference allele"> | ||
#CHROM POS ID REF ALT QUAL FILTER INFO | ||
seq1 1356 . C A . PASS GT=0/0,0/1,0/0;RW=TTAGTCTTAAGTCTTCTTTAGAGTCACCCTCCCTTTTTAAAGTTGTTCTCCTATACTTCCC;VW=TTAGTCTTAAGTCTTCTTTAGAGTCACCCTACCTTTTTAAAGTTGTTCTCCTATACTTCCC | ||
seq1 7255 . T A . PASS GT=0/0,0/1,0/1;RW=CTTGTACTCCATCTGAGACCGGGAGGGAGATATCAGGATTATGACTTTGGGCTATGGATTG;VW=CTTGTACTCCATCTGAGACCGGGAGGGAGAAATCAGGATTATGACTTTGGGCTATGGATTG | ||
seq1 16661 . A C . PASS GT=0/1,0/0,0/0;RW=AGCAATCTCCTTTGAAACTGACTCAAAATTAGCAAACAGTAAGCAGCCGCCACCCAGCCTC;VW=AGCAATCTCCTTTGAAACTGACTCAAAATTCGCAAACAGTAAGCAGCCGCCACCCAGCCTC |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,9 @@ | ||
##fileformat=VCFv4.2 | ||
##source=kevlar::gentrio | ||
##INFO=<GT,Number=3,Type=String,Description="Genotypes of each individual in the trio (proband, mother, father)"> | ||
##INFO=<VW,Number=1,Type=String,Description="Genomic interval bounding all k-mers that contain the alternate allele"> | ||
##INFO=<RW,Number=1,Type=String,Description="Genomic interval bounding all k-mers that contain the reference allele"> | ||
#CHROM POS ID REF ALT QUAL FILTER INFO | ||
seq1 9279 . A T . PASS GT=1/0,1/0,1/1;RW=ATTTTTCTTCTCTTTTTAGTCACTGCAACCAGGACATCACCCTGCAGCCATTTATTTCCAA;VW=ATTTTTCTTCTCTTTTTAGTCACTGCAACCTGGACATCACCCTGCAGCCATTTATTTCCAA | ||
seq1 10367 . G C . PASS GT=1/0,0/1,0/0;RW=TGATCTGGCTCAGACCTGCCAGTGAAGGGGGGAGCTTCATTGGTATTTCAAGACCTGTGAA;VW=TGATCTGGCTCAGACCTGCCAGTGAAGGGGCGAGCTTCATTGGTATTTCAAGACCTGTGAA | ||
seq1 14742 . T C . PASS GT=1/0,0/0,0/0;RW=AATTCATTTCTCCCAACTCACACCACCTGTTTATTCCAGGCTGCATTTACTATTTTAAAAT;VW=AATTCATTTCTCCCAACTCACACCACCTGTCTATTCCAGGCTGCATTTACTATTTTAAAAT |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,9 @@ | ||
##fileformat=VCFv4.2 | ||
##source=kevlar::gentrio | ||
##INFO=<GT,Number=3,Type=String,Description="Genotypes of each individual in the trio (proband, mother, father)"> | ||
##INFO=<VW,Number=1,Type=String,Description="Genomic interval bounding all k-mers that contain the alternate allele"> | ||
##INFO=<RW,Number=1,Type=String,Description="Genomic interval bounding all k-mers that contain the reference allele"> | ||
#CHROM POS ID REF ALT QUAL FILTER INFO | ||
seq1 5018 . A T . PASS GT=1/1,1/1,1/1;RW=GATCACCCACATACCACCCTGCACAGAGACAGGGTACCAACCTCCCTATCATCCTTCTCCA;VW=GATCACCCACATACCACCCTGCACAGAGACTGGGTACCAACCTCCCTATCATCCTTCTCCA | ||
seq1 6691 . A T . PASS GT=1/0,0/0,0/0;RW=AACTGCCCGCCTTGGGGTCTATAGTTATCCAGGGAACAGAGACGCGGAGAGGAAAACCATA;VW=AACTGCCCGCCTTGGGGTCTATAGTTATCCTGGGAACAGAGACGCGGAGAGGAAAACCATA | ||
seq1 17260 . T A . PASS GT=1/1,1/0,1/1;RW=AAATATGGCAAGGATCTACTAACACTGCTTTCATTTGATAGCTGGGAGTATAATCCGGATA;VW=AAATATGGCAAGGATCTACTAACACTGCTTACATTTGATAGCTGGGAGTATAATCCGGATA |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters