diff --git a/.travis.yml b/.travis.yml
index f4af3dad894..4fbdf61ef30 100644
--- a/.travis.yml
+++ b/.travis.yml
@@ -11,6 +11,7 @@ before_install:
- export GALAXY_REPO=https://github.com/galaxyproject/galaxy
- export GALAXY_RELEASE=release_16.10
- export PLANEMO_CONDA_PREFIX="$HOME/conda"
+ - unset JAVA_HOME
install:
- pip install flake8 planemo
diff --git a/macros/read_group_macros.xml b/macros/read_group_macros.xml
new file mode 100644
index 00000000000..26e8d6b209f
--- /dev/null
+++ b/macros/read_group_macros.xml
@@ -0,0 +1,294 @@
+
+
+
+#def identifier_or_name($input1)
+ ## Return a display name for $input1: its element_identifier when it has
+ ## one, otherwise its name without a trailing .gz, .fastq and .fq.
+ #if hasattr($input1, 'element_identifier')
+ #return $input1.element_identifier
+ #else
+ ## str.rstrip() takes a set of characters, not a suffix, so the former
+ ## rstrip('.gz').rstrip('.fastq').rstrip('.fq') chain also removed
+ ## legitimate trailing letters ("reads_fast.fastq" became "reads_").
+ ## Drop each extension only when the name really ends with it, checking
+ ## them in the same order as before.
+ #set $stripped_name = $input1.name
+ #for $extension in ('.gz', '.fastq', '.fq')
+ #if $stripped_name.endswith($extension)
+ #set $stripped_name = $stripped_name[:-len($extension)]
+ #end if
+ #end for
+ #return $stripped_name
+ #end if
+#end def
+
+#def clean(name)
+ ## Replace every character of $name that is not a word character, '-',
+ ## '_' or '.' with an underscore and return the result.
+ #import re
+ #return re.sub('[^\w\-_\.]', '_', $name)
+#end def
+
+#def read_group_name_default($input1, $input2=None)
+ ## Default read group name. Single input: its cleaned identifier/name.
+ ## Two inputs: the leading characters that both cleaned names share,
+ ## provided there are more than 3 of them; otherwise the cleaned name of
+ ## $input1.
+ #if $input2 is None
+ #return $clean($identifier_or_name($input1))
+ #else
+ #import itertools
+ #set $input_name1 = $clean($identifier_or_name($input1))
+ #set $input_name2 = $clean($identifier_or_name($input2))
+ ## Pair the characters up with the builtin zip(): itertools.izip() exists
+ ## only on Python 2, so the previous call failed with AttributeError on
+ ## Python 3. The resulting prefix is the same on both versions.
+ #set $common_prefix = ''.join([c[0] for c in itertools.takewhile(lambda x: all(x[0] == y for y in x), zip($input_name1, $input_name2))])
+ #if len($common_prefix) > 3
+ #return $common_prefix
+ #else
+ #return $input_name1
+ #end if
+ #end if
+#end def
+
+#def format_read_group(prefix, value, quote='', arg='')
+ ## Build one read group argument: $arg, then $prefix and $value wrapped in
+ ## $quote on both sides. An empty/false $value produces the empty string.
+ #if not $value
+ #return ''
+ #end if
+ #return $arg + $quote + $prefix + $value + $quote
+#end def
+
+#def rg_param(name)
+ ## Fetch the read group setting called $name: from $rg when the template
+ ## has an "rg" variable, otherwise from the template's own variables.
+ ## Yields None when the setting is not found.
+ #if not $varExists("rg")
+ #return $getVar($name, None)
+ #end if
+ #return $rg.get($name, None)
+#end def
+
+## Read group handling is switched on at this point.
+#set $use_rg = True
+
+
+
+#if $use_rg
+ ## Resolve every read group setting into a $rg_<field> variable via
+ ## $rg_param(). $rg_auto_name is read here but never assigned in this
+ ## snippet -- NOTE(review): presumably defined by the including tool; confirm.
+
+ ## ID: $rg_auto_name when the conditional is missing or asks for
+ ## auto-naming, otherwise the ID entered in the conditional.
+ #if $rg_param('read_group_id_conditional') is None
+ #set $rg_id = $rg_auto_name
+ #elif $rg_param('read_group_id_conditional').do_auto_name
+ #set $rg_id = $rg_auto_name
+ #else
+ #set $rg_id = str($rg_param('read_group_id_conditional').ID)
+ #end if
+
+ ## SM: unlike ID, a missing conditional gives '' rather than the auto name.
+ #if $rg_param('read_group_sm_conditional') is None
+ #set $rg_sm = ''
+ #elif $rg_param('read_group_sm_conditional').do_auto_name
+ #set $rg_sm = $rg_auto_name
+ #else
+ #set $rg_sm = str($rg_param('read_group_sm_conditional').SM)
+ #end if
+
+ ## PL and the other plain fields below: str() of the value when it is
+ ## truthy, '' otherwise.
+ #if $rg_param('PL')
+ #set $rg_pl = str($rg_param('PL'))
+ #else
+ #set $rg_pl = ''
+ #end if
+
+ ## LB: same three-way rule as SM.
+ #if $rg_param('read_group_lb_conditional') is None
+ #set $rg_lb = ''
+ #elif $rg_param('read_group_lb_conditional').do_auto_name
+ #set $rg_lb = $rg_auto_name
+ #else
+ #set $rg_lb = str($rg_param('read_group_lb_conditional').LB)
+ #end if
+
+ #if $rg_param('CN')
+ #set $rg_cn = str($rg_param('CN'))
+ #else
+ #set $rg_cn = ''
+ #end if
+
+ #if $rg_param("DS")
+ #set $rg_ds = str($rg_param("DS"))
+ #else
+ #set $rg_ds = ''
+ #end if
+
+ #if $rg_param("DT")
+ #set $rg_dt = str($rg_param("DT"))
+ #else
+ #set $rg_dt = ''
+ #end if
+
+ #if $rg_param("FO")
+ #set $rg_fo = str($rg_param("FO"))
+ #else
+ #set $rg_fo = ''
+ #end if
+
+ #if $rg_param("KS")
+ #set $rg_ks = str($rg_param("KS"))
+ #else
+ #set $rg_ks = ''
+ #end if
+
+ #if $rg_param("PG")
+ #set $rg_pg = str($rg_param("PG"))
+ #else
+ #set $rg_pg = ''
+ #end if
+
+ ## PI is compared against None instead of being tested for truthiness, so
+ ## any value other than None is stringified (presumably to keep a falsy
+ ## value such as 0 -- NOTE(review): confirm intent).
+ #if $rg_param("PI") != None
+ #set $rg_pi = str($rg_param("PI"))
+ #else
+ #set $rg_pi = ''
+ #end if
+
+ #if $rg_param("PU")
+ #set $rg_pu = str($rg_param("PU"))
+ #else
+ #set $rg_pu = ''
+ #end if
+#end if
+
+
+## Read group handling is on unless the rg_selector value is "do_not_set".
+#set $use_rg = str($rg.rg_selector) != "do_not_set"
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ \*|[ACMGRSVTWYHKDBN]+$
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
diff --git a/tools/emboss_5/.shed.yml b/tools/emboss_5/.shed.yml
new file mode 100644
index 00000000000..d63012e81c0
--- /dev/null
+++ b/tools/emboss_5/.shed.yml
@@ -0,0 +1,11 @@
+categories:
+- Sequence Analysis
+- Fasta Manipulation
+description: Galaxy wrappers for EMBOSS version 5.0.0 tools
+homepage_url: http://emboss.open-bio.org/
+long_description: |
+ The European Molecular Biology Open Software Suite (EMBOSS) is a high quality, well documented package of open source software tools for molecular biology. It includes over 200 applications for molecular sequence analysis and other common tasks in bioinformatics.
+name: emboss_5
+owner: devteam
+remote_repository_url: https://github.com/galaxyproject/tools-iuc/tree/master/tools/emboss_5
+type: unrestricted
diff --git a/tools/emboss_5/emboss_antigenic.xml b/tools/emboss_5/emboss_antigenic.xml
new file mode 100644
index 00000000000..de0ecec83b1
--- /dev/null
+++ b/tools/emboss_5/emboss_antigenic.xml
@@ -0,0 +1,48 @@
+
+ Predicts potentially antigenic regions of a protein sequence, using the method of Kolaskar and Tongaonkar.
+
+ macros.xml
+
+
+
+ antigenic -sequence '$input1' -outfile '$out_file1' -minlen $minlen -rformat2 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/antigenic.html
+
+
+
diff --git a/tools/emboss_5/emboss_backtranseq.xml b/tools/emboss_5/emboss_backtranseq.xml
new file mode 100644
index 00000000000..36a2ac7a626
--- /dev/null
+++ b/tools/emboss_5/emboss_backtranseq.xml
@@ -0,0 +1,219 @@
+
+ Back translate a protein sequence
+
+ macros.xml
+
+
+
+ backtranseq -sequence '$input1' -outfile '$out_file1' -cfile $cfile -osformat2 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/backtranseq.html
+
+
+
diff --git a/tools/emboss_5/emboss_banana.xml b/tools/emboss_5/emboss_banana.xml
new file mode 100644
index 00000000000..7bcc729cfc9
--- /dev/null
+++ b/tools/emboss_5/emboss_banana.xml
@@ -0,0 +1,26 @@
+
+ Bending and curvature plot in B-DNA
+
+ macros.xml
+
+
+ banana -sequence '$input1' -outfile '$out_file1' -graph none -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/banana.html
+
+
+
diff --git a/tools/emboss_5/emboss_biosed.xml b/tools/emboss_5/emboss_biosed.xml
new file mode 100644
index 00000000000..59cc79b53f3
--- /dev/null
+++ b/tools/emboss_5/emboss_biosed.xml
@@ -0,0 +1,69 @@
+
+ Replace or delete sequence sections
+
+ macros.xml
+
+
+
+ biosed -sequence '$input1' -outseq '$out_file1' -target '$target' -replace '$replace' -osformat2 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/biosed.html
+
+
+
diff --git a/tools/emboss_5/emboss_btwisted.xml b/tools/emboss_5/emboss_btwisted.xml
new file mode 100644
index 00000000000..1542778b0f0
--- /dev/null
+++ b/tools/emboss_5/emboss_btwisted.xml
@@ -0,0 +1,26 @@
+
+ Calculates the twisting in a B-DNA sequence
+
+ macros.xml
+
+
+ btwisted -sequence '$input1' -outfile '$out_file1' -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/btwisted.html
+
+
+
diff --git a/tools/emboss_5/emboss_cai.xml b/tools/emboss_5/emboss_cai.xml
new file mode 100644
index 00000000000..22bca21b3f2
--- /dev/null
+++ b/tools/emboss_5/emboss_cai.xml
@@ -0,0 +1,186 @@
+
+ CAI codon adaptation index
+
+ macros.xml
+
+
+ cai -seqall '$input1' -outfile '$out_file1' -cfile $cfile -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/cai.html
+
+
+
diff --git a/tools/emboss_5/emboss_cai_custom.xml b/tools/emboss_5/emboss_cai_custom.xml
new file mode 100644
index 00000000000..dcc613245dc
--- /dev/null
+++ b/tools/emboss_5/emboss_cai_custom.xml
@@ -0,0 +1,27 @@
+
+ CAI codon adaptation index using custom codon usage file
+
+ macros.xml
+
+
+ cai -seqall '$input1' -outfile '$out_file1' -cfile '$input2' -auto
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/cai.html
+
+
+
diff --git a/tools/emboss_5/emboss_chaos.xml b/tools/emboss_5/emboss_chaos.xml
new file mode 100644
index 00000000000..62ddb829ba5
--- /dev/null
+++ b/tools/emboss_5/emboss_chaos.xml
@@ -0,0 +1,25 @@
+
+ Create a chaos game representation plot for a sequence
+
+ macros.xml
+
+
+ perl '$__tool_directory__/emboss_single_outputfile_wrapper.pl' chaos -sequence '$input1' -graph png -goutfile '$out_file1' -auto
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/chaos.html
+
+
+
diff --git a/tools/emboss_5/emboss_charge.xml b/tools/emboss_5/emboss_charge.xml
new file mode 100644
index 00000000000..b2ed04a8385
--- /dev/null
+++ b/tools/emboss_5/emboss_charge.xml
@@ -0,0 +1,34 @@
+
+ Protein charge plot
+
+ macros.xml
+
+
+ charge -seqall '$input1' -outfile '$out_file1' -window $window -auto
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/charge.html
+
+
+
diff --git a/tools/emboss_5/emboss_checktrans.xml b/tools/emboss_5/emboss_checktrans.xml
new file mode 100644
index 00000000000..ee35f1e5a39
--- /dev/null
+++ b/tools/emboss_5/emboss_checktrans.xml
@@ -0,0 +1,82 @@
+
+ Reports STOP codons and ORF statistics of a protein
+
+ macros.xml
+
+
+
+ checktrans -sequence '$input1' -outfile '$out_file1' -outseq '$out_file2' -osformat3 $out_format2 -outfeat '$out_file3' -offormat4 $out_format3 -orfml $orfml -addlast $addlast -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/checktrans.html
+
+
+
diff --git a/tools/emboss_5/emboss_chips.xml b/tools/emboss_5/emboss_chips.xml
new file mode 100644
index 00000000000..1e485a408fd
--- /dev/null
+++ b/tools/emboss_5/emboss_chips.xml
@@ -0,0 +1,31 @@
+
+ Codon usage statistics
+
+ macros.xml
+
+
+ chips -seqall '$input1' -outfile '$out_file1' -sum $sum -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/chips.html
+
+
+
diff --git a/tools/emboss_5/emboss_cirdna.xml b/tools/emboss_5/emboss_cirdna.xml
new file mode 100644
index 00000000000..04444227caf
--- /dev/null
+++ b/tools/emboss_5/emboss_cirdna.xml
@@ -0,0 +1,25 @@
+
+ Draws circular maps of DNA constructs
+
+ macros.xml
+
+
+ perl '$__tool_directory__/emboss_single_outputfile_wrapper.pl' cirdna -infile '$input1' -graphout png -goutfile '$out_file1' -auto
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/cirdna.html
+
+
+
diff --git a/tools/emboss_5/emboss_codcmp.xml b/tools/emboss_5/emboss_codcmp.xml
new file mode 100644
index 00000000000..8bfebadd6c7
--- /dev/null
+++ b/tools/emboss_5/emboss_codcmp.xml
@@ -0,0 +1,332 @@
+
+ Codon usage table comparison
+
+ macros.xml
+
+
+ codcmp -first $cfile1 -second $cfile2 -outfile '$out_file1' -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/codcmp.html
+
+
+
diff --git a/tools/emboss_5/emboss_coderet.xml b/tools/emboss_5/emboss_coderet.xml
new file mode 100644
index 00000000000..3a26c89f50a
--- /dev/null
+++ b/tools/emboss_5/emboss_coderet.xml
@@ -0,0 +1,70 @@
+
+ Extract CDS, mRNA and translations from feature tables
+
+ macros.xml
+
+
+
+
+ coderet -seqall '$input1' -outfile '$out_file1' -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/coderet.html
+
+
+
diff --git a/tools/emboss_5/emboss_compseq.xml b/tools/emboss_5/emboss_compseq.xml
new file mode 100644
index 00000000000..4dbae8e792b
--- /dev/null
+++ b/tools/emboss_5/emboss_compseq.xml
@@ -0,0 +1,41 @@
+
+ Count composition of dimer/trimer/etc words in a sequence
+
+ macros.xml
+
+
+ compseq -sequence '$input1' -outfile '$out_file1' -word $word -frame $frame -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/compseq.html
+
+
+
diff --git a/tools/emboss_5/emboss_cpgplot.xml b/tools/emboss_5/emboss_cpgplot.xml
new file mode 100644
index 00000000000..a1cd7037cd7
--- /dev/null
+++ b/tools/emboss_5/emboss_cpgplot.xml
@@ -0,0 +1,27 @@
+
+ Plot CpG rich areas
+
+ macros.xml
+
+
+
+ perl '$__tool_directory__/emboss_cpgplot_wrapper.pl' cpgplot -sequence '$input1' -window $window -minlen $minlen -minpc $minpc -outfile '$outfile' -graph png -goutfile '$goutfile' -outfeat '$outfeat' -minoe $minoe -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/cpgplot.html
+
+
+
diff --git a/tools/emboss_5/emboss_cpgplot_wrapper.pl b/tools/emboss_5/emboss_cpgplot_wrapper.pl
new file mode 100644
index 00000000000..6edbbbfd456
--- /dev/null
+++ b/tools/emboss_5/emboss_cpgplot_wrapper.pl
@@ -0,0 +1,28 @@
+#! /usr/bin/perl -w
+use strict;
+use File::Copy;
+
+# Wrapper around an EMBOSS plotting command (cpgplot): run the command line
+# given in @ARGV, then rename "<goutfile>.1.png" to "<goutfile>", where
+# <goutfile> is the value passed after -goutfile.
+
+# Run the argument list directly instead of re-joining it into one shell
+# string: the joined form is re-parsed by a shell, which splits paths that
+# contain spaces and interprets metacharacters. The command's stdout is
+# still captured and discarded, as it was with backticks.
+@ARGV or die "usage: $0 command [arguments...]\n";
+open(my $emboss, '-|', @ARGV) or die "Cannot run $ARGV[0]: $!\n";
+my @discarded_output = <$emboss>;
+close($emboss) or die "$ARGV[0] failed (wait status $?)\n";
+
+# Find the value of -goutfile by name; fall back to the historical fixed
+# position (index 14) when the option is not present.
+my $fileNameOut = $ARGV[14];
+for my $i (0 .. $#ARGV - 1) {
+    $fileNameOut = $ARGV[$i + 1] if $ARGV[$i] eq '-goutfile';
+}
+defined $fileNameOut or die "No -goutfile argument given\n";
+
+# Report a failed rename instead of silently leaving the output missing.
+move($fileNameOut . ".1.png", $fileNameOut)
+    or die "Cannot rename $fileNameOut.1.png to $fileNameOut: $!\n";
diff --git a/tools/emboss_5/emboss_cpgreport.xml b/tools/emboss_5/emboss_cpgreport.xml
new file mode 100644
index 00000000000..6c15dba8de2
--- /dev/null
+++ b/tools/emboss_5/emboss_cpgreport.xml
@@ -0,0 +1,57 @@
+
+ Reports all CpG rich regions
+
+ macros.xml
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/cpgreport.html
+
+
+
diff --git a/tools/emboss_5/emboss_cusp.xml b/tools/emboss_5/emboss_cusp.xml
new file mode 100644
index 00000000000..c24eed6d595
--- /dev/null
+++ b/tools/emboss_5/emboss_cusp.xml
@@ -0,0 +1,32 @@
+
+ Create a codon usage table
+
+ macros.xml
+
+
+ cusp -sequence '$input1' -outfile '$out_file1' -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/cusp.html
+
+
+
diff --git a/tools/emboss_5/emboss_cutseq.xml b/tools/emboss_5/emboss_cutseq.xml
new file mode 100644
index 00000000000..dea4462a107
--- /dev/null
+++ b/tools/emboss_5/emboss_cutseq.xml
@@ -0,0 +1,69 @@
+
+ Removes a specified section from a sequence
+
+ macros.xml
+
+
+
+ cutseq -sequence '$input1' -outseq '$out_file1' -from $from -to $to -osformat2 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/cutseq.html
+
+
+
diff --git a/tools/emboss_5/emboss_dan.xml b/tools/emboss_5/emboss_dan.xml
new file mode 100644
index 00000000000..111bf099c2d
--- /dev/null
+++ b/tools/emboss_5/emboss_dan.xml
@@ -0,0 +1,66 @@
+
+ Calculates DNA RNA/DNA melting temperature
+
+ macros.xml
+
+
+
+ perl '$__tool_directory__/emboss_single_outputfile_wrapper.pl' dan -sequence '$input1' -windowsize $window -goutfile '$out_file1' -graph png -plot $plot1 -shiftincrement $shift -dnaconc $dnaconc
+ -saltconc $saltconc -product $product -formamide $formamide -mismatch $mismatch -prodlen $prodlen -thermo $thermo -temperature $temperature -rna $rna -outfile $out_file1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/dan.html
+
+
+
diff --git a/tools/emboss_5/emboss_degapseq.xml b/tools/emboss_5/emboss_degapseq.xml
new file mode 100644
index 00000000000..ec68aed2801
--- /dev/null
+++ b/tools/emboss_5/emboss_degapseq.xml
@@ -0,0 +1,59 @@
+
+ Removes gap characters from sequences
+
+ macros.xml
+
+
+
+ degapseq -sequence '$input1' -outseq '$out_file1' -osformat2 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/degapseq.html
+
+
+
diff --git a/tools/emboss_5/emboss_descseq.xml b/tools/emboss_5/emboss_descseq.xml
new file mode 100644
index 00000000000..0b91178b52e
--- /dev/null
+++ b/tools/emboss_5/emboss_descseq.xml
@@ -0,0 +1,68 @@
+
+ Alter the name or description of a sequence
+
+ macros.xml
+
+
+
+ descseq -sequence '$input1' -outseq '$out_file1' -name '$seqname' -description '$desc' -append $append -osformat2 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/descseq.html
+
+
+
diff --git a/tools/emboss_5/emboss_diffseq.xml b/tools/emboss_5/emboss_diffseq.xml
new file mode 100644
index 00000000000..f73a19ab76f
--- /dev/null
+++ b/tools/emboss_5/emboss_diffseq.xml
@@ -0,0 +1,58 @@
+
+ Find differences between nearly identical sequences
+
+ macros.xml
+
+
+
+ diffseq -asequence '$input1' -bsequence '$input2' -outfile '$out_file1' -aoutfeat '$out_file2' -boutfeat '$out_file3' -wordsize $wordsize -globaldifferences $globaldifferences -rformat3
+ $out_format1 -offormat4 $out_format2 -offormat5 $out_format3 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/diffseq.html
+
+
+
diff --git a/tools/emboss_5/emboss_digest.xml b/tools/emboss_5/emboss_digest.xml
new file mode 100644
index 00000000000..2d4f1331cea
--- /dev/null
+++ b/tools/emboss_5/emboss_digest.xml
@@ -0,0 +1,61 @@
+
+ Protein proteolytic enzyme or reagent cleavage digest
+
+ macros.xml
+
+
+
+ digest -seqall '$input1' -outfile '$out_file1' -menu $menu -unfavoured $unfavoured -overlap $overlap -allpartials $allpartials -rformat2 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/digest.html
+
+
+
diff --git a/tools/emboss_5/emboss_dotmatcher.xml b/tools/emboss_5/emboss_dotmatcher.xml
new file mode 100644
index 00000000000..dedf58e0d60
--- /dev/null
+++ b/tools/emboss_5/emboss_dotmatcher.xml
@@ -0,0 +1,24 @@
+
+ Displays a thresholded dotplot of two sequences
+
+ macros.xml
+
+
+ perl '$__tool_directory__/emboss_single_outputfile_wrapper.pl' dotmatcher -asequence '$input1' -bsequence '$input2' -goutfile '$out_file1' -windowsize $windowsize -threshold $threshold -graph png -xygraph png -auto
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/dotmatcher.html
+
+
+
diff --git a/tools/emboss_5/emboss_dotpath.xml b/tools/emboss_5/emboss_dotpath.xml
new file mode 100644
index 00000000000..ffac325b898
--- /dev/null
+++ b/tools/emboss_5/emboss_dotpath.xml
@@ -0,0 +1,31 @@
+
+ Non-overlapping wordmatch dotplot of two sequences
+
+ macros.xml
+
+
+ perl '$__tool_directory__/emboss_single_outputfile_wrapper.pl' dotpath -asequence '$input1' -bsequence '$input2' -goutfile '$out_file1' -wordsize $wordsize -overlaps $overlaps -boxit $boxit -graph png -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/dotpath.html
+
+
+
diff --git a/tools/emboss_5/emboss_dottup.xml b/tools/emboss_5/emboss_dottup.xml
new file mode 100644
index 00000000000..6f51fdcaef3
--- /dev/null
+++ b/tools/emboss_5/emboss_dottup.xml
@@ -0,0 +1,27 @@
+
+ Displays a wordmatch dotplot of two sequences
+
+ macros.xml
+
+
+ perl '$__tool_directory__/emboss_single_outputfile_wrapper.pl' dottup -asequence '$input1' -bsequence '$input2' -goutfile '$out_file1' -wordsize $wordsize -boxit $boxit -graph png -xygraph png -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/dottup.html
+
+
+
diff --git a/tools/emboss_5/emboss_dreg.xml b/tools/emboss_5/emboss_dreg.xml
new file mode 100644
index 00000000000..01971a3b3c3
--- /dev/null
+++ b/tools/emboss_5/emboss_dreg.xml
@@ -0,0 +1,22 @@
+
+ Regular expression search of a nucleotide sequence
+
+ macros.xml
+
+
+ dreg -sequence '$input1' -outfile '$out_file1' -pattern '$pattern' -raccshow3 "no" -rusashow3 "no" -rdesshow3 "no" -auto
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/dreg.html
+
+
+
diff --git a/tools/emboss_5/emboss_einverted.xml b/tools/emboss_5/emboss_einverted.xml
new file mode 100644
index 00000000000..6f3d56ac1d8
--- /dev/null
+++ b/tools/emboss_5/emboss_einverted.xml
@@ -0,0 +1,42 @@
+
+ Finds DNA inverted repeats
+
+ macros.xml
+
+
+ einverted -sequence '$input1' -outfile '$out_file1' -gap $gap -threshold $threshold -match $match -mismatch $mismatch -maxrepeat $maxrepeat -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/einverted.html
+
+
+
diff --git a/tools/emboss_5/emboss_epestfind.xml b/tools/emboss_5/emboss_epestfind.xml
new file mode 100644
index 00000000000..48188a4c5cb
--- /dev/null
+++ b/tools/emboss_5/emboss_epestfind.xml
@@ -0,0 +1,58 @@
+
+ Finds PEST motifs as potential proteolytic cleavage sites
+
+ macros.xml
+
+
+ perl '$__tool_directory__/emboss_single_outputfile_wrapper.pl' epestfind -sequence '$input1' -goutfile '$ofile2' -outfile '$ofile1' -window $window -order $order -potential $potential -poor $poor
+ -invalid $invalid -map $map -graph png -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/epestfind.html
+
+
+
diff --git a/tools/emboss_5/emboss_equicktandem.xml b/tools/emboss_5/emboss_equicktandem.xml
new file mode 100644
index 00000000000..5656b3e2d55
--- /dev/null
+++ b/tools/emboss_5/emboss_equicktandem.xml
@@ -0,0 +1,57 @@
+
+ Finds tandem repeats
+
+ macros.xml
+
+
+
+ equicktandem -sequence '$input1' -outfile '$out_file1' -origfile '$ofile2' -maxrepeat $maxrepeat -threshold $threshold -rformat2 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/equicktandem.html
+
+
+
diff --git a/tools/emboss_5/emboss_est2genome.xml b/tools/emboss_5/emboss_est2genome.xml
new file mode 100644
index 00000000000..7eba62aaf5d
--- /dev/null
+++ b/tools/emboss_5/emboss_est2genome.xml
@@ -0,0 +1,80 @@
+
+ Align EST and genomic DNA sequences
+
+ macros.xml
+
+
+ est2genome -estsequence '$input1' -genomesequence '$input2' -outfile '$out_file1' -match $match -mismatch $mismatch -gappenalty $gappenalty -intronpenalty $intronpenalty -splicepenalty
+ $splicepenalty -minscore $minscore -reverse $reverse -splice $splice -mode $mode -best $best -shuffle $shuffle -seed $seed -align $align -width $width -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/est2genome.html
+
+
+
diff --git a/tools/emboss_5/emboss_etandem.xml b/tools/emboss_5/emboss_etandem.xml
new file mode 100644
index 00000000000..e912e078c09
--- /dev/null
+++ b/tools/emboss_5/emboss_etandem.xml
@@ -0,0 +1,69 @@
+
+ Looks for tandem repeats in a nucleotide sequence
+
+ macros.xml
+
+
+
+ etandem -sequence '$input1' -outfile '$out_file1' -origfile '$ofile2' -minrepeat $minrepeat -maxrepeat $maxrepeat -threshold $threshold -mismatch $mismatch -uniform $uniform -rformat2 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/etandem.html
+
+
+
diff --git a/tools/emboss_5/emboss_extractfeat.xml b/tools/emboss_5/emboss_extractfeat.xml
new file mode 100644
index 00000000000..896e899cd10
--- /dev/null
+++ b/tools/emboss_5/emboss_extractfeat.xml
@@ -0,0 +1,76 @@
+
diff --git a/tools/emboss_5/emboss_extractseq.xml b/tools/emboss_5/emboss_extractseq.xml
new file mode 100644
index 00000000000..3b22779e66d
--- /dev/null
+++ b/tools/emboss_5/emboss_extractseq.xml
@@ -0,0 +1,66 @@
+
diff --git a/tools/emboss_5/emboss_format_corrector.py b/tools/emboss_5/emboss_format_corrector.py
new file mode 100644
index 00000000000..a387b3b695a
--- /dev/null
+++ b/tools/emboss_5/emboss_format_corrector.py
@@ -0,0 +1,52 @@
+# EMBOSS format corrector
+import operator
+
+
+# Properly set file formats before job run
+def exec_before_job( app, inp_data=None, out_data=None, tool=None, param_dict=None ):
+    """Retype output datasets according to the format parameters of the job.
+
+    Outputs are taken in name-sorted order and numbered from 1. Output ``n``
+    is retyped from ``out_format<n>`` (any value other than None), then to
+    html when ``html_out<n>`` is "yes", then to png when ``plot<n>`` is "yes".
+
+    :param app: only ``datatypes_registry`` and ``model.context`` are used
+    :param inp_data: unused
+    :param out_data: mapping of output name to output dataset
+    :param tool: unused
+    :param param_dict: mapping of parameter name to value
+    """
+    # Both mappings default to None in the signature; treat that as "empty"
+    # rather than failing on None.items() / None.get().
+    if out_data is None:
+        out_data = {}
+    if param_dict is None:
+        param_dict = {}
+
+    # Sort by output name so that position n matches the <prefix><n> parameters.
+    ordered = sorted(out_data.items(), key=operator.itemgetter(0))
+    outputs = [data for _name, data in ordered]
+
+    def change_ext(data, ext):
+        # Retype one dataset, then add it to the model context and flush.
+        data = app.datatypes_registry.change_datatype(data, ext)
+        app.model.context.add(data)
+        app.model.context.flush()
+
+    # normal filetype correction (some EMBOSS names differ from the target ones)
+    for count, data in enumerate(outputs, 1):
+        output_type = param_dict.get('out_format' + str(count), None)
+        if output_type is not None:
+            if output_type == 'ncbi':
+                output_type = "fasta"
+            elif output_type == 'excel':
+                output_type = "tabular"
+            elif output_type == 'text':
+                output_type = "txt"
+            change_ext(data, output_type)
+
+    # html filetype correction first, then png file correction, as before
+    for prefix, ext in (('html_out', "html"), ('plot', "png")):
+        for count, data in enumerate(outputs, 1):
+            if param_dict.get(prefix + str(count), None) == "yes":
+                change_ext(data, ext)
diff --git a/tools/emboss_5/emboss_freak.xml b/tools/emboss_5/emboss_freak.xml
new file mode 100644
index 00000000000..17f489e504b
--- /dev/null
+++ b/tools/emboss_5/emboss_freak.xml
@@ -0,0 +1,32 @@
+
+ Residue/base frequency table or plot
+
+ macros.xml
+
+
+ freak -seqall '$input1' -outfile '$out_file1' -window $window -letters '$letters' -graph png -step $step -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/freak.html
+
+
+
diff --git a/tools/emboss_5/emboss_fuzznuc.xml b/tools/emboss_5/emboss_fuzznuc.xml
new file mode 100644
index 00000000000..f23a85e8c4a
--- /dev/null
+++ b/tools/emboss_5/emboss_fuzznuc.xml
@@ -0,0 +1,71 @@
+
+ Nucleic acid pattern search
+
+ macros.xml
+
+
+
+ fuzznuc -sequence '$input1' -outfile '$out_file1' -pattern '$pattern' -pmismatch $mismatch -complement $complement -rformat2 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/fuzznuc.html
+
+
+
diff --git a/tools/emboss_5/emboss_fuzzpro.xml b/tools/emboss_5/emboss_fuzzpro.xml
new file mode 100644
index 00000000000..b803ae91d06
--- /dev/null
+++ b/tools/emboss_5/emboss_fuzzpro.xml
@@ -0,0 +1,50 @@
+
+ Protein pattern search
+
+ macros.xml
+
+
+
+ fuzzpro -sequence '$input1' -outfile '$out_file1' -pattern '$pattern' -pmismatch $mismatch -rformat2 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/fuzzpro.html
+
+
+
diff --git a/tools/emboss_5/emboss_fuzztran.xml b/tools/emboss_5/emboss_fuzztran.xml
new file mode 100644
index 00000000000..0853cf8ff35
--- /dev/null
+++ b/tools/emboss_5/emboss_fuzztran.xml
@@ -0,0 +1,89 @@
+
+ Protein pattern search after translation
+
+ macros.xml
+
+
+
+ fuzztran -sequence '$input1' -outfile '$out_file1' -pattern '$pattern' -pmismatch $mismatch -frame $frame -table $table -rformat2 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/fuzztran.html
+
+
+
diff --git a/tools/emboss_5/emboss_garnier.xml b/tools/emboss_5/emboss_garnier.xml
new file mode 100644
index 00000000000..95bc4c27cda
--- /dev/null
+++ b/tools/emboss_5/emboss_garnier.xml
@@ -0,0 +1,56 @@
+
+ Predicts protein secondary structure
+
+ macros.xml
+
+
+
+ garnier -sequence '$input1' -outfile '$out_file1' -idc $idc -rformat2 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: https://galaxy-iuc.github.io/emboss-5.0-docs/garnier.html
+
+
+
diff --git a/tools/emboss_5/emboss_geecee.xml b/tools/emboss_5/emboss_geecee.xml
new file mode 100644
index 00000000000..1d621ae165e
--- /dev/null
+++ b/tools/emboss_5/emboss_geecee.xml
@@ -0,0 +1,26 @@
+
+ Calculates fractional GC content of nucleic acid sequences
+
+ macros.xml
+
+
+ geecee -sequence '$input1' -outfile '$out_file1' -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/geecee.html
+
+
+
diff --git a/tools/emboss_5/emboss_getorf.xml b/tools/emboss_5/emboss_getorf.xml
new file mode 100644
index 00000000000..3f312a1c131
--- /dev/null
+++ b/tools/emboss_5/emboss_getorf.xml
@@ -0,0 +1,118 @@
+
+ Finds and extracts open reading frames (ORFs)
+
+ macros.xml
+
+
+
+ getorf -sequence '$input1' -outseq '$out_file1' -table $table -minsize $minsize -maxsize $maxsize -find $find -methionine $methionine -circular $circular -reverse $reverse -flanking $flanking
+ -osformat2 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/getorf.html
+
+
+
diff --git a/tools/emboss_5/emboss_helixturnhelix.xml b/tools/emboss_5/emboss_helixturnhelix.xml
new file mode 100644
index 00000000000..30cee6d1807
--- /dev/null
+++ b/tools/emboss_5/emboss_helixturnhelix.xml
@@ -0,0 +1,57 @@
+
+ Report nucleic acid binding motifs
+
+ macros.xml
+
+
+
+ helixturnhelix -sequence '$input1' -outfile '$out_file1' -mean $mean -sd $sd -minsd $minsd -eightyseven $eightyseven -rformat2 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/helixturnhelix.html
+
+
+
diff --git a/tools/emboss_5/emboss_hmoment.xml b/tools/emboss_5/emboss_hmoment.xml
new file mode 100644
index 00000000000..1d76d2b43d2
--- /dev/null
+++ b/tools/emboss_5/emboss_hmoment.xml
@@ -0,0 +1,30 @@
+
+ Hydrophobic moment calculation
+
+ macros.xml
+
+
+ hmoment -seqall '$input1' -outfile '$out_file1' -window $window -aangle $aangle -graph png -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/hmoment.html
+
+
+
diff --git a/tools/emboss_5/emboss_iep.xml b/tools/emboss_5/emboss_iep.xml
new file mode 100644
index 00000000000..df5b5d04511
--- /dev/null
+++ b/tools/emboss_5/emboss_iep.xml
@@ -0,0 +1,35 @@
+
+ Calculates the isoelectric point of a protein
+
+ macros.xml
+
+
+ iep -sequence '$input1' -outfile '$out_file1' -step $step -amino $amino -graph png -termini $termini -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/iep.html
+
+
+
diff --git a/tools/emboss_5/emboss_infoseq.xml b/tools/emboss_5/emboss_infoseq.xml
new file mode 100644
index 00000000000..2e0ba793a0a
--- /dev/null
+++ b/tools/emboss_5/emboss_infoseq.xml
@@ -0,0 +1,67 @@
+
+
+ Displays some simple information about sequences
+
+ macros.xml
+
+
+
+ infoseq -sequence '$input1' -outfile '$out_file1' -html $html_out1 -heading $heading -usa $usa -name $disname -accession $accession -gi $gi -version $version -type $type -length $length -pgc
+ $pgc -description $description -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/infoseq.html
+
+
+
diff --git a/tools/emboss_5/emboss_infoseq_wrapper.pl b/tools/emboss_5/emboss_infoseq_wrapper.pl
new file mode 100644
index 00000000000..188e03f8d42
--- /dev/null
+++ b/tools/emboss_5/emboss_infoseq_wrapper.pl
@@ -0,0 +1,9 @@
+#! /usr/bin/perl -w
+use strict;
+# Wrapper: runs the command line passed in @ARGV, then prints an "Extension: html" notice when argument 7 contains "yes".
+my $cmd_string = join (" ",@ARGV);  # rebuild the command line, arguments separated by single spaces
+my $results = `$cmd_string`;  # run via backticks (shell); captured stdout is stored but not used afterwards
+if ($ARGV[6]=~/yes/)  # index 6 is presumably the -html value when called as "infoseq -sequence X -outfile Y -html Z ..." -- TODO confirm against caller
+{
+ print "Extension: html\n";
+}
diff --git a/tools/emboss_5/emboss_isochore.xml b/tools/emboss_5/emboss_isochore.xml
new file mode 100644
index 00000000000..b5b15e7d879
--- /dev/null
+++ b/tools/emboss_5/emboss_isochore.xml
@@ -0,0 +1,77 @@
+
+ Plots isochores in large DNA sequences
+
+ macros.xml
+
+
+ perl '$__tool_directory__/emboss_single_outputfile_wrapper.pl' isochore -sequence '$input1' -outfile '$ofile2' -goutfile '$ofile1' -graph png -window $window -shift $shift -auto
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+**Syntax**
+
+This application plots GC content over a sequence. It is intended for large sequences such as complete chromosomes or large genomic contigs, although interesting results can also be obtained from shorter sequences. You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/isochore.html
+
+- Both **Window size** and **Shift increment** are integers.
+
+-----
+
+**Example**
+
+- Input sequences::
+
+ >hg18_dna range=chrX:151073054-151073376 5'pad=0 3'pad=0 revComp=FALSE strand=? repeatMasking=none
+ TTTATGTCTATAATCCTTACCAAAAGTTACCTTGGAATAAGAAGAAGTCA
+ GTAAAAAGAAGGCTGTTGTTCCGTGAAATACTGTCTTTATGCCTCAGATT
+ TGGAGTGCTCAGAGCCTCTGCAGCAAAGATTTGGCATGTGTCCTAGGCCT
+ GCTCAGAGCAGCAAATCCCACCCTCTTGGAGAATGAGACTCATAGAGGGA
+ CAGCTCCCTCCTCAGAGGCTTCTCTAATGGGACTCCAAAGAGCAAACACT
+ CAGCCCCATGAGGACTGGCCAGGCCAAGTGGTGTGTGGGAACAGGGAGCA
+ GCGGTTTCCAAGAGGATACAGTA
+
+- Output data file::
+
+ Position Percent G+C 1 .. 323
+ 80 0.422
+ 112 0.460
+ 144 0.509
+ 176 0.534
+ 208 0.553
+ 240 0.553
+
+- Output graphics file:
+
+.. image:: ./static/emboss_icons/isochore.png
+
+
+
diff --git a/tools/emboss_5/emboss_lindna.xml b/tools/emboss_5/emboss_lindna.xml
new file mode 100644
index 00000000000..4474b799e6e
--- /dev/null
+++ b/tools/emboss_5/emboss_lindna.xml
@@ -0,0 +1,72 @@
+
+
+ Draws linear maps of DNA constructs
+
+ macros.xml
+
+
+ lindna -infile '$input1' -graphout png -goutfile '$out_file1' -ruler $ruler -blocktype $blocktype -maxgroups $maxgroups -maxlabels $maxlabels -intersymbol $intersymbol -intercolour $intercolour
+ -interticks $interticks -gapsize $gapsize -ticklines $ticklines -textheight $textheight -textlength $textlength -margin $margin -tickheight $tickheight -blockheight $blockheight -rangeheight
+ $rangeheight -gapgroup $gapgroup -postext $postext -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/lindna.html
+
+
+
diff --git a/tools/emboss_5/emboss_marscan.xml b/tools/emboss_5/emboss_marscan.xml
new file mode 100644
index 00000000000..bb77b0cde39
--- /dev/null
+++ b/tools/emboss_5/emboss_marscan.xml
@@ -0,0 +1,46 @@
+
+ Finds MAR/SAR sites in nucleic sequences
+
+ macros.xml
+
+
+
+ marscan -sequence '$input1' -outfile '$out_file1' -rformat2 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/marscan.html
+
+
+
diff --git a/tools/emboss_5/emboss_maskfeat.xml b/tools/emboss_5/emboss_maskfeat.xml
new file mode 100644
index 00000000000..b707d6eaa2b
--- /dev/null
+++ b/tools/emboss_5/emboss_maskfeat.xml
@@ -0,0 +1,68 @@
+
+ Mask off features of a sequence
+
+ macros.xml
+
+
+
+ maskfeat -sequence '$input1' -outseq '$out_file1' -type '$type' -tolower $tolower -maskchar '$maskchar' -osformat2 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/maskfeat.html
+
+
+
diff --git a/tools/emboss_5/emboss_maskseq.xml b/tools/emboss_5/emboss_maskseq.xml
new file mode 100644
index 00000000000..40905f19a90
--- /dev/null
+++ b/tools/emboss_5/emboss_maskseq.xml
@@ -0,0 +1,68 @@
+
+ Mask off regions of a sequence
+
+ macros.xml
+
+
+
+ maskseq -sequence '$input1' -outseq '$out_file1' -regions '$regions' -tolower $tolower -maskchar '$maskchar' -osformat2 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/maskseq.html
+
+
+
diff --git a/tools/emboss_5/emboss_matcher.xml b/tools/emboss_5/emboss_matcher.xml
new file mode 100644
index 00000000000..041fb70effd
--- /dev/null
+++ b/tools/emboss_5/emboss_matcher.xml
@@ -0,0 +1,50 @@
+
+ Finds the best local alignments between two sequences
+
+ macros.xml
+
+
+
+ matcher -asequence '$input1' -bsequence '$input2' -outfile '$out_file1' -alternatives $alternatives -gapopen $gapopen -gapextend $gapextend -aformat3 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/matcher.html
+
+
+
diff --git a/tools/emboss_5/emboss_megamerger.xml b/tools/emboss_5/emboss_megamerger.xml
new file mode 100644
index 00000000000..f507fe501f6
--- /dev/null
+++ b/tools/emboss_5/emboss_megamerger.xml
@@ -0,0 +1,59 @@
+
+ Merge two large overlapping nucleic acid sequences
+
+ macros.xml
+
+
+
+ megamerger -asequence '$input1' -bsequence '$input2' -outseq '$out_file1' -outfile '$out_file2' -wordsize $wordsize -prefer $prefer -osformat3 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/megamerger.html
+
+
+
diff --git a/tools/emboss_5/emboss_merger.xml b/tools/emboss_5/emboss_merger.xml
new file mode 100644
index 00000000000..7dcb3af6bdf
--- /dev/null
+++ b/tools/emboss_5/emboss_merger.xml
@@ -0,0 +1,70 @@
+
+ Merge two overlapping nucleic acid sequences
+
+ macros.xml
+
+
+
+ merger -asequence '$input1' -bsequence '$input2' -outseq '$out_file1' -outfile '$out_file2' -gapopen $gapopen -gapextend $gapextend -osformat4 $out_format1 -aformat3 $out_format2 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/merger.html
+
+
+
diff --git a/tools/emboss_5/emboss_msbar.xml b/tools/emboss_5/emboss_msbar.xml
new file mode 100644
index 00000000000..7ecd9b9bc28
--- /dev/null
+++ b/tools/emboss_5/emboss_msbar.xml
@@ -0,0 +1,107 @@
+
+ Mutate sequence beyond all recognition
+
+ macros.xml
+
+
+
+ msbar -sequence '$input1' -outseq '$out_file1' -count $count -point $point -block $block -codon $codon -inframe $inframe -minimum $minimum -maximum $maximum -osformat2 $out_format1
+ -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/msbar.html
+
+
+
diff --git a/tools/emboss_5/emboss_multiple_outputfile_wrapper.pl b/tools/emboss_5/emboss_multiple_outputfile_wrapper.pl
new file mode 100644
index 00000000000..e87c5423070
--- /dev/null
+++ b/tools/emboss_5/emboss_multiple_outputfile_wrapper.pl
@@ -0,0 +1,19 @@
+#! /usr/bin/perl -w
+use strict;
+# Wrapper: runs the command line passed in @ARGV and re-emits its stdout, rewriting lines containing "Created " as "outfile: <name>".
+my $cmd_string = join (" ",@ARGV);  # rebuild the command line, arguments separated by single spaces
+my $results = `$cmd_string`;  # run via backticks (shell) and capture stdout
+my @files = split("\n",$results);  # one entry per output line
+foreach my $thisLine (@files)
+{
+ if ($thisLine =~ /Created /)  # line contains the text "Created "
+ {
+ $thisLine =~ /[\w|\.]+$/;  # trailing run of word characters, '.' or '|' (inside [] the '|' is a literal, not alternation)
+ $thisLine =$&;  # $& is the last successful match; NOTE(review): if the match above fails, $& still holds "Created " from the if-test
+ print "outfile: $thisLine\n";
+ }
+ else
+ {
+ print $thisLine,"\n";  # any other line is echoed unchanged
+ }
+}
diff --git a/tools/emboss_5/emboss_needle.xml b/tools/emboss_5/emboss_needle.xml
new file mode 100644
index 00000000000..0caa66b0cfb
--- /dev/null
+++ b/tools/emboss_5/emboss_needle.xml
@@ -0,0 +1,118 @@
+
+ Needleman-Wunsch global alignment
+
+ macros.xml
+
+
+
+ needle -asequence '$input1' -bsequence '$input2' -outfile '$out_file1' -gapopen $gapopen -gapextend $gapextend -brief $brief -aformat3 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+needle reads any two sequences of the same type (DNA or protein).
+
+-----
+
+**Syntax**
+
+This tool uses the Needleman-Wunsch global alignment algorithm to find the optimum alignment (including gaps) of two sequences when considering their entire length.
+
+- **Optimal alignment:** Dynamic programming methods ensure the optimal global alignment by exploring all possible alignments and choosing the best.
+
+- **The Needleman-Wunsch algorithm** is a member of the class of algorithms that can calculate the best score and alignment in the order of mn steps, (where 'n' and 'm' are the lengths of the two sequences).
+
+- **Gap open penalty:** [10.0 for any sequence] The gap open penalty is the score taken away when a gap is created. The best value depends on the choice of comparison matrix. The default value assumes you are using the EBLOSUM62 matrix for protein sequences, and the EDNAFULL matrix for nucleotide sequences. (Floating point number from 1.0 to 100.0)
+
+- **Gap extension penalty:** [0.5 for any sequence] The gap extension penalty is added to the standard gap penalty for each base or residue in the gap. This is how long gaps are penalized. Usually you will expect a few long gaps rather than many short gaps, so the gap extension penalty should be lower than the gap penalty. An exception is where one or both sequences are single reads with possible sequencing errors in which case you would expect many single base gaps. You can get this result by setting the gap open penalty to zero (or very low) and using the gap extension penalty to control gap scoring. (Floating point number from 0.0 to 10.0)
+
+You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/needle.html
+
+-----
+
+**Example**
+
+- Input File::
+
+ >hg18_dna range=chrX:151073054-151073136 5'pad=0 3'pad=0 revComp=FALSE strand=? repeatMasking=none
+ TTTATGTCTATAATCCTTACCAAAAGTTACCTTGGAATAAGAAGAAGTCA
+ GTAAAAAGAAGGCTGTTGTTCCGTGAAATACTG
+
+- If both Sequence1 and Sequence2 take the above file as input, Gap open penalty equals 10.0, Gap extension penalty equals 0.5, Brief identity and similarity is set to Yes, Output alignment file format is set to SRS pairs, the output file is::
+
+ ########################################
+ # Program: needle
+ # Rundate: Mon Apr 02 2007 14:23:16
+ # Align_format: srspair
+ # Report_file: ./database/files/dataset_7.dat
+ ########################################
+
+ #=======================================
+ #
+ # Aligned_sequences: 2
+ # 1: hg18_dna
+ # 2: hg18_dna
+ # Matrix: EDNAFULL
+ # Gap_penalty: 10.0
+ # Extend_penalty: 0.5
+ #
+ # Length: 83
+ # Identity: 83/83 (100.0%)
+ # Similarity: 83/83 (100.0%)
+ # Gaps: 0/83 ( 0.0%)
+ # Score: 415.0
+ #
+ #=======================================
+
+ hg18_dna 1 TTTATGTCTATAATCCTTACCAAAAGTTACCTTGGAATAAGAAGAAGTCA 50
+ ||||||||||||||||||||||||||||||||||||||||||||||||||
+ hg18_dna 1 TTTATGTCTATAATCCTTACCAAAAGTTACCTTGGAATAAGAAGAAGTCA 50
+
+ hg18_dna 51 GTAAAAAGAAGGCTGTTGTTCCGTGAAATACTG 83
+ |||||||||||||||||||||||||||||||||
+ hg18_dna 51 GTAAAAAGAAGGCTGTTGTTCCGTGAAATACTG 83
+
+ #---------------------------------------
+ #---------------------------------------
+
+
+
diff --git a/tools/emboss_5/emboss_newcpgreport.xml b/tools/emboss_5/emboss_newcpgreport.xml
new file mode 100644
index 00000000000..79721769dbd
--- /dev/null
+++ b/tools/emboss_5/emboss_newcpgreport.xml
@@ -0,0 +1,36 @@
+
+ Report CpG rich areas
+
+ macros.xml
+
+
+ newcpgreport -sequence '$input1' -window $window -shift $shift -minlen $minlen -minpc $minpc -outfile '$out_file1' -minoe $minoe -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/newcpgreport.html
+
+
+
diff --git a/tools/emboss_5/emboss_newcpgseek.xml b/tools/emboss_5/emboss_newcpgseek.xml
new file mode 100644
index 00000000000..610cfbb02dc
--- /dev/null
+++ b/tools/emboss_5/emboss_newcpgseek.xml
@@ -0,0 +1,34 @@
+
+ Reports CpG rich region
+
+ macros.xml
+
+
+ newcpgseek -sequence '$input1' -outfile '$out_file1' -score $score -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/newcpgseek.html
+
+
+
diff --git a/tools/emboss_5/emboss_newseq.xml b/tools/emboss_5/emboss_newseq.xml
new file mode 100644
index 00000000000..e90a85ddaf7
--- /dev/null
+++ b/tools/emboss_5/emboss_newseq.xml
@@ -0,0 +1,79 @@
+
+ Type in a short new sequence
+
+ macros.xml
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/newseq.html
+
+
+
diff --git a/tools/emboss_5/emboss_noreturn.xml b/tools/emboss_5/emboss_noreturn.xml
new file mode 100644
index 00000000000..3f10cb9bbb0
--- /dev/null
+++ b/tools/emboss_5/emboss_noreturn.xml
@@ -0,0 +1,32 @@
+
+ Removes carriage return from ASCII files
+
+ macros.xml
+
+
+ noreturn -infile '$input1' -outfile '$out_file1' -system $system -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/noreturn.html
+
+
+
diff --git a/tools/emboss_5/emboss_notseq.xml b/tools/emboss_5/emboss_notseq.xml
new file mode 100644
index 00000000000..95ca06e2ef9
--- /dev/null
+++ b/tools/emboss_5/emboss_notseq.xml
@@ -0,0 +1,67 @@
+
+ Exclude a set of sequences and write out the remaining ones
+
+ macros.xml
+
+
+
+ notseq -sequence '$input1' -outseq '$out_file1' -exclude '$exclude' -osformat3 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/notseq.html
+
+
+
diff --git a/tools/emboss_5/emboss_nthseq.xml b/tools/emboss_5/emboss_nthseq.xml
new file mode 100644
index 00000000000..fd2dea33b7c
--- /dev/null
+++ b/tools/emboss_5/emboss_nthseq.xml
@@ -0,0 +1,67 @@
+
+ Writes one sequence from a multiple set of sequences
+
+ macros.xml
+
+
+
+ nthseq -sequence '$input1' -outseq '$out_file1' -number $number -osformat2 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/nthseq.html
+
+
+
diff --git a/tools/emboss_5/emboss_octanol.xml b/tools/emboss_5/emboss_octanol.xml
new file mode 100644
index 00000000000..18f2e62a3ca
--- /dev/null
+++ b/tools/emboss_5/emboss_octanol.xml
@@ -0,0 +1,35 @@
+
+
+ Displays protein hydropathy
+
+ macros.xml
+
+
+ perl '$__tool_directory__/emboss_single_outputfile_wrapper.pl' octanol -sequence '$input1' -graph png -goutfile '$out_file1' -width $width -octanolplot $octanolplot -interfaceplot $interfaceplot
+ -differenceplot $differenceplot -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/octanol.html
+
+
+
diff --git a/tools/emboss_5/emboss_oddcomp.xml b/tools/emboss_5/emboss_oddcomp.xml
new file mode 100644
index 00000000000..f8c8ab4ad39
--- /dev/null
+++ b/tools/emboss_5/emboss_oddcomp.xml
@@ -0,0 +1,36 @@
+
+
+ Find protein sequence regions with a biased composition
+
+ macros.xml
+
+
+ oddcomp -sequence '$input1' -infile '$input2' -outfile '$out_file1' -window $window -ignorebz $ignorebz -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/oddcomp.html
+
+
+
diff --git a/tools/emboss_5/emboss_palindrome.xml b/tools/emboss_5/emboss_palindrome.xml
new file mode 100644
index 00000000000..bc709e28925
--- /dev/null
+++ b/tools/emboss_5/emboss_palindrome.xml
@@ -0,0 +1,45 @@
+
+ Looks for inverted repeats in a nucleotide sequence
+
+ macros.xml
+
+
+ palindrome -sequence '$input1' -outfile '$out_file1' -minpallen $minpallen -maxpallen $maxpallen -gaplimit $gaplimit -nummismatches $nummismatches -overlap $overlap -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/palindrome.html
+
+
+
diff --git a/tools/emboss_5/emboss_pasteseq.xml b/tools/emboss_5/emboss_pasteseq.xml
new file mode 100644
index 00000000000..cd2134a25b5
--- /dev/null
+++ b/tools/emboss_5/emboss_pasteseq.xml
@@ -0,0 +1,69 @@
+
+ Insert one sequence into another
+
+ macros.xml
+
+
+
+ pasteseq -asequence '$input2' -bsequence '$input1' -outseq '$out_file1' -pos $pos -osformat3 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input datasets need to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/pasteseq.html
+
+
+
diff --git a/tools/emboss_5/emboss_patmatdb.xml b/tools/emboss_5/emboss_patmatdb.xml
new file mode 100644
index 00000000000..d01ccc153d0
--- /dev/null
+++ b/tools/emboss_5/emboss_patmatdb.xml
@@ -0,0 +1,48 @@
+
+ Search a protein sequence with a motif
+
+ macros.xml
+
+
+
+ patmatdb -sequence '$input1' -outfile '$out_file1' -motif '$motif' -rformat3 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/patmatdb.html
+
+
+
diff --git a/tools/emboss_5/emboss_pepcoil.xml b/tools/emboss_5/emboss_pepcoil.xml
new file mode 100644
index 00000000000..3560232cd1e
--- /dev/null
+++ b/tools/emboss_5/emboss_pepcoil.xml
@@ -0,0 +1,43 @@
+
+ Predicts coiled coil regions
+
+ macros.xml
+
+
+ pepcoil -sequence '$input1' -outfile '$out_file1' -window $window -coil $coil -frame $frame -other $other -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/pepcoil.html
+
+
+
diff --git a/tools/emboss_5/emboss_pepinfo.xml b/tools/emboss_5/emboss_pepinfo.xml
new file mode 100644
index 00000000000..7c9050c823e
--- /dev/null
+++ b/tools/emboss_5/emboss_pepinfo.xml
@@ -0,0 +1,27 @@
+
+
+ Plots simple amino acid properties in parallel
+
+ macros.xml
+
+
+ perl '$__tool_directory__/emboss_single_outputfile_wrapper.pl' pepinfo -sequence '$input1' -outfile '$out_file1' -goutfile '$out_file2' -graph png -hwindow $hwindow $plot_type -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/pepinfo.html
+
+
+
diff --git a/tools/emboss_5/emboss_pepnet.xml b/tools/emboss_5/emboss_pepnet.xml
new file mode 100644
index 00000000000..71784f85169
--- /dev/null
+++ b/tools/emboss_5/emboss_pepnet.xml
@@ -0,0 +1,28 @@
+
+
+ Displays proteins as a helical net
+
+ macros.xml
+
+
+ pepnet -sequence '$input1' -graph png -goutfile '$out_file1' -squares '$squares' -diamonds '$diamonds' -octags '$octags' -amphipathic $amphipathic -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/pepnet.html
+
+
+
diff --git a/tools/emboss_5/emboss_pepstats.xml b/tools/emboss_5/emboss_pepstats.xml
new file mode 100644
index 00000000000..607c8c546fe
--- /dev/null
+++ b/tools/emboss_5/emboss_pepstats.xml
@@ -0,0 +1,31 @@
+
+ Protein statistics
+
+ macros.xml
+
+
+ pepstats -sequence '$input1' -outfile '$out_file1' -termini $termini -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/pepstats.html
+
+
+
diff --git a/tools/emboss_5/emboss_pepwheel.xml b/tools/emboss_5/emboss_pepwheel.xml
new file mode 100644
index 00000000000..c190ee61224
--- /dev/null
+++ b/tools/emboss_5/emboss_pepwheel.xml
@@ -0,0 +1,35 @@
+
+
+ Shows protein sequences as helices
+
+ macros.xml
+
+
+ perl '$__tool_directory__/emboss_single_outputfile_wrapper.pl' pepwheel -sequence '$input1' -graph png -goutfile '$out_file1' -squares '$squares' -diamonds '$diamonds' -octags '$octags' -amphipathic
+ $amphipathic -steps $steps -turns $turns -wheel $wheel -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/pepwheel.html
+
+
+
diff --git a/tools/emboss_5/emboss_pepwindow.xml b/tools/emboss_5/emboss_pepwindow.xml
new file mode 100644
index 00000000000..ce4ab715900
--- /dev/null
+++ b/tools/emboss_5/emboss_pepwindow.xml
@@ -0,0 +1,22 @@
+
+
+ Displays protein hydropathy
+
+ macros.xml
+
+
+ perl '$__tool_directory__/emboss_single_outputfile_wrapper.pl' pepwindow -sequence '$input1' -graph png -goutfile '$out_file1' -length $length -auto
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/pepwindow.html
+
+
+
diff --git a/tools/emboss_5/emboss_pepwindowall.xml b/tools/emboss_5/emboss_pepwindowall.xml
new file mode 100644
index 00000000000..ce31a5a3171
--- /dev/null
+++ b/tools/emboss_5/emboss_pepwindowall.xml
@@ -0,0 +1,22 @@
+
+
+ Displays protein hydropathy of a set of sequences
+
+ macros.xml
+
+
+ perl '$__tool_directory__/emboss_single_outputfile_wrapper.pl' pepwindowall -sequence '$input1' -graph png -goutfile '$out_file1' -length $length -auto
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/pepwindowall.html
+
+
+
diff --git a/tools/emboss_5/emboss_plotcon.xml b/tools/emboss_5/emboss_plotcon.xml
new file mode 100644
index 00000000000..1955530640d
--- /dev/null
+++ b/tools/emboss_5/emboss_plotcon.xml
@@ -0,0 +1,22 @@
+
+
+ Plot quality of conservation of a sequence alignment
+
+ macros.xml
+
+
+ perl '$__tool_directory__/emboss_single_outputfile_wrapper.pl' plotcon -sequences '$input1' -graph png -goutfile '$out_file1' -winsize $winsize -auto
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/plotcon.html
+
+
+
diff --git a/tools/emboss_5/emboss_plotorf.xml b/tools/emboss_5/emboss_plotorf.xml
new file mode 100644
index 00000000000..c08a9da575e
--- /dev/null
+++ b/tools/emboss_5/emboss_plotorf.xml
@@ -0,0 +1,37 @@
+
+
+ Plot potential open reading frames
+
+ macros.xml
+
+
+ perl '$__tool_directory__/emboss_single_outputfile_wrapper.pl' plotorf -sequence '$input1' -graph png -goutfile '$out_file1' -start '$start' -stop '$stop' -auto
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/plotorf.html
+
+
+
diff --git a/tools/emboss_5/emboss_polydot.xml b/tools/emboss_5/emboss_polydot.xml
new file mode 100644
index 00000000000..e60babbe836
--- /dev/null
+++ b/tools/emboss_5/emboss_polydot.xml
@@ -0,0 +1,44 @@
+
+
+ Displays all-against-all dotplots of a set of sequences
+
+ macros.xml
+
+
+ perl '$__tool_directory__/emboss_single_outputfile_wrapper.pl' polydot -sequence '$input1' -graph png -goutfile '$output2' -outfeat '$output1' -wordsize $wordsize -boxit $boxit -dumpfeat yes -gap
+ $gap -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/polydot.html
+
+
+
diff --git a/tools/emboss_5/emboss_preg.xml b/tools/emboss_5/emboss_preg.xml
new file mode 100644
index 00000000000..169c0085586
--- /dev/null
+++ b/tools/emboss_5/emboss_preg.xml
@@ -0,0 +1,21 @@
+
+ Regular expression search of a protein sequence
+
+ macros.xml
+
+
+ preg -sequence '$input1' -outfile '$out_file1' -pattern '$pattern' -auto
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/preg.html
+
+
+
diff --git a/tools/emboss_5/emboss_prettyplot.xml b/tools/emboss_5/emboss_prettyplot.xml
new file mode 100644
index 00000000000..263274ddaa5
--- /dev/null
+++ b/tools/emboss_5/emboss_prettyplot.xml
@@ -0,0 +1,83 @@
+
+
+ Displays aligned sequences, with colouring and boxing
+
+ macros.xml
+
+
+ prettyplot -sequences '$input1' -graph png -goutfile '$out_file1' -residuesperline $residuesperline -resbreak $resbreak -ccolours $ccolours -cidentity '$cidentity' -csimilarity '$csimilarity'
+ -cother '$cother' -docolour $docolour -gtitle $title -pair '$pair' -identity $identity -box $box -boxcol $boxcol -boxcolval '$boxcolval' -name $name -maxnamelen $maxnamelen -number $number -listoptions
+ $listoptions -consensus $consensus -collision $collision -alternative $alternative -showscore $showscore -portrait $portrait -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/prettyplot.html
+
+
+
diff --git a/tools/emboss_5/emboss_prettyseq.xml b/tools/emboss_5/emboss_prettyseq.xml
new file mode 100644
index 00000000000..8ee5ead2a43
--- /dev/null
+++ b/tools/emboss_5/emboss_prettyseq.xml
@@ -0,0 +1,49 @@
+
+ Output sequence with translated ranges
+
+ macros.xml
+
+
+ prettyseq -sequence '$input1' -outfile '$out_file1' -ruler $ruler -plabel $plabel -nlabel $nlabel -width $width -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/prettyseq.html
+
+
+
diff --git a/tools/emboss_5/emboss_primersearch.xml b/tools/emboss_5/emboss_primersearch.xml
new file mode 100644
index 00000000000..873171949b3
--- /dev/null
+++ b/tools/emboss_5/emboss_primersearch.xml
@@ -0,0 +1,30 @@
+
+ Searches DNA sequences for matches with primer pairs
+
+ macros.xml
+
+
+ primersearch -seqall '$input1' -infile '$input2' -outfile '$out_file1' -mismatchpercent $mismatchpercent -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/primersearch.html
+
+
+
diff --git a/tools/emboss_5/emboss_revseq.xml b/tools/emboss_5/emboss_revseq.xml
new file mode 100644
index 00000000000..a601215f6f6
--- /dev/null
+++ b/tools/emboss_5/emboss_revseq.xml
@@ -0,0 +1,75 @@
+
+ Reverse and complement a sequence
+
+ macros.xml
+
+
+
+ revseq -sequence '$input1' -outseq '$out_file1' -reverse $reverse -complement $complement -osformat2 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/revseq.html
+
+
+
diff --git a/tools/emboss_5/emboss_seqmatchall.xml b/tools/emboss_5/emboss_seqmatchall.xml
new file mode 100644
index 00000000000..41f5941d046
--- /dev/null
+++ b/tools/emboss_5/emboss_seqmatchall.xml
@@ -0,0 +1,52 @@
+
+ All-against-all comparison of a set of sequences
+
+ macros.xml
+
+
+
+ seqmatchall -sequence '$input1' -outfile '$out_file1' -wordsize $wordsize -aformat2 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/seqmatchall.html
+
+
+
diff --git a/tools/emboss_5/emboss_seqret.xml b/tools/emboss_5/emboss_seqret.xml
new file mode 100644
index 00000000000..a941cc5e53d
--- /dev/null
+++ b/tools/emboss_5/emboss_seqret.xml
@@ -0,0 +1,69 @@
+
+ Reads and writes sequences
+
+ macros.xml
+
+
+
+ seqret -sequence '$input1' -outseq '$out_file1' -feature $feature -firstonly $firstonly -osformat2 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/seqret.html
+
+
+
diff --git a/tools/emboss_5/emboss_showfeat.xml b/tools/emboss_5/emboss_showfeat.xml
new file mode 100644
index 00000000000..ff7ddcddede
--- /dev/null
+++ b/tools/emboss_5/emboss_showfeat.xml
@@ -0,0 +1,97 @@
+
+
+ Show features of a sequence
+
+ macros.xml
+
+
+
+ showfeat -sequence '$input1' -outfile '$out_file1' -matchsource '$matchsource' -matchtype '$matchtype' -matchtag '$matchtag' -matchvalue '$matchvalue' -sort $sort -annotation '$annotation' -id
+ $id -description $description -scale $scale -width $width -collapse $collapse -forward $forward -reverse $reverse -unknown $unknown -strand $strand -source $source -position $position -type
+ $type -tags $tags -values $values -stricttags $stricttags -html $html_out1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/showfeat.html
+
+
+
diff --git a/tools/emboss_5/emboss_shuffleseq.xml b/tools/emboss_5/emboss_shuffleseq.xml
new file mode 100644
index 00000000000..4ec50c33ca6
--- /dev/null
+++ b/tools/emboss_5/emboss_shuffleseq.xml
@@ -0,0 +1,60 @@
+
+
+ Shuffles a set of sequences maintaining composition
+
+ macros.xml
+
+
+
+ shuffleseq -sequence '$input1' -outseq '$out_file1' -shuffle $shuffle -osformat2 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/shuffleseq.html
+
+
+
diff --git a/tools/emboss_5/emboss_sigcleave.xml b/tools/emboss_5/emboss_sigcleave.xml
new file mode 100644
index 00000000000..16c5c7e9869
--- /dev/null
+++ b/tools/emboss_5/emboss_sigcleave.xml
@@ -0,0 +1,53 @@
+
+ Reports protein signal cleavage sites
+
+ macros.xml
+
+
+
+ sigcleave -sequence '$input1' -outfile '$out_file1' -minweight $minweight -prokaryote $prokaryote -rformat2 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/sigcleave.html
+
+
+
diff --git a/tools/emboss_5/emboss_single_outputfile_wrapper.pl b/tools/emboss_5/emboss_single_outputfile_wrapper.pl
new file mode 100644
index 00000000000..1ec458386ca
--- /dev/null
+++ b/tools/emboss_5/emboss_single_outputfile_wrapper.pl
@@ -0,0 +1,50 @@
+#! /usr/bin/perl -w
+# Run an EMBOSS program that picks its own graphics file name and move that
+# file to the output path requested by the caller.
+#
+# Usage: emboss_single_outputfile_wrapper.pl PROGRAM ARG...
+#
+# The whole argument list is executed as the command. Its standard output is
+# scanned for a line containing "Created "; the file name ending that line is
+# moved onto the path given as the seventh argument ($ARGV[6]). Lines that
+# precede it are echoed to standard output unchanged.
+use strict;
+use File::Copy;
+use File::Spec;
+
+my $fileNameOut = $ARGV[6];
+die "Usage: $0 PROGRAM ARG... (output path expected as the 7th argument)\n"
+    unless defined $fileNameOut;
+
+# The created file is looked up in the directory part of the output path.
+my ($drive, $outputDir) = File::Spec->splitpath( $fileNameOut );
+
+# A list-form pipe open runs the program without a shell, so arguments holding
+# spaces or shell metacharacters reach it intact instead of being re-parsed.
+open(my $pipe, '-|', @ARGV)
+    or die "Cannot run '$ARGV[0]': $!\n";
+# Slurp all output up to EOF before acting; close() then waits for the program.
+my $results = do { local $/; <$pipe> };
+$results = '' unless defined $results;
+close($pipe);
+my @files = split("\n",$results);
+
+foreach my $thisLine (@files)
+{
+    if ($thisLine =~ /Created /)
+    {
+        # Capture the trailing run of word characters, '|' and '.'.
+        $thisLine =~ /([\w|\.]+)$/
+            or die "Cannot find a file name in: $thisLine\n";
+        my $created = $drive.$outputDir.$1;
+        #there is only one file to move, so we can quit after finding it
+        move($created,$fileNameOut)
+            or die "Cannot move '$created' to '$fileNameOut': $!\n";
+        # The file is in place: report success with a zero exit status.
+        exit(0);
+    }
+    else
+    {
+        print $thisLine,"\n";
+    }
+}
diff --git a/tools/emboss_5/emboss_sirna.xml b/tools/emboss_5/emboss_sirna.xml
new file mode 100644
index 00000000000..ec6725430f5
--- /dev/null
+++ b/tools/emboss_5/emboss_sirna.xml
@@ -0,0 +1,112 @@
+
+ Finds siRNA duplexes in mRNA
+
+ macros.xml
+
+
+
+ sirna -sequence '$input1' -outfile '$ofile1' -outseq '$ofile2' -poliii $poliii -aa $aa -tt $tt -polybase $polybase -context $context -rformat2 $out_format1 -osformat3 $out_format2
+ -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/sirna.html
+
+
+
diff --git a/tools/emboss_5/emboss_sixpack.xml b/tools/emboss_5/emboss_sixpack.xml
new file mode 100644
index 00000000000..e5ebd239d68
--- /dev/null
+++ b/tools/emboss_5/emboss_sixpack.xml
@@ -0,0 +1,141 @@
+
+
+ Display a DNA sequence with 6-frame translation and ORFs
+
+ macros.xml
+
+
+
+ sixpack -sequence '$input1' -outfile '$ofile1' -outseq '$ofile2' -table $table -firstorf $firstorf -lastorf $lastorf -mstart $mstart -reverse $reverse -orfminsize $orfminsize -uppercase
+ '$uppercase' -number $number -width $width -length $length -margin $margin -name $disp_name -description $description -offset $offset -html $html_out1 -osformat $out_format2 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/sixpack.html
+
+
+
diff --git a/tools/emboss_5/emboss_skipseq.xml b/tools/emboss_5/emboss_skipseq.xml
new file mode 100644
index 00000000000..eee0f8ed7d3
--- /dev/null
+++ b/tools/emboss_5/emboss_skipseq.xml
@@ -0,0 +1,57 @@
+
+ Reads and writes sequences, skipping first few
+
+ macros.xml
+
+
+
+ skipseq -sequence '$input1' -outseq '$out_file1' -skip $skip -feature $feature -osformat2 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/skipseq.html
+
+
+
diff --git a/tools/emboss_5/emboss_splitter.xml b/tools/emboss_5/emboss_splitter.xml
new file mode 100644
index 00000000000..38f70b9ace4
--- /dev/null
+++ b/tools/emboss_5/emboss_splitter.xml
@@ -0,0 +1,74 @@
+
+ Split a sequence into (overlapping) smaller sequences
+
+ macros.xml
+
+
+
+ splitter -sequence '$input1' -outseq '$out_file1' -size $size -overlap $overlap -addoverlap $addoverlap -osformat2 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/splitter.html
+
+
+
diff --git a/tools/emboss_5/emboss_supermatcher.xml b/tools/emboss_5/emboss_supermatcher.xml
new file mode 100644
index 00000000000..32ff29a9f08
--- /dev/null
+++ b/tools/emboss_5/emboss_supermatcher.xml
@@ -0,0 +1,55 @@
+
+
+ Match large sequences against one or more other sequences
+
+ macros.xml
+
+
+
+ supermatcher -asequence '$input1' -bsequence '$input2' -gapopen $gapopen -gapextend $gapextend -width $width -wordlen $wordlen -outfile '$ofile1' -errorfile '$ofile2' -aformat3
+ $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/supermatcher.html
+
+
+
diff --git a/tools/emboss_5/emboss_syco.xml b/tools/emboss_5/emboss_syco.xml
new file mode 100644
index 00000000000..2c5fff4c343
--- /dev/null
+++ b/tools/emboss_5/emboss_syco.xml
@@ -0,0 +1,192 @@
+
+
+ Synonymous codon usage Gribskov statistic plot
+
+ macros.xml
+
+
+ perl '$__tool_directory__/emboss_single_outputfile_wrapper.pl' syco -sequence '$input1' -graph png -goutfile '$ofile1' -outfile '$ofile2' -cfile $cfile -window $window -uncommon $uncommon -minimum $minimum
+ -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/syco.html
+
+
+
diff --git a/tools/emboss_5/emboss_tcode.xml b/tools/emboss_5/emboss_tcode.xml
new file mode 100644
index 00000000000..b000d4e3af5
--- /dev/null
+++ b/tools/emboss_5/emboss_tcode.xml
@@ -0,0 +1,41 @@
+
+ Fickett TESTCODE statistic to identify protein-coding DNA
+
+ macros.xml
+
+
+
+ tcode -sequence '$input1' -outfile '$out_file1' -window $window -step $step -rformat $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/tcode.html
+
+
+
diff --git a/tools/emboss_5/emboss_textsearch.xml b/tools/emboss_5/emboss_textsearch.xml
new file mode 100644
index 00000000000..044ca040014
--- /dev/null
+++ b/tools/emboss_5/emboss_textsearch.xml
@@ -0,0 +1,51 @@
+
+ Search sequence documentation. Slow, use SRS and Entrez!
+
+ macros.xml
+
+
+
+ textsearch -sequence '$input1' -outfile '$out_file1' -pattern '$pattern' -casesensitive -heading $heading -usa $usa -accession $accession -name $search_name -description $description -html
+ $html_out1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/textsearch.html
+
+
+
diff --git a/tools/emboss_5/emboss_tmap.xml b/tools/emboss_5/emboss_tmap.xml
new file mode 100644
index 00000000000..e0b98c967fe
--- /dev/null
+++ b/tools/emboss_5/emboss_tmap.xml
@@ -0,0 +1,40 @@
+
+ Displays membrane spanning regions
+
+ macros.xml
+
+
+
+ perl '$__tool_directory__/emboss_single_outputfile_wrapper.pl' tmap -sequences '$input1' -outfile '$out_file1' -goutfile '$out_file2' -graph png -rformat $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/tmap.html
+
+
+
diff --git a/tools/emboss_5/emboss_tranalign.xml b/tools/emboss_5/emboss_tranalign.xml
new file mode 100644
index 00000000000..50178f4d0e4
--- /dev/null
+++ b/tools/emboss_5/emboss_tranalign.xml
@@ -0,0 +1,82 @@
+
+ Align nucleic coding regions given the aligned proteins
+
+ macros.xml
+
+
+
+ tranalign -asequence '$input1' -bsequence '$input2' -outseq '$out_file1' -table $table -osformat3 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/tranalign.html
+
+
+
diff --git a/tools/emboss_5/emboss_transeq.xml b/tools/emboss_5/emboss_transeq.xml
new file mode 100644
index 00000000000..8b16e1ee4c3
--- /dev/null
+++ b/tools/emboss_5/emboss_transeq.xml
@@ -0,0 +1,130 @@
+
+ Translate nucleic acid sequences
+
+ macros.xml
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/transeq.html
+
+
+
diff --git a/tools/emboss_5/emboss_trimest.xml b/tools/emboss_5/emboss_trimest.xml
new file mode 100644
index 00000000000..c55e7aa7493
--- /dev/null
+++ b/tools/emboss_5/emboss_trimest.xml
@@ -0,0 +1,85 @@
+
+ Trim poly-A tails off EST sequences
+
+ macros.xml
+
+
+
+ trimest -sequence '$input1' -outseq '$out_file1' -minlength $minlength -mismatches $mismatches -reverse $reverse -tolower $tolower -fiveprime $fiveprime -osformat2 $out_format1
+ -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/trimest.html
+
+
+
diff --git a/tools/emboss_5/emboss_trimseq.xml b/tools/emboss_5/emboss_trimseq.xml
new file mode 100644
index 00000000000..8e1ec34b68e
--- /dev/null
+++ b/tools/emboss_5/emboss_trimseq.xml
@@ -0,0 +1,89 @@
+
+ Trim ambiguous bits off the ends of sequences
+
+ macros.xml
+
+
+
+ trimseq -sequence '$input1' -outseq '$out_file1' -window $window -percent $percent -strict $strict -star $star -left $left -right $right -osformat2 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/trimseq.html
+
+
+
diff --git a/tools/emboss_5/emboss_twofeat.xml b/tools/emboss_5/emboss_twofeat.xml
new file mode 100644
index 00000000000..b9da42481cb
--- /dev/null
+++ b/tools/emboss_5/emboss_twofeat.xml
@@ -0,0 +1,94 @@
+
+ Finds neighbouring pairs of features in sequences
+
+ macros.xml
+
+
+
+ twofeat -sequence '$input1' -outfile '$out_file1' -atype '$atype' -btype '$btype' -minrange $minrange -maxrange $maxrange -asource '$asource' -asense $asense -aminscore $aminscore
+ -amaxscore $amaxscore -atag '$atag' -avalue '$avalue' -bsource '$bsource' -bsense $bsense -bminscore $bminscore -bmaxscore $bmaxscore -btag '$btag' -bvalue '$bvalue' -overlap $overlap
+ -rangetype $rangetype -sense $sense -order $order -twoout $twoout -typeout '$typeout' -rformat2 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/twofeat.html
+
+
+
diff --git a/tools/emboss_5/emboss_union.xml b/tools/emboss_5/emboss_union.xml
new file mode 100644
index 00000000000..9228f668a7e
--- /dev/null
+++ b/tools/emboss_5/emboss_union.xml
@@ -0,0 +1,65 @@
+
+ Reads sequence fragments and builds one sequence
+
+ macros.xml
+
+
+
+ union -sequence '$input1' -outseq '$out_file1' -osformat2 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/union.html
+
+
+
diff --git a/tools/emboss_5/emboss_vectorstrip.xml b/tools/emboss_5/emboss_vectorstrip.xml
new file mode 100644
index 00000000000..de8b079b46b
--- /dev/null
+++ b/tools/emboss_5/emboss_vectorstrip.xml
@@ -0,0 +1,74 @@
+
+ Strips out DNA between a pair of vector sequences
+
+ macros.xml
+
+
+
+ vectorstrip -sequence '$input1' -vectorsfile '$input2' -outseq '$ofile1' -outfile '$ofile2' -vectorfile yes -mismatch $mismatch -besthits $besthits -linkera '$linkera' -linkerb
+ '$linkerb' -osformat4 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/vectorstrip.html
+
+
+
diff --git a/tools/emboss_5/emboss_water.xml b/tools/emboss_5/emboss_water.xml
new file mode 100644
index 00000000000..3d23706e595
--- /dev/null
+++ b/tools/emboss_5/emboss_water.xml
@@ -0,0 +1,59 @@
+
+ Smith-Waterman local alignment
+
+ macros.xml
+
+
+
+ water -asequence '$input1' -bsequence '$input2' -outfile '$out_file1' -gapopen $gapopen -gapextend $gapextend -brief $brief -aformat3 $out_format1 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input datasets need to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/water.html
+
+
+
diff --git a/tools/emboss_5/emboss_wobble.xml b/tools/emboss_5/emboss_wobble.xml
new file mode 100644
index 00000000000..54afc12a7dd
--- /dev/null
+++ b/tools/emboss_5/emboss_wobble.xml
@@ -0,0 +1,37 @@
+
+ Wobble base plot
+
+ macros.xml
+
+
+ perl '$__tool_directory__/emboss_single_outputfile_wrapper.pl' wobble -sequence '$input1' -graph png -goutfile '$ofile1' -outfile '$ofile2' -window $window -bases '$bases' -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/wobble.html
+
+
+
diff --git a/tools/emboss_5/emboss_wordcount.xml b/tools/emboss_5/emboss_wordcount.xml
new file mode 100644
index 00000000000..e077c8b8f74
--- /dev/null
+++ b/tools/emboss_5/emboss_wordcount.xml
@@ -0,0 +1,34 @@
+
+ Counts words of a specified size in a DNA sequence
+
+ macros.xml
+
+
+ wordcount -sequence '$input1' -outfile '$out_file1' -wordsize $wordsize -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input dataset needs to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/wordcount.html
+
+
+
diff --git a/tools/emboss_5/emboss_wordmatch.xml b/tools/emboss_5/emboss_wordmatch.xml
new file mode 100644
index 00000000000..1da7ea8c7f0
--- /dev/null
+++ b/tools/emboss_5/emboss_wordmatch.xml
@@ -0,0 +1,68 @@
+
+ Finds all exact matches of a given size between 2 sequences
+
+ macros.xml
+
+
+
+ wordmatch -asequence '$input1' -bsequence '$input2' -outfile '$out_file1' -aoutfeat '$out_file2' -boutfeat '$out_file3' -wordsize $wordsize -aformat3 $out_format1 -offormat4 $out_format2
+ -offormat5 $out_format3 -auto
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: warningmark
+
+The input datasets need to be sequences.
+
+-----
+
+ You can view the original documentation here_.
+
+ .. _here: http://galaxy-iuc.github.io/emboss-5.0-docs/wordmatch.html
+
+
+
diff --git a/tools/emboss_5/macros.xml b/tools/emboss_5/macros.xml
new file mode 100644
index 00000000000..4a0e4f55e2a
--- /dev/null
+++ b/tools/emboss_5/macros.xml
@@ -0,0 +1,14 @@
+
+
+
+ emboss
+
+
+
+
+ 10.1016/S0168-9525(00)02024-2
+ 10.1101/gr.5578007
+
+
+
+
diff --git a/tools/emboss_5/test-data/1.fasta b/tools/emboss_5/test-data/1.fasta
new file mode 100644
index 00000000000..c9ecbb612dd
--- /dev/null
+++ b/tools/emboss_5/test-data/1.fasta
@@ -0,0 +1,2 @@
+>hg17
+gtttgccatcttttgctgctctagggaatccagcagctgtcaccatgtaaacaagcccaggctagaccaGTTACCCTCATCATCTTAGCTGATAGCCAGCCAGCCACCACAGGCAtgagtcaggccatattgctggacccacagaattatgagctaaataaatagtcttgggttaagccactaagttttaggcatagtgtgttatgtaTCTCACAAACATATAAGACTGTGTGTTTGTTGACTGGAGGAAGAGATGCTATAAAGACCACCTTTTAAAACTTCCC-------------------------------AAATACT-GCCACTGATGTCCTG-----ATGGAGGTA-------TGAA-------------------AACATCCACTAAAATTTGTGGTTTATTCATTTTTCATTATTTTGTTTAAGGAGGTCTATAGTGGAAGAGGGAGATATTTGGggaaatt---ttgtatagactagctttcacgatgttagggaattattattgtgtgataatggtcttgcagttaca-cagaaattcttccttattttttgggaa---gcaccaaag----tagggat---aaaatgtcatgatgtgtgcaatacactttaaaatgtttttg-----ccaaaataatt----------------aatgaagc--aaatatggaaa-ataataattattaaatctaggtgatgggtatattgtagttcactatagtattgcacacttttctgtatgtttaaatttttcatttaaaaaaaaactttgagc-----tagacaccaggctatgagctaggagcatagcaatgaccaa----------------------------------------------------------------------------------------------atagactcctaccaa--------------------------------------------------ctc-aaagaatgcacattctCTGGGAAACATGTTTCCATTAGGAAGCCTCGAATGCAATGTGACTGTGGTCTCCAGGACCTG-TGTGATCCTGGCTTTTCCTGTTCCCTCCG---CATCATCACTGCAGGTGTGTTTTCCCAAGTTTTAAACATTTA------CCTTCCCAGTGGCCTTGCGTCTAGAGGAATCCCTGTATAGTGGT-ACATGAATATAACACATAACAAA-AATCATCTCTATGGTGTGTGTTGTTCCTGGGGTTCAattcagcaaattttccctg-ggcacccatgtgttcttggcactggaaaagtaccgggactgaaacagttgatggccca-atccctgtcctct---taaaacctaagggaggagaTGGAAAGGGG-CACCCAACCCAGACTGAGAGACAGGAATTAGCTGCAAGGGGAACTAGGAAAAGCTTCTTTA---AGGATGGAGAGGCCCTAGTGGAAT-GGGGAGATTCTTCCGGGAGAAGCGATGGATGCACAGTTGGGCATCCCCACAGACGGACTGGAAAGAAAAAAGGCCTGGAGGAATCAATGTG-------CAATGTATGTGTGTTCCCTGGTTcaagggctgg-gaactttctcta-aagggccaggtagaaaacattttaggctttctaagccaag--gcaaaat-tgaggatattacatgggtacttatacaacaagaataaacaatt---tacacaattttttgttgacagaattcaaaactttat----agacacagaaatgcaaatttcctgtaattttcccat-gagaactattcttct--tttgttttgttttgcgacAGGGTTGCGCtgatcctcccgcctcagtctccctaagtgctgagatgttgcaggaagtcagggaccccgaacagagagatcggctggagccgtggcagaggaacataaattttgaagatttcattttaatatggacacttatcagttcccaaataatacttttataatttt
ttatgcctgtctttgctttaatctcttaatcctgttatcttcataagctaaggatgtacgtcacctcaggaccactgtgataattgtgttaactgtacagattgattgcaaaacatgtgtgtttgaacaatatgaaatcagtgcaccttgaaaaagagcagaataacagcaatttttagggaacaagggaagacaactataaggtctgactgcctgcggggtcgggcaaagggagccatatttttcttcttgcagagagcctataaatagacctgcaagtaggagagatattgctaatttcttttgctagcatggaatattaatattaacaccctgggaaaggaatgcattcctggggggaggtctataaatggccgctctgggaatgtctatcctacgcaatggagataaggactgagatacgccctggtctcctgcagtaccctcaggcttactagggtggtgaaaaactccgccctggtaaatttgtggtcagaccagttttctgctctcgaacactgttttctgttgtttaagatgtttatcaagacaatacgtgcaccgctgaacacagacccttatcagtagttctcctttttgccctttgaagcatgtgatctactccctgttttacaccccctcaccttttgaaacccttaataaaaaacttgctggttt-gaggctcaggtgggcatcacagtactaccgatatgtgatgtcacccccggcggcccagctgtaaaattcctctctttgtactctctctctttatttctcagccagctgacacttatggaaaatagaaagaacctacgttgaaatattgggggcaggttcccccaataTCTGGTGCCCAACGTGGGAtactgagattacaagcatgagccactgcatctggcctcttcttttgatttttttttttcaaacttttacaaatgtagaaaccattcttagcttttgggcattaccaaacccggcagtgg-caggctcggttcaccaacgtcatttgcagttccccgCTTTATGTTATGGgttttgttttgttttgtttttttt-attgagacagagtttcactcttgttgcccaggctgtagtgcaatggtctgatcttggctcactgcaacctccacttcccaggttcaagccattctcctgcctcagcctctcaagtagctgggattacagacactcaccaccacacctggctaattttgtatttttagtagagatgaggtttcaccatgttggccaggctggtctcgaaatcctgacctcaggtgatccacccaccttggcctcccaaagtgctgggattacaggcttgagctaccacgcctggctGGGTTGGTTCTCAATGGAGTGGTTTGTTTTTGGAGCTGCTCT-GCGCAGtggggaccagaataggcctg-------------------ggttcctagcccattgctattcctt----accagctgtggattctaaggaaagtcatttaacctcgctggaccttag-attcctcatccctgaaGCCCAAGGGTaaaacaaaacaaaacaaaacaaaacaaaccaaCCCATCATGTAAAGCGGGGAACTACAAACGATACAGGTGAAACATGCCTACCACACCACTCACAGGCT--ATGATGACAAAAACGTGGCTACATCTGGGACCACCCCCCAACCCCCACTTTGTACGTAGGAAATACGGAGTTGAGGATGGAGACCCACAGTATGTCCAGAGTGTCCCCAAAGGCCACAGTGCCCGCCTGGAGCCCTCCAGAGAGCGTGCACTCCCTGGGGTGCCAGCCAGAGACAACTTGCCCTGAGGCTTGGAACTCGATTCTCCGCGTGCCAGAGAAGGGGTGGGACTTCAGAACCCCCAACCCCGCAATCTGGGTCGGGGAGCCTGGCGCACTGCGGGCCGCTCCCTCTAACCCTGGGCTTCCCTG------GCGTCCAGGGCCGTCGG-----------GGCCGAGTCCCGATTCGCT
CCCACCCCGAAGCCGCGCCAGGACCAACGAGGGCGCAGCCGTATGCCCCAGCCCGCTCCGCGGAGCCCCTCACAGCCAcccccgccccgaccgcgccccgcgcggcTCGAAGCACCTTCCCAAGGGGCTGGTCCTTGC----------GCCATAGTCGCGCCGGAGCCTCTGGAGGGACATCAAGGATTTCTC-GCTCCTACCAGCCACCCCCAAATTTTTGGGAGGTACCCAAGGGTGCGCGCGTGGCTCCTGGCGCGCCGAGGCCCTCCCTCGAGGCCCCGCGAGGTGCACACTGC---------GGGCCCAGGGCTAGCAGCCGCCCGGCACGTCGCTACCCTGAGGGGCGGGGCGGGAGCTGGCGCTAGAAATGCGCCGGGGCCTGCGGGGCAGTTGCGCAAGTTGTGATCGGGCCGCTATAAGAGGGGCGGGCAGGCATGGAGCCCCGTAGGAATCGCAGCGCCAGCGGTTGCAAGGTAAGGCCC-CGGCGCGCTCCTTCCTCCTTCTCTGCTGGTCTTTCTTGGCAGGCCACAGGGCCCCACACAACTCTGGATCCCGGGGAAACTGAGTCAGG-AGGGATGCAGGGCGGATGGCTTAGTTCTGGACTATGATAGCTTTGTACCGAG-----TTCTAGCCAGATAGAAGGTTACCGGGAGCTGGGGAGCGTTGGATTTGCTGCTGGGCTGTGCCGGTGCCCAGAAGGCA------GGACCTTGCAGAACCAGCCAGGTCCCTGGGAGACTGTCAGACCCACCAACCTGGTGGCATTCGCAGAGCTGAGATGCATTGGAAATTGCCTTGGGCACATCCCCAAAGATCAGGATGTCCCACCCCAGTCTGAAGGAGA---TAAAGTTGGGGGTAGGAGAGACGCAG-ATGCAAGTGATCAGTCTC---AGTCCCAGACATTGCCTTGCTCTGCGGGTAGGAATTCAGGATTCATTTTCCAGGGAAG--------TTCCTGACCTCTGAATGAGAGGGGCTGTGTAAGGCCAATGCCTGGG-AGGAAGGCAAGGATGAGTAGAGGTGGGGGGAAACAAGTGTCAGGAAGA--------------------------------------------CTCAAA---------ATCTTC--------------------------------------------------------------CAGAGAAATTGT-----GCAGGGTCTTACCAGATCTGTCCTCAAAGCCATGCAAATTGCCTTCTTTGCAATGCAT-ACAATGAGGTGTCTCTGGGGGTCAGAACTGG-----------------------TTATTAGGGAACTTCTAGCCAGGACTGCTAAATACGCGCTGTTGG---------CCCACCAGGCTCACCTATAGCCT-TCCTTCAGTCTGGGCTTGGTTTGGATTTCACTGTGGGTGCCATCGCCTTTACACTCCTGTTTCTATAGTTTAAAGATAGTGGTGCTTTGGGAAAG---TGACTCCTTAAATACAGTTAGGTCCAAGTGA-GACAAGTGGCCTGGCTGTCATTTCAGAATAGCAGCTTCCAAGAGG----------TGATTAATTTCTGTTGGAAGGGTGAT-CTTTGGGGAGGT--GGGTGAAGAGCAGAGACTTGGTGGTACCGTTCCAGGAGCACAGGCTCTCT-----TCCTTTGCA--GTGCAGAATGACCTCTGGCAGCCGGAGTTGTGTTTGTT--------CTGTAGGATTCTGAGGTGGGCCATGGGCAGCTGGAACTGGG-----GAATTTTGCCAATCTCTTTCATATTAGGATTGTCTGCAGAACCAGATATGGAGG------CTTCTAGCAACGTGAGTGCTCCTGTTCTAATGCCCTTAGAAACAAGAAGGCCACACTGATCATTTCTCTCACTTAGGCAGGGAGACAAGGCAAGAGAGAAACAGT-----------------GGATGC--TTTTAGGTTCTTTCCCTTC
CCAAGCAGTTGTGGACATTGGGCTGA-GGGGAACATTTCCACATTGGCTAAAGGAGCGTCCTCCTCATATTTTGTACATTTTATACCCAA--AATAA-CTCTTCTTGGTATTT-GGGGAAATATTTTCCTCCCCGTCC------------ATTCCAGGAAATGGCTCCAAGTGCCAAGGACAGAGCCAGGGAAGTTGCAATGAATTCCTGCCCGTCAGCCCCAGGCAGATGCCTTGCACGTCTGAGTGGCCCATGCAGAGCGTGGAGGTGGCCGCC----------------ACGGAACC-TGGGTCAATGT-CCCACCCCCG----CTTAGATGCCA-CCAGGGG--CGTGGGAGCCAAGGAG--AGAAGAGGGGCTCCAGGAAGGTAGAGTCCTTGTGTCTTGTGCATCTGTGAACAGCACTGGTATGATTTAAAGGAAAATTGAGCCAAATTTTCCGGCAGTCAGTT-----ACCCCATCCCCACCGGGGTAGGAGTCTGGCAGCCGCAGCTCCATTCTGGCCAGTCGGCAGAGAGCCTTGAAATTCTTCTTTGTCCACACAGTTGTCTCAGAGAAACAG--AGAGGTT-GTTTCTGCTTAAAAACAACACACTTGGTGTCTGGGCCCACAGACTCCTTTGCACTTATTCCACGTGTGACAGCCAATGTGCCTCGTTGCTTAGCAGACAGCATGTTACCGTCTTTCCTGCTCAGTTTGTTAG--------------CTCTATGGAATGGAATTTATAATCAATGCCCATACCAACATTTCACTAATATCATAGGAGATTTAGTCTCCATCTGGGTGTACATTACATTTGC--TCTGGGG-TGCTCCAGGC--TGGGGGGTTGCCAAGGAAGAGAAGAGAAACCGCAGAGAAGAC---GGGAGGGCAGGGCAGGGGTCTCTGAGAAGGGGAGGGGTCCCAGAGTGCAGGAGCAGGAGCCAGGCTC---------ATGAAAGGGGCCACGGGCGGGAGTATCCAGGGACGGCAGTCAAGATGGAGCACAGCTTAGG--AAGCTGAAGGGAATCCTGGCCCACCTGGGTGCTAGAGGGCACATAGGAAGTGCAGGAAGCAGACCAAGGTCCCCAAGAGAGGGAGACCTGGACGCTGAAGCATTTTCTGTCTTTATTAAG-------------ACAACTCCGTAAGAATTCCTGCTGGGCCAAAGTGAATTCTAGGATGCGACTTTAAGATGGGAGCAAGCGAACCATTGAGGAGGCAGGTTACCCTAGTTAGCCAATGCAGATCGAGAATGGGAAATCTTTCatttattcatgcaacagatatttaacgaagccctgccgtgttccaggcctgtgatagatgctggaacaggtacagaga----------tAc-------aggtgtcattaattgatcaggg--caacctctc---cttctgagt--cttgctggagcttcagatgc-ccctcacacagagctcgagggagcctc-aacaattgatcagaagtcaggcaccatggctcacgcatataatcccagcactttgggaggccaaggcaggtggatcactggagcccaggagttccagatcagctggggcaacatggcaaaaccccatctctattaaaaaaaaaaaaagtaactggatgtgatggtacacacctgtagtcccagctacttgggaggctgagaggtgggagaattgcttgagcccgggaagtcgggggtccagtgagccttgatcacaccactgcactccagcctgagtgacagagcaagaccctgacacacacacacacacacacacacacacacacacagattagagctgaaacaggagtagaaacctatctg-tatctctgATGA-GATCAGATC---------TTTCTGATGAACAGAAAGAATGTAACCCCTGTACTCACACCCTCTCTGCTGGTTACATATGTTAACACGATTTCTCAAATGAGGCTTTTGGTTGCAAATAAGAGAAAAT
CACTCACGCT-GGCCCTGTG--TTTTTCAAATTGTTTATTGTGATCAACATTTGAAAAAAGAGCCGAGACTCTCAAGAGTGCATTACCCACGGTAAGGGTGAATTTT-ACTTCTTGACACTTATTTCTCTTACATGTATCTATCTGTCTC-----AAATGAAAAATATATTTAGAAAGTTGAAAGCTATCCAAGTGAGTATAAGAAAAGAGTATCTCACCCTGAAGGCTAAGGACAGGGAGGGC---------------------------CACCAGGCCTCACGAGGACCCAGGAACCACAAAGAAGGCT-AGGAAGGAGCACAGGCGGTGACCATACTCTGGCTCAGTGGCTATGTGGGCTCTGGTCTCTCTCAGCTGTTCCATGCATATGAGGCCAAATGTGGCTACCCTAGAGCTTCTGAGCCCTCAACAGAGATGAACTGGACTCTCTGCAGCCCCACTCTAAATTCCTAAGAGAGAAGTTGATTGACCCAATCAGGGTCAGGAGAAGGAAGGGAGGAGGAAAGGGAGGAGAGAAGAGCCTCTTCGTCTCTTGCCTACCACTGGCCAGGCAATTGTAGCCAAGGGGGCTGGAGTGTAAATGCAAACATAGCCATCAAGGGTtgtgtatgtgtgtgtgtgtgtctgtgtgtgtgtatgtgtgtCTCTTGGGTAGGTTAGA-TCTCCCAGGAGGTCCCTACTAAACAGACTTAAGCCCGCAAAATTTTAGCTCTCCAGCCTCACACACTCCACCCCTCTACCATATTGAATCTTCCCAAACCAACTATGGCTTTCCCTAACTCCGGAGc------ttggcctggaatgccctgcttcccctctttcccctggggaacgcctgtccttcaggcctcagttcacacactgcctcccttgcaaagctctccTCCCATCCCCGGAGTCCCT--CTTCCCCTTTGTTCTTTGGGTTCTATGCTTCTTCCCTCATAACTCCCACCAGGTTGTGTTAAAATGAGTTGTTCAAGGTCCTGTCTGTTCCACTAGATTCTGAGCAACTTGGAGAACGAAGATCCAAACTTCGCTGCCTTTATTTCCTCCTTTGTTCTTTTCTCATCCCCAAGTCCCTTCCAACTTGGAGTTATgaagaaaggaaggaaggaagggtgggagggaagaaCAGGAGGGGATCCCACAGG-AGAATGTGTATAGGGAGAGGACTCAGACTAGCTAAAGCTTTTCCCTCATAATTAATAGCAAATACCATGTTACCTGAATTTAATTCACAGTAGCATACAAAAGACTCGCTTTGTTCT-------CCCCA---------TTGATGTCATCAGAGG--------------------GCTGTGGG--------------CAGGCCTAATCTTGGCTCAGGAGGCCCTCCAGCCTGGATCTAAAGAGCAGCAGATGggccaggctcggtggctcatgcctgtaatcccagcattttgggaggccgaggcgggtggatcacgaggtcaggagtttgagaccagcctggccaagatggtgaagcctcgtctctactaaaaatacaaaaattagccaggtgcggtggtgggcgcctgtatttccagctacccgggaggctgaggaggctgaggcaggagaatcgcttgaacccgggaggcggaggttgcagtgagccgaggtcacgccactgcactctagcctgggcaacagagcaagactccgtcaaaaaaaaaataaaaaaataaaaaaataaaaaaaataaaGAGGAGCACACATCTCTGCCCATCCTAACTCCCACTTTGACATTGAGGTCCCCAGGATGGAGGGTCTGCCTCCATCTGCCTTGTCCCCTG-CAATGGTGGGAAGGTGATGGAGCTCAAGTCTAGAGGCCACCAGCTTCTTAGGGAGG--TAGGAGGTG---------------GAGGGTGGGGTGC-GGGCCCTGCACACAACTGCCAAGTGAGGATGGGGGTGGG-GTCCACCTGAGGAT
AAGTAACAGTGAGGCTGGTGCAGAGGACCCAGGTGGAGGTAGACAGCAGAATTTGTGGTGGGGT--GGATGGCAC-ATTATATAAGCCTCTCTTGC------TGCCCTGT---TTACTGAGATTGTTTCAttatcttttttggcttttgtttttaagagatggggtcttgctgtgtcacacaggctggagtgcactgtgtgatcatacctcactgcagcctcgacatcctgggctcaggcaaacctcccaccttggcctcccaagtagctgggaccacaagcgtttgccaccacactcagctatttttatttttattttta--ttttttttagagatggggtcttgctgtgtcgcccaggctggtcttgaactcctgggctcaagcgatcctcctgccttggcctcccaaagccctgggattataggctgagccaccacacccagccACATTTCATCTGTGCAGCTCCAGGGGCTCCACATTCT-ACTCTTCTCATTTCTTCTCCAGGGTACCC----------ATGGCAAGGGATGAGGGT--AGAAGATGGGGCA--GCCAGGCCTTGATTAAAGGAGAAGGAAGGCAGCCTGTGGAGAGG---GCAGCC---C---AGGGAG---TGCAGAGAGAAGTGGGCCATGAGGGAGA---CAGCAGAGTGCAGGCTGCGTCC---CAAATGAGCATACAGCCCACTGTGAGCCCACC--ATCTTCCTAGA-GA--CCCCTCTCCTCTCC-AGGAGCTGCTTCAGTAGCACTCA---------GAGGAAAGAATGATGC--------TGTATCAACATTTCAGCAGCTCATCTTTTAACTCTAAGAAAATGGCAGCTCCTAAATGTTCAA--AACTGCTTTGGAAACTTCT---GGAGAGAGGTTTTGCAGCTCAGGCAGACAGCTGATCGCGGCCTTTCTTCCACCCCAACCCATGCTCTCCCCATGCT--CTCCTGCCACAGCTGCAGCGGGCCCCTGGGTCCTACATTTGCAG-CCCTTTGTCTCTGAGCT-----CAGACTTCCAATTCCAAGCGGCAGCTGGGCAGGCTCACCAGCATGT---CCAGCCAGTACTAGGACATCAGCAGGAGC----CCAACCACCTCTTTCCAAAATCTCTCCTCATGTCTCTCCTAGTTTCCATCTCCATCCTTCTAGTCAGCCAGGCTGAAAACATT-----------------TGCTCCTCAGGGTGCAGAAGGGAAAGCTTTGCCTCCCTTCCTGGTGCTCACTGCCCCTGCGATTCCAGCCCAAGCCCTCCCCGGCTCCTCACC----------CTGGTGTCAGCTGGAAGCCACCATCTCCTAAACCCACCTGtgttcttccacctctgc--------cagggctgc-cctctcctccaccttcacaaactcaattcctacccattctcaggtcccttatcaaatgccatctcctccatgatgcctccctgattccccTGCTGGAaataatggtgataacagctaag--gcattggggttggctacgtgccaggcaaggagttggcactttacatgctttatctcatttcagccacataacatcgacaggt-ggcattatgattcatatcatccccatctgatagccaggaaaactgagtcccagagaggttagc-cactttcctagggccCTGTGCTCTGACTCAAGCATAGCTCTGAGGAACTCTAGCATTCATCAGTTTAAGCACCATGACTTTCTTTGCTGAGTCACCCAAGGCAT-TTCTTCATTTAAATGTTCTTCCTTGGCCAGGCGCAGTGGCTCAggcccaatgcggtggctcacgcctgtaatctcaacactttgggaggccgaggtgggcagataatctgaggtcaggagttcaagaccagcctggccaacatggtgaaaccccatctctactaaaaatacaaaaaaatgaggctgggcgtgatgactcacacctgtaatcccagcactttgggaggcca
aggcaggtggattacatgaggtcaggagttcgagaccagcctggccaacatggtgaaatcctatctctattaaaaatacaaaaaattagccaggcatggtggcaggcacctgtaatcccagctacttgggaggctgaggcaggaaaatggcttgaacccgggaggtggaggttgcagtgagccaaggttgcaccattgcactccagcctgggcaaaaagagggaaacatcgtctaaaaaagaaaaaaaaaaaattagccaggctgggtggtgcatgcccgtaattccagctactcaggaggatgaagcaagagaattgcttgaacccaggaggcagagattacagtgagctgagatcacaacactgcactccagcctaggtaaagaacaagactccatctcaaaaataaataaataaaaataaaTGTTCTTCCTTGCAATGAAGTTAAATATGTAAATTCTCAAACCAGTTGCTTAAGGGCACAGTTTTGTTCTTTACCTATATTTTTAACAAATATTTTATGTAAGTAGTTGAC-AAAATCAAATACTGT-GTACACTACCGAGGCTTCCCTGGGAAAGCCATCAG-CCTCTGCCCCATCCCTTCCCACTCCTGATT-CCACTTTCCTGTGTTTCCATATCTTTTTCATGTCTGTTTCTGGCCCACAGTGGGCGATCAATACATGTTAGCCACCAACCATCAAACCTATATTGAGTAATTATGGTATGTCAGGCACTATGCTCAATGAAATTGTAttaggcttgtacaaaagtaattgtggtttttaagagtaatggcaaaaacggcagttactttcgcaccaacTATTTGCTGCCTTGAATTATTCCTCCTCTC-CTCATCCCTAAACCCTGCTCCTCCCAGCCATTCTTCCTCCCCTTCTTGGGCCATGGCCAGGCCCCACCCAGGTACTAAGACTCAGGTGAACCAAGGAAGACTTAATGCCCACTCTTTTCTGATGCCCATGTT--GGCATGTGTTAAGtcggttagcattaagtttggctgcatttagcagagacccaaaagaacagtgccttttaaaaggcagaggttatgtctctcacacacacccagcacaagtccaag-------------------------accagcatggcatctcagctccatcaa--cctcaggaaccgagctcctgcagctccctgccctgcagttgataaggtgaggtctttgtcctcctggttcaagatggtgctagaatgttggctaccatatctatagtccaggcatcagaatggagcaagggatgaaaaaggaagagatgaaggcacacgacaggttcctgagagctggcacaggacacttctgcttatatttcactggccagaacttagtcacatggtcacacctagttgggagactctgagaagtaa----agtatttattctagatggccatatccctacc-taagacttggagttttctatgactggggaagaacggaagacaagatattgggaaagactagcagcctctactaAAAGGGTGATCtgtgttgatgtgcgtgtgtgtgtgatgtttgtatg---agcatgtgtgt-tatgtgttgt--gtgtTGGTGGGGCA--GATTCTTGCGAGCACTTTGGTCTCAGATGGACCTGCTACCAGTTCTCTCTGCAGACCCCCATAGGTTTCTCCTAAACCTGGCCT-CTCCTATTAGGCAGCCTTACTCAGCGGCAGCTTCTCAGCTCCATGTTTTCAAGGAACCACAATTTATTTCCAGCATCCACTGAAGCATATTATCAGTGGTGATAGAGGGGGCTTGTAAAACTGTTTTTCCACTTAGGTATTAGAGGGTGGCCATTATTTGAGAGTGAC-----TATGACCACAGTTAATCTGGTAATAAATTCTCTTGGGTAGGAGGGGGAAAGGAAAGGATGCTTTAAGGAAGCATCTTGCCAGGAGACACAAAGCTAACAAGAGTGGAGCCTGCAG---------
-------------------CTGGAGCCGCAGAGCCTAATCACTACACCCGCCCATCTCTGCTAGGGTTTCATGACTTCGTATCGGGGATTAGCAGTATTTAACTCTGTTGCACAAACATTTGGTGTA-----TTATTCAGGTAACAAGTAGCTAATAGAGGAAGTTTTACTTTTTTAAGACATAA--------------------ATTTGCCTTTTCCCAAATTACTTGGTACATAGTAC-TTTTCATGTTTGAAGTTGAGATGTGGGTACAATACCATAGCTTTATTCCAGAGCAGGGTATTTGTTTCCAAATGCCATGTTCCCAGCAGCTGCCCTTGACTGGGAATTGGGGTG-----TGATTTGGGCTTTTCCTTAAATCCTTGA-----GGAGCTGGA---GGGGTGGGTGGCTCGCACTCCTGCTTTctgg---------atctgaatc--------------ctgactctgtcatggacctgtt-tgactttgggcaagttgactcctattcctgagccccatat-ttttctcttctgtgaaattcagattaaaaA-AACATGGCTTTGATCAAACATTATAAATAATATATAGACAGACTGCTTGTTTTTATTGTATTGCCAG-AAATGAATCCTACTAATATTGCCATCTATGGACAGAAAATGTATTACCTGTCTTCATCAAGACCCAGACGAGGAAGAACACGAAAAGCGGAGATTAATTTTACTGCCATCTCCAGAACCGTCATCCTAATATTTACTTACAT-TTTATTATTATTTCAGGCTCATGCACATATACTTAGCATGGATCATTGGCCACAGACTCGCATACATTTAACTTTATTACCTTT-TGCCTCATGTATCTCATTAAAATTTTGCTGCTTAATCAAGGATCTGCATATTATTTTAATTTTAGAATTCACAGTTCCAAGACTTTGAAAGTTTCAAGCGTTCTGGGTGaatgtgttatgc--tctctcccgccaccatgtctttataccccctgatttctcagccact-atggcaaccactttctactcttagtagcccatatttag--tccaatccccagctcaggagacacttcttccaggg--agccccctgtgccttccagtagtatcttgtacctgccctttttgcaaagctctttcctcctggcttagaatggcccattgacctgtttgtttctcctattaaactgtaagccactcgagggtagagagcatctgttgttcaccattgcatcctcggtgctgagcactgcgtctgacatattatttagaaggtcagtaagtgctagtgggatTCAGGCTCCCAGTGGGTGGGAGAGAAAGGACGTAAGGAAGCAAGTGGTAAAGGCCCTCACAGA-GTATCAGCAGGCTGGTGTGA-GGGAGAAATGCAGAGGATGGGTGAGTAGCA-----TAATCGCTAATGAT-AGGGTAATGATAGAGCACATTTCACAACACCTTt-aagccctttcacgtgcatcagataatttgatcctcataaaagcctagagatagatatattacagg-gatgaaggtggagtattttgtggttatgtgatatg-tttaaaattatgcagtgagtaaatgactgggttcaaaccagaccttaaaagtctgttatctttccCTCG-AGCATGCAATGAAGTCTACATCATCCCTACCATGTCCATTTGATCACACCCTGGCCTCACAGCTCTGTGGTCTACAGGATACCTCATGGTGGTTTTATTGACCAGACAATAATCCTCTTTCTAAGGGGATGCATTTCATTAATACATATGTAGATCATGAATTGTCTTTGACTTTGAGGGGATGGTAGC----CAGAGCAGAAAGCAAAGCTGATTTTCATCCCCGTCTGGTAATGTGGTTGGTAATGTGAAGA-TGGGTGTATTCTGAGATACCGGCTCCTTGCAGTGTGTGGTTCCTTCTGTTTTCAGGCCC------AAGAAGCCCATCCTGGGAAGG
AAAATGCATTGGGGAACCCTGTGCGGATTCTTGTGGCTTTGGCCCTATCTTTTCTATGTCCAAGCTGTGCCCATCCAAAAAGTCCAAGATGACACCAAAACCCTCATCAAGACAATTGTCACCAGGATCAATGACATTTCACACACGGTAAGGAG---AGTATGCGGGGACAAA---GTAGAACTGCAGCCAGCCCAGCACTGGCTCCTAGTGGCACT-GGACC-CAGATAGtccaagaaacatttattgaacgcctcctgaatgccaggcacctactggaagctgagaaGGATTTGAAAGCACAGGGC-TCCACTCTTTCTGGTTGTTTCTTTTGGCCCCTCTGCCTGCTGAGATTCCAGGGGTTAGTGG--------------------------------------------------------TTCTAATTCTAAACCACTCCAAGAACATTTGATTTTGCTACATGTTTCCATTTAAAAATCATAGGATTTGggctgggtgtggtggcttgtacctgtcatcccagcactttgggaggccaaagcaggaggatcattcgagcccaagagttcgagaccagcctgggcagcatagggagaccccatctctacaaaaataataaaaaatgttagctgggcatggtggtgtgtacctgtggtcccagctaggggaggctgagatggaaggatcacctgagcctgggaggttgaggctgcagtgggccctgatcatgccaccgtgctccagcctgggtgacagagtgagaccttgtctcaaaataaataaataaataaataaaAGTCATAGGATTTgatcaggcatgatgggtcacatctgtaagcccattgctttaggaggccaaggtaggaggatcagttgaggccaggagttcaagaccagcctgggcaacatggcaagacctctctctctaatttttaaaaaaataaaaaTTAAAGATAAGAAAAAAATCATAGGATTCTCATGAGGCCTCACGTGCTTATTTTCAACCTACCAAGGGGAAACCCAGGCCTCAGCGATTAGCTGAGC----------CACATGCAGGCACAG------------------------CCACTG-----TCTCTTTCCTTCCTGTCCCCTCTGTCCCCACCTTCTGCGCTCGCCTTCCTCCCTGACTTCACTTCCTTGAATCTTAGTGCCTACGACCAGAGGGAGCTGTGAAGTTCCTTG----TGTCCCATTGGCAGGAA-CAAGACCCCCAGAAGCATCTCCTCAGGGC------CTCTA-----TCCCATCTC-TAGATGTGCTTGTCATTAGG-Gttct-------------tgtagttccagctgatctctggccctgccgctcaaagatacccaaaagagcgagtctaccctttttcacattcaaccctctactgatttgcaaatagcagtcagtgcccaccctggtcttttctctggggtccagcaggcctagaccttcagccattttcctgatgaGGTCTGTAtttgaaattaggaagattaagtttgaatcttcacacttctgat----gtctgtgagatcttcagcaagttccttact--gtctttaagccttgt-tttcatcatctggataatggggatatcacacacta-ttcacaaggttgttatgaggcctaaattagctaaagcaATTGAATCCTCCTTACCCCCTGCATGGAGCTCTCTGGAGACTTCCACGTCTCCTGGTCATTGTGGGTGTCTTATGGTA-GTCTTGGGCAGTTAGGGAGAAGTTAGGTGTCTGGAAGCAAAGATGGCTCAGAACTAGATAGAGTC-TTGGGCATTTTATA-GATAAAAACTCTT--GTCTCCtttaaaaataataaaaaaaaattaGCTGGGCATATTAGCCACTCAGCAAGACTGCACGTGATAGATCCCGAGTGCCCCACCTTGGGTGGTGTAATACACAATATCACGGGAGCCCCGGGTAGTAACCACGGAGGTG
TCAGCCTCAGTGCTGTGGGCAGATG-GATGGGGAGAGCC--TCCCGG-AACTGGAGTCACTGGAGCA----------------------------GGGTTGGGGGGCCTCACTGAGGGTACGGCCTTGATCTCTAAGGAGGAGGGACTGCCTGGAAAAGC-TGACTGGGAGGGAGGACTCGGCTGGGGGTAGAAGGGA----------CTAGGGAAGGCTGGGGGTGGGGGTGCTTATGGAGGACCTCAGATGCCTGGGGAACAGACTCCACTAAATAAAACATATGAAACCATGGCTGGTTCTTCAGCAGAGGCCATGTAGAGAAAGGAATGACCTAGGAAAGTTGGCCTGGAAGTGGAGGGAAGGATGGTGTGGGAAAAGCAGGAA--------TCTCGGAGACCAGCTTAGAGGCTTGGCAGTCACCTGGGTGCAGG-ATACAAGGGCCTGAGCCAAAGTGGTGAGGGAGGGTGGAAGGAGGCAGCCCAGAGAATGACCCTCCATGCCCACGGGGAAGGCAGAGGGCTCT-GAGAGCGA--TTCCTCCCACATG-CT-GAGCACTTGTTCTCCCTCTTCCTCCTGCATAGCAGTCAGTCTCCTCCAAACAGAAAGTCACCGGTTTGGACTTCATTCCTGGGCTCCACCCCATCCTGACCTTATCCAAGATGGACCAGACACTGGCAGTCTACCAACAGATCCTCACCAGTATGCCTTCCAGAAACGTGATCCAAATATCCAACGACCTGGAGAACCTCCGGGATCTTCTTCACGTGCTGGCCTTCTCTAAGAGCTGCCACTTGCCCTGGGCCAGTGGCCTGGAGACCTTGGACAGCCTGGGGGGTGTCCTGGAAGCTTCAGGCTACTCCACAGAGGTGGTGGCCCTGAGCAGGCTGCAGGGGTCTCTGCAGGACATGCTGTGGCAGCTGGACCTCAGCCCTGGGTGCTGAGGCCTTGAAGGTCACTCTTCCTGCAAGGACTACGTTAAGGGAAGGAACTCTGGCTTCCAGGTATCTCCAGGATTGAAGAGCATTGCATGGACACCCCTTATCCAGGACTCTGTCAATT--TCCCTGACTCCTCTAAGCCACTCTTCCAAAGGCATAAGACCCTAAGCCTCCTTTTGCTTGAAACCAAAGATATATACACAGGATCCTATTCTCACCAGGAAGGGGG-TCCACCC-AGCAAAGAGTGGGCTGCATCTGGGATTCCCACCAAGGTCTTCAGCCATCA---ACAAGAGTTGTCTTGTCCCCTCT-TGACCCATCT-----------------CCCCCTCACTGAATGCCTCAATGTGACCAGGGGTGATTTCAGAGAGGGCAGAGGGGTAGGCAGAGCCTTTGGATGACCA--GAACAAGGTTCCCTCTGAGAATTCCAAGGAGTTCCATGAAGACCACATCCACACACG--CAGGAACTCCC--AGCAACACAAGCTGGAA---GCACATGTTTATTTATTCTGCATTTTATTCTGGATGGATTTGAAGCAAAGCACCAGCTTCTCCAGGCTCTTTGGGGTCAGCCAGGGCCAGGGGTCTCCCTGGAGTGCAGTTTCCAATCCCATAGATGGGTC-TGGCTGAGCTGAACCCA---TTTTGAGTGACT----CGAGGGTTGGG-TTCATCTGAGCAAGAGCTGGCAAAGGTGGCTCTCCAGTTAGTTCTCTCGTAACTGGTTTCATTTCTACTGTGACTGATGTTACATCACAGTGTTTGCAATGGTGTTGCCCTGAGTGGATCTCCAAGGACCAGGTTATTTTAAAA---AGATTTGTTTTGTCAAGTGTCATATGTAGGTGTCTGCACCCAGGGGTGGG-GAATGTTTGGGCAGAAGGGAGAAGGATCTAGAATGTGTTTTCTGAATAACATTTGTGTGGTGGGTTCTTTGGAAGGAGTGAGA-TCATTTTCTTATCTTCTGCAATTGCTTAGGATGTTTTTCATGAAAA------------TAGCTCTTTCAG-GG
GGGTTGTGAGGCCTGGCCAGGCACCCCCTGGAGAGAAGTTTCTGGCCCTGGCTGACCCCAAAGAGCCTGGAGAAGCTGATGCTTTGCTTCAAATCCATCCAGAATAAAACGCAAAGGGCTGAAAGCCATTTGTTGGGGCAGTGGTAAGCTCTGGCTTTCTCCGACTGCTAGGGAGTGGTCTTTCCTATCATGGAGTGACGGTCCCACACTGGTGACTGCGATCTTCAGAGCAGGGGTCCTTGGTGT-GACCCTCTGAATGGTCCAGGGTTGATCACACTCTGGGTTTATTACATGGCAG-----TGTTCCTATTTGGGGCTTGCATGCCAAATTGTAGTTCTTGTCTGATTGGCTCACCC-AAGCAAGGCCAAAATTACCAAAAATCTTGGGGGG--TTTTTACTC-CAGTGGTGAAGAAAACTCCTTTAGCAGG-TGGTCCTGAGACCT-GACAAGCACTGCTAGGCGAGTGCCAGGACTCCCCAGGCCAGGCCACCAGGATGGCCCTTCCCACTGGAGGTCACATTCAGGAAGATGAAAGAGGAGGTTTGGGGTCTGCCACCATCCTGCTGCTGTGTTTTTGCTATCACACAGTGGGTGGTGGATCTGTCCAAGGAAACTTGAATCAAAGCAGTTAAC-TTTAAGactgagcacctgcttcatgctcagccctgactggtgctataggctggagaagctcacccaataaacattaagatt-gaggcctgccctcagggatcttgcattcccagtggTCAAACC-GCACTCACCCATGTGCCAAGGTGGGGTA-TTTACCACAGCAG--CTGAACAGCCAAATGCATGGTGCAGTTGACAGCAGGTGGGAAATGGTATGAGCTGAGGGGGGCCGTGCCCAGGGGCCCACAGG-GAACCCTGCTTGCACTTTGTAACATGTTTA-----CTTTTCagggcatcttagctt---ctatta-----tagccacatccctttga---aacaagataactgagaatttaaaaataagaa-----aata--TGACCCCAAAGAGCCTGGAGAAGCTGATGCTTTGCTTCAAATCCATCCAGAATAAAACGCAGACCCCAAAGAGCCTGGAGAAGCTGATGCTTTGCTTCAAATCCATCCAGAATAAAACGCAGATGCTTTGCTTCAAATCCATCCAGAATAAAACGCAAATGACCCCAAAGAGCCTGGAGAAGCTGATGCTTTGCTTCAAATCCATCCAGAATAAAACGCATGACCCCAAAGAGCCTGGAGAAGCTGATGCTTTGCTTCAAATCCATCCAGAATAAAACGCAGACCCCAAAGAGCCTGGAGAAGCTGATGCTTTGCTTCAAATCCATCCAGAATAAAACGCAGATGCTTTGCTTCAAATCCATCCAGAATAAAACGCAGACCCCAAAGAGCCTGGAGAAGCTGATGCTTTGCTTCAAATCCATCCAGAATAAAACGCAGACCCCAAAGAGCCTGGAGAAGCTGATGCTTTGCTTCAAATCCATCCAGAATAAAACGCAGACCCCAAAGAGCCTGGAGAAGCTGATGCTTTGCTTCAAATCCATCCAGAATAAAACGCAGATGCTTTGCTTCAAATCCATCCAGAATAAAACGCA
diff --git a/tools/emboss_5/test-data/2.fasta b/tools/emboss_5/test-data/2.fasta
new file mode 100644
index 00000000000..3bfe7d3d3eb
--- /dev/null
+++ b/tools/emboss_5/test-data/2.fasta
@@ -0,0 +1,11 @@
+>Sequence 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+gttcgatgcc taaaatacct tcttttgtcc ctacacagac cacagttttc ctaatggctt
+tacaccgact agaaattctt gtgcaagcac taattgaaag cggttggcct agagtgttac
+cggtttgtat agctgagcgc gtctcttgcc ctgatcaaag gttcattttc tctactttgg
+aagacgttgt ggaagaatac aacaagtacg agtctctccc ccctggtttg ctgattactg
+gatacagttg taataccctt cgcaacaccg cgtaactatc tatatgaatt attttccctt
+tattatatgt agtaggttcg tctttaatct tcctttagca agtcttttac tgttttcgac
+ctcaatgttc atgttcttag gttgttttgg ataatatgcg gtcagtttaa tcttcgttgt
+ttcttcttaa aatatttatt catggtttaa tttttggttt gtacttgttc aggggccagt
+tcattattta ctctgtttgt atacagcagt tcttttattt ttagtatgat tttaatttaa
+aacaattcta atggtcaaaa a
\ No newline at end of file
diff --git a/tools/emboss_5/test-data/2.pep b/tools/emboss_5/test-data/2.pep
new file mode 100644
index 00000000000..94a7e80e884
--- /dev/null
+++ b/tools/emboss_5/test-data/2.pep
@@ -0,0 +1,19 @@
+>HSFAU1_3
+PLSRLHLRGSWDRRSVANMQLFVRAQELHTFEVTGQETVAQIKAHVAS-LEGIAPEDQVV
+LLAG-PLEDEATLGQCGVEALTTLEVAGRMLG-GKVHGSLARAGKVRGQTPKVAKQEKKK
+KKTGRAKRRMQYNRRFVNVVPTFGKKKGPNANS
+>HSFAU2_3
+PLSRLHLRGSWDRRSVANMQLFVRAQELHTFEVTGQETVAQIKAHVAS-LEGIAPEDQVV
+LLAGAPLEDALWASAGWRP
+>HSFAU3_3
+PLSRLHLRGSWDRRSVANMQLFVRAQELHTFEVTGQETVAQIKAHVAS-LEGIAPEDQVV
+LLAGAPLEDEATLGQCGVEALTTLEVAGRMLG-GKVHGSLARAGKVRGQTPKGAKQEKKK
+KKTGRAKRRMQYNRRFVNVVPTFGKKKGPNANS
+>HSFAU4_3
+PLSRLHLRGSWDRRSVANMQLFVRAQELHTFEVTGQETVAQIKAHEIASLEGIAPEDQVV
+LLAGAPLEDEATLGQCGVEALTTLEVAGRMLARGKVHGSLARAGKVRGQTPKVAKQEKKK
+KKTGRAKRRMQYNRRFVNVVPTFGKKKGPNANS
+>HSFAU5_3
+PLSRLHLRGSWDRRSVANMQLFVRAQELHTFEVTGQETVAQIKAHVAS-LEGIAPEDQVV
+LLAGAPLEDEATLGQCGVEALTTLEVGRMLFG-GKVHGSLARAGKVRGQTPKVAKQEKKK
+KKTGRAKRRMQYNRRFVNVVPTFGKKKGPNANS
\ No newline at end of file
diff --git a/tools/emboss_5/test-data/3.fasta b/tools/emboss_5/test-data/3.fasta
new file mode 100644
index 00000000000..ddaab64c88d
--- /dev/null
+++ b/tools/emboss_5/test-data/3.fasta
@@ -0,0 +1,50 @@
+>HSFAU1
+ttcctctttctcgactccatcttcgcggtagctgggaccgccgttcagtcgccaatatgc
+agctctttgtccgcgcccaggagctacacaccttcgaggtgaccggccaggaaacggtcg
+cccagatcaaggctcatgtagcctcactggagggcattgccccggaagatcaagtcgtgc
+tcctggcaggccccctggaggatgaggccactctgggccagtgcggggtggaggccc
+tgactaccctggaagtagcaggccgcatgcttggaggtaaagttcatggttccctggccc
+gtgctggaaaagtgagaggtcagactcctaaggtggccaaacaggagaagaagaagaaga
+agacaggtcgggctaagcggcggatgcagtacaaccggcgctttgtcaacgttgtgccca
+cctttggcaagaagaagggccccaatgccaactcttaagtcttttgtaattctggctttc
+tctaataaaaaagccacttagttcagtcaaaaaaaaaa
+>HSFAU2
+ttcctctttctcgactccatcttcgcggtagctgggaccgccgttcagtcgccaatatgc
+agctctttgtccgcgcccaggagctacacaccttcgaggtgaccggccaggaaacggtcg
+cccagatcaaggctcatgtagcctcactggagggcattgccccggaagatcaagtcgtgc
+tcctggcaggcgcgcccctggaggatgcactctgggccagtgcggggtggaggccc
+tgactaccctggaagtagcaggccgcatgcttggaggtaaagttcatggttccctggccc
+gtgctggaaaagtgagaggtcagactcctaaggtggccaaacaggagaagaagaagaaga
+agacaggtcgggctaagcggcggatgcagtacaaccggcgctttgtcaacgttgtgccca
+cctttggcaagaagaagggccccaatgccaactcttaagtcttttgtaattctggctttc
+tctaataaaaaagccacttagttcagtcaaaaaaaaaa
+>HSFAU3
+ttcctctttctcgactccatcttcgcggtagctgggaccgccgttcagtcgccaatatgc
+agctctttgtccgcgcccaggagctacacaccttcgaggtgaccggccaggaaacggtcg
+cccagatcaaggctcatgtagcctcactggagggcattgccccggaagatcaagtcgtgc
+tcctggcaggcgcgcccctggaggatgaggccactctgggccagtgcggggtggaggccc
+tgactaccctggaagtagcaggccgcatgcttggaggtaaagttcatggttccctggccc
+gtgctggaaaagtgagaggtcagactcctaagggggccaaacaggagaagaagaagaaga
+agacaggtcgggctaagcggcggatgcagtacaaccggcgctttgtcaacgttgtgccca
+cctttggcaagaagaagggccccaatgccaactcttaagtcttttgtaattctggctttc
+tctaataaaaaagccacttagttcagtcaaaaaaaaaa
+>HSFAU4
+ttcctctttctcgactccatcttcgcggtagctgggaccgccgttcagtcgccaatatgc
+agctctttgtccgcgcccaggagctacacaccttcgaggtgaccggccaggaaacggtcg
+cccagatcaaggctcatgaaatagcctcactggagggcattgccccggaagatcaagtcgtgc
+tcctggcaggcgcgcccctggaggatgaggccactctgggccagtgcggggtggaggccc
+tgactaccctggaagtagcaggccgcatgcttgcccgaggtaaagttcatggttccctggccc
+gtgctggaaaagtgagaggtcagactcctaaggtggccaaacaggagaagaagaagaaga
+agacaggtcgggctaagcggcggatgcagtacaaccggcgctttgtcaacgttgtgccca
+cctttggcaagaagaagggccccaatgccaactcttaagtcttttgtaattctggctttc
+tctaataaaaaagccacttagttcagtcaaaaaaaaaa
+>HSFAU5
+ttcctctttctcgactccatcttcgcggtagctgggaccgccgttcagtcgccaatatgc
+agctctttgtccgcgcccaggagctacacaccttcgaggtgaccggccaggaaacggtcg
+cccagatcaaggctcatgtagcctcactggagggcattgccccggaagatcaagtcgtgc
+tcctggcaggcgcgcccctggaggatgaggccactctgggccagtgcggggtggaggccc
+tgactaccctggaagtaggccgcatgctttttggaggtaaagttcatggttccctggccc
+gtgctggaaaagtgagaggtcagactcctaaggtggccaaacaggagaagaagaagaaga
+agacaggtcgggctaagcggcggatgcagtacaaccggcgctttgtcaacgttgtgccca
+cctttggcaagaagaagggccccaatgccaactcttaagtcttttgtaattctggctttc
+tctaataaaaaagccacttagttcagtcaaaaaaaaaa
\ No newline at end of file
diff --git a/tools/emboss_5/test-data/emboss_antigenic_out.tabular b/tools/emboss_5/test-data/emboss_antigenic_out.tabular
new file mode 100644
index 00000000000..6d40c606802
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_antigenic_out.tabular
@@ -0,0 +1,23 @@
+SeqName Start End Score Strand Max_score_pos
+Sequence 196 225 1.340 + 221
+Sequence 253 283 1.263 + 266
+Sequence 27 45 1.241 + 32
+Sequence 60 72 1.236 + 66
+Sequence 357 368 1.214 + 360
+Sequence 130 159 1.191 + 148
+Sequence 83 93 1.186 + 87
+Sequence 165 175 1.147 + 173
+Sequence 6 22 1.147 + 20
+Sequence 293 301 1.147 + 299
+Sequence 324 343 1.147 + 330
+Sequence 473 481 1.142 + 479
+Sequence 540 551 1.119 + 545
+Sequence 501 510 1.114 + 504
+Sequence 409 415 1.097 + 412
+Sequence 48 56 1.097 + 51
+Sequence 553 558 1.092 + 558
+Sequence 106 112 1.087 + 110
+Sequence 488 494 1.075 + 490
+Sequence 423 429 1.075 + 426
+Sequence 118 123 1.070 + 118
+Sequence 239 247 1.042 + 245
diff --git a/tools/emboss_5/test-data/emboss_backtranseq_out.fasta b/tools/emboss_5/test-data/emboss_backtranseq_out.fasta
new file mode 100644
index 00000000000..9b1496cc9a5
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_backtranseq_out.fasta
@@ -0,0 +1,30 @@
+>Sequence 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+GGCACCACCTGCGGCGCCACCGGCTGCTGCACCGCCGCCGCCGCCACCGCCTGCTGCACC
+ACCTGCACCACCACCACCGGCACCTGCTGCTGCACCGCCTGCGCCTGCGCCGGCGCCTGC
+TGCGCCTGCGCCGGCACCACCACCACCTGCTGCACCGCCGCCACCGGCGGCTGCACCACC
+ACCGCCTGCGCCTGCTGCGGCGCCTGCACCGCCGGCGCCGCCGCCACCACCTGCACCACC
+GGCACCGGCTGCGCCGCCGGCTGCGCCTGCACCGCCGCCACCACCGGCGCCGCCGCCGGC
+TGCGGCGGCACCACCGGCGGCTGCTGCACCGCCGGCGCCGGCACCGGCACCACCGCCTGC
+TGCGGCGGCACCACCACCGGCACCGCCACCGCCGGCTGCACCGGCGCCGGCTGCGGCTGC
+GGCACCTGCACCTGCACCACCGGCTGCTGCTGCACCGGCGCCACCTGCGCCGCCGCCGGC
+GGCACCACCTGCGCCACCACCACCACCTGCACCTGCACCGCCTGCACCACCACCGGCGGC
+GCCGCCGGCGCCTGCGGCACCACCGGCACCGGCGGCGCCGCCGGCGCCGCCACCGCCTGC
+GCCGCCTGCGCCGCCGGCACCGCCTGCGGCGCCGGCACCTGCACCTGCACCTGCTGCTGC
+TGCTGCTGCACCGGCGGCACCACCACCGGCTGCACCGGCGCCACCACCGCCTGCACCGGC
+GGCGCCACCGCCTGCGCCGGCACCACCGGCACCGCCGCCACCGCCTGCTGCTGCACCACC
+TGCGGCTGCGCCGCCTGCGCCTGCTGCGGCTGCGGCACCGCCGCCTGCACCGCCACCTGC
+ACCGCCACCGCCACCGGCGCCGCCACCACCGCCACCACCACCACCTGCTGCTGCACCACC
+ACCGCCACCACCGCCACCGCCACCGGCACCGCCGGCACCGCCGGCGGCACCACCTGCGGC
+ACCTGCACCACCACCGCCGCCACCTGCACCACCTGCTGCACCACCACCGCCGGCTGCGCC
+GCCGGCACCTGCACCACCACCACCGCCTGCACCGGCACCACCACCACCTGCGGCGCCTGC
+TGCACCTGCGCCGCCACCGGCACCACCTGCGCCACCGGCACCACCTGCACCACCGCCGGC
+GGCACCACCGGCACCACCACCACCGGCGGCGCCACCGCCGCCACCGCCACCGGCTGCGGC
+GGCACCTGCGCCGGCACCACCACCGCCGCCACCTGCACCACCTGCGGCACCACCGGCACC
+ACCACCTGCACCACCTGCACCACCGCCGCCGCCGCCACCGCCACCACCACCGCCACCACC
+TGCGCCACCGGCGGCACCACCACCGCCGCCACCACCACCACCACCGGCGGCACCACCACC
+GGCACCGCCTGCACCACCGGCACCACCTGCGCCGGCGGCGGCGGCTGCTGCGCCGGCACC
+ACCTGCGCCACCACCGCCACCACCACCGCCTGCACCTGCACCGGCACCACCACCGGCACC
+GCCACCGCCTGCGCCGGCTGCGCCGGCACCACCTGCACCACCACCACCGCCACCACCACC
+ACCACCGCCGGCACCGCCACCGGCGCCACCACCACCACCGCCGCCACCACCACCGCCGCC
+GCCGCCTGCGCCGCCACCACCTGCACCGCCGCCACCGGCGGCACCTGCGCCGCCGCCGCC
+GCC
diff --git a/tools/emboss_5/test-data/emboss_banana_out.txt b/tools/emboss_5/test-data/emboss_banana_out.txt
new file mode 100644
index 00000000000..ec63db01198
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_banana_out.txt
@@ -0,0 +1,562 @@
+Base Bend Curve
+g 0.0 0.0
+t 10.8 0.0
+t 18.5 0.0
+c 26.9 0.0
+g 22.1 0.0
+a 19.5 0.0
+t 20.7 0.0
+g 26.2 0.0
+c 25.2 0.0
+c 12.5 0.0
+t 6.8 0.0
+a 3.4 0.0
+a 0.0 0.0
+a 1.3 0.0
+a 5.9 0.0
+t 10.6 0.0
+a 14.9 0.0
+c 17.7 0.0
+c 17.3 0.0
+t 13.3 0.0
+t 10.2 23.2
+c 13.9 22.5
+t 8.8 21.7
+t 0.0 20.6
+t 5.7 19.2
+t 13.9 17.7
+g 17.3 16.5
+t 15.1 15.5
+c 16.1 14.7
+c 18.7 13.9
+c 12.5 13.2
+t 9.7 12.5
+a 14.5 11.8
+c 19.1 11.1
+a 19.1 10.6
+c 15.3 10.0
+a 12.2 9.2
+g 14.3 7.9
+a 17.7 6.4
+c 17.7 5.0
+c 19.5 3.5
+a 19.1 2.9
+c 15.3 3.9
+a 16.3 5.5
+g 15.5 6.8
+t 6.3 7.8
+t 0.0 8.5
+t 5.0 9.3
+t 11.0 10.0
+c 15.1 10.8
+c 12.5 11.6
+t 6.8 12.5
+a 4.5 13.4
+a 12.4 14.3
+t 19.7 15.1
+g 25.2 15.7
+g 28.5 16.2
+c 20.7 16.6
+t 8.8 17.0
+t 3.4 17.5
+t 9.3 18.1
+a 14.5 18.5
+c 19.1 18.6
+a 19.5 18.5
+c 16.5 18.3
+c 21.1 18.0
+g 22.3 17.4
+a 18.3 16.3
+c 13.2 15.1
+t 7.2 13.8
+a 9.0 12.6
+g 10.2 11.4
+a 5.0 10.9
+a 1.3 11.0
+a 2.4 11.4
+t 6.1 11.9
+t 10.2 12.3
+c 13.9 12.5
+t 13.9 12.4
+t 13.9 12.4
+g 19.1 12.6
+t 20.5 12.9
+g 19.7 13.2
+c 15.3 13.1
+a 13.9 12.7
+a 20.7 12.2
+g 22.1 11.8
+c 20.5 11.5
+a 20.1 11.3
+c 13.2 10.9
+t 6.8 10.2
+a 4.5 9.6
+a 2.4 9.9
+t 6.7 10.9
+t 14.3 12.1
+g 13.7 13.2
+a 5.0 13.8
+a 8.8 13.6
+a 20.7 12.9
+g 24.5 12.1
+c 19.9 11.3
+g 16.5 10.3
+g 14.9 9.0
+t 11.4 7.5
+t 14.3 6.2
+g 25.2 5.2
+g 32.5 4.4
+c 25.2 4.0
+c 12.5 3.8
+t 7.2 3.4
+a 9.0 2.8
+g 14.3 2.4
+a 18.3 2.5
+g 20.1 2.8
+t 19.1 3.1
+g 14.5 3.2
+t 9.3 3.1
+t 9.3 2.6
+a 14.9 2.5
+c 16.5 2.7
+c 15.3 2.7
+g 16.5 2.6
+g 14.9 2.8
+t 6.3 2.9
+t 5.7 2.8
+t 13.9 2.3
+g 14.5 1.6
+t 10.6 0.6
+a 9.2 0.7
+t 8.2 1.8
+a 16.1 2.7
+g 24.5 3.7
+c 19.1 4.6
+t 15.7 5.6
+g 17.7 6.4
+a 21.1 7.1
+g 24.5 7.7
+c 24.5 8.1
+g 24.5 8.2
+c 21.1 8.0
+g 17.7 7.8
+t 14.3 7.7
+c 14.3 7.7
+t 14.3 7.9
+c 13.9 8.4
+t 13.9 9.1
+t 15.3 10.2
+g 26.2 11.3
+c 26.2 12.2
+c 18.7 12.7
+c 15.7 12.9
+t 15.7 12.9
+g 17.5 12.9
+a 17.3 13.0
+t 17.5 13.2
+c 14.3 13.3
+a 5.7 13.3
+a 8.8 13.2
+a 17.3 13.0
+g 17.7 12.9
+g 14.9 12.7
+t 10.8 12.6
+t 13.7 12.6
+c 19.7 12.6
+a 12.4 12.7
+t 1.3 12.9
+t 0.0 13.1
+t 5.0 13.1
+t 10.2 12.9
+c 14.3 12.6
+t 14.3 12.3
+c 9.0 11.9
+t 9.7 11.6
+a 15.5 11.2
+c 17.9 10.6
+t 8.8 9.9
+t 5.7 9.0
+t 14.3 8.1
+g 15.1 7.4
+g 11.0 6.8
+a 13.3 6.3
+a 13.9 5.9
+g 14.3 5.6
+a 17.7 5.3
+c 17.7 5.1
+g 14.9 5.0
+t 11.4 5.1
+t 13.9 5.2
+g 19.1 5.2
+t 19.5 5.0
+g 15.1 4.9
+g 11.0 4.9
+a 13.3 4.9
+a 13.9 4.9
+g 10.2 5.1
+a 6.1 5.5
+a 5.9 6.3
+t 10.6 7.0
+a 14.5 7.8
+c 13.9 8.4
+a 11.4 8.6
+a 14.5 8.7
+c 13.9 8.8
+a 13.9 8.9
+a 17.9 9.0
+g 15.5 9.0
+t 12.0 8.8
+a 14.9 8.9
+c 22.3 9.1
+g 22.3 9.3
+a 18.3 9.6
+g 18.3 9.9
+t 14.3 10.1
+c 14.3 10.2
+t 14.3 10.5
+c 14.3 11.2
+t 15.1 12.3
+c 16.1 13.4
+c 19.7 14.2
+c 19.7 14.9
+c 19.7 15.1
+c 18.7 15.0
+c 15.7 14.8
+t 15.7 14.4
+g 17.7 14.1
+g 14.9 13.5
+t 6.3 12.9
+t 5.7 12.4
+t 15.3 11.9
+g 22.1 11.5
+c 19.1 11.1
+t 15.7 10.4
+g 17.5 9.4
+a 10.1 8.3
+t 4.5 7.2
+t 9.3 6.2
+a 15.5 5.2
+c 16.3 4.2
+t 15.7 3.2
+g 15.1 2.5
+g 14.9 2.3
+a 13.3 2.9
+t 10.6 3.7
+a 14.5 4.5
+c 15.3 5.3
+a 16.3 6.1
+g 15.5 7.0
+t 11.4 7.5
+t 13.9 7.7
+g 14.5 7.9
+t 9.3 8.3
+a 4.5 8.6
+a 5.9 9.1
+t 10.6 9.7
+a 14.9 10.4
+c 18.7 11.1
+c 18.7 11.7
+c 17.3 12.1
+t 13.3 12.6
+t 18.5 12.9
+c 25.7 12.9
+g 22.1 12.6
+c 15.3 12.2
+a 11.4 11.7
+a 14.5 11.0
+c 19.1 10.3
+a 19.5 9.7
+c 16.5 9.0
+c 19.9 8.1
+g 24.5 7.2
+c 21.1 6.4
+g 14.9 5.5
+t 9.3 4.5
+a 9.3 3.5
+a 15.5 2.5
+c 13.2 1.7
+t 8.2 1.0
+a 13.3 0.8
+t 14.1 1.6
+c 9.0 2.9
+t 8.2 4.5
+a 9.2 6.0
+t 9.2 7.4
+a 15.6 8.8
+t 19.7 10.3
+g 13.7 11.7
+a 6.1 12.9
+a 2.4 14.1
+t 4.5 15.4
+t 7.8 16.6
+a 5.9 17.4
+t 1.3 17.8
+t 0.0 18.0
+t 5.0 18.0
+t 11.0 18.0
+c 16.1 17.9
+c 18.7 17.9
+c 17.3 17.6
+t 8.8 17.4
+t 3.4 17.4
+t 7.8 17.4
+a 5.9 17.5
+t 4.5 17.6
+t 7.8 17.6
+a 9.2 17.8
+t 9.2 18.3
+a 15.6 18.7
+t 19.3 18.8
+g 14.5 18.5
+t 9.7 17.9
+a 13.2 17.3
+g 15.5 16.7
+t 9.7 16.4
+a 12.5 16.0
+g 17.7 15.7
+g 14.9 15.6
+t 10.8 15.7
+t 18.5 15.7
+c 22.3 15.8
+g 17.7 15.6
+t 14.3 15.3
+c 13.9 15.2
+t 8.8 15.3
+t 3.4 15.6
+t 6.4 15.9
+a 4.5 16.4
+a 10.1 17.0
+t 14.1 18.0
+c 13.9 18.9
+t 13.3 19.6
+t 11.0 20.1
+c 15.1 20.5
+c 17.3 20.8
+t 8.8 21.1
+t 3.4 21.3
+t 6.8 21.4
+a 16.1 20.9
+g 22.1 19.9
+c 15.3 18.9
+a 13.9 18.1
+a 17.9 17.4
+g 18.3 16.9
+t 14.3 16.5
+c 13.9 16.5
+t 8.8 16.6
+t 0.0 16.6
+t 3.4 16.6
+t 9.3 16.7
+a 15.5 16.6
+c 16.3 16.4
+t 15.3 16.1
+g 14.5 15.8
+t 6.3 15.5
+t 0.0 15.3
+t 5.0 15.1
+t 18.5 15.2
+c 26.9 15.3
+g 22.3 15.6
+a 17.7 16.2
+c 17.7 16.7
+c 17.7 16.9
+t 17.7 17.1
+c 14.3 17.0
+a 6.7 16.9
+a 12.4 16.5
+t 19.3 16.1
+g 14.5 16.1
+t 10.8 16.2
+t 13.7 16.1
+c 19.7 16.0
+a 21.7 15.7
+t 19.3 15.3
+g 14.5 14.7
+t 10.8 14.3
+t 10.2 14.0
+c 13.9 13.8
+t 11.7 13.5
+t 6.8 12.9
+a 12.5 12.3
+g 17.7 11.7
+g 14.9 11.2
+t 11.4 10.6
+t 13.9 10.3
+g 14.5 10.2
+t 6.3 10.2
+t 0.0 10.2
+t 5.7 10.4
+t 14.3 11.0
+g 15.1 11.5
+g 14.9 11.9
+a 13.3 12.0
+t 7.8 12.0
+a 4.5 12.0
+a 5.9 12.0
+t 9.2 12.1
+a 15.6 12.2
+t 20.7 11.8
+g 22.1 11.3
+c 19.9 10.5
+g 16.5 9.8
+g 17.7 8.9
+t 17.7 7.9
+c 15.7 6.9
+a 16.3 5.8
+g 15.5 5.0
+t 6.3 4.5
+t 3.4 4.5
+t 6.4 5.1
+a 4.5 6.2
+a 10.1 7.8
+t 14.1 9.7
+c 13.9 11.7
+t 13.3 13.4
+t 18.5 14.9
+c 22.3 15.9
+g 14.9 16.5
+t 11.4 16.9
+t 13.9 17.0
+g 14.5 16.8
+t 6.3 16.2
+t 5.0 15.3
+t 10.2 14.0
+c 13.9 12.6
+t 13.3 11.1
+t 10.2 9.7
+c 13.9 8.5
+t 11.7 7.2
+t 6.4 6.1
+a 3.4 5.5
+a 0.0 5.7
+a 1.3 6.7
+a 5.9 7.9
+t 9.2 9.1
+a 5.9 9.8
+t 1.3 10.1
+t 3.4 10.3
+t 7.8 10.7
+a 5.9 11.0
+t 6.1 11.3
+t 13.7 11.4
+c 19.7 11.2
+a 21.7 10.8
+t 19.7 10.4
+g 17.7 10.4
+g 14.9 10.8
+t 6.3 11.3
+t 3.4 11.8
+t 6.4 12.2
+a 4.5 12.6
+a 2.4 12.9
+t 1.3 13.2
+t 0.0 13.3
+t 0.0 13.2
+t 5.7 12.8
+t 14.3 12.3
+g 17.7 12.1
+g 14.9 12.0
+t 6.3 12.0
+t 5.7 12.1
+t 13.9 12.2
+g 14.5 12.3
+t 12.0 12.4
+a 15.5 12.5
+c 17.9 12.9
+t 13.9 13.2
+t 13.9 12.8
+g 14.5 11.9
+t 10.8 10.9
+t 13.7 10.1
+c 15.7 9.7
+a 15.7 9.7
+g 18.7 9.8
+g 19.7 9.7
+g 26.2 9.2
+g 32.5 8.8
+c 25.2 8.6
+c 15.7 8.5
+a 16.3 8.4
+g 15.5 8.4
+t 10.8 8.4
+t 13.7 8.6
+c 19.7 8.8
+a 12.4 8.7
+t 4.5 8.5
+t 7.8 8.1
+a 5.9 7.9
+t 1.3 7.8
+t 3.4 7.8
+t 9.3 7.9
+a 15.5 8.2
+c 18.3 8.5
+t 14.3 8.8
+c 12.2 9.1
+t 15.3 9.2
+g 14.5 9.0
+t 6.3 8.4
+t 5.7 7.5
+t 13.9 6.4
+g 14.5 5.5
+t 10.6 4.9
+a 9.2 4.5
+t 10.6 4.1
+a 14.5 3.8
+c 15.3 3.7
+a 19.1 3.8
+g 22.1 3.9
+c 16.7 4.2
+a 16.3 4.8
+g 15.5 5.6
+t 10.8 6.6
+t 10.2 7.6
+c 13.9 8.6
+t 8.8 9.7
+t 0.0 10.8
+t 3.4 11.8
+t 7.8 12.6
+a 5.9 12.8
+t 1.3 12.4
+t 0.0 11.8
+t 0.0 11.2
+t 3.4 10.6
+t 6.8 9.8
+a 13.2 9.0
+g 15.5 8.2
+t 10.6 7.8
+a 15.6 7.8
+t 19.7 8.2
+g 17.5 8.8
+a 10.1 9.2
+t 1.3 9.3
+t 0.0 9.0
+t 3.4 8.5
+t 6.4 7.9
+a 4.5 7.1
+a 2.4 6.1
+t 1.3 5.0
+t 3.4 3.8
+t 6.4 2.6
+a 3.4 2.4
+a 0.0 90.8
+a 6.3 0.0
+a 14.5 0.0
+c 13.9 0.0
+a 6.7 0.0
+a 2.4 0.0
+t 6.1 0.0
+t 10.2 0.0
+c 9.0 0.0
+t 6.8 0.0
+a 4.5 0.0
+a 12.4 0.0
+t 19.7 0.0
+g 17.7 0.0
+g 17.7 0.0
+t 17.7 0.0
+c 14.3 0.0
+a 5.7 0.0
+a 0.0 0.0
+a 0.0 0.0
+a 0.0 0.0
+a 0.0 0.0
diff --git a/tools/emboss_5/test-data/emboss_biosed_out.fasta b/tools/emboss_5/test-data/emboss_biosed_out.fasta
new file mode 100644
index 00000000000..d9276565bed
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_biosed_out.fasta
@@ -0,0 +1,11 @@
+>Sequence 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+GTTCGAGTCCTAAAATACCTTCTTTTGTCCCTACACAGACCACAGTTTTCCTAAGTGCTT
+TACACCGACTAGAAATTCTTGTGCAAGCACTAATTGAAAGCGGTTGGCCTAGAGTGTTAC
+CGGTTTGTATAGCTGAGCGCGTCTCTTGCCCTGATCAAAGGTTCATTTTCTCTACTTTGG
+AAGACGTTGTGGAAGAATACAACAAGTACGAGTCTCTCCCCCCTGGTTTGCTGATTACTG
+GATACAGTTGTAATACCCTTCGCAACACCGCGTAACTATCTATAGTAATTATTTTCCCTT
+TATTATAGTTAGTAGGTTCGTCTTTAATCTTCCTTTAGCAAGTCTTTTACTGTTTTCGAC
+CTCAAGTTTCAGTTTCTTAGGTTGTTTTGGATAATAGTCGGTCAGTTTAATCTTCGTTGT
+TTCTTCTTAAAATATTTATTCAGTGTTTAATTTTTGGTTTGTACTTGTTCAGGGGCCAGT
+TCATTATTTACTCTGTTTGTATACAGCAGTTCTTTTATTTTTAGTAGTATTTTAATTTAA
+AACAATTCTAAGTGTCAAAAA
diff --git a/tools/emboss_5/test-data/emboss_btwisted_out.btwisted b/tools/emboss_5/test-data/emboss_btwisted_out.btwisted
new file mode 100644
index 00000000000..f6f02baaa9c
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_btwisted_out.btwisted
@@ -0,0 +1,7 @@
+# Output from BTWISTED
+# Twisting calculated from 1 to 561 of Sequence
+Total twist (degrees): 19085.5
+Total turns : 53.02
+Average bases per turn: 10.58
+Total stacking energy : -4107.68
+Average stacking energy per dinucleotide: -7.34
diff --git a/tools/emboss_5/test-data/emboss_cai_out.cai b/tools/emboss_5/test-data/emboss_cai_out.cai
new file mode 100644
index 00000000000..fac887ecf4f
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_cai_out.cai
@@ -0,0 +1 @@
+Sequence: Sequence CAI: 0.188
\ No newline at end of file
diff --git a/tools/emboss_5/test-data/emboss_charge_out.charge b/tools/emboss_5/test-data/emboss_charge_out.charge
new file mode 100644
index 00000000000..093f28274e1
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_charge_out.charge
@@ -0,0 +1,560 @@
+CHARGE of Sequence from 1 to 561: window 5
+
+Position Residue Charge
+1 G 0.000
+2 T 0.000
+3 T 0.000
+4 C 0.000
+5 G 0.000
+6 A 0.000
+7 T 0.000
+8 G 0.000
+9 C 0.000
+10 C 0.000
+11 T 0.000
+12 A 0.000
+13 A 0.000
+14 A 0.000
+15 A 0.000
+16 T 0.000
+17 A 0.000
+18 C 0.000
+19 C 0.000
+20 T 0.000
+21 T 0.000
+22 C 0.000
+23 T 0.000
+24 T 0.000
+25 T 0.000
+26 T 0.000
+27 G 0.000
+28 T 0.000
+29 C 0.000
+30 C 0.000
+31 C 0.000
+32 T 0.000
+33 A 0.000
+34 C 0.000
+35 A 0.000
+36 C 0.000
+37 A 0.000
+38 G 0.000
+39 A 0.000
+40 C 0.000
+41 C 0.000
+42 A 0.000
+43 C 0.000
+44 A 0.000
+45 G 0.000
+46 T 0.000
+47 T 0.000
+48 T 0.000
+49 T 0.000
+50 C 0.000
+51 C 0.000
+52 T 0.000
+53 A 0.000
+54 A 0.000
+55 T 0.000
+56 G 0.000
+57 G 0.000
+58 C 0.000
+59 T 0.000
+60 T 0.000
+61 T 0.000
+62 A 0.000
+63 C 0.000
+64 A 0.000
+65 C 0.000
+66 C 0.000
+67 G 0.000
+68 A 0.000
+69 C 0.000
+70 T 0.000
+71 A 0.000
+72 G 0.000
+73 A 0.000
+74 A 0.000
+75 A 0.000
+76 T 0.000
+77 T 0.000
+78 C 0.000
+79 T 0.000
+80 T 0.000
+81 G 0.000
+82 T 0.000
+83 G 0.000
+84 C 0.000
+85 A 0.000
+86 A 0.000
+87 G 0.000
+88 C 0.000
+89 A 0.000
+90 C 0.000
+91 T 0.000
+92 A 0.000
+93 A 0.000
+94 T 0.000
+95 T 0.000
+96 G 0.000
+97 A 0.000
+98 A 0.000
+99 A 0.000
+100 G 0.000
+101 C 0.000
+102 G 0.000
+103 G 0.000
+104 T 0.000
+105 T 0.000
+106 G 0.000
+107 G 0.000
+108 C 0.000
+109 C 0.000
+110 T 0.000
+111 A 0.000
+112 G 0.000
+113 A 0.000
+114 G 0.000
+115 T 0.000
+116 G 0.000
+117 T 0.000
+118 T 0.000
+119 A 0.000
+120 C 0.000
+121 C 0.000
+122 G 0.000
+123 G 0.000
+124 T 0.000
+125 T 0.000
+126 T 0.000
+127 G 0.000
+128 T 0.000
+129 A 0.000
+130 T 0.000
+131 A 0.000
+132 G 0.000
+133 C 0.000
+134 T 0.000
+135 G 0.000
+136 A 0.000
+137 G 0.000
+138 C 0.000
+139 G 0.000
+140 C 0.000
+141 G 0.000
+142 T 0.000
+143 C 0.000
+144 T 0.000
+145 C 0.000
+146 T 0.000
+147 T 0.000
+148 G 0.000
+149 C 0.000
+150 C 0.000
+151 C 0.000
+152 T 0.000
+153 G 0.000
+154 A 0.000
+155 T 0.000
+156 C 0.000
+157 A 0.000
+158 A 0.000
+159 A 0.000
+160 G 0.000
+161 G 0.000
+162 T 0.000
+163 T 0.000
+164 C 0.000
+165 A 0.000
+166 T 0.000
+167 T 0.000
+168 T 0.000
+169 T 0.000
+170 C 0.000
+171 T 0.000
+172 C 0.000
+173 T 0.000
+174 A 0.000
+175 C 0.000
+176 T 0.000
+177 T 0.000
+178 T 0.000
+179 G 0.000
+180 G 0.000
+181 A 0.000
+182 A 0.000
+183 G 0.000
+184 A 0.000
+185 C 0.000
+186 G 0.000
+187 T 0.000
+188 T 0.000
+189 G 0.000
+190 T 0.000
+191 G 0.000
+192 G 0.000
+193 A 0.000
+194 A 0.000
+195 G 0.000
+196 A 0.000
+197 A 0.000
+198 T 0.000
+199 A 0.000
+200 C 0.000
+201 A 0.000
+202 A 0.000
+203 C 0.000
+204 A 0.000
+205 A 0.000
+206 G 0.000
+207 T 0.000
+208 A 0.000
+209 C 0.000
+210 G 0.000
+211 A 0.000
+212 G 0.000
+213 T 0.000
+214 C 0.000
+215 T 0.000
+216 C 0.000
+217 T 0.000
+218 C 0.000
+219 C 0.000
+220 C 0.000
+221 C 0.000
+222 C 0.000
+223 C 0.000
+224 T 0.000
+225 G 0.000
+226 G 0.000
+227 T 0.000
+228 T 0.000
+229 T 0.000
+230 G 0.000
+231 C 0.000
+232 T 0.000
+233 G 0.000
+234 A 0.000
+235 T 0.000
+236 T 0.000
+237 A 0.000
+238 C 0.000
+239 T 0.000
+240 G 0.000
+241 G 0.000
+242 A 0.000
+243 T 0.000
+244 A 0.000
+245 C 0.000
+246 A 0.000
+247 G 0.000
+248 T 0.000
+249 T 0.000
+250 G 0.000
+251 T 0.000
+252 A 0.000
+253 A 0.000
+254 T 0.000
+255 A 0.000
+256 C 0.000
+257 C 0.000
+258 C 0.000
+259 T 0.000
+260 T 0.000
+261 C 0.000
+262 G 0.000
+263 C 0.000
+264 A 0.000
+265 A 0.000
+266 C 0.000
+267 A 0.000
+268 C 0.000
+269 C 0.000
+270 G 0.000
+271 C 0.000
+272 G 0.000
+273 T 0.000
+274 A 0.000
+275 A 0.000
+276 C 0.000
+277 T 0.000
+278 A 0.000
+279 T 0.000
+280 C 0.000
+281 T 0.000
+282 A 0.000
+283 T 0.000
+284 A 0.000
+285 T 0.000
+286 G 0.000
+287 A 0.000
+288 A 0.000
+289 T 0.000
+290 T 0.000
+291 A 0.000
+292 T 0.000
+293 T 0.000
+294 T 0.000
+295 T 0.000
+296 C 0.000
+297 C 0.000
+298 C 0.000
+299 T 0.000
+300 T 0.000
+301 T 0.000
+302 A 0.000
+303 T 0.000
+304 T 0.000
+305 A 0.000
+306 T 0.000
+307 A 0.000
+308 T 0.000
+309 G 0.000
+310 T 0.000
+311 A 0.000
+312 G 0.000
+313 T 0.000
+314 A 0.000
+315 G 0.000
+316 G 0.000
+317 T 0.000
+318 T 0.000
+319 C 0.000
+320 G 0.000
+321 T 0.000
+322 C 0.000
+323 T 0.000
+324 T 0.000
+325 T 0.000
+326 A 0.000
+327 A 0.000
+328 T 0.000
+329 C 0.000
+330 T 0.000
+331 T 0.000
+332 C 0.000
+333 C 0.000
+334 T 0.000
+335 T 0.000
+336 T 0.000
+337 A 0.000
+338 G 0.000
+339 C 0.000
+340 A 0.000
+341 A 0.000
+342 G 0.000
+343 T 0.000
+344 C 0.000
+345 T 0.000
+346 T 0.000
+347 T 0.000
+348 T 0.000
+349 A 0.000
+350 C 0.000
+351 T 0.000
+352 G 0.000
+353 T 0.000
+354 T 0.000
+355 T 0.000
+356 T 0.000
+357 C 0.000
+358 G 0.000
+359 A 0.000
+360 C 0.000
+361 C 0.000
+362 T 0.000
+363 C 0.000
+364 A 0.000
+365 A 0.000
+366 T 0.000
+367 G 0.000
+368 T 0.000
+369 T 0.000
+370 C 0.000
+371 A 0.000
+372 T 0.000
+373 G 0.000
+374 T 0.000
+375 T 0.000
+376 C 0.000
+377 T 0.000
+378 T 0.000
+379 A 0.000
+380 G 0.000
+381 G 0.000
+382 T 0.000
+383 T 0.000
+384 G 0.000
+385 T 0.000
+386 T 0.000
+387 T 0.000
+388 T 0.000
+389 G 0.000
+390 G 0.000
+391 A 0.000
+392 T 0.000
+393 A 0.000
+394 A 0.000
+395 T 0.000
+396 A 0.000
+397 T 0.000
+398 G 0.000
+399 C 0.000
+400 G 0.000
+401 G 0.000
+402 T 0.000
+403 C 0.000
+404 A 0.000
+405 G 0.000
+406 T 0.000
+407 T 0.000
+408 T 0.000
+409 A 0.000
+410 A 0.000
+411 T 0.000
+412 C 0.000
+413 T 0.000
+414 T 0.000
+415 C 0.000
+416 G 0.000
+417 T 0.000
+418 T 0.000
+419 G 0.000
+420 T 0.000
+421 T 0.000
+422 T 0.000
+423 C 0.000
+424 T 0.000
+425 T 0.000
+426 C 0.000
+427 T 0.000
+428 T 0.000
+429 A 0.000
+430 A 0.000
+431 A 0.000
+432 A 0.000
+433 T 0.000
+434 A 0.000
+435 T 0.000
+436 T 0.000
+437 T 0.000
+438 A 0.000
+439 T 0.000
+440 T 0.000
+441 C 0.000
+442 A 0.000
+443 T 0.000
+444 G 0.000
+445 G 0.000
+446 T 0.000
+447 T 0.000
+448 T 0.000
+449 A 0.000
+450 A 0.000
+451 T 0.000
+452 T 0.000
+453 T 0.000
+454 T 0.000
+455 T 0.000
+456 G 0.000
+457 G 0.000
+458 T 0.000
+459 T 0.000
+460 T 0.000
+461 G 0.000
+462 T 0.000
+463 A 0.000
+464 C 0.000
+465 T 0.000
+466 T 0.000
+467 G 0.000
+468 T 0.000
+469 T 0.000
+470 C 0.000
+471 A 0.000
+472 G 0.000
+473 G 0.000
+474 G 0.000
+475 G 0.000
+476 C 0.000
+477 C 0.000
+478 A 0.000
+479 G 0.000
+480 T 0.000
+481 T 0.000
+482 C 0.000
+483 A 0.000
+484 T 0.000
+485 T 0.000
+486 A 0.000
+487 T 0.000
+488 T 0.000
+489 T 0.000
+490 A 0.000
+491 C 0.000
+492 T 0.000
+493 C 0.000
+494 T 0.000
+495 G 0.000
+496 T 0.000
+497 T 0.000
+498 T 0.000
+499 G 0.000
+500 T 0.000
+501 A 0.000
+502 T 0.000
+503 A 0.000
+504 C 0.000
+505 A 0.000
+506 G 0.000
+507 C 0.000
+508 A 0.000
+509 G 0.000
+510 T 0.000
+511 T 0.000
+512 C 0.000
+513 T 0.000
+514 T 0.000
+515 T 0.000
+516 T 0.000
+517 A 0.000
+518 T 0.000
+519 T 0.000
+520 T 0.000
+521 T 0.000
+522 T 0.000
+523 A 0.000
+524 G 0.000
+525 T 0.000
+526 A 0.000
+527 T 0.000
+528 G 0.000
+529 A 0.000
+530 T 0.000
+531 T 0.000
+532 T 0.000
+533 T 0.000
+534 A 0.000
+535 A 0.000
+536 T 0.000
+537 T 0.000
+538 T 0.000
+539 A 0.000
+540 A 0.000
+541 A 0.000
+542 A 0.000
+543 C 0.000
+544 A 0.000
+545 A 0.000
+546 T 0.000
+547 T 0.000
+548 C 0.000
+549 T 0.000
+550 A 0.000
+551 A 0.000
+552 T 0.000
+553 G 0.000
+554 G 0.000
+555 T 0.000
+556 C 0.000
+557 A 0.000
diff --git a/tools/emboss_5/test-data/emboss_chips_out.chips b/tools/emboss_5/test-data/emboss_chips_out.chips
new file mode 100644
index 00000000000..faf968beb2d
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_chips_out.chips
@@ -0,0 +1,3 @@
+# CHIPS codon usage statistics
+
+Nc = 61.000
diff --git a/tools/emboss_5/test-data/emboss_codcmp_out.codcmp b/tools/emboss_5/test-data/emboss_codcmp_out.codcmp
new file mode 100644
index 00000000000..8d2f34efd19
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_codcmp_out.codcmp
@@ -0,0 +1,9 @@
+# CODCMP codon usage table comparison
+# Ehum.cut vs Eacc.cut
+
+Sum Squared Difference = 3.044
+Mean Squared Difference = 0.048
+Root Mean Squared Difference = 0.218
+Sum Difference = 11.470
+Mean Difference = 0.179
+Codons not appearing = 0
diff --git a/tools/emboss_5/test-data/emboss_coderet_out.coderet b/tools/emboss_5/test-data/emboss_coderet_out.coderet
new file mode 100644
index 00000000000..86cf4927375
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_coderet_out.coderet
@@ -0,0 +1,3 @@
+ CDS mRNA non-c Trans Total Sequence
+ ===== ===== ===== ===== ===== ========
+ 0 0 0 0 0 Sequence
diff --git a/tools/emboss_5/test-data/emboss_compseq_out.compseq b/tools/emboss_5/test-data/emboss_compseq_out.compseq
new file mode 100644
index 00000000000..4bfc0c92264
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_compseq_out.compseq
@@ -0,0 +1,34 @@
+#
+# Output from 'compseq'
+#
+# The Expected frequencies are calculated on the (false) assumption that every
+# word has equal frequency.
+#
+# The input sequences are:
+# Sequence
+
+
+Word size 2
+Total count 560
+
+#
+# Word Obs Count Obs Frequency Exp Frequency Obs/Exp Frequency
+#
+AA 40 0.0714286 0.0625000 1.1428571
+AC 27 0.0482143 0.0625000 0.7714286
+AG 26 0.0464286 0.0625000 0.7428571
+AT 41 0.0732143 0.0625000 1.1714286
+CA 26 0.0464286 0.0625000 0.7428571
+CC 24 0.0428571 0.0625000 0.6857143
+CG 15 0.0267857 0.0625000 0.4285714
+CT 41 0.0732143 0.0625000 1.1714286
+GA 19 0.0339286 0.0625000 0.5428571
+GC 17 0.0303571 0.0625000 0.4857143
+GG 19 0.0339286 0.0625000 0.5428571
+GT 43 0.0767857 0.0625000 1.2285714
+TA 50 0.0892857 0.0625000 1.4285714
+TC 38 0.0678571 0.0625000 1.0857143
+TG 37 0.0660714 0.0625000 1.0571429
+TT 97 0.1732143 0.0625000 2.7714286
+
+Other 0 0.0000000 0.0000000 10000000000.0000000
diff --git a/tools/emboss_5/test-data/emboss_cpgreport_out1.gff b/tools/emboss_5/test-data/emboss_cpgreport_out1.gff
new file mode 100644
index 00000000000..3af78520968
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_cpgreport_out1.gff
@@ -0,0 +1,13 @@
+##gff-version 2.0
+##date 2007-10-15
+##Type DNA Sequence
+Sequence cpgreport misc_feature 4 5 17.000 + . Sequence "Sequence.1"
+Sequence cpgreport misc_feature 66 67 17.000 + . Sequence "Sequence.2"
+Sequence cpgreport misc_feature 101 102 17.000 + . Sequence "Sequence.3"
+Sequence cpgreport misc_feature 121 141 34.000 + . Sequence "Sequence.4"
+Sequence cpgreport misc_feature 185 186 17.000 + . Sequence "Sequence.5"
+Sequence cpgreport misc_feature 209 210 17.000 + . Sequence "Sequence.6"
+Sequence cpgreport misc_feature 261 272 43.000 + . Sequence "Sequence.7"
+Sequence cpgreport misc_feature 319 320 17.000 + . Sequence "Sequence.8"
+Sequence cpgreport misc_feature 357 358 17.000 + . Sequence "Sequence.9"
+Sequence cpgreport misc_feature 399 416 19.000 + . Sequence "Sequence.10"
diff --git a/tools/emboss_5/test-data/emboss_cpgreport_out2.cpgreport b/tools/emboss_5/test-data/emboss_cpgreport_out2.cpgreport
new file mode 100644
index 00000000000..3db6c63e2ee
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_cpgreport_out2.cpgreport
@@ -0,0 +1,15 @@
+
+
+CPGREPORT of Sequence from 1 to 561
+
+Sequence Begin End Score CpG %CG CG/GC
+Sequence 4 5 17 1 100.0 -
+Sequence 66 67 17 1 100.0 -
+Sequence 101 102 17 1 100.0 -
+Sequence 121 141 34 3 57.1 1.00
+Sequence 185 186 17 1 100.0 -
+Sequence 209 210 17 1 100.0 -
+Sequence 261 272 43 3 75.0 1.00
+Sequence 319 320 17 1 100.0 -
+Sequence 357 358 17 1 100.0 -
+Sequence 399 416 19 2 44.4 -
diff --git a/tools/emboss_5/test-data/emboss_cusp_out.cusp b/tools/emboss_5/test-data/emboss_cusp_out.cusp
new file mode 100644
index 00000000000..1675df9ef7d
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_cusp_out.cusp
@@ -0,0 +1,72 @@
+#CdsCount: 10
+
+#Coding GC 36.36%
+#1st letter GC 34.22%
+#2nd letter GC 35.29%
+#3rd letter GC 39.57%
+
+#Codon AA Fraction Frequency Number
+GCA A 0.200 5.348 1
+GCC A 0.400 10.695 2
+GCG A 0.400 10.695 2
+GCT A 0.000 0.000 0
+TGC C 0.500 21.390 4
+TGT C 0.500 21.390 4
+GAC D 0.667 10.695 2
+GAT D 0.333 5.348 1
+GAA E 0.500 5.348 1
+GAG E 0.500 5.348 1
+TTC F 0.316 32.086 6
+TTT F 0.684 69.519 13
+GGA G 0.000 0.000 0
+GGC G 0.200 5.348 1
+GGG G 0.200 5.348 1
+GGT G 0.600 16.043 3
+CAC H 0.667 10.695 2
+CAT H 0.333 5.348 1
+ATA I 0.429 16.043 3
+ATC I 0.143 5.348 1
+ATT I 0.429 16.043 3
+AAA K 0.600 32.086 6
+AAG K 0.400 21.390 4
+CTA L 0.152 26.738 5
+CTC L 0.061 10.695 2
+CTG L 0.152 26.738 5
+CTT L 0.273 48.128 9
+TTA L 0.182 32.086 6
+TTG L 0.182 32.086 6
+ATG M 1.000 16.043 3
+AAC N 0.286 10.695 2
+AAT N 0.714 26.738 5
+CCA P 0.250 5.348 1
+CCC P 0.500 10.695 2
+CCG P 0.250 5.348 1
+CCT P 0.000 0.000 0
+CAA Q 0.333 5.348 1
+CAG Q 0.667 10.695 2
+AGA R 0.143 5.348 1
+AGG R 0.143 5.348 1
+CGA R 0.143 5.348 1
+CGC R 0.000 0.000 0
+CGG R 0.143 5.348 1
+CGT R 0.429 16.043 3
+AGC S 0.136 16.043 3
+AGT S 0.227 26.738 5
+TCA S 0.136 16.043 3
+TCC S 0.227 26.738 5
+TCG S 0.000 0.000 0
+TCT S 0.273 32.086 6
+ACA T 0.400 21.390 4
+ACC T 0.100 5.348 1
+ACG T 0.200 10.695 2
+ACT T 0.300 16.043 3
+GTA V 0.231 16.043 3
+GTC V 0.000 0.000 0
+GTG V 0.000 0.000 0
+GTT V 0.769 53.476 10
+TGG W 1.000 21.390 4
+TAC Y 0.444 21.390 4
+TAT Y 0.556 26.738 5
+TAA * 0.500 26.738 5
+TAG * 0.400 21.390 4
+TGA * 0.100 5.348 1
diff --git a/tools/emboss_5/test-data/emboss_cutseq_out.fasta b/tools/emboss_5/test-data/emboss_cutseq_out.fasta
new file mode 100644
index 00000000000..071f3cfb847
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_cutseq_out.fasta
@@ -0,0 +1,11 @@
+>Sequence 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+ttcgatgcctaaaataccttcttttgtccctacacagaccacagttttcctaatggcttt
+acaccgactagaaattcttgtgcaagcactaattgaaagcggttggcctagagtgttacc
+ggtttgtatagctgagcgcgtctcttgccctgatcaaaggttcattttctctactttgga
+agacgttgtggaagaatacaacaagtacgagtctctcccccctggtttgctgattactgg
+atacagttgtaatacccttcgcaacaccgcgtaactatctatatgaattattttcccttt
+attatatgtagtaggttcgtctttaatcttcctttagcaagtcttttactgttttcgacc
+tcaatgttcatgttcttaggttgttttggataatatgcggtcagtttaatcttcgttgtt
+tcttcttaaaatatttattcatggtttaatttttggtttgtacttgttcaggggccagtt
+cattatttactctgtttgtatacagcagttcttttatttttagtatgattttaatttaaa
+acaattctaatggtcaaaaa
diff --git a/tools/emboss_5/test-data/emboss_dan_out.png b/tools/emboss_5/test-data/emboss_dan_out.png
new file mode 100644
index 00000000000..4a8248cc311
Binary files /dev/null and b/tools/emboss_5/test-data/emboss_dan_out.png differ
diff --git a/tools/emboss_5/test-data/emboss_degapseq_out.fasta b/tools/emboss_5/test-data/emboss_degapseq_out.fasta
new file mode 100644
index 00000000000..ac2f256f675
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_degapseq_out.fasta
@@ -0,0 +1,11 @@
+>Sequence 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+gttcgatgcctaaaataccttcttttgtccctacacagaccacagttttcctaatggctt
+tacaccgactagaaattcttgtgcaagcactaattgaaagcggttggcctagagtgttac
+cggtttgtatagctgagcgcgtctcttgccctgatcaaaggttcattttctctactttgg
+aagacgttgtggaagaatacaacaagtacgagtctctcccccctggtttgctgattactg
+gatacagttgtaatacccttcgcaacaccgcgtaactatctatatgaattattttccctt
+tattatatgtagtaggttcgtctttaatcttcctttagcaagtcttttactgttttcgac
+ctcaatgttcatgttcttaggttgttttggataatatgcggtcagtttaatcttcgttgt
+ttcttcttaaaatatttattcatggtttaatttttggtttgtacttgttcaggggccagt
+tcattatttactctgtttgtatacagcagttcttttatttttagtatgattttaatttaa
+aacaattctaatggtcaaaaa
diff --git a/tools/emboss_5/test-data/emboss_descseq_out.fasta b/tools/emboss_5/test-data/emboss_descseq_out.fasta
new file mode 100644
index 00000000000..3ca0007f359
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_descseq_out.fasta
@@ -0,0 +1,11 @@
+>Sequencetest 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;test
+gttcgatgcctaaaataccttcttttgtccctacacagaccacagttttcctaatggctt
+tacaccgactagaaattcttgtgcaagcactaattgaaagcggttggcctagagtgttac
+cggtttgtatagctgagcgcgtctcttgccctgatcaaaggttcattttctctactttgg
+aagacgttgtggaagaatacaacaagtacgagtctctcccccctggtttgctgattactg
+gatacagttgtaatacccttcgcaacaccgcgtaactatctatatgaattattttccctt
+tattatatgtagtaggttcgtctttaatcttcctttagcaagtcttttactgttttcgac
+ctcaatgttcatgttcttaggttgttttggataatatgcggtcagtttaatcttcgttgt
+ttcttcttaaaatatttattcatggtttaatttttggtttgtacttgttcaggggccagt
+tcattatttactctgtttgtatacagcagttcttttatttttagtatgattttaatttaa
+aacaattctaatggtcaaaaa
diff --git a/tools/emboss_5/test-data/emboss_einverted_out.einverted b/tools/emboss_5/test-data/emboss_einverted_out.einverted
new file mode 100644
index 00000000000..cc15a7364ea
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_einverted_out.einverted
@@ -0,0 +1,20 @@
+
+hg17: Score 97: 63/77 ( 81%) matches, 3 gaps
+ 2684 gtggcaggctcggttcaccaacgtcatttgcagttccccgctttatgttatggg-t--tttgttttgttttgtttttttt 2760
+ |||| |||| | |||||| || |||| |||||||||||||| | ||||| | |||||||||||||||||| |||
+ 3298 caccatccgtacaaagtggacatagcaaacatcaaggggcgaaatgtactacccaaccaaacaaaacaaaacaaaacaaa 3219
+
+hg17: Score 94: 34/36 ( 94%) matches, 0 gaps
+ 7058 gacacacacacacacacacacacacacacacacaca 7093
+ |||||||| ||||||||||| |||||||||||||||
+ 7888 ctgtgtgtatgtgtgtgtgtctgtgtgtgtgtgtgt 7853
+
+hg17: Score 139: 213/305 ( 69%) matches, 11 gaps
+ 8604 ggtggctcatgcctgtaatcccagcattttgggaggccgaggcgggtggatcac--gaggtcaggagtttgagaccagcctggccaagatggtgaagcctcgtctctactaaaaatacaaa-aattagccaggt-gcggtg-gtgggcgcctgtatttccagctacccgggaggctgaggaggctgaggcaggagaatcgcttgaacccgggaggcggaggttgcagtgagccgaggtcacgccactgcactctagcctgggcaacagagcaagactccgtcaaaaaaaaaataaaaaaataaaaaaataaaaaaa 8914
+ ||||||||| |||| ||||||||| ||||||||||| |||| || ||||| | ||| |||||||| |||||||||||| | | | | | || | |||||| ||||||| ||| || | | | || | | |||| || || | | ||| | || |||||| ||| |||| | || ||| ||| ||| | |||| ||||||||| | |||| || ||||||| |||||| | ||| |||||||| || || ||||| |||| ||||| |||| |||
+ 9563 ccaccgagt-cggatattagggtcccgaaaccctccggttccgtcctcctagcgaactcgggtcctcaagttctggtcggacccgctgtgtcgttctggggtagagattttttttatttttatttttatttttatcgactcacaccaccgtttgcgaa-cacca-ggg-tcgatgaaccctccggttccaccctccaaacggactcgggtcctacagctccgacgtcactccatactagtg-tgtcacgtgaggtcggacacactgtgtcgttctggggtag-agaatttttgttttcggttttttctattacttt 9254
+
+hg17: Score 202: 70/72 ( 97%) matches, 0 gaps
+ 18075 tgcattttattctggatggatttgaagcaaagcaccagcttctccaggctctttggggtcagccagggccag 18146
+ ||| |||||||||||||||||||||||||||||| |||||||||||||||||||||||||||||||||||||
+ 18677 acgcaaaataagacctacctaaacttcgtttcgtagtcgaagaggtccgagaaaccccagtcggtcccggtc 18606
diff --git a/tools/emboss_5/test-data/emboss_epestfind_out.epestfind b/tools/emboss_5/test-data/emboss_epestfind_out.epestfind
new file mode 100644
index 00000000000..07e9bb6fa14
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_epestfind_out.epestfind
@@ -0,0 +1,41 @@
+PEST-find: Finds PEST motifs as potential proteolytic cleavage sites.
+
+ No PEST motif was identified in Sequence from 1 to 561.
+
+
+ ---------+---------+---------+---------+---------+---------+
+
+ 1 GTTCGATGCCTAAAATACCTTCTTTTGTCCCTACACAGACCACAGTTTTCCTAATGGCTT 60
+
+
+ 61 TACACCGACTAGAAATTCTTGTGCAAGCACTAATTGAAAGCGGTTGGCCTAGAGTGTTAC 120
+
+
+ 121 CGGTTTGTATAGCTGAGCGCGTCTCTTGCCCTGATCAAAGGTTCATTTTCTCTACTTTGG 180
+
+
+ 181 AAGACGTTGTGGAAGAATACAACAAGTACGAGTCTCTCCCCCCTGGTTTGCTGATTACTG 240
+
+
+ 241 GATACAGTTGTAATACCCTTCGCAACACCGCGTAACTATCTATATGAATTATTTTCCCTT 300
+
+
+ 301 TATTATATGTAGTAGGTTCGTCTTTAATCTTCCTTTAGCAAGTCTTTTACTGTTTTCGAC 360
+
+
+ 361 CTCAATGTTCATGTTCTTAGGTTGTTTTGGATAATATGCGGTCAGTTTAATCTTCGTTGT 420
+
+
+ 421 TTCTTCTTAAAATATTTATTCATGGTTTAATTTTTGGTTTGTACTTGTTCAGGGGCCAGT 480
+
+
+ 481 TCATTATTTACTCTGTTTGTATACAGCAGTTCTTTTATTTTTAGTATGATTTTAATTTAA 540
+
+
+ 541 AACAATTCTAATGGTCAAAAA 561
+
+
+ Symbols PEST motifs
+ +++++++ potential
+ OOOOOOO poor
+
diff --git a/tools/emboss_5/test-data/emboss_equicktandem_out.equicktandem b/tools/emboss_5/test-data/emboss_equicktandem_out.equicktandem
new file mode 100644
index 00000000000..4c0a0203ddc
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_equicktandem_out.equicktandem
@@ -0,0 +1,16 @@
+ 22 8881 8915 1 35
+ 33 7059 7093 2 17
+ 29 7847 7891 2 22
+ 27 3213 3248 5 7
+ 20 9430 9457 6 4
+ 39 19631 19709 36 2
+ 39 19851 19927 36 2
+ 37 20067 20141 36 2
+ 21 19550 19630 60 1
+ 21 19770 19850 60 1
+ 79 19928 20066 60 2
+ 24 8595 8793 133 1
+ 26 2844 3045 134 1
+ 35 10945 11179 136 1
+ 22 15264 15435 138 1
+ 29 11181 11429 168 1
diff --git a/tools/emboss_5/test-data/emboss_est2genome_out.est2genome b/tools/emboss_5/test-data/emboss_est2genome_out.est2genome
new file mode 100644
index 00000000000..cd7181b615b
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_est2genome_out.est2genome
@@ -0,0 +1 @@
+Note Best alignment is between reversed est and forward genome, and splice sites imply forward gene
diff --git a/tools/emboss_5/test-data/emboss_etandem_out.table b/tools/emboss_5/test-data/emboss_etandem_out.table
new file mode 100644
index 00000000000..ab70283e4bb
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_etandem_out.table
@@ -0,0 +1,2 @@
+ 24 7847 7886 10 4 92.5 tgtgtgtgtg
+ 22 7059 7098 10 4 90.0 acacacacac
diff --git a/tools/emboss_5/test-data/emboss_extractseq_out.fasta b/tools/emboss_5/test-data/emboss_extractseq_out.fasta
new file mode 100644
index 00000000000..ac2f256f675
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_extractseq_out.fasta
@@ -0,0 +1,11 @@
+>Sequence 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+gttcgatgcctaaaataccttcttttgtccctacacagaccacagttttcctaatggctt
+tacaccgactagaaattcttgtgcaagcactaattgaaagcggttggcctagagtgttac
+cggtttgtatagctgagcgcgtctcttgccctgatcaaaggttcattttctctactttgg
+aagacgttgtggaagaatacaacaagtacgagtctctcccccctggtttgctgattactg
+gatacagttgtaatacccttcgcaacaccgcgtaactatctatatgaattattttccctt
+tattatatgtagtaggttcgtctttaatcttcctttagcaagtcttttactgttttcgac
+ctcaatgttcatgttcttaggttgttttggataatatgcggtcagtttaatcttcgttgt
+ttcttcttaaaatatttattcatggtttaatttttggtttgtacttgttcaggggccagt
+tcattatttactctgtttgtatacagcagttcttttatttttagtatgattttaatttaa
+aacaattctaatggtcaaaaa
diff --git a/tools/emboss_5/test-data/emboss_freak_out.freak b/tools/emboss_5/test-data/emboss_freak_out.freak
new file mode 100644
index 00000000000..6d6a5f72b1d
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_freak_out.freak
@@ -0,0 +1,534 @@
+FREAK of Sequence from 1 to 561 Window 30 Step 1
+
+1 0.400000
+2 0.400000
+3 0.400000
+4 0.400000
+5 0.400000
+6 0.366667
+7 0.400000
+8 0.400000
+9 0.400000
+10 0.366667
+11 0.366667
+12 0.400000
+13 0.400000
+14 0.433333
+15 0.433333
+16 0.466667
+17 0.466667
+18 0.466667
+19 0.433333
+20 0.400000
+21 0.433333
+22 0.466667
+23 0.433333
+24 0.433333
+25 0.433333
+26 0.433333
+27 0.466667
+28 0.466667
+29 0.500000
+30 0.466667
+31 0.433333
+32 0.400000
+33 0.400000
+34 0.433333
+35 0.400000
+36 0.433333
+37 0.433333
+38 0.466667
+39 0.433333
+40 0.466667
+41 0.433333
+42 0.400000
+43 0.433333
+44 0.400000
+45 0.400000
+46 0.366667
+47 0.366667
+48 0.366667
+49 0.400000
+50 0.400000
+51 0.366667
+52 0.366667
+53 0.366667
+54 0.400000
+55 0.433333
+56 0.433333
+57 0.400000
+58 0.400000
+59 0.400000
+60 0.400000
+61 0.433333
+62 0.433333
+63 0.433333
+64 0.400000
+65 0.400000
+66 0.366667
+67 0.366667
+68 0.333333
+69 0.333333
+70 0.300000
+71 0.333333
+72 0.366667
+73 0.366667
+74 0.400000
+75 0.400000
+76 0.400000
+77 0.433333
+78 0.466667
+79 0.466667
+80 0.500000
+81 0.500000
+82 0.466667
+83 0.500000
+84 0.466667
+85 0.466667
+86 0.466667
+87 0.500000
+88 0.466667
+89 0.433333
+90 0.433333
+91 0.433333
+92 0.466667
+93 0.500000
+94 0.533333
+95 0.533333
+96 0.533333
+97 0.500000
+98 0.533333
+99 0.533333
+100 0.533333
+101 0.500000
+102 0.466667
+103 0.466667
+104 0.466667
+105 0.466667
+106 0.500000
+107 0.466667
+108 0.466667
+109 0.466667
+110 0.466667
+111 0.500000
+112 0.533333
+113 0.500000
+114 0.533333
+115 0.500000
+116 0.533333
+117 0.500000
+118 0.500000
+119 0.533333
+120 0.566667
+121 0.566667
+122 0.566667
+123 0.533333
+124 0.533333
+125 0.533333
+126 0.533333
+127 0.566667
+128 0.533333
+129 0.533333
+130 0.533333
+131 0.566667
+132 0.600000
+133 0.566667
+134 0.533333
+135 0.566667
+136 0.533333
+137 0.533333
+138 0.500000
+139 0.466667
+140 0.433333
+141 0.433333
+142 0.400000
+143 0.433333
+144 0.400000
+145 0.400000
+146 0.400000
+147 0.400000
+148 0.400000
+149 0.366667
+150 0.366667
+151 0.366667
+152 0.333333
+153 0.333333
+154 0.333333
+155 0.333333
+156 0.366667
+157 0.366667
+158 0.366667
+159 0.366667
+160 0.400000
+161 0.366667
+162 0.366667
+163 0.400000
+164 0.400000
+165 0.366667
+166 0.400000
+167 0.400000
+168 0.400000
+169 0.400000
+170 0.400000
+171 0.400000
+172 0.400000
+173 0.366667
+174 0.400000
+175 0.400000
+176 0.366667
+177 0.400000
+178 0.400000
+179 0.400000
+180 0.400000
+181 0.400000
+182 0.400000
+183 0.433333
+184 0.400000
+185 0.433333
+186 0.400000
+187 0.400000
+188 0.400000
+189 0.433333
+190 0.433333
+191 0.466667
+192 0.466667
+193 0.466667
+194 0.500000
+195 0.500000
+196 0.500000
+197 0.533333
+198 0.533333
+199 0.533333
+200 0.533333
+201 0.533333
+202 0.566667
+203 0.566667
+204 0.566667
+205 0.566667
+206 0.566667
+207 0.533333
+208 0.533333
+209 0.566667
+210 0.533333
+211 0.533333
+212 0.566667
+213 0.533333
+214 0.533333
+215 0.500000
+216 0.533333
+217 0.500000
+218 0.533333
+219 0.500000
+220 0.466667
+221 0.466667
+222 0.433333
+223 0.400000
+224 0.366667
+225 0.366667
+226 0.333333
+227 0.333333
+228 0.366667
+229 0.400000
+230 0.400000
+231 0.366667
+232 0.366667
+233 0.400000
+234 0.400000
+235 0.400000
+236 0.400000
+237 0.433333
+238 0.433333
+239 0.433333
+240 0.466667
+241 0.466667
+242 0.466667
+243 0.500000
+244 0.500000
+245 0.500000
+246 0.466667
+247 0.500000
+248 0.466667
+249 0.466667
+250 0.466667
+251 0.466667
+252 0.466667
+253 0.466667
+254 0.466667
+255 0.466667
+256 0.466667
+257 0.466667
+258 0.433333
+259 0.400000
+260 0.400000
+261 0.400000
+262 0.366667
+263 0.333333
+264 0.300000
+265 0.300000
+266 0.300000
+267 0.300000
+268 0.333333
+269 0.333333
+270 0.300000
+271 0.266667
+272 0.233333
+273 0.200000
+274 0.200000
+275 0.200000
+276 0.200000
+277 0.166667
+278 0.166667
+279 0.166667
+280 0.200000
+281 0.166667
+282 0.166667
+283 0.200000
+284 0.200000
+285 0.200000
+286 0.233333
+287 0.233333
+288 0.233333
+289 0.233333
+290 0.266667
+291 0.300000
+292 0.300000
+293 0.333333
+294 0.333333
+295 0.333333
+296 0.333333
+297 0.300000
+298 0.266667
+299 0.233333
+300 0.266667
+301 0.266667
+302 0.266667
+303 0.300000
+304 0.333333
+305 0.333333
+306 0.333333
+307 0.333333
+308 0.333333
+309 0.366667
+310 0.366667
+311 0.366667
+312 0.366667
+313 0.366667
+314 0.366667
+315 0.400000
+316 0.366667
+317 0.333333
+318 0.333333
+319 0.333333
+320 0.300000
+321 0.300000
+322 0.300000
+323 0.300000
+324 0.300000
+325 0.300000
+326 0.300000
+327 0.300000
+328 0.333333
+329 0.366667
+330 0.333333
+331 0.366667
+332 0.400000
+333 0.366667
+334 0.366667
+335 0.366667
+336 0.366667
+337 0.366667
+338 0.400000
+339 0.366667
+340 0.333333
+341 0.366667
+342 0.366667
+343 0.333333
+344 0.366667
+345 0.333333
+346 0.333333
+347 0.366667
+348 0.366667
+349 0.366667
+350 0.366667
+351 0.366667
+352 0.400000
+353 0.366667
+354 0.366667
+355 0.400000
+356 0.400000
+357 0.400000
+358 0.366667
+359 0.333333
+360 0.366667
+361 0.366667
+362 0.333333
+363 0.333333
+364 0.300000
+365 0.300000
+366 0.300000
+367 0.300000
+368 0.266667
+369 0.300000
+370 0.333333
+371 0.333333
+372 0.366667
+373 0.366667
+374 0.366667
+375 0.366667
+376 0.400000
+377 0.366667
+378 0.366667
+379 0.366667
+380 0.366667
+381 0.333333
+382 0.300000
+383 0.333333
+384 0.333333
+385 0.300000
+386 0.333333
+387 0.366667
+388 0.366667
+389 0.366667
+390 0.366667
+391 0.333333
+392 0.333333
+393 0.333333
+394 0.366667
+395 0.366667
+396 0.366667
+397 0.400000
+398 0.400000
+399 0.366667
+400 0.333333
+401 0.300000
+402 0.266667
+403 0.266667
+404 0.233333
+405 0.233333
+406 0.200000
+407 0.200000
+408 0.200000
+409 0.200000
+410 0.200000
+411 0.200000
+412 0.233333
+413 0.200000
+414 0.200000
+415 0.233333
+416 0.233333
+417 0.200000
+418 0.200000
+419 0.200000
+420 0.166667
+421 0.166667
+422 0.166667
+423 0.166667
+424 0.133333
+425 0.133333
+426 0.133333
+427 0.133333
+428 0.166667
+429 0.166667
+430 0.166667
+431 0.166667
+432 0.200000
+433 0.200000
+434 0.200000
+435 0.233333
+436 0.233333
+437 0.233333
+438 0.266667
+439 0.266667
+440 0.266667
+441 0.300000
+442 0.266667
+443 0.300000
+444 0.333333
+445 0.333333
+446 0.333333
+447 0.366667
+448 0.400000
+449 0.400000
+450 0.433333
+451 0.433333
+452 0.433333
+453 0.466667
+454 0.466667
+455 0.466667
+456 0.466667
+457 0.433333
+458 0.400000
+459 0.400000
+460 0.400000
+461 0.400000
+462 0.400000
+463 0.400000
+464 0.433333
+465 0.400000
+466 0.433333
+467 0.433333
+468 0.400000
+469 0.400000
+470 0.433333
+471 0.400000
+472 0.400000
+473 0.366667
+474 0.333333
+475 0.333333
+476 0.300000
+477 0.300000
+478 0.300000
+479 0.300000
+480 0.300000
+481 0.300000
+482 0.300000
+483 0.300000
+484 0.300000
+485 0.300000
+486 0.300000
+487 0.300000
+488 0.300000
+489 0.300000
+490 0.300000
+491 0.300000
+492 0.266667
+493 0.266667
+494 0.233333
+495 0.266667
+496 0.233333
+497 0.233333
+498 0.233333
+499 0.266667
+500 0.233333
+501 0.233333
+502 0.233333
+503 0.233333
+504 0.233333
+505 0.200000
+506 0.200000
+507 0.166667
+508 0.133333
+509 0.133333
+510 0.100000
+511 0.100000
+512 0.100000
+513 0.066667
+514 0.100000
+515 0.100000
+516 0.100000
+517 0.100000
+518 0.100000
+519 0.133333
+520 0.133333
+521 0.133333
+522 0.133333
+523 0.133333
+524 0.166667
+525 0.166667
+526 0.166667
+527 0.200000
+528 0.200000
+529 0.166667
+530 0.166667
+531 0.166667
+532 0.166667
diff --git a/tools/emboss_5/test-data/emboss_fuzznuc_out.tabular b/tools/emboss_5/test-data/emboss_fuzznuc_out.tabular
new file mode 100644
index 00000000000..a79f0c5082f
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_fuzznuc_out.tabular
@@ -0,0 +1,41 @@
+SeqName Start End Score Strand Pattern_name Mismatch
+Sequence 12 13 2 + pattern1 .
+Sequence 13 14 2 + pattern1 .
+Sequence 14 15 2 + pattern1 .
+Sequence 53 54 2 + pattern1 .
+Sequence 73 74 2 + pattern1 .
+Sequence 74 75 2 + pattern1 .
+Sequence 85 86 2 + pattern1 .
+Sequence 92 93 2 + pattern1 .
+Sequence 97 98 2 + pattern1 .
+Sequence 98 99 2 + pattern1 .
+Sequence 157 158 2 + pattern1 .
+Sequence 158 159 2 + pattern1 .
+Sequence 181 182 2 + pattern1 .
+Sequence 193 194 2 + pattern1 .
+Sequence 196 197 2 + pattern1 .
+Sequence 201 202 2 + pattern1 .
+Sequence 204 205 2 + pattern1 .
+Sequence 252 253 2 + pattern1 .
+Sequence 264 265 2 + pattern1 .
+Sequence 274 275 2 + pattern1 .
+Sequence 287 288 2 + pattern1 .
+Sequence 326 327 2 + pattern1 .
+Sequence 340 341 2 + pattern1 .
+Sequence 364 365 2 + pattern1 .
+Sequence 393 394 2 + pattern1 .
+Sequence 409 410 2 + pattern1 .
+Sequence 429 430 2 + pattern1 .
+Sequence 430 431 2 + pattern1 .
+Sequence 431 432 2 + pattern1 .
+Sequence 449 450 2 + pattern1 .
+Sequence 534 535 2 + pattern1 .
+Sequence 539 540 2 + pattern1 .
+Sequence 540 541 2 + pattern1 .
+Sequence 541 542 2 + pattern1 .
+Sequence 544 545 2 + pattern1 .
+Sequence 550 551 2 + pattern1 .
+Sequence 557 558 2 + pattern1 .
+Sequence 558 559 2 + pattern1 .
+Sequence 559 560 2 + pattern1 .
+Sequence 560 561 2 + pattern1 .
diff --git a/tools/emboss_5/test-data/emboss_fuzzpro_out.tabular b/tools/emboss_5/test-data/emboss_fuzzpro_out.tabular
new file mode 100644
index 00000000000..a79f0c5082f
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_fuzzpro_out.tabular
@@ -0,0 +1,41 @@
+SeqName Start End Score Strand Pattern_name Mismatch
+Sequence 12 13 2 + pattern1 .
+Sequence 13 14 2 + pattern1 .
+Sequence 14 15 2 + pattern1 .
+Sequence 53 54 2 + pattern1 .
+Sequence 73 74 2 + pattern1 .
+Sequence 74 75 2 + pattern1 .
+Sequence 85 86 2 + pattern1 .
+Sequence 92 93 2 + pattern1 .
+Sequence 97 98 2 + pattern1 .
+Sequence 98 99 2 + pattern1 .
+Sequence 157 158 2 + pattern1 .
+Sequence 158 159 2 + pattern1 .
+Sequence 181 182 2 + pattern1 .
+Sequence 193 194 2 + pattern1 .
+Sequence 196 197 2 + pattern1 .
+Sequence 201 202 2 + pattern1 .
+Sequence 204 205 2 + pattern1 .
+Sequence 252 253 2 + pattern1 .
+Sequence 264 265 2 + pattern1 .
+Sequence 274 275 2 + pattern1 .
+Sequence 287 288 2 + pattern1 .
+Sequence 326 327 2 + pattern1 .
+Sequence 340 341 2 + pattern1 .
+Sequence 364 365 2 + pattern1 .
+Sequence 393 394 2 + pattern1 .
+Sequence 409 410 2 + pattern1 .
+Sequence 429 430 2 + pattern1 .
+Sequence 430 431 2 + pattern1 .
+Sequence 431 432 2 + pattern1 .
+Sequence 449 450 2 + pattern1 .
+Sequence 534 535 2 + pattern1 .
+Sequence 539 540 2 + pattern1 .
+Sequence 540 541 2 + pattern1 .
+Sequence 541 542 2 + pattern1 .
+Sequence 544 545 2 + pattern1 .
+Sequence 550 551 2 + pattern1 .
+Sequence 557 558 2 + pattern1 .
+Sequence 558 559 2 + pattern1 .
+Sequence 559 560 2 + pattern1 .
+Sequence 560 561 2 + pattern1 .
diff --git a/tools/emboss_5/test-data/emboss_fuzztran_out.tabular b/tools/emboss_5/test-data/emboss_fuzztran_out.tabular
new file mode 100644
index 00000000000..fc54aa49fd9
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_fuzztran_out.tabular
@@ -0,0 +1,133 @@
+SeqName Start End Score Strand Pattern_name Mismatch Frame PStart PEnd Translation
+hg17 3958 3963 2 + pattern1 . 1 1320 1321 AA
+hg17 3961 3966 2 + pattern1 . 1 1321 1322 AA
+hg17 4099 4104 2 + pattern1 . 1 1367 1368 AA
+hg17 4315 4320 2 + pattern1 . 1 1439 1440 AA
+hg17 5194 5199 2 + pattern1 . 1 1732 1733 AA
+hg17 8584 8589 2 + pattern1 . 1 2862 2863 AA
+hg17 9232 9237 2 + pattern1 . 1 3078 3079 AA
+hg17 9343 9348 2 + pattern1 . 1 3115 3116 AA
+hg17 9715 9720 2 + pattern1 . 1 3239 3240 AA
+hg17 9769 9774 2 + pattern1 . 1 3257 3258 AA
+hg17 9841 9846 2 + pattern1 . 1 3281 3282 AA
+hg17 9994 9999 2 + pattern1 . 1 3332 3333 AA
+hg17 10045 10050 2 + pattern1 . 1 3349 3350 AA
+hg17 10048 10053 2 + pattern1 . 1 3350 3351 AA
+hg17 12157 12162 2 + pattern1 . 1 4053 4054 AA
+hg17 12487 12492 2 + pattern1 . 1 4163 4164 AA
+hg17 12688 12693 2 + pattern1 . 1 4230 4231 AA
+hg17 12691 12696 2 + pattern1 . 1 4231 4232 AA
+hg17 15010 15015 2 + pattern1 . 1 5004 5005 AA
+hg17 17521 17526 2 + pattern1 . 1 5841 5842 AA
+hg17 17551 17556 2 + pattern1 . 1 5851 5852 AA
+hg17 1148 1153 2 + pattern1 . 2 383 384 AA
+hg17 2078 2083 2 + pattern1 . 2 693 694 AA
+hg17 2432 2437 2 + pattern1 . 2 811 812 AA
+hg17 3080 3085 2 + pattern1 . 2 1027 1028 AA
+hg17 3593 3598 2 + pattern1 . 2 1198 1199 AA
+hg17 3692 3697 2 + pattern1 . 2 1231 1232 AA
+hg17 4055 4060 2 + pattern1 . 2 1352 1353 AA
+hg17 5018 5023 2 + pattern1 . 2 1673 1674 AA
+hg17 5147 5152 2 + pattern1 . 2 1716 1717 AA
+hg17 8276 8281 2 + pattern1 . 2 2759 2760 AA
+hg17 9587 9592 2 + pattern1 . 2 3196 3197 AA
+hg17 9668 9673 2 + pattern1 . 2 3223 3224 AA
+hg17 9920 9925 2 + pattern1 . 2 3307 3308 AA
+hg17 9971 9976 2 + pattern1 . 2 3324 3325 AA
+hg17 10112 10117 2 + pattern1 . 2 3371 3372 AA
+hg17 10115 10120 2 + pattern1 . 2 3372 3373 AA
+hg17 11837 11842 2 + pattern1 . 2 3946 3947 AA
+hg17 12026 12031 2 + pattern1 . 2 4009 4010 AA
+hg17 12944 12949 2 + pattern1 . 2 4315 4316 AA
+hg17 12953 12958 2 + pattern1 . 2 4318 4319 AA
+hg17 13229 13234 2 + pattern1 . 2 4410 4411 AA
+hg17 13232 13237 2 + pattern1 . 2 4411 4412 AA
+hg17 15356 15361 2 + pattern1 . 2 5119 5120 AA
+hg17 15482 15487 2 + pattern1 . 2 5161 5162 AA
+hg17 16061 16066 2 + pattern1 . 2 5354 5355 AA
+hg17 17822 17827 2 + pattern1 . 2 5941 5942 AA
+hg17 15 20 2 + pattern1 . 3 5 6 AA
+hg17 33 38 2 + pattern1 . 3 11 12 AA
+hg17 3669 3674 2 + pattern1 . 3 1223 1224 AA
+hg17 3759 3764 2 + pattern1 . 3 1253 1254 AA
+hg17 5646 5651 2 + pattern1 . 3 1882 1883 AA
+hg17 5847 5852 2 + pattern1 . 3 1949 1950 AA
+hg17 5850 5855 2 + pattern1 . 3 1950 1951 AA
+hg17 5853 5858 2 + pattern1 . 3 1951 1952 AA
+hg17 7674 7679 2 + pattern1 . 3 2558 2559 AA
+hg17 9699 9704 2 + pattern1 . 3 3233 3234 AA
+hg17 9891 9896 2 + pattern1 . 3 3297 3298 AA
+hg17 10074 10079 2 + pattern1 . 3 3358 3359 AA
+hg17 10407 10412 2 + pattern1 . 3 3469 3470 AA
+hg17 12675 12680 2 + pattern1 . 3 4225 4226 AA
+hg17 13746 13751 2 + pattern1 . 3 4582 4583 AA
+hg17 17115 17120 2 + pattern1 . 3 5705 5706 AA
+hg17 17421 17426 2 + pattern1 . 3 5807 5808 AA
+hg17 19122 19127 2 + pattern1 . 3 6374 6375 AA
+hg17 19353 19358 2 + pattern1 . 3 6451 6452 AA
+hg17 -2312 -2317 2 - pattern1 . 1 772 773 AA
+hg17 -4073 -4078 2 - pattern1 . 1 1359 1360 AA
+hg17 -4652 -4657 2 - pattern1 . 1 1552 1553 AA
+hg17 -4778 -4783 2 - pattern1 . 1 1594 1595 AA
+hg17 -6902 -6907 2 - pattern1 . 1 2302 2303 AA
+hg17 -6905 -6910 2 - pattern1 . 1 2303 2304 AA
+hg17 -7181 -7186 2 - pattern1 . 1 2395 2396 AA
+hg17 -7190 -7195 2 - pattern1 . 1 2398 2399 AA
+hg17 -8108 -8113 2 - pattern1 . 1 2704 2705 AA
+hg17 -8297 -8302 2 - pattern1 . 1 2767 2768 AA
+hg17 -10019 -10024 2 - pattern1 . 1 3341 3342 AA
+hg17 -10022 -10027 2 - pattern1 . 1 3342 3343 AA
+hg17 -10163 -10168 2 - pattern1 . 1 3389 3390 AA
+hg17 -10214 -10219 2 - pattern1 . 1 3406 3407 AA
+hg17 -10466 -10471 2 - pattern1 . 1 3490 3491 AA
+hg17 -10547 -10552 2 - pattern1 . 1 3517 3518 AA
+hg17 -11858 -11863 2 - pattern1 . 1 3954 3955 AA
+hg17 -14987 -14992 2 - pattern1 . 1 4997 4998 AA
+hg17 -15116 -15121 2 - pattern1 . 1 5040 5041 AA
+hg17 -16079 -16084 2 - pattern1 . 1 5361 5362 AA
+hg17 -16442 -16447 2 - pattern1 . 1 5482 5483 AA
+hg17 -16541 -16546 2 - pattern1 . 1 5515 5516 AA
+hg17 -17054 -17059 2 - pattern1 . 1 5686 5687 AA
+hg17 -17702 -17707 2 - pattern1 . 1 5902 5903 AA
+hg17 -18056 -18061 2 - pattern1 . 1 6020 6021 AA
+hg17 -18986 -18991 2 - pattern1 . 1 6330 6331 AA
+hg17 -783 -788 2 - pattern1 . 2 262 263 AA
+hg17 -1014 -1019 2 - pattern1 . 2 339 340 AA
+hg17 -2715 -2720 2 - pattern1 . 2 906 907 AA
+hg17 -3021 -3026 2 - pattern1 . 2 1008 1009 AA
+hg17 -6390 -6395 2 - pattern1 . 2 2131 2132 AA
+hg17 -7461 -7466 2 - pattern1 . 2 2488 2489 AA
+hg17 -9729 -9734 2 - pattern1 . 2 3244 3245 AA
+hg17 -10062 -10067 2 - pattern1 . 2 3355 3356 AA
+hg17 -10245 -10250 2 - pattern1 . 2 3416 3417 AA
+hg17 -10437 -10442 2 - pattern1 . 2 3480 3481 AA
+hg17 -12462 -12467 2 - pattern1 . 2 4155 4156 AA
+hg17 -14283 -14288 2 - pattern1 . 2 4762 4763 AA
+hg17 -14286 -14291 2 - pattern1 . 2 4763 4764 AA
+hg17 -14289 -14294 2 - pattern1 . 2 4764 4765 AA
+hg17 -14490 -14495 2 - pattern1 . 2 4831 4832 AA
+hg17 -16377 -16382 2 - pattern1 . 2 5460 5461 AA
+hg17 -16467 -16472 2 - pattern1 . 2 5490 5491 AA
+hg17 -20103 -20108 2 - pattern1 . 2 6702 6703 AA
+hg17 -20121 -20126 2 - pattern1 . 2 6708 6709 AA
+hg17 17553 17548 2 - pattern1 . 3 863 864 AA
+hg17 17523 17518 2 - pattern1 . 3 873 874 AA
+hg17 15012 15007 2 - pattern1 . 3 1710 1711 AA
+hg17 12693 12688 2 - pattern1 . 3 2483 2484 AA
+hg17 12690 12685 2 - pattern1 . 3 2484 2485 AA
+hg17 12489 12484 2 - pattern1 . 3 2551 2552 AA
+hg17 12159 12154 2 - pattern1 . 3 2661 2662 AA
+hg17 10050 10045 2 - pattern1 . 3 3364 3365 AA
+hg17 10047 10042 2 - pattern1 . 3 3365 3366 AA
+hg17 9996 9991 2 - pattern1 . 3 3382 3383 AA
+hg17 9843 9838 2 - pattern1 . 3 3433 3434 AA
+hg17 9771 9766 2 - pattern1 . 3 3457 3458 AA
+hg17 9717 9712 2 - pattern1 . 3 3475 3476 AA
+hg17 9345 9340 2 - pattern1 . 3 3599 3600 AA
+hg17 9234 9229 2 - pattern1 . 3 3636 3637 AA
+hg17 8586 8581 2 - pattern1 . 3 3852 3853 AA
+hg17 5196 5191 2 - pattern1 . 3 4982 4983 AA
+hg17 4317 4312 2 - pattern1 . 3 5275 5276 AA
+hg17 4101 4096 2 - pattern1 . 3 5347 5348 AA
+hg17 3963 3958 2 - pattern1 . 3 5393 5394 AA
+hg17 3960 3955 2 - pattern1 . 3 5394 5395 AA
diff --git a/tools/emboss_5/test-data/emboss_garnier_out.tabular b/tools/emboss_5/test-data/emboss_garnier_out.tabular
new file mode 100644
index 00000000000..6c4ffb9b59f
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_garnier_out.tabular
@@ -0,0 +1,102 @@
+SeqName Start End Score Strand helix sheet turns coil
+Sequence 1 9 0.000 + . . T .
+Sequence 10 10 0.000 + . E . .
+Sequence 11 16 0.000 + H . . .
+Sequence 17 39 0.000 + . . T .
+Sequence 40 40 0.000 + H . . .
+Sequence 41 42 0.000 + . E . .
+Sequence 43 48 0.000 + . . T .
+Sequence 49 52 0.000 + . E . .
+Sequence 53 68 0.000 + . . T .
+Sequence 69 75 0.000 + H . . .
+Sequence 76 78 0.000 + . E . .
+Sequence 79 87 0.000 + . . T .
+Sequence 88 90 0.000 + . E . .
+Sequence 91 96 0.000 + H . . .
+Sequence 97 98 0.000 + . E . .
+Sequence 99 99 0.000 + . . . C
+Sequence 100 107 0.000 + . . T .
+Sequence 108 111 0.000 + . E . .
+Sequence 112 116 0.000 + . . T .
+Sequence 117 120 0.000 + . E . .
+Sequence 121 123 0.000 + . . T .
+Sequence 124 126 0.000 + . . . C
+Sequence 127 131 0.000 + . E . .
+Sequence 132 153 0.000 + . . T .
+Sequence 154 157 0.000 + . E . .
+Sequence 158 161 0.000 + . . T .
+Sequence 162 162 0.000 + . . . C
+Sequence 163 164 0.000 + . E . .
+Sequence 165 172 0.000 + . . T .
+Sequence 173 176 0.000 + . E . .
+Sequence 177 180 0.000 + . . T .
+Sequence 181 183 0.000 + . . . C
+Sequence 184 187 0.000 + . E . .
+Sequence 188 194 0.000 + . . . C
+Sequence 195 206 0.000 + H . . .
+Sequence 207 234 0.000 + . . T .
+Sequence 235 237 0.000 + . E . .
+Sequence 238 241 0.000 + . . T .
+Sequence 242 242 0.000 + . . . C
+Sequence 243 246 0.000 + . E . .
+Sequence 247 247 0.000 + . . T .
+Sequence 248 249 0.000 + . . . C
+Sequence 250 275 0.000 + . . T .
+Sequence 276 282 0.000 + . E . .
+Sequence 283 283 0.000 + H . . .
+Sequence 284 289 0.000 + . . . C
+Sequence 290 301 0.000 + . . T .
+Sequence 302 307 0.000 + . E . .
+Sequence 308 313 0.000 + . . . C
+Sequence 314 321 0.000 + . . T .
+Sequence 322 322 0.000 + . E . .
+Sequence 323 344 0.000 + . . T .
+Sequence 345 348 0.000 + . E . .
+Sequence 349 360 0.000 + . . T .
+Sequence 361 363 0.000 + . E . .
+Sequence 364 374 0.000 + . . T .
+Sequence 375 378 0.000 + . E . .
+Sequence 379 381 0.000 + . . T .
+Sequence 382 384 0.000 + . . . C
+Sequence 385 386 0.000 + . E . .
+Sequence 387 392 0.000 + . . . C
+Sequence 393 396 0.000 + . E . .
+Sequence 397 401 0.000 + . . T .
+Sequence 402 402 0.000 + . . . C
+Sequence 403 403 0.000 + . E . .
+Sequence 404 406 0.000 + . . T .
+Sequence 407 407 0.000 + . . . C
+Sequence 408 409 0.000 + . . T .
+Sequence 410 412 0.000 + . E . .
+Sequence 413 422 0.000 + . . T .
+Sequence 423 427 0.000 + . E . .
+Sequence 428 436 0.000 + H . . .
+Sequence 437 441 0.000 + . E . .
+Sequence 442 444 0.000 + . . T .
+Sequence 445 447 0.000 + . . . C
+Sequence 448 452 0.000 + . E . .
+Sequence 453 455 0.000 + . . . C
+Sequence 456 457 0.000 + . . T .
+Sequence 458 460 0.000 + . . . C
+Sequence 461 463 0.000 + . E . .
+Sequence 464 467 0.000 + . . T .
+Sequence 468 469 0.000 + . E . .
+Sequence 470 480 0.000 + . . T .
+Sequence 481 484 0.000 + . E . .
+Sequence 485 490 0.000 + . . T .
+Sequence 491 491 0.000 + . E . .
+Sequence 492 496 0.000 + . . T .
+Sequence 497 497 0.000 + . . . C
+Sequence 498 500 0.000 + . . T .
+Sequence 501 504 0.000 + . E . .
+Sequence 505 510 0.000 + . . T .
+Sequence 511 514 0.000 + . E . .
+Sequence 515 517 0.000 + . . . C
+Sequence 518 520 0.000 + . E . .
+Sequence 521 532 0.000 + . . . C
+Sequence 533 534 0.000 + . E . .
+Sequence 535 547 0.000 + H . . .
+Sequence 548 549 0.000 + . E . .
+Sequence 550 554 0.000 + . . T .
+Sequence 555 555 0.000 + . . . C
+Sequence 556 561 0.000 + H . . .
diff --git a/tools/emboss_5/test-data/emboss_geecee_out.geecee b/tools/emboss_5/test-data/emboss_geecee_out.geecee
new file mode 100644
index 00000000000..47685ffedbb
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_geecee_out.geecee
@@ -0,0 +1,2 @@
+#Sequence GC content
+Sequence 0.36
diff --git a/tools/emboss_5/test-data/emboss_getorf_out.fasta b/tools/emboss_5/test-data/emboss_getorf_out.fasta
new file mode 100644
index 00000000000..13fba1bde65
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_getorf_out.fasta
@@ -0,0 +1,65 @@
+>Sequence_1 [1 - 51] 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+VRCLKYLLLSLHRPQFS
+>Sequence_2 [14 - 94] 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+NTFFCPYTDHSFPNGFTPTRNSCASTN
+>Sequence_3 [94 - 129] 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+LKAVGLECYRFV
+>Sequence_4 [133 - 231] 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+LSASLALIKGSFSLLWKTLWKNTTSTSLSPLVC
+>Sequence_5 [155 - 250] 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+SKVHFLYFGRRCGRIQQVRVSPPWFADYWIQL
+>Sequence_6 [3 - 272] 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+SMPKIPSFVPTQTTVFLMALHRLEILVQALIESGWPRVLPVCIAERVSCPDQRFIFSTLE
+DVVEEYNKYESLPPGLLITGYSCNTLRNTA
+>Sequence_7 [235 - 309] 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+LLDTVVIPFATPRNYLYELFSLYYM
+>Sequence_8 [288 - 335] 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+IIFPLLYVVGSSLIFL
+>Sequence_9 [339 - 377] 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+QVFYCFRPQCSCS
+>Sequence_10 [254 - 391] 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+YPSQHRVTIYMNYFPFIICSRFVFNLPLASLLLFSTSMFMFLGCFG
+>Sequence_11 [395 - 427] 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+YAVSLIFVVSS
+>Sequence_12 [328 - 447] 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+SSFSKSFTVFDLNVHVLRLFWIICGQFNLRCFFLKYLFMV
+>Sequence_13 [411 - 521] 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+SSLFLLKIFIHGLIFGLYLFRGQFIIYSVCIQQFFYF
+>Sequence_14 [431 - 526] 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+NIYSWFNFWFVLVQGPVHYLLCLYTAVLLFLV
+>Sequence_15 [451 - 537] 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+FLVCTCSGASSLFTLFVYSSSFIFSMILI
+>Sequence_16 [531 - 487] (REVERSE SENSE) 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+NHTKNKRTAVYKQSK
+>Sequence_17 [536 - 450] (REVERSE SENSE) 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+IKIILKIKELLYTNRVNNELAPEQVQTKN
+>Sequence_18 [487 - 443] (REVERSE SENSE) 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+IMNWPLNKYKPKIKP
+>Sequence_19 [468 - 439] (REVERSE SENSE) 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+TSTNQKLNHE
+>Sequence_20 [439 - 410] (REVERSE SENSE) 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+INILRRNNED
+>Sequence_21 [446 - 405] (REVERSE SENSE) 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+TMNKYFKKKQRRLN
+>Sequence_22 [401 - 372] (REVERSE SENSE) 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+PHIIQNNLRT
+>Sequence_23 [368 - 327] (REVERSE SENSE) 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+TLRSKTVKDLLKED
+>Sequence_24 [426 - 292] (REVERSE SENSE) 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+EETTKIKLTAYYPKQPKNMNIEVENSKRLAKGRLKTNLLHIIKGK
+>Sequence_25 [279 - 238] (REVERSE SENSE) 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+IVTRCCEGYYNCIQ
+>Sequence_26 [234 - 175] (REVERSE SENSE) 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+SANQGGETRTCCILPQRLPK
+>Sequence_27 [334 - 158] (REVERSE SENSE) 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+RKIKDEPTTYNKGKIIHIDSYAVLRRVLQLYPVISKPGGRDSYLLYSSTTSSKVEKMNL
+>Sequence_28 [275 - 120] (REVERSE SENSE) 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+LRGVAKGITTVSSNQQTRGERLVLVVFFHNVFQSRENEPLIRARDALSYTNR
+>Sequence_29 [162 - 112] (REVERSE SENSE) 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+TFDQGKRRAQLYKPVTL
+>Sequence_30 [108 - 34] (REVERSE SENSE) 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+ANRFQLVLAQEFLVGVKPLGKLWSV
+>Sequence_31 [50 - 3] (REVERSE SENSE) 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+ENCGLCRDKRRYFRHR
+>Sequence_32 [154 - 2] (REVERSE SENSE) 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+SGQETRSAIQTGNTLGQPLSISACTRISSRCKAIRKTVVCVGTKEGILGIE
diff --git a/tools/emboss_5/test-data/emboss_helixturnhelix_out.tabular b/tools/emboss_5/test-data/emboss_helixturnhelix_out.tabular
new file mode 100644
index 00000000000..de42371b131
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_helixturnhelix_out.tabular
@@ -0,0 +1 @@
+SeqName Start End Score Strand Maximum_score_at Standard_deviations
diff --git a/tools/emboss_5/test-data/emboss_hmoment_out.hmoment b/tools/emboss_5/test-data/emboss_hmoment_out.hmoment
new file mode 100644
index 00000000000..61c31db8c3d
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_hmoment_out.hmoment
@@ -0,0 +1,556 @@
+HMOMENT of Sequence from 1 to 561
+
+Window: 10 Angle: 100 Max uH: 0.205
+Position uH
+1 0.100
+2 0.071
+3 0.127
+4 0.152
+5 0.127
+6 0.056
+7 0.049
+8 0.032
+9 0.066
+10 0.041
+11 0.019
+12 0.020
+13 0.081
+14 0.125
+15 0.092
+16 0.044
+17 0.040
+18 0.051
+19 0.063
+20 0.038
+21 0.063
+22 0.052
+23 0.065
+24 0.086
+25 0.106
+26 0.073
+27 0.048
+28 0.088
+29 0.082
+30 0.044
+31 0.007
+32 0.035
+33 0.041
+34 0.094
+35 0.035
+36 0.045
+37 0.073
+38 0.069
+39 0.024
+40 0.055
+41 0.040
+42 0.007
+43 0.066
+44 0.009
+45 0.071
+46 0.111
+47 0.095
+48 0.144
+49 0.138
+50 0.143
+51 0.113
+52 0.120
+53 0.078
+54 0.051
+55 0.042
+56 0.035
+57 0.055
+58 0.027
+59 0.037
+60 0.029
+61 0.032
+62 0.077
+63 0.148
+64 0.108
+65 0.035
+66 0.098
+67 0.128
+68 0.118
+69 0.083
+70 0.108
+71 0.112
+72 0.076
+73 0.116
+74 0.102
+75 0.043
+76 0.090
+77 0.073
+78 0.025
+79 0.031
+80 0.058
+81 0.043
+82 0.066
+83 0.075
+84 0.146
+85 0.173
+86 0.140
+87 0.142
+88 0.200
+89 0.154
+90 0.089
+91 0.140
+92 0.121
+93 0.063
+94 0.055
+95 0.051
+96 0.057
+97 0.075
+98 0.136
+99 0.132
+100 0.068
+101 0.067
+102 0.076
+103 0.055
+104 0.019
+105 0.043
+106 0.041
+107 0.022
+108 0.064
+109 0.060
+110 0.085
+111 0.090
+112 0.111
+113 0.049
+114 0.083
+115 0.131
+116 0.137
+117 0.099
+118 0.119
+119 0.120
+120 0.054
+121 0.064
+122 0.059
+123 0.042
+124 0.026
+125 0.032
+126 0.078
+127 0.104
+128 0.117
+129 0.096
+130 0.116
+131 0.108
+132 0.084
+133 0.056
+134 0.063
+135 0.058
+136 0.050
+137 0.048
+138 0.025
+139 0.047
+140 0.093
+141 0.072
+142 0.027
+143 0.021
+144 0.053
+145 0.022
+146 0.049
+147 0.040
+148 0.103
+149 0.154
+150 0.105
+151 0.076
+152 0.127
+153 0.126
+154 0.105
+155 0.088
+156 0.107
+157 0.131
+158 0.095
+159 0.052
+160 0.114
+161 0.088
+162 0.041
+163 0.071
+164 0.067
+165 0.008
+166 0.056
+167 0.060
+168 0.064
+169 0.059
+170 0.055
+171 0.046
+172 0.030
+173 0.092
+174 0.062
+175 0.036
+176 0.019
+177 0.038
+178 0.032
+179 0.037
+180 0.051
+181 0.100
+182 0.051
+183 0.036
+184 0.088
+185 0.090
+186 0.039
+187 0.080
+188 0.076
+189 0.079
+190 0.061
+191 0.074
+192 0.090
+193 0.042
+194 0.024
+195 0.063
+196 0.065
+197 0.050
+198 0.061
+199 0.077
+200 0.136
+201 0.116
+202 0.037
+203 0.092
+204 0.120
+205 0.066
+206 0.026
+207 0.070
+208 0.075
+209 0.041
+210 0.075
+211 0.082
+212 0.034
+213 0.031
+214 0.023
+215 0.048
+216 0.047
+217 0.098
+218 0.098
+219 0.083
+220 0.059
+221 0.103
+222 0.099
+223 0.085
+224 0.110
+225 0.127
+226 0.163
+227 0.132
+228 0.190
+229 0.194
+230 0.197
+231 0.154
+232 0.205
+233 0.171
+234 0.166
+235 0.148
+236 0.161
+237 0.106
+238 0.035
+239 0.026
+240 0.026
+241 0.038
+242 0.084
+243 0.016
+244 0.060
+245 0.121
+246 0.061
+247 0.028
+248 0.076
+249 0.046
+250 0.050
+251 0.072
+252 0.042
+253 0.033
+254 0.083
+255 0.031
+256 0.093
+257 0.106
+258 0.042
+259 0.055
+260 0.053
+261 0.008
+262 0.030
+263 0.062
+264 0.078
+265 0.037
+266 0.114
+267 0.108
+268 0.078
+269 0.107
+270 0.134
+271 0.117
+272 0.091
+273 0.150
+274 0.147
+275 0.071
+276 0.025
+277 0.064
+278 0.022
+279 0.069
+280 0.072
+281 0.044
+282 0.107
+283 0.170
+284 0.176
+285 0.116
+286 0.110
+287 0.128
+288 0.078
+289 0.059
+290 0.055
+291 0.061
+292 0.020
+293 0.051
+294 0.048
+295 0.055
+296 0.112
+297 0.139
+298 0.083
+299 0.055
+300 0.105
+301 0.100
+302 0.049
+303 0.087
+304 0.086
+305 0.069
+306 0.131
+307 0.096
+308 0.090
+309 0.095
+310 0.134
+311 0.102
+312 0.098
+313 0.062
+314 0.055
+315 0.111
+316 0.098
+317 0.106
+318 0.131
+319 0.132
+320 0.098
+321 0.097
+322 0.096
+323 0.059
+324 0.089
+325 0.083
+326 0.088
+327 0.025
+328 0.103
+329 0.065
+330 0.028
+331 0.086
+332 0.109
+333 0.100
+334 0.094
+335 0.116
+336 0.109
+337 0.111
+338 0.063
+339 0.043
+340 0.074
+341 0.099
+342 0.090
+343 0.073
+344 0.067
+345 0.086
+346 0.092
+347 0.089
+348 0.092
+349 0.044
+350 0.045
+351 0.066
+352 0.039
+353 0.019
+354 0.013
+355 0.059
+356 0.069
+357 0.070
+358 0.045
+359 0.079
+360 0.117
+361 0.081
+362 0.138
+363 0.135
+364 0.083
+365 0.034
+366 0.096
+367 0.071
+368 0.034
+369 0.029
+370 0.038
+371 0.083
+372 0.105
+373 0.112
+374 0.070
+375 0.096
+376 0.096
+377 0.079
+378 0.078
+379 0.072
+380 0.088
+381 0.036
+382 0.059
+383 0.056
+384 0.043
+385 0.114
+386 0.114
+387 0.107
+388 0.101
+389 0.089
+390 0.079
+391 0.029
+392 0.098
+393 0.100
+394 0.036
+395 0.106
+396 0.075
+397 0.085
+398 0.090
+399 0.091
+400 0.096
+401 0.048
+402 0.032
+403 0.049
+404 0.070
+405 0.110
+406 0.059
+407 0.107
+408 0.102
+409 0.106
+410 0.081
+411 0.138
+412 0.143
+413 0.112
+414 0.138
+415 0.136
+416 0.127
+417 0.113
+418 0.107
+419 0.111
+420 0.092
+421 0.134
+422 0.098
+423 0.055
+424 0.044
+425 0.055
+426 0.056
+427 0.040
+428 0.041
+429 0.095
+430 0.158
+431 0.153
+432 0.106
+433 0.186
+434 0.187
+435 0.118
+436 0.167
+437 0.162
+438 0.168
+439 0.108
+440 0.155
+441 0.121
+442 0.121
+443 0.059
+444 0.053
+445 0.098
+446 0.087
+447 0.119
+448 0.149
+449 0.149
+450 0.113
+451 0.069
+452 0.083
+453 0.084
+454 0.095
+455 0.119
+456 0.117
+457 0.100
+458 0.102
+459 0.096
+460 0.100
+461 0.116
+462 0.187
+463 0.150
+464 0.080
+465 0.106
+466 0.115
+467 0.085
+468 0.036
+469 0.098
+470 0.095
+471 0.112
+472 0.061
+473 0.077
+474 0.119
+475 0.141
+476 0.099
+477 0.154
+478 0.184
+479 0.185
+480 0.136
+481 0.194
+482 0.178
+483 0.177
+484 0.138
+485 0.132
+486 0.087
+487 0.055
+488 0.057
+489 0.051
+490 0.037
+491 0.087
+492 0.035
+493 0.031
+494 0.080
+495 0.053
+496 0.023
+497 0.045
+498 0.033
+499 0.030
+500 0.087
+501 0.089
+502 0.035
+503 0.064
+504 0.125
+505 0.132
+506 0.069
+507 0.085
+508 0.072
+509 0.088
+510 0.050
+511 0.049
+512 0.043
+513 0.064
+514 0.071
+515 0.111
+516 0.109
+517 0.082
+518 0.089
+519 0.054
+520 0.038
+521 0.032
+522 0.032
+523 0.038
+524 0.054
+525 0.059
+526 0.015
+527 0.068
+528 0.073
+529 0.026
+530 0.106
+531 0.055
+532 0.047
+533 0.103
+534 0.091
+535 0.049
+536 0.031
+537 0.032
+538 0.038
+539 0.068
+540 0.130
+541 0.077
+542 0.043
+543 0.104
+544 0.058
+545 0.045
+546 0.108
+547 0.084
+548 0.139
+549 0.189
+550 0.130
+551 0.062
+552 0.136
diff --git a/tools/emboss_5/test-data/emboss_iep_out.iep b/tools/emboss_5/test-data/emboss_iep_out.iep
new file mode 100644
index 00000000000..839b0dba134
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_iep_out.iep
@@ -0,0 +1,31 @@
+IEP of Sequence from 1 to 561
+Isoelectric Point = 5.0278
+
+ pH Bound Charge
+ 1.00 108.00 1.00
+ 1.50 107.99 0.99
+ 2.00 107.98 0.98
+ 2.50 107.93 0.93
+ 3.00 107.80 0.80
+ 3.50 107.56 0.56
+ 4.00 107.28 0.28
+ 4.50 107.10 0.10
+ 5.00 107.00 0.00
+ 5.50 106.91 -0.09
+ 6.00 106.67 -0.33
+ 6.50 105.94 -1.06
+ 7.00 103.73 -3.27
+ 7.50 97.29 -9.71
+ 8.00 81.33 -25.67
+ 8.50 53.56 -53.44
+ 9.00 25.75 -81.25
+ 9.50 9.75 -97.25
+ 10.00 3.29 -103.71
+ 10.50 1.06 -105.94
+ 11.00 0.34 -106.66
+ 11.50 0.11 -106.89
+ 12.00 0.03 -106.97
+ 12.50 0.01 -106.99
+ 13.00 0.00 -107.00
+ 13.50 0.00 -107.00
+ 14.00 0.00 -107.00
diff --git a/tools/emboss_5/test-data/emboss_isochore_out.isochore b/tools/emboss_5/test-data/emboss_isochore_out.isochore
new file mode 100644
index 00000000000..e12e4bae915
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_isochore_out.isochore
@@ -0,0 +1,7 @@
+Position Percent G+C 1 .. 561
+140 0.446
+196 0.414
+252 0.396
+308 0.357
+364 0.332
+420 0.282
diff --git a/tools/emboss_5/test-data/emboss_marscan_out.tabular b/tools/emboss_5/test-data/emboss_marscan_out.tabular
new file mode 100644
index 00000000000..6286b3c974d
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_marscan_out.tabular
@@ -0,0 +1,4 @@
+SeqName Start End Score Strand type start8bp end8bp start16bp end16bp
+hg17 440 492 0.000 + MAR/SAR recognition site (MRS) 440 447 477 492
+hg17 13640 13750 0.000 + MAR/SAR recognition site (MRS) 13640 13647 13735 13750
+hg17 15229 15392 0.000 + MAR/SAR recognition site (MRS) 15385 15392 15229 15244
diff --git a/tools/emboss_5/test-data/emboss_maskfeat_out.fasta b/tools/emboss_5/test-data/emboss_maskfeat_out.fasta
new file mode 100644
index 00000000000..ac2f256f675
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_maskfeat_out.fasta
@@ -0,0 +1,11 @@
+>Sequence 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+gttcgatgcctaaaataccttcttttgtccctacacagaccacagttttcctaatggctt
+tacaccgactagaaattcttgtgcaagcactaattgaaagcggttggcctagagtgttac
+cggtttgtatagctgagcgcgtctcttgccctgatcaaaggttcattttctctactttgg
+aagacgttgtggaagaatacaacaagtacgagtctctcccccctggtttgctgattactg
+gatacagttgtaatacccttcgcaacaccgcgtaactatctatatgaattattttccctt
+tattatatgtagtaggttcgtctttaatcttcctttagcaagtcttttactgttttcgac
+ctcaatgttcatgttcttaggttgttttggataatatgcggtcagtttaatcttcgttgt
+ttcttcttaaaatatttattcatggtttaatttttggtttgtacttgttcaggggccagt
+tcattatttactctgtttgtatacagcagttcttttatttttagtatgattttaatttaa
+aacaattctaatggtcaaaaa
diff --git a/tools/emboss_5/test-data/emboss_maskseq_out.fasta b/tools/emboss_5/test-data/emboss_maskseq_out.fasta
new file mode 100644
index 00000000000..24722f3054f
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_maskseq_out.fasta
@@ -0,0 +1,11 @@
+>Sequence 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+NNNcgatgcctaaaataccttcttttgtccctacacagaccacagttttcctaatggctt
+tacaccgactagaaattcttgtgcaagcactaattgaaagcggttggcctagagtgttac
+cggtttgtatagctgagcgcgtctcttgccctgatcaaaggttcattttctctactttgg
+aagacgttgtggaagaatacaacaagtacgagtctctcccccctggtttgctgattactg
+gatacagttgtaatacccttcgcaacaccgcgtaactatctatatgaattattttccctt
+tattatatgtagtaggttcgtctttaatcttcctttagcaagtcttttactgttttcgac
+ctcaatgttcatgttcttaggttgttttggataatatgcggtcagtttaatcttcgttgt
+ttcttcttaaaatatttattcatggtttaatttttggtttgtacttgttcaggggccagt
+tcattatttactctgtttgtatacagcagttcttttatttttagtatgattttaatttaa
+aacaattctaatggtcaaaaa
diff --git a/tools/emboss_5/test-data/emboss_matcher_out.fasta b/tools/emboss_5/test-data/emboss_matcher_out.fasta
new file mode 100644
index 00000000000..57392f7fed0
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_matcher_out.fasta
@@ -0,0 +1,6 @@
+>Sequence
+CTTTAGCAAGTCTTTTACTGTTTTCGACCTCAATGTTCATGTTCTTAGGTTGTTTTGGAT
+A
+>hg17
+CTTCAGCAAGTTCCTTACTGTCTTTAAGCCTTGTTTTCATCATCT--GGATAATGGGGAT
+A
diff --git a/tools/emboss_5/test-data/emboss_msbar_out.fasta b/tools/emboss_5/test-data/emboss_msbar_out.fasta
new file mode 100644
index 00000000000..ac2f256f675
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_msbar_out.fasta
@@ -0,0 +1,11 @@
+>Sequence 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+gttcgatgcctaaaataccttcttttgtccctacacagaccacagttttcctaatggctt
+tacaccgactagaaattcttgtgcaagcactaattgaaagcggttggcctagagtgttac
+cggtttgtatagctgagcgcgtctcttgccctgatcaaaggttcattttctctactttgg
+aagacgttgtggaagaatacaacaagtacgagtctctcccccctggtttgctgattactg
+gatacagttgtaatacccttcgcaacaccgcgtaactatctatatgaattattttccctt
+tattatatgtagtaggttcgtctttaatcttcctttagcaagtcttttactgttttcgac
+ctcaatgttcatgttcttaggttgttttggataatatgcggtcagtttaatcttcgttgt
+ttcttcttaaaatatttattcatggtttaatttttggtttgtacttgttcaggggccagt
+tcattatttactctgtttgtatacagcagttcttttatttttagtatgattttaatttaa
+aacaattctaatggtcaaaaa
diff --git a/tools/emboss_5/test-data/emboss_needle_out.score b/tools/emboss_5/test-data/emboss_needle_out.score
new file mode 100644
index 00000000000..825a2947c15
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_needle_out.score
@@ -0,0 +1,4 @@
+Sequence hg17 20190 (604.5)
+
+#---------------------------------------
+#---------------------------------------
diff --git a/tools/emboss_5/test-data/emboss_newcpgreport_out.newcpgreport b/tools/emboss_5/test-data/emboss_newcpgreport_out.newcpgreport
new file mode 100644
index 00000000000..fe019e38eb4
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_newcpgreport_out.newcpgreport
@@ -0,0 +1,11 @@
+ID Sequence 561 BP.
+XX
+DE CpG Island report.
+XX
+CC Obs/Exp ratio > 0.60.
+CC % C + % G > 50.00.
+CC Length > 200.
+XX
+FH Key Location/Qualifiers
+FT no islands detected
+//
diff --git a/tools/emboss_5/test-data/emboss_newcpgseek_out.newcpgseek b/tools/emboss_5/test-data/emboss_newcpgseek_out.newcpgseek
new file mode 100644
index 00000000000..3ae9d7e99e4
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_newcpgseek_out.newcpgseek
@@ -0,0 +1,9 @@
+
+
+NEWCPGSEEK of Sequence from 1 to 561
+with score > 17
+
+ Begin End Score CpG %CG CG/GC
+ 121 141 34 3 57.1 1.00
+ 261 272 43 3 75.0 1.00
+-------------------------------------------
\ No newline at end of file
diff --git a/tools/emboss_5/test-data/emboss_newseq_out.fasta b/tools/emboss_5/test-data/emboss_newseq_out.fasta
new file mode 100644
index 00000000000..97665ab4e3f
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_newseq_out.fasta
@@ -0,0 +1,2 @@
+>cytoc fragment_of_cytochrome_c
+KKKEERADLIAY
diff --git a/tools/emboss_5/test-data/emboss_noreturn_out.noreturn b/tools/emboss_5/test-data/emboss_noreturn_out.noreturn
new file mode 100644
index 00000000000..c2a830c75ed
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_noreturn_out.noreturn
@@ -0,0 +1,11 @@
+>Sequence 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+gttcgatgcc taaaatacct tcttttgtcc ctacacagac cacagttttc ctaatggctt
+tacaccgact agaaattctt gtgcaagcac taattgaaag cggttggcct agagtgttac
+cggtttgtat agctgagcgc gtctcttgcc ctgatcaaag gttcattttc tctactttgg
+aagacgttgt ggaagaatac aacaagtacg agtctctccc ccctggtttg ctgattactg
+gatacagttg taataccctt cgcaacaccg cgtaactatc tatatgaatt attttccctt
+tattatatgt agtaggttcg tctttaatct tcctttagca agtcttttac tgttttcgac
+ctcaatgttc atgttcttag gttgttttgg ataatatgcg gtcagtttaa tcttcgttgt
+ttcttcttaa aatatttatt catggtttaa tttttggttt gtacttgttc aggggccagt
+tcattattta ctctgtttgt atacagcagt tcttttattt ttagtatgat tttaatttaa
+aacaattcta atggtcaaaa a
diff --git a/tools/emboss_5/test-data/emboss_notseq_out.fasta b/tools/emboss_5/test-data/emboss_notseq_out.fasta
new file mode 100644
index 00000000000..ac2f256f675
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_notseq_out.fasta
@@ -0,0 +1,11 @@
+>Sequence 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+gttcgatgcctaaaataccttcttttgtccctacacagaccacagttttcctaatggctt
+tacaccgactagaaattcttgtgcaagcactaattgaaagcggttggcctagagtgttac
+cggtttgtatagctgagcgcgtctcttgccctgatcaaaggttcattttctctactttgg
+aagacgttgtggaagaatacaacaagtacgagtctctcccccctggtttgctgattactg
+gatacagttgtaatacccttcgcaacaccgcgtaactatctatatgaattattttccctt
+tattatatgtagtaggttcgtctttaatcttcctttagcaagtcttttactgttttcgac
+ctcaatgttcatgttcttaggttgttttggataatatgcggtcagtttaatcttcgttgt
+ttcttcttaaaatatttattcatggtttaatttttggtttgtacttgttcaggggccagt
+tcattatttactctgtttgtatacagcagttcttttatttttagtatgattttaatttaa
+aacaattctaatggtcaaaaa
diff --git a/tools/emboss_5/test-data/emboss_nthseq_out.fasta b/tools/emboss_5/test-data/emboss_nthseq_out.fasta
new file mode 100644
index 00000000000..ac2f256f675
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_nthseq_out.fasta
@@ -0,0 +1,11 @@
+>Sequence 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+gttcgatgcctaaaataccttcttttgtccctacacagaccacagttttcctaatggctt
+tacaccgactagaaattcttgtgcaagcactaattgaaagcggttggcctagagtgttac
+cggtttgtatagctgagcgcgtctcttgccctgatcaaaggttcattttctctactttgg
+aagacgttgtggaagaatacaacaagtacgagtctctcccccctggtttgctgattactg
+gatacagttgtaatacccttcgcaacaccgcgtaactatctatatgaattattttccctt
+tattatatgtagtaggttcgtctttaatcttcctttagcaagtcttttactgttttcgac
+ctcaatgttcatgttcttaggttgttttggataatatgcggtcagtttaatcttcgttgt
+ttcttcttaaaatatttattcatggtttaatttttggtttgtacttgttcaggggccagt
+tcattatttactctgtttgtatacagcagttcttttatttttagtatgattttaatttaa
+aacaattctaatggtcaaaaa
diff --git a/tools/emboss_5/test-data/emboss_palindrome_out.palindrome b/tools/emboss_5/test-data/emboss_palindrome_out.palindrome
new file mode 100644
index 00000000000..6e142fa18df
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_palindrome_out.palindrome
@@ -0,0 +1,15 @@
+Palindromes of: Sequence
+Sequence length is: 561
+Start at position: 1
+End at position: 561
+Minimum length of Palindromes is: 10
+Maximum length of Palindromes is: 100
+Maximum gap between elements is: 100
+Number of mismatches allowed in Palindrome: 0
+
+
+
+Palindromes:
+
+
+
diff --git a/tools/emboss_5/test-data/emboss_pasteseq_out.fasta b/tools/emboss_5/test-data/emboss_pasteseq_out.fasta
new file mode 100644
index 00000000000..8b924679a5a
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_pasteseq_out.fasta
@@ -0,0 +1,371 @@
+>Sequence 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+gtttgccatcttttgctgctctagggaatccagcagctgtcaccatgtaaacaagcccag
+gctagaccaGTTACCCTCATCATCTTAGCTGATAGCCAGCCAGCCACCACAGGCAtgagt
+caggccatattgctggacccacagaattatgagctaaataaatagtcttgggttaagcca
+ctaagttttaggcatagtgtgttatgtaTCTCACAAACATATAAGACTGTGTGTTTGTTG
+ACTGGAGGAAGAGATGCTATAAAGACCACCTTTTAAAACTTCCC----------------
+---------------AAATACT-GCCACTGATGTCCTG-----ATGGAGGTA-------T
+GAA-------------------AACATCCACTAAAATTTGTGGTTTATTCATTTTTCATT
+ATTTTGTTTAAGGAGGTCTATAGTGGAAGAGGGAGATATTTGGggaaatt---ttgtata
+gactagctttcacgatgttagggaattattattgtgtgataatggtcttgcagttaca-c
+agaaattcttccttattttttgggaa---gcaccaaag----tagggat---aaaatgtc
+atgatgtgtgcaatacactttaaaatgtttttg-----ccaaaataatt-----------
+-----aatgaagc--aaatatggaaa-ataataattattaaatctaggtgatgggtatat
+tgtagttcactatagtattgcacacttttctgtatgtttaaatttttcatttaaaaaaaa
+actttgagc-----tagacaccaggctatgagctaggagcatagcaatgaccaa------
+------------------------------------------------------------
+----------------------------atagactcctaccaa-----------------
+---------------------------------ctc-aaagaatgcacattctCTGGGAA
+ACATGTTTCCATTAGGAAGCCTCGAATGCAATGTGACTGTGGTCTCCAGGACCTG-TGTG
+ATCCTGGCTTTTCCTGTTCCCTCCG---CATCATCACTGCAGGTGTGTTTTCCCAAGTTT
+TAAACATTTA------CCTTCCCAGTGGCCTTGCGTCTAGAGGAATCCCTGTATAGTGGT
+-ACATGAATATAACACATAACAAA-AATCATCTCTATGGTGTGTGTTGTTCCTGGGGTTC
+Aattcagcaaattttccctg-ggcacccatgtgttcttggcactggaaaagtaccgggac
+tgaaacagttgatggccca-atccctgtcctct---taaaacctaagggaggagaTGGAA
+AGGGG-CACCCAACCCAGACTGAGAGACAGGAATTAGCTGCAAGGGGAACTAGGAAAAGC
+TTCTTTA---AGGATGGAGAGGCCCTAGTGGAAT-GGGGAGATTCTTCCGGGAGAAGCGA
+TGGATGCACAGTTGGGCATCCCCACAGACGGACTGGAAAGAAAAAAGGCCTGGAGGAATC
+AATGTG-------CAATGTATGTGTGTTCCCTGGTTcaagggctgg-gaactttctcta-
+aagggccaggtagaaaacattttaggctttctaagccaag--gcaaaat-tgaggatatt
+acatgggtacttatacaacaagaataaacaatt---tacacaattttttgttgacagaat
+tcaaaactttat----agacacagaaatgcaaatttcctgtaattttcccat-gagaact
+attcttct--tttgttttgttttgcgacAGGGTTGCGCtgatcctcccgcctcagtctcc
+ctaagtgctgagatgttgcaggaagtcagggaccccgaacagagagatcggctggagccg
+tggcagaggaacataaattttgaagatttcattttaatatggacacttatcagttcccaa
+ataatacttttataattttttatgcctgtctttgctttaatctcttaatcctgttatctt
+cataagctaaggatgtacgtcacctcaggaccactgtgataattgtgttaactgtacaga
+ttgattgcaaaacatgtgtgtttgaacaatatgaaatcagtgcaccttgaaaaagagcag
+aataacagcaatttttagggaacaagggaagacaactataaggtctgactgcctgcgggg
+tcgggcaaagggagccatatttttcttcttgcagagagcctataaatagacctgcaagta
+ggagagatattgctaatttcttttgctagcatggaatattaatattaacaccctgggaaa
+ggaatgcattcctggggggaggtctataaatggccgctctgggaatgtctatcctacgca
+atggagataaggactgagatacgccctggtctcctgcagtaccctcaggcttactagggt
+ggtgaaaaactccgccctggtaaatttgtggtcagaccagttttctgctctcgaacactg
+ttttctgttgtttaagatgtttatcaagacaatacgtgcaccgctgaacacagaccctta
+tcagtagttctcctttttgccctttgaagcatgtgatctactccctgttttacaccccct
+caccttttgaaacccttaataaaaaacttgctggttt-gaggctcaggtgggcatcacag
+tactaccgatatgtgatgtcacccccggcggcccagctgtaaaattcctctctttgtact
+ctctctctttatttctcagccagctgacacttatggaaaatagaaagaacctacgttgaa
+atattgggggcaggttcccccaataTCTGGTGCCCAACGTGGGAtactgagattacaagc
+atgagccactgcatctggcctcttcttttgatttttttttttcaaacttttacaaatgta
+gaaaccattcttagcttttgggcattaccaaacccggcagtgg-caggctcggttcacca
+acgtcatttgcagttccccgCTTTATGTTATGGgttttgttttgttttgtttttttt-at
+tgagacagagtttcactcttgttgcccaggctgtagtgcaatggtctgatcttggctcac
+tgcaacctccacttcccaggttcaagccattctcctgcctcagcctctcaagtagctggg
+attacagacactcaccaccacacctggctaattttgtatttttagtagagatgaggtttc
+accatgttggccaggctggtctcgaaatcctgacctcaggtgatccacccaccttggcct
+cccaaagtgctgggattacaggcttgagctaccacgcctggctGGGTTGGTTCTCAATGG
+AGTGGTTTGTTTTTGGAGCTGCTCT-GCGCAGtggggaccagaataggcctg--------
+-----------ggttcctagcccattgctattcctt----accagctgtggattctaagg
+aaagtcatttaacctcgctggaccttag-attcctcatccctgaaGCCCAAGGGTaaaac
+aaaacaaaacaaaacaaaacaaaccaaCCCATCATGTAAAGCGGGGAACTACAAACGATA
+CAGGTGAAACATGCCTACCACACCACTCACAGGCT--ATGATGACAAAAACGTGGCTACA
+TCTGGGACCACCCCCCAACCCCCACTTTGTACGTAGGAAATACGGAGTTGAGGATGGAGA
+CCCACAGTATGTCCAGAGTGTCCCCAAAGGCCACAGTGCCCGCCTGGAGCCCTCCAGAGA
+GCGTGCACTCCCTGGGGTGCCAGCCAGAGACAACTTGCCCTGAGGCTTGGAACTCGATTC
+TCCGCGTGCCAGAGAAGGGGTGGGACTTCAGAACCCCCAACCCCGCAATCTGGGTCGGGG
+AGCCTGGCGCACTGCGGGCCGCTCCCTCTAACCCTGGGCTTCCCTG------GCGTCCAG
+GGCCGTCGG-----------GGCCGAGTCCCGATTCGCTCCCACCCCGAAGCCGCGCCAG
+GACCAACGAGGGCGCAGCCGTATGCCCCAGCCCGCTCCGCGGAGCCCCTCACAGCCAccc
+ccgccccgaccgcgccccgcgcggcTCGAAGCACCTTCCCAAGGGGCTGGTCCTTGC---
+-------GCCATAGTCGCGCCGGAGCCTCTGGAGGGACATCAAGGATTTCTC-GCTCCTA
+CCAGCCACCCCCAAATTTTTGGGAGGTACCCAAGGGTGCGCGCGTGGCTCCTGGCGCGCC
+GAGGCCCTCCCTCGAGGCCCCGCGAGGTGCACACTGC---------GGGCCCAGGGCTAG
+CAGCCGCCCGGCACGTCGCTACCCTGAGGGGCGGGGCGGGAGCTGGCGCTAGAAATGCGC
+CGGGGCCTGCGGGGCAGTTGCGCAAGTTGTGATCGGGCCGCTATAAGAGGGGCGGGCAGG
+CATGGAGCCCCGTAGGAATCGCAGCGCCAGCGGTTGCAAGGTAAGGCCC-CGGCGCGCTC
+CTTCCTCCTTCTCTGCTGGTCTTTCTTGGCAGGCCACAGGGCCCCACACAACTCTGGATC
+CCGGGGAAACTGAGTCAGG-AGGGATGCAGGGCGGATGGCTTAGTTCTGGACTATGATAG
+CTTTGTACCGAG-----TTCTAGCCAGATAGAAGGTTACCGGGAGCTGGGGAGCGTTGGA
+TTTGCTGCTGGGCTGTGCCGGTGCCCAGAAGGCA------GGACCTTGCAGAACCAGCCA
+GGTCCCTGGGAGACTGTCAGACCCACCAACCTGGTGGCATTCGCAGAGCTGAGATGCATT
+GGAAATTGCCTTGGGCACATCCCCAAAGATCAGGATGTCCCACCCCAGTCTGAAGGAGA-
+--TAAAGTTGGGGGTAGGAGAGACGCAG-ATGCAAGTGATCAGTCTC---AGTCCCAGAC
+ATTGCCTTGCTCTGCGGGTAGGAATTCAGGATTCATTTTCCAGGGAAG--------TTCC
+TGACCTCTGAATGAGAGGGGCTGTGTAAGGCCAATGCCTGGG-AGGAAGGCAAGGATGAG
+TAGAGGTGGGGGGAAACAAGTGTCAGGAAGA-----------------------------
+---------------CTCAAA---------ATCTTC------------------------
+--------------------------------------CAGAGAAATTGT-----GCAGG
+GTCTTACCAGATCTGTCCTCAAAGCCATGCAAATTGCCTTCTTTGCAATGCAT-ACAATG
+AGGTGTCTCTGGGGGTCAGAACTGG-----------------------TTATTAGGGAAC
+TTCTAGCCAGGACTGCTAAATACGCGCTGTTGG---------CCCACCAGGCTCACCTAT
+AGCCT-TCCTTCAGTCTGGGCTTGGTTTGGATTTCACTGTGGGTGCCATCGCCTTTACAC
+TCCTGTTTCTATAGTTTAAAGATAGTGGTGCTTTGGGAAAG---TGACTCCTTAAATACA
+GTTAGGTCCAAGTGA-GACAAGTGGCCTGGCTGTCATTTCAGAATAGCAGCTTCCAAGAG
+G----------TGATTAATTTCTGTTGGAAGGGTGAT-CTTTGGGGAGGT--GGGTGAAG
+AGCAGAGACTTGGTGGTACCGTTCCAGGAGCACAGGCTCTCT-----TCCTTTGCA--GT
+GCAGAATGACCTCTGGCAGCCGGAGTTGTGTTTGTT--------CTGTAGGATTCTGAGG
+TGGGCCATGGGCAGCTGGAACTGGG-----GAATTTTGCCAATCTCTTTCATATTAGGAT
+TGTCTGCAGAACCAGATATGGAGG------CTTCTAGCAACGTGAGTGCTCCTGTTCTAA
+TGCCCTTAGAAACAAGAAGGCCACACTGATCATTTCTCTCACTTAGGCAGGGAGACAAGG
+CAAGAGAGAAACAGT-----------------GGATGC--TTTTAGGTTCTTTCCCTTCC
+CAAGCAGTTGTGGACATTGGGCTGA-GGGGAACATTTCCACATTGGCTAAAGGAGCGTCC
+TCCTCATATTTTGTACATTTTATACCCAA--AATAA-CTCTTCTTGGTATTT-GGGGAAA
+TATTTTCCTCCCCGTCC------------ATTCCAGGAAATGGCTCCAAGTGCCAAGGAC
+AGAGCCAGGGAAGTTGCAATGAATTCCTGCCCGTCAGCCCCAGGCAGATGCCTTGCACGT
+CTGAGTGGCCCATGCAGAGCGTGGAGGTGGCCGCC----------------ACGGAACC-
+TGGGTCAATGT-CCCACCCCCG----CTTAGATGCCA-CCAGGGG--CGTGGGAGCCAAG
+GAG--AGAAGAGGGGCTCCAGGAAGGTAGAGTCCTTGTGTCTTGTGCATCTGTGAACAGC
+ACTGGTATGATTTAAAGGAAAATTGAGCCAAATTTTCCGGCAGTCAGTT-----ACCCCA
+TCCCCACCGGGGTAGGAGTCTGGCAGCCGCAGCTCCATTCTGGCCAGTCGGCAGAGAGCC
+TTGAAATTCTTCTTTGTCCACACAGTTGTCTCAGAGAAACAG--AGAGGTT-GTTTCTGC
+TTAAAAACAACACACTTGGTGTCTGGGCCCACAGACTCCTTTGCACTTATTCCACGTGTG
+ACAGCCAATGTGCCTCGTTGCTTAGCAGACAGCATGTTACCGTCTTTCCTGCTCAGTTTG
+TTAG--------------CTCTATGGAATGGAATTTATAATCAATGCCCATACCAACATT
+TCACTAATATCATAGGAGATTTAGTCTCCATCTGGGTGTACATTACATTTGC--TCTGGG
+G-TGCTCCAGGC--TGGGGGGTTGCCAAGGAAGAGAAGAGAAACCGCAGAGAAGAC---G
+GGAGGGCAGGGCAGGGGTCTCTGAGAAGGGGAGGGGTCCCAGAGTGCAGGAGCAGGAGCC
+AGGCTC---------ATGAAAGGGGCCACGGGCGGGAGTATCCAGGGACGGCAGTCAAGA
+TGGAGCACAGCTTAGG--AAGCTGAAGGGAATCCTGGCCCACCTGGGTGCTAGAGGGCAC
+ATAGGAAGTGCAGGAAGCAGACCAAGGTCCCCAAGAGAGGGAGACCTGGACGCTGAAGCA
+TTTTCTGTCTTTATTAAG-------------ACAACTCCGTAAGAATTCCTGCTGGGCCA
+AAGTGAATTCTAGGATGCGACTTTAAGATGGGAGCAAGCGAACCATTGAGGAGGCAGGTT
+ACCCTAGTTAGCCAATGCAGATCGAGAATGGGAAATCTTTCatttattcatgcaacagat
+atttaacgaagccctgccgtgttccaggcctgtgatagatgctggaacaggtacagaga-
+---------tAc-------aggtgtcattaattgatcaggg--caacctctc---cttct
+gagt--cttgctggagcttcagatgc-ccctcacacagagctcgagggagcctc-aacaa
+ttgatcagaagtcaggcaccatggctcacgcatataatcccagcactttgggaggccaag
+gcaggtggatcactggagcccaggagttccagatcagctggggcaacatggcaaaacccc
+atctctattaaaaaaaaaaaaagtaactggatgtgatggtacacacctgtagtcccagct
+acttgggaggctgagaggtgggagaattgcttgagcccgggaagtcgggggtccagtgag
+ccttgatcacaccactgcactccagcctgagtgacagagcaagaccctgacacacacaca
+cacacacacacacacacacacacagattagagctgaaacaggagtagaaacctatctg-t
+atctctgATGA-GATCAGATC---------TTTCTGATGAACAGAAAGAATGTAACCCCT
+GTACTCACACCCTCTCTGCTGGTTACATATGTTAACACGATTTCTCAAATGAGGCTTTTG
+GTTGCAAATAAGAGAAAATCACTCACGCT-GGCCCTGTG--TTTTTCAAATTGTTTATTG
+TGATCAACATTTGAAAAAAGAGCCGAGACTCTCAAGAGTGCATTACCCACGGTAAGGGTG
+AATTTT-ACTTCTTGACACTTATTTCTCTTACATGTATCTATCTGTCTC-----AAATGA
+AAAATATATTTAGAAAGTTGAAAGCTATCCAAGTGAGTATAAGAAAAGAGTATCTCACCC
+TGAAGGCTAAGGACAGGGAGGGC---------------------------CACCAGGCCT
+CACGAGGACCCAGGAACCACAAAGAAGGCT-AGGAAGGAGCACAGGCGGTGACCATACTC
+TGGCTCAGTGGCTATGTGGGCTCTGGTCTCTCTCAGCTGTTCCATGCATATGAGGCCAAA
+TGTGGCTACCCTAGAGCTTCTGAGCCCTCAACAGAGATGAACTGGACTCTCTGCAGCCCC
+ACTCTAAATTCCTAAGAGAGAAGTTGATTGACCCAATCAGGGTCAGGAGAAGGAAGGGAG
+GAGGAAAGGGAGGAGAGAAGAGCCTCTTCGTCTCTTGCCTACCACTGGCCAGGCAATTGT
+AGCCAAGGGGGCTGGAGTGTAAATGCAAACATAGCCATCAAGGGTtgtgtatgtgtgtgt
+gtgtgtctgtgtgtgtgtatgtgtgtCTCTTGGGTAGGTTAGA-TCTCCCAGGAGGTCCC
+TACTAAACAGACTTAAGCCCGCAAAATTTTAGCTCTCCAGCCTCACACACTCCACCCCTC
+TACCATATTGAATCTTCCCAAACCAACTATGGCTTTCCCTAACTCCGGAGc------ttg
+gcctggaatgccctgcttcccctctttcccctggggaacgcctgtccttcaggcctcagt
+tcacacactgcctcccttgcaaagctctccTCCCATCCCCGGAGTCCCT--CTTCCCCTT
+TGTTCTTTGGGTTCTATGCTTCTTCCCTCATAACTCCCACCAGGTTGTGTTAAAATGAGT
+TGTTCAAGGTCCTGTCTGTTCCACTAGATTCTGAGCAACTTGGAGAACGAAGATCCAAAC
+TTCGCTGCCTTTATTTCCTCCTTTGTTCTTTTCTCATCCCCAAGTCCCTTCCAACTTGGA
+GTTATgaagaaaggaaggaaggaagggtgggagggaagaaCAGGAGGGGATCCCACAGG-
+AGAATGTGTATAGGGAGAGGACTCAGACTAGCTAAAGCTTTTCCCTCATAATTAATAGCA
+AATACCATGTTACCTGAATTTAATTCACAGTAGCATACAAAAGACTCGCTTTGTTCT---
+----CCCCA---------TTGATGTCATCAGAGG--------------------GCTGTG
+GG--------------CAGGCCTAATCTTGGCTCAGGAGGCCCTCCAGCCTGGATCTAAA
+GAGCAGCAGATGggccaggctcggtggctcatgcctgtaatcccagcattttgggaggcc
+gaggcgggtggatcacgaggtcaggagtttgagaccagcctggccaagatggtgaagcct
+cgtctctactaaaaatacaaaaattagccaggtgcggtggtgggcgcctgtatttccagc
+tacccgggaggctgaggaggctgaggcaggagaatcgcttgaacccgggaggcggaggtt
+gcagtgagccgaggtcacgccactgcactctagcctgggcaacagagcaagactccgtca
+aaaaaaaaataaaaaaataaaaaaataaaaaaaataaaGAGGAGCACACATCTCTGCCCA
+TCCTAACTCCCACTTTGACATTGAGGTCCCCAGGATGGAGGGTCTGCCTCCATCTGCCTT
+GTCCCCTG-CAATGGTGGGAAGGTGATGGAGCTCAAGTCTAGAGGCCACCAGCTTCTTAG
+GGAGG--TAGGAGGTG---------------GAGGGTGGGGTGC-GGGCCCTGCACACAA
+CTGCCAAGTGAGGATGGGGGTGGG-GTCCACCTGAGGATAAGTAACAGTGAGGCTGGTGC
+AGAGGACCCAGGTGGAGGTAGACAGCAGAATTTGTGGTGGGGT--GGATGGCAC-ATTAT
+ATAAGCCTCTCTTGC------TGCCCTGT---TTACTGAGATTGTTTCAttatctttttt
+ggcttttgtttttaagagatggggtcttgctgtgtcacacaggctggagtgcactgtgtg
+atcatacctcactgcagcctcgacatcctgggctcaggcaaacctcccaccttggcctcc
+caagtagctgggaccacaagcgtttgccaccacactcagctatttttatttttattttta
+--ttttttttagagatggggtcttgctgtgtcgcccaggctggtcttgaactcctgggct
+caagcgatcctcctgccttggcctcccaaagccctgggattataggctgagccaccacac
+ccagccACATTTCATCTGTGCAGCTCCAGGGGCTCCACATTCT-ACTCTTCTCATTTCTT
+CTCCAGGGTACCC----------ATGGCAAGGGATGAGGGT--AGAAGATGGGGCA--GC
+CAGGCCTTGATTAAAGGAGAAGGAAGGCAGCCTGTGGAGAGG---GCAGCC---C---AG
+GGAG---TGCAGAGAGAAGTGGGCCATGAGGGAGA---CAGCAGAGTGCAGGCTGCGTCC
+---CAAATGAGCATACAGCCCACTGTGAGCCCACC--ATCTTCCTAGA-GA--CCCCTCT
+CCTCTCC-AGGAGCTGCTTCAGTAGCACTCA---------GAGGAAAGAATGATGC----
+----TGTATCAACATTTCAGCAGCTCATCTTTTAACTCTAAGAAAATGGCAGCTCCTAAA
+TGTTCAA--AACTGCTTTGGAAACTTCT---GGAGAGAGGTTTTGCAGCTCAGGCAGACA
+GCTGATCGCGGCCTTTCTTCCACCCCAACCCATGCTCTCCCCATGCT--CTCCTGCCACA
+GCTGCAGCGGGCCCCTGGGTCCTACATTTGCAG-CCCTTTGTCTCTGAGCT-----CAGA
+CTTCCAATTCCAAGCGGCAGCTGGGCAGGCTCACCAGCATGT---CCAGCCAGTACTAGG
+ACATCAGCAGGAGC----CCAACCACCTCTTTCCAAAATCTCTCCTCATGTCTCTCCTAG
+TTTCCATCTCCATCCTTCTAGTCAGCCAGGCTGAAAACATT-----------------TG
+CTCCTCAGGGTGCAGAAGGGAAAGCTTTGCCTCCCTTCCTGGTGCTCACTGCCCCTGCGA
+TTCCAGCCCAAGCCCTCCCCGGCTCCTCACC----------CTGGTGTCAGCTGGAAGCC
+ACCATCTCCTAAACCCACCTGtgttcttccacctctgc--------cagggctgc-cctc
+tcctccaccttcacaaactcaattcctacccattctcaggtcccttatcaaatgccatct
+cctccatgatgcctccctgattccccTGCTGGAaataatggtgataacagctaag--gca
+ttggggttggctacgtgccaggcaaggagttggcactttacatgctttatctcatttcag
+ccacataacatcgacaggt-ggcattatgattcatatcatccccatctgatagccaggaa
+aactgagtcccagagaggttagc-cactttcctagggccCTGTGCTCTGACTCAAGCATA
+GCTCTGAGGAACTCTAGCATTCATCAGTTTAAGCACCATGACTTTCTTTGCTGAGTCACC
+CAAGGCAT-TTCTTCATTTAAATGTTCTTCCTTGGCCAGGCGCAGTGGCTCAggcccaat
+gcggtggctcacgcctgtaatctcaacactttgggaggccgaggtgggcagataatctga
+ggtcaggagttcaagaccagcctggccaacatggtgaaaccccatctctactaaaaatac
+aaaaaaatgaggctgggcgtgatgactcacacctgtaatcccagcactttgggaggccaa
+ggcaggtggattacatgaggtcaggagttcgagaccagcctggccaacatggtgaaatcc
+tatctctattaaaaatacaaaaaattagccaggcatggtggcaggcacctgtaatcccag
+ctacttgggaggctgaggcaggaaaatggcttgaacccgggaggtggaggttgcagtgag
+ccaaggttgcaccattgcactccagcctgggcaaaaagagggaaacatcgtctaaaaaag
+aaaaaaaaaaaattagccaggctgggtggtgcatgcccgtaattccagctactcaggagg
+atgaagcaagagaattgcttgaacccaggaggcagagattacagtgagctgagatcacaa
+cactgcactccagcctaggtaaagaacaagactccatctcaaaaataaataaataaaaat
+aaaTGTTCTTCCTTGCAATGAAGTTAAATATGTAAATTCTCAAACCAGTTGCTTAAGGGC
+ACAGTTTTGTTCTTTACCTATATTTTTAACAAATATTTTATGTAAGTAGTTGAC-AAAAT
+CAAATACTGT-GTACACTACCGAGGCTTCCCTGGGAAAGCCATCAG-CCTCTGCCCCATC
+CCTTCCCACTCCTGATT-CCACTTTCCTGTGTTTCCATATCTTTTTCATGTCTGTTTCTG
+GCCCACAGTGGGCGATCAATACATGTTAGCCACCAACCATCAAACCTATATTGAGTAATT
+ATGGTATGTCAGGCACTATGCTCAATGAAATTGTAttaggcttgtacaaaagtaattgtg
+gtttttaagagtaatggcaaaaacggcagttactttcgcaccaacTATTTGCTGCCTTGA
+ATTATTCCTCCTCTC-CTCATCCCTAAACCCTGCTCCTCCCAGCCATTCTTCCTCCCCTT
+CTTGGGCCATGGCCAGGCCCCACCCAGGTACTAAGACTCAGGTGAACCAAGGAAGACTTA
+ATGCCCACTCTTTTCTGATGCCCATGTT--GGCATGTGTTAAGtcggttagcattaagtt
+tggctgcatttagcagagacccaaaagaacagtgccttttaaaaggcagaggttatgtct
+ctcacacacacccagcacaagtccaag-------------------------accagcat
+ggcatctcagctccatcaa--cctcaggaaccgagctcctgcagctccctgccctgcagt
+tgataaggtgaggtctttgtcctcctggttcaagatggtgctagaatgttggctaccata
+tctatagtccaggcatcagaatggagcaagggatgaaaaaggaagagatgaaggcacacg
+acaggttcctgagagctggcacaggacacttctgcttatatttcactggccagaacttag
+tcacatggtcacacctagttgggagactctgagaagtaa----agtatttattctagatg
+gccatatccctacc-taagacttggagttttctatgactggggaagaacggaagacaaga
+tattgggaaagactagcagcctctactaAAAGGGTGATCtgtgttgatgtgcgtgtgtgt
+gtgatgtttgtatg---agcatgtgtgt-tatgtgttgt--gtgtTGGTGGGGCA--GAT
+TCTTGCGAGCACTTTGGTCTCAGATGGACCTGCTACCAGTTCTCTCTGCAGACCCCCATA
+GGTTTCTCCTAAACCTGGCCT-CTCCTATTAGGCAGCCTTACTCAGCGGCAGCTTCTCAG
+CTCCATGTTTTCAAGGAACCACAATTTATTTCCAGCATCCACTGAAGCATATTATCAGTG
+GTGATAGAGGGGGCTTGTAAAACTGTTTTTCCACTTAGGTATTAGAGGGTGGCCATTATT
+TGAGAGTGAC-----TATGACCACAGTTAATCTGGTAATAAATTCTCTTGGGTAGGAGGG
+GGAAAGGAAAGGATGCTTTAAGGAAGCATCTTGCCAGGAGACACAAAGCTAACAAGAGTG
+GAGCCTGCAG----------------------------CTGGAGCCGCAGAGCCTAATCA
+CTACACCCGCCCATCTCTGCTAGGGTTTCATGACTTCGTATCGGGGATTAGCAGTATTTA
+ACTCTGTTGCACAAACATTTGGTGTA-----TTATTCAGGTAACAAGTAGCTAATAGAGG
+AAGTTTTACTTTTTTAAGACATAA--------------------ATTTGCCTTTTCCCAA
+ATTACTTGGTACATAGTAC-TTTTCATGTTTGAAGTTGAGATGTGGGTACAATACCATAG
+CTTTATTCCAGAGCAGGGTATTTGTTTCCAAATGCCATGTTCCCAGCAGCTGCCCTTGAC
+TGGGAATTGGGGTG-----TGATTTGGGCTTTTCCTTAAATCCTTGA-----GGAGCTGG
+A---GGGGTGGGTGGCTCGCACTCCTGCTTTctgg---------atctgaatc-------
+-------ctgactctgtcatggacctgtt-tgactttgggcaagttgactcctattcctg
+agccccatat-ttttctcttctgtgaaattcagattaaaaA-AACATGGCTTTGATCAAA
+CATTATAAATAATATATAGACAGACTGCTTGTTTTTATTGTATTGCCAG-AAATGAATCC
+TACTAATATTGCCATCTATGGACAGAAAATGTATTACCTGTCTTCATCAAGACCCAGACG
+AGGAAGAACACGAAAAGCGGAGATTAATTTTACTGCCATCTCCAGAACCGTCATCCTAAT
+ATTTACTTACAT-TTTATTATTATTTCAGGCTCATGCACATATACTTAGCATGGATCATT
+GGCCACAGACTCGCATACATTTAACTTTATTACCTTT-TGCCTCATGTATCTCATTAAAA
+TTTTGCTGCTTAATCAAGGATCTGCATATTATTTTAATTTTAGAATTCACAGTTCCAAGA
+CTTTGAAAGTTTCAAGCGTTCTGGGTGaatgtgttatgc--tctctcccgccaccatgtc
+tttataccccctgatttctcagccact-atggcaaccactttctactcttagtagcccat
+atttag--tccaatccccagctcaggagacacttcttccaggg--agccccctgtgcctt
+ccagtagtatcttgtacctgccctttttgcaaagctctttcctcctggcttagaatggcc
+cattgacctgtttgtttctcctattaaactgtaagccactcgagggtagagagcatctgt
+tgttcaccattgcatcctcggtgctgagcactgcgtctgacatattatttagaaggtcag
+taagtgctagtgggatTCAGGCTCCCAGTGGGTGGGAGAGAAAGGACGTAAGGAAGCAAG
+TGGTAAAGGCCCTCACAGA-GTATCAGCAGGCTGGTGTGA-GGGAGAAATGCAGAGGATG
+GGTGAGTAGCA-----TAATCGCTAATGAT-AGGGTAATGATAGAGCACATTTCACAACA
+CCTTt-aagccctttcacgtgcatcagataatttgatcctcataaaagcctagagataga
+tatattacagg-gatgaaggtggagtattttgtggttatgtgatatg-tttaaaattatg
+cagtgagtaaatgactgggttcaaaccagaccttaaaagtctgttatctttccCTCG-AG
+CATGCAATGAAGTCTACATCATCCCTACCATGTCCATTTGATCACACCCTGGCCTCACAG
+CTCTGTGGTCTACAGGATACCTCATGGTGGTTTTATTGACCAGACAATAATCCTCTTTCT
+AAGGGGATGCATTTCATTAATACATATGTAGATCATGAATTGTCTTTGACTTTGAGGGGA
+TGGTAGC----CAGAGCAGAAAGCAAAGCTGATTTTCATCCCCGTCTGGTAATGTGGTTG
+GTAATGTGAAGA-TGGGTGTATTCTGAGATACCGGCTCCTTGCAGTGTGTGGTTCCTTCT
+GTTTTCAGGCCC------AAGAAGCCCATCCTGGGAAGGAAAATGCATTGGGGAACCCTG
+TGCGGATTCTTGTGGCTTTGGCCCTATCTTTTCTATGTCCAAGCTGTGCCCATCCAAAAA
+GTCCAAGATGACACCAAAACCCTCATCAAGACAATTGTCACCAGGATCAATGACATTTCA
+CACACGGTAAGGAG---AGTATGCGGGGACAAA---GTAGAACTGCAGCCAGCCCAGCAC
+TGGCTCCTAGTGGCACT-GGACC-CAGATAGtccaagaaacatttattgaacgcctcctg
+aatgccaggcacctactggaagctgagaaGGATTTGAAAGCACAGGGC-TCCACTCTTTC
+TGGTTGTTTCTTTTGGCCCCTCTGCCTGCTGAGATTCCAGGGGTTAGTGG----------
+----------------------------------------------TTCTAATTCTAAAC
+CACTCCAAGAACATTTGATTTTGCTACATGTTTCCATTTAAAAATCATAGGATTTGggct
+gggtgtggtggcttgtacctgtcatcccagcactttgggaggccaaagcaggaggatcat
+tcgagcccaagagttcgagaccagcctgggcagcatagggagaccccatctctacaaaaa
+taataaaaaatgttagctgggcatggtggtgtgtacctgtggtcccagctaggggaggct
+gagatggaaggatcacctgagcctgggaggttgaggctgcagtgggccctgatcatgcca
+ccgtgctccagcctgggtgacagagtgagaccttgtctcaaaataaataaataaataaat
+aaaAGTCATAGGATTTgatcaggcatgatgggtcacatctgtaagcccattgctttagga
+ggccaaggtaggaggatcagttgaggccaggagttcaagaccagcctgggcaacatggca
+agacctctctctctaatttttaaaaaaataaaaaTTAAAGATAAGAAAAAAATCATAGGA
+TTCTCATGAGGCCTCACGTGCTTATTTTCAACCTACCAAGGGGAAACCCAGGCCTCAGCG
+ATTAGCTGAGC----------CACATGCAGGCACAG------------------------
+CCACTG-----TCTCTTTCCTTCCTGTCCCCTCTGTCCCCACCTTCTGCGCTCGCCTTCC
+TCCCTGACTTCACTTCCTTGAATCTTAGTGCCTACGACCAGAGGGAGCTGTGAAGTTCCT
+TG----TGTCCCATTGGCAGGAA-CAAGACCCCCAGAAGCATCTCCTCAGGGC------C
+TCTA-----TCCCATCTC-TAGATGTGCTTGTCATTAGG-Gttct-------------tg
+tagttccagctgatctctggccctgccgctcaaagatacccaaaagagcgagtctaccct
+ttttcacattcaaccctctactgatttgcaaatagcagtcagtgcccaccctggtctttt
+ctctggggtccagcaggcctagaccttcagccattttcctgatgaGGTCTGTAtttgaaa
+ttaggaagattaagtttgaatcttcacacttctgat----gtctgtgagatcttcagcaa
+gttccttact--gtctttaagccttgt-tttcatcatctggataatggggatatcacaca
+cta-ttcacaaggttgttatgaggcctaaattagctaaagcaATTGAATCCTCCTTACCC
+CCTGCATGGAGCTCTCTGGAGACTTCCACGTCTCCTGGTCATTGTGGGTGTCTTATGGTA
+-GTCTTGGGCAGTTAGGGAGAAGTTAGGTGTCTGGAAGCAAAGATGGCTCAGAACTAGAT
+AGAGTC-TTGGGCATTTTATA-GATAAAAACTCTT--GTCTCCtttaaaaataataaaaa
+aaaattaGCTGGGCATATTAGCCACTCAGCAAGACTGCACGTGATAGATCCCGAGTGCCC
+CACCTTGGGTGGTGTAATACACAATATCACGGGAGCCCCGGGTAGTAACCACGGAGGTGT
+CAGCCTCAGTGCTGTGGGCAGATG-GATGGGGAGAGCC--TCCCGG-AACTGGAGTCACT
+GGAGCA----------------------------GGGTTGGGGGGCCTCACTGAGGGTAC
+GGCCTTGATCTCTAAGGAGGAGGGACTGCCTGGAAAAGC-TGACTGGGAGGGAGGACTCG
+GCTGGGGGTAGAAGGGA----------CTAGGGAAGGCTGGGGGTGGGGGTGCTTATGGA
+GGACCTCAGATGCCTGGGGAACAGACTCCACTAAATAAAACATATGAAACCATGGCTGGT
+TCTTCAGCAGAGGCCATGTAGAGAAAGGAATGACCTAGGAAAGTTGGCCTGGAAGTGGAG
+GGAAGGATGGTGTGGGAAAAGCAGGAA--------TCTCGGAGACCAGCTTAGAGGCTTG
+GCAGTCACCTGGGTGCAGG-ATACAAGGGCCTGAGCCAAAGTGGTGAGGGAGGGTGGAAG
+GAGGCAGCCCAGAGAATGACCCTCCATGCCCACGGGGAAGGCAGAGGGCTCT-GAGAGCG
+A--TTCCTCCCACATG-CT-GAGCACTTGTTCTCCCTCTTCCTCCTGCATAGCAGTCAGT
+CTCCTCCAAACAGAAAGTCACCGGTTTGGACTTCATTCCTGGGCTCCACCCCATCCTGAC
+CTTATCCAAGATGGACCAGACACTGGCAGTCTACCAACAGATCCTCACCAGTATGCCTTC
+CAGAAACGTGATCCAAATATCCAACGACCTGGAGAACCTCCGGGATCTTCTTCACGTGCT
+GGCCTTCTCTAAGAGCTGCCACTTGCCCTGGGCCAGTGGCCTGGAGACCTTGGACAGCCT
+GGGGGGTGTCCTGGAAGCTTCAGGCTACTCCACAGAGGTGGTGGCCCTGAGCAGGCTGCA
+GGGGTCTCTGCAGGACATGCTGTGGCAGCTGGACCTCAGCCCTGGGTGCTGAGGCCTTGA
+AGGTCACTCTTCCTGCAAGGACTACGTTAAGGGAAGGAACTCTGGCTTCCAGGTATCTCC
+AGGATTGAAGAGCATTGCATGGACACCCCTTATCCAGGACTCTGTCAATT--TCCCTGAC
+TCCTCTAAGCCACTCTTCCAAAGGCATAAGACCCTAAGCCTCCTTTTGCTTGAAACCAAA
+GATATATACACAGGATCCTATTCTCACCAGGAAGGGGG-TCCACCC-AGCAAAGAGTGGG
+CTGCATCTGGGATTCCCACCAAGGTCTTCAGCCATCA---ACAAGAGTTGTCTTGTCCCC
+TCT-TGACCCATCT-----------------CCCCCTCACTGAATGCCTCAATGTGACCA
+GGGGTGATTTCAGAGAGGGCAGAGGGGTAGGCAGAGCCTTTGGATGACCA--GAACAAGG
+TTCCCTCTGAGAATTCCAAGGAGTTCCATGAAGACCACATCCACACACG--CAGGAACTC
+CC--AGCAACACAAGCTGGAA---GCACATGTTTATTTATTCTGCATTTTATTCTGGATG
+GATTTGAAGCAAAGCACCAGCTTCTCCAGGCTCTTTGGGGTCAGCCAGGGCCAGGGGTCT
+CCCTGGAGTGCAGTTTCCAATCCCATAGATGGGTC-TGGCTGAGCTGAACCCA---TTTT
+GAGTGACT----CGAGGGTTGGG-TTCATCTGAGCAAGAGCTGGCAAAGGTGGCTCTCCA
+GTTAGTTCTCTCGTAACTGGTTTCATTTCTACTGTGACTGATGTTACATCACAGTGTTTG
+CAATGGTGTTGCCCTGAGTGGATCTCCAAGGACCAGGTTATTTTAAAA---AGATTTGTT
+TTGTCAAGTGTCATATGTAGGTGTCTGCACCCAGGGGTGGG-GAATGTTTGGGCAGAAGG
+GAGAAGGATCTAGAATGTGTTTTCTGAATAACATTTGTGTGGTGGGTTCTTTGGAAGGAG
+TGAGA-TCATTTTCTTATCTTCTGCAATTGCTTAGGATGTTTTTCATGAAAA--------
+----TAGCTCTTTCAG-GGGGGTTGTGAGGCCTGGCCAGGCACCCCCTGGAGAGAAGTTT
+CTGGCCCTGGCTGACCCCAAAGAGCCTGGAGAAGCTGATGCTTTGCTTCAAATCCATCCA
+GAATAAAACGCAAAGGGCTGAAAGCCATTTGTTGGGGCAGTGGTAAGCTCTGGCTTTCTC
+CGACTGCTAGGGAGTGGTCTTTCCTATCATGGAGTGACGGTCCCACACTGGTGACTGCGA
+TCTTCAGAGCAGGGGTCCTTGGTGT-GACCCTCTGAATGGTCCAGGGTTGATCACACTCT
+GGGTTTATTACATGGCAG-----TGTTCCTATTTGGGGCTTGCATGCCAAATTGTAGTTC
+TTGTCTGATTGGCTCACCC-AAGCAAGGCCAAAATTACCAAAAATCTTGGGGGG--TTTT
+TACTC-CAGTGGTGAAGAAAACTCCTTTAGCAGG-TGGTCCTGAGACCT-GACAAGCACT
+GCTAGGCGAGTGCCAGGACTCCCCAGGCCAGGCCACCAGGATGGCCCTTCCCACTGGAGG
+TCACATTCAGGAAGATGAAAGAGGAGGTTTGGGGTCTGCCACCATCCTGCTGCTGTGTTT
+TTGCTATCACACAGTGGGTGGTGGATCTGTCCAAGGAAACTTGAATCAAAGCAGTTAAC-
+TTTAAGactgagcacctgcttcatgctcagccctgactggtgctataggctggagaagct
+cacccaataaacattaagatt-gaggcctgccctcagggatcttgcattcccagtggTCA
+AACC-GCACTCACCCATGTGCCAAGGTGGGGTA-TTTACCACAGCAG--CTGAACAGCCA
+AATGCATGGTGCAGTTGACAGCAGGTGGGAAATGGTATGAGCTGAGGGGGGCCGTGCCCA
+GGGGCCCACAGG-GAACCCTGCTTGCACTTTGTAACATGTTTA-----CTTTTCagggca
+tcttagctt---ctatta-----tagccacatccctttga---aacaagataactgagaa
+tttaaaaataagaa-----aata--TGACCCCAAAGAGCCTGGAGAAGCTGATGCTTTGC
+TTCAAATCCATCCAGAATAAAACGCAGACCCCAAAGAGCCTGGAGAAGCTGATGCTTTGC
+TTCAAATCCATCCAGAATAAAACGCAGATGCTTTGCTTCAAATCCATCCAGAATAAAACG
+CAAATGACCCCAAAGAGCCTGGAGAAGCTGATGCTTTGCTTCAAATCCATCCAGAATAAA
+ACGCATGACCCCAAAGAGCCTGGAGAAGCTGATGCTTTGCTTCAAATCCATCCAGAATAA
+AACGCAGACCCCAAAGAGCCTGGAGAAGCTGATGCTTTGCTTCAAATCCATCCAGAATAA
+AACGCAGATGCTTTGCTTCAAATCCATCCAGAATAAAACGCAGACCCCAAAGAGCCTGGA
+GAAGCTGATGCTTTGCTTCAAATCCATCCAGAATAAAACGCAGACCCCAAAGAGCCTGGA
+GAAGCTGATGCTTTGCTTCAAATCCATCCAGAATAAAACGCAGACCCCAAAGAGCCTGGA
+GAAGCTGATGCTTTGCTTCAAATCCATCCAGAATAAAACGCAGATGCTTTGCTTCAAATC
+CATCCAGAATAAAACGCAgttcgatgcctaaaataccttcttttgtccctacacagacca
+cagttttcctaatggctttacaccgactagaaattcttgtgcaagcactaattgaaagcg
+gttggcctagagtgttaccggtttgtatagctgagcgcgtctcttgccctgatcaaaggt
+tcattttctctactttggaagacgttgtggaagaatacaacaagtacgagtctctccccc
+ctggtttgctgattactggatacagttgtaatacccttcgcaacaccgcgtaactatcta
+tatgaattattttccctttattatatgtagtaggttcgtctttaatcttcctttagcaag
+tcttttactgttttcgacctcaatgttcatgttcttaggttgttttggataatatgcggt
+cagtttaatcttcgttgtttcttcttaaaatatttattcatggtttaatttttggtttgt
+acttgttcaggggccagttcattatttactctgtttgtatacagcagttcttttattttt
+agtatgattttaatttaaaacaattctaatggtcaaaaa
diff --git a/tools/emboss_5/test-data/emboss_patmatdb_out.tabular b/tools/emboss_5/test-data/emboss_patmatdb_out.tabular
new file mode 100644
index 00000000000..439fcb729b7
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_patmatdb_out.tabular
@@ -0,0 +1,41 @@
+SeqName Start End Score Strand
+Sequence 560 561 2 +
+Sequence 559 560 2 +
+Sequence 558 559 2 +
+Sequence 557 558 2 +
+Sequence 550 551 2 +
+Sequence 544 545 2 +
+Sequence 541 542 2 +
+Sequence 540 541 2 +
+Sequence 539 540 2 +
+Sequence 534 535 2 +
+Sequence 449 450 2 +
+Sequence 431 432 2 +
+Sequence 430 431 2 +
+Sequence 429 430 2 +
+Sequence 409 410 2 +
+Sequence 393 394 2 +
+Sequence 364 365 2 +
+Sequence 340 341 2 +
+Sequence 326 327 2 +
+Sequence 287 288 2 +
+Sequence 274 275 2 +
+Sequence 264 265 2 +
+Sequence 252 253 2 +
+Sequence 204 205 2 +
+Sequence 201 202 2 +
+Sequence 196 197 2 +
+Sequence 193 194 2 +
+Sequence 181 182 2 +
+Sequence 158 159 2 +
+Sequence 157 158 2 +
+Sequence 98 99 2 +
+Sequence 97 98 2 +
+Sequence 92 93 2 +
+Sequence 85 86 2 +
+Sequence 74 75 2 +
+Sequence 73 74 2 +
+Sequence 53 54 2 +
+Sequence 14 15 2 +
+Sequence 13 14 2 +
+Sequence 12 13 2 +
diff --git a/tools/emboss_5/test-data/emboss_pepcoil_out.pepcoil b/tools/emboss_5/test-data/emboss_pepcoil_out.pepcoil
new file mode 100644
index 00000000000..490ea2e870b
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_pepcoil_out.pepcoil
@@ -0,0 +1,6 @@
+PEPCOIL of Sequence
+ using a window of 28 residues
+
+
+Other structures from 1 to 561 (561 residues)
+ Max score: 0.827 (probability 0.00)
diff --git a/tools/emboss_5/test-data/emboss_pepstats_out.pepstats b/tools/emboss_5/test-data/emboss_pepstats_out.pepstats
new file mode 100644
index 00000000000..a9af4eb89e2
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_pepstats_out.pepstats
@@ -0,0 +1,48 @@
+PEPSTATS of Sequence from 1 to 561
+
+Molecular weight = 48582.66 Residues = 561
+Average Residue Weight = 86.600 Charge = 0.0
+Isoelectric Point = 5.0278
+A280 Molar Extinction Coefficient = 0
+A280 Extinction Coefficient 1mg/ml = 0.00
+Improbability of expression in inclusion bodies = 0.520
+
+Residue Number Mole% DayhoffStat
+A = Ala 135 24.064 2.798
+B = Asx 0 0.000 0.000
+C = Cys 106 18.895 6.515
+D = Asp 0 0.000 0.000
+E = Glu 0 0.000 0.000
+F = Phe 0 0.000 0.000
+G = Gly 98 17.469 2.080
+H = His 0 0.000 0.000
+I = Ile 0 0.000 0.000
+J = --- 0 0.000 0.000
+K = Lys 0 0.000 0.000
+L = Leu 0 0.000 0.000
+M = Met 0 0.000 0.000
+N = Asn 0 0.000 0.000
+O = --- 0 0.000 0.000
+P = Pro 0 0.000 0.000
+Q = Gln 0 0.000 0.000
+R = Arg 0 0.000 0.000
+S = Ser 0 0.000 0.000
+T = Thr 222 39.572 6.487
+U = --- 0 0.000 0.000
+V = Val 0 0.000 0.000
+W = Trp 0 0.000 0.000
+X = Xaa 0 0.000 0.000
+Y = Tyr 0 0.000 0.000
+Z = Glx 0 0.000 0.000
+
+Property Residues Number Mole%
+Tiny (A+C+G+S+T) 561 100.000
+Small (A+B+C+D+G+N+P+S+T+V) 561 100.000
+Aliphatic (A+I+L+V) 135 24.064
+Aromatic (F+H+W+Y) 0 0.000
+Non-polar (A+C+F+G+I+L+M+P+V+W+Y) 339 60.428
+Polar (D+E+H+K+N+Q+R+S+T+Z) 222 39.572
+Charged (B+D+E+H+K+R+Z) 0 0.000
+Basic (H+K+R) 0 0.000
+Acidic (B+D+E+Z) 0 0.000
+
diff --git a/tools/emboss_5/test-data/emboss_plotorf_out.png b/tools/emboss_5/test-data/emboss_plotorf_out.png
new file mode 100644
index 00000000000..ffb3ce374d8
Binary files /dev/null and b/tools/emboss_5/test-data/emboss_plotorf_out.png differ
diff --git a/tools/emboss_5/test-data/emboss_plotorf_out1.png b/tools/emboss_5/test-data/emboss_plotorf_out1.png
new file mode 100644
index 00000000000..ffb3ce374d8
Binary files /dev/null and b/tools/emboss_5/test-data/emboss_plotorf_out1.png differ
diff --git a/tools/emboss_5/test-data/emboss_polydot_out.png b/tools/emboss_5/test-data/emboss_polydot_out.png
new file mode 100644
index 00000000000..a9dd751f6a6
Binary files /dev/null and b/tools/emboss_5/test-data/emboss_polydot_out.png differ
diff --git a/tools/emboss_5/test-data/emboss_prettyseq_out.prettyseq b/tools/emboss_5/test-data/emboss_prettyseq_out.prettyseq
new file mode 100644
index 00000000000..f074ab87632
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_prettyseq_out.prettyseq
@@ -0,0 +1,42 @@
+PRETTYSEQ of Sequence from 1 to 561
+
+ ---------|---------|---------|---------|---------|---------|
+ 1 gttcgatgcctaaaataccttcttttgtccctacacagaccacagttttcctaatggctt 60
+ 1 V R C L K Y L L L S L H R P Q F S * W L 2
+
+ ---------|---------|---------|---------|---------|---------|
+ 61 tacaccgactagaaattcttgtgcaagcactaattgaaagcggttggcctagagtgttac 120
+ 3 Y T D * K F L C K H * L K A V G L E C Y 9
+
+ ---------|---------|---------|---------|---------|---------|
+ 121 cggtttgtatagctgagcgcgtctcttgccctgatcaaaggttcattttctctactttgg 180
+ 10 R F V * L S A S L A L I K G S F S L L W 16
+
+ ---------|---------|---------|---------|---------|---------|
+ 181 aagacgttgtggaagaatacaacaagtacgagtctctcccccctggtttgctgattactg 240
+ 17 K T L W K N T T S T S L S P L V C * L L 2
+
+ ---------|---------|---------|---------|---------|---------|
+ 241 gatacagttgtaatacccttcgcaacaccgcgtaactatctatatgaattattttccctt 300
+ 3 D T V V I P F A T P R N Y L Y E L F S L 22
+
+ ---------|---------|---------|---------|---------|---------|
+ 301 tattatatgtagtaggttcgtctttaatcttcctttagcaagtcttttactgttttcgac 360
+ 23 Y Y M * * V R L * S S F S K S F T V F D 11
+
+ ---------|---------|---------|---------|---------|---------|
+ 361 ctcaatgttcatgttcttaggttgttttggataatatgcggtcagtttaatcttcgttgt 420
+ 12 L N V H V L R L F W I I C G Q F N L R C 31
+
+ ---------|---------|---------|---------|---------|---------|
+ 421 ttcttcttaaaatatttattcatggtttaatttttggtttgtacttgttcaggggccagt 480
+ 32 F F L K Y L F M V * F L V C T C S G A S 10
+
+ ---------|---------|---------|---------|---------|---------|
+ 481 tcattatttactctgtttgtatacagcagttcttttatttttagtatgattttaatttaa 540
+ 11 S L F T L F V Y S S S F I F S M I L I * 29
+
+ ---------|---------|-
+ 541 aacaattctaatggtcaaaaa 561
+ 1 N N S N G Q K 7
+
diff --git a/tools/emboss_5/test-data/emboss_primersearch.fasta b/tools/emboss_5/test-data/emboss_primersearch.fasta
new file mode 100644
index 00000000000..0830046bf31
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_primersearch.fasta
@@ -0,0 +1,7 @@
+# This is my primer file
+D1S243 cacacaggctcacatgcc gctccagcgtcatggact
+D1S468 aattaaccgttttggtcct gcgacacacacttccc
+D1S2845 ccaaagggtgcttctc gtggcattccaacctc
+D1S1608 gatggcttttggggactatt cactgagccaagtgacacag
+D1S2893 aaaacatcaactctcccctg ctcaaaccccaataagcctt
+D1S2660 cacacatgcacatgcac agtgacaccagcaggg
diff --git a/tools/emboss_5/test-data/emboss_primersearch_out.primersearch b/tools/emboss_5/test-data/emboss_primersearch_out.primersearch
new file mode 100644
index 00000000000..776748d9af5
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_primersearch_out.primersearch
@@ -0,0 +1,12 @@
+
+Primer name D1S243
+
+Primer name D1S468
+
+Primer name D1S2845
+
+Primer name D1S1608
+
+Primer name D1S2893
+
+Primer name D1S2660
diff --git a/tools/emboss_5/test-data/emboss_revseq_out.fasta b/tools/emboss_5/test-data/emboss_revseq_out.fasta
new file mode 100644
index 00000000000..01820aacbcd
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_revseq_out.fasta
@@ -0,0 +1,11 @@
+>Sequence 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+tttttgaccattagaattgttttaaattaaaatcatactaaaaataaaagaactgctgta
+tacaaacagagtaaataatgaactggcccctgaacaagtacaaaccaaaaattaaaccat
+gaataaatattttaagaagaaacaacgaagattaaactgaccgcatattatccaaaacaa
+cctaagaacatgaacattgaggtcgaaaacagtaaaagacttgctaaaggaagattaaag
+acgaacctactacatataataaagggaaaataattcatatagatagttacgcggtgttgc
+gaagggtattacaactgtatccagtaatcagcaaaccaggggggagagactcgtacttgt
+tgtattcttccacaacgtcttccaaagtagagaaaatgaacctttgatcagggcaagaga
+cgcgctcagctatacaaaccggtaacactctaggccaaccgctttcaattagtgcttgca
+caagaatttctagtcggtgtaaagccattaggaaaactgtggtctgtgtagggacaaaag
+aaggtattttaggcatcgaac
diff --git a/tools/emboss_5/test-data/emboss_seqmatchall_out.fasta b/tools/emboss_5/test-data/emboss_seqmatchall_out.fasta
new file mode 100644
index 00000000000..450d9a181eb
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_seqmatchall_out.fasta
@@ -0,0 +1,3 @@
+
+#---------------------------------------
+#---------------------------------------
diff --git a/tools/emboss_5/test-data/emboss_seqret_out.fasta b/tools/emboss_5/test-data/emboss_seqret_out.fasta
new file mode 100644
index 00000000000..ac2f256f675
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_seqret_out.fasta
@@ -0,0 +1,11 @@
+>Sequence 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+gttcgatgcctaaaataccttcttttgtccctacacagaccacagttttcctaatggctt
+tacaccgactagaaattcttgtgcaagcactaattgaaagcggttggcctagagtgttac
+cggtttgtatagctgagcgcgtctcttgccctgatcaaaggttcattttctctactttgg
+aagacgttgtggaagaatacaacaagtacgagtctctcccccctggtttgctgattactg
+gatacagttgtaatacccttcgcaacaccgcgtaactatctatatgaattattttccctt
+tattatatgtagtaggttcgtctttaatcttcctttagcaagtcttttactgttttcgac
+ctcaatgttcatgttcttaggttgttttggataatatgcggtcagtttaatcttcgttgt
+ttcttcttaaaatatttattcatggtttaatttttggtttgtacttgttcaggggccagt
+tcattatttactctgtttgtatacagcagttcttttatttttagtatgattttaatttaa
+aacaattctaatggtcaaaaa
diff --git a/tools/emboss_5/test-data/emboss_sigcleave_out.tabular b/tools/emboss_5/test-data/emboss_sigcleave_out.tabular
new file mode 100644
index 00000000000..bb5daf9fd91
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_sigcleave_out.tabular
@@ -0,0 +1,6 @@
+SeqName Start End Score Strand mature_peptide
+Sequence 27 39 5.175 + CCACAGTTTTCCTAATGGCTTTACACCGACTAGAAATTCTTGTGCAAGCA
+Sequence 253 265 4.809 + CACCGCGTAACTATCTATATGAATTATTTTCCCTTTATTATATGTAGTAG
+Sequence 29 41 4.790 + ACAGTTTTCCTAATGGCTTTACACCGACTAGAAATTCTTGTGCAAGCACT
+Sequence 541 553 3.820 + GTCAAAAA
+Sequence 30 42 3.530 + CAGTTTTCCTAATGGCTTTACACCGACTAGAAATTCTTGTGCAAGCACTA
diff --git a/tools/emboss_5/test-data/emboss_sirna_out.fasta b/tools/emboss_5/test-data/emboss_sirna_out.fasta
new file mode 100644
index 00000000000..1998b4f50b3
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_sirna_out.fasta
@@ -0,0 +1,158 @@
+>Sequence_92 %GC 50.0 Score 9 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+aattgaaagcggttggcctagag
+>Sequence_53 %GC 45.0 Score 8 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+aatggctttacaccgactagaaa
+>Sequence_97 %GC 55.0 Score 8 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+aaagcggttggcctagagtgtta
+>Sequence_98 %GC 55.0 Score 8 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+aagcggttggcctagagtgttac
+>Sequence_201 %GC 55.0 Score 8 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+aacaagtacgagtctctcccccc
+>Sequence_14 %GC 40.0 Score 7 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+aataccttcttttgtccctacac
+>Sequence_85 %GC 40.0 Score 7 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+aagcactaattgaaagcggttgg
+>Sequence_181 %GC 40.0 Score 7 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+aagacgttgtggaagaatacaac
+>Sequence_196 %GC 40.0 Score 7 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+aatacaacaagtacgagtctctc
+>Sequence_204 %GC 60.0 Score 7 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+aagtacgagtctctcccccctgg
+>Sequence_252 %GC 60.0 Score 7 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+aatacccttcgcaacaccgcgta
+>Sequence_264 %GC 40.0 Score 7 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+aacaccgcgtaactatctatatg
+>Sequence_38 %GC 45.0 Score 6 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+gaccacagttttcctaatggctt
+>Sequence_73 %GC 35.0 Score 6 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+aaattcttgtgcaagcactaatt
+>Sequence_96 %GC 55.0 Score 6 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+gaaagcggttggcctagagtgtt
+>Sequence_118 %GC 50.0 Score 6 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+taccggtttgtatagctgagcgc
+>Sequence_200 %GC 50.0 Score 6 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+caacaagtacgagtctctccccc
+>Sequence_326 %GC 35.0 Score 6 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+aatcttcctttagcaagtctttt
+>Sequence_364 %GC 35.0 Score 6 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+aatgttcatgttcttaggttgtt
+>Sequence_12 %GC 35.0 Score 5 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+aaaataccttcttttgtccctac
+>Sequence_13 %GC 35.0 Score 5 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+aaataccttcttttgtccctaca
+>Sequence_16 %GC 45.0 Score 5 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+taccttcttttgtccctacacag
+>Sequence_32 %GC 45.0 Score 5 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+tacacagaccacagttttcctaa
+>Sequence_52 %GC 45.0 Score 5 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+taatggctttacaccgactagaa
+>Sequence_74 %GC 35.0 Score 5 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+aattcttgtgcaagcactaattg
+>Sequence_88 %GC 45.0 Score 5 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+cactaattgaaagcggttggcct
+>Sequence_91 %GC 45.0 Score 5 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+taattgaaagcggttggcctaga
+>Sequence_128 %GC 55.0 Score 5 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+tatagctgagcgcgtctcttgcc
+>Sequence_173 %GC 45.0 Score 5 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+tactttggaagacgttgtggaag
+>Sequence_193 %GC 35.0 Score 5 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+aagaatacaacaagtacgagtct
+>Sequence_198 %GC 45.0 Score 5 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+tacaacaagtacgagtctctccc
+>Sequence_243 %GC 45.0 Score 5 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+tacagttgtaatacccttcgcaa
+>Sequence_251 %GC 55.0 Score 5 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+taatacccttcgcaacaccgcgt
+>Sequence_313 %GC 40.0 Score 5 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+taggttcgtctttaatcttcctt
+>Sequence_340 %GC 35.0 Score 5 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+aagtcttttactgttttcgacct
+>Sequence_393 %GC 35.0 Score 5 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+aatatgcggtcagtttaatcttc
+>Sequence_489 %GC 40.0 Score 5 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+tactctgtttgtatacagcagtt
+>Sequence_34 %GC 40.0 Score 4 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+cacagaccacagttttcctaatg
+>Sequence_36 %GC 40.0 Score 4 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+cagaccacagttttcctaatggc
+>Sequence_61 %GC 40.0 Score 4 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+tacaccgactagaaattcttgtg
+>Sequence_63 %GC 40.0 Score 4 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+caccgactagaaattcttgtgca
+>Sequence_70 %GC 40.0 Score 4 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+tagaaattcttgtgcaagcacta
+>Sequence_84 %GC 40.0 Score 4 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+caagcactaattgaaagcggttg
+>Sequence_110 %GC 40.0 Score 4 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+tagagtgttaccggtttgtatag
+>Sequence_112 %GC 40.0 Score 4 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+gagtgttaccggtttgtatagct
+>Sequence_135 %GC 60.0 Score 4 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+gagcgcgtctcttgccctgatca
+>Sequence_180 %GC 40.0 Score 4 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+gaagacgttgtggaagaatacaa
+>Sequence_183 %GC 40.0 Score 4 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+gacgttgtggaagaatacaacaa
+>Sequence_203 %GC 60.0 Score 4 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+caagtacgagtctctcccccctg
+>Sequence_210 %GC 60.0 Score 4 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+gagtctctcccccctggtttgct
+>Sequence_245 %GC 40.0 Score 4 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+cagttgtaatacccttcgcaaca
+>Sequence_254 %GC 60.0 Score 4 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+tacccttcgcaacaccgcgtaac
+>Sequence_263 %GC 40.0 Score 4 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+caacaccgcgtaactatctatat
+>Sequence_266 %GC 40.0 Score 4 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+caccgcgtaactatctatatgaa
+>Sequence_348 %GC 40.0 Score 4 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+tactgttttcgacctcaatgttc
+>Sequence_395 %GC 40.0 Score 4 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+tatgcggtcagtttaatcttcgt
+>Sequence_157 %GC 30.0 Score 3 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+aaaggttcattttctctactttg
+>Sequence_158 %GC 30.0 Score 3 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+aaggttcattttctctactttgg
+>Sequence_207 %GC 65.0 Score 3 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+tacgagtctctcccccctggttt
+>Sequence_325 %GC 35.0 Score 3 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+taatcttcctttagcaagtcttt
+>Sequence_392 %GC 35.0 Score 3 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+taatatgcggtcagtttaatctt
+>Sequence_409 %GC 30.0 Score 3 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+aatcttcgttgtttcttcttaaa
+>Sequence_11 %GC 35.0 Score 2 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+taaaataccttcttttgtcccta
+>Sequence_41 %GC 35.0 Score 2 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+cacagttttcctaatggctttac
+>Sequence_43 %GC 35.0 Score 2 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+cagttttcctaatggctttacac
+>Sequence_67 %GC 35.0 Score 2 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+gactagaaattcttgtgcaagca
+>Sequence_72 %GC 35.0 Score 2 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+gaaattcttgtgcaagcactaat
+>Sequence_130 %GC 65.0 Score 2 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+tagctgagcgcgtctcttgccct
+>Sequence_192 %GC 35.0 Score 2 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+gaagaatacaacaagtacgagtc
+>Sequence_195 %GC 35.0 Score 2 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+gaatacaacaagtacgagtctct
+>Sequence_236 %GC 35.0 Score 2 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+tactggatacagttgtaataccc
+>Sequence_241 %GC 35.0 Score 2 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+gatacagttgtaatacccttcgc
+>Sequence_304 %GC 35.0 Score 2 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+tatatgtagtaggttcgtcttta
+>Sequence_306 %GC 35.0 Score 2 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+tatgtagtaggttcgtctttaat
+>Sequence_310 %GC 35.0 Score 2 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+tagtaggttcgtctttaatcttc
+>Sequence_358 %GC 35.0 Score 2 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+gacctcaatgttcatgttcttag
+>Sequence_370 %GC 35.0 Score 2 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+catgttcttaggttgttttggat
+>Sequence_156 %GC 30.0 Score 1 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+caaaggttcattttctctacttt
+>Sequence_403 %GC 30.0 Score 1 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+cagtttaatcttcgttgtttctt
diff --git a/tools/emboss_5/test-data/emboss_sixpack_out2.sixpack b/tools/emboss_5/test-data/emboss_sixpack_out2.sixpack
new file mode 100644
index 00000000000..c0fbbc7d9a3
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_sixpack_out2.sixpack
@@ -0,0 +1,134 @@
+
+
+ V R C L K Y L L L S L H R P Q F S * W L F1
+ F D A * N T F F C P Y T D H S F P N G F F2
+ S M P K I P S F V P T Q T T V F L M A L F3
+ gttcgatgcctaaaataccttcttttgtccctacacagaccacagttttcctaatggctt
+ 10 20 30 40 50 60
+ ----:----|----:----|----:----|----:----|----:----|----:----|
+ caagctacggattttatggaagaaaacagggatgtgtctggtgtcaaaaggattaccgaa
+ T R H R F Y R R K D R C L G C N E * H S F6
+ X E I G L I G E K T G V C V V T K R I A F5
+ N S A * F V K K Q G * V S W L K G L P K F4
+
+
+ Y T D * K F L C K H * L K A V G L E C Y F1
+ T P T R N S C A S T N * K R L A * S V T F2
+ H R L E I L V Q A L I E S G W P R V L P F3
+ tacaccgactagaaattcttgtgcaagcactaattgaaagcggttggcctagagtgttac
+ 70 80 90 100 110 120
+ ----:----|----:----|----:----|----:----|----:----|----:----|
+ atgtggctgatctttaagaacacgttcgtgattaactttcgccaaccggatctcacaatg
+ * V S * F N K H L C * N F A T P R S H * F6
+ K C R S S I R T C A S I S L P Q G L T N F5
+ V G V L F E Q A L V L Q F R N A * L T V F4
+
+
+ R F V * L S A S L A L I K G S F S L L W F1
+ G L Y S * A R L L P * S K V H F L Y F G F2
+ V C I A E R V S C P D Q R F I F S T L E F3
+ cggtttgtatagctgagcgcgtctcttgccctgatcaaaggttcattttctctactttgg
+ 130 140 150 160 170 180
+ ----:----|----:----|----:----|----:----|----:----|----:----|
+ gccaaacatatcgactcgcgcagagaacgggactagtttccaagtaaaagagatgaaacc
+ R N T Y S L A D R A R I L P E N E R S Q F6
+ G T Q I A S R T E Q G S * L N M K E V K F5
+ P K Y L Q A R R K G Q D F T * K R * K P F4
+
+
+ K T L W K N T T S T S L S P L V C * L L F1
+ R R C G R I Q Q V R V S P P W F A D Y W F2
+ D V V E E Y N K Y E S L P P G L L I T G F3
+ aagacgttgtggaagaatacaacaagtacgagtctctcccccctggtttgctgattactg
+ 190 200 210 220 230 240
+ ----:----|----:----|----:----|----:----|----:----|----:----|
+ ttctgcaacaccttcttatgttgttcatgctcagagaggggggaccaaacgactaatgac
+ F V N H F F V V L V L R E G R T Q Q N S F6
+ S S T T S S Y L L Y S D R G G P K S I V F5
+ L R Q P L I C C T R T E G G Q N A S * Q F4
+
+
+ D T V V I P F A T P R N Y L Y E L F S L F1
+ I Q L * Y P S Q H R V T I Y M N Y F P F F2
+ Y S C N T L R N T A * L S I * I I F P L F3
+ gatacagttgtaatacccttcgcaacaccgcgtaactatctatatgaattattttccctt
+ 250 260 270 280 290 300
+ ----:----|----:----|----:----|----:----|----:----|----:----|
+ ctatgtcaacattatgggaagcgttgtggcgcattgatagatatacttaataaaagggaa
+ S V T T I G K A V G R L * R Y S N N E R F6
+ P Y L Q L V R R L V A Y S D I H I I K G F5
+ I C N Y Y G E C C R T V I * I F * K G K F4
+
+
+ Y Y M * * V R L * S S F S K S F T V F D F1
+ I I C S R F V F N L P L A S L L L F S T F2
+ L Y V V G S S L I F L * Q V F Y C F R P F3
+ tattatatgtagtaggttcgtctttaatcttcctttagcaagtcttttactgttttcgac
+ 310 320 330 340 350 360
+ ----:----|----:----|----:----|----:----|----:----|----:----|
+ ataatatacatcatccaagcagaaattagaaggaaatcgttcagaaaatgacaaaagctg
+ * * I Y Y T R R * D E K L L D K V T K S F6
+ K N Y T T P E D K I K R * C T K * Q K R F5
+ I I H L L N T K L R G K A L R K S N E V F4
+
+
+ L N V H V L R L F W I I C G Q F N L R C F1
+ S M F M F L G C F G * Y A V S L I F V V F2
+ Q C S C S * V V L D N M R S V * S S L F F3
+ ctcaatgttcatgttcttaggttgttttggataatatgcggtcagtttaatcttcgttgt
+ 370 380 390 400 410 420
+ ----:----|----:----|----:----|----:----|----:----|----:----|
+ gagttacaagtacaagaatccaacaaaacctattatacgccagtcaaattagaagcaaca
+ R L T * T R L N N Q I I H P * N L R R Q F6
+ G * H E H E * T T K S L I R D T * D E N F5
+ E I N M N K P Q K P Y Y A T L K I K T T F4
+
+
+ F F L K Y L F M V * F L V C T C S G A S F1
+ S S * N I Y S W F N F W F V L V Q G P V F2
+ L L K I F I H G L I F G L Y L F R G Q F F3
+ ttcttcttaaaatatttattcatggtttaatttttggtttgtacttgttcaggggccagt
+ 430 440 450 460 470 480
+ ----:----|----:----|----:----|----:----|----:----|----:----|
+ aagaagaattttataaataagtaccaaattaaaaaccaaacatgaacaagtccccggtca
+ K K K F Y K N M T * N K T Q V Q E P A L F6
+ N R R L I N I * P K I K P K Y K N L P W F5
+ E E * F I * E H N L K Q N T S T * P G T F4
+
+
+ S L F T L F V Y S S S F I F S M I L I * F1
+ H Y L L C L Y T A V L L F L V * F * F K F2
+ I I Y S V C I Q Q F F Y F * Y D F N L K F3
+ tcattatttactctgtttgtatacagcagttcttttatttttagtatgattttaatttaa
+ 490 500 510 520 530 540
+ ----:----|----:----|----:----|----:----|----:----|----:----|
+ agtaataaatgagacaaacatatgtcgtcaagaaaataaaaatcatactaaaattaaatt
+ E N N V R N T Y L L E K I K L I I K I * F6
+ N M I * E T Q I C C N K * K * Y S K L K F5
+ * * K S Q K Y V A T R K N K T H N * N L F4
+
+
+ N N S N G Q K F1
+ T I L M V K X F2
+ Q F * W S K X F3
+ aacaattctaatggtcaaaaa
+ 550 560
+ ----:----|----:----|-
+ ttgttaagattaccagttttt
+ F L E L P * F F6
+ F C N * H D F F5
+ V I R I T L F F4
+
+##############################
+Minimum size of ORFs : 1
+
+Total ORFs in frame 1 : 10
+Total ORFs in frame 2 : 11
+Total ORFs in frame 3 : 8
+Total ORFs in frame 4 : 14
+Total ORFs in frame 5 : 12
+Total ORFs in frame 6 : 14
+
+Total ORFs : 69
+##############################
+
diff --git a/tools/emboss_5/test-data/emboss_skipseq_out.fasta b/tools/emboss_5/test-data/emboss_skipseq_out.fasta
new file mode 100644
index 00000000000..ac2f256f675
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_skipseq_out.fasta
@@ -0,0 +1,11 @@
+>Sequence 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+gttcgatgcctaaaataccttcttttgtccctacacagaccacagttttcctaatggctt
+tacaccgactagaaattcttgtgcaagcactaattgaaagcggttggcctagagtgttac
+cggtttgtatagctgagcgcgtctcttgccctgatcaaaggttcattttctctactttgg
+aagacgttgtggaagaatacaacaagtacgagtctctcccccctggtttgctgattactg
+gatacagttgtaatacccttcgcaacaccgcgtaactatctatatgaattattttccctt
+tattatatgtagtaggttcgtctttaatcttcctttagcaagtcttttactgttttcgac
+ctcaatgttcatgttcttaggttgttttggataatatgcggtcagtttaatcttcgttgt
+ttcttcttaaaatatttattcatggtttaatttttggtttgtacttgttcaggggccagt
+tcattatttactctgtttgtatacagcagttcttttatttttagtatgattttaatttaa
+aacaattctaatggtcaaaaa
diff --git a/tools/emboss_5/test-data/emboss_splitter_out.fasta b/tools/emboss_5/test-data/emboss_splitter_out.fasta
new file mode 100644
index 00000000000..026498633b4
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_splitter_out.fasta
@@ -0,0 +1,11 @@
+>Sequence_1-561 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+gttcgatgcctaaaataccttcttttgtccctacacagaccacagttttcctaatggctt
+tacaccgactagaaattcttgtgcaagcactaattgaaagcggttggcctagagtgttac
+cggtttgtatagctgagcgcgtctcttgccctgatcaaaggttcattttctctactttgg
+aagacgttgtggaagaatacaacaagtacgagtctctcccccctggtttgctgattactg
+gatacagttgtaatacccttcgcaacaccgcgtaactatctatatgaattattttccctt
+tattatatgtagtaggttcgtctttaatcttcctttagcaagtcttttactgttttcgac
+ctcaatgttcatgttcttaggttgttttggataatatgcggtcagtttaatcttcgttgt
+ttcttcttaaaatatttattcatggtttaatttttggtttgtacttgttcaggggccagt
+tcattatttactctgtttgtatacagcagttcttttatttttagtatgattttaatttaa
+aacaattctaatggtcaaaaa
diff --git a/tools/emboss_5/test-data/emboss_supermatcher_out.fasta b/tools/emboss_5/test-data/emboss_supermatcher_out.fasta
new file mode 100644
index 00000000000..0d0591f9ae7
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_supermatcher_out.fasta
@@ -0,0 +1,24 @@
+>hg17
+CCCTAGAGCTTCTGAGCCCTCAACAG--------AGATGAACTGGACTCTCTGCAGCCCC
+ACTCTAAATTC-----------CTAAGAGAGAAGTTGATTGACCCAATCAG-------GG
+TCAGGAGAAGGAAGGGAGGAGGAAAGGGAG---------GAGAGAAGAGCCTCTTCGTCT
+CTTGCCTACCAC--TGGCCAGGCAATTGTAG---------CCAAGGGGGCT-GGAGTGTA
+AATGCAAACATAGCC----------ATCAAGGGTt---gtgtatgtgtgtgtgt------
+----gtgtctgtgtgtgtgtatgtgtgtCTCTTGGGTAGGTTAGATCTCCC---------
+---AGGAGGTCCCTAC--TAAACAGACTTAAGCCCGCAAAA---TTTTA--GCTCTCCAG
+CCTCACACACTCCACCCCTCTAC-----CATA-------TTGAATCTTCCCAAACCAACT
+ATG-GCT---TTCCCTAA-CTCCGGAGcttggcctggaa--------tgccctgcttccc
+ct--ctttcccctgg---ggaacgcctgtccttcaggcctcagttca-----cacactgc
+ctcccttgca-----aagctct
+>Sequence 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+ccctaca----caga-----ccacagttttcctaa-------tgg---ctttaca--ccg
+actagaaattcttgtgcaagcactaattga-aag-cggttggccta--gagtgttaccgg
+tttgta------------tagctgagcgcgtctcttgccctgatcaaaggttcattttct
+ct--------actttgg--aagacgttgtggaagaatacaacaag-----tacgagtctc
+tcccc--------cctggtttgctgattactggatacagt-----------tgtaatacc
+cttcgcaacaccgcgtaactatctatat-------gaa--tta-ttttccctttattata
+tgtagtaggttcgt-ctttaatcttcctttagc------aagtcttttactgttttcga-
+cctca------------atgttcatgttcttaggttgttttggat------------aat
+atgcggtcagtt---taatcttcgttgtttcttcttaaaatatttatt--catggtt---
+-taatttt----tggtttgta---cttg---ttcaggggccagttcattatttactctg-
+----tttgtatacagcagttct
diff --git a/tools/emboss_5/test-data/emboss_syco_out.syco b/tools/emboss_5/test-data/emboss_syco_out.syco
new file mode 100644
index 00000000000..7c8ce1c5bd8
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_syco_out.syco
@@ -0,0 +1,484 @@
+SYCO of Sequence from 1 to 561
+
+
+Frame 1
+Mid base Gribskov value
+46 1.007
+49 1.014
+52 1.012
+55 1.002
+58 1.003
+61 0.997
+64 0.998
+67 0.996
+70 1.005
+73 1.006
+76 1.007
+79 1.020
+82 1.008
+85 1.000
+88 0.995
+91 1.005
+94 1.023
+97 1.011
+100 1.008
+103 1.003
+106 1.017
+109 1.028
+112 1.029
+115 1.019
+118 1.013
+121 1.014
+124 1.003
+127 1.003
+130 0.990
+133 0.981
+136 0.975
+139 0.981
+142 0.983
+145 0.981
+148 0.987
+151 1.000
+154 0.989
+157 0.997
+160 0.995
+163 0.998
+166 0.988
+169 0.981
+172 0.993
+175 1.007
+178 1.016
+181 1.016
+184 0.994
+187 1.006
+190 1.017
+193 1.008
+196 1.016
+199 0.995
+202 0.987
+205 0.982
+208 0.983
+211 0.978
+214 0.989
+217 1.000
+220 1.006
+223 1.013
+226 1.008
+229 0.992
+232 1.002
+235 1.002
+238 0.996
+241 0.987
+244 0.988
+247 0.972
+250 0.966
+253 0.973
+256 0.972
+259 0.968
+262 0.956
+265 0.951
+268 0.942
+271 0.923
+274 0.923
+277 0.907
+280 0.897
+283 0.908
+286 0.888
+289 0.896
+292 0.891
+295 0.911
+298 0.923
+301 0.924
+304 0.914
+307 0.904
+310 0.896
+313 0.901
+316 0.910
+319 0.928
+322 0.918
+325 0.914
+328 0.915
+331 0.911
+334 0.910
+337 0.927
+340 0.926
+343 0.917
+346 0.922
+349 0.920
+352 0.917
+355 0.923
+358 0.917
+361 0.926
+364 0.931
+367 0.937
+370 0.937
+373 0.929
+376 0.930
+379 0.931
+382 0.940
+385 0.915
+388 0.908
+391 0.908
+394 0.899
+397 0.909
+400 0.918
+403 0.904
+406 0.896
+409 0.885
+412 0.884
+415 0.884
+418 0.885
+421 0.889
+424 0.889
+427 0.884
+430 0.892
+433 0.903
+436 0.902
+439 0.906
+442 0.900
+445 0.890
+448 0.893
+451 0.903
+454 0.903
+457 0.899
+460 0.910
+463 0.932
+466 0.935
+469 0.925
+472 0.915
+475 0.926
+478 0.925
+481 0.929
+484 0.943
+487 0.934
+490 0.920
+493 0.925
+496 0.925
+499 0.935
+502 0.936
+505 0.939
+508 0.940
+511 0.936
+514 0.932
+
+
+Frame 2
+Mid base Gribskov value
+47 1.003
+50 0.992
+53 1.002
+56 0.997
+59 1.006
+62 1.005
+65 1.007
+68 0.997
+71 1.001
+74 0.996
+77 0.997
+80 0.982
+83 0.975
+86 0.965
+89 0.971
+92 0.977
+95 0.975
+98 0.968
+101 0.979
+104 0.968
+107 0.978
+110 0.982
+113 0.984
+116 0.994
+119 0.984
+122 0.983
+125 0.984
+128 0.996
+131 1.004
+134 0.986
+137 0.992
+140 0.997
+143 0.980
+146 0.972
+149 0.966
+152 0.971
+155 0.956
+158 0.950
+161 0.943
+164 0.944
+167 0.933
+170 0.944
+173 0.944
+176 0.955
+179 0.949
+182 0.944
+185 0.945
+188 0.952
+191 0.941
+194 0.952
+197 0.946
+200 0.934
+203 0.943
+206 0.935
+209 0.940
+212 0.952
+215 0.953
+218 0.937
+221 0.923
+224 0.934
+227 0.938
+230 0.930
+233 0.936
+236 0.949
+239 0.943
+242 0.944
+245 0.946
+248 0.950
+251 0.954
+254 0.968
+257 0.968
+260 0.962
+263 0.960
+266 0.949
+269 0.943
+272 0.946
+275 0.956
+278 0.963
+281 0.963
+284 0.952
+287 0.947
+290 0.950
+293 0.930
+296 0.934
+299 0.936
+302 0.925
+305 0.915
+308 0.939
+311 0.943
+314 0.928
+317 0.930
+320 0.936
+323 0.941
+326 0.938
+329 0.943
+332 0.949
+335 0.939
+338 0.935
+341 0.934
+344 0.924
+347 0.929
+350 0.929
+353 0.932
+356 0.930
+359 0.934
+362 0.930
+365 0.911
+368 0.916
+371 0.925
+374 0.921
+377 0.917
+380 0.916
+383 0.924
+386 0.922
+389 0.919
+392 0.921
+395 0.930
+398 0.912
+401 0.916
+404 0.920
+407 0.909
+410 0.908
+413 0.908
+416 0.898
+419 0.890
+422 0.880
+425 0.885
+428 0.899
+431 0.907
+434 0.912
+437 0.904
+440 0.901
+443 0.901
+446 0.893
+449 0.897
+452 0.894
+455 0.903
+458 0.890
+461 0.886
+464 0.894
+467 0.894
+470 0.894
+473 0.885
+476 0.884
+479 0.875
+482 0.870
+485 0.879
+488 0.878
+491 0.875
+494 0.875
+497 0.876
+500 0.881
+503 0.878
+506 0.876
+509 0.883
+512 0.891
+515 0.896
+
+
+Frame 3
+Mid base Gribskov value
+48 0.929
+51 0.933
+54 0.930
+57 0.946
+60 0.940
+63 0.947
+66 0.947
+69 0.953
+72 0.968
+75 0.950
+78 0.949
+81 0.939
+84 0.929
+87 0.915
+90 0.910
+93 0.922
+96 0.921
+99 0.931
+102 0.925
+105 0.935
+108 0.945
+111 0.935
+114 0.930
+117 0.940
+120 0.949
+123 0.949
+126 0.960
+129 0.944
+132 0.947
+135 0.943
+138 0.946
+141 0.955
+144 0.949
+147 0.948
+150 0.953
+153 0.950
+156 0.960
+159 0.965
+162 0.958
+165 0.979
+168 0.987
+171 0.991
+174 1.003
+177 1.017
+180 1.018
+183 1.004
+186 0.994
+189 1.008
+192 1.010
+195 0.998
+198 1.002
+201 1.013
+204 1.021
+207 1.012
+210 1.002
+213 1.013
+216 1.001
+219 1.012
+222 1.024
+225 1.037
+228 1.035
+231 1.025
+234 1.028
+237 1.011
+240 1.007
+243 1.016
+246 1.006
+249 0.997
+252 0.999
+255 0.989
+258 0.971
+261 0.962
+264 0.950
+267 0.936
+270 0.931
+273 0.931
+276 0.928
+279 0.907
+282 0.897
+285 0.910
+288 0.915
+291 0.904
+294 0.902
+297 0.899
+300 0.905
+303 0.895
+306 0.905
+309 0.896
+312 0.887
+315 0.877
+318 0.879
+321 0.874
+324 0.875
+327 0.878
+330 0.880
+333 0.871
+336 0.871
+339 0.866
+342 0.853
+345 0.851
+348 0.861
+351 0.870
+354 0.874
+357 0.887
+360 0.892
+363 0.892
+366 0.897
+369 0.897
+372 0.903
+375 0.891
+378 0.881
+381 0.881
+384 0.879
+387 0.884
+390 0.875
+393 0.875
+396 0.866
+399 0.865
+402 0.861
+405 0.852
+408 0.852
+411 0.856
+414 0.852
+417 0.850
+420 0.859
+423 0.859
+426 0.867
+429 0.879
+432 0.893
+435 0.903
+438 0.912
+441 0.913
+444 0.910
+447 0.910
+450 0.908
+453 0.908
+456 0.906
+459 0.905
+462 0.918
+465 0.929
+468 0.939
+471 0.940
+474 0.940
+477 0.939
+480 0.943
+483 0.943
+486 0.942
+489 0.943
+492 0.948
+495 0.948
+498 0.948
+501 0.943
+504 0.958
+507 0.960
+510 0.954
+513 0.956
+516 0.947
diff --git a/tools/emboss_5/test-data/emboss_tranalign_out.fasta b/tools/emboss_5/test-data/emboss_tranalign_out.fasta
new file mode 100644
index 00000000000..871ff0a24cb
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_tranalign_out.fasta
@@ -0,0 +1,45 @@
+>HSFAU1
+cctctttctcgactccatcttcgcggtagctgggaccgccgttcagtcgccaatatgcag
+ctctttgtccgcgcccaggagctacacaccttcgaggtgaccggccaggaaacggtcgcc
+cagatcaaggctcatgtagcctca---ctggagggcattgccccggaagatcaagtcgtg
+ctcctggcaggc---cccctggaggatgaggccactctgggccagtgcggggtggaggcc
+ctgactaccctggaagtagcaggccgcatgcttgga---ggtaaagttcatggttccctg
+gcccgtgctggaaaagtgagaggtcagactcctaaggtggccaaacaggagaagaagaag
+aagaagacaggtcgggctaagcggcggatgcagtacaaccggcgctttgtcaacgttgtg
+cccacctttggcaagaagaagggccccaatgccaactct
+>HSFAU2
+cctctttctcgactccatcttcgcggtagctgggaccgccgttcagtcgccaatatgcag
+ctctttgtccgcgcccaggagctacacaccttcgaggtgaccggccaggaaacggtcgcc
+cagatcaaggctcatgtagcctca---ctggagggcattgccccggaagatcaagtcgtg
+ctcctggcaggcgcgcccctggaggatgcactctgggccagtgcggggtggaggccc---
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---------------------------------------
+>HSFAU3
+cctctttctcgactccatcttcgcggtagctgggaccgccgttcagtcgccaatatgcag
+ctctttgtccgcgcccaggagctacacaccttcgaggtgaccggccaggaaacggtcgcc
+cagatcaaggctcatgtagcctca---ctggagggcattgccccggaagatcaagtcgtg
+ctcctggcaggcgcgcccctggaggatgaggccactctgggccagtgcggggtggaggcc
+ctgactaccctggaagtagcaggccgcatgcttgga---ggtaaagttcatggttccctg
+gcccgtgctggaaaagtgagaggtcagactcctaagggggccaaacaggagaagaagaag
+aagaagacaggtcgggctaagcggcggatgcagtacaaccggcgctttgtcaacgttgtg
+cccacctttggcaagaagaagggccccaatgccaactct
+>HSFAU4
+cctctttctcgactccatcttcgcggtagctgggaccgccgttcagtcgccaatatgcag
+ctctttgtccgcgcccaggagctacacaccttcgaggtgaccggccaggaaacggtcgcc
+cagatcaaggctcatgaaatagcctcactggagggcattgccccggaagatcaagtcgtg
+ctcctggcaggcgcgcccctggaggatgaggccactctgggccagtgcggggtggaggcc
+ctgactaccctggaagtagcaggccgcatgcttgcccgaggtaaagttcatggttccctg
+gcccgtgctggaaaagtgagaggtcagactcctaaggtggccaaacaggagaagaagaag
+aagaagacaggtcgggctaagcggcggatgcagtacaaccggcgctttgtcaacgttgtg
+cccacctttggcaagaagaagggccccaatgccaactct
+>HSFAU5
+cctctttctcgactccatcttcgcggtagctgggaccgccgttcagtcgccaatatgcag
+ctctttgtccgcgcccaggagctacacaccttcgaggtgaccggccaggaaacggtcgcc
+cagatcaaggctcatgtagcctca---ctggagggcattgccccggaagatcaagtcgtg
+ctcctggcaggcgcgcccctggaggatgaggccactctgggccagtgcggggtggaggcc
+ctgactaccctggaagtaggccgcatgctttttgga---ggtaaagttcatggttccctg
+gcccgtgctggaaaagtgagaggtcagactcctaaggtggccaaacaggagaagaagaag
+aagaagacaggtcgggctaagcggcggatgcagtacaaccggcgctttgtcaacgttgtg
+cccacctttggcaagaagaagggccccaatgccaactct
\ No newline at end of file
diff --git a/tools/emboss_5/test-data/emboss_transeq_out.fasta b/tools/emboss_5/test-data/emboss_transeq_out.fasta
new file mode 100644
index 00000000000..9c39e21c5e2
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_transeq_out.fasta
@@ -0,0 +1,5 @@
+>Sequence_1 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+VRCLKYLLLSLHRPQFS*WLYTD*KFLCKH*LKAVGLECYRFV*LSASLALIKGSFSLLW
+KTLWKNTTSTSLSPLVC*LLDTVVIPFATPRNYLYELFSLYYM**VRL*SSFSKSFTVFD
+LNVHVLRLFWIICGQFNLRCFFLKYLFMV*FLVCTCSGASSLFTLFVYSSSFIFSMILI*
+NNSNGQK
diff --git a/tools/emboss_5/test-data/emboss_trimest_out.fasta b/tools/emboss_5/test-data/emboss_trimest_out.fasta
new file mode 100644
index 00000000000..8d9adee5f49
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_trimest_out.fasta
@@ -0,0 +1,11 @@
+>Sequence 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other; [poly-A tail removed]
+gttcgatgcctaaaataccttcttttgtccctacacagaccacagttttcctaatggctt
+tacaccgactagaaattcttgtgcaagcactaattgaaagcggttggcctagagtgttac
+cggtttgtatagctgagcgcgtctcttgccctgatcaaaggttcattttctctactttgg
+aagacgttgtggaagaatacaacaagtacgagtctctcccccctggtttgctgattactg
+gatacagttgtaatacccttcgcaacaccgcgtaactatctatatgaattattttccctt
+tattatatgtagtaggttcgtctttaatcttcctttagcaagtcttttactgttttcgac
+ctcaatgttcatgttcttaggttgttttggataatatgcggtcagtttaatcttcgttgt
+ttcttcttaaaatatttattcatggtttaatttttggtttgtacttgttcaggggccagt
+tcattatttactctgtttgtatacagcagttcttttatttttagtatgattttaatttaa
+aacaattctaatggtc
diff --git a/tools/emboss_5/test-data/emboss_trimseq_out.fasta b/tools/emboss_5/test-data/emboss_trimseq_out.fasta
new file mode 100644
index 00000000000..ac2f256f675
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_trimseq_out.fasta
@@ -0,0 +1,11 @@
+>Sequence 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+gttcgatgcctaaaataccttcttttgtccctacacagaccacagttttcctaatggctt
+tacaccgactagaaattcttgtgcaagcactaattgaaagcggttggcctagagtgttac
+cggtttgtatagctgagcgcgtctcttgccctgatcaaaggttcattttctctactttgg
+aagacgttgtggaagaatacaacaagtacgagtctctcccccctggtttgctgattactg
+gatacagttgtaatacccttcgcaacaccgcgtaactatctatatgaattattttccctt
+tattatatgtagtaggttcgtctttaatcttcctttagcaagtcttttactgttttcgac
+ctcaatgttcatgttcttaggttgttttggataatatgcggtcagtttaatcttcgttgt
+ttcttcttaaaatatttattcatggtttaatttttggtttgtacttgttcaggggccagt
+tcattatttactctgtttgtatacagcagttcttttatttttagtatgattttaatttaa
+aacaattctaatggtcaaaaa
diff --git a/tools/emboss_5/test-data/emboss_union_out.fasta b/tools/emboss_5/test-data/emboss_union_out.fasta
new file mode 100644
index 00000000000..ac2f256f675
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_union_out.fasta
@@ -0,0 +1,11 @@
+>Sequence 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+gttcgatgcctaaaataccttcttttgtccctacacagaccacagttttcctaatggctt
+tacaccgactagaaattcttgtgcaagcactaattgaaagcggttggcctagagtgttac
+cggtttgtatagctgagcgcgtctcttgccctgatcaaaggttcattttctctactttgg
+aagacgttgtggaagaatacaacaagtacgagtctctcccccctggtttgctgattactg
+gatacagttgtaatacccttcgcaacaccgcgtaactatctatatgaattattttccctt
+tattatatgtagtaggttcgtctttaatcttcctttagcaagtcttttactgttttcgac
+ctcaatgttcatgttcttaggttgttttggataatatgcggtcagtttaatcttcgttgt
+ttcttcttaaaatatttattcatggtttaatttttggtttgtacttgttcaggggccagt
+tcattatttactctgtttgtatacagcagttcttttatttttagtatgattttaatttaa
+aacaattctaatggtcaaaaa
diff --git a/tools/emboss_5/test-data/emboss_water_out.fasta b/tools/emboss_5/test-data/emboss_water_out.fasta
new file mode 100644
index 00000000000..34074586663
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_water_out.fasta
@@ -0,0 +1,32 @@
+>hg17
+GTTTGAAGTTGAGATGTGGGTACAATACCATAGCTTTATTC------CAGAGCAGGGTAT
+TTGTTTCCAAATGCCATGTTCCCAGCAGCTGCCCTTGACTGGGAATTGGGGTGTGATTTG
+GGCTTTT-----CCTTAAATCCTTGAGGAGCTGGAGGGGTGGGTGGCTCGCACTCCTGCT
+TTctggatctgaatcctgactctgtcatggacctgtttgactttgggcaagttgactcct
+attcctgagccccatatttttctcttctgtgaaattcagattaaaaAAACATGGCTTTGA
+TCAAA----CATTATAAATAATATATAGACAGACTGCTTGTTTTTATTGTATTGCCAGAA
+ATGAATCCTACTAATA-------------------TTGC-CATCTA-TGG--ACAGAAAA
+TGTATTACCTGTCTTCATCAAGACCCAGACGAGGAAGAACACGAAAAGCGGA--------
+---GATTAATTTTACTGCC-------ATCTCCAGAA---CCGTCATCCTAATATTTACTT
+A-CA----TTTTATTATTATTTCAGGCTC-ATGCACATATACTTAG-----CATGGATCA
+T-TGGCCACAGACTCGCATACATTTAA-CTTTATTACCTTTTGCCTCATGTATCTCATTA
+AAATTTTGCTGCTTAATCAAGGATCTGCATATTATTTTAATTTTAGAATTCACAGTTCCA
+AGACTTTGAAAGTTTCAAGCGTTCTGGGTGaatgtgttatgctctctcccgcca--ccat
+gtctttataccccctgatttct---cagccactatggcaaccactttctactcttagta-
+gcccat----atttagtccaatccccagctcaggagacacttct
+>Sequence 561 BP; 135 A; 106 C; 98 G; 222 T; 0 other;
+gttcga----------tgcctaaaatacctt--cttttgtccctacacagaccacagt--
+---tttcctaatggc---tttacacc----------gactagaaatt-------------
+--cttgtgcaagcactaa----ttga-aagc---------ggttggc-------------
+--ctaga--------------gtgt----taccggtttg--------------------t
+atagctgagcgc-------gtctctt---------------------------gccctga
+tcaaaggttcattttctctact---ttggaagac-----------gttgt-------gga
+a-gaatacaacaagtacgagtctctcccccctggtttgctgat-tactggatacag---t
+tgtaatacc---cttc-gcaacacc----------------------gcgtaactatcta
+tatgaattatttt----ccctttattatatgtagtaggttcgtctt--taatcttccttt
+agcaagtcttttactgt--tttcgacctcaatgttcatgttcttaggttgttttggataa
+tatgcggtcag-----------tttaatcttcgt--------------tgtttcttctta
+aaatat------ttattcatgg-------------tttaatttttggttt----gt----
+--actt--------------gttcaggg----------------------gccagttcat
+-tattta----ctctg-tttgtatacagc----------agttcttt-tatttttagtat
+g---attttaattta-------------------aaacaattct
diff --git a/tools/emboss_5/test-data/emboss_water_out.score b/tools/emboss_5/test-data/emboss_water_out.score
new file mode 100644
index 00000000000..92f9bf2fa74
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_water_out.score
@@ -0,0 +1,4 @@
+Sequence hg17 884 (610.5)
+
+#---------------------------------------
+#---------------------------------------
diff --git a/tools/emboss_5/test-data/emboss_wobble_out.png b/tools/emboss_5/test-data/emboss_wobble_out.png
new file mode 100644
index 00000000000..5ecc58b0c81
Binary files /dev/null and b/tools/emboss_5/test-data/emboss_wobble_out.png differ
diff --git a/tools/emboss_5/test-data/emboss_wobble_out.wobble b/tools/emboss_5/test-data/emboss_wobble_out.wobble
new file mode 100644
index 00000000000..8fa8f88ec4a
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_wobble_out.wobble
@@ -0,0 +1 @@
+Expected GC content in third position = 36.36
diff --git a/tools/emboss_5/test-data/emboss_wordcount_out.wordcount b/tools/emboss_5/test-data/emboss_wordcount_out.wordcount
new file mode 100644
index 00000000000..56d6c267c64
--- /dev/null
+++ b/tools/emboss_5/test-data/emboss_wordcount_out.wordcount
@@ -0,0 +1,202 @@
+ttta 13
+tttt 13
+tctt 11
+gttt 10
+ttgt 10
+taat 9
+ttct 8
+attt 8
+tttg 8
+gttc 8
+tgtt 8
+ggtt 8
+cttt 8
+aatt 6
+tatt 6
+ttaa 6
+ttat 6
+ttca 5
+ttcg 5
+tttc 5
+cagt 5
+gttg 5
+taca 5
+aata 5
+ccct 5
+agtt 5
+tgta 5
+tact 5
+cttc 5
+atac 5
+ttac 5
+aaaa 5
+atta 4
+tctc 4
+ctaa 4
+gtct 4
+ccta 4
+tata 4
+ctct 4
+cctt 4
+tatg 4
+ttgg 4
+acag 4
+tgga 4
+atat 4
+tcat 4
+tggt 4
+atct 3
+aaat 3
+ttcc 3
+taaa 3
+tcta 3
+attc 3
+tgat 3
+cggt 3
+agca 3
+aaca 3
+cccc 3
+agta 3
+tacc 3
+aatg 3
+caag 3
+cttg 3
+atgg 3
+atgt 3
+acaa 3
+acac 3
+tcaa 3
+aggt 3
+gcaa 3
+ttag 3
+ctga 3
+accg 3
+gtat 3
+acta 3
+tccc 3
+tgaa 2
+tcct 2
+actt 2
+ggaa 2
+gcct 2
+gtca 2
+ctac 2
+gaaa 2
+ctag 2
+gaag 2
+gctg 2
+ggat 2
+ctat 2
+gaat 2
+agcg 2
+tgcc 2
+agtc 2
+aatc 2
+cgac 2
+ggcc 2
+caaa 2
+caac 2
+gacc 2
+cctg 2
+tgtg 2
+caat 2
+ggtc 2
+ctta 2
+gata 2
+atga 2
+atgc 2
+tcga 2
+gatt 2
+gcgg 2
+tcgt 2
+ttgc 2
+gcgt 2
+cgcg 2
+caca 2
+cacc 2
+cgtc 2
+aaga 2
+catg 2
+aagc 2
+cgtt 2
+tcag 2
+catt 2
+aagt 2
+tggc 2
+taga 2
+tagc 2
+tagg 2
+gtaa 2
+ctgg 2
+gtac 2
+gtag 2
+tagt 2
+ctgt 2
+gagt 2
+agaa 2
+agac 2
+acct 2
+aaag 2
+actg 2
+gccc 1
+ccag 1
+tgag 1
+taac 1
+attg 1
+caga 1
+tctg 1
+cagc 1
+gtcc 1
+cagg 1
+gctt 1
+gtta 1
+agct 1
+tgca 1
+aact 1
+tgcg 1
+agtg 1
+tacg 1
+ctca 1
+cgag 1
+ctcc 1
+cctc 1
+tgct 1
+acga 1
+gacg 1
+tgtc 1
+cgat 1
+ggct 1
+tatc 1
+gact 1
+acgt 1
+gatc 1
+tcgc 1
+gatg 1
+gcgc 1
+ttga 1
+cgca 1
+gtgc 1
+gtgg 1
+cgta 1
+gtgt 1
+cact 1
+aggg 1
+ataa 1
+aagg 1
+atag 1
+ccga 1
+ccgc 1
+ccgg 1
+gcac 1
+gcag 1
+gggc 1
+gggg 1
+gagc 1
+acca 1
+accc 1
+atca 1
+agag 1
+aaac 1
+actc 1
+gcca 1
+ccac 1
diff --git a/tools/emboss_5/tool_dependencies.xml b/tools/emboss_5/tool_dependencies.xml
new file mode 100644
index 00000000000..1a92a32183c
--- /dev/null
+++ b/tools/emboss_5/tool_dependencies.xml
@@ -0,0 +1,6 @@
+
+
+
+
+
+
diff --git a/tools/fastqc/.shed.yml b/tools/fastqc/.shed.yml
new file mode 100644
index 00000000000..38726ef9760
--- /dev/null
+++ b/tools/fastqc/.shed.yml
@@ -0,0 +1,14 @@
+categories:
+- Fastq Manipulation
+description: Read QC reports using FastQC
+homepage_url: http://www.bioinformatics.bbsrc.ac.uk/projects/fastqc/
+long_description: |
+ FastQC aims to provide a simple way to do some quality control
+ checks on raw sequence data coming from high throughput sequencing pipelines. It
+ provides a modular set of analyses which you can use to give a quick impression
+ of whether your data has any problems of which you should be aware before doing
+ any further analysis.
+name: fastqc
+owner: devteam
+remote_repository_url: https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc
+type: unrestricted
diff --git a/tools/fastqc/rgFastQC.py b/tools/fastqc/rgFastQC.py
new file mode 100644
index 00000000000..76bc1e42fc6
--- /dev/null
+++ b/tools/fastqc/rgFastQC.py
@@ -0,0 +1,165 @@
+"""
+Rewrite of rgFastQC.py for Version 0.11.2 of FastQC.
+
+Changes implemented from tmcgowan at
+https://testtoolshed.g2.bx.psu.edu/view/tmcgowan/fastqc
+and iuc at https://toolshed.g2.bx.psu.edu/view/iuc/fastqc
+with minor changes and bug fixes
+
+SYNOPSIS
+
+ rgFastQC.py -i input_file -j input_file.name -o output_html_file [-d output_directory]
+ [-f fastq|bam|sam] [-n job_name] [-c contaminant_file] [-e fastqc_executable]
+
+EXAMPLE (generated by Galaxy)
+
+ rgFastQC.py -i path/dataset_1.dat -j 1000gsample.fastq -o path/dataset_3.dat -d path/job_working_directory/subfolder
+ -f fastq -n FastQC -c path/dataset_2.dat -e fastqc
+"""
+import bz2
+import glob
+import gzip
+import mimetypes
+import optparse
+import os
+import re
+import shutil
+import subprocess
+import tempfile
+import zipfile
+
+
+class FastQCRunner(object):
+ def __init__(self, opts=None):
+ '''
+ Initializes an object to run FastQC in Galaxy. To start the process, use the function run_fastqc()
+ '''
+
+ # Check whether the options are specified and saves them into the object
+ assert opts is not None
+ self.opts = opts
+
+ def prepare_command_line(self):
+ '''
+ Develops the Commandline to run FastQC in Galaxy
+ '''
+
+ # Check whether a given file compression format is valid
+ # This prevents uncompression of already uncompressed files
+ infname = self.opts.inputfilename
+ linf = infname.lower()
+ trimext = False
+ # decompression at upload currently does NOT remove this now bogus ending - fastqc will barf
+ # patched may 29 2013 until this is fixed properly
+ type = mimetypes.guess_type(self.opts.input)
+ if linf.endswith('.gz') or linf.endswith('.gzip') or type[-1] == "gzip":
+ f = gzip.open(self.opts.input)
+ try:
+ f.readline()
+ except:
+ trimext = True
+ f.close()
+ elif linf.endswith('bz2'):
+ f = bz2.open(self.opts.input, 'rb')
+ try:
+ f.readline()
+ except:
+ trimext = True
+ f.close()
+ elif linf.endswith('.zip'):
+ if not zipfile.is_zipfile(self.opts.input):
+ trimext = True
+ if trimext:
+ f = open(self.opts.input)
+ try:
+ f.readline()
+ except:
+ raise Exception("Input file corruption, could not identify the filetype")
+ infname = os.path.splitext(infname)[0]
+
+ # Replace unwanted or problematic characters in the input file name
+ self.fastqinfilename = re.sub(r'[^a-zA-Z0-9_\-\.]', '_', os.path.basename(infname))
+ # check that the symbolic link gets a proper ending, fastqc seems to ignore the given format otherwise
+ if 'fastq' in self.opts.informat:
+ # with fastq the .ext is ignored, but when a format is actually passed it must comply with fastqc's
+ # accepted formats..
+ self.opts.informat = 'fastq'
+ elif not self.fastqinfilename.endswith(self.opts.informat):
+ self.fastqinfilename += '.%s' % self.opts.informat
+
+ # Build the Commandline from the given parameters
+ command_line = [opts.executable, '--outdir %s' % self.opts.outputdir]
+ if self.opts.contaminants is not None:
+ command_line.append('--contaminants %s' % self.opts.contaminants)
+ if self.opts.limits is not None:
+ command_line.append('--limits %s' % self.opts.limits)
+ command_line.append('--quiet')
+ command_line.append('--extract') # to access the output text file
+ if type[-1] != "gzip":
+ command_line.append('-f %s' % self.opts.informat)
+ else:
+ self.fastqinfilename += ".gz"
+ command_line.append(self.fastqinfilename)
+ self.command_line = ' '.join(command_line)
+
+ def copy_output_file_to_dataset(self):
+ '''
+ Retrieves the output html and text files from the output directory and copies them to the Galaxy output files
+ '''
+
+ # retrieve html file
+ result_file = glob.glob(self.opts.outputdir + '/*html')
+ with open(result_file[0], 'rb') as fsrc:
+ with open(self.opts.htmloutput, 'wb') as fdest:
+ shutil.copyfileobj(fsrc, fdest)
+
+ # retrieve text file
+ text_file = glob.glob(self.opts.outputdir + '/*/fastqc_data.txt')
+ with open(text_file[0], 'rb') as fsrc:
+ with open(self.opts.textoutput, 'wb') as fdest:
+ shutil.copyfileobj(fsrc, fdest)
+
+ def run_fastqc(self):
+ '''
+ Executes FastQC. Make sure the mandatory import parameters input, inputfilename, outputdir and htmloutput have been specified in the options
+ '''
+
+ # Create a log file
+ dummy, tlog = tempfile.mkstemp(prefix='rgFastQC', suffix=".log", dir=self.opts.outputdir)
+ sout = open(tlog, 'w')
+
+ self.prepare_command_line()
+ sout.write(self.command_line)
+ sout.write('\n')
+ sout.write("Creating symlink\n") # between the input (.dat) file and the given input file name
+ os.symlink(self.opts.input, self.fastqinfilename)
+ sout.write("check_call\n")
+ subprocess.check_call(self.command_line, shell=True)
+ sout.write("Copying working %s file to %s \n" % (self.fastqinfilename, self.opts.htmloutput))
+ self.copy_output_file_to_dataset()
+ sout.write("Finished")
+ sout.close()
+
+
+if __name__ == '__main__':
+ op = optparse.OptionParser()
+ op.add_option('-i', '--input', default=None)
+ op.add_option('-j', '--inputfilename', default=None)
+ op.add_option('-o', '--htmloutput', default=None)
+ op.add_option('-t', '--textoutput', default=None)
+ op.add_option('-d', '--outputdir', default="/tmp/shortread")
+ op.add_option('-f', '--informat', default='fastq')
+ op.add_option('-n', '--namejob', default='rgFastQC')
+ op.add_option('-c', '--contaminants', default=None)
+ op.add_option('-l', '--limits', default=None)
+ op.add_option('-e', '--executable', default='fastqc')
+ opts, args = op.parse_args()
+
+ assert opts.input is not None
+ assert opts.inputfilename is not None
+ assert opts.htmloutput is not None
+ if not os.path.exists(opts.outputdir):
+ os.makedirs(opts.outputdir)
+
+ fastqc_runner = FastQCRunner(opts)
+ fastqc_runner.run_fastqc()
diff --git a/tools/fastqc/rgFastQC.xml b/tools/fastqc/rgFastQC.xml
new file mode 100644
index 00000000000..e79280e3983
--- /dev/null
+++ b/tools/fastqc/rgFastQC.xml
@@ -0,0 +1,135 @@
+
+ Read Quality reports
+
+ fastqc
+
+
+
+
+
+
+
+ ''
+ -c '$contaminants'
+ #end if
+ #if $limits.dataset and str($limits) > ''
+ -l '$limits'
+ #end if
+ ]]>
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+.. class:: infomark
+
+**Purpose**
+
+FastQC aims to provide a simple way to do some quality control checks on raw
+sequence data coming from high throughput sequencing pipelines.
+It provides a modular set of analyses which you can use to give a quick
+impression of whether your data has any problems of
+which you should be aware before doing any further analysis.
+
+The main functions of FastQC are:
+
+- Import of data from BAM, SAM or FastQ/FastQ.gz files (any variant)
+- Providing a quick overview to tell you in which areas there may be problems
+- Summary graphs and tables to quickly assess your data
+- Export of results to an HTML based permanent report
+- Offline operation to allow automated generation of reports without running the interactive application
+
+-----
+
+.. class:: infomark
+
+**FastQC**
+
+This is a Galaxy wrapper. It merely exposes the external package FastQC_, which is documented at FastQC_.
+Kindly acknowledge it as well as this tool if you use it.
+FastQC incorporates the Picard-tools_ libraries for sam/bam processing.
+
+The contaminants file parameter was borrowed from the independently developed
+fastqcwrapper contributed to the Galaxy Community Tool Shed by J. Johnson.
+Adaptation to version 0.11.2 by T. McGowan.
+
+-----
+
+.. class:: infomark
+
+**Inputs and outputs**
+
+FastQC_ is the best place to look for documentation - it's very good.
+A summary follows below for those in a tearing hurry.
+
+This wrapper will accept a Galaxy fastq, fastq.gz, sam or bam as the input read file to check.
+It will also take an optional file containing a list of contaminants, in the form of
+a tab-delimited file with 2 columns, name and sequence. As another option the tool takes a custom
+limits.txt file that allows setting the warning thresholds for the different modules and also specifies
+which modules to include in the output.
+
+The tool produces a basic text file and an HTML output file that contain all of the results, including the following:
+
+- Basic Statistics
+- Per base sequence quality
+- Per sequence quality scores
+- Per base sequence content
+- Per base GC content
+- Per sequence GC content
+- Per base N content
+- Sequence Length Distribution
+- Sequence Duplication Levels
+- Overrepresented sequences
+- Kmer Content
+
+All except Basic Statistics and Overrepresented sequences are plots.
+ .. _FastQC: http://www.bioinformatics.bbsrc.ac.uk/projects/fastqc/
+ .. _Picard-tools: http://picard.sourceforge.net/index.shtml
+
+
+
+ @unpublished{andrews_s,
+ author = {Andrews, S.},
+ keywords = {bioinformatics, ngs, qc},
+ priority = {2},
+ title = {{FastQC A Quality Control tool for High Throughput Sequence Data}},
+ url = {http://www.bioinformatics.babraham.ac.uk/projects/fastqc/}
+ }
+
+
+
diff --git a/tools/fastqc/test-data/1000gsample.fastq b/tools/fastqc/test-data/1000gsample.fastq
new file mode 100644
index 00000000000..2f37bff4155
--- /dev/null
+++ b/tools/fastqc/test-data/1000gsample.fastq
@@ -0,0 +1,20000 @@
+@ERR005448.1 IL40_2446:5:1:0:964/2
+GTCTCAGCTGCTTAGTCCAATGGCTCCCACACACACAGAAGCATGGCCAGCTCT
++
+40539<=3<.<@@697;A=;79:9<9974.;9:8@=551%0)5+.2%*,02*0)
+@ERR005448.2 IL40_2446:5:1:0:451/2
+ATAAAGACCAGCCTGGCCAATGTGGTGAAACCCTGTCTCTACTAAAAGTACAAA
++
+>?A?<8=AB?:<>@@>8/3>9=;?
+@ERR005448.3 IL40_2446:5:1:0:1205/2
+ATTCTACTCCAACTGATTCCATTCCATTCTATTCCTTTCTATTCCATTTCATTC
++
+?:B7C;6<<;B6/7.09=05973.7864./288235A3&&/244,.056.322.
+@ERR005448.4 IL40_2446:5:1:0:17/2
+CACTTCCAGATACTCCAAAAAGAGTGTTTCCAACCTGCTCTAGTAATGGGAATG
++
+BBBA=<=B6ABA>@7=?>44>8;88=@=6B9??;B=6;8<:BB?@9=@>AA99975,382146;94:2009>5&.8-54;63-005896:3040+3343
+@ERR005448.6 IL40_2446:5:1:0:156/2
+CAGGAAAGGGCCTGGTGGGAGGTAATTGGATCATGGGGGTGGTTTCCTCCATGC
++
+<:<=;A=4=A?@?4>>?0=84=?AAA>@:8BB<;=09;?'?;4??:A@>@?A>;
+@ERR005448.8 IL40_2446:5:1:0:1162/2
+GCTTATCAACAGAAAGCAAGGGTTAGCTATACTGACTTTAGACAGAATAGATTT
++
+0=;=;8*<;7;=8A804848)15?:59?=090945?<789,+;<5'6)8595
+@ERR005448.9 IL40_2446:5:1:0:257/2
+ATGGAATCAACATCAAACGGAATAAAACGGAACTATCGAATGGAATCGAAGAGA
++
+@-+6:7<::9<>?;7:;>=59:>78:<:<4@9*?@=:>8@A8894=7;3.3618
+@ERR005448.10 IL40_2446:5:1:0:842/2
+TGGATTCCACTCCATTCCATTGCACTCGCGTTGATTCCATTCCATTCCACTCCC
++
+>81>?>5>?=@?>@>?>=9;>79=6122,/&6'+,0'50)6&606-)5%%5)'+
+@ERR005448.11 IL40_2446:5:1:0:947/2
+AAAAAAAAAAAGCTGGGAGTGGGGTGTGGTGATGAGCGCCTGTAGTCCTAGCTA
++
+AAAAAAAA?=>:8?:;539)=5><6511)347;674040443642-)8/6348:
+@ERR005448.12 IL40_2446:5:1:0:389/2
+CAGAGATGTTTAATATGAGCCAGGAATTCTGCTAGGCACTTTGTGTATGTTTTA
++
+@?559>@76>CCC@CC;A80=B>7?B?=<;>>;>6A><;?B>>
+@ERR005448.13 IL40_2446:5:1:0:435/2
+ACTGAATTTGGAAAGGGTCACTAGTGAACTTTTTTTTGGTGATACTAAGTAATT
++
+89=7)?>C;8997/456>ABA8=588=4858@@>B>?0(6<9;7,34%586:;==
+@ERR005448.15 IL40_2446:5:1:0:770/2
+AAAAAAGTGCTGTTGGACAACAGTAAAAATTGAGTCTGTGTATATTGAGCTGAA
++
+>>>60298:,:35?5,399;-9-19:4)8728460%2;5./.35)8332&5125
+@ERR005448.16 IL40_2446:5:1:0:788/2
+AATGGCTTTGACCAAAATGCTGATAGTAATATGGACAATGATGTCGAGGCTGAG
++
+>>>6;:AB8)6;=?=??=8<@=9;9;8:=9;854;9?;9748488752755707
+@ERR005448.17 IL40_2446:5:1:0:813/2
+CGGAGTTTGAAAACACTTGAACTGATCTATACTCAATGAGAGGAGGTCATTGAT
++
+<;3'6BBB?=C=@BA>>C@>B=<@A<>:;,7/.>710
+@ERR005448.18 IL40_2446:5:1:0:1012/2
+TGCCTACAATAGCAAATTTTGAAAAACATAGAGACCAAAATAAACCATAGTTAA
++
+>;4?4=??@B7'8>AA>?@;8=C?C;;:>=,=559*E<98B4>;85
+@ERR005448.19 IL40_2446:5:1:0:1150/2
+TTATATGCAAGCGAAGAAGGTAAGTAGGTTACTGGATTTATGAGCCTGAGGTCA
++
+>=?AB8<:8438><=48;921<<00:3:69798)879:;;37<8639594/,0,
+@ERR005448.20 IL40_2446:5:1:0:1254/2
+TGTCTCTTCTCTCTTGAATTCCTGATCTGGCCTAAATTCGCACATACATTCTTT
++
+95?<<@C?;A8;
+@ERR005448.21 IL40_2446:5:1:0:1669/2
+CAGCACCTGCTTTGTTGGCCTGGGGATGTTTCCTAGGTGGTTTATAGGTGGTTT
++
+8>3@616<3199:6:730:4%6@9964,.&20'@52@6,16)/'.3
+@ERR005448.22 IL40_2446:5:1:0:178/2
+TCAGAGAGCCTTGGGCCAGAGTTCCAGGGTCTCTGGCAGTGGCTGCCAGGTGAG
++
+)<806'29<.6?2%%+121''
+@ERR005448.23 IL40_2446:5:1:0:57/2
+ATGATGGTAGAGAGGACATTGTCAAAGATGCCAAAATTTTAGACTCATTGGGAG
++
+A:3??AA9>>>B99;>ABCC>>C?B=0:BA=:ABB>@99?B;39B?79;06926
+@ERR005448.24 IL40_2446:5:1:0:971/2
+AAAATAATTCCCATTGCTATTTCTCGTGGATAGCATTAGAGCATCTGAATTTGG
++
+AAB@>ACCCA>@B=<1:C>;=?>@=>6-18<4.287:6.0/4<:65-.::=6+1
+@ERR005448.25 IL40_2446:5:1:0:685/2
+TTCCATTCCACACGGGTTGGTTCCCTTGCATCCCTTTCCATTCCATTCTATTGC
++
+:?A@@AAA?@@@95<:79393=:6<==4;7>0;9>973;4<352638%8724
+@ERR005448.26 IL40_2446:5:1:0:311/2
+GCTGACTGATAGGCCCCACTCGCGGTAGGGTGCTTCTAGCCCTTCCTACTGATA
++
+=?99?=<>>33==?=A@=<6@74752277=4=<3<:(7977<7<78582:97
+@ERR005448.27 IL40_2446:5:1:0:528/2
+AGACTGGATTAAGAAAATGTGGCACATATACACCATGGAATACTATGCAGCCAT
++
+BACB<.;;?C@:=ABC@891:6@?8;<79=9>=?<@9-7-6<;;
+@ERR005448.28 IL40_2446:5:1:0:315/2
+AACTTTTACTATCTGTACCATTCCTGTACTCTGACATTACCTGGTTATGTCTGA
++
+AAC?CA@?=ABB=A;>@>;6>>;53=854
+@ERR005448.29 IL40_2446:5:1:0:1616/2
+TATAATCTTAATGGGATCCATCATTGACCAAAATGCAGCCCATCATTGACCAAA
++
+C>:@ACCBCCC=8677B>?C?6>:@:@=;=@CC=6:>863:@<<=<609<;?;B
+@ERR005448.30 IL40_2446:5:1:0:852/2
+TGATGTGTGCCTTCAACTCACAGAGTTTAACCTTCCTCTTGATAGAGCAGTTTG
++
+?6B>7;=3?BA?9869??B=A:27?91716;98@;6
+@ERR005448.31 IL40_2446:5:1:0:1684/2
+AGAAGGATACCGACTGGAGATGAGGCTGGAGAGGGTACCAACCTCTTCAGATAT
++
+=/;>85:A>;:4=<<44648848.5:1,0/-/))140)24%,0./.,/1*1,0*
+@ERR005448.32 IL40_2446:5:1:1:881/2
+GTCTAGGAATTTATTTATTTTCCCTATATTTTTCAGTTCACTAGCATATAGTTG
++
+C7?6>B@==8>>8@CCA@A=@<>>@@ACCACB:::;3A5=4?>3><8=CA=826
+@ERR005448.33 IL40_2446:5:1:1:412/2
+GTCCCAGGGCCCAGAAGAGCTTGTGGCCTCCTTGCAGACATCAGTAGTGGCCCC
++
+<8>A?=5929@@><=?7?9@A<4:49>A?>AA;289>:;9<:3?6969<<8<
+@ERR005448.34 IL40_2446:5:1:1:439/2
+AAAGCAAGCACTCAGCTCTTTGGAAATTTCTAAGGGTGTTTCTTTCACTCTTAA
++
+?A=3:BB@BBCCC=:8?@B>;7;897CCB>@?:88:056<=;;@>AC
+@ERR005448.35 IL40_2446:5:1:1:231/2
+TTGTGAGCTACTGGTTTAAGGATTTACACTCAAAACTTTTAATTCAACATAGCT
++
+C<5449<=AA?=<99>@C@61;@@A@?=>AC>@=A?C?@@@B>>?>B@947B
+@ERR005448.63 IL40_2446:5:1:1:10/1
+TGATAAAGACAACAAGAAGAGAGACATCAGCAGACAAGAGATATCAATAAATTA
++
+A;@>@46=A?7:8763-4593:6;885-796175//36/'--168386*043
+@ERR005448.114 IL40_2446:5:1:3:1330/2
+TTTTCCCACACTCTTGACAACACTGTATTATCATACTTTCTTAGCTTTGTCAAA
++
+;=9=31855%1@=,&9=96>5913>??76%8B;8@<>@C?@:B82>?787278=8/496997:98045
+@ERR005448.339 IL40_2446:5:1:8:8/1
+TAGCAGCATGATTTATAGTCCTTTGGGTATATACCCAGTAATGGGATGGCTGGG
++
+B?=A?8=BA=>BBBAB=:;@ABB=438?C@BCACC@CC>4;A;AAB@>@C?CCCAA@AA
+@ERR005448.557 IL40_2446:5:1:14:11/1
+CTTTTTCGTAGAAGTCACCATCTTGGAAATAACACAAGTACTTTCCACTGTCAG
++
+CCCCCC?8;@8=@:=CCAACC>C?;7>8?A@>AB>@>@===61
+@ERR005448.734 IL40_2446:5:1:19:4/1
+CAAAGAGTAAACCTTAAAGTAGAAGTAAAGCTTGATCTGAAATTTGAAGAATGA
++
+;9<==<96B>@??0:988BB@A;>7>@6.>=;;;>9464594'/4=<:=/-/<>9=98=7/3
+@ERR005448.846 IL40_2446:5:1:22:6/1
+GTGAATGCACAAATCACAAAGCGGTTTCTCAGAAAGCATCTGTCTAAGTCTTTT
++
+<@<;?;;<844;;9=@:@@>>.>@;B21>7=9>8686;=2;>61?80&/7;<@@B;;@B>94;A>??80;8@>;<:,73'54<99
+@ERR005448.1029 IL40_2446:5:1:26:6/1
+ATATTAAAAAGACAACATTACTGTCAAAAGCCTGGAGCAATATGAACTTTTCAA
++
+CCCA9BB?C?98@@C>@CCB=B;=@CCAA;@@>759=:9@CA?5?:@>B<=;
+@ERR005448.1227 IL40_2446:5:1:31:2/1
+AATTTTCTGGGATGTCTATTATCCTGTAAAAAACATGTATTTCCGCAGTTATAA
++
+ABCBCBCCC?:?BC=@@>=CA>?=;8<898:>@A7;
+@ERR005448.1311 IL40_2446:5:1:32:9/1
+CTCGTGATCTGCCTGCCTCGGCCTCCCAAAGTGCTGGGATTACAGGCATGAGCC
++
+>B@>88?BA>7@<@@?BB:4:BBB<9?837>336::7.5=@<<=40<<;5<95<
+@ERR005448.1548 IL40_2446:5:1:37:9/1
+GGTTCATTGGTTCTTAGATCTCTGGATTTACAGTTTTTCTCAAATTTAAATTTT
++
+:@=BCB?CB@@CCCCCBCCC>B?0BCBCA:;>A>BB@@A?AC
+@ERR005448.1624 IL40_2446:5:1:39:3/1
+GATATGTTGAATTAACTTCGCAGTATGTTTATACTTCATTTCAACACTAAAACT
++
+AABC@>>AA?CCCA?>=C>;7A8@AB?;=<@<>@@CBCCBACB;?CCBCC@CCC7(1@?:<=C?@?@4*3@?@>
+@ERR005448.1767 IL40_2446:5:1:42:7/1
+GAGAATGGTAAACATGCTCCGTAGAAATAGAGAAAGTAGGTATGACTCCCCTCC
++
+:?@@;<>8+;B?;?94;)3;A=?:749:=)53:3<')5;=;:51'547-28&3&
+@ERR005448.1921 IL40_2446:5:1:45:4/1
+TATGTTCCTTGATAGACATAAGCCATAGTCAGCTGAAGCTGCAGCAAAAAAATA
++
+?@CC>?B>:?2.==6>>>@C@95.0<<27;330(105,7*'055025(5669))
+@ERR005448.2030 IL40_2446:5:1:48:6/1
+AATTAAACTAAAGAGCTTCTGCACAGCAAAAGAAAATACCATCAGAGTGAACAG
++
+CCCCC=??BB?9;935<:4<:@=:86;@>=;;?'3><>>:377-(2147321
+@ERR005448.2050 IL40_2446:5:1:48:10/1
+GAATTCATCTTTTATTAGAGCAACTCAGAGGTTACTGGATTGTACCACCAACAA
++
+CCA=?BAAAB:BB=C<=1:?=A><>;98@<>7'5.:28<
+@ERR005448.2111 IL40_2446:5:1:49:8/1
+TTCCTTGGACAATTAAAAAAATTAAAAGCAATTCAGATTCACTTGAAATATTAG
++
+.A@A?<4<=/44AC;?<@=;<=<==*9?7<>==@:==7/1968&27:8?=9:
+@ERR005448.2255 IL40_2446:5:1:52:8/1
+AAACAAATGTAGTAGTATAAATAAAATGCTCAATGTAGTATAAATAAAACAAAT
++
+@CCCBCBCC@CB>BCA=:
+@ERR005448.2628 IL40_2446:5:1:60:10/1
+GAAGTGATTAAGACATAAGGGTGAGCCCTCATGCATAGATCGGAAGAGCGGTTC
++
+==><>9<@B@@;@AA>A;===AA:=;1;>A76>>?9/515@;=>7;6=7378:9:
+@ERR005448.2813 IL40_2446:5:1:64:7/1
+ATTCCTTGCTTGAGACCTATGCCTTTGAGGAGACGCGGTCTCGCTCGCTGCCTC
++
+5AB@B@,;B@@=?+=A>?+B?8;68+?:4=*;A@?64)??>48<><46/2602(
+@ERR005448.2940 IL40_2446:5:1:67:3/1
+TCCAGCCTGTGTTGTTTTCTGGCCATGATGAAAGCAGGGAGGCAGCTCCAGCTT
++
+ABB>BBBAB@;>AA=BA=AA?AAA?;>9;4=>:;=:=6<;@9>;7:1-:66776
+@ERR005448.3000 IL40_2446:5:1:68:9/1
+GTCAACCTCCCTGCAACTTCTGAACATCCTCCAGTAAGATCTGAAGAGCGGTTC
++
+627<@@@@@>=7<>@4&7@@:46:.;>29<:37/'7;;;7-7*173627,5(/&
+@ERR005448.3073 IL40_2446:5:1:69:3/1
+TTGCTACCTCCATTTCTATTCTGAAAACCCTATTCTCCTTCAATACTTAGTTCT
++
+CB:?CCD?CB@;@;=CABC>=A-=CCA9:BC=<8CB@:C9;@@;;=>@=@@>>?6);@3?1<;;98/84>)07);<;543;603;6)
+@ERR005448.3342 IL40_2446:5:1:74:9/1
+AAGTAACACAGGAATGGAAAACCAGACCTTGTATGTTCTCACTTATAAGCGGGA
++
+B=7;9C;<9@?@C?C>4<=<2('27:).:4;4?6177=///5:,8::20*32.-
+@ERR005448.3407 IL40_2446:5:1:76:2/1
+AAATCAGCATAAAATAAATCTCACAGAAATACAGACATCAAACAGAGATATCTG
++
+@C?BB?5@@@@AA@CB?:@@AA<=><>>?@@9?=A<@@<<=@9;4<4:=>?6=4
+@ERR005448.3834 IL40_2446:5:1:84:1/1
+CTTAGGGGCACTATCTGCTAATACGGTCACACTAGGGATTAGGGCTTCAACATA
++
+BBBA:;;=@@B?@@?@?@BA@B?@<>3:@@?B@?>;?:??;9=6?;>@@:6:9:
+@ERR005448.4351 IL40_2446:5:1:94:5/1
+GACTATGGGATTCTGGTCGTGGCTGGCCTAGATCGGAAGAGCGGTTCAGCAGGA
++
+?BBBBB?<>?BB@AB?>?9?>4:B?;55=:220/2<-7*2999827.*/'134(
+@ERR005448.4691 IL40_2446:5:1:100:6/1
+TTGTACGATTTTGTCTACAATAAAGACTATGCTGCTCGGGGTGATCATGTGGTT
++
+AB=BB===CCCA?A<>>;8517(::<;28:>9;28?9>9<619>+4/50
+@ERR005448.4810 IL40_2446:5:1:102:1682/2
+TGGAATTGAATGGAATGGAATGGAATGCAATGGAATGGAATCAACCCGAGTTCA
++
+A>>=@??;B>>@C@:BCCAC?=@;9AC?>8BB<@>;A<@A>6?@9??@BBAB=>;8>?A>:464=@<=@=>A?:>BA??5459;46==>CC@C?CAB;@@<=9=B@BA=@@?:8;=
+@ERR005448.5143 IL40_2446:5:1:108:10/1
+AATTTACATCCCCACCAACAGTATATAAGCATTCCCTTTTCTCCACAGTCTTGC
++
+@CCCBCCACCCCABCCC@BBB>?B;:69=5::;74:;842=?889=:9499
+@ERR005448.5354 IL40_2446:5:1:112:11/1
+GAAGAAACCTGTCTATGAACCAGTAAGCAGGCCTCACAAAACACCAGACCTGCC
++
+6BBBA@A?@@BB?<9B:A=BB>;(:=:>97.:5(
+@ERR005448.5481 IL40_2446:5:1:115:6/1
+TGGAATGGAAAGGAATGGAATAAACCCGCGTGGAATGGCATGGAATGGAGTGGA
++
+B@@@@@=55?BB@@<;@A>9>:>>9?78'1(8;:<98849628449691<1249
+@ERR005448.5513 IL40_2446:5:1:115:10/1
+ATGCCATAAATTAATTATCTGGCCTTACCCTGAAAATAGGCCATAAGACCCCCA
++
+CB?4=A=@CA@@5C?70A>@::,;A03277=980;>677'-29:,;:02,35
+@ERR005448.5617 IL40_2446:5:1:117:6/1
+AAGCCCCCATAGCCTGACCAGCAATTCTTTTAGGGTGGAAAGACGGAAAGATAA
++
+66@?9A;?:8==<96;;A/-<()-=@C<8@=BA@<77A=;=C==:C=99@<@=9>8<8'>;9:?;:;96../-/,60282';0,26<>60,.43?
+@ERR005448.6022 IL40_2446:5:1:125:4/1
+ACTGAGATGGGAGGATCGCTTGAGCCCAGGTGGTCAAGACTGCAGTAAGCTGTG
++
+@7@?@@;8@907339=<9/89?;368=:';2,69<:6<9:,07.2*2,.='9
+@ERR005448.6161 IL40_2446:5:1:127:4/1
+AATCATCATCGAATGGAATCGAATGGAATCATCGAATGGACTTGAATGGAATAA
++
+BBCCC>=;>C@2@@54243;6?AA>4=<;A?@
+@ERR005448.6315 IL40_2446:5:1:130:11/1
+TCTCTCAATAATAGCATGTACTTTTATTAGAAACAATATTCAGAACGGCAAAGA
++
+CCCBBB>:AC@@ACC@CB@BCAACA<@CBBC@@AC@@>A>2;?A=2
+@ERR005448.6335 IL40_2446:5:1:130:6/1
+TTAGATTTAGAGAATTGCTTAGGGTTTTGCTGAAGCAGAGGATGTTTTCTTTGT
++
+CC=A9@CCC:<3BCC?=<,=;>@4??4;@79<=AB>@=,:>9/3&5*8
+@ERR005448.6405 IL40_2446:5:1:131:3/1
+AGTATTGCTTCATCAGGGAAGCCTTCCTTGAACCTCAGGCTAGATCAGGAATCC
++
+@>=?BA@?3;AA@A=8;>@?@@=AA><@<+44?
+@ERR005448.6581 IL40_2446:5:1:134:2/1
+AATCCAGTCCATTCCATTCCACTCAAGTCCCTTCCACTCGATTCCACTCCACTC
++
+@+33?B6>752,=61=<@@<68;:<:92;.-(36>1.5/2=164<.(5B.22;4
+@ERR005448.6953 IL40_2446:5:1:140:10/1
+CTGGGAATTCAAGACCAGACTGGCCAACATGGCAAAAATCTGTCTCTACTAAAA
++
+@;A<*=B7:?BB=?BB<9.>;:*ABB<;<6.94@<::,)8<;*4>8>1,812/8
+@ERR005448.7121 IL40_2446:5:1:143:1/1
+GCCTGAGAAGGTTTATACTCCTGCTGATGAACGCAAGCACTGAGAACATACAGC
++
+@B==>;<>?<;6;96>33=@?B8'59;@><<@=185.5957>2877.9:8065,
+@ERR005448.7238 IL40_2446:5:1:145:4/1
+TGCCACGACATAATTTTAAGAATCAGGCCAGACGTGGTGGCTCATGCCTGTAAT
++
+@>>A9@@A<;@9@BB=;2:629==.=8A4?;:+/'74048(-)&-/
+@ERR005448.7272 IL40_2446:5:1:146:8/1
+GCATTTTTGTGGTAAAATACTAATACTAAAATTTGTTAACGCACTGTTCATTTA
++
+AB?@:@B??5849/:'(7-.2(.-//1310166162581'+30+&/&
+@ERR005448.7531 IL40_2446:5:1:150:9/1
+GTATTTTGTTATAGCAGCACAGACTAAGAATCGTTTTTTTTTCTTTACAAGATG
++
+C?@<9A7=8?@1>A@;736D=??
+@ERR005448.7570 IL40_2446:5:1:151:1/1
+GAGTGCCTCATATGTACCAGACACTGTATAGGCTCACAGTTGATAATCAATAAA
++
+6><=B@=CCBBC?88@CCBCAA==ACAA>?<8=;;3>8
+@ERR005448.7705 IL40_2446:5:1:153:8/1
+CACCCACTGCAGGGACTTGGGCCTGATTCAGACTCATTGCTTCCAATAGATCGG
++
+2>?ABBBA?>BA6?===A<8;?0;=>>>?>BB:>>;3=>7B@;>>BA6/(A8??
+@ERR005448.7805 IL40_2446:5:1:155:6/1
+ACTCATGGGAACAGCATTTGATACAGACATGGGGCTAATGGGGCTGGGGGTAGG
++
+BAB@BBBAA@BA=@?BABB==?B>@B@>A@<>@;@B@@<7;=A;9:'1<:
+@ERR005448.7951 IL40_2446:5:1:157:9/1
+CACAGGAATCTTCTCTTTAGCTTCCTCGATACCTGTGTCTAAAGATAGCTTCCA
++
+>?B?BB;B@>BB?B@B=B@=@B<>BBAB:B<>?B=67BAA>>1BACA;5>@755
+@ERR005448.8049 IL40_2446:5:1:159:6/1
+ACACACACATGCATACACACGCGTGCACACACACCAGTGCATGCCCACGCAGAT
++
+BA@<@@BAB@=:?@>@A?A59525?6:4<8><:=23/,55;544488'*/5132
+@ERR005448.8583 IL40_2446:5:1:168:2037/2
+GTTATATGTGTATTCTGTGCATATGTTGTGTGTTGTCTGCGTGGGGTGTGGGTT
++
+?4@AB<;B:8(<1/+8545(7;7@>25=5;75'820420.,16'118>(1(8)&
+@ERR005448.8743 IL40_2446:5:1:171:7/1
+TCTGATATTTTCACACTGGTAAATGTTACCTGTATTTTAATTACTGCTATAAAC
++
+CBACCDCCCCCBCCD;BA?;===B@=C?>?:;C@C?=77
+@ERR005448.9191 IL40_2446:5:1:178:4/1
+GGAGAAGAGCTGTTGGGCCTTGAATAATCAGCAGTGATACCGAAGGACTACATC
++
+AA@BAA?>8@BB@B@>@??BAA>8>B@B?@A>;47?;@==4669::85916;>7
+@ERR005448.9262 IL40_2446:5:1:179:8/1
+TGTTGTTAAAATGCTCATGGATAATGGAGAATTGTCGGTTTGGGGAAGGGGAGG
++
+@<8@B>B@B=8>BB?B@B??@@AA===;@9?;A?<869'9:'2>>(091@<'1=
+@ERR005448.9430 IL40_2446:5:1:182:6/1
+GATGTTTTCTCATGATTAGATTCGGGATTTTCAGGGATATATCACAAAAATGAT
++
+>4*<8-4C<96B@A@@;B52=7:;0*@;>C@8<7;5=5@4@954A@A,4-&*+6
+@ERR005448.9594 IL40_2446:5:1:184:1605/1
+CGGTAATACCCCCTATCTTAGAGGTTTGGATTGCCGGTAACTCAGCAATCTCCC
++
+(2:?:<@;=551<6116..1))681.''155'7BB
+@ERR005448.9655 IL40_2446:5:1:185:6/1
+TGGAATGGAATGGAATGCAATGCAATGGAATCATCCGGAATGGAATGGACTGGA
++
+?BB@A;A=@AA?AB=8A@@@AA8<0<@?58@96B?<77@AA(;2>:6
+@ERR005448.10097 IL40_2446:5:1:192:8/1
+GGGAATATCTTCCTATAAAATCTAGACAGAAGCATTCTCAGAAACTGCTCTGTG
++
+CBB?CCCCCCC>ACAA?>@C??C?=@=:@?8)6=BB>A6=?=4>?<>4;;69
+@ERR005448.10325 IL40_2446:5:1:195:425/2
+ACATAAAAACAAACAAACAGAAAACCAAACAAAAAAAAAAAACAAAAAAAACAA
++
+444,%657;+5%4(*1+1*/?A(%2+-*2((%*//'/%36(5'1(6663(*'-6
+@ERR005448.10356 IL40_2446:5:1:196:4/1
+ATGAAGTTCGTACAAGGCACTAAGTCATTTAAAACATTTTAATTGTGTGCTGAG
++
+C@8=>=;>@C*?;>=;<>=;:.0A1>BA:+?=A?=@AAA6><=<51@2*42=3,
+@ERR005448.10422 IL40_2446:5:1:197:1579/1
+GGTCCTGCCTCACCCAATTCTCCTGCTCACTCTTTCCTAGATCCACGTCAGGGC
++
+7.34.,>448A;%-/%<>844,)6,43())84,66.,4)(<1)0-%-/2.,(..
+@ERR005448.10433 IL40_2446:5:1:197:7/1
+TGTAGATCATTCTGGCTAAATAATGGGATTCACTTTTAAGTGAAGGAGGCCTTG
++
+CC@@?@C?BCCACA@@CA@@B@@C@;BB<==@?=A=:BA@9'8:==88=:>;;?6;;A:A<8?9A<:?6:;<
+@ERR005448.10914 IL40_2446:5:1:205:9/1
+TCCTCCTCAAAACACACACAAGCCAAGACTAAGGATGAGAAGCATCTGCCAAAC
++
+B?ABB=BB@>@=AAAA@B@@BA>869>>>BB;9?=;>9/3>B:<<,36:@23>51:>9364322*'1646<8.055612<68-5'0-?
+@ERR005448.11173 IL40_2446:5:1:209:11/1
+CTATTCTTACTCATCAAGGGAAAGCAGCAGGTCTAGTACAATCCTTTGCATTCT
++
+BCC@@@CC@@=;BACBA@>@AB>CB=C?AC?7@C=?;59BAB;,.AA?=;B;;:8>??84??>C;)401;12)'&(<+(4/'31)&'&))/:4
+@ERR005448.11907 IL40_2446:5:1:220:3/1
+GCCCCAGTACCCTAGAGCCCACTGAAATGATTCAAACCAGCCAATCCTCAGTCT
++
+9@>>?5A@B7:=46694;(3;8@8(;@?==)5-'7(-277633+190'-6
+@ERR005448.12013 IL40_2446:5:1:222:9/1
+TTGGAAAGGAAGGTTTGAAAGAGTGAGAAGGGTAGGTGTAAGGGTTCCCTAATT
++
+BBB@>;4A?>>B<5??>>?=B993B@B?<@B91-9A6>;8;:7<9<8;379259
+@ERR005448.12321 IL40_2446:5:1:227:2/1
+GCAGACAAGGCTAAGAGTCTACGGGAAAGGCGGACTAAGAGGGGAAAAGATGCA
++
+6AA<@A;:3:AA1::9=8>=;540;1''7/62;-'54)8/=>7=54-737091(
+@ERR005448.12441 IL40_2446:5:1:229:295/2
+ATCCAAGCACTTGGGAGGCCCAGGCGGATGGATCGATTGCGCCCAGGCGTTTGA
++
+A@A3%5:::07@<*41,063;9/,564.(8<5/0820+%)*3-0720%20'+%)
+@ERR005448.12534 IL40_2446:5:1:230:7/1
+CACCCTCTGGTACAGCTGACCTAGAAGCAAGAGCGGAAGAGCGGTTCAGCAGGA
++
+(90?>>6?<3>=58B??4,4:8?;?:<::8('4?787@@<;4(1',6(8714
+@ERR005448.12547 IL40_2446:5:1:231:2/1
+TACTGAGACACCCCATTGAGATATATAACAGTTATTGGAGAATGGTCTGAGGCT
++
+CC?@=A@?@BBB@;59@B?B<=@@BC:7<=?:@:@<<9.=7;;2:85>:18-3=
+@ERR005448.12889 IL40_2446:5:1:237:5/1
+ATGCCCCTGTAAGTACCCAATTCCCTGACTTAAATTCACTTCTCCTTACACTAG
++
+@:;=>5;9;:?===9?9515?=?24
+@ERR005448.13051 IL40_2446:5:1:239:8/1
+CCACCTGTGTGGGCCTTGTCTCCTCAGCTAGACTCTGAATTGTTTAAGGACAGA
++
+AAAAB@?@@@=9@BBBBBB?BB?A@>@@@@@??B>?=77?@@?@=7<7>77<=5
+@ERR005448.13269 IL40_2446:5:1:243:5/1
+AGTTAGGAAACACTCTGTTTGTAAAGTCTGCAAGTGGATATTCAGACCTCTGTG
++
+@A?AC@@A:?B@;CBBC>ABC?AB:@9??A:1:B1<=:<;;>=8:70-7<8*:1
+@ERR005448.13503 IL40_2446:5:1:247:4/1
+CATCCTCAGTCTCTACATGAGGAAACCAAAGCCTGGTCTACATGAGGAAACCAA
++
+ABAABAA???BBBA@?>AA5;?<;57:<>?>@779;770797<:456;;<58??
+@ERR005448.13662 IL40_2446:5:1:249:7/1
+AAAGCCAACATGTTTTTCCTCCACTGCTTTAAAGGATCATCAATAGGGACGGCA
++
+?>A=-'829/36)=;865*:&&)(*8243(52-''.
+@ERR005448.13817 IL40_2446:5:1:252:789/1
+TGTGCATTTAGGCAAGGTTACTTGACATTTATGGGTTTCCTTTTCTTTGCCAGA
++
+>=6=6>507'8A>:7=A>>8&8@358@4&,=>8>7C@75&3:9;
+@ERR005448.13831 IL40_2446:5:1:252:11/1
+GTTTAGTGCTTCCTTCAGGAGCTCTTTTAGGGCAGGCCTGGTGGTGACAAAATC
++
+9@AB><*<=BB@@@BA@@AA>?@:@=@A82<=@=AA@:;A>2@;(860707=67
+@ERR005448.13843 IL40_2446:5:1:252:8/1
+TACATCAATTGGATTAGGACGACAACATCTTGTTAAAATTTCTGGTCTTGATAC
++
+CBCA=152=;CA>57;?@=61:2.8<87,;8>:>@9@:;59-12:(7-063366
+@ERR005448.13955 IL40_2446:5:1:254:10/1
+GTCCTCTCTGACTTCTTTTGGCAATGTTAGTTTCCCGTCTGAAGGTGGGTCACT
++
+@5<0)AB@B1:97>@74:@9A8@:B@9?<@529.140><681.+9039'&/&6@
+@ERR005448.14149 IL40_2446:5:1:257:5/1
+TGTAATTCCAATTATATGGTTGAGTTACAGATTCCTTACTCCCAAGTGTTGTTT
++
+A:89CCBA@C@C?CAA@CB>B=1>>C@==B9?@B?;>?3<89?;=@85&4?8:9
+@ERR005448.14385 IL40_2446:5:1:260:9/1
+TGTGTTGTAAATTTTAGATCCAAATCTTTTGTTATCTGGGCAGATTTTATCTTT
++
+;AA?;B=A=3>=CCCC@?;5=9@A;;97@=BB=BB@BA<@@B>BABA@<5>@@@4@:;?=9A:@5=?48>
+@ERR005448.14747 IL40_2446:5:1:266:1820/1
+GTATTGCCTTCTTGGAGATTGCTTCAGAGAACAGGCCATGTGCACTCTTCTGAA
++
+B=<-=)1<9:4>4)8@9;2=>94;2=56;5((41--71;70/015
+@ERR005448.15019 IL40_2446:5:1:271:6/1
+AAAGTCATATAAATGCCATTACAATTATACTTTGTGTCTCTGACAATCAAAATA
++
+DABCBCBCAB?:=?A@A?CC:7;@BBA?<@=878:;974+366
+@ERR005448.15311 IL40_2446:5:1:276:2/1
+ACAAGCAGTTTATTTTCTAAACAAATTTGTAAGTTTATTTCCTTGTTGATGAGC
++
+>C@A<;>;87AAA<@=?>=B>CC=/>BA>?B?<97
+@ERR005448.15473 IL40_2446:5:1:278:5/1
+TCTTGCTGAGTAAATCACATTTGCATTCTGGTTTGGCAAAGATTACAAGCTGGG
++
+@B@=>;AA?>:???CCAAABACCA<>>;<<<>=6:5959>
+@ERR005448.15755 IL40_2446:5:1:283:1674/1
+CCAGAACAGTAATCTCTTAGCATGAGGCCATCTAGAAAGATGGAGACCAAGGGA
++
+BAB?A@A?=;B;:)<@;=A>AB<4*=<;6,=69A:(:>;>@7>6/692292
+@ERR005448.15991 IL40_2446:5:1:286:92/1
+GGCATTTCGGGGGCCCTGGCTCTGAACTCACTTGTAGGCATGGAAGGCCTCCAA
++
+BBB?A@BA@9@9.:;:;83;6:;6/6::8:<9/,/3418/,82%-/4%,1,,/%
+@ERR005448.16107 IL40_2446:5:1:288:2/1
+TAGAGACGGGGTTTCACCATGTTGACCAGGCTGGTCTTGAACTTCTGACCTCAG
++
+BA;>AB?BABB?AA>7>>?@>;@5:@=7>A<:8?478?77<7>;
+@ERR005448.16513 IL40_2446:5:1:295:8/1
+TTTTAAGTGTACAATTCAATGGCTTTAAATTCATTCACAATGTTGTGCAGCCAT
++
+ACCCAB?@?C>;@@C@@A??=>@<;:==@><>/<64
+@ERR005448.17115 IL40_2446:5:1:304:6/1
+AATAAGTAGTAACCTGTGTTCCCATAGATTGTGTAAATATCTCATTTGTAAATA
++
+C?C;=>BBC@B;?@>>/=AC473?B=A>D=?=?73:7@8:<=9BB=@B=AB@BA
+@ERR005448.17314 IL40_2446:5:1:307:4/1
+TCTTATTGAATGAATTGTCCCATCTTTGGCTGGTGTAAACCTCTTCACGCTGGC
++
+?A?=@BBBAB>=BBBB>A>:=@A=>?>@==AA?67(6@;;=::<5<=5>=94
+@ERR005448.17765 IL40_2446:5:1:314:7/1
+AATAAAGTGCCTTTAAACAATTGTCCCTAAACGTGGGTGGAGGGATGGGGGGCA
++
+;A@ABAB5<<@B@@BAB4;;=73==A<4;/<63?=B5(:C==>?;ACABAC@3?=;=->(BAB<:A6=:
+@ERR005448.18035 IL40_2446:5:1:318:5/1
+CACACACAACCCTTCCATCTTTCCCGGTCTCCAGTGTCTATTATCCCACACGCT
++
+@B>>;:7;:,67=7=;157)=66166:171613&05
+@ERR005448.18181 IL40_2446:5:1:320:10/1
+TATTGTTGGGTGGTATGCTTTTTGTCTATGTGTTAGGTCCAAATGGCCTATCAT
++
+C=@CC>CBBB;A?=BCCABCCCCC?BC@A=6??>;:765618766/69<<:318
+@ERR005448.18350 IL40_2446:5:1:323:9/1
+AAATAGCAGTCTAATTTGGATGAGAAGGACTGCTACAAACATGATGACTGTAAG
++
+C>>9?>C:7&4B4/5>?@>5>;4=;2:/52=:8'2,/6/*0.2724301/-'11
+@ERR005448.18706 IL40_2446:5:1:329:6/1
+ATAAAAGCCCTTACTACACATTCTCACATTCTTCAAAGACTGGACAGAACCACT
++
+A>;769<26;158971946407158/.9
+@ERR005448.18873 IL40_2446:5:1:331:10/1
+ACTATGCAGCCATAAAAAATGATGAGTTCATATCCTTTGTAGGGACATGGATGA
++
+CCCBCCAAABCCCB=AACCBCBBC@CAC?>ACBB@C>BB:0?8=7:;BA:<=@A
+@ERR005448.18928 IL40_2446:5:1:332:3/1
+TATTTGTGTGTTTATGATTACATCTGTGTGGTTGTGTGTGTATCTGTGTGTAGC
++
+C@BA?A5?CCBCCCCCB?)==@C>CCAA>6;?C=8AC9?=CBC@B=73':??:C:B>:C
+@ERR005448.19365 IL40_2446:5:1:338:3/1
+AGAAGAGATCATGGAAAAATTGAGTGACAAAGTAAAATCTTAGAAATGAGCTGT
++
+CC;8>CEB;B>BCC;67A-A77=<@B=A87;C57:7;;?@66<(=;A@<@=67&
+@ERR005448.19732 IL40_2446:5:1:344:10/1
+TTACACCGTCTTCATCCCAACTTTTGTGCCAAAACCAGTCCCATATTACAGGGG
++
+B?9>@@>74?9*9?=>A:6;AB;95<:<:<3)3353-3/4<.11.7'&68773<
+@ERR005448.19925 IL40_2446:5:1:347:4/1
+AGTTCTTTGGAAGATAGCTGGTTGAGGAAGATTGATGTTAATTCTTTAAGTGTT
++
+A;@A79=<>C6C=@>?8;;5*>CA8AA8;96:9>;?C@@>;:=<<@===B::2;
+@ERR005448.20031 IL40_2446:5:1:349:5/1
+GAGTCAAGAGGTCCATAGAATGGCAGTCAGGTGACAGCCTAATAAGGACTGTTG
++
+:0>A>;>?<':=7=@@<8:;?:?>=:-2,75*8*5,&5+&,)00))&.((/))1
+@ERR005448.20219 IL40_2446:5:1:352:5/1
+TGTCACTTTATAAATGGCTGGTCTTTTAGCCATTTGCAAAGGGGTGGGGGAAGG
++
+@A1>9>@B@??BA=,?@@@?56.1)&+1'12&)::(+&&/*'-&&//=80..(4
+@ERR005448.20239 IL40_2446:5:1:352:9/1
+AGTCAAGGTAAGAGGGAGGCATTTTGAGTGAGGAGGGGACACACCAAGCACTTT
++
+AB;B>=@@7>A<5=AA>=>@?ABB@;;?=>1=@5==;>76:59527;104453+
+@ERR005448.20476 IL40_2446:5:1:355:4/1
+AATTGTGATATTTTAATTTTTTTTAACCCAAAGTTCAACTTTTATTGCATCTCA
++
+C@CDCBC@D?DDCC8?CCBCCDCCCA@>B@CB@B>@>AC;B@@:5
+@ERR005448.20638 IL40_2446:5:1:358:5/1
+GGTTAAAAAACATTATTTTCAATTAGAAACACTTATTTCTTGTAGGATTAATAA
++
+ED.E?=A?A@B@C@9B@ECA8>@@9;@CAAB>A79??B=@<:94-
+@ERR005448.20754 IL40_2446:5:1:360:10/1
+CTGCCACAGGGTTGGGATGCAACAAATCTGTTTGGCTTACCTGACAAACATAGA
++
+BAABBB?@@==AAA=AABBAAAAB@:@@BBAB?;=A@<>@?>A==?<=@=97
+@ERR005448.20966 IL40_2446:5:1:363:5/1
+TGGAGTGCGGTGGCACAATCTCAGCTCACTGCAACCTCTGCCTCCCGGGTTCCA
++
+@4<9:@@B=?>?>>66?>>87>:<>2>4;288?4=?>@?<270::<@@8,90)6
+@ERR005448.21018 IL40_2446:5:1:364:2/1
+ACCAAAACTAAAACGATGAGTCTTCTGCCCTGTCTTCCTTAAGGTCCAACAGAA
++
+B@AB<9:??@BA<;;BA=<<=?B@:?B<<=<:88?B>;@>?<;63;717;7676
+@ERR005448.21478 IL40_2446:5:1:370:7/1
+TGTATTGTGGCATGATTTACATCTAATAAATGCACCCACTTTAAGTTTTTGTTT
++
+CCBCCBB@C?@BCA=ACCC@@<);@@=@@;>CB;35<=BACAB@AB
+@ERR005448.21488 IL40_2446:5:1:371:3/1
+ACTTGGGTGAATTTAACTTGCCCAGCTATTAACAAATATAGCACAATTATACTT
++
+=@BA@DACB<@ACCCCCCAAA@1<=?@>@?;;
+@ERR005448.21690 IL40_2446:5:1:373:10/1
+TGCTCTATGAAAGGGAATGTTCAACTAGGTGACTTGAATGCAAACATCACAAAG
++
+A=CCCA?>===???AA@BBB?=:A;?<9?68?>=89:;:<<=<787>==6,0
+@ERR005448.22005 IL40_2446:5:1:378:9/1
+GCAATTATGCTTCCATAACTTTCCGCTCATCAAGATGACCTAGTAAGAAGATAG
++
+@BA?AA;?=<>CC@@A><;CBB=;<>9;;?>94:9<=49381:52.822;2344
+@ERR005448.22201 IL40_2446:5:1:382:4/1
+CACCCCCTGGCCCTGGACAGGAAGCAGGCATGACCTGGAGGAGTGTAGCCATTC
++
+BBB@?>?@<<9@;349:>=6:?;:>;5668965586*64,3)3//201/3/4
+@ERR005448.22219 IL40_2446:5:1:382:11/1
+ATAAGGTTGAAATCCACAAAATAAAAGTTCTTGGTTTTATAGCAGATTTTTTAA
++
+ACCACCDCCCABCA@>DA8@?6?B?AB==/@@=?C@
+@ERR005448.22647 IL40_2446:5:1:388:7/1
+TATCATGTTATGGTCAATAGAATGTACTGGAGGGATATTGCAGGACATAGGGAT
++
+CCA@CC=ACC?AB=BC?C@BC=<;:A9@9@<<7;=>=<2-7<826;:<;97=
+@ERR005448.22778 IL40_2446:5:1:390:2/1
+ATCCCTCAGCCCTTCTTCCCACTCACTTAGATAAAGCAGAGACCTGTGGTTTTC
++
+?@AA@?@@??><>??@>><><;>@?=;?;>>848;=97:=;7:<3<2556::
+@ERR005448.22824 IL40_2446:5:1:391:7/1
+CGGCATGCCTGTCCCCCTCTGCTGCCTGCAGCCCTCTGCCCCCCCTCCTCACGA
++
+@<@<:94;B;?7@B?@8559=539<;:9:278?64:0,491,6:2723'.-%.)
+@ERR005448.22862 IL40_2446:5:1:391:1768/1
+CGGTTCAGCAGGAATGCCGAGAACGATCTCGTATGCAGTATTCTGATTGAGAAA
++
+=B=;AB?=??B>A=?=7;@;;@7AA;2)2;A4B<;=(=4:;=-;('3**2*2<=
+@ERR005448.23039 IL40_2446:5:1:394:11/1
+GGCCTTGCTAGAGACCTAGACATCCAAACACAAGAAGTACAAAGAACACCTGGA
++
+?@ABBBBBB>A@88=,>;>+.9;6.=6/B938=285.)96>7//56(646,82?
+@ERR005448.23078 IL40_2446:5:1:395:2/1
+GGTGCTAACAGGTTTTGCCATAATAAAGAAAAACGTTACCAAATACGTAGTACA
++
+CCBCAC?7AB@@A7>CD<9A=?:=?8@:==50<<=;=6=<;;2:77
+@ERR005448.23493 IL40_2446:5:1:401:11/1
+TGCATTCAGCTCATGGAGTTGAACACTTCCTTTCATAGAGCAGGTTTGAAACAC
++
+BBAA?AA@BBBBB@@B?A?BBAB@:>BB=;=A@9=B>;<:6;<9:?89;:;7
+@ERR005448.23690 IL40_2446:5:1:404:1032/2
+TCCCACCCGCCGCCCTCCCCCCCCTGCCCCCCCCCCCCCCCACCCCCCCCCCCC
++
+'3,2'5/1'92'(,'(/'282625''469'%5032,'2:(5%3,'5%'9992'7
+@ERR005448.23800 IL40_2446:5:1:406:6/1
+GTATTCCCAGAACTTCTCAGGGTGGGAAAAGGATAACAGTGGTTGAGATGACTA
++
+A<=@?7@8=B=@:B??@=;>B@(=B=597/<6/:975:>7:857=3:.791555
+@ERR005448.23801 IL40_2446:5:1:406:2/1
+TTAGGGAGAACACAGTAATATGAGTAACTATGATGAAACCAGGTTAAGTCAAGT
++
+@CCCB;:A=@@BA?C=@?CACA=?;BA4?@A@=A@BA?>87>99<>4>24<@;/
+@ERR005448.24231 IL40_2446:5:1:412:4/1
+TGTTCACATTTTTTGTTTTAAAAGATCACTCTGCTTCCAGGGGGAGGGCAGGTG
++
+ABAB?=>=?BBBBBBBBBA>=A@BA?>?=BBAB;@?;;6=<<583;9;91=9&7
+@ERR005448.24569 IL40_2446:5:1:417:2/1
+CATGTGTAGCAGGCCTGTGGCGAAAGATCGGAAGAGCGGTTCAGCAGGAATGCC
++
+B@?@6>@@@BA@>=???<@8=;/5??:>:9?,681849?33/,34/35'236.0
+@ERR005448.24672 IL40_2446:5:1:419:10/1
+GGTGGCTCATGCCTGTAATCCCTACACTTTGGGAGGCTGAAGTGGGTGGATCAC
++
+?@?ABB@@A@>AA@B@<6=;=>??;28@=<98:86>8:5,,953%34?5,//),
+@ERR005448.24689 IL40_2446:5:1:419:7/1
+AAAATAGCTCACCTTGAAAATGACTGTACTGAAGATAACTCTGTATACTAATGG
++
+??B?BC@@>@A>9<8=@AC?;A7>@:&18@94;B?AA?B3BBBB@BAB@BB;@=;@>29B@@?>=/)84??;6:9;>:=;;/
+@ERR005448.24938 IL40_2446:5:1:423:2/1
+AACCATAATAAAGATGCCTTCCTGAGCAGGTGAGTTATATTTGATCTACATTTA
++
+C==9@<<>><=?99/33/1-4:/;<;<;03-+5;45;846919954&-8?22
+@ERR005448.25220 IL40_2446:5:1:427:8/1
+GATATAGGAAAATTTAAGTGGTCTGGATAGACGATCAAACCAGCTACCACATTC
++
+C87=B=@B9:A6CB@=936?@8<><:3>824739=4175447773048;
+@ERR005448.25368 IL40_2446:5:1:429:10/1
+TGAAGGAAGGGACATATATAAATATGATTTTAGTATCAGAGAGATATTGTACAT
++
+884;A8)6<=@AEA;4A5:><@;A9=A=<4<<59:>;A118<:;/
+@ERR005448.25761 IL40_2446:5:1:435:6/1
+CGTGTGGTCTTTGTCAGGGAATGCGATTGGAGCAGCTGCTTCGAGGGCTTGTTT
++
+>>@>?;3=??BA1888;AA><8=9221>@;:7=;=:?=766?(<83;1'55''/
+@ERR005448.25822 IL40_2446:5:1:436:4/1
+GTGTGTGTGTGTGTGTGTTTAGAGAGAGAATGAGAATAGCATATTCTGTCTTAG
++
+>=97?6A8@8<5;B>=2<9>:?==39432)&7:;53,15)63.-1&11&&)/3,
+@ERR005448.25832 IL40_2446:5:1:436:1473/1
+ACCTTGGGGGAACAGCATGTATAATGGGCCAGAGGGCAGAGGCATGGAATGTTG
++
+B<@BB@???BB?BA>A===>A@B@B8;>A??788@;15><6@@
+@ERR005448.25847 IL40_2446:5:1:436:10/1
+TCCTCAAACTTGGCCTCACTGCTAATGATTCCTCGCACCCAGATGGTAGCCAGT
++
+BB@@>>??>@@?7@=@@?;AB=?8:@?<@B@?A;866;5;>A><<:47564)51
+@ERR005448.26252 IL40_2446:5:1:442:4/1
+GGGCCAGACATCCTCTCTAGATCCACCTTCCTCCAGGTGGGGGGGCCCCTCTGG
++
+64'7BB@@849>;97B@/82<:51682/'23343%)%5-0.//'4674,)*'12
+@ERR005448.26253 IL40_2446:5:1:442:6/1
+GGTTCTATTGCTGTGCAGTAGCTCTTTAGTTTAATTAAATCCCATTTGTCAATT
++
+9):;=@CCA3<;;.=:8=)7@B=>A9:2@B@??B=A?=?>3<@A99;9<@
+@ERR005448.26432 IL40_2446:5:1:445:6/1
+GAGTAGCCAGGACTACAGGCATGCACCACCAGGCCTGACCAATTTTTTAATATT
++
+;=??@@B@?A@A5<:9>>=@:?89);9+3;1&76958-89=<;>=?=>=;;18?
+@ERR005448.26770 IL40_2446:5:1:450:9/1
+TAGTTTGTATGTGAAGATATCCCGTTTACAACGAATTCCTCAACGAGCTCCAAA
++
+6<::?<<23<=?39>=9CC?5:=@3B:?7@<:;;-;;@><>>8&4958;6/(54
+@ERR005448.27287 IL40_2446:5:1:458:1/1
+ATAAATCACACAGGACCTATAAATCAAAATACAAGTTAAAAAACAAAAACAAAC
++
+?D@>;CA@7A7@>A?BC>6AC>67@BC:2
+@ERR005448.27477 IL40_2446:5:1:461:7/1
+GAATGGCATGGAATGGAATGCAATGGAATGGAATGGATTGGAATCAACTCGCGT
++
+?=9=B4<>@??>=>ABB@BA?>>AA=:=8@<;699638>B:25A9;;7==>'>4
+@ERR005448.27630 IL40_2446:5:1:464:6/1
+GTGGCAGGGATATCCTGGATTTTATTACATTTTTAAATATATAATCTACTTATG
++
+=D?CD@A=C:06>AA47<2>C?=B9:=C92;@B@/5-;;<>=5:@8B88@9-7:
+@ERR005448.27816 IL40_2446:5:1:467:9/1
+TCTCAGAAACTTCTTTGTGATGTGTGCATTCATCTCACAGAGTTGAACCTTTCT
++
+.1ACA>@9:??>@;<8=;A48?.8-+8>1;:A?;;A;41<:895947*1A
+@ERR005448.27926 IL40_2446:5:1:468:231/2
+CCGTCTGTCACCCCTTTCCTTGGCAAGGAAAGGGAGCTCCCTGACCCCTTGCAC
++
+A?8;>86:@89@B<<<@=<;;AAAA?29<734/9?0:
+@ERR005448.27948 IL40_2446:5:1:469:10/1
+GCCCACAAGAGAAAGCAGGAAAGATCTAAAATTGATACCCTAACATCACAATTA
++
+B>C>9;8/7A<;>6>@@@;:?2::<;A>>:6:;A?;8674:<;:;548-8=702
+@ERR005448.28360 IL40_2446:5:1:475:559/2
+ACCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCC
++
+'3(7752,5<<<9;9;@=(2435<359=:;<39<;<93//8(.(8.44(9669.
+@ERR005448.28595 IL40_2446:5:1:479:3/1
+TGACCATCCCTATGCAAATTTATTTGCTTGAGATTTTGTGTGTACTTTTACCAA
++
+BBACCCBCCCC?ABAA>;ACAABCCCBCA>2;=BAB?=9<:B?<7?AC<:976?
+@ERR005448.28974 IL40_2446:5:1:485:4/1
+ATTTTCAGCTGATAAGGTCAGCCAACTATGGTGACGTATATGATTTGCTAGGTT
++
+?::<9ACCCA??@A=8;;=A=@;B<+6=>,;7=:7<;:5&5@;?<;61=678<=
+@ERR005448.29096 IL40_2446:5:1:487:10/1
+AGTGTGTGACACATCTCTGGATCAGAAATGTCTTCCTTTCTACCTTTCACCTTC
++
+BB?B>BABB@@ABBBBBBBB?AB@A=9;AA;@BB?@BBB@B?=;AB@:7:
+@ERR005448.29605 IL40_2446:5:1:494:2/1
+CATCTGTGTGTATGCTCAGCAATCCCTGTTGGTTTTGAGCCACCAGTTATATAA
++
+BBBBBB@B>B>=?A;A><=:?<;>>=3=?A>@=6=826987;45/:986,
+@ERR005448.29747 IL40_2446:5:1:497:9/1
+GTAGGCTTTTTTCTTTTTTTTTCTTCAACTGTTACTTTAAGTTCTAGGATACCT
++
+C?A@<>;>CC978?@CBBBB=B1<>4.16==7=62<=9&-219,8+43&3/&)-
+@ERR005448.30132 IL40_2446:5:1:503:2/1
+TGTTCTCTCTGGAGGAAGGGAAGCCTTCCTGTGCACAAGTTTCACTCCTGTAGA
++
+@@?AAAABBA@>@?@=:>=<7;=?@?@?==@?<;;9=8=>><;<:7;=75:7
+@ERR005448.30173 IL40_2446:5:1:503:9/1
+CTTATTTTTTAGAGCAGTTTAGGTTCACAGCAAAATTGAGCAGAATGTACATCC
++
+CCB>ACCCCCBCBBA;ACCCCAC=CCCCAA@>91A?;7<=@@:?96BB@AA97>6%097<7:?0%,:;:2.,.33;.,%%45+'6'
+@ERR005448.30481 IL40_2446:5:1:508:11/1
+GCCCTTGAGCATCAGACTCCAAGTTCTTCAGCTTTTGGACTCTTGGACTTACAC
++
+A@>ABBB>B@5?=?=B>@>?;?=1=?<>8=57;<;949:
+@ERR005448.30528 IL40_2446:5:1:509:7/1
+TGAAGGCCAGGACCGGGTCTGGTTTTCATGGTATCCCCAGCACAGTGTCTGGCA
++
+B@@:5@B1?@68,8:79::74<72//9444'2..95361
+@ERR005448.30873 IL40_2446:5:1:515:6/1
+TTACTGTGGTATCCTATTGGTGAATTCATATTTCCATCTTCTTTCTACATTTAT
++
+?A;;CC=@=4=ACCBABC@<;C;:@CA;>>ABB;;6?:AB7@AA=@C?C@97:-09>=BB@B<25
+@ERR005448.31132 IL40_2446:5:1:519:6/1
+GAGTCACATGGTGAGTCCAGTGAATAACAGCTGGTGCCAGAGCCCAGAGCTGGC
++
+><>B@@@A?@B?@@@<@><9;?><@;04>=;69;2;5.-35496844-4.-40%
+@ERR005448.31318 IL40_2446:5:1:521:9/1
+AACCGCATTAACTCTTTCAGCCTAGGTGGATTTTCTTTTGCACATTTAAAGAGT
++
+@BCCC?BC@;;@BCCCC@>??::;A>/A=0;@?@=>>=??:2:6:@<3/5;9>=
+@ERR005448.31331 IL40_2446:5:1:522:3/1
+TAACTGCATTTCCTTGACTATTAATGGTTTGAATACACATTTACTGCCATTTTG
++
+BA=AD@@:@CCCCCCCBAD?DBAAD@@@CA:>ACCB?;>AB@@BBC@>=A@BA?
+@ERR005448.31564 IL40_2446:5:1:526:6/1
+AATGGCAAGGTAGCTCCTAGATTCACTGATTTCTCTATCACATTGTATAAACAA
++
+;6;8==8:89;>:;98;@8:>14./788)6;9/44781*57
+@ERR005448.31971 IL40_2446:5:1:532:5/1
+GATGACTGTGTTCTCCCCAAAAGACACCAAGTTTCCAGAACGCTTGCATGGACA
++
+@>@BB>@?=??9=?5:94<><<<17:?8&8:./'57<>:4:=4:8:9588
+@ERR005448.32464 IL40_2446:5:1:540:11/1
+AGGTTACACAAAAATGTATAAAACTCAATCTTTTTGTTTTTATGTGGAATCCCA
++
+?ACB@;@<@@@;:@CB7?B=9?7;B@@AB;CC?CBCBECDC@CC:@>/;;9??C
+@ERR005448.32625 IL40_2446:5:1:542:8/1
+TTTCTGTAACTTTTATTATTTTATGTTCTCTCTCATAGAAGTGTATGTTTCTGG
++
+:ACCCA<:=ACCA@AB>:ACCCBCA>BBC@CCCCB>;@6<6)=1<,@5>A8:29
+@ERR005448.33066 IL40_2446:5:1:549:7/1
+CGGTAACCTCAAAGCAAAAATCCCATGAGAGATACGCACACAAAATAGTAAACA
++
+51589>@?8319=?>891(457BA@?@;7<=A9?>:>;=14@=><<<885'8
+@ERR005448.33311 IL40_2446:5:1:553:6/1
+TGAGGCAGGAGAATCGATTCAACCCAGGAGGTGGAGGTTTCAGCGACCCAAGAC
++
+>>B@?@<>>@7,*4;(32144;94,,9,<9,*-*''/'7'()%2&.1,'7
+@ERR005448.33378 IL40_2446:5:1:554:1835/2
+CAAGAAATTTATACTTCAATTATATAAGAAACTTTCAAGCTGTTTTCCAAAGTG
++
+BAA@<<=BCCCCBCCC><>BCCCCCAAAB@@@BBBB??C??C;?B<@?<67@4;
+@ERR005448.33526 IL40_2446:5:1:556:9/1
+AGCTTGTTCCATTGTAGGCTAAACCATATTTGTATGTTACATAAGCATATAATA
++
+@BCCCCCCCBAABA6A@ABAABCB?>A=A@A?>>AB?AAAA?><><9<7:;9
+@ERR005448.33867 IL40_2446:5:1:562:7/1
+CATTGCAAAACCCTGTCTCCACTAAAAATTTTAAAAAGCAGCCACGTGCCTGTA
++
+=:?@C>6=BA?>??A=BC?=5;C?>=;?A;@BAA???<7AA?<<:;0;83:@5,
+@ERR005448.34122 IL40_2446:5:1:566:11/1
+TGAATGATATGTATACACATAAACATTATACAATATCAATAGTTAATGATCAGA
++
+@CA><>B@B@ACBCA@A@:'=B>;=5:=>>A5<9:86
+@ERR005448.34386 IL40_2446:5:1:570:8/1
+CGGAAGAGCGGTTCAGCAGGAATGCCGAGATCGGAAGGGCGGTTCAGCAGGAAT
++
+BBB:8;/;A>3'2A@A7:<;274>>@A;?71';>6.3%62:4)/-6452672**
+@ERR005448.34441 IL40_2446:5:1:571:2037/2
+GCTGAGAGTGAAAGAGAACAAAGAACTAATGTAACCCTGGTAGATCTTGAGAAA
++
+BDC>8=<<:BBAB@CBA??BC?@CC=B;?BA???>?1@??5@?A@@@@@@@;4>??;29@?>>>==;=>>?69=>=39:13771
+@ERR005448.35028 IL40_2446:5:1:580:6/1
+AGATTGGAATTGAATCAAGGCAGCCTAGTTTCAGAGTACATACTCTGTGTTTTC
++
+?==AA=?A<>CA<<<==?@;9>:CA>;9;=966>5=9>6;;86?A/<2<;8:9729:)749;;=:36-&':;1-3402'7;13-*2'155:61/-)
+@ERR005448.35380 IL40_2446:5:1:586:1/1
+AAATTACTAGAAGAGATATTCAAGATCGGAGCAGAAGTAAATGAAATTGAATTA
++
+A=>AB6>=BABBB?-9?;=77?296:BB957=??6:<:=
+@ERR005448.35470 IL40_2446:5:1:587:11/1
+TCTACCTCTTCTACTAGAGTTAAGCTCACCAAAGCAAGAACTCTTTTATATCTC
++
+A;=28=;C<4;;=?;A?.?)=AAC>4@@;;;8;?=7:8):=9>?9?>=7=<0;;
+@ERR005448.35791 IL40_2446:5:1:592:5/1
+AACCCTAATGTATACACATTTATGTTTACTTAGAAGGTTTAAAAGACCTTCACA
++
+>A?AB==@BAB=>>=<:5;<>?AB@CA<@@B@AA:?<18(7&
+@ERR005448.35875 IL40_2446:5:1:594:10/1
+TATCTAGCCAGTGATAATGGCTTAGCATTACACGGTTTCTTTGTCGCTGGCCAG
++
+>=<@@>2?=?=88>;:==9<74985:::60'77/4-5
+@ERR005448.35908 IL40_2446:5:1:594:2/1
+TGCATATCACAGCTGGAATATCCTGCCTTTCTTTAATTAAAATCAAAGTGCCTG
++
+CC?9;?C?;@:9ABA?>A<>B@A=ABA@B=BAA<34A7.72/9;-51;.;993:
+@ERR005448.36270 IL40_2446:5:1:600:9/1
+GGGAAGGCATGCCTTTTTCATGGCATCCACAGTGAACATGAGAAATTCATGGGC
++
+@@;+6>==;???97??@AA@;<:<>@;605::2579.3;4)40,)'<2-7982/
+@ERR005448.36506 IL40_2446:5:1:604:4/1
+CTGGGTTTGAAGCGTGGCTCTGACATTTACTAGCCTGGTGCCCTGGCTGAGTTG
++
+BBBBB5<<=89@@86819/9:
+@ERR005448.36684 IL40_2446:5:1:606:5/1
+CACTATTACAGGCCAGGCGCAGTGGCTCATGCCTGTAATCCCAGCACTTTCGGG
++
+BBABBBBBBBB?BB=@@=<@>:,>B>A@96?<>>:6;609=8&44%459@86<8
+@ERR005448.36772 IL40_2446:5:1:608:3/1
+GCATGATACTGGCACCTGTTTGGCTTCTGGGGAGGCCTTAAGAAACTTACAATC
++
+B@?B=1>0;=9>A@A>>B=;7AB?>@<<>=AA<=609;=85>079596845'16
+@ERR005448.37117 IL40_2446:5:1:613:1/1
+AAGAGGGGGTAAGGGCTGAAAATCTTCCTATTGGATACAGATGTTCACTATCTG
++
+<@B@A?ABB:ABBBBB<9AA@@BBBBBB@?=BB;@?8&1<9;=::99=7:=6<9
+@ERR005448.37264 IL40_2446:5:1:616:6/1
+TGGCACTAGATAAACCCACTGAAAAACATTATCAACAGAAGAAAGGATCTAGCT
++
+:AB=CA?9=?;:413&9)9=>7@:87+=>28;:;/;56),.3<6;1613--69)
+@ERR005448.37421 IL40_2446:5:1:618:10/1
+AATGGAATCATCCGGAATGGAATGGAATGGAATGGAATGGAATGGAATCAACGC
++
+@:@5B<89>:8906?:617;3:*A7'/014652:0-'5=6/5;054.63.106.
+@ERR005448.37429 IL40_2446:5:1:619:2/1
+TCCTCTCCCCACACCTGATCAGAATGTACCAGCCACCAGCCCTGTGTAGAATTA
++
+>>B=7=66=9+?>><==<@A45?:9;:;6==:;:7;*65&5//054/55
+@ERR005448.37699 IL40_2446:5:1:623:5/1
+AAAGGCTGGAGTAGATGGTGTCTGATTTCCATAGGGAGATCGGAAGAGCGGTTC
++
+1?BB@>@@@@@==?AA@@@@B@>?B@@:6>@><>9=>@@?=8=?>;1:<*63
+@ERR005448.37933 IL40_2446:5:1:626:10/1
+CTTTAATCCATCTTGAATTGATTTTTGTATAAGGTGTAAGGAAGGGATCCAGTT
++
+ACA8?A??AAAC>CBCCCCBABCCCCC=<@B@@?;@?5'8@:>A@B?<;=;A
+@ERR005448.38331 IL40_2446:5:1:632:7/1
+CTCATCATCACAGACCTCAGACAGCGGCAGGGGACCCGCGGCACCCTGCTGGGG
++
+@A78+'7@31.78830=>?;85@?=2774%6*.840'+3.''%,&0+,043.
+@ERR005448.38609 IL40_2446:5:1:637:1/1
+GATTCCATTCCATTCTATTCCTTTCCATTCCATTTCATTCCATTCCATTCCATT
++
+C@A=?9B@?ABBA@@8:=@?:C@=B>A>CB5=4;<@>=:>=9.9524<==
+@ERR005448.38749 IL40_2446:5:1:639:9/1
+GCGGAGCACGTTTTAGCTGGAGTGCTTGGTGTGGTGTGTATTTGGTTTGCGCTT
++
+@BB>8?@9?A?AA?8>?@@@4><=6@A?<0:4@?8?9:,.14938*5;8/9/8:
+@ERR005448.39069 IL40_2446:5:1:644:1/1
+GGAAACATTGACTTTGGGTTGACAATCACCCGTTTGCCCTCTCCCTACTCTTCC
++
+:;6>6=A6/.>7'16=@B92=;2=<7'/4:?(95>;;67==>=>619?@@>@
+@ERR005448.39097 IL40_2446:5:1:644:1523/2
+GAGCCTCGGGTCTTCACCTCTCCCAAGGACCTGCTGCATTTCGGGAATGAAAAA
++
+*?099A8(800A<(9<&4?6=6:@@@:28;?@A?:68A;>8=8224/<@945;5
+@ERR005448.39166 IL40_2446:5:1:645:7/1
+AAAAAGAAGTGCCGCTTCAGACCAGAACAGGCCTCAGATATGAACCCTTTGTTT
++
+@A=B8=?A:'@?;?@B?=??>@?>@@9=69:5<75479969:941/10,2
+@ERR005448.40296 IL40_2446:5:1:663:10/1
+AGAGGCACAATCTCCAGAGTGACACAGGGAATGAAGGAATCTTCATTTCCAGCC
++
+>?>>?>=??7;@@B=>>>@?>AA?<8>?>1<8;59?@2-85/7;39=>923929
+@ERR005448.40323 IL40_2446:5:1:664:582/2
+AAGCAGCTGGAATAACAGGCGCACGCCACCAAATCCAGCTAATTTTTTTGTATT
++
+0081(;C>>0;;8=@<>?B::82=??4>87'4@;B>:=688B;;:<>=1:BA
+@ERR005448.40371 IL40_2446:5:1:665:4/1
+TGTGGGCATGAGGGTGCAGTGGTTCTGAATCTGGCTTCAGGTTCACACAGGCCT
++
+BB?@@@@?.?@>9B>@@@B?@AA@@<<@?>=93;@9;884'6@;.;0929;:.,
+@ERR005448.40432 IL40_2446:5:1:666:667/1
+CCGTGCCCAGCCGTAATTTTTTTCTTCAACTTTCATTTTAAGTTCAGCGGTACA
++
+AB?>@@CC@CAA?A?;?CA>@CCC@??A>BCCCC>>A=@B>7?B=??B;5/>;8
+@ERR005448.40807 IL40_2446:5:1:671:1/1
+GGATTCTTCAATACATAGCGATTAAAACAAAATGATTGTACTCCAAGTACAGAA
++
+;CC>4?;4?7==@@AABB<*6;?A<:(/>?<:7B@@:@:11387))61:0;@7*
+@ERR005448.40884 IL40_2446:5:1:672:6/1
+AGAAAGTTAAACATAGAGTTTCCATATGACCCAGCAGTTCTGCCCCTACGGATA
++
+BB@A@?B=A??B=-==7209=>=7;8;?49*547:5&3).'5&&1<45)2)/8<
+@ERR005448.41058 IL40_2446:5:1:675:11/1
+TCTGCACTGCCCTAGCAGAGGTTCTCCATGAGAGTTCCACTCCTGCAGCAAACT
++
+A?9?@>@@?>A=:@@@@?>1?3;8;@@@?>:>4?6=;7.1=(:688:;29,44;
+@ERR005448.41136 IL40_2446:5:1:676:5/1
+GTTAGTGTAGTCCCACTTGTAGGGCATGGAGAAGACAAGGGGTTCATGTGCTCT
++
+93@>94??>A8>@9@@>:5*<9>9:;37A:A;;?8:/,9A:8*1.3897B8'6:
+@ERR005448.41207 IL40_2446:5:1:677:8/1
+ATTGTGAAGATTTTCTCCCACTCTGTGGGTTGTCTGTTTACTCTGATGACTGTT
++
+@BBC@CB5B9ABCCC@CA>@>CCCCBCBA7AC=?BA@>@9?=<=;8?<59?><6
+@ERR005448.41359 IL40_2446:5:1:679:5/1
+GATGCTTTGAATAGTTTAGTAAAGATAATTTTCTTGAAAAGCATGCCAATATGC
++
+?=CC>9>>:4@@7?@48;?@?@=A>;:3A<@?CAA@82<;9;:>AA9=6;:>6,
+@ERR005448.41541 IL40_2446:5:1:683:8/1
+TGAAAGCAAACATCCCATAGAATAAAGGGCAGGTGGGGCACAGTGGCTCACACC
++
+A=8>??@;*:><;@@;3=8?:7=@>6;=<8;?;-;?=9765)8,5=;28:8;78
+@ERR005448.41554 IL40_2446:5:1:683:3/1
+ATATTTTGGGACACTTAAAAGTTGTGGTTATATGAGAATACAAAGTGTCATTTT
++
+:@,>C?B?>=<@AB?>;>>;;B=58@@=>;:869257:242'4'2+5))292'9
+@ERR005448.41978 IL40_2446:5:1:690:7/1
+AGGGGCTTAGGAAATATCCCGTGAATTTGACAGAGGTCTGACAAAATTAGTTTT
++
+:ABCC?C?6>=>:AAAACB@A=?=CA;A@<>A>7?57?AA><9(/7=A?;:=A>
+@ERR005448.42057 IL40_2446:5:1:691:10/1
+TTAAGGTTGTGTTCTAAATGTACCTCCACCTTACAAATGAAGAAACTGAAGAAG
++
+=A<=@7:B7;>>9&9=:=?97==>8>:49&7;5;91;.86&8/&/,395596/:
+@ERR005448.42344 IL40_2446:5:1:695:11/1
+AGAACAGCTCAGTACCAAACTCTGAGAGCTGGCATGTTCAGAAAAGGCTTTCTT
++
+BBA;A?A@BB=B;:;?@<@@@BBA8?3?A>A@9;>B7=6/7:511<5783;<9=
+@ERR005448.42602 IL40_2446:5:1:699:11/1
+AACCTGTGTCTCATTCACTGGCTCTGCATCTCGTCTTCCGCCCACTAAACATGG
++
+@);B57*8=A@@@:@A8:=5>B8?:88?=;83(-'88/&36;&&7&&,5;64/'
+@ERR005448.42641 IL40_2446:5:1:700:8/1
+CCATGTTCCAGGTGCTGTAAAGGGAGCCACAAATACAAAGATGAGCCACTAGCT
++
+B?;@A@@@A>;<>>8;<:39:9696::6797574/&3057'22/
+@ERR005448.42688 IL40_2446:5:1:700:1/1
+TAATTTACATTCCCACCAACAGTGTATAAGCATTCCCGTTTTTCAGCAGCCTCG
++
+AB@BBBBBBB><:>3<@?99>6==807?A<9=857>738=9:6
+@ERR005448.42837 IL40_2446:5:1:703:11/1
+AGATTGCTTTTCCTAATGTGAGTGGTCCTCATTTAATCAGTTGAAGTCCTGAAT
++
+BACCCCCCCCCCC?CCCCCB8BB?4?@=BBBB?=<??==:68<=9A:7>>856;;7995943
+@ERR005448.43153 IL40_2446:5:1:708:7/1
+AGTATCTGTAAAAAGTAAATACATGATCCTGGATATTTGTGTACCAGAAGGGAG
++
+::>C@@:C49==@==:>==@C@@=<6'6@?@?3===836<>889@:7)+8>6.8
+@ERR005448.43317 IL40_2446:5:1:710:11/1
+GACCAACAAGCAGACTATAGCATATTTGGAGTCACTGTATTAGGATTTTCCAGA
++
+BAC???CB>??8=0<<0=<>>=A8@B?A?6?9@=6<;58<<;;2-1===8133-
+@ERR005448.43526 IL40_2446:5:1:713:7/1
+AATTACCCTAAAGTCAACTGATATTAGACCTTAATTATATGTGCATAATGCTTT
++
+=CACCCEBC:C?<8@*:;CD@A@AC@C:B@@?;9;?@@@>><>>;5>606;604;;787)4)64,7,'4',6%466
+@ERR005448.44238 IL40_2446:5:1:725:6/1
+AACTGTGCTCCTTATCTACAATGTAGCTCCTATGGTCAGACCCTGTCCCGCAAG
++
+9/?@@>7@>AB@@BAA79?>=>>7978;<37-4;7/33158:314'8731/,..
+@ERR005448.44649 IL40_2446:5:1:731:6/1
+TCCAGATCTCCTCATGGTAGAATGGCAGGATCAGCCAGGCATGGGGGGTGATAC
++
+BB@A>@@BBB@A?:@?B?<:A=;=A;6<@?87==?:;>75:7,7:=9><;:;@391?885<
+@ERR005448.44821 IL40_2446:5:1:734:6/1
+TATAGATTATATTTATTGAGCTTCCATAAGTATCAGTTATCTTCCAGGCACATT
++
+CCC@A=>AC@A@ACC>?@@??=9AC?C?A>3=C=@4;>@@5?9:<:776<>4???3;;8793-=?A@9;8)5;;95=6/)83-1/)1;98/'
+@ERR005448.45246 IL40_2446:5:1:741:9/1
+ACAGTGGCAAACACAGGCAAGAGGAACATACCACTGTGGGGGTAAGGGGAGGAA
++
+B@BB*BBBB>>?15:=4B;5:7;;-(;:;:=167==.:?>54&1.::>5&58,3
+@ERR005448.45445 IL40_2446:5:1:744:1661/1
+CTCACCCATGGTGGGTCAAAGAGGTATGGAGAAATGTGAAAGAAAAAGTTGCTT
++
+B@B=,8?=?>A-ABB.BA4<>-/=A?:B<57=97<:;6=//6>/9
+@ERR005448.45488 IL40_2446:5:1:745:7/1
+AAAATACATCATAACAAAAATAAACAGACAAGCAACAGACTGGGGGGAAATGTT
++
+=A8@A?=CBA>@BB@;<;BCCA>>B?C>8=?>?<0=<==:9153592:
+@ERR005448.46100 IL40_2446:5:1:755:2/1
+AGACCCTATACATATTTTATTAGGCTTATACCTTAAGTATTCCATGATTTTTGG
++
+BBBCABC>65<0:<5@A<<>CAAC?<>;?9?C?=B;?=?@7@@?>@CA?@8/
+@ERR005448.46486 IL40_2446:5:1:761:10/1
+CAGGCTGGTCTCAAACTCCTGACCGCGGGTGATCCACTCACCTCGGCCTCCCCA
++
+B@><7>AB0@>AA<09BA@@??B@;>?@?8@===>>>0>:8A8;686:,0=621
+@ERR005448.46574 IL40_2446:5:1:763:2/1
+CCTCAGGTTTTTTCTAGAACGGGATAGGCTGGGTGCGGTGGTTCACCCCCGTAC
++
+;@0>::?=9?@BBB?:?<7<<=?<;?9??<><<@<795'.6''44,.6.'.'6'
+@ERR005448.46719 IL40_2446:5:1:765:6/1
+AAATGGAATCATCTAATGGACGTGAATGGAATCATCATCGAAAGCAATGAAATA
++
+B;?ACCA@AB?BCC@9?A@:@?6>A=;>=8=;>=;6517:;871:7:778&63<
+@ERR005448.46926 IL40_2446:5:1:768:1355/1
+CCTCCCTCCTGAGTTTTACCCCTTCCTTTACCATGAGGTTTATCACTTTAAGCA
++
+@@=BB=??>4?;A7?B:BB;7?@BA:;:;A=@B?=698:;67??
+@ERR005448.47202 IL40_2446:5:1:773:7/1
+ATAAAGAAAGAGAGATTTAATGGACTCACAGTTCCATGTGGCTGGGGAGGCCTT
++
+>=68==?4(8=>0>><:;?><6<;==;<8;76)6913+8
+@ERR005448.47314 IL40_2446:5:1:775:11/1
+AGGTCTAGCACTAAGAGGCACTAAATTTGCATCATGGACCTCTTGACCTGCAGC
++
+<70:>9@AA@;?979><;==><92;:9493979>2<71:529:3-5=<;73)5'
+@ERR005448.47437 IL40_2446:5:1:777:9/1
+TGAGAACATGCAGTGTTTGGTTTTCTGTTCCTGTGTTAGTTTGATGAGAATGAT
++
+??@A?>>>===-<9==CAA@A@<<;<AA;=>>5:37:=79
+@ERR005448.47910 IL40_2446:5:1:785:3/1
+TTTATTCATTTGAACTCGAAAGGCAAGTTGACCTCAGAAAACATCTCACCTTTC
++
+BB@CB>??ACCCB?:?=??CC@AAA=::-645=:6*8>@:/6
+@ERR005448.48236 IL40_2446:5:1:790:5/1
+TTCTCCAATTGGTGGTCCATCCGATTTTACAGACTATAAACCGAAGACAGAGAC
++
+B@BBBB;(8?BB@?<7?=35?==1=?<>9;9548538896594+2/+857.)+7
+@ERR005448.48274 IL40_2446:5:1:791:2/1
+CAGTGGTGCAATCACGGCGCACTGCAGCCTCGACCTCCCACGCTCAAATGATCC
++
+@<>4@B:B@@>@<:<9:5?@@?9<848>951-&44,716-%.1185/%0441.-
+@ERR005448.48402 IL40_2446:5:1:793:7/1
+AAATACTAAAGAAAACCAATTATTAGATATCAGATATAGTAAGAGGTACCTGAA
++
+CDC:?=??@;>BA8A9?><<7>@6:A96684@<5.77<
+@ERR005448.48656 IL40_2446:5:1:797:8/1
+TGGCCCACACGCACAGGGCGCCATCCCTCTGATCTTCTCCAGTCCCCCTCCCCC
++
+;>?39>@@4-0<>>856?6<6:67A67:;;0%,20.@3)4,&<3'/4@(67<3,
+@ERR005448.48675 IL40_2446:5:1:797:5/1
+CGTGAACGTATGCCTGACTGAAGGTTCAGCTGCCATTTACAACAGTGAGGTTAT
++
+BBB@>=?;6>;;ABB@@;;89;><<>>9:=9=@5,99;=;:6247.9197&7/7
+@ERR005448.48808 IL40_2446:5:1:799:7/1
+ATTATAAAAAAACCCTCACAAAGGTTTCTGAAGTACTTGCAGTTTATGAATTAT
++
+C?BDB=A<@3;<>@C9@A=9;19<9=?=;@<<>;=;:8:7330989;?99:05/
+@ERR005448.49167 IL40_2446:5:1:805:5/1
+TGTTAGAAGGACCAATTCTGCTTCTGTATTTATGGAGTAAAAAGGGATGGTGAA
++
+1;A>7<4>=?>=;83616?=;@>@?999<@@=<<.77-7;57;6=7365'/785
+@ERR005448.49266 IL40_2446:5:1:806:7/1
+TGCTGAAGCGCTGGCTTGTTCTGCGGCTTCCTGGGATGTGAGCTAGAGGGAAGG
++
+BBBB>BBBA@?B??@A@:<>@A?????8>?@<><7*2;/4)6)0895987%%47
+@ERR005448.49519 IL40_2446:5:1:810:7/1
+CCACACAATTAACCCCTTACTATACTGCTCTCCCTAGACAAGCTTAGCTAAATT
++
+CCCA6>>:ABBABCBB???;-;=?@=>=?@@?>7)673276994:55/)3/
+@ERR005448.49536 IL40_2446:5:1:810:919/1
+GCTCAGACCACTGGCTGAACCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCC
++
+BBBB@?>?;88>?<@<<>:<@@@@??@@??A@@@@@@@@AAAABAAA@A@A@AA
+@ERR005448.49570 IL40_2446:5:1:811:10/1
+TATATATGTACCACATTTTTAAAAATCCAGTCTGCTGTTGATGGGCATTTAGAT
++
+CBCC:?@C8C>@><;A==@?<7;@B6>9<:.6:=@78841/49;67,647-228
+@ERR005448.50062 IL40_2446:5:1:818:4/1
+GGCAATTTCTTAAAATAACAATGAAGATTCCCTTATCAGTTGACTCTTCCCTTT
++
+B>ACA=CACBC=A;9@?B@6)11:9:(:;+7,742=?:.9==982>54'3):77
+@ERR005448.50368 IL40_2446:5:1:823:2/1
+TTTGCTTGTTTTGTTTTGAGAGGGCACACACTGAAGTCTTTGAAGCCTGAACTC
++
+@?BB;=>36AB;6>A?<:6B<8>897:94<@8;47,2=.-722'/8
+@ERR005448.50566 IL40_2446:5:1:826:3/1
+AACTGTGGGATTTTTTTTTAACTTATTTAATCTGTGCATCAATAACATTGCTTA
++
+A>CDCACCD@A@CCCDBCB>BCDCDBCCC8ACA?=DBDCCA@DC<@A??CCA?B
+@ERR005448.50606 IL40_2446:5:1:827:6/1
+ATATTCCATTAAAGGAGTCCACTTTGGGTAAAACTCTTCACACCACTATCTTGT
++
+@@C:6<>A=:7,/;;5>897?;:/7'96;>;=:=61/9.9>5*:9
+@ERR005448.51299 IL40_2446:5:1:838:8/1
+TAACAAGACATAAAATACCAGGTTAAAGACTATCTGGTCATCATAAGTACATGA
++
+CA>@;?A==9>/>;==>?<<:=77>>63(7<6=:5(:55;1592-)9:7;87
+@ERR005448.51337 IL40_2446:5:1:839:4/1
+TCTCTGCAGATGCCTTCACTGCTTGTACATAGAAAAGGCAGGACCCCCCCCGAC
++
+073:AB<67:>=..?@@8::084?44::4,6.959/3/9(3&4'7...%%/3
+@ERR005448.51363 IL40_2446:5:1:839:11/1
+ATGTGACCTCTGGTGCCAGAATGAATCCTGACTCATCCACTCAATAGCTCTATG
++
+A>;?9;?ABB<@>9@B>>@777>078@::@2=944;@=;64;3&/-2943.0+.
+@ERR005448.51418 IL40_2446:5:1:840:6/1
+AGGGATGGGTTGGGCTAGTTATCTGCAGAAGGGGAATGTCCTTAGGGCACAGAT
++
+AABBB=41B;=@>=A6)(;;A>;8<;:)(9;9)711/5207;;4)/3(&&-,.-
+@ERR005448.51576 IL40_2446:5:1:843:2/1
+ACCAGGAAATGACACAGAAGCCTTTGGAGTGGTGCCCAAATGCTCACGTAGGCC
++
+BA?3::<@>;@@?9?64<;3/17,&5:;7'97*6=<8/576779/66/)2.24,
+@ERR005448.51923 IL40_2446:5:1:848:8/1
+TAGCCACTGGAGTACAATAGTCAAAAGGTGAACACTGGAATGCCAGGATATCTG
++
+@@?@BABAB<2>:+=AC;@?4;@@C?7:=ABB;67=;3?=:=:69;=9:6-79;7)7>?B?5,8/
+@ERR005448.52194 IL40_2446:5:1:853:2/1
+CTGCAACATGTGGCATCCTCCACCACTCCCCTTTGGCGCCCACGTGACAAGAAG
++
+@BBABB>7<>3><=654>?9?<<:8>3>A@<21'4/%,696/-)%..-%-,/*)
+@ERR005448.52269 IL40_2446:5:1:854:5/1
+GGTGGCCCTCTTTCACTGTGGTTGGAGCCTGAGACTGGGATGAGATCGGAAGAG
++
+9<,<9@AB@BBBB@?<@@>:?9@>:6:<90;39.9;5591/956,2372/)6)4
+@ERR005448.52466 IL40_2446:5:1:858:6/1
+AAATGCCAATGAAATATAAAACTCTGGATAGAGTTAAGTGACAAGGTACTGATC
++
+=8;AAAA=8?A<>>?><66?A@AAAA<><:<;:;;=497:;697/578=:7;
+@ERR005448.52915 IL40_2446:5:1:865:10/1
+ATGAAATGGAATGTAATGCAATGGGATGGAGTGGAATCAACCCCAGTGGAATGG
++
+AB@A7<>=;=<>?<8=;@>8;=@?@<><9-6?::9:99;=;>:9&451/1;=
+@ERR005448.52917 IL40_2446:5:1:865:7/1
+CTTAGTAGATAAAATAGCTTAGTCATCGTTTTGTAACTTATGTGCCTGTTTAAT
++
+?A=<>9?A8>?;:>=;>BB<3=8=3;?@;B=@;4:77@;4;?;=::??92;71=
+@ERR005448.52975 IL40_2446:5:1:866:4/1
+AAGAGGTTGTGTGGTTATAATCTGGTGCTGGGAAGCTTAAATGGGATAATGAAC
++
+A9@7:=48@415<@3:659463,:4-5)+466(10+,+00078405/+/),,,2
+@ERR005448.53533 IL40_2446:5:1:875:965/2
+GTGATGGATTAAGGTGACAGCTAAATATGGATTAAGGAGGCAGATGGATTAAGG
++
+BBC??=A76/;;7>@@:;:>;:9-8?==?>99;8?@?9;=:<3>7=>
+@ERR005448.53710 IL40_2446:5:1:878:5/1
+CTAACCACAAATCTGCTTCTCCTACAGATTTTCTCTTCTCAAAAAATAGCAACT
++
+CA=<=<1:==:<=?@@>:?=<8:99/7<;;:=9=<=<=4-5/310/160*.)
+@ERR005448.53773 IL40_2446:5:1:879:2/1
+GCCCAAAACCTTCAATTTGTAAAAAACACACTATCTGTGAAGTGCAATAAAGAA
++
+>@A>916:2;A@A>8>A@<9>?736<@@@7'8?99;8&77/(259:76>528&1
+@ERR005448.53905 IL40_2446:5:1:881:8/1
+GAGACCATCCTGGCTAACACGGTGTCATTTCTTACTAATGAGTTAGACACAGCC
++
+?=;;>@>?B9':B@>=9@:><;2>3;66<<@===78016705707;4.6763:;
+@ERR005448.54250 IL40_2446:5:1:887:6/1
+TTTATGCCTAGTGCATCTGTGTGGTGGCGTATAATGGTGTGCCAGTTTGCATTC
++
+@>@@@@B@?@@2A?7?@@@>?=??9??=?<=:28=69199<:4&87675/+/7:
+@ERR005448.54682 IL40_2446:5:1:894:8/1
+AAAAGATGTGCAACGCCTCCACACTGAAGACTACAAAACTGATAAAATAAATTA
++
+<9;CCCCACAB@=CBCCAB=8=7:>?@A<55:5=916;A17118:681+=>1/>
+@ERR005448.55300 IL40_2446:5:1:904:8/1
+ACTGTTGTATTCTACCAAACATTTAAATAATTAGCAATCCTCAAACTCTTCCAA
++
+C?4@?BB?;ACCCCC@=<;=5?BA>B?A:;>;7;@<56;;:793.4<509=65;
+@ERR005448.55515 IL40_2446:5:1:907:7/1
+CTATACTGTTAGTTTTATAAAATATTCTGATCTCACTTTTGTGATGAAAAATAC
++
+BCCCACBDBC1>CCCA?AD?8??4AA2>C;??3>??CBCCC?C;?BB<--9C==
+@ERR005448.55974 IL40_2446:5:1:915:6/1
+TCTTGGTAAAGGCTGTGTCTGCCAGAACTCTCCACCACAAATTTACTATTTTTC
++
+ABCBCC@==@@BCAC?58>=>B<46)1<<=???3;A??425;<===<8;A=?B?
+@ERR005448.56116 IL40_2446:5:1:917:11/1
+CTATCTCTATAATATATGTGTGTGTGCGTGTGTGTGTGTGCATGTGTGTGTATG
++
+C@<=B@@@8>A<;7=ABBBBA@?@B<516A:;9;8=5>7>5/895@37/>/55/
+@ERR005448.56193 IL40_2446:5:1:918:7/1
+CGGTTCAGCAGGAATGCCGAGATCGGAAGAGCGGTTCAGCAGGAATGCCGCGAC
++
+BB?>BBBB>48>@89@@@B;B?A=@4%%6%4:?<198354).6/%/-486+3%-
+@ERR005448.56432 IL40_2446:5:1:922:10/1
+AGTCTACACATCCTGAATGTTAATGTGCATTTTAATTATGTGAATTTTAAAAAT
++
+CD?@B@A9D<=?@AC>A?D=>;3;B,@=19=CAAABBAAB=CB??=2:@>AAA9??>5=>8/5>8@
+@ERR005448.56611 IL40_2446:5:1:925:6/1
+GTTTATCTGACTTTATGACAGGATTTACCTAGTAAGATCGGAAGAGCGGGTCAG
++
+B@B<2@B@B>@BBA9BA4=3;@:?B<2;<<2=:5<@=956=;=5&8'8443
+@ERR005448.56615 IL40_2446:5:1:925:1/1
+GCAAGACTCTCTCAAAAAAAAAGATTGAAAAGAAACACGCAAATGTATATAGTG
++
+CACA?>BACCCCCC>>9;=7=AAA@C@<<>A=7;<.9=5<>46B<6>@A<<>=5
+@ERR005448.56822 IL40_2446:5:1:929:6/1
+ATGCCAATTTTACATGTAAAGAAACTGAAGTTCCCACCGGGCACGGTGGCTCAC
++
+=@BBB;;?<@===?<=@;;?>@@@>@?;;@@A>6<=?>>?<>=64><80-1?
+@ERR005448.57044 IL40_2446:5:1:932:9/1
+GCTTATGCCAAAAACAAAGATCCCCCAGGCAGAGGCGAAACATGATATTTTCAA
++
+@7>B;>=?A;11.67A@9;89=9<@=2;<65&2@:87-4776'76904587,),
+@ERR005448.57199 IL40_2446:5:1:935:5/1
+GCAGGCCCCTGACCTTCTCCTTCTCTCCTTTCACCTGTTCCTGCCTTTCTGATT
++
+=>:?@AAA>AAAAA@>BAA?:?A@?7>@>87<:87?A@4*5>
+@ERR005448.57402 IL40_2446:5:1:939:11/1
+GATGTGTGCCTGAGTTGCTCATGTAAACCGACTTTGAAGGAATCAAATCACATT
++
+B=BC9B;@BB@?:?=BABBCAAA@<68=>;59==@=61:703483337;<<=:9
+@ERR005448.57440 IL40_2446:5:1:939:616/1
+CAACCTCCGTACCCTGGATTCAAGCAATTCTTCTGCTTCAGCCTCCCACGTAGC
++
+?:>@B=88:<::;<;>835<<:53<<6:3:2&3/137
+@ERR005448.57450 IL40_2446:5:1:939:2/1
+CACCTTCTCACTTTCTGGCACAAGATGTTCCAGGATCACTTGTATTTTCCCTGA
++
+@99BBB@A<8==AAB=A>AA?::>6:8*5<;;=9259,8=9;0;;;:9=<;513
+@ERR005448.57718 IL40_2446:5:1:944:4/1
+CCATCGCACCCGGCTTTTTTTTTTGTTTTGAGACCGAGTCTTGCTCTGTTGCCC
++
+B?7?BB?6?BA@@?AAAAAAABB@?@<651&4;5.76777-79:63077266
+@ERR005448.57751 IL40_2446:5:1:944:7/1
+GGCAGGAGAATCGCTTGACCCCGGGAGGTGGAGGTTGCAGGGCGCTGAGATCAC
++
+@9?::<3;?<7;.6&69<>=6<6.66*07-97,0'2-'%3&0104,4%3//4
+@ERR005448.57883 IL40_2446:5:1:947:8/1
+AAATAGCACCCTCAGTATTTCTAGTGGTGAGTGTAGAATACAGCATGCTAATGC
++
+?<599@;79/554528;5977&35+)+317,,50
+@ERR005448.58118 IL40_2446:5:1:950:4/1
+TTTGCATTTTTAGTAGAGACGGGGTTTCACTATGTTGGTCAGGCTGGTCTCGAA
++
+9=?=A?ABBBA;;>B=8?BBBBA=9=A>>?=/;==<8;/51994/68/69;722
+@ERR005448.58325 IL40_2446:5:1:954:10/1
+TACTTAACCTGATTCCTGCTACATTGCAAGCACTCAGTATATAGTGGCTCTCTC
++
+:A=BB7:;B=A?B==>;A?>;8===;9;;;>88737815--31577/+&&+
+@ERR005448.58371 IL40_2446:5:1:954:1/1
+TGGAACACTATGGAATGGTACCGAATGGAATGGAATGGAATGGAACAGAATGGA
++
+3?A;?>>>;A70?BB?<=@><:<=??0<@=<7>B>9;8;;1.597/99=>@
+@ERR005448.58561 IL40_2446:5:1:957:7/1
+GGGTCCACATTTACTCACCCTCCAGGGAGCCCCATACTGGCCACCAAATATACC
++
+@:?(A1(85>9>@=,2:B@<7=@:;=4<6+0=228',,450/03%)'/9%%%3%
+@ERR005448.58657 IL40_2446:5:1:959:3/1
+CTTTCTAAATTCCTGTCTCATGGGATTGCAAACTATAATAATAATATAATGTTG
++
+EBCCAC?;;A@CC@B>@C@7A=BA6=@A>;;9=@=@=;>;;>:4:5:06<=8;8
+@ERR005448.59107 IL40_2446:5:1:966:6/1
+GTCCGTTAGAAGCAATTAGCCAATGAGTCTTGTCACATCATCCTTTACAACTTT
++
+?BACCC97;;<@A=9=1.7C@>;8<2=.7@76,745.664477=<0/43*/72;
+@ERR005448.59191 IL40_2446:5:1:967:8/1
+GTATACTATTATAACTAACATCTCTCTTCCCTATTACCTTCAGAAAAAAAGAAA
++
+>)>982.76;90;44.873,/61/1>2./7*37<6>8.5-3<:>:7;=5=3>3>
+@ERR005448.59278 IL40_2446:5:1:968:4/1
+ACATGTGATAATGGGTTAATATTCAACGTATATAAGAAACTCAAACAATTCAGT
++
+CCCCA8@=;4>A@@@=>C>9;B?;=??87>7;9775&/&5<<:67&
+@ERR005448.59563 IL40_2446:5:1:973:3/1
+ACCTGGAGCTTCTCCTGGGTCTGGGGATAGATTGTAGATCGGAAGAGCGGTTCA
++
+BB???=3=<;5=?B=>=57=@=8:=:?<>;-53&
+@ERR005448.59824 IL40_2446:5:1:977:7/1
+GGTGGCACGTGCCTGTAATCCCAGCTACTTGGGAGGCTGAGGCAGGAGCATCCC
++
+?@=@;5;:@@@>6875/;>959=39;9:<>3/7<;36*4;5'46)6)1%%%,
+@ERR005448.59872 IL40_2446:5:1:978:3/1
+TAAGACACAGATGAGTCCTATGATTGCCTGACTCCCTGCTTCATAACAGATTCC
++
+@?@AAAA@>A;A>6>?BB@ABA@ABABAA?=?@@@A?==<==9=946>958:=:
+@ERR005448.60200 IL40_2446:5:1:984:1/1
+TGGTAATACTGTTTGCTAGGGAACAAAGACTGCAATAAATTCCTCATCTGCTAA
++
+?BC;<9A@<9?CB:@C?:=AA;AB?=1<>=5<@@=>A?9?;?B>A<1>?=3'
+@ERR005448.60327 IL40_2446:5:1:986:8/1
+AGATACTTTATAGTTTGTGTTGCTATTGTGAATAGATTGTTTCTCATATGCTTT
++
+=?6=;@AAA?:3>?739:7<=>9<>>:A?BB>:<6=?>A??
+@ERR005448.61048 IL40_2446:5:1:998:9/1
+CAGTGAGGAGCTGGAGTCCAAAGCTTCCCACCTGTGTACCCTTGAGGGCGGGAA
++
+BB./;AA>94?4@@6?99?922>;5'5;8/2565(80.%/5-+%/4,-'857))
+@ERR005448.61190 IL40_2446:5:1:1000:10/1
+TTTTATTCACAGGTGTAACAATAGCACCTAGCATTTTGGCACATTAAAAAACTT
++
+BCBCA<>;>A?@7=?)=??87:;6=A<9:?@?;2640-2<<2
+@ERR005448.61329 IL40_2446:5:1:1003:7/1
+CTCCCTATCCCTGTGCCCATGCCCAATCTCTCATTAAACTACCATTCTACCTCC
++
+@@@BBB@AB@AB@@?B@B>>@B><>*<02>87>7)<4A;:;7,3?
+@ERR005448.61505 IL40_2446:5:1:1006:4/1
+TGATGGAAATTAGGGAATTAAAGCTATAATCTCTTTGGGTGTTTATTTTTCTAA
++
+0>?475/(1?.5(95;:9(<=6)<99;=>.&71>=7+7)+19076':@@@BA?<=7@=8==9@90@AA<->9:A@8?<;58?<;0;>921?
+@ERR005448.61887 IL40_2446:5:1:1012:2037/2
+CAGGGTTTCACCATGTTGACCAGGCTGGTCTTAAACTCCTGAGCTCAAGCGATC
++
+A?@>?;::>@?<<:2=?>9.9:838A
+@ERR005448.62104 IL40_2446:5:1:1015:9/1
+AAAGCCAAGAAGCGAAAAAATAAATGACAGGAGAGAGCAAGTAAGGATGAGCAA
++
+C@=?BA>=?49@@AA:@:>C>;@@><1;?=<:A7)19>5)5/5/;;4/7/6,,0
+@ERR005448.62322 IL40_2446:5:1:1019:1902/1
+TGCCAGGCTGGAGTGCAGTGGCGAGATCTCGGCTCACTGCAACCTCCGCCTCCC
++
+95=;588>>?>>>=?>35;85;;.9>?><;5;?=@A??BC@CCB:@
+@ERR005448.62652 IL40_2446:5:1:1025:3/1
+CGTCATCTACATTAGGTATTTCTCCTAATGCTATCACTCCCCTCGCCCCCCACC
++
+BBB?;?A=3?@@>?>>;=??;>=@??8:=;=7'7;8;>@A?;2&2=A@>@;)7A
+@ERR005448.62725 IL40_2446:5:1:1026:10/1
+TATTTCCCCTTAAACTGATCATTTAAATGTTCTATAGTAATTTGTTTTAACCAT
++
+=6C@@CDCA?5;?A<@<6;7'6C>14(=;9;7;:;3?;@C<==<7515,'
+@ERR005448.62941 IL40_2446:5:1:1029:8/1
+GATTTTTAAAATGAGGATCTATTTTTTTAAAACGACACCACTGAAGTACTGTGA
++
+;=>3>8;7(;6)3<6:?44:B?;A?<(8/87=27,83&49<0*927&5:5=<
+@ERR005448.63236 IL40_2446:5:1:1034:1/1
+GATTGCCCTGGCAGGAACTTCCAATATTATGTTGAATAGGAGGGGTGAGAGAGG
++
+?;>BBBBBB@@??>@?6?@@A?4'67:>59>>5<9/8<06)9;2:3;35,18
+@ERR005448.63408 IL40_2446:5:1:1037:8/1
+GCGGACAGCTGGGTTCAAGGGAAGGCATCAGTATTAAATGTTGTTCTGTTAGGC
++
+@BA=6=08:9?;>27=6/9<8818>>558*937;466--23/;845==73&224
+@ERR005448.63461 IL40_2446:5:1:1038:11/1
+ATCACTGTGGCATGGAGTAGGTTTTACCAAGAAGACAGAACTCTGTGAAAGCCT
++
+9;BB@A=?BAA>@A@=@:8?A6==5=>;9><:9&5;;9-+
+@ERR005448.63486 IL40_2446:5:1:1038:4/1
+TAGTGAAATAGGTATTATCCTCTGTTTATAACAGCTCATAATGGAAGTGGAGGA
++
+=+BB>55996>=35>-<4&98'
+@ERR005448.63556 IL40_2446:5:1:1039:6/1
+CATAACATATAGTATATATCATATATAATTTTTTTTCAGGCAGAGTCTTCTCCT
++
+>::@;=8?CB=@>?@AD@CB=:<:BC31?CCCCACC>:B?><3C?;CC?BC<92;:9B>?4:1<9.6'=777&8-)4;'30&5<963,916
+@ERR005448.64228 IL40_2446:5:1:1050:4/1
+GTTCTGCAGGCACCTCGTTTTGTCATGAAGCTCAATGACAAGCTCGTGAGAATT
++
+@?BBB@@>=@=?A@9)=>:A66:=>;>==5'776=44&6+94<1.1<
+@ERR005448.64605 IL40_2446:5:1:1057:4/1
+ATCTCTATCCCTGGAACACATGTGGTTCCCAAAAGCCAATGACAAACAGCAGCA
++
+A=ABA@=@BAAAB=8;>3>4?@<>@=>?A;4769<:28848<=63?9/3797.'
+@ERR005448.64660 IL40_2446:5:1:1058:11/1
+ATTCAGACCACAGAAGGTGTGTTCTGGAATACTATGTGAGGGACAAACATTCAG
++
+=ABA8@>?A:AAA=6?@9A?:=>7>A=?:?;:6:9;1<><:<;9
+@ERR005448.64821 IL40_2446:5:1:1060:4/1
+CGGGTTGATTCCATTCTATTAGTTTCCATTCCATTCCATTCCCTTCCATTCCAC
++
+@BBA6:AA?BBA=A@B@0?<;@AB@BBA>)>=>=@?:7<;>=?9>?256?=7)3
+@ERR005448.65072 IL40_2446:5:1:1064:4/1
+CCCTCAGGAACTCAGCAGGTACAGGCAGATTCTAGCTGAGTGGTTTTTGAGAAT
++
+BBBB@>=?99?A><=?7>=67;27867?;=;;617;;728788,7;9///6-04
+@ERR005448.65393 IL40_2446:5:1:1069:9/1
+CATTAGGTATCAGGGTCAGGGTCCTAGCCAAGGGTGGTCACCACTCTTCCTGAG
++
+@??:???855?85<>98>?@@75;=8::7,69;4)04.4'196969/*3/.908
+@ERR005448.65534 IL40_2446:5:1:1071:3/1
+CTCTTCACTTTGCTAATTCTTTCCTTTGCTGTGCAAAAGTTTTTGAGTTTGATT
++
+B@=4881;8)1.,)+8&/:C22(>:9?;40>
+@ERR005448.65829 IL40_2446:5:1:1076:4/1
+ATCTGGCCAAGAAAACTTGTAAGTTCTTAGATTGTCCGAAAGGTGGCGCATGAA
++
+;;BB=BBB@9@2:@=9A@AA==?=???@@A5/2;@1=<;==7:;;9
+@ERR005448.66004 IL40_2446:5:1:1079:10/1
+AGACATGATAACCTTCTGCTAACACTGGGAGAGTGTAAACACCCAAGAGGGGAG
++
+8;??9????<8?=?>@@=<>8==;?==>:;>9;:>;=47<9==7644'9:4<16
+@ERR005448.66016 IL40_2446:5:1:1080:1/1
+CACTAGGTGATGTAACACTTGTCTAAGCTCTGTCTACACGGGAATTTTCACATA
++
+C>B@=8C9>:@@=;::4;>=A<@B=/=A==;>A7116<>A<4))5?<=9;943)
+@ERR005448.66030 IL40_2446:5:1:1080:665/1
+CCTCTCTCTTCTCCTTTTTTCCGCATTGGGCTACCTTCTCCACTTTTACCGATA
++
+.2,.,))(&,&&-&1'&)&,21&3&&&)&&.&&)&&+)&&&&1/,'&)&+&&&&
+@ERR005448.66241 IL40_2446:5:1:1083:3/1
+GCACCCAAGGGGCCTCTCCATGCCTTCTTAGGAAGCAGCTATGAATCCATTGCC
++
+B?9@?BB:0?(/;B@@BB@2=@BAB<@8.9>31:9:,82)52:5.1=4,:50%3
+@ERR005448.66395 IL40_2446:5:1:1086:8/1
+AGCAATAGGAGCTTTGCCATGGGCCCCTTTATGGAGATTGCAACAATGAAAGAC
++
+=;??<7><@3>?A>91?:6;?@@AB@;@>;;?84/71:<=5139;;81/(481;
+@ERR005448.66547 IL40_2446:5:1:1089:8/1
+ATAGACAGTGGAGCATACAGGGCAAGGCACTTTATTAGGGGCTCCTCCTCTTTG
++
+>AA>B??=.=?@5=8@>?51/6;27?=?8<>59'77-969=,/*551&)/4368
+@ERR005448.66624 IL40_2446:5:1:1090:5/1
+TTTACATCTTCTGTTACATGGCAACAAGGAACTAAATATTAATCATAAACCCCC
++
+CCA;??BCCCCBC@CA?9>>>@97<=6B?A@7>@A??4,6;8:;6'50:>@AB?:95,48;'69550/,3739
+@ERR005448.67186 IL40_2446:5:1:1099:3/1
+ATGTTCATTTTCTAAATAGAACAGAAAACCTTTGGCTCAGAAAACTACGATGTT
++
+>A@+=B@A>B;@CC?@B6A;7@;4;45'4836;69;@59:;88>=<43;/:<+'
+@ERR005448.67393 IL40_2446:5:1:1103:6/1
+TCCACTCACAATCTTTAATAGGGTTAATAGGTTTGTTTCATGTTGCTGTTTTTG
++
+CCA8ABA=B6.>BCCB>:<7?@@9?8+99>?;@@A><><39?>A@=@@8?@@;6
+@ERR005448.67596 IL40_2446:5:1:1106:5/1
+CCAGATGGTTAGTGCTCTGAGCTACTAGAGACCCCATTTGATGCCCCAGTTACC
++
+B@?><@BB??:=@AA?AA?;?A????:?6=<<@?:9:><:7;?==:;0:731:7
+@ERR005448.67619 IL40_2446:5:1:1107:9/1
+TAAGTGGGTATGGTCCAGACCCAGAGAAAATGATGACAGACCCCAGCACTTCTA
++
+@<6>;@@@:=8>95?;==<=A=9>==<973878:;3;:70&8<9-6:6,1/558
+@ERR005448.67823 IL40_2446:5:1:1110:2/1
+CCCTGACCACCTTCGGCACATATCAGGATTTCCTGAGGCTATGTCACGGGCACC
++
+BBBB?:?@;@BA@@@@>3>0;7?>3=<>>???@>?:;3;<<<;2887257/%/'
+@ERR005448.67932 IL40_2446:5:1:1112:7/1
+TCCAAAAAAAAACCTTGTTATTTATGAAAACACTGCAGTTTTTACTTTCTGCAA
++
+CCA@1@@:=A=7A@A?@?<9<7??7=49<5;:=;57:A@A82*;=A@9314&
+@ERR005448.68406 IL40_2446:5:1:1120:2/1
+GCCAAATTTCTCCACTGCAGAGTTATTATTTTTCCTTCCATAATTAATTATCAT
++
+A@><@9@CCCCAB3>C@C@<@A=CB>>AC?BBA6ACBC??A8<=@?68AAC<1;
+@ERR005448.68449 IL40_2446:5:1:1121:4/1
+GTGTTATGGACTTCTTCTTATCTTAAGTCAGAAGGCTAAATGATTAAGTTATTT
++
+BA>;4AB<(:CC@:A*B?C=;<82;;86><,:(4.<66.;7:
+@ERR005448.68552 IL40_2446:5:1:1123:9/1
+CCCTAATGTTACTATATTAGAAACCATGATACATCTGTAAAAACTAAGACCTAG
++
+CAC@9@@CB=:><@A8>7@:??@<<966>;369<89><;67)7;/96/&/)
+@ERR005448.68727 IL40_2446:5:1:1125:2037/2
+ATGTCTGAACCTCAGAGACTAGGTTCCAGCAGAGGTATAGCCTATATGTGCTGC
++
+@+;-;:8/7;?A=:A>>>?<(=A=842:;6.<6;/3/190/30,,30*64
+@ERR005448.68728 IL40_2446:5:1:1125:2/1
+AAAGCCATAAATGAGATGCAGGAGTTAAAGAATGCTTTTGTTAACTTTAAGTGT
++
+;)54=:0>=7=A?8=55>:<>A5;.=CA=@<97@5/9@<9,6354>=83,,186
+@ERR005448.68873 IL40_2446:5:1:1128:6/1
+GTTAGAATATCATAAGTAGCAGAGGAATATGGTTCACAGAAACATCATATAGTA
++
+@>AA?81;<=:9;86=79<:4:.9<38787<)6;9585--1-275657592/
+@ERR005448.68927 IL40_2446:5:1:1129:623/2
+AAAAAAAACAAAAAAAACAACACAAAACAAACAAAAAAACAAAAAAAAAAAAAA
++
+5><9(6B8(8=7<:;56(9<)655?>>=?9/(8B837?5(7@=ADB7(6?5)18
+@ERR005448.69139 IL40_2446:5:1:1133:8/1
+CTGCTATAATCATGAGTGTACAGATATCTGTTCTAGTCCCTGCTTTAGTTTGTC
++
+CCCCBAB@5@@:@@<@?C?ABB@3===?=A;@B>=@7?@;96;;@=479:?@64
+@ERR005448.69383 IL40_2446:5:1:1136:10/1
+TGTTGACTGGGTGTTTCAGGACTGGCTGCTTTTAGCTATCCGAATACCTTGTCT
++
+BB>A=>?B6@7)978?@9559;;?6(5=3<=>>:3&4725&/&4/31:;;7+5'
+@ERR005448.69385 IL40_2446:5:1:1136:2/1
+AACTAACATTTATCAAGGTGCTGTGCTATCTGCTGGGGATAGAAAATCAAATAA
++
+ACACCBA>ACA?B@:<671<982'892:4:66
+@ERR005448.69756 IL40_2446:5:1:1142:10/1
+GATGAAACCCCAAATATCATAAATATAGGGCTTATCTTCTCCTATGCCCTTTTA
++
+CCCCAA@BCC?0=A=9=CB?3;@?><4>>@=8@?@B@B><=1=<;:;:?>8'
+@ERR005448.69889 IL40_2446:5:1:1145:2037/2
+ACCTCTCAGAGATAGAATTTGAACTTAGCCTTGAAGGAGATAGGCAGGCAAGAT
++
+>B?AC@<>C?CA;8??A?9AABBB43;8>/;;98A<8-=B<3;:A8=
+@ERR005448.70096 IL40_2446:5:1:1148:2/1
+ACCGCTTGGGGCAGGACCTAACACAAATACAAACCACAGGGACTAAAGAGTATC
++
+7?BBB@BBBBB;<;<@@@?>9;@@7?@@;;<<<9126473<;4.98<
+@ERR005448.70341 IL40_2446:5:1:1152:4/1
+ACTAGAAAGTAACGTTCTCAGAAACTGCTTTGTGAATTGTGCATTCATCTCACA
++
+<>+<@56:;;6?A;B>?@@0=91?8@9<88?B=685:;8=>><=?63=B@A@87
+@ERR005448.70483 IL40_2446:5:1:1154:8/1
+TCTTCAGCTAGACTCTAAGCTTCTTCAGGATAGGAATCATGGTTTCTTTTTATT
++
+;ABC<69A>CCA<@*@;0>@7@=CC?8:A9A>@7;CBA:@@A=A?<1=<>>?9@==9A:7<77629;>;=A>B>8<5:<;
+@ERR005448.70953 IL40_2446:5:1:1162:2/1
+TTTGGGAGGCCGAGGTGGGTGGATCATTTGAGGTCAGCAGTTCGAGACCCGCCG
++
+>@@A@?7>A?@:7?=6>@@?@<<>=8<5;;8=;67/97.662591;276%253%
+@ERR005448.71137 IL40_2446:5:1:1165:7/1
+AAAAGCTGACTGAAGAGCCCTCAGGACTTAAGGGAACATTGGCAGGCGGCTAGC
++
+/7?@B?2=B@;:?=?@B@@??5;?>/;=;=;;?8==8;8771&7/02.5,
+@ERR005448.71179 IL40_2446:5:1:1165:794/1
+TCCCACTTTGCTGGAGCTGCAGCTACTTTTGCCGGAAAGCCTGAGTATCTGACG
++
+BBB?3>AB;>A@@58BBB>=>A?:;:@>=89:;96+517:<76/-5:6=-*4&/
+@ERR005448.71376 IL40_2446:5:1:1168:1/1
+AATGGAATCAGGCTATAATGAAAACAACATCTGGATGTGATTGTTTAAAACCAA
++
+<6<<9=5=@A==:=91629?:7=861/5<;47
+@ERR005448.71651 IL40_2446:5:1:1173:6/1
+ATATTTTGGTTTACAATGTAAAATGTTTTCTCTTTTCTCTCGTGAACATTATTT
++
+C=9>BCCCC9CCC?89??::668@=;@@@A?7?BABAA<<;:7:/6735:79@>>=7>CCB?@=>C>=@==>9CCCCBCCCA?BB>BCCCBCA>BCBCC@@4@9A>338>AA@?AA6A<;39@;6<65;95(:<<9><53(/-361268/*
+@ERR005448.72356 IL40_2446:5:1:1184:5/1
+GCTAAACGTTTTACGTCTCTCCTTTCTTTAGATTACTAAGGCTGAAAACTACGC
++
+A8=B??>B@>CAAAA@AC?A>>:44&3./.;1&+(
+@ERR005448.72891 IL40_2446:5:1:1194:7/1
+TACAGGCAAAATTATTATTCAATAGTGATGGCACTCAGGAGTTGCTTCTCAGAG
++
+CC>8==A8*8=A>8A>6@B?91==6,6<=>9>:=?<79<6>5=<=?>9;?85-?
+@ERR005448.73302 IL40_2446:5:1:1200:2/1
+TTGATCAGCTGGCTTTAAGTTAATCAAGATGGTCAGAGTGGGACTGCCCTAATC
++
+@A@;A?BB???A?BA=10;98999)7696/194>6418022695'2:5,&2*
+@ERR005448.73674 IL40_2446:5:1:1207:10/1
+AGTGGAATGAGATATTACCTATAAACTATCCTAGTCAGCTCACAACAGAAAGAA
++
+:>BAB=8>B=A<>5?A?ACCBA;=AB>:>BA>5>A;6:A??3>8??6><=<<8/
+@ERR005448.73935 IL40_2446:5:1:1211:8/1
+GAACTGCCTTTATCTCATCCTCGACTCTAAGTTTCTTGAAGATCGGAAGAGCGG
++
+>+9>ABBBBBB>AAAAABBABA>29A@=43?;8@>@A=58=049@7&)90527<
+@ERR005448.74031 IL40_2446:5:1:1213:4/1
+GGTATCTGAGCAGAAATCTCAGGGAAGAAGATACACAGACAGCCAGAGGTGAGC
++
+BA<:;@B<(=@?<646;@=:9?@?:7=5,7<:3:::.7&5&2:5-5&/5-351-
+@ERR005448.74102 IL40_2446:5:1:1214:8/1
+CTGTGCTTGCCATCTATCACATGAATAACTTCACAACATGAATACATTCATAAG
++
+CCB@BCBBCC>1:?=<;747;98:69'9:=B<;::78566686<8/3.5//-
+@ERR005448.74734 IL40_2446:5:1:1224:9/1
+ATGGCTTTATAACTGTGTGTCCCAGTGTGGTTTGTTTTGAAGCTTTCTCCTCCC
++
+=>?B=6<<=><9<6;2939=;>9(9/<7<<:<79=6@9935855:<;?6,7=:2
+@ERR005448.74770 IL40_2446:5:1:1225:4/1
+CTCCAAGGAAAGACAAACAGAAAATAAACCTCAGAAAGCACAGACATCAATCAA
++
+CCCA??A@7:;@<:759>6.9967,7967;8597637619973167
+@ERR005448.74964 IL40_2446:5:1:1228:6/1
+GATTATTAAGGGCTGCAAACAGGAAGGATTTTATTCACCATTGATGCGGCTCCG
++
+B<@B?B?3:B@B@>B=87):4=?7:9;<;828;5-0:373./423
+@ERR005448.75101 IL40_2446:5:1:1230:8/1
+AGATCAAGGACAACTCCTGTAGCAGCTATCCGAAAATCAGGCTAACAGGAACCC
++
+A=8:?;?7@@@4(9@@=4;-65966;5/3::.-671/2,3.4*-.,,,)+.017
+@ERR005448.75213 IL40_2446:5:1:1232:11/1
+ATTGCAGTGCCGTGCAGCTTGTCTCCCACCACATGCACCACCTACCTGTCCCTA
++
+(>BB;;;7?=@><>B@A@??7922@>?5<>68)7/=;48'6(((464'1.9>4'
+@ERR005448.75361 IL40_2446:5:1:1235:7/1
+CACAACATAAAATGTTTTTAATAGGCCAGGCGCAGTGACTCCTGCCTGTAATCC
++
+?@<0=A@=:4:.:?5=?=?:58=4.7837+556&72/+.-/&-+//.))-).16
+@ERR005448.75775 IL40_2446:5:1:1241:10/1
+TGTTTGGTTTTTTGTTCTTGTGATAGTTTACTGAGAATGATGATTTCCAATTTC
++
+C;>>AA@<>?>47;<6;;67A@?5'5;=>;
+@ERR005448.75913 IL40_2446:5:1:1244:8/1
+GTTCCCTTCTGGCCCAGGGTGTGCCTAGAAGTGTTGCCCAGGAGCTGGGGCCTG
++
+9@/7%4=B4?735?;;6?8.6,4,/6),&67454)4.&.6-%*282*%4
+@ERR005448.76094 IL40_2446:5:1:1246:10/1
+TGGAGGGAAGATGGCGATTGTGCCTTCATTTGGCAGACATCCTAGATCAACATC
++
+BBA=?ABAB?A;<98><=?<3;@:7;89;55'7==?<7-3:158&+2
+@ERR005448.76219 IL40_2446:5:1:1249:4/1
+AGTCAGAAATTAGCAAGGAATAAATGTTGAAAGAACTGGATTGAAGATTTATTA
++
+ABACBB6A:>BAA@:8@CCCBA?9?CBC?A=7?3:?A=@5?C9)5@9@@>;@8'
+@ERR005448.77339 IL40_2446:5:1:1268:10/1
+GCCAACTCCTTCCCCTCCTTCAAGTCTTTGCTCAATTTTCACTTAGGAGGTGAC
++
+AB;96=BB@A>ABBBABB@>?6-:6>A>=;;<:(,5?<:>6:>;:95/48,57;
+@ERR005448.77348 IL40_2446:5:1:1268:2/1
+CATGCGAAGAGTTTGTTTAGTCATATATCAAACATTTATTGAGCATCTTCTGTG
++
+?7?AC@:A?>CCC>A?9?@@???CBCA:>C=4@B=:=BC:@:3;A>??B=8;
+@ERR005448.77504 IL40_2446:5:1:1270:9/1
+GGGTCCATGGCAGCCAGTATTCCCTAGGGGAGGGAAGTGGGCCAGAGAGGGGAA
++
+@@@AA=88?@>>==;0;=<7'7747<=4/;>;*24%6>9/4,4.3&4%64)0
+@ERR005448.77646 IL40_2446:5:1:1272:5/1
+GCAAGGATATCTTCCCAGCAACTGCCTGTCCAATCTTGGACTGGCATCATCTTT
++
+A?8?BAA>;>BBBBA?:><+878<@;0;/=>6/4;>8525<6/15-27009274
+@ERR005448.77801 IL40_2446:5:1:1275:7/1
+ATACTAAAAATACAAAAACAAAATTAGCCAGGCGTGGTGGGGGGCGCCTGTAGC
++
+>?4;=6;;96=2:?;<4074'8>:;?+<:>@>2<5+87&495/214.6-&-&
+@ERR005448.78179 IL40_2446:5:1:1281:8/1
+GCAGAGAACACCCTGACAGGAAGCGGAGGGTGTGCTGACTGTGCAGAGCTGACG
++
+@:7.4;177+7<;/;9;5<<6,45>7%6<;19/94*4/,,+)6)*2))*.6.'2
+@ERR005448.78354 IL40_2446:5:1:1284:1287/1
+GATAGAAATGTTATCTTCCTAAAAGGTCCACTTATGGGATTTGTTGGTTAATTG
++
+C?=A?>9?6@8=1>A@CBCA@<@?A69A@DA<@58ACC@8?;98<99>42
+@ERR005448.78565 IL40_2446:5:1:1287:2/1
+TTAGTGAAGCTCTCAAACCACTGAAGATTTTTTTCTTTCAAACGTTTCGAACTC
++
+>:==8<=6<@B<@<<>:<>1=B==<=77>@C??ABA>@81.7<96===8,6<86
+@ERR005448.78686 IL40_2446:5:1:1290:3/1
+ACAAAAAGAGTGTTTCAAGTCTGCTCTGTGTAAAGGATCGCTCACCTCTGTGAG
++
+??;4;=9>7>@>6=8909=9247.'/95)8&97;6:6:
+@ERR005448.78994 IL40_2446:5:1:1294:2/1
+GCTTTAAAGCATTAGGACTTATTCTCTTGTGTAACCATGTTTAAGAAGTGCTGG
++
+=@>A?>A>>A9>A:8@->@<+>3(9(1@;@?=1<
+@ERR005448.79206 IL40_2446:5:1:1298:8/1
+GGGAGGGGAGGTCAGGGGGAGGAGCAATCACTCAAGAGATCCTTGTCTCCTTCC
++
+A?>7><><.87'6436649*590563-/5*563.*/,-/3310/1/1,01,%,2
+@ERR005448.79491 IL40_2446:5:1:1303:10/1
+CAATATTCTTGTCTCCATGATGCTGTCTCATGGGTTTCTGAGATCGGAAGAGCG
++
+@;4=:?BBBB@BBBB?9>????@?;6@;>9<>9?1<=?@>26/5:=8/37-9
+@ERR005448.79567 IL40_2446:5:1:1304:4/1
+TAATTTAAATCAAATGAAGAAATTTCTTCTGCTTTCTTCTAGCGGTTAACATGA
++
+B>2@BB>@=<>9:7=>6:>6)1=CBBBBA?B9<=@@B?A:48+935.043&.7+
+@ERR005448.79846 IL40_2446:5:1:1309:3/1
+CAACAAAAGGAATAAGGATTTTAGTAACACTGTTGTACATGGATTATTTCATAC
++
+A;8@A=6-??7=A2)9A9;@BA9?<=9==>?@9=@631-5<87:69<;9;95*3
+@ERR005448.79930 IL40_2446:5:1:1310:5/1
+GTTCTGTGCCGATTCTTAGGTGCCTGTGATTCATCTGTGCCTGATCAGAATCCG
++
+:5=@9<<><;=;<:79@@;B:2;7(5710837.5,+947)/'.&7
+@ERR005448.79992 IL40_2446:5:1:1311:9/1
+TTTGTAATAAAACATAAATATATCCCTGTAAGTGACCATGAGCAAGCCTTCTGT
++
+CA?<=7:@:??AB:??B?>7;=AC>1=;>B:6796?=8:<38@8'5'599;<96
+@ERR005448.80302 IL40_2446:5:1:1316:10/1
+GATTCCATTCCATTCCTTTCCATTCTGTTCCATTCCATTGCATTCCACTCGGGT
++
+>6@BB=8@BB??ABBAABBB;7@::B=>>>=@@??>997@:<;<=<:87:4773
+@ERR005448.80312 IL40_2446:5:1:1316:5/1
+TATTTATCCTTTCTTGGTAAGAATTGGGGAGGGGTTTAAGAAAAGGCTAAGCAA
++
+@8@C7=@CCC@A:CCB@5;8<98?=<=?>/>?A=9=<;7<375,89:3/+5,&3
+@ERR005448.80561 IL40_2446:5:1:1320:678/1
+AAGGAGAAGGAAATACCAAGTTAAAGTTGTGGGAAGGGAAGGAACCCCCCCCCC
++
+?3=?>9;7<<65=;:;8;/522579274,36A?;:>8;?;>
+@ERR005448.80562 IL40_2446:5:1:1320:4/1
+TGAGCCTCTAAATATCTTCTCTGTTCCCAGTCCTCCTGCTCCAAGAGGTCATCA
++
+@>;?A@@@@=33>6=????AA@>>?>@8(67;???>27<:=7/'8'75&8657'
+@ERR005448.80799 IL40_2446:5:1:1324:9/1
+CTTTTGTAAGTTGATCTTAGAAGTGACTTCTGGCTGGTCATGGTGGCTCACACC
++
+ABBBABA???BB???@BAA>=?@6@=>?>;7?=?B@93=7449-;>768&8283
+@ERR005448.80923 IL40_2446:5:1:1326:5/1
+CACACATCACAAACAAGTTTCTGAGAATGCTTCTGTCTAGTTTTTATGAGAAGA
++
+>6<8>:?==><<7=57?:<725;:??>?A=>=:@6?=8=><;<;479/
+@ERR005448.81027 IL40_2446:5:1:1328:9/1
+TTAAGGATAATTTGGACCCTATTAGCCATGTAGAACATGATACATGATTACATT
++
+C>;6;A;@::ACCA=>A?B<;>=93;9477)9:94976531'--2757435&89
+@ERR005448.81115 IL40_2446:5:1:1329:4/1
+AATTCTTCTGTCTAGCCTTATATGAAAAAAACCCGTTTCCAACGAAGGCCTCAA
++
+(5@CCBA=CBBCA@>=8?A=?8>?8<0;1:688??3829;13117'74?6'8'1
+@ERR005448.81530 IL40_2446:5:1:1336:6/1
+TTAGCACAGGGCCAGGTTTATAATACTCAATATGTGAATACTACTTTTAACTGT
++
+C??AA=A=ACBAB@CC?C@7@>=?+9A=6:A9>A9A9.9A>9<>;><:1/6>8)
+@ERR005448.81684 IL40_2446:5:1:1339:9/1
+CACCCCTTTATACTATGTAAGGGATCAGTTACCATTTTCCCTCCATGCCCTGGT
++
+A=?BAABB>=@B>=3=@95*<@>;;;7>::<<8/5=<9>:80860*-:7.)0-+
+@ERR005448.82219 IL40_2446:5:1:1347:3/1
+ACATGGGAGGTACACATCATCCACAATGGACGAAAAGGAGAGAAGATTCCTGCC
++
+AA;AB@>4@@2>?@?9??;AA??=95?A<.9>4>>9@<:=6=;797;28;59
+@ERR005448.82556 IL40_2446:5:1:1353:9/1
+ATTAGCTTTACAAAGGTGACTGAGTTTACAGAAAGGCTATTAGCATCTAAACTA
++
+:A@;@CCCA>A=?;>A=A<@A?=A@AA>=>@6*4=;=<8<8:9:68:996'34-
+@ERR005448.82748 IL40_2446:5:1:1356:2/1
+ATCACAGCTCACTCAGCCTTGACCTCCTGTGCTCATTTGATCCTCCTGCCTTAG
++
+AA@:>8?@B?7=A?@@@@?4;@@@BBA=@@@=9;@?8&7@A?><93:>;7&,
+@ERR005448.82853 IL40_2446:5:1:1358:6/1
+GTCCTGTCCTGGGGATGTCCACACTTGCCTTCCCCCCTGGTTCCCGGGGACACC
++
+888:@>@@AA?;>;);::>=2=998908:8896)734'*.*)47%4+,,*,'.=
+@ERR005448.83107 IL40_2446:5:1:1362:8/1
+GTAACATTTTTATTTATTTGCTTTGGTAACAAAACTGAATGTTGTTTTTCAGCT
++
+>99.856?CA6-.4=@?6+=,2;C=81945=8-634>3-58/256:=5&&)--5
+@ERR005448.83197 IL40_2446:5:1:1363:10/1
+TGAGCAGGTAACCTGGAATGAGCCAGGGCAGAGCCGGGGGCTGGGAATCCAGAG
++
+8?@??8>>55<=80733=769@777:80*+'.7.-;/274'*;,&*%4'0%,';
+@ERR005448.83267 IL40_2446:5:1:1364:7/1
+AATCCTCTGACATTTGCTACCACCCAGCTAAAGGCGCATGGTGTATTTTTTTTT
++
+9/>CCB;?AA@AAC?>;@:<>8>A<(75.(7.59=5').=)7(558*.849<89
+@ERR005448.83406 IL40_2446:5:1:1367:3/1
+ATCATTGAAAACCACTAGGCATGCCAGGAAAGTGTACTTACTGAAATACTGAAA
++
+:ACCBCC>:8?BA9A>:<>?9:?@<;=;85/76?/'4:=4:=:3'16/9=6/21
+@ERR005448.83901 IL40_2446:5:1:1375:11/1
+ACAGTACCTAACAGTTTTTCAACCCTTGTCCCCCTCCTTCTCTCCTGCCTCTAT
++
+>?7?5)>??BB><<;@AAAA?6=A@@A@>A?>@@><;9=74@?>18;<<>?8.:
+@ERR005448.83967 IL40_2446:5:1:1376:7/1
+GCAACACAATCTACATGCTATACAGGGCTTTACATAACCCATAAGCTGGGTTCC
++
+B409?51>:AA??<:69A;:88:8?::.79=>6<<6'&6703652,)8-:-05:
+@ERR005448.84238 IL40_2446:5:1:1380:4/1
+GCTGGATTGCCTTGGACAAAGAGATAACTAAGACCAGACACCTCCCTACTCTCG
++
+?:@@>@<4;AABAB@9;5:<:;>79<:;=86>;=7&9+4&585&0=5-516-)9
+@ERR005448.84259 IL40_2446:5:1:1381:1/1
+AATACCTGAGAGGTAGAACTCCCTATGGAAGACTACTGCATGCAAGAAAATGCA
++
+7;A5?@@;;<*;B.7=?7?>B@B?@A?>8(;694-;0:6)5>81;:'3078;;9
+@ERR005448.84413 IL40_2446:5:1:1383:5/1
+AAGAACTCAACCCCTTTTACAATAGCTGCAAACAAAAAAATAAAATACTTAGGA
++
+:><:2@CBCCCACAB?;67=6<0=>6/518<=59-887<49.-7.:643/7
+@ERR005448.84566 IL40_2446:5:1:1386:9/1
+GAATATGCCAAAGGAATGGAACAAATGCACCTGGATATAGATCGGAAGAGCGGT
++
+=51=8325>9;??@3;<?73:=;:7755'2;71569172;27/).
+@ERR005448.85226 IL40_2446:5:1:1396:4/1
+ACAATCCCTTATCTTAACTCTGAAAGCCAGAAAGCTATGAAAACCAAAACGTTT
++
+:@==ACCCCA=@CCA;8@BCAA<88=CAA@:52>A:88<9;7'6<66(/9:259
+@ERR005448.85359 IL40_2446:5:1:1399:8/1
+AGGAGAATCTATTCATCCATCCAGCCAGTCATCTATCTGTGCATGTATTCGATA
++
+;A@3>=BBC@8ACCCCCA@ACA??C=3>0>8;A>(9BB@7@819?@;@=?9872
+@ERR005448.85397 IL40_2446:5:1:1399:1/1
+AAGACCAGCCTGGCCAATATGGTGAAATCTCATCTCTACTAAAAGTACAACAAT
++
+:>8:@C>BC<9CCCA@=755C?7C5,29:;6=??==>7:7598:;,>5*1&.5;
+@ERR005448.85601 IL40_2446:5:1:1403:3/1
+GAATGAGTAATAAGAGTTCTACCATAACTTTTCAATGTTCACATTGGGAGTGAG
++
+=6:>;3<6(8B@@@<;9??<=><63;=?;62?76&6
+@ERR005448.85620 IL40_2446:5:1:1403:7/1
+TATTTGAAAATCATTAGGGTTCAGTACTTGGTGAAGCTTTCAAAACTTCACCTA
++
+=5>C?@<:<;ACACAC>9<<>=A;??==82>@BBAB?99;AA<=0;B<2
+@ERR005448.85889 IL40_2446:5:1:1408:251/2
+AGAGTATTTTACCATATGGTCATTAATTTTTCAGCATTATAAAAATTGAGAAAA
++
+B;7<;CBCB?9>;8::4?>:=?@A:6A;;3:528526=57;8849<=;69%0.4
+@ERR005448.86026 IL40_2446:5:1:1410:8/1
+CAATCACACTAAAAGATGCAAATATTCAATAATTGATTAATTCACCAAAGAGGA
++
+?=8:<=0<9<>A>4>BA<7>89@9<0?;93;ABBA?BB=A9AA:BCA08A>8@873@>2A
+@ERR005448.86479 IL40_2446:5:1:1417:2/1
+CCTCCAGAAAGAGCCAGCGGTGGCAAGCAGTTAGCTTAAGCCACCCCGTCAAGG
++
+BBAB>:<793;:BA?-97AA=@;>AAAB=7:?>A<=BA;A@?A<@=?<:@9)7=9,81
+@ERR005448.86918 IL40_2446:5:1:1424:2/1
+AGGTGTGACATTTGAACCACGAACTAAAAGACACAAGGGAGCAAGCCAAGCAAA
++
+@?B<=AA@>9;A>;?@===B?966=>>=;49A::9?<95:6:7.;94+0
+@ERR005448.87507 IL40_2446:5:1:1434:5/1
+GCTGTGTCCGGCTGCAAGTTTATTTTTTATGATTTTATGTGACGTGGGAGCCCT
++
+=?B=+?1??B?BBB94*6@9:6@8>>A;=?A:@>=7:?-=:4,524&1
+@ERR005448.87656 IL40_2446:5:1:1436:5/1
+AAATTAGGCAGATGTGGTGGCAGGGGCCCGCAATTCCCGCTTCTCCGGGAGCCG
++
+B9?*>B@7404=47'043B@7<24-69:'7(*)'44.72-,04-,%*4+,)(6(
+@ERR005448.87841 IL40_2446:5:1:1439:9/1
+AATGTGGCACATATACACCATGGAATACTATGCAGCCATAAAAAATGATGAGTT
++
+@6=C9C?:>C>6:B>99:3::<:>:1;;/*63.+3*-9957>7:31
+@ERR005448.88231 IL40_2446:5:1:1446:2/1
+ACCATTGTAGGCAGAGCCTAGACAAGAGTTACATCACGTGGGTGATCAGTGCCG
++
+???7=@@;/=@??;5;??;4:2;85;9878=;8:;197)773/8)42/7)23&7
+@ERR005448.88235 IL40_2446:5:1:1446:9/1
+CGCGAGGGTCCGTGGCTTCATTCTGGACGTCAGTGAGCCCCAGAACCCCCCACT
++
+@B@;9=>B4BA;05>84/52:2<0590%33467)4%3)6;04//,57,/35'%.
+@ERR005448.88399 IL40_2446:5:1:1448:8/1
+AAAGATAACCTTTGACTTCCAGAAAGTATGCTCTATGATGGAGTCTTGGCTTGC
++
+?8?=85<8>CB?BAAC;85=<>@=4;AA=@@:/;C@AB9'?8=?:?;4;@7&
+@ERR005448.89099 IL40_2446:5:1:1460:10/1
+TGGGTTTGGGGAGCCCCCTAAAGTAGATACAGCTTAGATCACAACACCCAATCC
++
+????AB@@;@BB>?@B?BA2(=:54'7?@@=6574:4797(:(6=7&.)-37
+@ERR005448.89428 IL40_2446:5:1:1465:9/1
+TTGTTGAGGATTGCTTTACAGCCCAGCAGATTGATTTATTTGGGTAAAGATCGG
++
+76=7:6864>49=:02>:1'5:61981&4':/8'5<2/070731&794;;176+
+@ERR005448.89593 IL40_2446:5:1:1468:9/1
+AGTAAGTGGTCAGACATTTCGTCCCTTTTGACACTCGTGGGATGTGGCCTCAGG
++
+0=<64;=AAA?4;?@BBBB@@@BBBBBAA=6?8:B?@=A>?7;?:?=;=<;6;=
+@ERR005448.89808 IL40_2446:5:1:1472:4/1
+AAATGATAGTTCTATTTTTAGTTTTTTAAGGAATCTCCACACTGTTTTCCATAG
++
+2=AC;8<79@A<>0@B?B@6A?=@BC>B<@A>?ABCAA?>:=@8:@?=>>;>+9
+@ERR005448.89944 IL40_2446:5:1:1474:637/1
+TCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCC
++
+@@??@@@>?BA@A?A@@??A?@?ABBBBBBAAAA@A@?@BBBB@??@@A@@@@A
+@ERR005448.90397 IL40_2446:5:1:1482:9/1
+CATTTGCAGAAAAGGTGGCAGTCAGCTGAAAATGTGGACAATAGACTTAATAGC
++
+?1=A>CA;A:647?>3A?95<091;96:503)4;988&46223213/.,54)3,
+@ERR005448.90524 IL40_2446:5:1:1484:3/1
+TTGTGGTTTAAGAACGCCTTTAAGCAGTGTTCCACCCTGGGTGGGCCAGGTGTT
++
+3;?7;>*==8::A;BB=B=8?:7;>;?1'7>>@=38<=:5::4'08=885,1(2
+@ERR005448.90791 IL40_2446:5:1:1489:4/1
+GAGGTTGCAGTGAGCCAAGATGGCACCACTGCACTCCACCCTGGGTGACACAGC
++
+?:?2<<@>5=?>8>9>><6'3;9;8:7382/594396%*57112/),/4/1151
+@ERR005448.91608 IL40_2446:5:1:1502:9/1
+CGGGGCGGGGCGGGCAGGGAGGGGGCGGAGCCACTCACCTAACCATCCCTGATG
++
+@??2:667<=1672;>4,795=7-83%)/.%3%4274%%)1%**)%),,%%*
+@ERR005448.91670 IL40_2446:5:1:1503:3/1
+ACCACACCTACAAACACTGAGTAAAACCCACAATAAAATGTATCTGCAAGAACG
++
+59;589+;5<58?>8491?;>4>9=6:>8<<3741.87,4)/8/+1/''8/5)(
+@ERR005448.91733 IL40_2446:5:1:1504:10/1
+ACCCAATTCCTGCATCCCCATTGGATGTAGGAAGTTTCTCAATTCATTTTGCTT
++
+B?><,3=?6)>A<;<2<=7548*2'4;/-514&5,&320,')25732&79
+@ERR005448.91871 IL40_2446:5:1:1506:1994/2
+TACACCAAAATATGAATGTTTACAAAAGAATAAAATGCTTAGACTAGGAGAGGA
++
+A>A??@=:?>?ABB>5<==A>=?8::;>A@A@5;><4<15;=@6-66;<6
+@ERR005448.91932 IL40_2446:5:1:1507:1/1
+GCAGTGGTTCTCCCAGCACGCAGCTGGAGATCTGAGACCCGGCAGACCGCCCCC
++
+@@2@BBBBBAB>2??B@@>>8<>.>70085184'67484,4'4%'44*4;
+@ERR005448.92006 IL40_2446:5:1:1508:5/1
+GCAGCCAGACTGCCCGAGTTTAAGCTTGACTATGTCTCTTTCTAACTGCACCAT
++
+9@?@A?9>=@>;9?=@=57<;+183:4:3=7:?><=;;81+2)53)3&,/
+@ERR005448.92301 IL40_2446:5:1:1514:1383/1
+TTATCATATGTTTTGTTCACAATCCCATCTTTCAGGGACTCTGCTTAGGCTGCC
++
+:;67?7?>?A=A>=>763>A??6=:775;::83
+@ERR005448.92484 IL40_2446:5:1:1516:6/1
+GGTATATGTGAACATGCATTCTGTATGAAAGAATATATTCCTAAATGATTGCCC
++
+@@:6?@>A=:?8??<7=?AA?94<=<<468::,818:865/3-71)565&/7
+@ERR005448.92649 IL40_2446:5:1:1519:8/1
+GAGATCTTATTAGTCTGTTTTTACACTGCTGATAAAGACAAGATCGGAAGAGCG
++
+;1@4?BA?1?@ABBCCCAC@C?0<7:>928<984&9&76?
+@ERR005448.92840 IL40_2446:5:1:1522:4/1
+TACCAAATAGGCATAAAAGAAAAAGTTGTTCCTGACAGAGGATACAGTATATGC
++
+?;A>:@>=0?@>:@97=;:;=:7=B;:=<;>==;8677688)1966715+)+.)
+@ERR005448.93057 IL40_2446:5:1:1526:6/1
+AAGCACCATATAGATAGGGTTATGTATAAAAGCATATGTGCTACTCATCTTTGC
++
+74?8,9A??8A>@B<8>CB?>5;<;8=66786;9;:68753793'+7:3111
+@ERR005448.93331 IL40_2446:5:1:1530:9/1
+TTACATTTTTCCACCAGCTTCTTTTTTTTTTTGTATGTCTCATTAAGCACTTCT
++
+C@=B9BCCBCC@8>CCCABBACCCCCCCC@3=A;7:4:436492'&3/)&25&4
+@ERR005448.93484 IL40_2446:5:1:1533:4/1
+TGGGACGTACAAGCCATTTTGAATATCAGCATTATAAGTTGTTGGATTCGTCAC
++
+BCCC==C:/A@??C7:?=A<;?<<=?A?=?9<9:?8:98B@59<7.55&5-53:
+@ERR005448.93506 IL40_2446:5:1:1533:9/1
+AGTGGTTTGTAGTTCTCCTTGAAGAGGTCCTTCATGTCCCTTGTACGTTGGATT
++
+0>9BBB@AAA@A???=A?A@;04?>?6&7A4?;2;;;>4:6;=;3/853=8)39
+@ERR005448.93626 IL40_2446:5:1:1535:6/1
+TAAACAGTTAATTTAGAAGAAATATGATATAAAATTCACATTTACAGATGTATC
++
+C<<;;@@<<95@3>CDC7.37(9:ACC<@<@?9,.9@C:0=<::8=A<<=-:87
+@ERR005448.93793 IL40_2446:5:1:1538:3/1
+ATTCTTTTGTCACAGTATAATCAGTTGGCTGAGAGGAAGGAGAATAGTAATGAA
++
+/?CCCBCCC@B@C?A@CC9/B?=@@BBBC??=A=AC7,4?2>?25&63'585&3
+@ERR005448.94134 IL40_2446:5:1:1543:533/1
+AGGTTCGCAGCAAGGGAGCGTGTGATTCGGGATAGATTGTGCAGGTAGACCTAG
++
+8?===?==;=A;==3=8;==6=9;1/;???;47/8985=6;5075127)1;;/4
+@ERR005448.94475 IL40_2446:5:1:1549:8/1
+GGTACTGGTCAGTGCCCTAGAGGTATAAAAAATGGGAAGTTTTTAAATCAGGGA
++
+@9:9=A@A9@5=4<>@8732&88394-5914)/296+)3//45/..,-/)36/&
+@ERR005448.95140 IL40_2446:5:1:1560:8/1
+GGTTATTTTTATAAATTATACATCACTCCCCTTCTAGAGTAATAATCCTTTAAC
++
+CC6?CCCCBCAA@CBAA;BBBA6>?CB@@@>>;.>.843077*5:8:=7.27
+@ERR005448.95398 IL40_2446:5:1:1564:9/1
+AATAGCCTTACTCTTAAATATGAGCAGACAATCAGATACCTGAAGAAAACTGTT
++
+9;?>=?CCB@>C@A?=6*?=@?;=A?;@A@4,3:@8;2;98:177<>02-::61
+@ERR005448.95481 IL40_2446:5:1:1565:2/1
+TCTTTTGTAATGTCAGGCAACAAGTTAGCTGATGCTTTTGCTTTAAAAAGTCCT
++
+B@=BCCC>::ACAABACA:?>:=AA>2>B?<59>CB>??A9A>98::5)7/8:8
+@ERR005448.95601 IL40_2446:5:1:1567:38/2
+AAAAAAAAAAACAAAAAAAAAAAAAACAAAAAAAAAAAAAAAAAAAAAAAAAAA
++
+,><>ABCAA715(6
+@ERR005448.95681 IL40_2446:5:1:1568:6/1
+GATGGGAATTCTGGGAAGTCTACTTTCAGCTTAGTTACACTGACACATACGAGA
++
+=4B??=B;6-=<;=7AA=?@=94=4>/8685884298458:,1-
+@ERR005448.96257 IL40_2446:5:1:1577:9/1
+CAGCTTCCCAAGTAGCTGGGATTACAGGTGCTCACTACCATGGCTGGCTCATTT
++
+@??BBBBB?6=?98;@?@?;07;5:78;3879<:;3'45,-/633:0,-*,..7
+@ERR005448.96262 IL40_2446:5:1:1577:5/1
+TTCTCCTCCTCTGGCCCGCTCGTGTCTTGAGGGTTTGTTTAGGCCCCGGGTGGG
++
+@A@@@@@@@<@?><>?=;;4%457425;6,7=4,62+.&4%)0204,4/%,34*
+@ERR005448.96982 IL40_2446:5:1:1589:6/1
+TTTTTAATAGAAAATATAAAGGGTCAGTAACCCCTAACATCAAAGATGCAAAAA
++
+CCAC@=;A>AAB?>9/7@;A;@BC?=33@=1&525.1<@:=(71+
+@ERR005448.97174 IL40_2446:5:1:1592:6/1
+TTCTTATATGGGCATGGTTCTTGATACCCCAAAACAATTACAATGTAACATTAA
++
+CCCB?@?AA?@C???AC@C@C@<@@9>C;936.786/759:7&7-28'11:;4(
+@ERR005448.97208 IL40_2446:5:1:1592:3/1
+CCTGACCTGGACATGATAAGGGCCGGAACAGGAGGAAGGAAGAAGGAAAGGCGT
++
+BB@?B?<8?<750;:6,657;0705<1532.4%480098,35*,2832.9/*%)
+@ERR005448.97386 IL40_2446:5:1:1595:5/1
+TAACCAACCTCTGGCTATCCCCCCCTTCCCGTTCCCTCTCCCCACCCCTCGCAC
++
+<77<@@@@;'8@A>B;74;;*.9?A<89-/42*%)8*'20.45'2*'2+%.0.2
+@ERR005448.97615 IL40_2446:5:1:1599:7/1
+CTAATCAGTAATAACTGACAGGAGGGAGAAAGGGGGATGTCATGGGGGGGAGGG
++
+B;/=B@@@<==?44>7=6;-=;/=@;-860.:7&7:'*7**&194&3&77&3&1
+@ERR005448.97936 IL40_2446:5:1:1604:3/1
+AGAAATGAGAGAGACCTAGTCATTTGACCTTTCAGAGCCTATTTTTCTTCATTT
++
+9A8A8AB>BA@4@C>:;6>C?<7<=7@AACC81;@B
+@ERR005448.98029 IL40_2446:5:1:1606:874/1
+AGCTAAGGGGGGCCGGCAAGGGAGTGCTCCACGGACTCTGCAGCCTGAGCGGGG
++
+2=B>.7?><8;==?80;;8;@734/5>7<:5;*;4;7>955;;>854,4;9351
+@ERR005448.98065 IL40_2446:5:1:1606:6/1
+ATGCTTGGCCTAGTGCTGTGTTTTTAATTTGAAATTCCAGTTGTTCAGAGATAG
++
+6>BDBCC@CBC;B>CACB?BCBCCC=BCCCA=;1?CB@@BA;:3:?BC@C>BCB
+@ERR005448.98118 IL40_2446:5:1:1607:2/1
+AAAAGATTAACTGTCAAAATTTACGTTTTCAAAAGTTTGTCTTCTTTCCCGAGA
++
+A48=?@CC711?C@CCBCA?5:?=@?A@@A@C=?B?>?A8?=
+@ERR005448.98145 IL40_2446:5:1:1607:8/1
+GGACAAACCGTTACTTATGATGGTTTGATTTACGCTTTTTCAACGTTATGATGG
++
+AA>ABA;C@C7@*B>C;BA8>A?0;@A874;339'1;@>>:777<6626/-0:9
+@ERR005448.98429 IL40_2446:5:1:1612:8/1
+GCCCACTTGTTGATGGGGTTGTTTGTTTTTTTCTTGTAAATTTGTTTGAGTTCT
++
+CBC?9B>64/&8==;<<<6'858:>
+@ERR005448.98464 IL40_2446:5:1:1613:3/1
+ACCTCTCCCCAGCTTGGCTCTCCAGGCCCCCATCACCTCTGGATGACACCCTTC
++
+';AB@@BABB7;A@;>9<:>9@B9?5.=@?;'/;)7;/74+43.3%')244-3=
+@ERR005448.98602 IL40_2446:5:1:1615:11/1
+CATGAAACAAAAGTTTCTGGAAATAGTGATCTTTACTATGTACCACATGCCCTG
++
+CCC@1:4?=8;7=?=:=5>8<;?A=9=;2==40<953676>4:48
+@ERR005448.98707 IL40_2446:5:1:1617:5/1
+GAGTAAAGACGTAATTTCACCATTTTGGCCGGGCTGGTCTCGACCTCCCGCCCC
++
+::0@?;2=.5?556>B@>84;';@7><9@8050.078/++43/,-0153,/.-,
+@ERR005448.98719 IL40_2446:5:1:1617:8/1
+AACGCTGCCTCGCCAGTGTTCTCCCTGCTCCCCCTTAGAACAGGGACCTCACCC
++
+73>B5A@A;>B7B>/21@=:>+0084792;A;A6-2'<-27)<)52863..%0%
+@ERR005448.98995 IL40_2446:5:1:1622:8/1
+CCTCCTGAGACATGAAATTCCAATGAACTTTGTTTGAACTATTTTAGGGCCCTT
++
+CCBCAB@6?9;9?A8<8@>?920:=899=;??9;>:-*5517815134569773
+@ERR005448.99392 IL40_2446:5:1:1628:2037/2
+GGAGGGCAAATGTGGAGACTGGAAACCCAAGGGGAGCTGGAACATAGGGTCATT
++
+@@@;=;9<51>26><:>>?995:(49;98<9.;7+765?4/4%187409,65.5
+@ERR005448.99553 IL40_2446:5:1:1631:5/1
+TTAGCTCTTATACTTATCCTGAAATGGTTTTCATTAGAGTGGAGCCAGAGACAG
++
+@>8ACCCCA4>ACB4;>=8C<@==A??78=2;8&'&7-8)4260(
+@ERR005448.99621 IL40_2446:5:1:1632:9/1
+GGAAACACGGTACCCATAAACCAACAACTCCCCATTCTCCGCCCCTCCCACTCC
++
+>@=@@;597?6>5:6-58,%485024,2,8644+.,.,5*%,%&+032.%%%/3
+@ERR005448.99622 IL40_2446:5:1:1632:2/1
+CATTCATTTATATCTAAATCTCAGTCAATATGATCTAAATATTTGTGTTTAAAG
++
+:7>>=@?D?C?<>@;98/7->9<<@B49).
+@ERR005448.100032 IL40_2446:5:1:1639:6/1
+GCACACATCACAAACAAGTTTCTGAGAATGCTTCTGCATAGTTGTTACGGGAAG
++
+@A?=;>9??9A==:>A>?39AA;94?7?=>A>:>=><572918==8<:<<;13:
+@ERR005448.100347 IL40_2446:5:1:1644:3/1
+TGACATACTAGGATCTTGCCTTTAACAATGACAGAATGCTACACAAAAATACTG
++
+C@C@@::==<>B=@BCCCCCBCB?AA?=6>=ACA8;@CB@2>@@;61<2<6=96
+@ERR005448.100440 IL40_2446:5:1:1645:11/1
+ATATTCAACTTCAGTTGCTTATTTGTAAAAAATAAATAATATCTACTTCATAGC
++
+:;88>6>?;=<:<<=>>>96964:7&
+@ERR005448.101126 IL40_2446:5:1:1656:9/1
+CGGAAGAGCGGTTCAGCAGGAATGCCGAGATCGGAGGAGCGGGTCAGGGGGACG
++
+BB;08>;@BB?6<>;>;0=<5.6?@>4970*3:4%)4%-'36.%/)/&%*1%%)
+@ERR005448.101204 IL40_2446:5:1:1657:5/1
+TTCGATGATGATTGCCTTCCAGTCCATGGATTATTCCATTCCATTCCATTAGAT
++
+2?B@;B@:A:<;??@C?=B?6?;;;89>?9?=9><>7,8?A=29;C=42;2813
+@ERR005448.102353 IL40_2446:5:1:1676:8/1
+GTGGCAGAGCCAATATTTGAACCCATGTCTGAGTCACTCCAGAAACTCTGCTTA
++
+B@B@A=>4>@B8(548;7=75>?<298495;5;78-:3<6*53-&1/32'1//,
+@ERR005448.102510 IL40_2446:5:1:1679:3/1
+TAATGTAATAATAATAATAGGCAACATTTATGTCATATTTACTATGTGACATGC
++
+B?:>CB?@C;=>DA=3.6>CC9?;>C?>;<3==>6>A@;5><<;7A=689>=
+@ERR005448.102734 IL40_2446:5:1:1682:9/1
+AATGTATGTTGTAAATGTATGCAACAACTATAAGCTAGGCAGTTATGTTAGATC
++
+28AC9>=<=A;>=84:?<7:&77897/&.+&7
+@ERR005448.102799 IL40_2446:5:1:1683:5/1
+AGTTCAACCATTGTGGAAGACAGTGTGGTGATTCCTCAAGGATCTAGAACTAGA
++
+1>?<>89?848A=0738:=A;5;)9>*>94;@<6<566:7;6566&6;09:<
+@ERR005448.103013 IL40_2446:5:1:1687:3/1
+GATCATTAGTGATGTTGAGCATTTTTTCAAATGTTTGTTGGCCATTTGTATATC
++
+BCA?;BB@C8;5:??BCAB>1A7;?<<>;=>?A55590.
+@ERR005448.103019 IL40_2446:5:1:1687:9/1
+CTCAGGAGTAGATGGGACTACAGGCTCCTGCCACCACGCCCCGATAATTTTTTG
++
+<6;<<85646<69??;0731522853952-34&,3)/124441*&&&-.12/*&
+@ERR005448.103023 IL40_2446:5:1:1687:1851/1
+AGAGGCGGCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCCC
++
+974@@;'9;<@?@AAA@@@@:@@>:@:@?@?@??@ABA?@A?8>BB@:>@ABBB
+@ERR005448.103397 IL40_2446:5:1:1693:2/1
+AGGGAACATGCCCATTTATAGTGCCTGGTCAATAAAATAATCTTGATTTATTCA
++
+8@?A;<7@;ABCB@C7C@:<>=9;;:::8==:5;@:78><7
+@ERR005448.103748 IL40_2446:5:1:1698:8/1
+GATGGTTGATCGTTGCTGCACTGGGTGTCTGTGGTCCGCATTCTGTATTTCCTA
++
+=6?AA?@@@@A@@?=?@@=;;??;?8?::=?8=;4;9;56699993.1775-,/
+@ERR005448.103968 IL40_2446:5:1:1702:3/1
+AAGATACATGCACACGTATGTTCATTGCAGCACTATTCACAATAGCAAAGACAT
++
+3>A?@;<99==2<<7,8337457'5&3&-.-
+@ERR005448.104333 IL40_2446:5:1:1708:2/1
+CCTGAGCAAAACTCAGGCAAAGATGCCACCAGCCACAGAGGTTTACACCCAGAA
++
+BBB@@@@@@>@?><2?AA?;8;<;?A?:?;63=3',,1*3/)3023&&---/)&
+@ERR005448.104536 IL40_2446:5:1:1711:5/1
+CGTTCAGACACCTCTTCGCATTTCCTTTGGCTTTCCAGATCGGAAGAGCGGTTC
++
+BB>B?3=?=/;BABA?@@?3=AABBA<=>@A?=@A:1;5;@<<2-;8=97731<
+@ERR005448.104871 IL40_2446:5:1:1717:4/1
+GGAAGCCATTATCCTCAGCAAACTAATGCAGGAACAGAAAACCGACCACCACCT
++
+>?99;@>4;<4:@@;=;=?38.;;8=:>;3<83263632/&56/367-59&,&)
+@ERR005448.104907 IL40_2446:5:1:1717:2/1
+AGGAATAGAGGTGGAAGCTGGAAGGCTGCAGAGCAGGAACCCCAGCCCTCATGG
++
+4>>.0;85><8>8300;>>>889;1637706)30.++,'7'72),64+/)0%),
+@ERR005448.105167 IL40_2446:5:1:1722:5/1
+TGAAGCTGTATGAATGAAAGCTGTTGTAGAAGACTTTTGTGGTTACCTATCAGA
++
+CA8=ACBB@7@A>ABA?AAA@C=>AA>@@<:?3>:CACC=BB@;:;:3267'69
+@ERR005448.105259 IL40_2446:5:1:1724:3/1
+TGGTGCACTTGGGACCAGGAGCATGGCCTGTTTGAATGGCGCTTCCCTGTCTAT
++
+BB?3@@@@@@<3?999:0<;.;@B@??@@?@<>6>>A8%15544&61692*'
+@ERR005448.105499 IL40_2446:5:1:1728:10/1
+TGTCATCCCAGCACTTCCTGAGGCCGGGGAGGGCGGATCACCTGAGGTCGGGAG
++
+2<@8/?@@6764.48>:A<838>@A>9>7'49?>9;'.0;7.17957'016333
+@ERR005448.105605 IL40_2446:5:1:1729:6/1
+GTTTCCTTCCAGTCTATGGCTCATCTTTTTTTTTTAACTGAGCATTTACTAGGT
++
+B<>AB@@?@A=<7;<7>@?>@7.78><>?B@B>@>74949.9<5994)/7.9<;
+@ERR005448.105859 IL40_2446:5:1:1733:10/1
+GGATGAGTAGCAGGGAGAATGCAGGGTATATTTGGCAGGGGGGGGAGCACAAAG
++
+??9??:?6<>=:?>;5;457?<;=?4*533369993,4%4:4%4/&32/-/%)3
+@ERR005448.106182 IL40_2446:5:1:1739:2/1
+ACTCGGCAAATCTTACCCCGCCTGTTTACCAAAAACATCACCTCTAGCATCCCC
++
+AABAAB=:=/<@@<9?@@=<@<:>8?899?;6343970,&58422)&,&'3&3:
+@ERR005448.106338 IL40_2446:5:1:1741:9/1
+TTATCCATTCACACAACTCCAGCCTTTTCTGATGTCCCAGGTCATAATTAGTTT
++
+A@99=;C7)7?7?<9:62:.:94:6/'7625)2++73)1,3<
+@ERR005448.106488 IL40_2446:5:1:1743:5/1
+ATGAAAAGATACCGATTCAGAGTCAAGAAACAGCTGAGAGGTAAAAGGCAAAAC
++
+<:=<96,?=6@887/3493;293@86;23.5)213<-9)66/6353&,/35'2&
+@ERR005448.106494 IL40_2446:5:1:1743:8/1
+CATTCCATGCCATTCCACTCGGGTTGATGCCATTGCTTTCTATTCCATTTGGGT
++
+=8;4>?;6=@7>89,73>>94;;+87-1(6:;6)85=8=59463-2)1772449
+@ERR005448.106720 IL40_2446:5:1:1747:1929/1
+CTTAACAGCTGAGAAAAGAAGTAGTAATCACAAACACCCCCCCCCCCCCCCCCC
++
+BB?7>?8=?A<>=834:<3(870?89:>>>:;-46%89/97?<:9<:<>>@?@@
+@ERR005448.106932 IL40_2446:5:1:1750:6/1
+TTTTTTTATGCAATATTTGTTAACCTGCTAACACCCAGCAGATGTTATTGCATT
++
+;:>A=@;7?C<:?@C=<><>9366<=@9.
+@ERR005448.107302 IL40_2446:5:1:1756:6/1
+AGGCCCTGGTGATGTGAGCTCACAAGGGGATCTCCTGATCCGGCGGGGGCAAAG
++
+28=A>=9=@?<5938;8>75595;999-15600%4.%3/*-)%0
+@ERR005448.107597 IL40_2446:5:1:1761:1/1
+CATGGTGTATTATCTTTTTGATTTGGTGTTGGATTTGGTTTGCTAGTATTTTGT
++
+A<>CC8A?ACB;6@88ACA:@<
+@ERR005448.107754 IL40_2446:5:1:1763:5/1
+ATGTTGCTGCAAAGGACATAATCTCATTCTTTTTTTATGTCTGCATAGGATTCC
++
+7>9?BA<:=675;097;;:>B>9A;@319?67;=94756&17758
+@ERR005448.107952 IL40_2446:5:1:1767:7/1
+CATTCAATTTCATTCCATTCCTTTCCATTCCACTCCACTCCATGCCATTCCACT
++
+B<@BB@@BBBBBBBBBBBBBBABBBA>ABBB8@;BA<<>B=46;<=635=:6;,
+@ERR005448.108131 IL40_2446:5:1:1769:10/1
+TATTTTACTGGGAGAACAAACGGCTAAAATAGTTTCCAAAATGTGTCCTATCAG
++
+?6?CC@8@AAC@:@:=?89==>;?=<79649<8:;9;<:7375//05/-/0655
+@ERR005448.108139 IL40_2446:5:1:1770:5/1
+CAGGCTGTTGACTACTTTATGTGCCATCGTGTGTTGTGCAGTAAATGTGCTCTC
++
+969BBB?;6=>A>2<>AB?A<-@>?ABBBB@A?7:=>@<>:9;;=6)8<>;;9;:7)5984+397305
+@ERR005448.109122 IL40_2446:5:1:1786:8/1
+CTATGTGGTCAATTTTGGAATAGGTGTTGTGCAGTGCTGAAAAAGATGTATACT
++
+A=>A=?AC@6./>?AB;2575&8;=A378879
+@ERR005448.109188 IL40_2446:5:1:1787:380/1
+TCTGCCATTTATTAGCTGGATAAAATGAAAGCAGTCTCTGAGGCACCCAGATTT
++
+CCCCCA@BCA=A>:;9:<>?8?>?<8/7=>7=?7291;;2
+@ERR005448.109189 IL40_2446:5:1:1787:1199/1
+ACAATGTGTAATGATCAAATAAGGGTCCAGTTTTTAGCTGGGTTGTTTACTTTT
++
+ABB@BB@ABA?BA>A?A@>=977AA>>;?BBC
+@ERR005448.109190 IL40_2446:5:1:1787:1535/1
+ACACCTGATGGCCACTTCGCTCCCACGGAGAAGCCTATTTCACGTTCCTATGTG
++
+B;0=?18*((9@?;83221;;8?;07.53516:973&197/7:.133*,&1,-7
+@ERR005448.109191 IL40_2446:5:1:1787:466/1
+AGGACACAGTAACAAGGCACCATCTATGAAGCAGGGGAACCCTCATCAGATACC
++
+9?@@?:?@@?>:?=;97??@>:97;26:1&5018:
+@ERR005448.109192 IL40_2446:5:1:1787:1807/1
+CATTCTGTTCCATTCTATTCCGTTCCATTGCATTCCATTCCATTCGGTACCATT
++
+A;?>8=?>@==:7==@848;7>518;<664972266
+@ERR005448.109193 IL40_2446:5:1:1787:203/1
+CAGCTAGGATCTGTCCCCTCCTTCCCTGTCTGGTAACAAAACAATAAACAGCCT
++
+>6=A:2;<8=B?;@BAAAAA?>?@9<;?<<;3'6:5-3)77**3&175*78&
+@ERR005448.109194 IL40_2446:5:1:1787:1965/1
+CCTCTAATATGAGCTTTGGGAGAAAAGTTTTAAAGTATTTGATAACCATGATTC
++
+CCCC?==A>A;59?A@@=;<:<;90/6:AB?=;:937;@?;;<:6::7:6/855
+@ERR005448.109195 IL40_2446:5:1:1787:138/1
+GTCCCCAACCCTTGTGCCACAAACCGGTCCTAGTCACAGGCCTGTTCGGACCGC
++
+:<>AA>5/>@@>;1;.;?:=;..>60*4'740+-7'4%.-43+*.3'03''4,'
+@ERR005448.109196 IL40_2446:5:1:1787:793/1
+AAATAATAAGTAAAAATATTGGAGCAACCAATAGAAAAGAGTTTTCTTGGGCAG
++
+=5?A;@C;:=?B;?<:<8AA@CB<@;@C>B<@?;;<>=6=BBA8A<@?9::<<6
+@ERR005448.109197 IL40_2446:5:1:1787:1473/1
+GAAGTTGGTTGTCCCTGCAGCCCTGAGCAGAGCTCTCAAAGTTACGTCACCCAA
++
+?:8?<@A@;ABBA@@@@??BA<;35?:;;<9>A=>;33759<;>2:8:;/'/
+@ERR005448.109198 IL40_2446:5:1:1787:1097/1
+TGTGTGCATAGAGGTATTTGCAGGCATTTCTGAGGTTTATTTTTATTTCTGTAG
++
+?6-9@=4:>:@91;?>9@<:?@C??=<0*
+@ERR005448.109199 IL40_2446:5:1:1787:1406/1
+GCTTATGGAGTTCCTACTATGTGGCAACCACTGTTCTATTAGGTTGGTGCAACC
++
+8:5?>3B?9?<;??7=>>>412;7;;:>@?=9)-:@>:9<-1).335583,662
+@ERR005448.109200 IL40_2446:5:1:1787:1124/1
+AAATTACTTTGGGCAGTATGGCCATTTTCACGATATCGATTCTTCCTATCCATG
++
+88=AB?ACCA;A>>59?A@;:AA=@CBA<<=96>97509=?<=?:8717<6655
+@ERR005448.109201 IL40_2446:5:1:1787:607/1
+TTCCTACATTTCCTTCTACTGAGCTGATAGACTTACCTTTCACATTTTGGTCTT
++
+CCCCB?@9@CCCCCBC?;AA=3:A>???::=BBA=A;7;@A>:3=@@;839C>>
+@ERR005448.109202 IL40_2446:5:1:1787:1950/1
+AAGATATCGCCCATGCTGGAGGAAACTTGGATGACAGTCCCTGGCTGGTATGGC
++
+5/8=>B@@@:7?52:'73/31;75561;/3'798(&&3451:914.67.-'&-/
+@ERR005448.109203 IL40_2446:5:1:1787:1945/1
+TCATCATTTTAAAAATATCCTCATCAGAAATTCACAAAAAAGACTCCTAGAACT
++
+EA;AA<@BCCBA;>>=;?@>@AA<8419;
+@ERR005448.109204 IL40_2446:5:1:1787:1238/1
+AATTGTTAGCTATAATTATTAATATTCTTGCCTGAATATTGTAGGAGTTAAATA
++
+;;CCA@C:>AC>?98C@?CC=7?>@CCB=9>BC=<9?;CC;;=<69=?=;;;=<
+@ERR005448.109205 IL40_2446:5:1:1787:67/1
+AATTCCACATGGAATTTATGAAATTATCAAGTCCCCAGCACATCAAGACCCACG
++
+;899>BA@CB=B>8?@;9<=1)=?=9;>:9A6BC@?399'3&.<77;1&15)&1
+@ERR005448.109206 IL40_2446:5:1:1787:981/1
+ACATCGACCATGGCCATGTAATTGATGGCAACCAGTCAATAGATCGGAAGAGCG
++
+AAB?BABBAB@@<@@=?=;<><<=>;;;8.9;<572707/,/35760.)43438
+@ERR005448.109207 IL40_2446:5:1:1787:790/1
+AGCTGCTGAAGGGAAAGGGTCTCATTCACAGGTGTAATGTCCAAGGTCCCCTGT
++
+::AB@?<::1?=;4'48;=8@?AA72:=8=;7;;07?A;=>2/??84>5'
+@ERR005448.109208 IL40_2446:5:1:1787:625/1
+GATGTTAAATGCTGGTTGACTTTTCCTGAATTCCAAAAGGGAGGAGGGCATAAT
++
+?9A6)5>4-9CCAB;1/<=>?9>>;<>9:9:?<;98-4>75.07+8:0;;6503
+@ERR005448.109209 IL40_2446:5:1:1787:820/1
+ATCCTGTCACCACTCACTGACTCACTCAGAGCAACTTCCAGTCCTGCAAGCTCC
++
+:?AB??@?:?@?@@?5?=73>@@>=@?=4::?;;?>;??666=?448)2379;>
+@ERR005448.109210 IL40_2446:5:1:1787:1093/1
+TGTTTGTGTGTGTATGTCTGTGTGTGTGTGTTTATGTGTGTGTGTCTGTGTGTT
++
+AC>CCC?@BAB?=ACC>CA;;8;<5>;99:9A?<>5:5;44;899:=>3/521(
+@ERR005448.109211 IL40_2446:5:1:1787:91/1
+CTAAGTGGAGGAGGCCACAAATGGGAAATTTATCCCATAAGACATCAATCAGGC
++
+B>8;?;A?<=;?>-;:2217:7;(9:<959>>;:9<:7::-677(/:12.&
+@ERR005448.109212 IL40_2446:5:1:1787:1301/1
+CAGGTGATTGGGATGCAGAAAGTCCCTGGCTTGACTAACTACAGATTTATATCC
++
+<2=B9963/57<4>7625,//;<65.137;/-1:5/22'/&+&49787693:
+@ERR005448.109213 IL40_2446:5:1:1787:1886/1
+TGTTTAACATAACCTATTTTTTGCTGCTATTTTTCCTTGCAAATTTATGCTTTG
++
+@B@CC>:>@B=4=C?8?CCBCA?CACCA;BCCBCBCB;?A>7'BC=8?CA>=<>;@;=BBBA>@8=A???A??1:><4988.
+@ERR005448.109215 IL40_2446:5:1:1787:801/1
+TTAGAATGAAGCCACAGCAGGAGCAGCAAAGGTTGGTTTAATTATGTTAAAAGC
++
+CA>@>?B@==9AA?=2:>;:6/::28;932742:6758<::::6716;76525=
+@ERR005448.109216 IL40_2446:5:1:1787:1552/1
+GTCTCGAACTCCTGGGTTCAAGCGATCTGCCCACCTAGGCCTCCCAAAGTGCTG
++
+?6AB@;::@ABB>8:<:?>:?8>@<>B@=AB@=?B<826<><@B<706%.199;
+@ERR005448.109217 IL40_2446:5:1:1787:1295/1
+AATTTCTTTGATCAGCGTTTTCTAGTTCACCTTGTAGAGATCTTTCATTTCCTT
++
+<8?=93=BC;;A><;<1.A=>C=86::A9=9A@9>A6=2>CCC=CA>??==<>=
+@ERR005448.109218 IL40_2446:5:1:1787:1380/1
+ACTTGTGTGCTATTCACAGGCTGGGGGGGGATGAGGAGATAGCAAACAGGTGGA
++
+A<==?8;9;=ABBB<*>599:==584.381+1002*),4'222/2/-)--'//2
+@ERR005448.109219 IL40_2446:5:1:1787:342/1
+GAGTAACTTCTATACTGTAGAAATTATCTTCAAATCATTTTCCTGTAAGATCGG
++
+CCC??=1=AA<9>006??:?=BAA<=6?;5:A@?BB@:9:3&1:=15
+@ERR005448.109220 IL40_2446:5:1:1787:217/1
+AGGGAAGCATTTGTTGATAGGGTCTCAAAATCAACATGGTGAAACACCGTCTCT
++
+;A>A<==A>AB?@;A97<0::?5B@==>996B=;55)58*249;6<;6;4:;=7
+@ERR005448.109221 IL40_2446:5:1:1787:1132/1
+CCATTTTGCAGACAGGCACTACTTTGTAATGACAGCCGCTGACCCCTTCTCATC
++
+B@@@BB?:>@<:=:==?2?:7@=;673=<::5667,4/&.5>>6-82&)/*:
+@ERR005448.109222 IL40_2446:5:1:1787:250/1
+TCCGTGTCTCACGTCCAGGTCACACTGATGCAAAAGGCAGGTTAGATCGGAAGA
++
+BAB@B?1?@BBAA=B?3=A<=/>AA=:;?;8:;==';>>8;69=;?>=;:7'
+@ERR005448.109223 IL40_2446:5:1:1787:194/1
+AAAGCATTTCTTAAAATAGTAAATTTAGTTGATGGTCTAGTCTGATTAAAGGGT
++
+?A>BB>AB@BACB?31=<>3>><@A@>A9C<<87?=::6@9<9:6:4&
+@ERR005448.109224 IL40_2446:5:1:1787:1365/1
+GAGGTATACTAAGTTTCAGCACCTCAGCTCATGAAGAGCAAGGGCTAGGCTGAG
++
+:(;>,@:>@?::;:@BB?;>.=@:?;8=7737:;3.4673735/7255/2--.7
+@ERR005448.109225 IL40_2446:5:1:1787:974/1
+TATCATTTTTCATTTGTTTTTATTTCTTCTTAGTAATTGGAAAGATAATATAAC
++
+CDCA:7CD>@C7CE@C==@CA:<@@9+1
+@ERR005448.109226 IL40_2446:5:1:1787:356/1
+AGTCCCATATTTCTTGGAGGCTTTGTTTGTTCCTTCTCATTCTTTTTTCTCTAA
++
+A@=?C@6?:AACCCBC93;AACB?;8?A;=CC@BA>7305@<3>6?:?9=89.<07'36,79==7*6=>@?>37@
+@ERR005448.109228 IL40_2446:5:1:1787:1263/1
+ACCAGCCTGGCCAACATGGTGAAACTCCATCTCTAGTGAAACTACAAAAATTAC
++
+?AAA;AB=77??68>6=<:29379<:==7=@?@:/,45436:96;:37&70'/)
+@ERR005448.109229 IL40_2446:5:1:1787:498/1
+CTTAAGTTGTTGAAAGTACATGTCAAAAAAGGCTGCCTGCAGGGACCAGGGCAC
++
+BBB=7>:<>?B@86*41??9?:<>68(<2;90:8>=;29<483/86'26339'6
+@ERR005448.109230 IL40_2446:5:1:1787:567/1
+TCTGGCCTTTTGGGAGAACGTTCAGCGACAATGCAGTATTTGGGCCCGTTCTTT
++
+BBA??@BBBB@??<)<66??>??=:?:.=2:;:<29/)7190/5=?<739>>9=
+@ERR005448.109231 IL40_2446:5:1:1787:19/1
+TGAAAAAACAATCTTGCCAACCCTACCAACTGCTGATGAGTCCTTTTCTGTTTT
++
+9?;=;991586/437?>>5)<::9<<<693:77(9/7),4/65//65&6464-&
+@ERR005448.109232 IL40_2446:5:1:1787:716/1
+AGAAAAGAGGTTTAATTGGCTCATGGTTCTGTAGGCTGTATAGGAAGCATGGCC
++
+8;;;:;<3;6:@?5.9?<9?=79/1,6'6)341'126-/02//3+
+@ERR005448.109233 IL40_2446:5:1:1787:1453/1
+TGGAATCATTGAACGGAATTGAATGGAACCGTCATCGAATGAATTGAATGCAAT
++
+A=<;>AA<@:;88?=9/(9=;96<;7.5?=999(5=53'64129617;67:3',
+@ERR005448.109234 IL40_2446:5:1:1787:892/1
+AAAAGCAGACAGCAGCATTGTAAGAAACTACTTTGTGATGTTTGCATTCAAGTC
++
+??>=15331><=?99>=453).;;<4>><4;29,6:8:<<7(695;9-=<;4':
+@ERR005448.109235 IL40_2446:5:1:1788:442/1
+TGAGATTACCCTTAACATTCTTATATATGATTAATCAACAGAAATCTTAATTTA
++
+CA@>:CCDCACCA<@<@DCCC:;<.'(464;A==><30:<8<:@C@48311B?;2+;(6.4(9@>((0(9/84'%(8;1%
+@ERR005448.109237 IL40_2446:5:1:1788:2008/1
+AGTGCTCAGTCTGTCCTCACTGTCCTCTGCGTGATTGGTGCTCAGTCCATCCTC
++
+?64BABB>?BBB@?@@@<<:@>:<:>@B?=5;8-5@920?@:4'25<7489689
+@ERR005448.109238 IL40_2446:5:1:1788:1254/1
+GAATGAAAGAATTAGTCCAGTTAAAGGAGCAGCTTCAGGGACTGGGCCGCTTCC
++
+@9/;A)76<.6?B8;6?/2.<4><6A6(>@<8;6(6-)-7/(8540(4(9.248
+@ERR005448.109239 IL40_2446:5:1:1788:600/1
+GCAGCGGGTGAGTCCGGGATACCCTGGGACACCCCTCACCCACACCCCGACGCG
++
+>>:><<>95535:3'4;:971>775.06'7+%4<92315/4%-%390&%-).))
+@ERR005448.109240 IL40_2446:5:1:1788:1441/1
+CCAGGACCTTTGCCTGAAAGACTTACCTGGGATTCCTAGAGTTTTAATTATTCA
++
+C=1694?C<2=6AC=655)25<=09>@=8/517=?>;-7/42;;61&6:9;6:5
+@ERR005448.109241 IL40_2446:5:1:1788:462/1
+TTTTGAGACGGAGTCTCGCTCTGTCGTCCCGGCCCGCGTGCAGTCGCGCGCTCC
++
+>??:<<>:;;33;6:>>8:@@0-393-.70,,45'*3%/14'3,%2.,4/).3*
+@ERR005448.109242 IL40_2446:5:1:1788:1207/1
+TGAGCCTCCCAGAGATGTTATCTTGCCTGGAATCCCCTCGTTTTAGTTTACTCG
++
+B9BA>=7BB?9@>A6:?4;7=4><(-64954@A<,-5<)+910>(9;5&1).
+@ERR005448.109243 IL40_2446:5:1:1788:846/1
+TGCTGGCAGATTAGGGAAGATGGCTAAGGGATGGATTGTTGGTTTTAGCAATAT
++
+BBBB@AA;@;=?7=624893:;>><75=<9/8?7/5<.986:48?;7389.3/3
+@ERR005448.109244 IL40_2446:5:1:1788:1356/1
+TCCCCTTGAACGCTTATGACTCTTATAAGCCTCAGAGCTAGAGGATAAGACATC
++
+A>AB97:)6<6?=?A?9;2:A6?;9:<:;=B@?<937881;/89.773728(/-
+@ERR005448.109245 IL40_2446:5:1:1788:926/1
+GGGTCCTAGAATTAAATAGACCAAGTGGAAAGTGGATTTAGTGTGTGGTATAAA
++
+ABA=CCA<>37?@:;;?=83?@7'56;;;4773=769<528:873677,55,&5
+@ERR005448.109246 IL40_2446:5:1:1788:935/1
+CCCAGGGTACAGCTGTAGGCTATAAAATTGCTCAATTGCAGTCTAGAAATGGCT
++
+BBA@AA')38&829=<8?=A;3101'6://1.7<6+==,/82;37=5/,+''1)
+@ERR005448.109247 IL40_2446:5:1:1788:455/1
+AGGCCCACCCCTCCCAGCCCCAGGGGCCCAGGGCGCCCACCCCCCTCACCCCCC
++
+::;543.8<<85:'66--.60633%%*.-,57+*%'
+@ERR005448.109248 IL40_2446:5:1:1788:1323/1
+GCGCTACTCATAATAGCAAAAAAGAACCAAAAACAAGAAACCGCCTAATATCCA
++
+A@:7:<6??;-A@<8?8==<;1<<>/'8>:<7'.8?-=1(3'3&8,.',/&'76
+@ERR005448.109249 IL40_2446:5:1:1788:838/1
+CCCCTCTGGGGAAAAAAGCACAGGCCTATCATGCTTATCATTCATCAAGTACAC
++
+ABB?@B>6>?@9077717=<>5>9>@809>'7=?>;19;47958547149/9
+@ERR005448.109250 IL40_2446:5:1:1788:450/1
+ATAGACTGACTTGCTTTGGATTCTATTAATGTAGATGTAGACAGTTTCATCTTT
++
+?@?CCCC?2>CBCB@C=;=3;?BA;>@86?9:;>6<;6:==A;?-@@<3=28<@
+@ERR005448.109252 IL40_2446:5:2:0:1500/2
+AAGCAAACCCATTTCTAGGAACTTTTTTCGTATCTTCTTTCTAATTTTCACAAC
++
+C=0:ACB=;?CABA7@@@B??><@BBBB?<<>8?A?B?9>@?9:BBA@ABBA>7>>??;?
+@ERR005448.109254 IL40_2446:5:2:0:141/2
+TAAAAAAACTATTTTTTAAAACTAAAGGACACTATCATTTATCTAAAAAGGGGC
++
+@A?<6BCCBCA@CCAACA??BCACBECCBCBAAB=?FEF>@>B>BBBC<;973>
+@ERR005448.109255 IL40_2446:5:2:0:394/2
+GCCCAGGCTGTTCTTGAACTCCTGACCTCAGGCAATCCGCCTAGATCGGAAGAG
++
+4<272<<57??7<35:41=?9.<9>??..':.7-/<59401.'%0'6'767<
+@ERR005448.109256 IL40_2446:5:2:0:496/2
+GACACAAGCATTCTCAGAAACTTGTTTGTGATGTGTGCCCTCTACTGACAGAGT
++
+9??7>B?:>?>AA?8<:<<<=A?=:B@A??=@<9783;99@@@@>::?:?:25;
+@ERR005448.109257 IL40_2446:5:2:0:553/2
+AGAATTCCCCCAGTCTGAAATGGACACTGCAGCTCTCATTATGTGGTGAATCTT
++
+@7/)5?59;75;=88:88B;0652;88=45.%.048753:638633'23266.6
+@ERR005448.109258 IL40_2446:5:2:0:990/2
+AGGCCGGGTCCCCGCTTGGATGCGAGGGGCATTTTCAGACTTTTCTCTCGGTCA
++
+?48A:608;7=4714?6',:632638438.848833,/4/78?8-601,*)204
+@ERR005448.109259 IL40_2446:5:2:0:386/2
+TGCCTGATACCATTTTGTTGAAATGGGTCTGGCTAGGCAGTTGGATGGGCAGAC
++
+=69;<8<>;9<:;=;=?5:9@>>5(53'5222:@=9<=A6/8)8(.9;?8<9<;
+@ERR005448.109260 IL40_2446:5:2:0:1001/2
+CCTGGCTGCTCTGTGTCTGAGCAGCAATCGAGAAGTGACTGCCATCCACTATCA
++
+>:85/<9499<5514<=>/<41939@?<>9<95<:2'795'5<725?>9;68?8
+@ERR005448.109261 IL40_2446:5:2:0:1663/2
+CTACTTGGGAGGCTGAGGTGGGAGGATTGCTTGAGCCAAGAAGTTTGAGGTTAT
++
+AA>>4.1;32;309=8=
+@ERR005448.109262 IL40_2446:5:2:0:27/2
+CATGACTATGCAGTAGTTATGATTCCTACTCATTCTGACATGCTGTTAAACTGC
++
+@==89>:;;24>9;::;?A:57>?@<>=9;;?;?<;399=956;7:9<4,/62/
+@ERR005448.109263 IL40_2446:5:2:0:61/2
+CGGCGGGGGCCCAATCCGCTCCTGGCGACCCCGAGCGTGCTTCGCCGTGGCTGG
++
+/5,05>/.29<4@;<62'55%2/1'0526.',2*')00.12%38(..,)2%-'9
+@ERR005448.109264 IL40_2446:5:2:0:111/2
+ATGTGGTAGCTATAGGCATTATGTTACTTTTATGCCAGCATGTGAATGTAAACA
++
+A>746'2?1>@>;@:88???A;3;=:<@5B@<9175::739(,08863,<83'9
+@ERR005448.109265 IL40_2446:5:2:0:1055/2
+TAGGAAAGAAGAAACCAGATTTATTTAACATAGCATTAAGCTTTAAAAATGATC
++
+E?>>A<=>BA8=>=:7@=CDECCEC@?==EBC909;ABED;A9A?CCB=;?B?B
+@ERR005448.109266 IL40_2446:5:2:0:1181/2
+ACAAAGTGTACAATGAACCATCAGAAAGCAAAGGTGTCACTATCTCAGCCACAC
++
+?B>B@A:<=BBB?>8@BA=?=5=3=@@<=BB>>>5=65<9+/1/<@9'79242=4486+97>
+@ERR005448.109268 IL40_2446:5:2:0:1807/2
+CTTAACAGAAAGAGCAACTACAATAATGAACACCAATATCCATGGACAGCATCT
++
+?C?6>9;@A?BCBBAC=35<64?AB=@9>?248AAA@A?2:9+98;-;218((1
+@ERR005448.109269 IL40_2446:5:2:0:1966/2
+GGGATGTGTGAGCTCAGCTAACTTGAAAAGAGAAGACGTGTGCCAGAGATCGGA
++
+/9697/73:/;:>A=;.6@==9?;19??@<;:;;6949222'230,1147-218
+@ERR005448.109270 IL40_2446:5:2:0:446/2
+AGCCATGGCACCAGCCCAGCACTGTGTACATCGAGCTTGCGGAGTCCACCGGAG
++
+::9,65<<<<@8@A@A2=A60/388==<17-3986+2:44.*-%-823,),.
+@ERR005448.109271 IL40_2446:5:2:0:527/2
+CACTAGCCTTTCCCAAAACAGACAGTTGAAGTTGAAGAAAGAGTTGAAGAAACA
++
+AAAB<98?BB?BA@?@@B@@>?B?<8;<9;=37=55<><;51:09<.59?8=
+@ERR005448.109272 IL40_2446:5:2:0:1524/2
+TATAAAGGACCCCTTCAGCTCAATAATAAAAAGGCAAATCATTCAATCTAAAAA
++
+B>?@D?27?@@@@=AB=@;@B@=AC?CCB?>=817@?B;4B=B?
+@ERR005448.109273 IL40_2446:5:2:0:137/2
+ACATACATAAATGATGGAACAGCATTCAGAATCCAGAAATAAACCCTCACATTA
++
+B=;9=AB=>1<=<>904=A@923-8@?>9===@:>:>??89;:6<<<@=>:<9>
+@ERR005448.109274 IL40_2446:5:2:0:459/2
+TATAGCAGTGTGAGAATGGACTAATACACCTTGATACCTTAGATATTCAGTTAG
++
+A>=93=>3%%//;3:B@634=:;39=443)
+@ERR005448.109275 IL40_2446:5:2:0:516/2
+TACCTGCCTGAATGAGGCAGTGTTCTAGTTTGCATTCACACAACATTGCTTACA
++
+AC@>2>@?;0939A<68;9428/:<=9>3<:198<:7:/<5A7994./4@<85,
+@ERR005448.109276 IL40_2446:5:2:0:1513/2
+AAAGATCTCACATGATTTTCTCTCTCCTATGACAGTATTGAATGAGCTTAAACT
++
+AB<;=<,;.6293-;??><4?6;9:39@<80769,15@81875)-,28>686-/
+@ERR005448.109277 IL40_2446:5:2:0:1341/2
+TTCTGCTTTCCATCCTCTAGTATTAAAACCACCCAATGATTCTCAGTCCCTTGC
++
+<<>6;9=BB=?@?>=>@A>=;@8;<=89A?557;@>B;;-/-121<63
+@ERR005448.109278 IL40_2446:5:2:0:407/2
+TTCTCAAATACTCTTAAGACAGTTTTCATCTGTTCCTAATTTTCTCTTTTTAAA
++
+A?:C?>=A>:=@CBBC?;=?;<:??=;=@<9<;?=>A77:<:>8BB@@?:@A:<
+@ERR005448.109279 IL40_2446:5:2:0:417/2
+TTCCTCCCCCTCTCTCTGTCTCTCTGTCTGTCTCTTTCTCTCTCTTTCTCTTTT
++
+AA?A?@<=BAA:=<66>0/<83<56'60884:8;3/5/968+36=A7&61,,/&
+@ERR005448.109280 IL40_2446:5:2:0:1439/2
+TCTTCAAGTTAGTCTTTCTCTGACACTGATTTATATTATAGATCAATAGCCTCA
++
+AA@>99<=?;:8=@A9;>?:::@=A<;?AAB=7>@=?><=;4=;::,8;;AB
+@ERR005448.109281 IL40_2446:5:2:1:727/2
+GACGTTGAAAAATGGCTTAAATTCTCTAACTAAAATAACTCCTTCATTGTGGAA
++
+0;=:?B>>ACCCB;39CCBA>ACACAB?>CCBCACCCDCAA:A@DFCB?>9><8
+@ERR005448.109282 IL40_2446:5:2:1:1111/2
+CAAAAAGACCCACGCAAAGAAACATCATCATTAAAAAACAGAAACACCAGGAAA
++
+=A=<8?:;0:>A@9@>???:B@AA;@@>>5'8@;5=@@AB:=7B?:?
+@ERR005448.109283 IL40_2446:5:2:1:1548/2
+GTCTTGCTTTCCATTGTTTTAGGTATATACTCAGAAATGGAATTAGTGGATTAT
++
+39AA@BA79BAB?B=?8=@AAC=7B?>BC5%7:2;BB?=
+@ERR005448.109371 IL40_2446:5:2:3:9/1
+AAGTAAGGGCATGGGCACGGAACTGGCAGAGAGGGCGTCATGAAGGTGCAGGAG
++
+6%68>?466::>.3-4=823<=;26..8563865'3.)-3/*6*-,%/1'1111
+@ERR005448.109643 IL40_2446:5:2:10:7/1
+GGATTCGGGGCACTAATGCTATCAACACAATTGTTTCCCTCCATCTGACGTGGC
++
+:/99?B?BA3A@BB@A?=@BBBA>@>9>A>9/97.4'/8
+@ERR005448.109645 IL40_2446:5:2:10:5/1
+GCAGACATTCACAAACATCTGTCTTTCAACCCTGAAGAAATGTGTGGGTCTAAG
++
+3.5:977;@48B;???A;A<9=<=?;1969@;:71;8<;8094>94284<9:90
+@ERR005448.109865 IL40_2446:5:2:15:8/1
+TGCTTTTGATTTTACAGGCTCACAGAAGGAAGAGACTTGCCTTGTCTCAGATGA
++
+<06AB?946@>A>A2871=:6/45:.4
+@ERR005448.110159 IL40_2446:5:2:22:8/1
+CGTCGGGCAATGAACCTATTACAGTTACAGGAGTGTTAACCCCCTGCACTTCCA
++
+==6@94;?=BA?;89A@@>>B;19?4975;://74417>
+@ERR005448.110266 IL40_2446:5:2:24:1173/2
+CAGGAGTTCGAGGCCAGCCAGGCCAACACGGTGAAACCTCGTCTCTACTAAAAA
++
+B?6=?;>A@?A?7=>@<@?A===@BB@@A;<9;A@@BBA
+@ERR005448.110319 IL40_2446:5:2:26:5/1
+AGAGTCAGTCAATGGTTGGTGGTCTTCTTATCAGGAGAAAGTTACTGAAATCAG
++
+>;?<;B??A?>@@=<>A<9:7=9A@B>BBB??@BBBB=BB?<850:6:B:8>?<24=<@=>8<84B>78@A7<;4
+@ERR005448.110510 IL40_2446:5:2:30:1/1
+GGTACTTGGGAGGCTGAAGCAGGAGCATCACTCGAACCCAGCAGGCGGAGGGTG
++
+''1?B<;73'5:35=9?@;<:6>:1,92:84>;'282:654%44:4%4346%6<
+@ERR005448.110678 IL40_2446:5:2:34:7/1
+CACTTGATCGAATCAACTATTGATTCTTTTGCATGTGTCATGAAGTTTTCGTAC
++
+CAACABBBA9?=>@?A?BC@B@=?C@ABBAB79>=@@=9;>9/7<;=?C@6:?=
+@ERR005448.110684 IL40_2446:5:2:34:4/1
+TAATTTTTAAGAAAAAAATGTAGAAGAAGATATACCAAAATGAGAAGCGGATGC
++
+?BCCB@A>A=4:BA<>>@?=230455-16@?=;<447>;:729+63+&01,448
+@ERR005448.110927 IL40_2446:5:2:39:2/1
+ATTGTGGTGAGCCTGCAGGGTAGGGCTGCTGCTCATCTGACATTTCGGAAGGGT
++
+>B<854;:9;2B>5.26<282550025,33'3.4;<@:5519>2:1.172)),/
+@ERR005448.110962 IL40_2446:5:2:40:1022/2
+ATTTCACATACACTAGAAGAATGTGATGGTACCTGGCACCACATCTAGAGGATT
++
+CCCBC?7?CC@B>C=:@A=@?B>8@??<46C;5==7.>;1A;@>5@;6;;;8;:
+@ERR005448.111238 IL40_2446:5:2:46:8/1
+ATGATCAAGTGGGTTTCGTACTAGGGATGCAGGGATGGTTTAACATATGCAAGT
++
+B@@ABBBA?=<;;=B?=:98761
+@ERR005448.111443 IL40_2446:5:2:50:2/1
+AAGGTGCCCAGGACAGAATTGAGATCATTCACACAGTGAGATCGGAAGAGCGGT
++
+B@;8>:;BB:7=@A?9;<@=5=??@@AA?@@<><<*2.9/7<9*3577863427
+@ERR005448.111702 IL40_2446:5:2:56:404/2
+ATGCTCTTAGTGGCATAGTTTACAATCACTGTACAGTAAGGACTTCACCCATGC
++
+?<36BBBB887BBBB?<@:ABBB@?BBBB?BA>A=<;=?BAB=
+@ERR005448.111823 IL40_2446:5:2:58:11/1
+CGGTTCAGCAGGAATGCCGAGATCGGAAGAGCGGTTCAGCAGGAATGCCGAGAC
++
+==80BB54>>;@BB@>>>5<5<63723<;9259.3;484@:8882/-55.995.
+@ERR005448.111960 IL40_2446:5:2:61:4/1
+AAACTAGACAGAATCATTATCAGAAACTGCTGCGTGATGTGTGCGTTCAACTCT
++
+?CCAAA@>=@17>A4@>;';>A=;=<>::0.8::9:9:33?122-0<6997889
+@ERR005448.112409 IL40_2446:5:2:70:6/1
+AAGAATGTGGAAGTTAAGGGAGAAGAAATGTCAGTGTCATTCCTAAAGATAGTG
++
+BA<>;95-;><88141<<6<<>:9,9,3.+/
+@ERR005448.112593 IL40_2446:5:2:73:7/1
+AAACTCAGGTCCTTCTGATTCAAAAGACACTGTTCTTAATGACTGCAAGATGGA
++
+CCBB<8@>:A?CC=CBAA@BCC@?A<<=><86/=5<6/1
+@ERR005448.112594 IL40_2446:5:2:73:2/1
+ACTGTCTTCTAGGCCACTACCTTTTATTTGGACAACTGCTATAATCTCTCAGAT
++
+@>@?=;@>;95:@<==B><:;A@=BB7/26;?:98-7;=@;?>=:3;63*78
+@ERR005448.113018 IL40_2446:5:2:81:5/1
+AAAGGACTGCAGCCTCGGGGAGCCAGGGTCCCCTCGCAGACGAGCTGCCAACGC
++
+@B;.9>A?@@A?<@A@96:<9:8<<69:58:5=8;666131/52005431/1*2
+@ERR005448.113030 IL40_2446:5:2:81:1185/2
+TGGTATTTGGTTTTCTGTTCTTGTGTTAGTTTGCTAAAGATAATGGCCCCCAGC
++
+B?C(>CA@BA;ABCC=8>@B>8BBB@A69A9>8<;9=@??9?=9?=;;>6
+@ERR005448.113477 IL40_2446:5:2:90:4/1
+CACAGAAAGGTCTCCAGGACTCAGGGATTCTACACTCAAAAGAGGAAGCCGGAG
++
+8:@:486@@8(>B@@2?>??:?;7=?1=BA718B?B9<=33=186/;738211:
+@ERR005448.113486 IL40_2446:5:2:90:9/1
+CCCAGGAGTTCAAGACCTGCTTGGGCAAAATGGTGAAACCTCGTCTCTACAAAA
++
+BBB==;?;8.;?B@AA=;;3;>=;;7=9:6=A>BAB87;9
+@ERR005448.113892 IL40_2446:5:2:97:3/1
+TCCCACCAGTGTCCGGGGACCTCCCCCAGCCCACCAGTATCAGATTCTATTCCA
++
+BBBBBBA@B@?>BA<99@@><8=0A;;65=7
+@ERR005448.113981 IL40_2446:5:2:99:8/1
+CACTATTTTCTTCTGTAACTTCACTGTCATATATTCATAAAGTAAACATACACA
++
+CC=B>7B@A@ECC>BDCEAAA:AA<;???CB:C
+@ERR005448.114363 IL40_2446:5:2:106:9/1
+AACAGTGGCCATCTGTAAGACATGGGCTAGATACCAGGTGATTTATAGGCATTA
++
+@@?BB????@BB8>@<=ABB>=:B>.@A:;=1@?@@7:A>=?8/:<<@43
+@ERR005448.114528 IL40_2446:5:2:109:7/1
+AGAGCAGTTAGGAAACACTCTGTTTGTAAAGTCTGCAAGTGGATATTCAGACCT
++
+B@=@C<4>CC?>ACA?=BBB?@C@@==?<:=<=200:=AC=8;4B<77(:=:?6=:751,*7'6:=;==9;>A906--062521278
+@ERR005448.114977 IL40_2446:5:2:117:10/1
+GAGTGCTCTGTTTACCTGGCTCAGTGTCTTAAAAATGGTATGGCCCTGCAGACC
++
+>A?8>@BBA;?>?BBBBA>AA?=?>BB?B@A?79=?<95<<:563199746:7;
+@ERR005448.115120 IL40_2446:5:2:120:4/1
+ACTTGCCTCCTTCACTATAGGCAACCTTTCAACCACCTGTCCTCCTTTTTTCGC
++
+?A==;?>@?3'4BA<;?:>7B?8/1-5;000'-6'53'.43;4-,06'15)&&/
+@ERR005448.115222 IL40_2446:5:2:122:6/1
+CCAACACTAAGATCGAAGTGTAGAAGTCCGTGAGTAGAGATCGGAAGAGCGGTT
++
+>;@B>@A@?BBB>8:<<0:?A<>@??>=9;5;<7,>@A???3??8<;9?699
+@ERR005448.115757 IL40_2446:5:2:130:2/1
+CTCAAGGGTGGAGGGTGGGGGGAGAGAGAGGATCAGAAAAAAATAACTATCGCG
++
+BBBAB??>25;B@5:6?<>@>98?;@=A=08-7.=;4>7?:?;(<8'4<1'/'1
+@ERR005448.115780 IL40_2446:5:2:131:7/1
+TTCAGGCCGTTAATTTTTATGGCGGGGAGGGGGGGGATGGCTGTGGGGGTGGTG
++
+@;@;.3??B2<:<=2?52:865<66%,%%%/.3-)%%%,.%))%&%%%,%%*,.
+@ERR005448.115980 IL40_2446:5:2:134:5/1
+TATTGAGTTCTTAAACTGCCAGTACCTCTACAAACACTTTACATTTTCTTGTTC
++
+CBCCABA?CCC?@=C?BAB9=<;B@?C?B@:B>=>@>@@===<2
+@ERR005448.116052 IL40_2446:5:2:135:9/1
+ATGATCCTTGCCTGTGCTTCTTCGGACCATGCGAGTTTGGACACTCACTGCAGA
++
+=>;@8=>16/8B1)89>>;12<;(64=7@@3(;761>99(0080087++3''5;
+@ERR005448.116175 IL40_2446:5:2:138:9/1
+ACAGACTAATACAGTAAATTGGTACCAGGGGTGGGGTGGGTCTCTGCTCCAAAG
++
+B@3:A;>AA@@52==?AA@=@@7>914<@(=4<3>5&7;4--4(65(<(6.--3
+@ERR005448.116325 IL40_2446:5:2:140:10/1
+GGAGTAGCAGGGATCTCCCTTCAGAAACAACAAAAATAAGGAGTACCAACAGAG
++
+==5=4=?66)14>:>?AA5)4-768;2'-:<:=;3''07471-'4,985*0432
+@ERR005448.116328 IL40_2446:5:2:140:4/1
+CTTCAAGGCATGTCTGGGACATTGTGGACAACCCTTTGTGCCTAGGGAGCATGT
++
+@BBB?;;BBBB@BBA:7;?BAB==BA>>>BA8B<=4A<2><:
+@ERR005448.116567 IL40_2446:5:2:144:6/1
+TGAAATCCAGGCAGAGGTGGTCTCAGATGGAGATGAGGTATTTGTTGGGAACTG
++
+@?BABBAB>9<=;;=A>7@>97)2<;:;702<0:?582&3=;>::5*56/6059
+@ERR005448.116665 IL40_2446:5:2:146:123/2
+AGACAAGGCACCCATGTCTTATGTATAATCAGTCATTGTTATTATTTATCAACT
++
+B<<+=A5=@<9<@=0;6>BB=<<6>CBA@B9635=@@:49C==16?83<7;A2;
+@ERR005448.116734 IL40_2446:5:2:147:8/1
+CTTGTTTTTCTCAGGTTTGTCAAAGATCAGATAGTTGTAGATATGTGGCGTTAT
++
+B@<;A?;BC@<<<9@?CCBAB==@?9<'884??A>CB:=:9<9<@6;549;A9B
+@ERR005448.116758 IL40_2446:5:2:147:6/1
+AAAATCCCTCAGCATTTGCTTGTCTGTAAAGTATTTTATTTCTCCTTCACTTAT
++
+B?>8@A;?CC=BA=ACAA=B@::@A??@@=@;<A?>>@<;A>B;6=;8??@;9.6
+@ERR005448.117056 IL40_2446:5:2:152:8/1
+TAGAGAGGAAGGTAGGAAGAAAGGAAAGAAGAGAGTGAGTGGAAAAGAGGAAAG
++
+?=:?B8=;:;;<(6?=>=76++0:3?2842.(-,7,:48(6.2(,65,434707
+@ERR005448.117136 IL40_2446:5:2:153:6/1
+TCATTAAAGCAAAGTGCCTGACATTTCCATTGTCCAGTCAATGATGTCCTCGGT
++
+B>;>=@>=6326:<6<<(;??:886?712687-1;;98=2790-0=3--0
+@ERR005448.117143 IL40_2446:5:2:154:1/1
+TTAACCCCAAGAAGAAACCCTGCTCCCCTGACACGTCACTCAACAAAATTGCTA
++
+@BBA@>?:?9)>=>AAA?50<95>:8>(:))(7+005'-2775<=525'-,+-1
+@ERR005448.117448 IL40_2446:5:2:159:3/1
+ATAGACCAATGGAACAGAACAGAGGCCTCAGAAATAATACCCCACATCTACAAC
++
+BBBBBBBBBBBA@B?@@BAB?B<;;<;BA@<=<>@=<@6=@8=80
+@ERR005448.117514 IL40_2446:5:2:160:8/1
+CCTCCCTCCCCTCACATGGTGTTAGGGTGTCATCTCTGTACCCTCCCTCCCCTC
++
+BBBABBBBBB?BBBBA@<;;?=/-;>;?<.,988
+@ERR005448.118230 IL40_2446:5:2:171:2/1
+ATATCCTTTTCTAACAATGAATTCTCACAAGCCAGCCAATTAGAATACATTTAT
++
+87:ACB@@70=9:<5>=8AACC<=A<8=877=:;:@3/8=>6;<9;<'><
+@ERR005448.118272 IL40_2446:5:2:172:5/1
+CAGTCTATGGTATTTTGCTATAGCAGCCTGAATGTTCTAAGACATGATTTCTGA
++
+><;;<@???A.@CB?*:45,(::6A796/77699><788<0;/0547523-'2'*/71154/72/9;403.;
+@ERR005448.118551 IL40_2446:5:2:176:11/1
+CTTGGTAAGGCTTTCATCTGTCTTTTTGTCTAGTCGAGCAAAAGTGCGGAAGCG
++
+>>A;A;>;B<<;A>B;B?@?B<;@B??<=8?AB>@99?@BB@A9/>8):<@;1>
+@ERR005448.118621 IL40_2446:5:2:178:4/1
+AATGTGAAACAGAAATGTTTTTATTATTTCTCTTTTCAAGGCTTAGAACAGGAA
++
+C@?CA?AAA>A@BBBCA7ACCCCCCBCAC@CBCCCC>:@
+@ERR005448.118812 IL40_2446:5:2:181:8/1
+TATACGAAGATATTTCCTTTTCTGCCTTTGGCCCCAAAGCGCTTGAAATCTCCA
++
+BB?>-::=?2<7879>9<>=6996;67278(79.0/104/0'5((4,12'2.&&
+@ERR005448.118894 IL40_2446:5:2:182:377/2
+AATTGGATTTAATTTTTAACCAAATTTAAAGTGCTATTTTTTACAACTTCAATT
++
+ADAECDECCACFDCDDFDDDCA@ACBCB?ABBCBC@CC=?B?@:?9<=??;AA=>9;;:5:85;9=
+@ERR005448.118981 IL40_2446:5:2:183:7/1
+CTACACACTGTATGATTTCAACTATATGACATCTCAGAAAAGGTAAAGCTATGG
++
+C@B@C@C>C:5AB<@;@<@=9<5:=8>@:04)6=7.399;;5
+@ERR005448.119133 IL40_2446:5:2:186:283/2
+ATATGAAATACCTGCATGATGAAATGCTACTCCCCATGGTACAGTTTTCTGTAA
++
+@CABBA@B?AB?>@@BAA=<::8B??@:CB@@CB86.
+@ERR005448.119280 IL40_2446:5:2:188:5/1
+TCGATTCCATTCCATATTATTGCATTCCATTCTATTACATTATATTCGAATAAG
++
+A@=@CBC>?CCC@@B@B<=@B@;8B?@41:?:C@=0=B<9;@?95=839;5:
+@ERR005448.119435 IL40_2446:5:2:190:9/1
+GGGGACCAGACAGACCACAGGGACAGAGTAGTAAGGAGAGGTGCTGTGAACTTG
++
+A=6??=;=6>>=A<3988:A
+@ERR005448.119692 IL40_2446:5:2:195:8/1
+CCTTCCCCCTGCCCCCTCTAGTAATCCCCAGTGTCTTTTACTTCCATATTTATG
++
+@B=@@BB@@B@B<>>A8<6@<@<;>8?A::>><2
+@ERR005448.120072 IL40_2446:5:2:201:396/2
+AGAGTCTCACAATGTTGCCCAGGCTGGTGTTGAACTCATGGCCTCAAGTGACTC
++
+AAA=<>A@A;A9@A@@@?>7=77<<
+@ERR005448.120170 IL40_2446:5:2:202:4/1
+CTTTTTTTAGTAAAACCTCCAGCCTTCTCTTCATTCTTCAGACATGCTGAAGAC
++
+BCB@A@CC=5;ACCC@@=?=?CA>;;@@;@AA;;??>C@;8>@B;?8@?@6=:4
+@ERR005448.120175 IL40_2446:5:2:202:7/1
+ACAAGAAAAAACAAACAACCCCATCAAAAAGTTGGCAAAGGATATGAACAGACG
++
+=CCC?CCB<:B7.75<18;76;*>8?<;<5295-46//).4/&-55+1)&&2
+@ERR005448.120183 IL40_2446:5:2:203:2/1
+ACTGTGCCTGGCTTGTCTTTTTTTTTTAATATTTGACATGGGGTCTTGCTCTGT
++
+CC@?6ACC9=>@<<7C>=:>
+@ERR005448.120332 IL40_2446:5:2:205:7/1
+GATTTTCCTGCCTCAGTCTCCCGAGTAGCTGGGATTACAGGCATGTGTCACCAC
++
+8@4??7@69>ABB>><6+:;<:=>B6;<@@@:@=@<99;;29/5;;8&5;265797;535893>>A?A?<>==
+@ERR005448.120951 IL40_2446:5:2:214:1211/2
+AATGCAAATGCATTCTCTCACTCTCTCTCTTTCTTTTTCTCTTTCCTGCNTTCA
++
+?72+56-*1C566D8%385%07+6EEC6)7;6.66%656816?@C+368!5@D.
+@ERR005448.121209 IL40_2446:5:2:218:9/1
+CACTCATTCCTTCAGCAAAGTTTATGGACTGCCTACTTTTGTTTCAGGCTCTGT
++
+BBBBB?BBBBBBBBBBBB@AABBBBBA=>BA<@B@;ABBBAABBA;4;;A?A>>
+@ERR005448.121325 IL40_2446:5:2:220:5/1
+GGGGGTTCAAGCAATTCTCCTGCCTCAGCCTCCCGAGTAACTGGGATTACAGGC
++
+ABA:52:@?@A@?=6>=3<6=988:56668666766329.21,3646531
+@ERR005448.121489 IL40_2446:5:2:222:3/1
+AGTGGCTTGTAGTTCTCCTTGAAGAGGTCCTTCACATCCCTTGTAAGTTGGATT
++
+A<9?<(;7?B@5=?2?6;A2A;@@@B?59:9B9610<748-;@735>7?@2053
+@ERR005448.121515 IL40_2446:5:2:223:7/1
+AAGGATCTTTTATTGGCTCTATAAGTCAATGGCAATTCCTTAAAACAGTTTGTT
++
+CC?A@CC?CCCC>?CCAAA:>?.<@;0::8?<9;?;218A?;:7868?@=;377
+@ERR005448.121678 IL40_2446:5:2:225:6/1
+TGAGACCACTTCAGCCTAGACCTTATTGTCCATATCACTATCAGGCTTTTGGTC
++
++49@A=6784>>674>;83>663)8>7'912
+@ERR005448.121854 IL40_2446:5:2:228:10/1
+CAGTACCATGCTGTTTTCATTACTGTCACCTTGTAGTATAGTGTGAACTCAGGA
++
+CB>4A@2>5@@:@:AB.=?B?BCA<=547;*57<;23<8581(8?93;A1'7/&
+@ERR005448.122399 IL40_2446:5:2:236:10/1
+ACAATCCTGCTGTGGTCTGAAATTTTGACCCTCACACAGGGTTCCAGAACACTG
++
+9?@@>B@<>?@>???@A@<=@=@BB@>?A;?B=:9AA;;;>5@;96;>;>;9=<
+@ERR005448.122462 IL40_2446:5:2:237:2/1
+GTGCCTGTGGCCCCCCCAATTCCTGGTGCTGGCCCCCACCCCCGCCTGGGACCA
++
+8113?339:<>BB<:>8@;4;84;0;82889295<89>@>:4%0256+.2170'
+@ERR005448.122703 IL40_2446:5:2:241:3/1
+CTAATGGAGGTGGACTACTTGACTGCTGTCCTGAAAAGTTATTTTTGTAAAAAT
++
+CC@C@CCCB;7=::4=?@C>:<<=87@7:=@B=?B==98=BC@@@A;<8;?=95
+@ERR005448.122821 IL40_2446:5:2:243:6/1
+ATATATTTCAAAAACACACTAGATATTGTTGAAGTACCTTGAATTTGAACTGTT
++
+?46==>:AC@DBC?4?6?>:2<=;5<=?:8@
+@ERR005448.123252 IL40_2446:5:2:250:2/1
+CATAAATATCCCTCATGAAACCCTGTGGGGTTTTATTGGATCAGTGCTGCAGGA
++
+@BA@??B@?5:@@BA9BA884>5;A9;9;ABA>A?51/>7.9<::<>-230*
+@ERR005448.124047 IL40_2446:5:2:263:5/1
+GGCATTCTGGGCTGGCACAGAGGATCACTGAACACCACTTTCTTCACGGGCCTG
++
+@=A>?>B@<=9@97@037;<13898659655@=:1:20(/1/%-14,
+@ERR005448.124124 IL40_2446:5:2:264:2035/2
+GTTAATCAGTCATCAGATCCTTCATTAAGGCCCTGTTTCATTTCTAAACCCTAC
++
+*7C@BA7:C=A7<>;>8?58?<=1168214/A>*@41):1((:6:>:<00051.
+@ERR005448.124276 IL40_2446:5:2:266:8/1
+CGTGTTTTTTTCTTGGCCTTATTTTTTGTGTTTTTCGCAACAAGTTTGTTTCGC
++
+?C9@?1;9@1B@;-9B=2=8=@?5;<,;.
+@ERR005448.124325 IL40_2446:5:2:267:5/1
+ACGGCACTGCCACTTTTCTCACCGAGGCCCAGCCCTGCCTCTACAGGTGCTGTG
++
+B@?8>(><<@6,8;;5>6@9>(@0-3?@;;;,;7'-3<67646,-%/-3836/%
+@ERR005448.124384 IL40_2446:5:2:268:1/1
+GTTTGAGCTGCATTTTGAAGCATGGGAGTGATTTGGATATGTGGAATGGTTGGG
++
+?1?B>69=B<=?;0);?2?63'5>7;;A<=);>7;@>@9:89@50++:27?2<5
+@ERR005448.124481 IL40_2446:5:2:269:4/1
+TGTGTGCACGCACACACAAATATAGATACACACATGTCCTGGAGCACCTCGATT
++
+B:'91?*9;2:,=<2?9'4285'*')&.2/&/)(.
+@ERR005448.124482 IL40_2446:5:2:269:9/1
+CCCGATATTTAAATCATCAACAGGAAAGGTTATGTACAGGAAGAAGAAACTAAA
++
+CE?A=>???@A7?A99=9<5:<7B@:8?876:-;/-7=C
+@ERR005448.124641 IL40_2446:5:2:272:3/1
+CACCCAGTTAAGACCTTCTATCCAAGTTCCTTGACTAACAAGATTCCAACAAAC
++
+C@CABB>@BC>=>A@C>?@4.7CA?=7>3'>==:=87)+8=2'9*.49/&6-9A
+@ERR005448.124657 IL40_2446:5:2:272:5/1
+TGTTAGGTAAAAAAGTGACAGTTTAACTGAGAAGCTACTCACCCTTAACTCATG
++
+CAACC@?6B@==;=8(@@<;>=CB>6<>76>:@?>;14;46:,32<60'1'256
+@ERR005448.124920 IL40_2446:5:2:277:1/1
+GGAGGCCTCACAATCATGGTGGAAGGCAAGGAGGAGCAAGTTGCATCTAAAGTG
++
+>B@7(6A@?6<:B@=B7;=>A=:>?:72->>>B:;?2(=AC>?:=9<=:A?=9<8@<5?B765:;7?
+@ERR005448.125610 IL40_2446:5:2:288:2/1
+ATTGGACTGTATACAGTCTGCACGTTTACCTTATTTTCCATTATATAATGGTAC
++
+ACCB@BCAA=:;==;;=;==B>9:;A@;@AB=<;9?<477=;5724368
+@ERR005448.125920 IL40_2446:5:2:292:4/1
+GTTTCAAACCTGAACTCTCAAAGGAAGGTTCAACTCTGGGATTTGAATGCAAAC
++
+A:B?CC@@=@+@@@@C<=?A:<=?5;<;:8?9:===72899789:.6177
+@ERR005448.126075 IL40_2446:5:2:295:7/1
+ATATGGATTTTATATAATTTGTCTGGGAAAGTCATTAAACAAATGAAGAAACAA
++
+?DC?C>BCDCCCCCCB=DCC@ACCABA??7(9=?BBCC?ADB<;;8??B=:-7=
+@ERR005448.126174 IL40_2446:5:2:296:2/1
+TACCTGGAAATGAGACCTAAAGCTAAAAATGAAACAACTGTCTTGTTATCATGA
++
+C@?7@;CC=B?CCCCCAC>??<;=>?AC@?=A>B;?AB<=>:?914
+@ERR005448.126338 IL40_2446:5:2:299:8/1
+ATGGAAAGAGAATTTGAGCTGATACTTAAGGCTCTGCTCAGCATTACATTTGGA
++
+A@BCB<<<7'6:8?8>=9=CA>A@A@8:56&1AA;A==<4?7@;;@<2:=?<:1
+@ERR005448.126477 IL40_2446:5:2:301:10/1
+TGTTTAATTGCTAGAGGAAGTATCTTCAACAGTGGTAGAAAGGGGAGGGTGCTA
++
+BBACBB?B?B@BBB?@BB?BA?<>@B><<=3?<55=561=;99*CB=:AC>;:===@;8:699:8:=7'296A=?5;
+@ERR005448.127106 IL40_2446:5:2:310:3/1
+TCTTAATCAGCAAATTATTAAAATTTAGGCTAAGAAAAGTTCTCTGCCCTCTGA
++
+;CA>=ACAA;AB@?BABBCC@AB@A=BB@:?A=?=C<@::A?CA>A98:7)9>6
+@ERR005448.127634 IL40_2446:5:2:319:4/1
+CTAAAAATACTAAAATTAGCTGGTGTGGTGGTGTGCCCCTGTACTTTCAGCTAC
++
+?ABA;;4A=4>@BB@;.(6>@<;:A?=?53;)5*6+'/<;8-&8637&)7'-&3
+@ERR005448.127684 IL40_2446:5:2:319:9/1
+ATCAGAAGCCCCACCAGAGAATGAAAGGTGTTAAATCAGGTCACTTTGAATATT
++
+=BCCCCAC?CAA=:<<@CB?@><=.<==@=;?;8?>5775?<><;;@<@A
+@ERR005448.127813 IL40_2446:5:2:321:4/1
+TTGAATGGAATCATAGAACGGAATCCAATGTAATCATCATTGAATTGAACCCAA
++
+?A=;7;CA4=B=?CAA?BB?C@<<4A@:/;=6=<<:69;:;@:756;4
+@ERR005448.127871 IL40_2446:5:2:322:6/1
+GGGAGAAGGGTGTCTCAGCAGCTCAGCCTCTAGGGGGCTAGCATAGCTTCAGGG
++
+A<;2/6.<7:378?@8416278462/',/.-%+0.260.24''*.-*&*.0-42
+@ERR005448.128705 IL40_2446:5:2:335:10/1
+CTCCATTACATGGCTAAGGATTATTCCTAATAACAGACTTGTCAACTCTCTGGT
++
+CCCCCCCCCBAACCCCABC?BCCCCBBA:@B@A=;