Skip to content

Commit 6762368

Browse files
committed
r940: added the splice:hq preset
for high-quality CCS/mRNA splice alignment
1 parent c2aec88 commit 6762368

File tree

4 files changed

+13
-5
lines changed

4 files changed

+13
-5
lines changed

README.md

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -18,7 +18,7 @@ cd minimap2 && make
1818
./minimap2 -ax sr ref.fa read1.fa read2.fa > aln.sam # short genomic paired-end reads
1919
./minimap2 -ax splice ref.fa rna-reads.fa > aln.sam # spliced long reads (strand unknown)
2020
./minimap2 -ax splice -uf -k14 ref.fa reads.fa > aln.sam # noisy Nanopore Direct RNA-seq
21-
./minimap2 -ax splice -uf -C5 ref.fa query.fa > aln.sam # Final PacBio Iso-seq or traditional cDNA
21+
./minimap2 -ax splice:hq -uf ref.fa query.fa > aln.sam # Final PacBio Iso-seq or traditional cDNA
2222
./minimap2 -cx asm5 asm1.fa asm2.fa > aln.paf # intra-species asm-to-asm alignment
2323
./minimap2 -x ava-pb reads.fa reads.fa > overlaps.paf # PacBio read overlap
2424
./minimap2 -x ava-ont reads.fa reads.fa > overlaps.paf # Nanopore read overlap
@@ -139,7 +139,7 @@ Nanopore reads.
139139
#### <a name="map-long-splice"></a>Map long mRNA/cDNA reads
140140

141141
```sh
142-
minimap2 -ax splice -uf -C5 ref.fa iso-seq.fq > aln.sam # PacBio Iso-seq/traditional cDNA
142+
minimap2 -ax splice:hq -uf ref.fa iso-seq.fq > aln.sam # PacBio Iso-seq/traditional cDNA
143143
minimap2 -ax splice ref.fa nanopore-cdna.fa > aln.sam # Nanopore 2D cDNA-seq
144144
minimap2 -ax splice -uf -k14 ref.fa direct-rna.fq > aln.sam # Nanopore Direct RNA-seq
145145
minimap2 -ax splice --splice-flank=no SIRV.fa SIRV-seq.fa # mapping against SIRV control

main.c

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -6,7 +6,7 @@
66
#include "mmpriv.h"
77
#include "ketopt.h"
88

9-
#define MM_VERSION "2.16-r937-dirty"
9+
#define MM_VERSION "2.16-r940-dirty"
1010

1111
#ifdef __linux__
1212
#include <sys/resource.h>

minimap2.1

Lines changed: 7 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
.TH minimap2 1 "30 April 2019" "minimap2-2.16-dirty (r938)" "Bioinformatics tools"
1+
.TH minimap2 1 "4 May 2019" "minimap2-2.16-dirty (r940)" "Bioinformatics tools"
22
.SH NAME
33
.PP
44
minimap2 - mapping and alignment between collections of DNA sequences
@@ -568,6 +568,12 @@ costs are different during chaining; 4) the computation of the
568568
.RB ` ms '
569569
tag ignores introns to demote hits to pseudogenes.
570570
.TP
571+
.B splice:hq
572+
Long-read splice alignment for PacBio CCS reads
573+
.RB ( -xsplice
574+
.B -C5 -O6,24
575+
.BR -B4 ).
576+
.TP
571577
.B sr
572578
Short single-end reads without splicing
573579
.RB ( -k21

options.c

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -120,14 +120,16 @@ int mm_set_opt(const char *preset, mm_idxopt_t *io, mm_mapopt_t *mo)
120120
mo->mid_occ = 1000;
121121
mo->max_occ = 5000;
122122
mo->mini_batch_size = 50000000;
123-
} else if (strcmp(preset, "splice") == 0 || strcmp(preset, "cdna") == 0) {
123+
} else if (strncmp(preset, "splice", 6) == 0 || strcmp(preset, "cdna") == 0) {
124124
io->flag = 0, io->k = 15, io->w = 5;
125125
mo->flag |= MM_F_SPLICE | MM_F_SPLICE_FOR | MM_F_SPLICE_REV | MM_F_SPLICE_FLANK;
126126
mo->max_gap = 2000, mo->max_gap_ref = mo->bw = 200000;
127127
mo->a = 1, mo->b = 2, mo->q = 2, mo->e = 1, mo->q2 = 32, mo->e2 = 0;
128128
mo->noncan = 9;
129129
mo->junc_bonus = 9;
130130
mo->zdrop = 200, mo->zdrop_inv = 100; // because mo->a is halved
131+
if (strcmp(preset, "splice:hq") == 0)
132+
mo->junc_bonus = 5, mo->b = 4, mo->q = 6, mo->q2 = 24;
131133
} else return -1;
132134
return 0;
133135
}

0 commit comments

Comments
 (0)