2013-02-01 02:59:48 +08:00
|
|
|
#include <stdlib.h>
|
2013-02-01 04:55:22 +08:00
|
|
|
#include <string.h>
|
|
|
|
|
#include <stdio.h>
|
2013-02-05 01:37:38 +08:00
|
|
|
#include <assert.h>
|
2013-02-08 06:15:45 +08:00
|
|
|
#include <math.h>
|
2013-02-08 02:29:01 +08:00
|
|
|
#ifdef HAVE_PTHREAD
|
|
|
|
|
#include <pthread.h>
|
|
|
|
|
#endif
|
2013-02-08 03:36:18 +08:00
|
|
|
#include "kstring.h"
|
2013-02-01 02:59:48 +08:00
|
|
|
#include "bwamem.h"
|
2013-02-02 05:39:50 +08:00
|
|
|
#include "bntseq.h"
|
2013-02-05 01:37:38 +08:00
|
|
|
#include "ksw.h"
|
2013-02-05 06:23:06 +08:00
|
|
|
#include "ksort.h"
|
2013-02-05 01:37:38 +08:00
|
|
|
|
2013-02-08 06:15:45 +08:00
|
|
|
// scaling coefficient of the approximate mapping-quality formula in mem_sam_se()
#define MAPQ_COEF 40.
|
|
|
|
|
|
2013-02-08 08:50:37 +08:00
|
|
|
// debug verbosity: >=1 prints the filtered chains (find_alnreg); >=2 also prints each extension result (mem_chain2aln)
int mem_debug = 0;
|
|
|
|
|
|
2013-02-05 01:37:38 +08:00
|
|
|
// Fill a 5x5 row-major scoring matrix over the symbols {0,1,2,3,4}.
// Symbols 0..3 score +a against themselves and -b against each other;
// every cell in row 4 or column 4 (the ambiguous base) scores 0.
void mem_fill_scmat(int a, int b, int8_t mat[25])
{
	int row, col;
	for (row = 0; row < 5; ++row) {
		int8_t *cell = mat + row * 5;
		for (col = 0; col < 5; ++col) {
			if (row == 4 || col == 4) cell[col] = 0; // ambiguous base
			else if (row == col) cell[col] = a;
			else cell[col] = -b;
		}
	}
}
|
2013-02-01 02:59:48 +08:00
|
|
|
|
2013-02-02 05:39:50 +08:00
|
|
|
mem_opt_t *mem_opt_init()
|
2013-02-01 02:59:48 +08:00
|
|
|
{
|
2013-02-02 05:39:50 +08:00
|
|
|
mem_opt_t *o;
|
|
|
|
|
o = calloc(1, sizeof(mem_opt_t));
|
2013-02-05 03:51:51 +08:00
|
|
|
o->a = 1; o->b = 5; o->q = 8; o->r = 1; o->w = 100;
|
2013-02-08 08:50:37 +08:00
|
|
|
o->min_seed_len = 19;
|
|
|
|
|
o->max_occ = 50;
|
2013-02-01 04:55:22 +08:00
|
|
|
o->max_chain_gap = 10000;
|
2013-02-05 13:17:20 +08:00
|
|
|
o->mask_level = 0.50;
|
2013-02-05 13:41:07 +08:00
|
|
|
o->chain_drop_ratio = 0.50;
|
2013-02-08 02:13:43 +08:00
|
|
|
o->chunk_size = 10000000;
|
|
|
|
|
o->n_threads = 1;
|
|
|
|
|
o->pe_dir = 0<<1|1;
|
|
|
|
|
o->is_pe = 0;
|
2013-02-05 01:37:38 +08:00
|
|
|
mem_fill_scmat(o->a, o->b, o->mat);
|
2013-02-01 02:59:48 +08:00
|
|
|
return o;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/***************************
|
|
|
|
|
* SMEM iterator interface *
|
|
|
|
|
***************************/
|
|
|
|
|
|
2013-02-02 03:38:44 +08:00
|
|
|
struct __smem_i {
|
|
|
|
|
const bwt_t *bwt;
|
|
|
|
|
const uint8_t *query;
|
|
|
|
|
int start, len;
|
|
|
|
|
bwtintv_v *matches; // matches; to be returned by smem_next()
|
|
|
|
|
bwtintv_v *sub; // sub-matches inside the longest match; temporary
|
|
|
|
|
bwtintv_v *tmpvec[2]; // temporary arrays
|
|
|
|
|
};
|
|
|
|
|
|
2013-02-01 02:59:48 +08:00
|
|
|
smem_i *smem_itr_init(const bwt_t *bwt)
|
|
|
|
|
{
|
|
|
|
|
smem_i *itr;
|
|
|
|
|
itr = calloc(1, sizeof(smem_i));
|
|
|
|
|
itr->bwt = bwt;
|
|
|
|
|
itr->tmpvec[0] = calloc(1, sizeof(bwtintv_v));
|
|
|
|
|
itr->tmpvec[1] = calloc(1, sizeof(bwtintv_v));
|
|
|
|
|
itr->matches = calloc(1, sizeof(bwtintv_v));
|
2013-02-02 03:20:38 +08:00
|
|
|
itr->sub = calloc(1, sizeof(bwtintv_v));
|
2013-02-01 02:59:48 +08:00
|
|
|
return itr;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// Free the iterator together with its four interval vectors and their buffers.
// The bwt and the query are not owned by the iterator and are left alone.
void smem_itr_destroy(smem_i *itr)
{
	bwtintv_v *owned[4];
	int t;
	owned[0] = itr->tmpvec[0];
	owned[1] = itr->tmpvec[1];
	owned[2] = itr->matches;
	owned[3] = itr->sub;
	for (t = 0; t < 4; ++t) {
		free(owned[t]->a);
		free(owned[t]);
	}
	free(itr);
}
|
|
|
|
|
|
2013-02-02 03:20:38 +08:00
|
|
|
// Point the iterator at a new query of `len` bases and rewind it to position 0.
// The query buffer is borrowed, not copied.
void smem_set_query(smem_i *itr, int len, const uint8_t *query)
{
	itr->len = len;
	itr->start = 0;
	itr->query = query;
}
|
|
|
|
|
|
2013-02-08 08:50:37 +08:00
|
|
|
|
2013-02-02 03:38:44 +08:00
|
|
|
// Advance the iterator and return the next batch of matches.
//
// Returns 0 once the query is exhausted; otherwise returns itr->matches, which
// belongs to the iterator and is overwritten by the following call.
// Each interval packs its query span into `info` (start in the high 32 bits,
// end in the low 32 bits). If split_len > 0 and the longest match is at least
// split_len long with a single occurrence (x[2] == 1), a second search is
// started from the middle of that match and its sufficiently long results are
// merged, in order, into the returned vector.
const bwtintv_v *smem_next(smem_i *itr, int split_len)
{
	bwtintv_v *found = itr->matches, *inner = itr->sub, *merged;
	bwtintv_t *longest;
	int i, j, max, max_i;

	// every vector starts empty on each call
	itr->sub->n = 0;
	itr->matches->n = 0;
	itr->tmpvec[1]->n = 0;
	itr->tmpvec[0]->n = 0;

	if (itr->start >= itr->len || itr->start < 0) return 0;
	while (itr->start < itr->len && itr->query[itr->start] > 3) ++itr->start; // skip ambiguous bases
	if (itr->start == itr->len) return 0;

	// search for SMEMs; the return value is where the next call resumes
	itr->start = bwt_smem1(itr->bwt, itr->len, itr->query, itr->start, 1, itr->matches, itr->tmpvec);
	if (found->n == 0) return found; // well, in theory, we should never come here

	// look for the longest match
	max = 0; max_i = 0;
	for (i = 0; i < found->n; ++i) {
		bwtintv_t *p = &found->a[i];
		int len = (uint32_t)p->info - (p->info>>32);
		if (max < len) {
			max = len;
			max_i = i;
		}
	}

	// only a long and unique longest SMEM triggers the extra search
	if (split_len <= 0 || max < split_len || found->a[max_i].x[2] != 1)
		return found;

	merged = itr->tmpvec[0]; // reuse tmpvec[0] for merging
	longest = &found->a[max_i];
	// starting from the middle of the longest MEM
	bwt_smem1(itr->bwt, itr->len, itr->query, ((uint32_t)longest->info + (longest->info>>32))>>1, 2, itr->sub, itr->tmpvec);

	i = j = 0; merged->n = 0;
	while (i < found->n && j < inner->n) { // ordered merge
		int64_t xi = found->a[i].info>>32<<32 | (itr->len - (uint32_t)found->a[i].info);
		int64_t xj = inner->a[j].info>>32<<32 | (itr->len - (uint32_t)inner->a[j].info);
		if (xi < xj) {
			kv_push(bwtintv_t, *merged, found->a[i]);
			++i;
			continue;
		}
		// sub-matches shorter than half of the longest match are dropped
		if ((uint32_t)inner->a[j].info - (inner->a[j].info>>32) >= max>>1) {
			kv_push(bwtintv_t, *merged, inner->a[j]);
		}
		++j;
	}
	while (i < found->n) {
		kv_push(bwtintv_t, *merged, found->a[i]);
		++i;
	}
	while (j < inner->n) {
		if ((uint32_t)inner->a[j].info - (inner->a[j].info>>32) >= max>>1) {
			kv_push(bwtintv_t, *merged, inner->a[j]);
		}
		++j;
	}
	kv_copy(bwtintv_t, *itr->matches, *merged);
	return itr->matches;
}
|
|
|
|
|
|
2013-02-05 06:23:06 +08:00
|
|
|
/********************************
|
|
|
|
|
* Chaining while finding SMEMs *
|
|
|
|
|
********************************/
|
|
|
|
|
|
2013-02-01 04:55:22 +08:00
|
|
|
#include "kbtree.h"
|
|
|
|
|
|
2013-02-01 05:39:24 +08:00
|
|
|
// Three-way comparison of two chains by their `pos` field: negative, zero or
// positive when a sorts before, equal to, or after b.
// Written with comparisons instead of `(a).pos - (b).pos`: a wide difference
// loses its sign (or becomes 0) once a consumer narrows it to int, as klib's
// kbtree.h does when it stores the comparison result.
// Note that each argument is evaluated twice.
#define chain_cmp(a, b) (((b).pos < (a).pos) - ((a).pos < (b).pos))
|
2013-02-08 02:13:43 +08:00
|
|
|
// instantiate the B-tree type "chn", which stores mem_chain_t entries ordered by chain_cmp
KBTREE_INIT(chn, mem_chain_t, chain_cmp)
|
2013-02-01 04:55:22 +08:00
|
|
|
|
2013-02-08 02:13:43 +08:00
|
|
|
// Try to absorb seed `p` into chain `c`.
// Returns 1 if the seed is already contained in the chain (nothing is changed)
// or if it was appended to the chain; returns 0 if the caller should start a
// new chain for it.
static int test_and_merge(const mem_opt_t *opt, mem_chain_t *c, const mem_seed_t *p)
{
	const mem_seed_t *first = &c->seeds[0];
	const mem_seed_t *last = &c->seeds[c->n-1];
	int64_t qend, rend, x, y;

	qend = last->qbeg + last->len;
	rend = last->rbeg + last->len;
	// a seed lying inside the chain's span on both query and reference adds nothing
	if (p->qbeg >= first->qbeg && p->qbeg + p->len <= qend && p->rbeg >= first->rbeg && p->rbeg + p->len <= rend)
		return 1;

	x = p->qbeg - last->qbeg; // always non-negative
	y = p->rbeg - last->rbeg;
	// the seed must follow the last seed on the reference, stay within opt->w of
	// its diagonal and be closer than opt->max_chain_gap on both sequences
	if (!(y >= 0 && x - y <= opt->w && y - x <= opt->w && x - last->len < opt->max_chain_gap && y - last->len < opt->max_chain_gap))
		return 0; // request to add a new chain

	// grow the chain, doubling the seed array when it is full
	if (c->n == c->m) {
		c->m <<= 1;
		c->seeds = realloc(c->seeds, c->m * sizeof(mem_seed_t));
	}
	c->seeds[c->n++] = *p;
	return 1;
}
|
|
|
|
|
|
2013-02-02 05:39:50 +08:00
|
|
|
// Drain the SMEM iterator and place every occurrence of every usable seed into
// the chain tree: merged into the closest chain at or before it when
// test_and_merge() accepts it, otherwise inserted as a new single-seed chain.
static void mem_insert_seed(const mem_opt_t *opt, kbtree_t(chn) *tree, smem_i *itr)
{
	const bwtintv_v *hits;
	for (;;) {
		int h;
		hits = smem_next(itr, opt->min_seed_len<<1); // to find all SMEM and some internal MEM
		if (hits == 0) break;
		for (h = 0; h < hits->n; ++h) { // go through each SMEM/MEM up to itr->start
			bwtintv_t *iv = &hits->a[h];
			int slen = (uint32_t)iv->info - (iv->info>>32); // seed length
			int64_t occ;
			if (slen < opt->min_seed_len || iv->x[2] > opt->max_occ) continue; // ignore if too short or too repetitive
			for (occ = 0; occ < iv->x[2]; ++occ) {
				mem_chain_t key, *lower, *upper;
				mem_seed_t seed;
				int merged = 0;
				seed.rbeg = key.pos = bwt_sa(itr->bwt, iv->x[0] + occ); // this is the base coordinate in the forward-reverse reference
				seed.qbeg = iv->info>>32;
				seed.len = slen;
				if (kb_size(tree)) {
					kb_intervalp(chn, tree, &key, &lower, &upper); // find the closest chain
					if (lower && test_and_merge(opt, lower, &seed)) merged = 1;
				}
				if (!merged) { // add the seed as a new chain
					key.n = 1; key.m = 4;
					key.seeds = calloc(key.m, sizeof(mem_seed_t));
					key.seeds[0] = seed;
					kb_putp(chn, tree, &key);
				}
			}
		}
	}
}
|
|
|
|
|
|
2013-02-08 05:27:11 +08:00
|
|
|
// Debug dump: one line per chain on stdout. Each line starts with the number
// of seeds, followed by one tab-separated field per seed giving its length,
// query start, raw reference start and the strand-resolved reference name and
// 1-based position.
void mem_print_chain(const bntseq_t *bns, mem_chain_v *chn)
{
	int ci, si;
	for (ci = 0; ci < chn->n; ++ci) {
		mem_chain_t *ch = &chn->a[ci];
		printf("%d", ch->n);
		for (si = 0; si < ch->n; ++si) {
			const mem_seed_t *sd = &ch->seeds[si];
			int is_rev, ref_id;
			bwtint_t pos = bns_depos(bns, sd->rbeg, &is_rev);
			if (is_rev) pos -= sd->len - 1; // move to the other end of the seed on the reverse strand
			bns_cnt_ambi(bns, pos, sd->len, &ref_id); // called for ref_id
			printf("\t%d,%d,%ld(%s:%c%ld)", sd->len, sd->qbeg, (long)sd->rbeg, bns->anns[ref_id].name, "+-"[is_rev], (long)(pos - bns->anns[ref_id].offset) + 1);
		}
		putchar('\n');
	}
}
|
|
|
|
|
|
2013-02-08 02:13:43 +08:00
|
|
|
mem_chain_v mem_chain(const mem_opt_t *opt, const bwt_t *bwt, int len, const uint8_t *seq)
|
2013-02-01 04:55:22 +08:00
|
|
|
{
|
2013-02-08 02:13:43 +08:00
|
|
|
mem_chain_v chain;
|
2013-02-01 04:55:22 +08:00
|
|
|
smem_i *itr;
|
|
|
|
|
kbtree_t(chn) *tree;
|
|
|
|
|
|
2013-02-08 02:13:43 +08:00
|
|
|
kv_init(chain);
|
2013-02-01 04:55:22 +08:00
|
|
|
if (len < opt->min_seed_len) return chain; // if the query is shorter than the seed length, no match
|
|
|
|
|
tree = kb_init(chn, KB_DEFAULT_SIZE);
|
|
|
|
|
itr = smem_itr_init(bwt);
|
2013-02-02 03:20:38 +08:00
|
|
|
smem_set_query(itr, len, seq);
|
2013-02-01 05:26:05 +08:00
|
|
|
mem_insert_seed(opt, tree, itr);
|
|
|
|
|
|
2013-02-08 02:13:43 +08:00
|
|
|
kv_resize(mem_chain_t, chain, kb_size(tree));
|
2013-02-01 05:26:05 +08:00
|
|
|
|
2013-02-08 02:13:43 +08:00
|
|
|
#define traverse_func(p_) (chain.a[chain.n++] = *(p_))
|
|
|
|
|
__kb_traverse(mem_chain_t, tree, traverse_func);
|
2013-02-01 05:26:05 +08:00
|
|
|
#undef traverse_func
|
2013-02-01 04:55:22 +08:00
|
|
|
|
|
|
|
|
smem_itr_destroy(itr);
|
|
|
|
|
kb_destroy(chn, tree);
|
|
|
|
|
return chain;
|
|
|
|
|
}
|
2013-02-02 05:39:50 +08:00
|
|
|
|
2013-02-05 05:48:11 +08:00
|
|
|
/********************
|
|
|
|
|
* Filtering chains *
|
|
|
|
|
********************/
|
|
|
|
|
|
2013-02-05 06:23:06 +08:00
|
|
|
typedef struct {
|
|
|
|
|
int beg, end, w;
|
|
|
|
|
void *p, *p2;
|
|
|
|
|
} flt_aux_t;
|
|
|
|
|
|
|
|
|
|
#define flt_lt(a, b) ((a).w > (b).w)
|
|
|
|
|
KSORT_INIT(mem_flt, flt_aux_t, flt_lt)
|
|
|
|
|
|
2013-02-08 02:13:43 +08:00
|
|
|
// Filter chains in place and return how many survive.
//
// Chains are reordered by decreasing weight (sum of seed lengths). Going down
// that order, a chain is dropped when it overlaps an already kept chain by at
// least opt->mask_level of the shorter query span and weighs less than
// opt->chain_drop_ratio times that kept chain. For every kept chain the first
// significantly overlapping chain is retained as well. Seed arrays of
// discarded chains are freed and the survivors are packed at the front.
int mem_chain_flt(const mem_opt_t *opt, int n_chn, mem_chain_t *chains)
{
	flt_aux_t *aux;
	mem_chain_t *sorted;
	int i, j, n_kept;

	if (n_chn <= 1) return n_chn; // no need to filter

	// summarize each chain: query span and weight
	aux = malloc(sizeof(flt_aux_t) * n_chn);
	for (i = 0; i < n_chn; ++i) {
		mem_chain_t *c = &chains[i];
		int weight = 0;
		for (j = 0; j < c->n; ++j) weight += c->seeds[j].len; // FIXME: take care of seed overlaps
		aux[i].beg = c->seeds[0].qbeg;
		aux[i].end = c->seeds[c->n-1].qbeg + c->seeds[c->n-1].len;
		aux[i].w = weight;
		aux[i].p = c;
		aux[i].p2 = 0;
	}
	ks_introsort(mem_flt, n_chn, aux);

	// reorder chains such that the best chain appears first
	sorted = malloc(sizeof(mem_chain_t) * n_chn);
	for (i = 0; i < n_chn; ++i) {
		sorted[i] = *((mem_chain_t*)aux[i].p);
		aux[i].p = &chains[i]; // chains[] is overwritten below, so point at the new slot
	}
	memcpy(chains, sorted, sizeof(mem_chain_t) * n_chn);
	free(sorted);

	// aux[0..n_kept) holds the chains kept so far
	for (i = 1, n_kept = 1; i < n_chn; ++i) {
		for (j = 0; j < n_kept; ++j) {
			int b_max = aux[j].beg > aux[i].beg? aux[j].beg : aux[i].beg;
			int e_min = aux[j].end < aux[i].end? aux[j].end : aux[i].end;
			int len_i, len_j, min_l;
			if (e_min <= b_max) continue; // no overlap
			len_i = aux[i].end - aux[i].beg;
			len_j = aux[j].end - aux[j].beg;
			min_l = len_i < len_j? len_i : len_j;
			if (!(e_min - b_max >= min_l * opt->mask_level)) continue; // overlap not significant
			if (aux[j].p2 == 0) aux[j].p2 = aux[i].p;
			if (aux[i].w < aux[j].w * opt->chain_drop_ratio)
				break;
		}
		if (j == n_kept) aux[n_kept++] = aux[i]; // not dropped by any better chain; keep it
	}

	// mark chains to be kept by temporarily negating their seed count
	for (i = 0; i < n_kept; ++i) {
		mem_chain_t *c = (mem_chain_t*)aux[i].p;
		if (c->n > 0) c->n = -c->n;
		c = (mem_chain_t*)aux[i].p2;
		if (c && c->n > 0) c->n = -c->n;
	}
	free(aux);

	// free discarded chains and restore the count of the marked ones
	for (i = 0; i < n_chn; ++i) {
		mem_chain_t *c = &chains[i];
		if (c->n < 0) {
			c->n = -c->n;
			continue;
		}
		free(c->seeds);
		c->n = c->m = 0;
	}

	// squeeze out discarded chains
	for (i = n_kept = 0; i < n_chn; ++i) {
		if (chains[i].n <= 0) continue;
		if (n_kept != i) chains[n_kept] = chains[i];
		++n_kept;
	}
	return n_kept;
}
|
|
|
|
|
|
2013-02-07 03:38:40 +08:00
|
|
|
#define alnreg_lt(a, b) ((a).score > (b).score)
|
|
|
|
|
KSORT_INIT(mem_ar, mem_alnreg_t, alnreg_lt)
|
|
|
|
|
|
|
|
|
|
// Pick non-redundant alignment regions; similar to the loop in mem_chain_flt().
// Regions are sorted by decreasing score. A region overlapping an already kept
// one by at least opt->mask_level of the shorter query span is dropped, and
// its score becomes the kept region's `sub` if none was recorded yet.
// Survivors are packed at the front of `a`; their count is returned.
int mem_choose_alnreg_se(const mem_opt_t *opt, int n, mem_alnreg_t *a)
{
	int i, j, m;

	if (n <= 1) return n;
	ks_introsort(mem_ar, n, a);
	for (i = 0; i < n; ++i) a[i].sub = 0;

	m = 1;
	for (i = 1; i < n; ++i) {
		int redundant = 0;
		for (j = 0; j < m && !redundant; ++j) {
			int b_max = a[j].qb > a[i].qb? a[j].qb : a[i].qb;
			int e_min = a[j].qe < a[i].qe? a[j].qe : a[i].qe;
			int len_i, len_j, min_l;
			if (e_min <= b_max) continue; // no overlap
			len_i = a[i].qe - a[i].qb;
			len_j = a[j].qe - a[j].qb;
			min_l = len_i < len_j? len_i : len_j;
			if (e_min - b_max >= min_l * opt->mask_level) { // significant overlap
				if (a[j].sub == 0) a[j].sub = a[i].score;
				redundant = 1;
			}
		}
		if (!redundant) a[m++] = a[i];
	}
	return m;
}
|
|
|
|
|
|
2013-02-05 05:48:11 +08:00
|
|
|
/****************************************
|
|
|
|
|
* Construct the alignment from a chain *
|
|
|
|
|
****************************************/
|
|
|
|
|
|
2013-02-05 01:37:38 +08:00
|
|
|
static inline int cal_max_gap(const mem_opt_t *opt, int qlen)
|
|
|
|
|
{
|
|
|
|
|
int l = (int)((double)(qlen * opt->a - opt->q) / opt->r + 1.);
|
|
|
|
|
return l > 1? l : 1;
|
|
|
|
|
}
|
|
|
|
|
|
2013-02-08 02:13:43 +08:00
|
|
|
// Turn a chain into one alignment region by extending seeds with ksw_extend().
//
// opt      scoring parameters (a, q, r, w, mat)
// l_pac    length of the forward reference; coordinates run over [0, 2*l_pac)
// pac      packed reference handed to bns_get_seq()
// l_query  query length
// query    query bases
// c        chain to extend
// a        output region; always written (all zero for an empty chain)
//
// Starting at the first seed, the seed is extended to the left and to the
// right. Seeds that fall inside the extended region are skipped and the next
// uncovered seed is extended in turn; the highest scoring region is returned.
//
// FIXME: in general, we SHOULD check funny seed patterns such as contained
// seeds. When that happens, we should use a SW or extend more seeds
void mem_chain2aln(const mem_opt_t *opt, int64_t l_pac, const uint8_t *pac, int l_query, const uint8_t *query, const mem_chain_t *c, mem_alnreg_t *a)
{
	int i, k;
	int64_t rlen, rmax[2], tmp;
	const mem_seed_t *s;
	uint8_t *rseq = 0;
	mem_alnreg_t best;

	memset(&best, 0, sizeof(mem_alnreg_t));
	memset(a, 0, sizeof(mem_alnreg_t)); // the caller gets a defined result even when the chain is empty
	if (c->n <= 0) return;

	// get the max possible span
	rmax[0] = l_pac<<1; rmax[1] = 0;
	for (i = 0; i < c->n; ++i) {
		int64_t b, e;
		const mem_seed_t *t = &c->seeds[i];
		b = t->rbeg - (t->qbeg + cal_max_gap(opt, t->qbeg));
		e = t->rbeg + t->len + ((l_query - t->qbeg - t->len) + cal_max_gap(opt, l_query - t->qbeg - t->len));
		rmax[0] = rmax[0] < b? rmax[0] : b;
		rmax[1] = rmax[1] > e? rmax[1] : e;
	}
	// Keep the window inside the reference. Every offset into rseq below is
	// computed from rmax[], so rmax[] has to describe the window really fetched.
	if (rmax[0] < 0) rmax[0] = 0;
	if (rmax[1] > l_pac<<1) rmax[1] = l_pac<<1;
	// retrieve the reference sequence
	// NOTE(review): a window bridging the forward/reverse boundary at l_pac is not handled here - confirm what bns_get_seq() returns for it
	rseq = bns_get_seq(l_pac, pac, rmax[0], rmax[1], &rlen);

	for (k = 0; k < c->n;) {
		s = &c->seeds[k];
		memset(a, 0, sizeof(mem_alnreg_t));
		if (s->qbeg) { // left extension: both flanks are reversed so the extension runs away from the seed
			uint8_t *rs, *qs;
			int qle, tle;
			qs = malloc(s->qbeg);
			for (i = 0; i < s->qbeg; ++i) qs[i] = query[s->qbeg - 1 - i];
			tmp = s->rbeg - rmax[0];
			rs = malloc(tmp);
			for (i = 0; i < tmp; ++i) rs[i] = rseq[tmp - 1 - i];
			// s->len * opt->a (the score of the exact seed match) is passed as the starting score
			a->score = ksw_extend(s->qbeg, qs, tmp, rs, 5, opt->mat, opt->q, opt->r, opt->w, s->len * opt->a, &qle, &tle);
			a->qb = s->qbeg - qle; a->rb = s->rbeg - tle;
			free(qs); free(rs);
		} else a->score = s->len * opt->a, a->qb = 0, a->rb = s->rbeg;

		if (s->qbeg + s->len != l_query) { // right extension, continuing from the score reached so far
			int qle, tle, qe, re;
			qe = s->qbeg + s->len;
			re = s->rbeg + s->len - rmax[0];
			a->score = ksw_extend(l_query - qe, query + qe, rmax[1] - rmax[0] - re, rseq + re, 5, opt->mat, opt->q, opt->r, opt->w, a->score, &qle, &tle);
			a->qe = qe + qle; a->re = rmax[0] + re + tle;
		} else a->qe = l_query, a->re = s->rbeg + s->len;
		if (mem_debug >= 2) printf("[%d] score=%d\t[%d,%d) <=> [%ld,%ld)\n", k, a->score, a->qb, a->qe, (long)a->rb, (long)a->re);

		// check how many seeds have been covered
		for (i = k + 1; i < c->n; ++i) {
			const mem_seed_t *t = &c->seeds[i];
			if (t->rbeg + t->len > a->re || t->qbeg + t->len > a->qe)
				break;
		}
		if (i >= c->n) break; // all seeds are included; no need to proceed
		if (a->score > best.score) best = *a;
		k = i; // restart from the first seed not covered by this extension
	}
	if (a->score < best.score) *a = best;
	free(rseq);
}
|
2013-02-06 10:49:19 +08:00
|
|
|
|
|
|
|
|
uint32_t *mem_gen_cigar(const mem_opt_t *opt, int64_t l_pac, const uint8_t *pac, int l_query, uint8_t *query, int64_t rb, int64_t re, int *score, int *n_cigar)
|
|
|
|
|
{
|
|
|
|
|
uint32_t *cigar = 0;
|
|
|
|
|
uint8_t tmp, *rseq;
|
|
|
|
|
int i, w;
|
|
|
|
|
int64_t rlen;
|
|
|
|
|
*n_cigar = 0;
|
|
|
|
|
if (l_query <= 0 || rb >= re || (rb < l_pac && re > l_pac)) return 0; // reject if negative length or bridging the forward and reverse strand
|
|
|
|
|
rseq = bns_get_seq(l_pac, pac, rb, re, &rlen);
|
|
|
|
|
if (re - rb != rlen) goto ret_gen_cigar; // possible if out of range
|
|
|
|
|
if (rb >= l_pac) { // then reverse both query and rseq; this is to ensure indels to be placed at the leftmost position
|
|
|
|
|
for (i = 0; i < l_query>>1; ++i)
|
|
|
|
|
tmp = query[i], query[i] = query[l_query - 1 - i], query[l_query - 1 - i] = tmp;
|
|
|
|
|
for (i = 0; i < rlen>>1; ++i)
|
2013-02-08 04:52:36 +08:00
|
|
|
tmp = rseq[i], rseq[i] = rseq[rlen - 1 - i], rseq[rlen - 1 - i] = tmp;
|
2013-02-06 10:49:19 +08:00
|
|
|
}
|
2013-02-08 04:52:36 +08:00
|
|
|
//printf("[Q] "); for (i = 0; i < l_query; ++i) putchar("ACGTN"[(int)query[i]]); putchar('\n');
|
|
|
|
|
//printf("[R] "); for (i = 0; i < re - rb; ++i) putchar("ACGTN"[(int)rseq[i]]); putchar('\n');
|
2013-02-06 10:49:19 +08:00
|
|
|
// set the band-width
|
|
|
|
|
w = (int)((double)(l_query * opt->a - opt->q) / opt->r + 1.);
|
|
|
|
|
w = w < 1? w : 1;
|
|
|
|
|
w = w < opt->w? w : opt->w;
|
|
|
|
|
w += abs(rlen - l_query);
|
|
|
|
|
// NW alignment
|
|
|
|
|
*score = ksw_global(l_query, query, rlen, rseq, 5, opt->mat, opt->q, opt->r, w, n_cigar, &cigar);
|
|
|
|
|
if (rb >= l_pac) // reverse back query
|
|
|
|
|
for (i = 0; i < l_query>>1; ++i)
|
|
|
|
|
tmp = query[i], query[i] = query[l_query - 1 - i], query[l_query - 1 - i] = tmp;
|
|
|
|
|
|
|
|
|
|
ret_gen_cigar:
|
|
|
|
|
free(rseq);
|
|
|
|
|
return cigar;
|
|
|
|
|
}
|
2013-02-07 03:38:40 +08:00
|
|
|
|
2013-02-08 03:36:18 +08:00
|
|
|
/************************
|
|
|
|
|
* Integrated interface *
|
|
|
|
|
************************/
|
|
|
|
|
|
|
|
|
|
// Format the single-end alignments of read `s` as SAM text.
//
// opt, bns, pac  options and reference
// s              the read; s->seq holds base codes 0..4; on return s->sam
//                points to the generated text (the caller frees it)
// a              candidate regions; reordered and filtered in place by
//                mem_choose_alnreg_se()
//
// One line is written per selected region. If no region is available, a single
// unmapped record is written instead.
void mem_sam_se(const mem_opt_t *opt, const bntseq_t *bns, const uint8_t *pac, bseq1_t *s, mem_alnreg_v *a)
{
	int i, k, m;
	kstring_t str;
	char *seq;

	str.l = str.m = 0; str.s = 0;
	m = mem_choose_alnreg_se(opt, a->n, a->a);
	seq = malloc(s->l_seq);
	if (m == 0) { // no seeds found
		for (i = 0; i < s->l_seq; ++i) seq[i] = "ACGTN"[(int)s->seq[i]];
		// FLAG 4 = segment unmapped (8 would mean "mate unmapped")
		kputs(s->name, &str); kputs("\t4\t*\t0\t0\t*\t*\t0\t0\t", &str);
		kputsn(seq, s->l_seq, &str); kputc('\t', &str); // SEQ and QUAL are separate columns
		if (s->qual) kputsn(s->qual, s->l_seq, &str);
		else kputc('*', &str);
		kputc('\n', &str);
		goto ret_sam_se;
	}
	for (k = 0; k < m; ++k) {
		uint32_t *cigar = 0;
		int score = 0, is_rev, rid, flag = 0, n_cigar = 0, mapq = 0;
		int64_t pos;
		mem_alnreg_t *p = &a->a[k];
		cigar = mem_gen_cigar(opt, bns->l_pac, pac, p->qe - p->qb, (uint8_t*)&s->seq[p->qb], p->rb, p->re, &score, &n_cigar);
		// for a reverse-strand hit the last aligned base is the leftmost one on the forward strand
		pos = bns_depos(bns, p->rb < bns->l_pac? p->rb : p->re - 1, &is_rev);
		bns_cnt_ambi(bns, pos, p->re - p->rb, &rid); // called for rid
		flag |= is_rev? 16 : 0;
		if (n_cigar == 0) flag |= 4; // no alignment could be generated: report as unmapped
		kputs(s->name, &str); kputc('\t', &str); kputw(flag, &str); kputc('\t', &str);
		kputs(bns->anns[rid].name, &str); kputc('\t', &str); kputuw(pos - bns->anns[rid].offset + 1, &str); kputc('\t', &str);
		{ // approximate mapQ
			int sub = p->sub? p->sub : opt->min_seed_len * opt->a;
			double identity;
			mapq = p->score? (int)(MAPQ_COEF * (1. - (float)sub / p->score) * log(p->score / opt->a) + .499) : 0;
			identity = (double)p->score / opt->a / (p->qe - p->qb);
			mapq = identity < 0.95? (int)(mapq * identity * identity + .499) : mapq;
			if (mapq > 60) mapq = 60;
		}
		kputw(mapq, &str); kputc('\t', &str);
		if (n_cigar) {
			int clip5, clip3;
			// unaligned read ends become soft clips; they swap sides on the reverse strand
			clip5 = is_rev? s->l_seq - p->qe : p->qb;
			clip3 = is_rev? p->qb : s->l_seq - p->qe;
			if (clip5) { kputw(clip5, &str); kputc('S', &str); }
			for (i = 0; i < n_cigar; ++i) {
				kputw(cigar[i]>>4, &str); kputc("MIDSH"[cigar[i]&0xf], &str);
			}
			if (clip3) { kputw(clip3, &str); kputc('S', &str); }
		} else kputc('*', &str);
		kputsn("\t*\t0\t0\t", 7, &str);
		// SAM stores SEQ/QUAL in reference orientation: a reverse-strand read is
		// reverse-complemented and its qualities are reversed
		if (is_rev) for (i = 0; i < s->l_seq; ++i) seq[s->l_seq - 1 - i] = "TGCAN"[(int)s->seq[i]];
		else for (i = 0; i < s->l_seq; ++i) seq[i] = "ACGTN"[(int)s->seq[i]];
		kputsn(seq, s->l_seq, &str); kputc('\t', &str);
		if (s->qual) {
			if (is_rev) for (i = s->l_seq - 1; i >= 0; --i) kputc(s->qual[i], &str);
			else kputsn(s->qual, s->l_seq, &str);
		} else kputc('*', &str);
		kputsn("\tAS:i:", 6, &str); kputw(p->score, &str);
		kputsn("\tss:i:", 6, &str); kputw(p->sub, &str);
		kputsn("\tnw:i:", 6, &str); kputw(score, &str);
		kputc('\n', &str);
		free(cigar);
	}

ret_sam_se:
	free(seq);
	s->sam = str.s;
}
|
|
|
|
|
|
|
|
|
|
// Compute the candidate alignment regions of one read.
// s->seq is converted in place through nst_nt4_table, then the read is seeded
// and chained, the chains are filtered, and each surviving chain is extended
// into one region. The caller owns the returned array (regs.a).
static mem_alnreg_v find_alnreg(const mem_opt_t *opt, const bwt_t *bwt, const bntseq_t *bns, const uint8_t *pac, bseq1_t *s)
{
	int i;
	mem_chain_v chn;
	mem_alnreg_v regs;
	for (i = 0; i < s->l_seq; ++i)
		s->seq[i] = nst_nt4_table[(uint8_t)s->seq[i]]; // index as unsigned: plain char may be negative
	chn = mem_chain(opt, bwt, s->l_seq, (uint8_t*)s->seq);
	chn.n = mem_chain_flt(opt, chn.n, chn.a);
	if (mem_debug >= 1) mem_print_chain(bns, &chn);
	regs.n = regs.m = chn.n;
	regs.a = malloc(regs.n * sizeof(mem_alnreg_t));
	for (i = 0; i < chn.n; ++i) {
		mem_chain2aln(opt, bns->l_pac, pac, s->l_seq, (uint8_t*)s->seq, &chn.a[i], &regs.a[i]);
		free(chn.a[i].seeds); // the chain is no longer needed once it has been extended
	}
	free(chn.a);
	return regs;
}
|
|
|
|
|
|
2013-02-08 02:29:01 +08:00
|
|
|
typedef struct {
|
|
|
|
|
int start, step, n;
|
|
|
|
|
const mem_opt_t *opt;
|
|
|
|
|
const bwt_t *bwt;
|
|
|
|
|
const bntseq_t *bns;
|
|
|
|
|
const uint8_t *pac;
|
|
|
|
|
bseq1_t *seqs;
|
2013-02-08 03:36:18 +08:00
|
|
|
mem_alnreg_v *regs;
|
|
|
|
|
} worker_t;
|
2013-02-08 02:29:01 +08:00
|
|
|
|
|
|
|
|
static void *worker1(void *data)
|
|
|
|
|
{
|
2013-02-08 03:36:18 +08:00
|
|
|
worker_t *w = (worker_t*)data;
|
2013-02-08 02:29:01 +08:00
|
|
|
int i;
|
|
|
|
|
for (i = w->start; i < w->n; i += w->step)
|
2013-02-08 03:36:18 +08:00
|
|
|
w->regs[i] = find_alnreg(w->opt, w->bwt, w->bns, w->pac, &w->seqs[i]);
|
|
|
|
|
return 0;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
static void *worker2(void *data)
|
|
|
|
|
{
|
|
|
|
|
worker_t *w = (worker_t*)data;
|
|
|
|
|
int i;
|
|
|
|
|
if (!w->opt->is_pe) {
|
|
|
|
|
for (i = 0; i < w->n; i += w->step) {
|
|
|
|
|
mem_sam_se(w->opt, w->bns, w->pac, &w->seqs[i], &w->regs[i]);
|
|
|
|
|
free(w->regs[i].a);
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
for (i = 0; i < w->n>>1; i += w->step) { // not implemented yet
|
|
|
|
|
free(w->regs[i<<1|0].a); free(w->regs[i<<1|1].a);
|
|
|
|
|
}
|
|
|
|
|
}
|
2013-02-08 02:29:01 +08:00
|
|
|
return 0;
|
|
|
|
|
}
|
|
|
|
|
|
2013-02-08 02:13:43 +08:00
|
|
|
// Align a batch of `n` reads, print their SAM records to stdout in input
// order and free the reads' buffers (name, comment, seq, qual, sam).
// Work is split across opt->n_threads workers in two stages (worker1, then
// worker2). A thread count below 1 is treated as 1, and a build without
// HAVE_PTHREAD always uses a single worker that covers every read.
// Always returns 0.
int mem_process_seqs(const mem_opt_t *opt, const bwt_t *bwt, const bntseq_t *bns, const uint8_t *pac, int n, bseq1_t *seqs)
{
	int i, n_threads;
	worker_t *w;
	mem_alnreg_v *regs;

	n_threads = opt->n_threads > 1? opt->n_threads : 1;
#ifndef HAVE_PTHREAD
	n_threads = 1; // no threads available: one worker with stride 1 handles all reads
#endif
	w = calloc(n_threads, sizeof(worker_t));
	regs = malloc(n * sizeof(mem_alnreg_v));
	for (i = 0; i < n_threads; ++i) {
		worker_t *p = &w[i];
		p->start = i; p->step = n_threads; p->n = n;
		p->opt = opt; p->bwt = bwt; p->bns = bns; p->pac = pac;
		p->seqs = seqs; p->regs = regs;
	}
#ifdef HAVE_PTHREAD
	if (n_threads == 1) {
		worker1(w); worker2(w);
	} else {
		pthread_t *tid;
		tid = (pthread_t*)calloc(n_threads, sizeof(pthread_t));
		// stage 1 must finish for all reads before stage 2 starts
		for (i = 0; i < n_threads; ++i) pthread_create(&tid[i], 0, worker1, &w[i]);
		for (i = 0; i < n_threads; ++i) pthread_join(tid[i], 0);
		for (i = 0; i < n_threads; ++i) pthread_create(&tid[i], 0, worker2, &w[i]);
		for (i = 0; i < n_threads; ++i) pthread_join(tid[i], 0);
		free(tid);
	}
#else
	worker1(w); worker2(w);
#endif
	for (i = 0; i < n; ++i) {
		fputs(seqs[i].sam, stdout);
		free(seqs[i].name); free(seqs[i].comment); free(seqs[i].seq); free(seqs[i].qual); free(seqs[i].sam);
	}
	free(regs); free(w);
	return 0;
}
|