Skip to content

Commit f838175

Browse files
lh3gemini-cli
andcommitted
r1299: fix wrong subchain selection
This and the last bug were both reported by Jeremy Wang. Co-authored-by: gemini-cli <gemini-cli@users.noreply.github.com>
1 parent 80d92c6 commit f838175

3 files changed

Lines changed: 27 additions & 11 deletions

File tree

hit.c

Lines changed: 19 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -256,19 +256,25 @@ void mm_select_sub(void *km, float pri_ratio, int min_diff, int best_n, int chec
256256
{
257257
if (pri_ratio > 0.0f && *n_ > 0) {
258258
int i, k, n = *n_, n_2nd = 0;
259-
for (i = k = 0; i < n; ++i) {
259+
uint8_t *keep = (uint8_t*)kmalloc(km, n);
260+
for (i = 0; i < n; ++i) {
260261
int p = r[i].parent;
262+
keep[i] = 0;
261263
if (p == i || r[i].inv) { // primary or inversion
262-
r[k++] = r[i];
264+
keep[i] = 1;
263265
} else if ((r[i].score >= r[p].score * pri_ratio || r[i].score + min_diff >= r[p].score) && n_2nd < best_n) {
264266
if (!(r[i].qs == r[p].qs && r[i].qe == r[p].qe && r[i].rid == r[p].rid && r[i].rs == r[p].rs && r[i].re == r[p].re)) // not identical hits
265-
r[k++] = r[i], ++n_2nd;
266-
else if (r[i].p) free(r[i].p);
267+
keep[i] = 1, ++n_2nd;
267268
} else if (check_strand && n_2nd < best_n && r[i].score > min_strand_sc && r[i].rev != r[p].rev) {
268269
r[i].strand_retained = 1;
269-
r[k++] = r[i], ++n_2nd;
270-
} else if (r[i].p) free(r[i].p);
270+
keep[i] = 1, ++n_2nd;
271+
}
272+
}
273+
for (i = k = 0; i < n; ++i) {
274+
if (keep[i]) r[k++] = r[i];
275+
else if (r[i].p) free(r[i].p);
271276
}
277+
kfree(km, keep);
272278
if (k != n) mm_sync_regs(km, k, r); // removing hits requires sync()
273279
*n_ = k;
274280
}
@@ -277,13 +283,18 @@ void mm_select_sub(void *km, float pri_ratio, int min_diff, int best_n, int chec
277283
int mm_filter_strand_retained(int n_regs, mm_reg1_t *r)
278284
{
279285
int i, k;
280-
for (i = k = 0; i < n_regs; ++i) {
286+
uint8_t *keep = (uint8_t*)malloc(n_regs);
287+
for (i = 0; i < n_regs; ++i) {
281288
int p = r[i].parent;
282-
if (!r[i].strand_retained || r[i].div < r[p].div * 5.0f || r[i].div < 0.01f) {
289+
keep[i] = (!r[i].strand_retained || r[i].div < r[p].div * 5.0f || r[i].div < 0.01f);
290+
}
291+
for (i = k = 0; i < n_regs; ++i) {
292+
if (keep[i]) {
283293
if (k < i) r[k++] = r[i];
284294
else ++k;
285295
}
286296
}
297+
free(keep);
287298
return k;
288299
}
289300

minimap.h

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,7 @@
55
#include <stdio.h>
66
#include <sys/types.h>
77

8-
#define MM_VERSION "2.30-r1298-dirty"
8+
#define MM_VERSION "2.30-r1299-dirty"
99

1010
#define MM_F_NO_DIAG (0x001LL) // no exact diagonal hit
1111
#define MM_F_NO_DUAL (0x002LL) // skip pairs where query name is lexicographically larger than target name

pe.c

Lines changed: 7 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -8,7 +8,8 @@ void mm_select_sub_multi(void *km, float pri_ratio, float pri1, float pri2, int
88
if (pri_ratio > 0.0f && *n_ > 0) {
99
int i, k, n = *n_, n_2nd = 0;
1010
int max_dist = n_segs == 2? qlens[0] + qlens[1] + max_gap_ref : 0;
11-
for (i = k = 0; i < n; ++i) {
11+
uint8_t *keep = (uint8_t*)kmalloc(km, n);
12+
for (i = 0; i < n; ++i) {
1213
int to_keep = 0;
1314
if (r[i].parent == i) { // primary
1415
to_keep = 1;
@@ -34,9 +35,13 @@ void mm_select_sub_multi(void *km, float pri_ratio, float pri1, float pri2, int
3435
if (to_keep && r[i].parent != i) {
3536
if (n_2nd++ >= best_n) to_keep = 0; // don't keep if there are too many secondary hits
3637
}
37-
if (to_keep) r[k++] = r[i];
38+
keep[i] = to_keep;
39+
}
40+
for (i = k = 0; i < n; ++i) {
41+
if (keep[i]) r[k++] = r[i];
3842
else if (r[i].p) free(r[i].p);
3943
}
44+
kfree(km, keep);
4045
if (k != n) mm_sync_regs(km, k, r); // removing hits requires sync()
4146
*n_ = k;
4247
}

0 commit comments

Comments
 (0)