Skip to content

Commit a86816f

Browse files
authored
Fixed how overlapping genes are identified during training (#15)
1 parent f84dda5 commit a86816f

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

gecco/cli/commands/_mixins.py

+2-2
Original file line numberDiff line numberDiff line change
@@ -460,7 +460,7 @@ def _label_genes(self, genes: List["Gene"], clusters: "ClusterTable") -> List["G
460460
for seq_id, seq_genes in itertools.groupby(genes, key=operator.attrgetter("source.id")):
461461
for gene in seq_genes:
462462
if any(
463-
cluster_start <= gene.start and gene.end <= cluster_end
463+
cluster_start <= gene.end and gene.start <= cluster_end
464464
for (cluster_start, cluster_end) in cluster_by_seq[seq_id]
465465
):
466466
gene = gene.with_probability(1)
@@ -496,7 +496,7 @@ def _extract_clusters(self, genes: List["Gene"], clusters: "ClusterTable") -> Li
496496
for seq_id, seq_genes in itertools.groupby(genes, key=operator.attrgetter("source.id")):
497497
for gene in seq_genes:
498498
for cluster_start, cluster_end, cluster_id in cluster_by_seq[seq_id]:
499-
if cluster_start <= gene.start and gene.end <= cluster_end:
499+
if cluster_start <= gene.end and gene.start <= cluster_end:
500500
genes_by_cluster[cluster_id].append(gene)
501501

502502
return [

0 commit comments

Comments
 (0)