Skip to content

Commit 486f636

Browse files
committed
Merge branch 'hotfix-pandas-na' into dev
2 parents: 695c09c + f7f99ea; commit: 486f636

File tree

2 files changed

+9 -1 lines changed

2 files changed

+9 -1 lines changed

autometa/binning/recursive_dbscan.py

+5 -1
Original file line number | Diff line number | Diff line change
@@ -186,7 +186,11 @@ def recursive_dbscan(
186 186
coverage_stddev_cutoff=coverage_stddev_cutoff,
187 187
gc_content_stddev_cutoff=gc_content_stddev_cutoff,
188 188
)
189-
median_completeness = filtered_df.completeness.median()
189+
if filtered_df.empty:
190+
median_completeness = float("-inf")
191+
else:
192+
median_completeness = filtered_df.completeness.median()
193+
190 194
if median_completeness >= best_median:
191 195
best_median = median_completeness
192 196
best_df = df

autometa/binning/utilities.py

+4
Original file line number | Diff line number | Diff line change
@@ -31,6 +31,8 @@
31 31

32 32
import pandas as pd
33 33

34+
import numpy as np
35+
34 36
from typing import Iterable, Tuple
35 37

36 38
from autometa.taxonomy.database import TaxonomyDatabase
@@ -183,7 +185,9 @@ def add_metrics(
183 185
# redundant_marker_count = cluster_marker_counts.gt(1).sum(axis=1)
184 186
# calculate completeness and purity and std. dev. metrics
185 187
completeness = present_marker_count / reference_markers_count * 100
188+
completeness = completeness.where(~np.isnan(completeness),pd.NA)
186 189
purity = single_copy_marker_count / present_marker_count * 100
190+
purity = purity.where(~np.isnan(purity), pd.NA)
187 191
coverage_stddev = main_grouped_by_cluster.coverage.std()
188 192
gc_content_stddev = main_grouped_by_cluster.gc_content.std()
189 193
# merge metrics with given dataframe

0 commit comments

Comments
 (0)