# Added to malariagen_data/anoph/sample_metadata.py, directly after count_samples().
def sample_metadata_summary(self) -> dict:
    """Summarise the sample metadata as a small dictionary.

    The summary is computed from the data frame returned by
    ``self.sample_metadata()`` called with no arguments.

    Returns
    -------
    dict
        A dictionary with three keys:

        ``"total_samples"``
            Number of rows in the sample metadata data frame.
        ``"countries"``
            Sorted list of the distinct non-missing values found in the
            ``country`` column.
        ``"species_distribution"``
            Mapping from each value of the ``taxon`` column to the number
            of rows carrying it.

    Notes
    -----
    Rows with a missing ``taxon`` are not counted in
    ``"species_distribution"``, so its values may sum to less than
    ``"total_samples"``.

    """
    df = self.sample_metadata()

    return {
        "total_samples": len(df),
        # Missing countries are dropped first so that sorting only ever
        # compares real values.
        "countries": sorted(df["country"].dropna().unique().tolist()),
        # value_counts() leaves out missing values by default.
        "species_distribution": df["taxon"].value_counts().to_dict(),
    }