Skip to content

Commit 24c2fe6

Browse files
committed
WIP: make taxon_by optional in ...frequencies_advanced funcs. Fix bug in groupby.
1 parent f347969 commit 24c2fe6

4 files changed

Lines changed: 6 additions & 8 deletions

File tree

malariagen_data/anoph/cnv_frq.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -445,7 +445,7 @@ def gene_cnv_frequencies_advanced(
445445
ci_method: Optional[frq_params.ci_method] = frq_params.ci_method_default,
446446
chunks: base_params.chunks = base_params.native_chunks,
447447
inline_array: base_params.inline_array = base_params.inline_array_default,
448-
taxon_by: frq_params.taxon_by = frq_params.taxon_by_default,
448+
taxon_by: Optional[frq_params.taxon_by] = frq_params.taxon_by_default,
449449
) -> xr.Dataset:
450450
regions: List[Region] = parse_multi_region(self, region)
451451
del region
@@ -530,7 +530,7 @@ def _gene_cnv_frequencies_advanced(
530530
)
531531

532532
debug("group samples to make cohorts")
533-
group_samples_by_cohort = df_samples.groupby(["taxon", "area", "period"])
533+
group_samples_by_cohort = df_samples.groupby([taxon_by, "area", "period"])
534534

535535
debug("build cohorts dataframe")
536536
df_cohorts = build_cohorts_from_sample_grouping(

malariagen_data/anoph/frq_base.py

Lines changed: 1 addition & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -14,9 +14,7 @@
1414
from .base import AnophelesBase
1515

1616

17-
def prep_samples_for_cohort_grouping(
18-
*, df_samples, area_by, period_by, taxon_by="taxon"
19-
):
17+
def prep_samples_for_cohort_grouping(*, df_samples, area_by, period_by, taxon_by):
2018
# Take a copy, as we will modify the dataframe.
2119
df_samples = df_samples.copy()
2220

malariagen_data/anoph/hap_frq.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -153,7 +153,7 @@ def haplotypes_frequencies_advanced(
153153
ci_method: Optional[frq_params.ci_method] = frq_params.ci_method_default,
154154
chunks: base_params.chunks = base_params.native_chunks,
155155
inline_array: base_params.inline_array = base_params.inline_array_default,
156-
taxon_by: frq_params.taxon_by = frq_params.taxon_by_default,
156+
taxon_by: Optional[frq_params.taxon_by] = frq_params.taxon_by_default,
157157
) -> xr.Dataset:
158158
# Load sample metadata.
159159
df_samples = self.sample_metadata(
@@ -171,7 +171,7 @@ def haplotypes_frequencies_advanced(
171171
)
172172

173173
# Group samples to make cohorts.
174-
group_samples_by_cohort = df_samples.groupby(["taxon_by", "area", "period"])
174+
group_samples_by_cohort = df_samples.groupby([taxon_by, "area", "period"])
175175

176176
# Build cohorts dataframe.
177177
df_cohorts = build_cohorts_from_sample_grouping(

malariagen_data/anoph/snp_frq.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -451,7 +451,7 @@ def snp_allele_frequencies_advanced(
451451
ci_method: Optional[frq_params.ci_method] = frq_params.ci_method_default,
452452
chunks: base_params.chunks = base_params.native_chunks,
453453
inline_array: base_params.inline_array = base_params.inline_array_default,
454-
taxon_by: frq_params.taxon_by = frq_params.taxon_by_default,
454+
taxon_by: Optional[frq_params.taxon_by] = frq_params.taxon_by_default,
455455
) -> xr.Dataset:
456456
# Load sample metadata.
457457
df_samples = self.sample_metadata(

0 commit comments

Comments
 (0)