in spotify_confidence/analysis/frequentist/confidence_computers/sample_size_computer.py [0:0]
def _sufficient_statistics(self) -> DataFrame:
    """Return the sufficient-statistics frame, building it on first access.

    The result is cached in ``self._sufficient``; later calls return the
    cached object without recomputing it.

    On the first call ``self._df`` is grouped by ``self._metric_column``
    (group order preserved, group keys kept). Within each group four
    columns are added:

    * ``POINT_ESTIMATE`` and ``ORIGINAL_POINT_ESTIMATE`` are copies of
      ``self._point_estimate_column``.
    * ``VARIANCE`` and ``ORIGINAL_VARIANCE`` are copies of
      ``self._var_column``.

    The combined frame is then passed through ``reset_named_indices``.
    NOTE(review): presumably that helper moves the named group-key index
    levels back into columns; confirm against its definition.

    Returns:
        The cached frame including the derived columns.
    """
    if self._sufficient is not None:
        return self._sufficient

    def _add_statistics(group: DataFrame) -> DataFrame:
        # (derived column, source column) pairs, in the order they are added.
        derived_columns = (
            (POINT_ESTIMATE, self._point_estimate_column),
            (ORIGINAL_POINT_ESTIMATE, self._point_estimate_column),
            (VARIANCE, self._var_column),
            (ORIGINAL_VARIANCE, self._var_column),
        )
        # Each assign returns a new frame, so the group handed in by
        # groupby is never modified in place. Columns are added one at a
        # time so every source lookup sees the columns added before it.
        for target, source in derived_columns:
            group = group.assign(**{target: group[source]})
        return group

    grouped = self._df.groupby([self._metric_column], sort=False, group_keys=True)
    self._sufficient = reset_named_indices(grouped.apply(_add_statistics))
    return self._sufficient