diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml deleted file mode 100644 index 29e9a186d..000000000 --- a/.github/workflows/ci.yml +++ /dev/null @@ -1,70 +0,0 @@ -name: unit-tests - -on: - workflow_dispatch: - push: - branches: - - main - - dev - pull_request: - branches: - - main - - dev - - breaking-improvments - -jobs: - unit-tests: - runs-on: ubuntu-20.04 - container: - image: hopkinsidd/flepimop:latest-dev - options: --user root - steps: - - name: Checkout - uses: actions/checkout@v3 - with: - lfs: true - - name: Set up Rprofile - run: | - cp build/docker/Docker.Rprofile $HOME/.Rprofile - cp /home/app/.bashrc $HOME/.bashrc - shell: bash - - name: Install the gempyor package - run: | - source /var/python/3.10/virtualenv/bin/activate - python -m pip install --upgrade pip - python -m pip install "flepimop/gempyor_pkg[test]" - shell: bash - - name: Install local R packages - run: Rscript build/local_install.R - shell: bash - - name: Run gempyor tests - run: | - source /var/python/3.10/virtualenv/bin/activate - cd flepimop/gempyor_pkg - pytest -s - shell: bash - - name: Run gempyor-cli integration tests from examples - run: | - source /var/python/3.10/virtualenv/bin/activate - cd examples - pytest -s - shell: bash - - name: Run flepicommon tests - run: | - setwd("flepimop/R_packages/flepicommon") - devtools::test(stop_on_failure=TRUE) - shell: Rscript {0} - - name: Run inference tests - run: | - setwd("flepimop/R_packages/inference") - devtools::test(stop_on_failure=TRUE) - shell: Rscript {0} -# - name: Run integration tests -# env: -# CENSUS_API_KEY: ${{ secrets.CENSUS_API_KEY }} -# run: | -# Rscript build/local_install.R -# cd test -# source /var/python/3.10/virtualenv/bin/activate -# pytest run_tests.py -# shell: bash diff --git a/.github/workflows/flepicommon-ci.yml b/.github/workflows/flepicommon-ci.yml new file mode 100644 index 000000000..9f8abc089 --- /dev/null +++ b/.github/workflows/flepicommon-ci.yml @@ -0,0 +1,79 @@ +name: flepicommon-ci + +on: + workflow_dispatch: + push: + paths: + - flepimop/R_packages/flepicommon/**/* + branches: + - main + pull_request: + paths: + - flepimop/R_packages/flepicommon/**/* + branches: + - main + +jobs: + tests: + runs-on: ubuntu-latest + strategy: + matrix: + R-version: ["4.3.3"] + steps: + - name: Checkout + uses: actions/checkout@v4 + with: + lfs: true + sparse-checkout: | + * + !documentation/ + sparse-checkout-cone-mode: false + - name: Setup R + uses: r-lib/actions/setup-r@v2 + with: + r-version: ${{ matrix.R-version }} + update-rtools: true + - name: Install System Dependencies + run: sudo apt install libcurl4-openssl-dev libharfbuzz-dev libfribidi-dev libtiff5-dev libudunits2-dev libgdal-dev libgeos-dev libproj-dev + - name: Determine R Library Location + run: | + R_LIBPATH=$( R -s -e "cat(.libPaths()[1L])" | xargs ) + echo "R_LIBPATH=$R_LIBPATH" >> $GITHUB_ENV + R_LIBPATH_CKSUM=$( echo "$R_LIBPATH" | cksum | cut -d ' ' -f 1 ) + echo "R_LIBPATH_CKSUM=$R_LIBPATH_CKSUM" >> $GITHUB_ENV + CACHE_DATE=$( date -d "last Sunday" +%Y%m%d ) + echo "CACHE_DATE=$CACHE_DATE" >> $GITHUB_ENV + - name: R Library Cache + uses: actions/cache@v4 + with: + key: flepicommon-rlibs-${{ runner.os }}-${{ matrix.R-version }}-${{ hashFiles('flepimop/R_packages/flepicommon/DESCRIPTION', 'flepimop/R_packages/flepicommon/NAMESPACE') }}-${{ env.R_LIBPATH_CKSUM }}-${{ env.CACHE_DATE }} + path: ${{ env.R_LIBPATH }} + - name: Install R Dependencies + if: steps.r-library-cache.outputs.cache-hit != 'true' + run: | + install.packages( + "devtools", + repos = "https://cloud.r-project.org", + ) + library(devtools) + devtools::install_deps( + pkg = "flepimop/R_packages/flepicommon", + dependencies = TRUE + ) + install.packages("covidcast", repos = "https://cloud.r-project.org") + shell: Rscript {0} + - name: Install The flepicommon Package + run: | + devtools::install( + pkg = "flepimop/R_packages/flepicommon", + args = c(getOption("devtools.install.args"), "--install-tests"), + quick = TRUE, + dependencies = TRUE, + force = TRUE + ) + shell: Rscript {0} + - name: Run Tests + run: | + library(testthat) + test_package("flepicommon") + shell: Rscript {0} diff --git a/.github/workflows/gempyor-ci.yml b/.github/workflows/gempyor-ci.yml new file mode 100644 index 000000000..e2637f1af --- /dev/null +++ b/.github/workflows/gempyor-ci.yml @@ -0,0 +1,51 @@ +name: gempyor-ci + +on: + workflow_dispatch: + push: + paths: + - examples/**/* + - flepimop/gempyor_pkg/**/* + branches: + - main + pull_request: + paths: + - examples/**/* + - flepimop/gempyor_pkg/**/* + branches: + - main + +jobs: + tests: + runs-on: ubuntu-latest + strategy: + matrix: + python-version: ["3.10", "3.11"] + steps: + - name: Checkout + uses: actions/checkout@v4 + with: + lfs: true + sparse-checkout: | + * + !documentation/ + sparse-checkout-cone-mode: false + - name: Setup Python ${{ matrix.python-version }} + uses: actions/setup-python@v5 + with: + python-version: ${{ matrix.python-version }} + - name: Install gempyor + run: | + python -m pip install --upgrade pip + python -m pip install "flepimop/gempyor_pkg[test]" + shell: bash + - name: Run gempyor tests + run: | + cd flepimop/gempyor_pkg + pytest --exitfirst + shell: bash + - name: Run gempyor-cli integration tests from examples + run: | + cd examples + pytest --exitfirst + shell: bash diff --git a/.github/workflows/inference-ci.yml b/.github/workflows/inference-ci.yml new file mode 100644 index 000000000..d80a2e735 --- /dev/null +++ b/.github/workflows/inference-ci.yml @@ -0,0 +1,112 @@ +name: inference-ci + +on: + workflow_dispatch: + workflow_run: + workflows: ['flepicommon-ci', 'gempyor-ci'] + types: + - completed + push: + paths: + - flepimop/R_packages/inference/**/* + branches: + - main + pull_request: + paths: + - flepimop/R_packages/inference/**/* + branches: + - main + +jobs: + tests: + runs-on: ubuntu-latest + if: ${{ github.event_name != 'workflow_run' || github.event.workflow_run.conclusion == 'success' }} + strategy: + matrix: + R-version: ["4.3.3"] + python-version: ["3.10", "3.11"] + steps: + - name: Checkout + uses: actions/checkout@v4 + with: + lfs: true + sparse-checkout: | + * + !documentation/ + sparse-checkout-cone-mode: false + - name: Setup Python ${{ matrix.python-version }} + uses: actions/setup-python@v5 + with: + python-version: ${{ matrix.python-version }} + - name: Install gempyor + run: | + python -m pip install --upgrade pip + python -m pip install "flepimop/gempyor_pkg[test]" + shell: bash + - name: Setup R + uses: r-lib/actions/setup-r@v2 + with: + r-version: ${{ matrix.R-version }} + update-rtools: true + - name: Install System Dependencies + run: sudo apt install libcurl4-openssl-dev libharfbuzz-dev libfribidi-dev libtiff5-dev libudunits2-dev libgdal-dev libgeos-dev libproj-dev + - name: Determine R Library Location + run: | + R_LIBPATH=$( R -s -e "cat(.libPaths()[1L])" | xargs ) + echo "R_LIBPATH=$R_LIBPATH" >> $GITHUB_ENV + R_LIBPATH_CKSUM=$( echo "$R_LIBPATH" | cksum | cut -d ' ' -f 1 ) + echo "R_LIBPATH_CKSUM=$R_LIBPATH_CKSUM" >> $GITHUB_ENV + CACHE_DATE=$( date -d "last Sunday" +%Y%m%d ) + echo "CACHE_DATE=$CACHE_DATE" >> $GITHUB_ENV + - name: R Library Cache + uses: actions/cache@v4 + with: + key: inference-rlibs-${{ runner.os }}-${{ matrix.R-version }}-${{ hashFiles('flepimop/R_packages/flepicommon/DESCRIPTION', 'flepimop/R_packages/flepicommon/NAMESPACE', 'flepimop/R_packages/inference/DESCRIPTION', 'flepimop/R_packages/inference/NAMESPACE') }}-${{ env.R_LIBPATH_CKSUM }}-${{ env.CACHE_DATE }} + path: ${{ env.R_LIBPATH }} + - name: Install R Dependencies For flepicommon + if: steps.r-library-cache.outputs.cache-hit != 'true' + run: | + install.packages( + "devtools", + repos = "https://cloud.r-project.org", + ) + library(devtools) + devtools::install_deps( + pkg = "flepimop/R_packages/flepicommon", + dependencies = TRUE + ) + install.packages("covidcast", repos = "https://cloud.r-project.org") + shell: Rscript {0} + - name: Install The flepicommon Package + run: | + devtools::install( + pkg = "flepimop/R_packages/flepicommon", + quick = TRUE, + dependencies = TRUE, + force = TRUE + ) + shell: Rscript {0} + - name: Install R Dependencies For inference + if: steps.r-library-cache.outputs.cache-hit != 'true' + run: | + devtools::install_deps( + pkg = "flepimop/R_packages/inference", + dependencies = TRUE + ) + install.packages("covidcast", repos = "https://cloud.r-project.org") + shell: Rscript {0} + - name: Install The inference Package + run: | + devtools::install( + pkg = "flepimop/R_packages/inference", + args = c(getOption("devtools.install.args"), "--install-tests"), + quick = TRUE, + dependencies = TRUE, + force = TRUE + ) + shell: Rscript {0} + - name: Run Tests + run: | + library(testthat) + test_package("inference") + shell: Rscript {0} diff --git a/.github/workflows/labeler.yml b/.github/workflows/labeler.yml deleted file mode 100644 index 2b022fe7a..000000000 --- a/.github/workflows/labeler.yml +++ /dev/null @@ -1,18 +0,0 @@ -name: "Issue Labeler" -on: - issues: - types: [opened, edited] - -permissions: - issues: write - contents: read - -jobs: - triage: - runs-on: ubuntu-latest - steps: - - uses: github/issue-labeler@v3.3 - with: - configuration-path: .github/labeler.yml - enable-versioned-regex: 0 - repo-token: ${{ github.token }} diff --git a/flepimop/gempyor_pkg/src/gempyor/statistics.py b/flepimop/gempyor_pkg/src/gempyor/statistics.py index ea2cc72a3..ea10e7aa1 100644 --- a/flepimop/gempyor_pkg/src/gempyor/statistics.py +++ b/flepimop/gempyor_pkg/src/gempyor/statistics.py @@ -1,29 +1,69 @@ -import xarray as xr -import pandas as pd -import numpy as np +""" +Abstractions for interacting with output statistic configurations. + +This module provides the `Statistic` class which represents a entry in the inference -> +statistics section. +""" + +__all__ = ["Statistic"] + + import confuse +import numpy as np import scipy.stats +import xarray as xr class Statistic: """ - A statistic is a function that takes two time series and returns a scalar value. - It applies resample, scale, and regularization to the data before computing the statistic's log-loss. - Configuration: - - sim_var: the variable in the simulation data - - data_var: the variable in the ground truth data - - resample: resample the data before computing the statistic - - freq: the frequency to resample the data to - - aggregator: the aggregation function to use - - skipna: whether to skip NA values - - regularize: apply a regularization term to the data before computing the statistic - - # SkipNA is False by default, which results in NA values broadcasting when resampling (e.g a NA withing a sum makes the whole sum a NA) - # if True, then NA are replaced with 0 (for sum), 1 for product, ... - # In doubt, plot stat.plot_transformed() to see the effect of the resampling + Encapsulates logic for representing/implementing output statistic configurations. + + A statistic is a function that takes two time series and returns a scalar value. It + applies resample, scale, and regularization to the data before computing the + statistic's log-loss. + + Attributes: + data_var: The variable in the ground truth data. + dist: The name of the distribution to use for calculating log-likelihood. + name: The human readable name for the statistic given during instantiation. + params: Distribution parameters used in the log-likelihood calculation and + dependent on `dist`. + regularizations: Regularization functions that are added to the log loss of this + statistic. + resample: If the data should be resampled before computing the statistic. + Defaults to `False`. + resample_aggregator_name: The name of the aggregation function to use. This + attribute is not set when a "resample" section is not defined in the + `statistic_config` arg. + resample_freq: The frequency to resample the data to if the `resample` attribute + is `True`. This attribute is not set when a "resample" section is not + defined in the `statistic_config` arg. + resample_skipna: If NAs should be skipped when aggregating. `False` by default. + This attribute is not set when a "resample" section is not defined in the + `statistic_config` arg. + scale: If the data should be rescaled before computing the statistic. + scale_func: The function to use when rescaling the data. Can be any function + exported by `numpy`. This attribute is not set when a "scale" value is not + defined in the `statistic_config` arg. + zero_to_one: Should non-zero values be coerced to 1 when calculating + log-likelihood. """ - def __init__(self, name, statistic_config: confuse.ConfigView): + def __init__(self, name: str, statistic_config: confuse.ConfigView) -> None: + """ + Create an `Statistic` instance from a confuse config view. + + Args: + name: A human readable name for the statistic, mostly used for error + messages. + statistic_config: A confuse configuration view object describing an output + statistic. + + Raises: + ValueError: If an unsupported regularization name is provided via the + `statistic_config` arg. Currently only 'forecast' and 'allsubpop' are + supported. + """ self.sim_var = statistic_config["sim_var"].as_str() self.data_var = statistic_config["data_var"].as_str() self.name = name @@ -32,7 +72,7 @@ def __init__(self, name, statistic_config: confuse.ConfigView): if statistic_config["regularize"].exists(): for reg_config in statistic_config["regularize"]: # Iterate over the list reg_name = reg_config["name"].get() - reg_func = getattr(self, f"_{reg_name}_regularize") + reg_func = getattr(self, f"_{reg_name}_regularize", None) if reg_func is None: raise ValueError(f"Unsupported regularization: {reg_name}") self.regularizations.append((reg_func, reg_config.get())) @@ -47,12 +87,16 @@ def __init__(self, name, statistic_config: confuse.ConfigView): self.resample_aggregator = "" if resample_config["aggregator"].exists(): self.resample_aggregator_name = resample_config["aggregator"].get() - self.resample_skipna = False # TODO - if resample_config["aggregator"].exists() and resample_config["skipna"].exists(): + self.resample_skipna = False + if ( + resample_config["aggregator"].exists() + and resample_config["skipna"].exists() + ): self.resample_skipna = resample_config["skipna"].get() self.scale = False if statistic_config["scale"].exists(): + self.scale = True self.scale_func = getattr(np, statistic_config["scale"].get()) self.dist = statistic_config["likelihood"]["dist"].get() @@ -62,49 +106,138 @@ def __init__(self, name, statistic_config: confuse.ConfigView): self.params = {} self.zero_to_one = False - # TODO: this should be set_zeros_to and only do it for the probabilily if statistic_config["zero_to_one"].exists(): self.zero_to_one = statistic_config["zero_to_one"].get() - def _forecast_regularize(self, model_data, gt_data, **kwargs): - # scale the data so that the lastest X items are more important + def __str__(self) -> str: + return ( + f"{self.name}: {self.dist} between {self.sim_var} " + f"(sim) and {self.data_var} (data)." + ) + + def __repr__(self) -> str: + return f"A Statistic(): {self.__str__()}" + + def _forecast_regularize( + self, + model_data: xr.DataArray, + gt_data: xr.DataArray, + **kwargs: dict[str, int | float], + ) -> float: + """ + Regularization function to add weight to more recent forecasts. + + Args: + model_data: An xarray Dataset of the model data with date and subpop + dimensions. + gt_data: An xarray Dataset of the ground truth data with date and subpop + dimensions. + **kwargs: Optional keyword arguments that influence regularization. + Currently uses `last_n` for the number of observations to up weight and + `mult` for the coefficient of the regularization value. + + Returns: + The log-likelihood of the `last_n` observation up weighted by a factor of + `mult`. + """ + # scale the data so that the latest X items are more important last_n = kwargs.get("last_n", 4) mult = kwargs.get("mult", 2) - last_n_llik = self.llik(model_data.isel(date=slice(-last_n, None)), gt_data.isel(date=slice(-last_n, None))) + last_n_llik = self.llik( + model_data.isel(date=slice(-last_n, None)), + gt_data.isel(date=slice(-last_n, None)), + ) return mult * last_n_llik.sum().sum().values - def _allsubpop_regularize(self, model_data, gt_data, **kwargs): - """add a regularization term that is the sum of all subpopulations""" + def _allsubpop_regularize( + self, + model_data: xr.DataArray, + gt_data: xr.DataArray, + **kwargs: dict[str, int | float], + ) -> float: + """ + Regularization function to add the sum of all subpopulations. + + Args: + model_data: An xarray Dataset of the model data with date and subpop + dimensions. + gt_data: An xarray Dataset of the ground truth data with date and subpop + dimensions. + **kwargs: Optional keyword arguments that influence regularization. + Currently uses `mult` for the coefficient of the regularization value. + + Returns: + The sum of the subpopulations multiplied by `mult`. + """ mult = kwargs.get("mult", 1) llik_total = self.llik(model_data.sum("subpop"), gt_data.sum("subpop")) return mult * llik_total.sum().sum().values - def __str__(self) -> str: - return f"{self.name}: {self.dist} between {self.sim_var} (sim) and {self.data_var} (data)." + def apply_resample(self, data: xr.DataArray) -> xr.DataArray: + """ + Resample a data set to the given frequency using the specified aggregation. - def __repr__(self) -> str: - return f"A Statistic(): {self.__str__()}" + Args: + data: An xarray dataset with "date" and "subpop" dimensions. - def apply_resample(self, data): + Returns: + A resample dataset with similar dimensions to `data`. + """ if self.resample: - aggregator_method = getattr(data.resample(date=self.resample_freq), self.resample_aggregator_name) + aggregator_method = getattr( + data.resample(date=self.resample_freq), self.resample_aggregator_name + ) return aggregator_method(skipna=self.resample_skipna) else: return data - def apply_scale(self, data): + def apply_scale(self, data: xr.DataArray) -> xr.DataArray: + """ + Scale a data set using the specified scaling function. + + Args: + data: An xarray dataset with "date" and "subpop" dimensions. + + Returns: + An xarray dataset of the same shape and dimensions as `data` with the + `scale_func` attribute applied. + """ if self.scale: return self.scale_func(data) else: return data - def apply_transforms(self, data): + def apply_transforms(self, data: xr.DataArray): + """ + Convenient wrapper for resampling and scaling a data set. + + The resampling is applied *before* scaling which can affect the log-likelihood. + + Args: + data: An xarray dataset with "date" and "subpop" dimensions. + + Returns: + An scaled and resampled dataset with similar dimensions to `data`. + """ data_scaled_resampled = self.apply_scale(self.apply_resample(data)) return data_scaled_resampled - def llik(self, model_data: xr.DataArray, gt_data: xr.DataArray): + def llik(self, model_data: xr.DataArray, gt_data: xr.DataArray) -> xr.DataArray: + """ + Compute the log-likelihood of observing the ground truth given model output. + + Args: + model_data: An xarray Dataset of the model data with date and subpop + dimensions. + gt_data: An xarray Dataset of the ground truth data with date and subpop + dimensions. + + Returns: + The log-likelihood of observing `gt_data` from the model `model_data` as an + xarray DataArray with a "subpop" dimension. + """ dist_map = { "pois": scipy.stats.poisson.logpmf, "norm": lambda x, loc, scale: scipy.stats.norm.logpdf( @@ -112,8 +245,10 @@ def llik(self, model_data: xr.DataArray, gt_data: xr.DataArray): ), # wrong: "norm_cov": lambda x, loc, scale: scipy.stats.norm.logpdf( x, loc=loc, scale=scale * loc.where(loc > 5, 5) - ), # TODO: check, that it's really the loc - "nbinom": lambda x, n, p: scipy.stats.nbinom.logpmf(x, n=self.params.get("n"), p=model_data), + ), + "nbinom": lambda x, n, p: scipy.stats.nbinom.logpmf( + x, n=self.params.get("n"), p=model_data + ), "rmse": lambda x, y: -np.log(np.nansum(np.sqrt((x - y) ** 2))), "absolute_error": lambda x, y: -np.log(np.nansum(np.abs(x - y))), } @@ -133,20 +268,44 @@ def llik(self, model_data: xr.DataArray, gt_data: xr.DataArray): likelihood = xr.DataArray(likelihood, coords=gt_data.coords, dims=gt_data.dims) - # TODO: check the order of the arguments return likelihood - def compute_logloss(self, model_data, gt_data): + def compute_logloss( + self, model_data: xr.Dataset, gt_data: xr.Dataset + ) -> tuple[xr.DataArray, float]: + """ + Compute the logistic loss of observing the ground truth given model output. + + Args: + model_data: An xarray Dataset of the model data with date and subpop + dimensions. + gt_data: An xarray Dataset of the ground truth data with date and subpop + dimensions. + + Returns: + The logistic loss of observing `gt_data` from the model `model_data` + decomposed into the log-likelihood along the "subpop" dimension and + regularizations. + + Raises: + ValueError: If `model_data` and `gt_data` do not have the same shape. + """ model_data = self.apply_transforms(model_data[self.sim_var]) gt_data = self.apply_transforms(gt_data[self.data_var]) if not model_data.shape == gt_data.shape: raise ValueError( - f"{self.name} Statistic error: data and groundtruth do not have the same shape: model_data.shape={model_data.shape} != gt_data.shape={gt_data.shape}" + ( + f"{self.name} Statistic error: data and groundtruth do not have " + f"the same shape: model_data.shape={model_data.shape} != " + f"gt_data.shape={gt_data.shape}" + ) ) - regularization = 0 + regularization = 0.0 for reg_func, reg_config in self.regularizations: - regularization += reg_func(model_data=model_data, gt_data=gt_data, **reg_config) # Pass config parameters + regularization += reg_func( + model_data=model_data, gt_data=gt_data, **reg_config + ) # Pass config parameters return self.llik(model_data, gt_data).sum("date"), regularization diff --git a/flepimop/gempyor_pkg/tests/statistics/test_statistic_class.py b/flepimop/gempyor_pkg/tests/statistics/test_statistic_class.py new file mode 100644 index 000000000..e18861e9e --- /dev/null +++ b/flepimop/gempyor_pkg/tests/statistics/test_statistic_class.py @@ -0,0 +1,561 @@ +from datetime import date +from itertools import product +from typing import Any, Callable + +import confuse +import numpy as np +import pandas as pd +import pytest +import scipy +import xarray as xr + +from gempyor.statistics import Statistic +from gempyor.testing import create_confuse_configview_from_dict + + +class MockStatisticInput: + def __init__( + self, + name: str, + config: dict[str, Any], + model_data: xr.DataArray | None = None, + gt_data: xr.DataArray | None = None, + ) -> None: + self.name = name + self.config = config + self.model_data = model_data + self.gt_data = gt_data + self._confuse_subview = None + + def create_confuse_subview(self) -> confuse.Subview: + if self._confuse_subview is None: + self._confuse_subview = create_confuse_configview_from_dict( + self.config, name=self.name + ) + return self._confuse_subview + + def create_statistic_instance(self) -> Statistic: + return Statistic(self.name, self.create_confuse_subview()) + + +def invalid_regularization_factory() -> MockStatisticInput: + return MockStatisticInput( + "total_hospitalizations", + { + "name": "sum_hospitalizations", + "sim_var": "incidH", + "data_var": "incidH", + "remove_na": True, + "add_one": True, + "likelihood": {"dist": "rmse"}, + "regularize": [{"name": "forecast"}, {"name": "invalid"}], + }, + ) + + +def invalid_misshaped_data_factory() -> MockStatisticInput: + model_data = xr.Dataset( + data_vars={"incidH": (["date", "subpop"], np.random.randn(10, 3))}, + coords={ + "date": pd.date_range(date(2024, 1, 1), date(2024, 1, 10)), + "subpop": ["01", "02", "03"], + }, + ) + gt_data = xr.Dataset( + data_vars={"incidH": (["date", "subpop"], np.random.randn(11, 2))}, + coords={ + "date": pd.date_range(date(2024, 1, 1), date(2024, 1, 11)), + "subpop": ["02", "03"], + }, + ) + return MockStatisticInput( + "total_hospitalizations", + { + "name": "sum_hospitalizations", + "sim_var": "incidH", + "data_var": "incidH", + "remove_na": True, + "add_one": True, + "likelihood": {"dist": "norm", "params": {"scale": 2.0}}, + }, + model_data=model_data, + gt_data=gt_data, + ) + + +def simple_valid_factory() -> MockStatisticInput: + data_coords = { + "date": pd.date_range(date(2024, 1, 1), date(2024, 1, 10)), + "subpop": ["01", "02", "03"], + } + data_dim = [len(v) for v in data_coords.values()] + model_data = xr.Dataset( + data_vars={ + "incidH": (list(data_coords.keys()), np.random.randn(*data_dim)), + "incidD": (list(data_coords.keys()), np.random.randn(*data_dim)), + }, + coords=data_coords, + ) + gt_data = xr.Dataset( + data_vars={ + "incidH": (list(data_coords.keys()), np.random.randn(*data_dim)), + "incidD": (list(data_coords.keys()), np.random.randn(*data_dim)), + }, + coords=data_coords, + ) + return MockStatisticInput( + "total_hospitalizations", + { + "name": "sum_hospitalizations", + "sim_var": "incidH", + "data_var": "incidH", + "remove_na": True, + "add_one": True, + "likelihood": {"dist": "norm", "params": {"scale": 2.0}}, + }, + model_data=model_data, + gt_data=gt_data, + ) + + +def simple_valid_resample_factory() -> MockStatisticInput: + data_coords = { + "date": pd.date_range(date(2024, 1, 1), date(2024, 12, 31)), + "subpop": ["01", "02", "03", "04"], + } + data_dim = [len(v) for v in data_coords.values()] + model_data = xr.Dataset( + data_vars={ + "incidH": (list(data_coords.keys()), np.random.randn(*data_dim)), + "incidD": (list(data_coords.keys()), np.random.randn(*data_dim)), + }, + coords=data_coords, + ) + gt_data = xr.Dataset( + data_vars={ + "incidH": (list(data_coords.keys()), np.random.randn(*data_dim)), + "incidD": (list(data_coords.keys()), np.random.randn(*data_dim)), + }, + coords=data_coords, + ) + return MockStatisticInput( + "total_hospitalizations", + { + "name": "sum_hospitalizations", + "sim_var": "incidH", + "data_var": "incidH", + "remove_na": True, + "add_one": True, + "likelihood": {"dist": "rmse"}, + "resample": {"freq": "MS", "aggregator": "sum"}, + }, + model_data=model_data, + gt_data=gt_data, + ) + + +def simple_valid_scale_factory() -> MockStatisticInput: + data_coords = { + "date": pd.date_range(date(2024, 1, 1), date(2024, 12, 31)), + "subpop": ["01", "02", "03", "04"], + } + data_dim = [len(v) for v in data_coords.values()] + model_data = xr.Dataset( + data_vars={ + "incidH": (list(data_coords.keys()), np.random.randn(*data_dim)), + "incidD": (list(data_coords.keys()), np.random.randn(*data_dim)), + }, + coords=data_coords, + ) + gt_data = xr.Dataset( + data_vars={ + "incidH": (list(data_coords.keys()), np.random.randn(*data_dim)), + "incidD": (list(data_coords.keys()), np.random.randn(*data_dim)), + }, + coords=data_coords, + ) + return MockStatisticInput( + "total_hospitalizations", + { + "name": "sum_hospitalizations", + "sim_var": "incidH", + "data_var": "incidH", + "remove_na": True, + "add_one": True, + "likelihood": {"dist": "rmse"}, + "scale": "exp", + }, + model_data=model_data, + gt_data=gt_data, + ) + + +def simple_valid_resample_and_scale_factory() -> MockStatisticInput: + data_coords = { + "date": pd.date_range(date(2024, 1, 1), date(2024, 12, 31)), + "subpop": ["01", "02", "03", "04"], + } + data_dim = [len(v) for v in data_coords.values()] + model_data = xr.Dataset( + data_vars={ + "incidH": (list(data_coords.keys()), np.random.randn(*data_dim)), + "incidD": (list(data_coords.keys()), np.random.randn(*data_dim)), + }, + coords=data_coords, + ) + gt_data = xr.Dataset( + data_vars={ + "incidH": (list(data_coords.keys()), np.random.randn(*data_dim)), + "incidD": (list(data_coords.keys()), np.random.randn(*data_dim)), + }, + coords=data_coords, + ) + return MockStatisticInput( + "total_hospitalizations", + { + "name": "sum_hospitalizations", + "sim_var": "incidD", + "data_var": "incidD", + "remove_na": True, + "add_one": True, + "likelihood": {"dist": "rmse"}, + "resample": {"freq": "W", "aggregator": "max"}, + "scale": "sin", + }, + model_data=model_data, + gt_data=gt_data, + ) + + +all_valid_factories = [ + (simple_valid_factory), + (simple_valid_resample_factory), + (simple_valid_resample_factory), + (simple_valid_resample_and_scale_factory), +] + + +class TestStatistic: + @pytest.mark.parametrize("factory", [(invalid_regularization_factory)]) + def test_unsupported_regularizations_value_error( + self, factory: Callable[[], MockStatisticInput] + ) -> None: + mock_inputs = factory() + unsupported_name = next( + reg_name + for reg_name in [ + reg["name"] for reg in mock_inputs.config.get("regularize", []) + ] + if reg_name not in ["forecast", "allsubpop"] + ) + with pytest.raises( + ValueError, match=rf"^Unsupported regularization\: {unsupported_name}$" + ): + mock_inputs.create_statistic_instance() + + @pytest.mark.parametrize("factory", all_valid_factories) + def test_statistic_instance_attributes( + self, factory: Callable[[], MockStatisticInput] + ) -> None: + # Setup + mock_inputs = factory() + statistic = mock_inputs.create_statistic_instance() + + # `data_var` attribute + assert statistic.data_var == mock_inputs.config["data_var"] + + # `dist` attribute + assert statistic.dist == mock_inputs.config["likelihood"]["dist"] + + # `name` attribute + assert statistic.name == mock_inputs.name + + # `params` attribute + assert statistic.params == mock_inputs.config["likelihood"].get("params", {}) + + # `regularizations` attribute + assert statistic.regularizations == [ + (r["name"], r) for r in mock_inputs.config.get("regularize", []) + ] + + # `resample` attribute + resample_config = mock_inputs.config.get("resample", {}) + assert statistic.resample == (resample_config != {}) + + if resample_config: + # `resample_aggregator_name` attribute + assert statistic.resample_aggregator_name == resample_config.get( + "aggregator", "" + ) + + # `resample_freq` attribute + assert statistic.resample_freq == resample_config.get("freq", "") + + # `resample_skipna` attribute + assert ( + statistic.resample_skipna == resample_config.get("skipna", False) + if resample_config.get("aggregator") is not None + else False + ) + + # `scale` attribute + assert statistic.scale == (mock_inputs.config.get("scale") is not None) + + # `scale_func` attribute + if (scale_func := mock_inputs.config.get("scale")) is not None: + assert statistic.scale_func == getattr(np, scale_func) + + # `sim_var` attribute + assert statistic.sim_var == mock_inputs.config["sim_var"] + + # `zero_to_one` attribute + assert statistic.zero_to_one == mock_inputs.config.get("zero_to_one", False) + + @pytest.mark.parametrize("factory", all_valid_factories) + def test_statistic_str_and_repr( + self, factory: Callable[[], MockStatisticInput] + ) -> None: + # Setup + mock_inputs = factory() + statistic = mock_inputs.create_statistic_instance() + + # Tests + statistic_str = ( + f"{mock_inputs.name}: {mock_inputs.config['likelihood']['dist']} between " + f"{mock_inputs.config['sim_var']} (sim) and " + f"{mock_inputs.config['data_var']} (data)." + ) + assert str(statistic) == statistic_str + assert repr(statistic) == f"A Statistic(): {statistic_str}" + + @pytest.mark.parametrize("factory,last_n,mult", [(simple_valid_factory, 4, 2.0)]) + def test_forecast_regularize( + self, factory: Callable[[], MockStatisticInput], last_n: int, mult: int | float + ) -> None: + # Setup + mock_inputs = factory() + statistic = mock_inputs.create_statistic_instance() + + # Tests + forecast_regularization = statistic._forecast_regularize( + mock_inputs.model_data[mock_inputs.config["sim_var"]], + mock_inputs.gt_data[mock_inputs.config["data_var"]], + last_n=last_n, + mult=mult, + ) + assert isinstance(forecast_regularization, float) + + @pytest.mark.parametrize("factory,mult", [(simple_valid_factory, 2.0)]) + def test_allsubpop_regularize( + self, factory: Callable[[], MockStatisticInput], mult: int | float + ) -> None: + # Setup + mock_inputs = factory() + statistic = mock_inputs.create_statistic_instance() + + # Tests + forecast_regularization = statistic._allsubpop_regularize( + mock_inputs.model_data[mock_inputs.config["sim_var"]], + mock_inputs.gt_data[mock_inputs.config["data_var"]], + mult=mult, + ) + assert isinstance(forecast_regularization, float) + + @pytest.mark.parametrize("factory", all_valid_factories) + def test_apply_resample(self, factory: Callable[[], MockStatisticInput]) -> None: + # Setup + mock_inputs = factory() + statistic = mock_inputs.create_statistic_instance() + + # Tests + resampled_data = statistic.apply_resample( + mock_inputs.model_data[mock_inputs.config["sim_var"]] + ) + if resample_config := mock_inputs.config.get("resample", {}): + # Resample config + expected_resampled_data = mock_inputs.model_data[ + mock_inputs.config["sim_var"] + ].resample(date=resample_config.get("freq", "")) + aggregation_func = getattr( + expected_resampled_data, resample_config.get("aggregator", "") + ) + expected_resampled_data = aggregation_func( + skipna=( + resample_config.get("skipna", False) + if resample_config.get("aggregator") is not None + else False + ) + ) + assert resampled_data.identical(expected_resampled_data) + else: + # No resample config, `apply_resample` returns our input + assert resampled_data.identical( + mock_inputs.model_data[mock_inputs.config["sim_var"]] + ) + + @pytest.mark.parametrize("factory", all_valid_factories) + def test_apply_scale(self, factory: Callable[[], MockStatisticInput]) -> None: + # Setup + mock_inputs = factory() + statistic = mock_inputs.create_statistic_instance() + + # Tests + scaled_data = statistic.apply_scale( + mock_inputs.model_data[mock_inputs.config["sim_var"]] + ) + if (scale_func := mock_inputs.config.get("scale")) is not None: + # Scale config + expected_scaled_data = getattr(np, scale_func)( + mock_inputs.model_data[mock_inputs.config["sim_var"]] + ) + assert scaled_data.identical(expected_scaled_data) + else: + # No scale config, `apply_scale` is a no-op + assert scaled_data.identical( + mock_inputs.model_data[mock_inputs.config["sim_var"]] + ) + + @pytest.mark.parametrize("factory", all_valid_factories) + def test_apply_transforms(self, factory: Callable[[], MockStatisticInput]) -> None: + # Setup + mock_inputs = factory() + statistic = mock_inputs.create_statistic_instance() + + # Tests + transformed_data = statistic.apply_transforms( + mock_inputs.model_data[mock_inputs.config["sim_var"]] + ) + expected_transformed_data = mock_inputs.model_data[ + mock_inputs.config["sim_var"] + ].copy() + if resample_config := mock_inputs.config.get("resample", {}): + # Resample config + expected_transformed_data = expected_transformed_data.resample( + date=resample_config.get("freq", "") + ) + aggregation_func = getattr( + expected_transformed_data, resample_config.get("aggregator", "") + ) + expected_transformed_data = aggregation_func( + skipna=( + resample_config.get("skipna", False) + if resample_config.get("aggregator") is not None + else False + ) + ) + if (scale_func := mock_inputs.config.get("scale")) is not None: + # Scale config + expected_transformed_data = getattr(np, scale_func)( + expected_transformed_data + ) + assert transformed_data.identical(expected_transformed_data) + + @pytest.mark.parametrize("factory", all_valid_factories) + def test_llik(self, factory: Callable[[], MockStatisticInput]) -> None: + # Setup + mock_inputs = factory() + statistic = mock_inputs.create_statistic_instance() + + # Tests + log_likelihood = statistic.llik( + mock_inputs.model_data[mock_inputs.config["sim_var"]], + mock_inputs.gt_data[mock_inputs.config["data_var"]], + ) + + assert isinstance(log_likelihood, xr.DataArray) + assert ( + log_likelihood.dims + == mock_inputs.gt_data[mock_inputs.config["data_var"]].dims + ) + assert log_likelihood.coords.identical( + mock_inputs.gt_data[mock_inputs.config["data_var"]].coords + ) + dist_name = mock_inputs.config["likelihood"]["dist"] + if dist_name in {"absolute_error", "rmse"}: + # MAE produces a single repeated number + assert np.allclose( + log_likelihood.values, + -np.log( + np.nansum( + np.abs( + mock_inputs.model_data[mock_inputs.config["sim_var"]] + - mock_inputs.gt_data[mock_inputs.config["data_var"]] + ) + ) + ), + ) + elif dist_name == "pois": + assert np.allclose( + log_likelihood.values, + scipy.stats.poisson.logpmf( + mock_inputs.gt_data[mock_inputs.config["data_var"]].values, + mock_inputs.model_data[mock_inputs.config["data_var"]].values, + ), + ) + elif dist_name == {"norm", "norm_cov"}: + scale = mock_inputs.config["likelihood"]["params"]["scale"] + if dist_name == "norm_cov": + scale *= mock_inputs.model_data[mock_inputs.config["sim_var"]].where( + mock_inputs.model_data[mock_inputs.config["sim_var"]] > 5, 5 + ) + assert np.allclose( + log_likelihood.values, + scipy.stats.norm.logpdf( + mock_inputs.gt_data[mock_inputs.config["data_var"]].values, + mock_inputs.model_data[mock_inputs.config["sim_var"]].values, + scale=scale, + ), + ) + elif dist_name == "nbinom": + assert np.allclose( + log_likelihood.values, + scipy.stats.nbinom.logpmf( + mock_inputs.gt_data[mock_inputs.config["data_var"]].values, + n=mock_inputs.config["likelihood"]["params"]["n"], + p=mock_inputs.model_data[mock_inputs.config["sim_var"]].values, + ), + ) + + @pytest.mark.parametrize("factory", [(invalid_misshaped_data_factory)]) + def test_compute_logloss_data_misshape_value_error( + self, factory: Callable[[], MockStatisticInput] + ) -> None: + mock_inputs = factory() + statistic = mock_inputs.create_statistic_instance() + + model_rows, model_cols = mock_inputs.model_data[ + mock_inputs.config["sim_var"] + ].shape + gt_rows, gt_cols = mock_inputs.gt_data[mock_inputs.config["data_var"]].shape + expected_match = ( + rf"^{mock_inputs.name} Statistic error\: data and groundtruth do not have " + rf"the same shape\: model\_data\.shape\=\({model_rows}\, {model_cols}\) " + rf"\!\= gt\_data\.shape\=\({gt_rows}\, {gt_cols}\)$" + ) + with pytest.raises(ValueError, match=expected_match): + statistic.compute_logloss(mock_inputs.model_data, mock_inputs.gt_data) + + @pytest.mark.parametrize("factory", all_valid_factories) + def test_compute_logloss(self, factory: Callable[[], MockStatisticInput]) -> None: + # Setup + mock_inputs = factory() + statistic = mock_inputs.create_statistic_instance() + log_likelihood, regularization = statistic.compute_logloss( + mock_inputs.model_data, mock_inputs.gt_data + ) + regularization_config = mock_inputs.config.get("regularize", []) + + # Assertions on log_likelihood + assert isinstance(log_likelihood, xr.DataArray) + assert log_likelihood.coords.identical( + xr.Coordinates(coords={"subpop": mock_inputs.gt_data.coords.get("subpop")}) + ) + + # Assertions on regularization + assert isinstance(regularization, float) + if regularization_config: + # Regularizations on logistic loss + assert regularization != 0.0 + else: + # No regularizations on logistic loss + assert regularization == 0.0