# Source code for glotaran.analysis.optimization_group_calculator_unlinked

from __future__ import annotations

from typing import TYPE_CHECKING

import numpy as np
import xarray as xr

from glotaran.analysis.optimization_group_calculator import OptimizationGroupCalculator
from glotaran.analysis.util import CalculatedMatrix
from glotaran.analysis.util import apply_weight
from glotaran.analysis.util import calculate_clp_penalties
from glotaran.analysis.util import calculate_matrix
from glotaran.analysis.util import reduce_matrix
from glotaran.analysis.util import retrieve_clps
from glotaran.model import DatasetModel

if TYPE_CHECKING:
    from glotaran.analysis.optimization_group import OptimizationGroup


class OptimizationGroupCalculatorUnlinked(OptimizationGroupCalculator):
    """Represents a problem where the clps are not linked.

    Every dataset model of the optimization group is processed on its own:
    its matrices are calculated per dataset and its residual is obtained either
    per index of the global axis or, for datasets with a global model, from a
    single matrix built with the Kronecker product of the global matrix and the
    model matrix.
    """

    def __init__(self, group: OptimizationGroup):
        """Initialize the calculator and cache flattened data for global models.

        For every dataset model with a global model the data (and, if present,
        the weight) is transposed and flattened once, and the weight is already
        multiplied onto the cached data.

        Parameters
        ----------
        group : OptimizationGroup
            The optimization group this calculator works on.
        """
        super().__init__(group)

        self._global_matrices = {}
        self._flattened_data = {}
        self._flattened_weights = {}
        for label, dataset_model in group.dataset_models.items():
            if not dataset_model.has_global_model():
                continue
            flattened_data = dataset_model.get_data().T.flatten()
            weight = dataset_model.get_weight()
            if weight is not None:
                weight = weight.T.flatten()
                flattened_data *= weight
                # Must be the same attribute that ``_calculate_full_model_residual``
                # reads, otherwise the weight is never applied to the matrix.
                self._flattened_weights[label] = weight
            self._flattened_data[label] = flattened_data

    @property
    def global_matrices(self) -> dict[str, CalculatedMatrix]:
        """Global matrices of the datasets with a global model, keyed by dataset label."""
        return self._global_matrices

    def calculate_matrices(
        self,
    ) -> tuple[
        dict[str, CalculatedMatrix | list[CalculatedMatrix]],
        dict[str, CalculatedMatrix | list[CalculatedMatrix]],
    ]:
        """Calculates the model matrices.

        All previously calculated matrices of the group (and the global
        matrices of this calculator) are discarded and recalculated.

        Returns
        -------
        tuple
            The matrices and the reduced matrices of the group, each keyed by
            dataset label. Index dependent datasets hold a list with one entry
            per index of the global axis.
        """
        self._group._matrices = {}
        self._global_matrices = {}
        self._group._reduced_matrices = {}

        for label, dataset_model in self._group.dataset_models.items():

            if dataset_model.is_index_dependent():
                self._calculate_index_dependent_matrix(label, dataset_model)
            else:
                self._calculate_index_independent_matrix(label, dataset_model)

            if dataset_model.has_global_model():
                self._calculate_global_matrix(label, dataset_model)

        return self._group._matrices, self._group._reduced_matrices

    def _calculate_index_dependent_matrix(self, label: str, dataset_model: DatasetModel):
        """Calculate one matrix per index of the global axis of a dataset.

        Reduced matrices are only calculated for datasets without a global
        model; for datasets with a global model the list stays empty.
        """
        has_global_model = dataset_model.has_global_model()
        global_dimension = dataset_model.get_global_dimension()

        matrices = self._group._matrices[label] = []
        reduced_matrices = self._group._reduced_matrices[label] = []
        for i, index in enumerate(dataset_model.get_global_axis()):
            matrix = calculate_matrix(dataset_model, {global_dimension: i})
            matrices.append(matrix)
            if not has_global_model:
                reduced_matrices.append(
                    reduce_matrix(matrix, self._group.model, self._group.parameters, index)
                )

    def _calculate_index_independent_matrix(self, label: str, dataset_model: DatasetModel):
        """Calculate the single matrix of an index independent dataset.

        The reduced matrix is only calculated for datasets without a global model.
        """
        matrix = calculate_matrix(dataset_model, {})
        self._group._matrices[label] = matrix
        if not dataset_model.has_global_model():
            self._group._reduced_matrices[label] = reduce_matrix(
                matrix, self._group.model, self._group.parameters, None
            )

    def _calculate_global_matrix(self, label: str, dataset_model: DatasetModel):
        """Calculate and store the global matrix of a dataset with a global model."""
        self._global_matrices[label] = calculate_matrix(dataset_model, {}, as_global_model=True)

    def calculate_residual(
        self,
    ) -> tuple[
        dict[str, list[np.ndarray]],
        dict[str, list[np.ndarray]],
        dict[str, list[np.ndarray]],
        dict[str, list[np.ndarray]],
    ]:
        """Calculates the residuals.

        All previously calculated clps, residuals and additional penalties of
        the group are discarded and recalculated.

        Returns
        -------
        tuple
            Reduced clps, clps, weighted residuals and residuals of the group,
            each keyed by dataset label. Datasets without a global model hold a
            list with one entry per index of the global axis; datasets with a
            global model hold the values returned for the full model.
        """
        self._group._reduced_clps = {}
        self._group._clps = {}
        self._group._weighted_residuals = {}
        self._group._residuals = {}
        self._group._additional_penalty = []

        for label, dataset_model in self._group.dataset_models.items():
            if dataset_model.has_global_model():
                self._calculate_full_model_residual(label, dataset_model)
            else:
                self._calculate_residual(label, dataset_model)

        # Collapse the per-dataset penalties into one array; an empty list is
        # kept as-is when no dataset contributed a penalty.
        self._group._additional_penalty = (
            np.concatenate(self._group._additional_penalty)
            if len(self._group._additional_penalty) != 0
            else []
        )
        return (
            self._group._reduced_clps,
            self._group._clps,
            self._group._weighted_residuals,
            self._group._residuals,
        )

    def _calculate_residual(self, label: str, dataset_model: DatasetModel):
        """Calculate clps and residuals of a dataset for every index of its global axis.

        Afterwards the clp penalties of the dataset are calculated and, if not
        empty, appended to the additional penalty of the group.
        """
        self._group._reduced_clps[label] = []
        self._group._clps[label] = []
        self._group._weighted_residuals[label] = []
        self._group._residuals[label] = []

        data = dataset_model.get_data()
        global_axis = dataset_model.get_global_axis()
        # Loop invariants, evaluated once instead of once per index.
        weight = dataset_model.get_weight()
        index_dependent = dataset_model.is_index_dependent()

        for i, index in enumerate(global_axis):
            if index_dependent:
                # NOTE(review): the stored per-index matrix is scaled/weighted in
                # place below - confirm nothing reuses it unmodified afterwards.
                reduced_clp_labels, reduced_matrix = self._group.reduced_matrices[label][i]
            else:
                reduced_clp_labels, reduced_matrix = self._group.reduced_matrices[label]
                # The same matrix is reused for every index, so work on a copy.
                reduced_matrix = reduced_matrix.copy()

            if dataset_model.scale is not None:
                reduced_matrix *= dataset_model.scale

            if weight is not None:
                # The return value is unused, so apply_weight is expected to
                # modify the matrix in place.
                apply_weight(reduced_matrix, weight[:, i])

            reduced_clps, residual = self._group._residual_function(reduced_matrix, data[:, i])

            self._group._reduced_clps[label].append(reduced_clps)

            clp_labels = self._get_clp_labels(label, i)
            self._group._clps[label].append(
                retrieve_clps(
                    self._group.model,
                    self._group.parameters,
                    clp_labels,
                    reduced_clp_labels,
                    reduced_clps,
                    index,
                )
            )
            self._group._weighted_residuals[label].append(residual)
            if weight is not None:
                self._group._residuals[label].append(residual / weight[:, i])
            else:
                self._group._residuals[label].append(residual)

        clp_labels = self._get_clp_labels(label)
        additional_penalty = calculate_clp_penalties(
            self._group.model,
            self._group.parameters,
            clp_labels,
            self._group._clps[label],
            global_axis,
            self._group.dataset_models,
        )
        if additional_penalty.size != 0:
            self._group._additional_penalty.append(additional_penalty)

    def _calculate_full_model_residual(self, label: str, dataset_model: DatasetModel):
        """Calculate clps and residuals of a dataset with a global model.

        The full matrix is the Kronecker product of the global matrix and the
        model matrix (built row by row of the global matrix for index dependent
        datasets). It is evaluated against the flattened data cached in
        ``__init__``.
        """
        model_matrix = self._group.matrices[label]
        global_matrix = self.global_matrices[label].matrix

        if dataset_model.is_index_dependent():
            matrix = np.concatenate(
                [
                    np.kron(global_row, model_matrix[i].matrix)
                    for i, global_row in enumerate(global_matrix)
                ]
            )
        else:
            matrix = np.kron(global_matrix, model_matrix.matrix)

        weight = self._flattened_weights.get(label)
        if weight is not None:
            apply_weight(matrix, weight)

        clps, weighted_residual = self._group._residual_function(
            matrix, self._flattened_data[label]
        )
        self._group._clps[label] = clps
        self._group._weighted_residuals[label] = weighted_residual
        # Divide into a new array: an in-place division would also change the
        # weighted residual, because both entries would share one array.
        self._group._residuals[label] = (
            weighted_residual if weight is None else weighted_residual / weight
        )

    def _get_clp_labels(self, label: str, index: int = 0):
        """Return the clp labels of a dataset's matrix.

        Parameters
        ----------
        label : str
            The label of the dataset.
        index : int
            Position in the list of matrices; only used for index dependent datasets.
        """
        matrices = self._group.matrices[label]
        if self._group.dataset_models[label].is_index_dependent():
            return matrices[index].clp_labels
        return matrices.clp_labels

    def create_index_dependent_result_dataset(self, label: str, dataset: xr.Dataset) -> xr.Dataset:
        """Creates a result datasets for index dependent matrices.

        Parameters
        ----------
        label : str
            The label of the dataset.
        dataset : xr.Dataset
            The dataset to add the results to; it is modified in place.

        Returns
        -------
        xr.Dataset
            The dataset that was passed in, with the result variables added.
        """
        dataset_model = self._group.dataset_models[label]
        model_dimension = dataset_model.get_model_dimension()
        global_dimension = dataset_model.get_global_dimension()

        # The clp labels of the first matrix are used for the whole dataset.
        dataset.coords["clp_label"] = self._get_clp_labels(label)
        dataset["matrix"] = (
            (global_dimension, model_dimension, "clp_label"),
            np.asarray([m.matrix for m in self._group.matrices[label]]),
        )

        if dataset_model.has_global_model():
            self._add_global_matrix_to_dataset(label, dataset)
            self._add_full_model_residual_and_clp_to_dataset(label, dataset)
        else:
            self._add_residual_and_clp_to_dataset(label, dataset)

        return dataset

    def create_index_independent_result_dataset(
        self, label: str, dataset: xr.Dataset
    ) -> xr.Dataset:
        """Creates a result datasets for index independent matrices.

        Parameters
        ----------
        label : str
            The label of the dataset.
        dataset : xr.Dataset
            The dataset to add the results to; it is modified in place.

        Returns
        -------
        xr.Dataset
            The dataset that was passed in, with the result variables added.
        """
        dataset_model = self._group.dataset_models[label]
        matrix = self._group.matrices[label]
        dataset.coords["clp_label"] = matrix.clp_labels
        model_dimension = dataset_model.get_model_dimension()
        dataset["matrix"] = ((model_dimension, "clp_label"), matrix.matrix)

        if dataset_model.has_global_model():
            self._add_global_matrix_to_dataset(label, dataset)
            self._add_full_model_residual_and_clp_to_dataset(label, dataset)
        else:
            self._add_residual_and_clp_to_dataset(label, dataset)

        return dataset

    def _add_global_matrix_to_dataset(self, label: str, dataset: xr.Dataset) -> None:
        """Add the global matrix and its clp labels to the dataset (in place)."""
        matrix = self.global_matrices[label]
        dataset.coords["global_clp_label"] = matrix.clp_labels
        global_dimension = self._group.dataset_models[label].get_global_dimension()
        dataset["global_matrix"] = ((global_dimension, "global_clp_label"), matrix.matrix)

    def _add_residual_and_clp_to_dataset(self, label: str, dataset: xr.Dataset):
        """Add per-index clps and residuals of a dataset to the dataset (in place).

        The residuals are stored as one entry per index of the global axis, so
        they are transposed to match the (model, global) dimension order.
        """
        dataset_model = self._group.dataset_models[label]
        model_dimension = dataset_model.get_model_dimension()
        global_dimension = dataset_model.get_global_dimension()
        dataset["clp"] = (
            (global_dimension, "clp_label"),
            np.asarray(self._group.clps[label]),
        )
        dataset["weighted_residual"] = (
            (model_dimension, global_dimension),
            np.transpose(np.asarray(self._group.weighted_residuals[label])),
        )
        dataset["residual"] = (
            (model_dimension, global_dimension),
            np.transpose(np.asarray(self._group.residuals[label])),
        )

    def _add_full_model_residual_and_clp_to_dataset(self, label: str, dataset: xr.Dataset):
        """Add full model clps and residuals of a dataset to the dataset (in place).

        Requires the ``clp_label`` and ``global_clp_label`` coordinates to be
        present on the dataset already.
        """
        dataset_model = self._group.dataset_models[label]
        model_dimension = dataset_model.get_model_dimension()
        global_dimension = dataset_model.get_global_dimension()
        dataset["clp"] = (
            ("global_clp_label", "clp_label"),
            self._group.clps[label].reshape(
                (dataset.coords["global_clp_label"].size, dataset.coords["clp_label"].size)
            ),
        )

        # The flattened residuals follow the order of ``get_data().T.flatten()``
        # used in ``__init__``. To undo it, reshape to the reversed data shape
        # and transpose back; a plain reshape to the data shape would put the
        # values into the wrong cells.
        # NOTE(review): assumes ``dataset.data`` has the same axis order as
        # ``dataset_model.get_data()`` - confirm.
        flattened_shape = dataset.data.shape[::-1]
        dataset["weighted_residual"] = (
            (model_dimension, global_dimension),
            self._group.weighted_residuals[label].reshape(flattened_shape).T,
        )
        dataset["residual"] = (
            (model_dimension, global_dimension),
            self._group.residuals[label].reshape(flattened_shape).T,
        )

    def calculate_full_penalty(self) -> np.ndarray:
        """Calculate the full penalty of the group, if not calculated yet.

        The weighted residuals of all datasets are concatenated and, unless the
        additional penalty is ``None``, the additional penalty is appended. The
        result is cached on the group.

        Returns
        -------
        np.ndarray
            The full penalty.
        """
        if self._group._full_penalty is None:
            weighted_residuals = self._group.weighted_residuals
            additional_penalty = self._group.additional_penalty
            # Per-index results are lists of arrays, full model results are
            # already a single array.
            residuals = [
                np.concatenate(residual) if isinstance(residual, list) else residual
                for residual in weighted_residuals.values()
            ]

            self._group._full_penalty = (
                np.concatenate((np.concatenate(residuals), additional_penalty))
                if additional_penalty is not None
                else np.concatenate(residuals)
            )
        return self._group._full_penalty