
Trajectory Mixing

trainax.TrajectorySubStacker

Bases: Module

Source code in trainax/_mixer.py
class TrajectorySubStacker(eqx.Module):
    data_sub_trajectories: PyTree[Float[Array, "num_total_samples sub_trj_len ..."]]

    num_total_samples: int

    def __init__(
        self,
        data_trajectories: PyTree[Float[Array, "num_samples trj_len ..."]],
        sub_trajectory_len: int,
        *,
        do_sub_stacking: bool = True,
        only_store_ic: bool = False,
    ):
        """
        Slice a batch of trajectories into sub-trajectories.

        Useful to create windows of specific length for (unrolled) training
        methodologies of autoregressive neural emulators.

        **Arguments:**

        - `data_trajectories`: The batch of trajectories to slice. This must be
            a PyTree of Arrays that have at least two leading axes: a batch
            axis and a time axis. For example, the zeroth axis can be
            associated with multiple initial conditions or constitutive
            parameters, and the first axis represents all temporal snapshots.
            The PyTree can also simply be a single array. You can provide
            additional leaves in the PyTree, e.g., for the corresponding
            constitutive parameters; make sure that the emulator has the
            corresponding signature.
        - `sub_trajectory_len`: The length of the sub-trajectories. This must
            be less than or equal to the length of the trajectories (`trj_len`).
            For unrolled training with `t` steps, set this to `t+1` to include
            the necessary initial condition.
        - `do_sub_stacking`: Whether to slice out all possible
            (overlapping) windows out of the `trj_len` or just slice the
            `trj_len` axis from `0:sub_trajectory_len`.
        - `only_store_ic`: Whether to only store the initial
            condition of the sub-trajectories. This can be helpful for
            configurations that do not need the reference trajectory like
            residuum-based learning strategies.

        !!! info
            * Since the sliced-out windows overlap, the produced internal
                array can be large, especially if `sub_trajectory_len` is
                large. This is not the most memory-efficient solution, but it
                is sufficient if your problem easily fits into memory.
                Consider replacing this class with a more memory-efficient
                implementation if you run into memory issues.
        """
        if do_sub_stacking:
            # return shape is (num_samples, num_stacks, sub_trj_len, ...)
            stacked_sub_trajectories = jax.vmap(
                stack_sub_trajectories,
                in_axes=(0, None),
            )(data_trajectories, sub_trajectory_len)
        else:
            # shape is (num_samples, 1, sub_trj_len, ...)
            stacked_sub_trajectories = jtu.tree_map(
                lambda x: x[:, None, :sub_trajectory_len], data_trajectories
            )

        # Merge the two batch axes (num_samples & num_stacks) into (num_total_samples)
        # resulting shape is (num_total_samples, sub_trj_len, ...)
        sub_trajecories = jtu.tree_map(jnp.concatenate, stacked_sub_trajectories)

        if only_store_ic:
            # changes shape to (num_total_samples, 1, ...)
            sub_trajecories = jtu.tree_map(lambda x: x[:, 0:1], sub_trajecories)

        num_total_samples = jtu.tree_map(lambda x: x.shape[0], (sub_trajecories,))[0]

        self.num_total_samples = num_total_samples
        self.data_sub_trajectories = sub_trajecories

    def __call__(
        self,
        indices: slice,
    ) -> PyTree[Float[Array, "len(indices) sub_trj_len ..."]]:
        """
        Slice out sub-samples based on the given indices.

        **Arguments:**

        - `indices`: The indices used to slice out the sub-trajectories. This
            can be a list like `[0, 4, 5]` to select the zeroth, fourth, and
            fifth sub-trajectories, or a `slice` object.

        **Returns:**

        - `PyTree[Float[Array, "len(indices) sub_trj_len ..."]]`: The sliced
            sub-trajectories.
        """
        return jtu.tree_map(lambda x: x[indices], self.data_sub_trajectories)
__init__
__init__(
    data_trajectories: PyTree[
        Float[Array, "num_samples trj_len ..."]
    ],
    sub_trajectory_len: int,
    *,
    do_sub_stacking: bool = True,
    only_store_ic: bool = False
)

Slice a batch of trajectories into sub-trajectories.

Useful to create windows of specific length for (unrolled) training methodologies of autoregressive neural emulators.

Arguments:

  • data_trajectories: The batch of trajectories to slice. This must be a PyTree of Arrays that have at least two leading axes: a batch axis and a time axis. For example, the zeroth axis can be associated with multiple initial conditions or constitutive parameters, and the first axis represents all temporal snapshots. The PyTree can also simply be a single array. You can provide additional leaves in the PyTree, e.g., for the corresponding constitutive parameters; make sure that the emulator has the corresponding signature.
  • sub_trajectory_len: The length of the sub-trajectories. This must be less than or equal to the length of the trajectories (trj_len). For unrolled training with t steps, set this to t+1 to include the necessary initial condition.
  • do_sub_stacking: Whether to slice out all possible (overlapping) windows out of the trj_len or just slice the trj_len axis from 0:sub_trajectory_len.
  • only_store_ic: Whether to only store the initial condition of the sub-trajectories. This can be helpful for configurations that do not need the reference trajectory like residuum-based learning strategies.

Info

  • Since the sliced-out windows overlap, the produced internal array can be large, especially if sub_trajectory_len is large. This is not the most memory-efficient solution, but it is sufficient if your problem easily fits into memory. Consider replacing this class with a more memory-efficient implementation if you run into memory issues.
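
A minimal usage sketch (the array shape and numbers are illustrative only), assuming the stride-1 overlapping windows described above:

import jax.numpy as jnp
import trainax

# Hypothetical toy data: 10 trajectories, 51 snapshots each, 1 channel, 32 spatial points
data = jnp.zeros((10, 51, 1, 32))

# Window length 3 = one initial condition + two unrolled steps
sub_stacker = trainax.TrajectorySubStacker(data, sub_trajectory_len=3)

# Each trajectory yields 51 - 3 + 1 = 49 overlapping windows -> 490 in total
print(sub_stacker.num_total_samples)            # 490
print(sub_stacker.data_sub_trajectories.shape)  # (490, 3, 1, 32)
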
Source code in trainax/_mixer.py
def __init__(
    self,
    data_trajectories: PyTree[Float[Array, "num_samples trj_len ..."]],
    sub_trajectory_len: int,
    *,
    do_sub_stacking: bool = True,
    only_store_ic: bool = False,
):
    """
    Slice a batch of trajectories into sub-trajectories.

    Useful to create windows of specific length for (unrolled) training
    methodologies of autoregressive neural emulators.

    **Arguments:**

    - `data_trajectories`: The batch of trajectories to slice. This must be
        a PyTree of Arrays that have at least two leading axes: a batch axis
        and a time axis. For example, the zeroth axis can be associated with
        multiple initial conditions or constitutive parameters, and the first
        axis represents all temporal snapshots. The PyTree can also simply be
        a single array. You can provide additional leaves in the PyTree,
        e.g., for the corresponding constitutive parameters; make sure that
        the emulator has the corresponding signature.
    - `sub_trajectory_len`: The length of the sub-trajectories. This must
        be less than or equal to the length of the trajectories (`trj_len`).
        For unrolled training with `t` steps, set this to `t+1` to include
        the necessary initial condition.
    - `do_sub_stacking`: Whether to slice out all possible
        (overlapping) windows out of the `trj_len` or just slice the
        `trj_len` axis from `0:sub_trajectory_len`.
    - `only_store_ic`: Whether to only store the initial
        condition of the sub-trajectories. This can be helpful for
        configurations that do not need the reference trajectory like
        residuum-based learning strategies.

    !!! info
        * Since the sliced-out windows overlap, the produced internal array
            can be large, especially if `sub_trajectory_len` is large. This
            is not the most memory-efficient solution, but it is sufficient
            if your problem easily fits into memory. Consider replacing this
            class with a more memory-efficient implementation if you run
            into memory issues.
    """
    if do_sub_stacking:
        # return shape is (num_samples, num_stacks, sub_trj_len, ...)
        stacked_sub_trajectories = jax.vmap(
            stack_sub_trajectories,
            in_axes=(0, None),
        )(data_trajectories, sub_trajectory_len)
    else:
        # shape is (num_samples, 1, sub_trj_len, ...)
        stacked_sub_trajectories = jtu.tree_map(
            lambda x: x[:, None, :sub_trajectory_len], data_trajectories
        )

    # Merge the two batch axes (num_samples & num_stacks) into (num_total_samples)
    # resulting shape is (num_total_samples, sub_trj_len, ...)
    sub_trajecories = jtu.tree_map(jnp.concatenate, stacked_sub_trajectories)

    if only_store_ic:
        # changes shape to (num_total_samples, 1, ...)
        sub_trajecories = jtu.tree_map(lambda x: x[:, 0:1], sub_trajecories)

    num_total_samples = jtu.tree_map(lambda x: x.shape[0], (sub_trajecories,))[0]

    self.num_total_samples = num_total_samples
    self.data_sub_trajectories = sub_trajecories
__call__
__call__(
    indices: slice,
) -> PyTree[Float[Array, "len(indices) sub_trj_len ..."]]

Slice out sub-samples based on the given indices.

Arguments:

  • indices: The indices used to slice out the sub-trajectories. This can be a list like [0, 4, 5] to select the zeroth, fourth, and fifth sub-trajectories, or a slice object.

Returns:

  • PyTree[Float[Array, "len(indices) sub_trj_len ..."]]: The sliced sub-trajectories.
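
A brief sketch of indexing into a TrajectorySubStacker (hypothetical toy shapes); both an integer index array and a plain Python slice work, since each leaf is simply indexed with whatever is passed:

import jax.numpy as jnp
import trainax

data = jnp.zeros((10, 51, 1, 32))  # hypothetical toy batch of trajectories
sub_stacker = trainax.TrajectorySubStacker(data, sub_trajectory_len=3)

# Fancy indexing with an integer array ...
print(sub_stacker(jnp.array([0, 4, 5])).shape)  # (3, 3, 1, 32)

# ... or a contiguous slice
print(sub_stacker(slice(0, 10)).shape)          # (10, 3, 1, 32)
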
Source code in trainax/_mixer.py
def __call__(
    self,
    indices: slice,
) -> PyTree[Float[Array, "len(indices) sub_trj_len ..."]]:
    """
    Slice out sub-samples based on the given indices.

    **Arguments:**

    - `indices`: The indices used to slice out the sub-trajectories. This can
        be a list like `[0, 4, 5]` to select the zeroth, fourth, and fifth
        sub-trajectories, or a `slice` object.

    **Returns:**

    - `PyTree[Float[Array, "len(indices) sub_trj_len ..."]]`: The sliced
        sub-trajectories.
    """
    return jtu.tree_map(lambda x: x[indices], self.data_sub_trajectories)

trainax.PermutationMixer

Bases: Module

Source code in trainax/_mixer.py
class PermutationMixer(eqx.Module):
    num_total_samples: int
    num_minibatches: int
    batch_size: int
    num_minibatches_per_epoch: int
    num_epochs: int

    permutations: Array

    def __init__(
        self,
        num_total_samples: int,
        num_minibatches: int,
        batch_size: int,
        shuffle_key: PRNGKeyArray,
    ):
        """
        Precompute permuations for a given number of minibatches within a
        dataset. Automatically determines the number of necessary epochs (runs
        over the entire dataset). Upon calling returns a collection of indices
        to produce a new minibatch.

        If the remainder minibatch in one epoch is smaller than the batch size,
        it will **not** be extended using data from the next epoch, but returned
        as smaller list of indices.

        **Arguments:**

        - `num_total_samples`: The total number of samples in the dataset.
        - `num_minibatches`: The total number of minibatches to train on,
            i.e., the number of update steps.
        - `batch_size`: The size of the minibatches.
        - `shuffle_key`: The key to create the permutation; needed for
            deterministic reproducibility.

        !!! warning
            If the batch size is larger than the total number of samples, a
            notice is printed and full-batch training is performed instead.
        """
        if num_total_samples < batch_size:
            print(
                f"batch size {batch_size} is larger than the total number of samples {num_total_samples}"
            )
            print("Performing full batch training")
            effective_batch_size = num_total_samples
        else:
            effective_batch_size = batch_size

        self.num_total_samples = num_total_samples
        self.num_minibatches = num_minibatches
        self.num_minibatches_per_epoch = int(
            jnp.ceil(num_total_samples / effective_batch_size)
        )
        self.num_epochs = int(
            jnp.ceil(num_minibatches / self.num_minibatches_per_epoch)
        )
        self.batch_size = effective_batch_size

        # Precompute the permutations
        _, self.permutations = jax.lax.scan(
            lambda key, _: (
                jax.random.split(key)[0],
                jax.random.permutation(key, num_total_samples),
            ),
            shuffle_key,
            None,
            length=self.num_epochs,
        )

    def __call__(
        self,
        i: int,
        *,
        return_info: bool = False,
    ) -> Int[Array, "batch_size"]:
        """
        Given the batch index `i`, return the corresponding indices to slice out
        the minibatch.

        **Arguments:**

        - `i`: The batch index.
        - `return_info`: Whether to return additional information about the
            current epoch and batch index.

        **Returns:**

        - The indices to slice out the minibatch, in the form of an array of
            integers.

        !!! warning
            ValueError: If the batch index is larger than or equal to the
                number of minibatches (because there will likely be no
                permutation for it).
        """
        if i >= self.num_minibatches:
            raise ValueError("Batch index out of range")

        epoch_i = i // self.num_minibatches_per_epoch
        batch_i = i % self.num_minibatches_per_epoch

        batch_start = batch_i * self.batch_size
        batch_end = min((batch_i + 1) * self.batch_size, self.num_total_samples)

        batch_indices = self.permutations[epoch_i, batch_start:batch_end]

        if return_info:
            return batch_indices, (epoch_i, batch_i)
        else:
            return batch_indices
__init__
__init__(
    num_total_samples: int,
    num_minibatches: int,
    batch_size: int,
    shuffle_key: PRNGKeyArray,
)

Precompute permutations for a given number of minibatches within a dataset. Automatically determines the number of necessary epochs (runs over the entire dataset). When called, it returns a collection of indices that produce a new minibatch.

If the remainder minibatch in one epoch is smaller than the batch size, it will not be extended using data from the next epoch, but returned as a smaller list of indices.

Arguments:

  • num_total_samples: The total number of samples in the dataset.
  • num_minibatches: The total number of minibatches to train on, i.e., the number of update steps.
  • batch_size: The size of the minibatches.
  • shuffle_key: The key to create the permutation; needed for deterministic reproducibility.

Warning

If the batch size is larger than the total number of samples, a notice is printed and full-batch training is performed instead.
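
A minimal sketch of setting up a PermutationMixer (all numbers are made up for illustration); the derived attributes follow from the ceiling divisions in the constructor shown below:

import jax
import trainax

mixer = trainax.PermutationMixer(
    num_total_samples=490,  # e.g., taken from TrajectorySubStacker.num_total_samples
    num_minibatches=200,    # total number of update steps to draw
    batch_size=32,
    shuffle_key=jax.random.PRNGKey(0),
)

print(mixer.num_minibatches_per_epoch)  # ceil(490 / 32) = 16
print(mixer.num_epochs)                 # ceil(200 / 16) = 13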

Source code in trainax/_mixer.py
def __init__(
    self,
    num_total_samples: int,
    num_minibatches: int,
    batch_size: int,
    shuffle_key: PRNGKeyArray,
):
    """
    Precompute permuations for a given number of minibatches within a
    dataset. Automatically determines the number of necessary epochs (runs
    over the entire dataset). Upon calling returns a collection of indices
    to produce a new minibatch.

    If the remainder minibatch in one epoch is smaller than the batch size,
    it will **not** be extended using data from the next epoch, but returned
    as smaller list of indices.

    **Arguments:**

    - `num_total_samples`: The total number of samples in the dataset.
    - `num_minibatches`: The total number of minibatches to train on, i.e.,
        the number of update steps.
    - `batch_size`: The size of the minibatches.
    - `shuffle_key`: The key to create the permutation; needed for
        deterministic reproducibility.

    !!! warning
        If the batch size is larger than the total number of samples, a
        notice is printed and full-batch training is performed instead.
    """
    if num_total_samples < batch_size:
        print(
            f"batch size {batch_size} is larger than the total number of samples {num_total_samples}"
        )
        print("Performing full batch training")
        effective_batch_size = num_total_samples
    else:
        effective_batch_size = batch_size

    self.num_total_samples = num_total_samples
    self.num_minibatches = num_minibatches
    self.num_minibatches_per_epoch = int(
        jnp.ceil(num_total_samples / effective_batch_size)
    )
    self.num_epochs = int(
        jnp.ceil(num_minibatches / self.num_minibatches_per_epoch)
    )
    self.batch_size = effective_batch_size

    # Precompute the permutations
    _, self.permutations = jax.lax.scan(
        lambda key, _: (
            jax.random.split(key)[0],
            jax.random.permutation(key, num_total_samples),
        ),
        shuffle_key,
        None,
        length=self.num_epochs,
    )
__call__
__call__(
    i: int, *, return_info: bool = False
) -> Int[Array, "batch_size"]

Given the batch index i, return the corresponding indices to slice out the minibatch.

Arguments:

  • i: The batch index.
  • return_info: Whether to return additional information about the current epoch and batch index.

Returns:

  • The indices to slice out the minibatch, in the form of an array of integers.

Warning

ValueError: If the batch index is larger than or equal to the number of minibatches (because there will likely be no permutation for it).
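
A sketch of how PermutationMixer and TrajectorySubStacker are typically combined into a simple data-loading loop (shapes and hyperparameters are hypothetical; the model/optimizer update is omitted):

import jax
import jax.numpy as jnp
import trainax

data = jnp.zeros((10, 51, 1, 32))  # hypothetical toy batch of trajectories
sub_stacker = trainax.TrajectorySubStacker(data, sub_trajectory_len=3)
mixer = trainax.PermutationMixer(
    num_total_samples=sub_stacker.num_total_samples,
    num_minibatches=100,
    batch_size=32,
    shuffle_key=jax.random.PRNGKey(42),
)

for i in range(mixer.num_minibatches):
    batch_indices, (epoch_i, batch_i) = mixer(i, return_info=True)
    minibatch = sub_stacker(batch_indices)  # leading axis is at most batch_size
    # ... feed `minibatch` into the loss/update step of your training loop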

Source code in trainax/_mixer.py
def __call__(
    self,
    i: int,
    *,
    return_info: bool = False,
) -> Int[Array, "batch_size"]:
    """
    Given the batch index `i`, return the corresponding indices to slice out
    the minibatch.

    **Arguments:**

    - `i`: The batch index.
    - `return_info`: Whether to return additional information about the
        current epoch and batch index.

    **Returns:**

    - The indices to slice out the minibatch, in the form of an array
        of integers.

    !!! warning
        ValueError: If the batch index is larger than or equal to the number
            of minibatches (because there will likely be no permutation for
            it).
    """
    if i >= self.num_minibatches:
        raise ValueError("Batch index out of range")

    epoch_i = i // self.num_minibatches_per_epoch
    batch_i = i % self.num_minibatches_per_epoch

    batch_start = batch_i * self.batch_size
    batch_end = min((batch_i + 1) * self.batch_size, self.num_total_samples)

    batch_indices = self.permutations[epoch_i, batch_start:batch_end]

    if return_info:
        return batch_indices, (epoch_i, batch_i)
    else:
        return batch_indices