`torchebm.samplers.langevin_dynamics` ¶

Langevin Dynamics Sampler Module.

`LangevinDynamics` ¶

Bases: BaseSampler

Langevin Dynamics sampler.

Update rule:

\[ x_{t+1} = x_t - \eta \nabla_x U(x_t) + \sqrt{2\eta} \epsilon_t \]

Parameters:

Name	Type	Description	Default
`model`	`BaseModel`	Energy-based model to sample from.	required
`step_size`	`Union[float, BaseScheduler]`	Step size for gradient descent. Float or `BaseScheduler`.	`0.001`
`noise_scale`	`Union[float, BaseScheduler]`	Scale of Gaussian noise injection. Float or `BaseScheduler`.	`1.0`
`decay`	`float`	Damping coefficient. Not currently supported: the value is stored on the sampler but is not used by `sample`.	`0.0`
`clamp`	`Optional[Tuple[float, float]]`	Optional (min, max) bounds applied to the state after every step. Standard stabilization for image-space EBMs (e.g. [-1, 1]).	`None`
`dtype`	`dtype`	Data type for computations.	`float32`
`device`	`Optional[Union[str, device]]`	Device for computations.	`None`
`integrator`	`Union[str, BaseSDERungeKuttaIntegrator, None]`	SDE integrator used for the update. `None` (default) uses `EulerMaruyamaIntegrator`; a registry name (e.g. `"heun"`) constructs that integrator with defaults; a `BaseSDERungeKuttaIntegrator` instance is used as-is and must match the sampler's device/dtype.	`None`

Example

import torch
from torchebm.core import DoubleWellModel
from torchebm.samplers import LangevinDynamics

# Energy model the sampler draws from.
target_model = DoubleWellModel()
# Fixed step size and unit noise scale (both may also be schedulers).
sampler = LangevinDynamics(model=target_model, step_size=0.01, noise_scale=1.0)
# 100 parallel chains over a 2-dimensional state, 500 Langevin steps each.
samples = sampler.sample(dim=2, n_steps=500, n_samples=100)

Source code in torchebm/samplers/langevin_dynamics.py

class LangevinDynamics(BaseSampler):
    r"""
    Langevin Dynamics sampler.

    Update rule:

    \[
    x_{t+1} = x_t - \eta \nabla_x U(x_t) + \sqrt{2\eta} \epsilon_t
    \]

    Args:
        model: Energy-based model to sample from.
        step_size: Step size for gradient descent. Float or `BaseScheduler`.
        noise_scale: Scale of Gaussian noise injection. Float or `BaseScheduler`.
        decay: Damping coefficient (not supported). The value is stored on
            the instance but is not read by `sample`.
        clamp: Optional (min, max) bounds applied to the state after every
            step. Standard stabilization for image-space EBMs (e.g. [-1, 1]).
        dtype: Data type for computations.
        device: Device for computations.
        integrator: SDE integrator used for the update. `None` (default)
            uses `EulerMaruyamaIntegrator`; a registry name (e.g.
            `"heun"`) constructs that integrator with defaults; a
            `BaseSDERungeKuttaIntegrator` instance is used as-is and must
            match the sampler's device/dtype.

    Raises:
        ValueError: If `clamp` is given but is not a two-element
            `(min, max)` pair with `min < max`.

    Example:
        ```python
        from torchebm.samplers import LangevinDynamics
        from torchebm.core import DoubleWellModel
        import torch

        energy = DoubleWellModel()
        sampler = LangevinDynamics(energy, step_size=0.01, noise_scale=1.0)
        samples = sampler.sample(n_samples=100, dim=2, n_steps=500)
        ```
    """

    def __init__(
        self,
        model: BaseModel,
        step_size: Union[float, BaseScheduler] = 1e-3,
        noise_scale: Union[float, BaseScheduler] = 1.0,
        decay: float = 0.0,
        clamp: Optional[Tuple[float, float]] = None,
        dtype: torch.dtype = torch.float32,
        device: Optional[Union[str, torch.device]] = None,
        integrator: Union[str, BaseSDERungeKuttaIntegrator, None] = None,
    ):
        super().__init__(model=model, dtype=dtype, device=device)

        # Registered under the names that `sample` later reads back through
        # `get_scheduled_value`, so floats and schedulers are handled alike.
        self._register_param("step_size", step_size, positive=True)
        self._register_param("noise_scale", noise_scale, positive=True)

        if clamp is not None:
            # Reject malformed bounds here rather than deep inside the
            # sampling loop, where `clamp_(*self.clamp)` would fail.
            if len(clamp) != 2:
                raise ValueError(f"clamp must be a (min, max) pair, got {clamp}")
            if clamp[0] >= clamp[1]:
                raise ValueError(f"clamp min must be < max, got {clamp}")
        self.clamp = clamp
        # Kept for API compatibility; nothing in this class reads it.
        self.decay = decay
        self.integrator = resolve_integrator(
            integrator,
            default="euler_maruyama",
            family=BaseSDERungeKuttaIntegrator,
            owner="LangevinDynamics",
            device=self.device,
            dtype=self.dtype,
        )

    @torch.no_grad()
    def sample(
        self,
        x: Optional[torch.Tensor] = None,
        dim: Optional[Union[int, Tuple[int, ...]]] = None,
        n_steps: int = 100,
        n_samples: int = 1,
        thin: int = 1,
        return_trajectory: bool = False,
        return_diagnostics: bool = False,
        reset_schedulers: bool = True,
        *,
        model_kwargs: Optional[Dict[str, Any]] = None,
        generator: Optional[torch.Generator] = None,
    ) -> Union[torch.Tensor, Tuple[torch.Tensor, Dict[str, torch.Tensor]]]:
        r"""Generate samples via Langevin dynamics.

        Args:
            x: Initial state. If `None`, samples from `N(0, I)`.
            dim: State dimension (int) or shape (tuple), used when `x is None`.
            n_steps: Number of MCMC steps to perform. Must be `>= 0`; with
                `0` the initial state is returned without any update.
            n_samples: Number of parallel chains to generate.
            thin: Keep every `thin`-th sample. Final stored length is
                `n_steps // thin`. Must be `>= 1`.
            return_trajectory: If True, return the full kept trajectory of shape
                `[n_samples, n_steps // thin, *data_shape]`.
            return_diagnostics: If True, also return a dict with keys
                ``"mean"`` (`[n_kept, *data_shape]`), ``"var"``
                (`[n_kept, *data_shape]`), and ``"energy"`` (`[n_kept]`).
            reset_schedulers: If True (default), reset registered schedulers.
            model_kwargs: Conditioning arguments (e.g. class labels) forwarded to
                the model at every step. Normalized to the sampler device once at
                entry; ``None`` (default) is the exact unconditional path.
            generator: RNG for the initial state and the per-step Langevin
                noise; the global RNG when ``None``.

        Returns:
            Sample tensor (or trajectory if `return_trajectory=True`),
            optionally paired with the diagnostics dict.

        Raises:
            ValueError: If `thin < 1`, if `n_steps < 0`, or if `x` and `dim`
                are both `None`.
        """
        # Validate before touching scheduler state so a bad call has no
        # side effects.
        if thin < 1:
            raise ValueError("thin must be >= 1")
        if n_steps < 0:
            raise ValueError(f"n_steps must be >= 0, got {n_steps}")
        if reset_schedulers:
            self.reset_schedulers()

        x = self._init_state(x, dim, n_samples, generator)
        model_kwargs = self._prepare_model_kwargs(model_kwargs)
        # The chain count is taken from the initialised state, which wins
        # over the `n_samples` argument when `x` was supplied.
        n_samples = x.shape[0]
        data_shape = x.shape[1:]
        n_kept = n_steps // thin

        trajectory: Optional[torch.Tensor] = None
        if return_trajectory:
            trajectory = torch.empty(
                (n_samples, n_kept, *data_shape), dtype=self.dtype, device=self.device
            )

        diagnostics: Optional[Dict[str, torch.Tensor]] = None
        if return_diagnostics:
            diagnostics = {
                "mean": torch.empty(
                    n_kept, *data_shape, dtype=self.dtype, device=self.device
                ),
                "var": torch.empty(
                    n_kept, *data_shape, dtype=self.dtype, device=self.device
                ),
                "energy": torch.empty(n_kept, dtype=self.dtype, device=self.device),
            }

        def drift(x_: torch.Tensor, t_: Any) -> torch.Tensor:
            # Langevin drift is the negative energy gradient; the time
            # argument is part of the integrator's drift signature but unused.
            return -self._model_gradient(x_, model_kwargs)

        keep_idx = 0
        with self.autocast_context():
            for step in range(1, n_steps + 1):
                x = self.integrator.step(
                    state={"x": x},
                    step_size=self.get_scheduled_value("step_size"),
                    noise_scale=self.get_scheduled_value("noise_scale"),
                    drift=drift,
                    generator=generator,
                )["x"]
                if self.clamp is not None:
                    x = x.clamp_(*self.clamp)
                self.step_schedulers()

                # Only every `thin`-th state is recorded.
                if step % thin != 0:
                    continue

                if return_trajectory:
                    trajectory[:, keep_idx] = x
                if return_diagnostics:
                    if n_samples > 1:
                        diagnostics["mean"][keep_idx] = x.mean(dim=0)
                        # Population variance across chains, bounded to
                        # [1e-10, 1e10] before it is stored.
                        diagnostics["var"][keep_idx] = x.var(
                            dim=0, unbiased=False
                        ).clamp_(min=1e-10, max=1e10)
                    else:
                        # A single chain has no cross-chain spread: the mean
                        # is the state itself and the variance is zero.
                        diagnostics["mean"][keep_idx] = x.squeeze(0)
                        diagnostics["var"][keep_idx].zero_()
                    diagnostics["energy"][keep_idx] = self._model_energy(
                        x, model_kwargs
                    ).mean()
                keep_idx += 1

        output = trajectory if return_trajectory else x
        return (output, diagnostics) if return_diagnostics else output

`sample(x=None, dim=None, n_steps=100, n_samples=1, thin=1, return_trajectory=False, return_diagnostics=False, reset_schedulers=True, *, model_kwargs=None, generator=None)` ¶

Generate samples via Langevin dynamics.

Parameters:

Name	Type	Description	Default
`x`	`Optional[Tensor]`	Initial state. If `None`, samples from `N(0, I)`.	`None`
`dim`	`Optional[Union[int, Tuple[int, ...]]]`	State dimension (int) or shape (tuple), used when `x is None`.	`None`
`n_steps`	`int`	Number of MCMC steps to perform.	`100`
`n_samples`	`int`	Number of parallel chains to generate.	`1`
`thin`	`int`	Keep every `thin`-th sample. Final stored length is `n_steps // thin`. Must be `>= 1`.	`1`
`return_trajectory`	`bool`	If True, return the full kept trajectory of shape `[n_samples, n_steps // thin, *data_shape]`.	`False`
`return_diagnostics`	`bool`	If True, also return a dict with keys `"mean"` (`[n_kept, *data_shape]`), `"var"` (`[n_kept, *data_shape]`), and `"energy"` (`[n_kept]`).	`False`
`reset_schedulers`	`bool`	If True (default), reset registered schedulers.	`True`
`model_kwargs`	`Optional[Dict[str, Any]]`	Conditioning arguments (e.g. class labels) forwarded to the model at every step. Normalized to the sampler device once at entry; `None` (default) is the exact unconditional path.	`None`
`generator`	`Optional[Generator]`	RNG for the initial state and the per-step Langevin noise; the global RNG when `None`.	`None`

Returns:

Type	Description
`Union[Tensor, Tuple[Tensor, Dict[str, Tensor]]]`	Sample tensor (or trajectory if `return_trajectory=True`), optionally paired with the diagnostics dict.

Raises:

Type	Description
`ValueError`	If `thin < 1`, or if `x` and `dim` are both `None`.

Source code in torchebm/samplers/langevin_dynamics.py

@torch.no_grad()
def sample(
    self,
    x: Optional[torch.Tensor] = None,
    dim: Optional[Union[int, Tuple[int, ...]]] = None,
    n_steps: int = 100,
    n_samples: int = 1,
    thin: int = 1,
    return_trajectory: bool = False,
    return_diagnostics: bool = False,
    reset_schedulers: bool = True,
    *,
    model_kwargs: Optional[Dict[str, Any]] = None,
    generator: Optional[torch.Generator] = None,
) -> Union[torch.Tensor, Tuple[torch.Tensor, Dict[str, torch.Tensor]]]:
    r"""Generate samples via Langevin dynamics.

    Args:
        x: Initial state. If `None`, samples from `N(0, I)`.
        dim: State dimension (int) or shape (tuple), used when `x is None`.
        n_steps: Number of MCMC steps to perform. Must be `>= 0`; with `0`
            the initial state is returned without any update.
        n_samples: Number of parallel chains to generate.
        thin: Keep every `thin`-th sample. Final stored length is
            `n_steps // thin`. Must be `>= 1`.
        return_trajectory: If True, return the full kept trajectory of shape
            `[n_samples, n_steps // thin, *data_shape]`.
        return_diagnostics: If True, also return a dict with keys
            ``"mean"`` (`[n_kept, *data_shape]`), ``"var"``
            (`[n_kept, *data_shape]`), and ``"energy"`` (`[n_kept]`).
        reset_schedulers: If True (default), reset registered schedulers.
        model_kwargs: Conditioning arguments (e.g. class labels) forwarded to
            the model at every step. Normalized to the sampler device once at
            entry; ``None`` (default) is the exact unconditional path.
        generator: RNG for the initial state and the per-step Langevin
            noise; the global RNG when ``None``.

    Returns:
        Sample tensor (or trajectory if `return_trajectory=True`),
        optionally paired with the diagnostics dict.

    Raises:
        ValueError: If `thin < 1`, if `n_steps < 0`, or if `x` and `dim` are
            both `None`.
    """
    # Validate before touching scheduler state so a bad call has no side
    # effects.
    if thin < 1:
        raise ValueError("thin must be >= 1")
    if n_steps < 0:
        raise ValueError(f"n_steps must be >= 0, got {n_steps}")
    if reset_schedulers:
        self.reset_schedulers()

    x = self._init_state(x, dim, n_samples, generator)
    model_kwargs = self._prepare_model_kwargs(model_kwargs)
    # The chain count is taken from the initialised state, which wins over
    # the `n_samples` argument when `x` was supplied.
    n_samples = x.shape[0]
    data_shape = x.shape[1:]
    n_kept = n_steps // thin

    trajectory: Optional[torch.Tensor] = None
    if return_trajectory:
        trajectory = torch.empty(
            (n_samples, n_kept, *data_shape), dtype=self.dtype, device=self.device
        )

    diagnostics: Optional[Dict[str, torch.Tensor]] = None
    if return_diagnostics:
        diagnostics = {
            "mean": torch.empty(
                n_kept, *data_shape, dtype=self.dtype, device=self.device
            ),
            "var": torch.empty(
                n_kept, *data_shape, dtype=self.dtype, device=self.device
            ),
            "energy": torch.empty(n_kept, dtype=self.dtype, device=self.device),
        }

    def drift(x_: torch.Tensor, t_: Any) -> torch.Tensor:
        # Langevin drift is the negative energy gradient; the time argument
        # is part of the integrator's drift signature but unused here.
        return -self._model_gradient(x_, model_kwargs)

    keep_idx = 0
    with self.autocast_context():
        for step in range(1, n_steps + 1):
            x = self.integrator.step(
                state={"x": x},
                step_size=self.get_scheduled_value("step_size"),
                noise_scale=self.get_scheduled_value("noise_scale"),
                drift=drift,
                generator=generator,
            )["x"]
            if self.clamp is not None:
                x = x.clamp_(*self.clamp)
            self.step_schedulers()

            # Only every `thin`-th state is recorded.
            if step % thin != 0:
                continue

            if return_trajectory:
                trajectory[:, keep_idx] = x
            if return_diagnostics:
                if n_samples > 1:
                    diagnostics["mean"][keep_idx] = x.mean(dim=0)
                    # Population variance across chains, bounded to
                    # [1e-10, 1e10] before it is stored.
                    diagnostics["var"][keep_idx] = x.var(
                        dim=0, unbiased=False
                    ).clamp_(min=1e-10, max=1e10)
                else:
                    # A single chain has no cross-chain spread: the mean is
                    # the state itself and the variance is zero.
                    diagnostics["mean"][keep_idx] = x.squeeze(0)
                    diagnostics["var"][keep_idx].zero_()
                diagnostics["energy"][keep_idx] = self._model_energy(
                    x, model_kwargs
                ).mean()
            keep_idx += 1

    output = trajectory if return_trajectory else x
    return (output, diagnostics) if return_diagnostics else output

torchebm.samplers.langevin_dynamics ¶

LangevinDynamics ¶

sample(x=None, dim=None, n_steps=100, n_samples=1, thin=1, return_trajectory=False, return_diagnostics=False, reset_schedulers=True, *, model_kwargs=None, generator=None) ¶

`torchebm.samplers.langevin_dynamics` ¶

`LangevinDynamics` ¶

`sample(x=None, dim=None, n_steps=100, n_samples=1, thin=1, return_trajectory=False, return_diagnostics=False, reset_schedulers=True, *, model_kwargs=None, generator=None)` ¶