Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
3 changes: 3 additions & 0 deletions rbms/ising_gaussian/__init__.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,3 @@
# ruff: noqa
from rbms.ising_gaussian.classes import IGRBM
from rbms.ising_gaussian.functional import *
239 changes: 239 additions & 0 deletions rbms/ising_gaussian/classes.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,239 @@
from typing import List, Optional

import numpy as np
import torch
from torch import Tensor

from rbms.ising_gaussian.implement import (
_compute_energy,
_compute_energy_hiddens,
_compute_energy_visibles,
_compute_gradient,
_init_chains,
_init_parameters,
_sample_hiddens,
_sample_visibles,
)
from rbms.classes import RBM


class IGRBM(RBM):
    """Ising-Gaussian RBM: ±1 (Ising) visible units and Gaussian hidden units
    with fixed variance 1/Nv, with no extra bias terms beyond ``vbias``/``hbias``.

    All parameters are kept on a single ``device``/``dtype``. ``const`` caches
    the log-normalization constant of the Gaussian hidden units.
    """

    def __init__(
        self,
        weight_matrix: Tensor,
        vbias: Tensor,
        hbias: Tensor,
        device: Optional[torch.device] = None,
        dtype: Optional[torch.dtype] = None,
    ):
        """Store parameters, moving them to a common device/dtype.

        Args:
            weight_matrix: visible-hidden coupling matrix
                (assumed shape (num_visibles, num_hiddens) — TODO confirm
                against rbms.ising_gaussian.implement).
            vbias: visible bias vector.
            hbias: hidden bias vector.
            device: target device; defaults to ``weight_matrix.device``.
            dtype: target dtype; defaults to ``weight_matrix.dtype``.
        """
        if device is None:
            device = weight_matrix.device
        if dtype is None:
            dtype = weight_matrix.dtype
        self.device, self.dtype = device, dtype

        self.weight_matrix = weight_matrix.to(device=self.device, dtype=self.dtype)
        self.vbias = vbias.to(device=self.device, dtype=self.dtype)
        self.hbias = hbias.to(device=self.device, dtype=self.dtype)

        # Gaussian-hidden log-normalization constant:
        #   0.5 * K * (log(Nv) - log(2*pi))
        # which is the negative of ref_log_z()'s log_norm term below.
        # BUG FIX: the original read float(weight_matrix[1]) / float(weight_matrix[0]),
        # i.e. tensor *rows*, which raises in float() whenever a row has more
        # than one element; the matrix *sizes* (shape) were clearly intended.
        num_vis, num_hid = self.weight_matrix.shape
        log_two_pi = torch.log(torch.tensor(2.0 * torch.pi, dtype=dtype, device=device))
        self.const = (
            0.5
            * float(num_hid)
            * (
                torch.log(torch.tensor(float(num_vis), dtype=dtype, device=device))
                - log_two_pi
            )
        )
        self.name = "IGRBM"

    def __add__(self, other):
        """Element-wise sum of parameters; ``other`` must be another IGRBM."""
        return IGRBM(
            weight_matrix=self.weight_matrix + other.weight_matrix,
            vbias=self.vbias + other.vbias,
            hbias=self.hbias + other.hbias,
            device=self.device,
            dtype=self.dtype,
        )

    def __mul__(self, other):
        """Scale every parameter by the scalar ``other``."""
        return IGRBM(
            weight_matrix=self.weight_matrix * other,
            vbias=self.vbias * other,
            hbias=self.hbias * other,
            device=self.device,
            dtype=self.dtype,
        )

    def clone(
        self, device: Optional[torch.device] = None, dtype: Optional[torch.dtype] = None
    ):
        """Deep-copy the parameters, optionally moving them to device/dtype."""
        if device is None:
            device = self.device
        if dtype is None:
            dtype = self.dtype
        return IGRBM(
            weight_matrix=self.weight_matrix.clone(),
            vbias=self.vbias.clone(),
            hbias=self.hbias.clone(),
            device=device,
            dtype=dtype,
        )

    def compute_energy(self, v: Tensor, h: Tensor) -> Tensor:
        """Joint energy E(v, h); delegates to the low-level kernel."""
        return _compute_energy(
            v=v, h=h, vbias=self.vbias, hbias=self.hbias, weight_matrix=self.weight_matrix
        )

    def compute_energy_hiddens(self, h: Tensor) -> Tensor:
        """Marginal energy of hidden configurations h."""
        return _compute_energy_hiddens(
            h=h, vbias=self.vbias, hbias=self.hbias, weight_matrix=self.weight_matrix
        )

    def compute_energy_visibles(self, v: Tensor) -> Tensor:
        """Marginal energy of visible configurations v."""
        return _compute_energy_visibles(
            v=v, vbias=self.vbias, hbias=self.hbias, weight_matrix=self.weight_matrix
        )

    def compute_gradient(self, data, chains, centered=True, lambda_l1=0.0, lambda_l2=0.0):
        """Accumulate the (data - chains) gradient on the parameters in place.

        NOTE(review): functional.compute_gradient in this same package passes
        ``mh_data=data["hidden_mag"]`` and ``h_chain=chains["hidden"]`` while
        this method passes ``h_data=...`` and ``h_chain=chains["hidden_mag"]``;
        at most one of the two call sites can match _compute_gradient's
        signature — confirm against implement.py.
        """
        _compute_gradient(
            v_data=data["visible"],
            h_data=data["hidden_mag"],
            w_data=data["weights"],
            v_chain=chains["visible"],
            h_chain=chains["hidden_mag"],
            w_chain=chains["weights"],
            vbias=self.vbias,
            hbias=self.hbias,
            weight_matrix=self.weight_matrix,
            centered=centered,
            lambda_l1=lambda_l1,
            lambda_l2=lambda_l2,
        )

    def independent_model(self):
        """Zero-coupling model keeping only the visible bias.

        NOTE(review): ``vbias`` is shared (not cloned) with ``self`` — in-place
        edits on either object would leak into the other; confirm intended.
        """
        return IGRBM(
            weight_matrix=torch.zeros_like(self.weight_matrix),
            vbias=self.vbias,
            hbias=torch.zeros_like(self.hbias),
            device=self.device,
            dtype=self.dtype,
        )

    def init_chains(self, num_samples, weights=None, start_v=None):
        """Initialize ``num_samples`` Markov chains; unit weights unless given."""
        visible, hidden, mean_visible, mean_hidden = _init_chains(
            num_samples=num_samples,
            weight_matrix=self.weight_matrix,
            hbias=self.hbias,
            start_v=start_v,
        )
        if weights is None:
            weights = torch.ones(
                visible.shape[0], device=visible.device, dtype=visible.dtype
            )
        return dict(
            visible=visible,
            hidden=hidden,
            visible_mag=mean_visible,
            hidden_mag=mean_hidden,
            weights=weights,
        )

    @staticmethod
    def init_parameters(num_hiddens, dataset, device, dtype, var_init=0.0001):
        """Build an IGRBM whose parameters are initialized from ``dataset``.

        Args:
            num_hiddens: number of hidden units.
            dataset: RBMDataset whose ``.data`` may be a numpy array or tensor.
            device: target device for the parameters.
            dtype: target dtype for the parameters.
            var_init: variance of the initial weights.
        """
        data = dataset.data
        if isinstance(data, np.ndarray):
            data = torch.from_numpy(dataset.data).to(device=device, dtype=dtype)
        vbias, hbias, weight_matrix = _init_parameters(
            num_hiddens=num_hiddens,
            data=data,
            device=device,
            dtype=dtype,
            var_init=var_init,
        )
        return IGRBM(
            weight_matrix=weight_matrix,
            vbias=vbias,
            hbias=hbias,
            device=device,
            dtype=dtype,
        )

    def named_parameters(self):
        """Mapping of parameter name -> live tensor (not copies)."""
        return {
            "weight_matrix": self.weight_matrix,
            "vbias": self.vbias,
            "hbias": self.hbias,
        }

    def num_hiddens(self):
        """Number of hidden units (length of hbias)."""
        return self.hbias.shape[0]

    def num_visibles(self):
        """Number of visible units (length of vbias)."""
        return self.vbias.shape[0]

    def parameters(self) -> List[Tensor]:
        """Parameters as a list: [weight_matrix, vbias, hbias]."""
        return [self.weight_matrix, self.vbias, self.hbias]

    def ref_log_z(self):
        """Log partition function of the independent (zero-coupling) reference model."""
        K = self.num_hiddens()
        Nv = float(self.num_visibles())
        # softplus(x) == log(1 + exp(x)) but does not overflow for large x
        # (the original log1p(exp(.)) returns inf past ~log(float max)).
        logZ_v = torch.nn.functional.softplus(self.vbias).sum()
        quad = 0.5 * torch.dot(self.hbias, self.hbias) / Nv
        log_norm = 0.5 * K * np.log(2.0 * np.pi) - 0.5 * K * np.log(Nv)
        return (logZ_v + quad + log_norm).item()

    def sample_hiddens(self, chains: dict[str, Tensor], beta=1) -> dict[str, Tensor]:
        """Sample h | v for every chain, updating ``chains`` in place."""
        chains["hidden"], chains["hidden_mag"] = _sample_hiddens(
            v=chains["visible"],
            weight_matrix=self.weight_matrix,
            hbias=self.hbias,
            beta=beta,
        )
        return chains

    def sample_visibles(self, chains: dict[str, Tensor], beta=1) -> dict[str, Tensor]:
        """Sample v | h for every chain, updating ``chains`` in place."""
        chains["visible"], chains["visible_mag"] = _sample_visibles(
            h=chains["hidden"],
            weight_matrix=self.weight_matrix,
            vbias=self.vbias,
            beta=beta,
        )
        return chains

    @staticmethod
    def set_named_parameters(named_params: dict[str, Tensor]) -> "IGRBM":
        """Build an IGRBM from a name->tensor dict (consumes the dict via pop).

        Raises:
            ValueError: if a required key is missing or extra keys remain.
        """
        names = ["vbias", "hbias", "weight_matrix"]
        for k in names:
            if k not in named_params:
                raise ValueError(
                    f"""Dictionary params missing key '{k}'\n Provided keys : {named_params.keys()}\n Expected keys: {names}"""
                )
        params = IGRBM(
            weight_matrix=named_params.pop("weight_matrix"),
            vbias=named_params.pop("vbias"),
            hbias=named_params.pop("hbias"),
        )
        if len(named_params) > 0:
            raise ValueError(
                f"Too many keys in params dictionary. Remaining keys: {named_params.keys()}"
            )
        return params

    def to(
        self, device: Optional[torch.device] = None, dtype: Optional[torch.dtype] = None
    ) -> "IGRBM":
        """Move parameters in place to device/dtype and return self."""
        if device is not None:
            self.device = device
        if dtype is not None:
            self.dtype = dtype
        self.weight_matrix = self.weight_matrix.to(device=self.device, dtype=self.dtype)
        self.vbias = self.vbias.to(device=self.device, dtype=self.dtype)
        self.hbias = self.hbias.to(device=self.device, dtype=self.dtype)
        return self
135 changes: 135 additions & 0 deletions rbms/ising_gaussian/functional.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,135 @@
from typing import Optional

import numpy as np
import torch
from torch import Tensor

from rbms.ising_gaussian.classes import IGRBM
from rbms.ising_gaussian.implement import (
_compute_energy,
_compute_energy_hiddens,
_compute_energy_visibles,
_compute_gradient,
_init_chains,
_init_parameters,
_sample_hiddens,
_sample_visibles,
)
from rbms.dataset.dataset_class import RBMDataset


def sample_hiddens(
    chains: dict[str, Tensor], params: IGRBM, beta: float = 1.0
) -> dict[str, Tensor]:
    """Draw new hidden states given the current visibles, updating chains in place."""
    sampled, magnetization = _sample_hiddens(
        v=chains["visible"],
        weight_matrix=params.weight_matrix,
        hbias=params.hbias,
        beta=beta,
    )
    chains["hidden"] = sampled
    chains["hidden_mag"] = magnetization
    return chains


def sample_visibles(
    chains: dict[str, Tensor], params: IGRBM, beta: float = 1.0
) -> dict[str, Tensor]:
    """Draw new visible states given the current hiddens, updating chains in place."""
    sampled, magnetization = _sample_visibles(
        h=chains["hidden"],
        weight_matrix=params.weight_matrix,
        vbias=params.vbias,
        beta=beta,
    )
    chains["visible"] = sampled
    chains["visible_mag"] = magnetization
    return chains


def compute_energy(v: Tensor, h: Tensor, params: IGRBM) -> Tensor:
    """Joint energy E(v, h) under ``params``; thin wrapper over the kernel."""
    w, vb, hb = params.weight_matrix, params.vbias, params.hbias
    return _compute_energy(v=v, h=h, vbias=vb, hbias=hb, weight_matrix=w)


def compute_energy_visibles(v: Tensor, params: IGRBM) -> Tensor:
    """Marginal energy of visible configurations ``v`` under ``params``."""
    w, vb, hb = params.weight_matrix, params.vbias, params.hbias
    return _compute_energy_visibles(v=v, vbias=vb, hbias=hb, weight_matrix=w)


def compute_energy_hiddens(h: Tensor, params: IGRBM) -> Tensor:
    """Marginal energy of hidden configurations ``h`` under ``params``."""
    w, vb, hb = params.weight_matrix, params.vbias, params.hbias
    return _compute_energy_hiddens(h=h, vbias=vb, hbias=hb, weight_matrix=w)


def compute_gradient(
    data: dict[str, Tensor],
    chains: dict[str, Tensor],
    params: IGRBM,
    centered: bool,
    lambda_l1: float = 0.0,
    lambda_l2: float = 0.0,
) -> None:
    """Accumulate the (data - chains) gradient on ``params`` in place."""
    kwargs = {
        "v_data": data["visible"],
        "mh_data": data["hidden_mag"],
        "w_data": data["weights"],
        "v_chain": chains["visible"],
        "h_chain": chains["hidden"],
        "w_chain": chains["weights"],
        "vbias": params.vbias,
        "hbias": params.hbias,
        "weight_matrix": params.weight_matrix,
        "centered": centered,
        "lambda_l1": lambda_l1,
        "lambda_l2": lambda_l2,
    }
    _compute_gradient(**kwargs)


def init_chains(
    num_samples: int,
    params: IGRBM,
    weights: Optional[Tensor] = None,
    start_v: Optional[Tensor] = None,
) -> dict[str, Tensor]:
    """Initialize ``num_samples`` Markov chains from ``params``.

    If ``weights`` is omitted, every chain gets unit weight.
    """
    v, h, v_mean, h_mean = _init_chains(
        num_samples=num_samples,
        weight_matrix=params.weight_matrix,
        hbias=params.hbias,
        start_v=start_v,
    )
    if weights is None:
        weights = torch.ones(v.shape[0], device=v.device, dtype=v.dtype)
    return {
        "visible": v,
        "hidden": h,
        "visible_mag": v_mean,
        "hidden_mag": h_mean,
        "weights": weights,
    }


def init_parameters(
    num_hiddens: int,
    dataset: RBMDataset,
    device: torch.device,
    dtype: torch.dtype,
    var_init: float = 1e-4,
) -> IGRBM:
    """Build an IGRBM whose parameters are initialized from ``dataset``."""
    data = dataset.data
    if isinstance(data, np.ndarray):
        # Datasets may hold numpy arrays; move them to the target device/dtype.
        data = torch.from_numpy(dataset.data).to(device=device, dtype=dtype)
    vbias, hbias, weight_matrix = _init_parameters(
        num_hiddens=num_hiddens,
        data=data,
        device=device,
        dtype=dtype,
        var_init=var_init,
    )
    return IGRBM(
        weight_matrix=weight_matrix,
        vbias=vbias,
        hbias=hbias,
        device=device,
        dtype=dtype,
    )
Loading