-
-
Notifications
You must be signed in to change notification settings - Fork 48.9k
Add deep belief network #13646
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
base: master
Are you sure you want to change the base?
Add deep belief network #13646
Changes from 5 commits
d212889
d88d269
deb7c5a
a45f9cb
9a58bc5
00acb2a
352097a
a16b803
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,393 @@ | ||
""" | ||
- - - - - -- - - - - - - - - - - - - - - - - - - - - - - | ||
Name - - Deep Belief Network (DBN) Using Restricted Boltzmann Machines (RBMs) | ||
Goal - - Unsupervised layer-wise feature learning and pretraining | ||
for deep neural networks | ||
Detail: Multi-layer DBN constructed by stacking RBMs trained via contrastive divergence. | ||
Implements Gibbs sampling for binary units, manual weight updates with NumPy. | ||
Developed for Intrusion Detection System (IDS) in WiFi networks. | ||
This implementation is written entirely in pure NumPy, | ||
with no deep learning frameworks. | ||
Can be extended for fine-tuning deep neural networks. | ||
|
||
Author: Adhithya Laxman Ravi Shankar Geetha | ||
GitHub: https://github.com/Adhithya-Laxman/ | ||
Date: 2025.10.21 | ||
- - - - - -- - - - - - - - - - - - - - - - - - - - - - - | ||
""" | ||
|
||
import matplotlib.pyplot as plt | ||
import numpy as np | ||
|
||
|
||
class RBM: | ||
def __init__( | ||
self, | ||
n_visible: int, | ||
n_hidden: int, | ||
learning_rate: float = 0.01, | ||
k: int = 1, | ||
epochs: int = 10, | ||
batch_size: int = 64, | ||
mode: str = "bernoulli", | ||
) -> None: | ||
""" | ||
Initialize an RBM (Restricted Boltzmann Machine). | ||
|
||
Args: | ||
n_visible (int): Number of visible units. | ||
n_hidden (int): Number of hidden units. | ||
learning_rate (float): Learning rate for weight updates. | ||
k (int): Number of Gibbs sampling steps. | ||
epochs (int): Number of training epochs. | ||
batch_size (int): Batch size. | ||
mode (str): Sampling mode ('bernoulli' or 'gaussian'). | ||
""" | ||
self.n_visible = n_visible | ||
self.n_hidden = n_hidden | ||
self.learning_rate = learning_rate | ||
self.k = k | ||
self.epochs = epochs | ||
self.batch_size = batch_size | ||
self.mode = mode | ||
|
||
self.rng = np.random.default_rng() | ||
|
||
# Initialize weights and biases | ||
self.weights = self.rng.normal(0, 0.01, (n_visible, n_hidden)) | ||
self.hidden_bias = np.zeros(n_hidden) | ||
self.visible_bias = np.zeros(n_visible) | ||
|
||
def sigmoid(self, x: np.ndarray) -> np.ndarray: | ||
|
||
""" | ||
Compute the sigmoid activation function element-wise. | ||
|
||
Args: | ||
x (np.ndarray): Input array. | ||
|
||
Returns: | ||
np.ndarray: Sigmoid output of input. | ||
|
||
>>> rbm = RBM(3, 2) | ||
>>> import numpy as np | ||
>>> np.allclose( | ||
... dbn.sigmoid(np.array([0, 1])), | ||
... np.array([0.5, 1/(1+np.exp(-1))]) | ||
... ) | ||
True | ||
|
||
""" | ||
return 1.0 / (1.0 + np.exp(-x)) | ||
|
||
def sample_prob(self, probs: np.ndarray) -> np.ndarray: | ||
""" | ||
Sample binary states from given probabilities. | ||
|
||
Args: | ||
probs (np.ndarray): Probabilities of activation. | ||
|
||
Returns: | ||
np.ndarray: Binary sampled values. | ||
|
||
>>> rbm = RBM(3, 2) | ||
>>> probs = np.array([0., 1.]) | ||
>>> result = rbm.sample_prob(probs) | ||
>>> set(result).issubset({0., 1.}) | ||
True | ||
""" | ||
return (self.rng.random(probs.shape) < probs).astype(float) | ||
|
||
def sample_hidden_given_visible( | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. As there is no test file in this pull request nor any test function or class in the file There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. As there is no test file in this pull request nor any test function or class in the file |
||
self, v: np.ndarray | ||
|
||
) -> tuple[np.ndarray, np.ndarray]: | ||
""" | ||
Sample hidden units conditioned on visible units. | ||
|
||
Args: | ||
v (np.ndarray): Visible unit batch. | ||
|
||
Returns: | ||
tuple: (hidden probabilities, hidden samples) | ||
""" | ||
hid_probs = self.sigmoid(np.dot(v, self.weights) + self.hidden_bias) | ||
hid_samples = self.sample_prob(hid_probs) | ||
return hid_probs, hid_samples | ||
|
||
def sample_visible_given_hidden( | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. As there is no test file in this pull request nor any test function or class in the file There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. As there is no test file in this pull request nor any test function or class in the file |
||
self, h: np.ndarray | ||
|
||
) -> tuple[np.ndarray, np.ndarray]: | ||
""" | ||
Sample visible units conditioned on hidden units. | ||
|
||
Args: | ||
h (np.ndarray): Hidden unit batch. | ||
|
||
Returns: | ||
tuple: (visible probabilities, visible samples) | ||
""" | ||
vis_probs = self.sigmoid(np.dot(h, self.weights.T) + self.visible_bias) | ||
vis_samples = self.sample_prob(vis_probs) | ||
return vis_probs, vis_samples | ||
|
||
def contrastive_divergence(self, v0: np.ndarray) -> float: | ||
|
||
""" | ||
Perform Contrastive Divergence (CD-k) for a single batch. | ||
|
||
Args: | ||
v0 (np.ndarray): Initial visible units (data batch). | ||
|
||
Returns: | ||
float: Reconstruction loss (mean squared error) for batch. | ||
""" | ||
h_probs0, h0 = self.sample_hidden_given_visible(v0) | ||
vk, hk = v0, h0 | ||
|
||
for _ in range(self.k): | ||
_v_probs, vk = self.sample_visible_given_hidden(hk) | ||
h_probs, hk = self.sample_hidden_given_visible(vk) | ||
|
||
positive_grad = np.dot(v0.T, h_probs0) | ||
negative_grad = np.dot(vk.T, h_probs) | ||
|
||
self.weights += ( | ||
self.learning_rate * (positive_grad - negative_grad) / v0.shape[0] | ||
) | ||
self.visible_bias += self.learning_rate * np.mean(v0 - vk, axis=0) | ||
self.hidden_bias += self.learning_rate * np.mean(h_probs0 - h_probs, axis=0) | ||
|
||
loss = np.mean((v0 - vk) ** 2) | ||
return loss | ||
|
||
def train(self, data: np.ndarray) -> None: | ||
""" | ||
Train the RBM on the entire dataset. | ||
|
||
Args: | ||
data (np.ndarray): Training dataset matrix. | ||
|
||
>>> rbm = RBM(6, 3, epochs=1, batch_size=2) | ||
>>> data = np.random.randint(0, 2, (4, 6)).astype(float) | ||
>>> rbm.train(data) # runs without error | ||
""" | ||
n_samples = data.shape[0] | ||
for epoch in range(self.epochs): | ||
self.rng.shuffle(data) | ||
losses = [] | ||
|
||
for i in range(0, n_samples, self.batch_size): | ||
batch = data[i : i + self.batch_size] | ||
loss = self.contrastive_divergence(batch) | ||
losses.append(loss) | ||
|
||
print(f"Epoch [{epoch + 1}/{self.epochs}] avg loss: {np.mean(losses):.6f}") | ||
|
||
|
||
class DeepBeliefNetwork: | ||
def __init__( | ||
self, | ||
input_size: int, | ||
layers: list[int], | ||
mode: str = "bernoulli", | ||
k: int = 5, | ||
|
||
save_path: str | None = None, | ||
) -> None: | ||
""" | ||
Initialize a Deep Belief Network (DBN) with multiple RBM layers. | ||
|
||
Args: | ||
input_size (int): Number of features in input layer. | ||
layers (list): list of hidden layer unit counts. | ||
mode (str): Sampling mode ('bernoulli' or 'gaussian'). | ||
k (int): Number of sampling steps in generate_input_for_layer. | ||
save_path (str, optional): Path for saving trained model parameters. | ||
|
||
""" | ||
self.input_size = input_size | ||
self.layers = layers | ||
self.k = k | ||
self.mode = mode | ||
self.save_path = save_path | ||
self.layer_params = [{"W": None, "hb": None, "vb": None} for _ in layers] | ||
|
||
def sigmoid(self, x: np.ndarray) -> np.ndarray: | ||
|
||
""" | ||
Compute sigmoid activation function. | ||
|
||
Args: | ||
x (np.ndarray): Input array. | ||
|
||
Returns: | ||
np.ndarray: Sigmoid of input. | ||
|
||
>>> dbn = DeepBeliefNetwork(4, [3]) | ||
>>> import numpy as np | ||
>>> np.allclose( | ||
... dbn.sigmoid(np.array([0, 1])), | ||
... np.array([0.5, 1/(1+np.exp(-1))]) | ||
... ) | ||
True | ||
|
||
""" | ||
return 1.0 / (1.0 + np.exp(-x)) | ||
|
||
def sample_prob(self, probs: np.ndarray) -> np.ndarray: | ||
|
||
""" | ||
Sample binary states from probabilities. | ||
|
||
Args: | ||
probs (np.ndarray): Activation probabilities. | ||
|
||
Returns: | ||
np.ndarray: Binary sampled values. | ||
""" | ||
rng = np.random.default_rng() | ||
return (rng.random(probs.shape) < probs).astype(float) | ||
|
||
def sample_h( | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. As there is no test file in this pull request nor any test function or class in the file There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. As there is no test file in this pull request nor any test function or class in the file |
||
self, x: np.ndarray, w: np.ndarray, hb: np.ndarray | ||
|
||
) -> tuple[np.ndarray, np.ndarray]: | ||
""" | ||
Sample hidden units given visible units for a DBN layer. | ||
|
||
Args: | ||
x (np.ndarray): Visible units. | ||
w (np.ndarray): Weight matrix. | ||
hb (np.ndarray): Hidden bias vector. | ||
|
||
Returns: | ||
tuple: Hidden probabilities and binary samples. | ||
""" | ||
probs = self.sigmoid(np.dot(x, w) + hb) | ||
samples = self.sample_prob(probs) | ||
return probs, samples | ||
|
||
def sample_v( | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. As there is no test file in this pull request nor any test function or class in the file There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. As there is no test file in this pull request nor any test function or class in the file |
||
self, y: np.ndarray, w: np.ndarray, vb: np.ndarray | ||
|
||
) -> tuple[np.ndarray, np.ndarray]: | ||
""" | ||
Sample visible units given hidden units for a DBN layer. | ||
|
||
Args: | ||
y (np.ndarray): Hidden units. | ||
w (np.ndarray): Weight matrix. | ||
vb (np.ndarray): Visible bias vector. | ||
|
||
Returns: | ||
tuple: Visible probabilities and binary samples. | ||
""" | ||
probs = self.sigmoid(np.dot(y, w.T) + vb) | ||
samples = self.sample_prob(probs) | ||
return probs, samples | ||
|
||
def generate_input_for_layer(self, layer_index: int, x: np.ndarray) -> np.ndarray: | ||
|
||
""" | ||
Generate input for a particular DBN layer by sampling and averaging. | ||
|
||
Args: | ||
layer_index (int): Layer index for which input is generated. | ||
x (np.ndarray): Original input data. | ||
|
||
Returns: | ||
np.ndarray: Smoothed input for the layer. | ||
""" | ||
if layer_index == 0: | ||
return x.copy() | ||
samples = [] | ||
for _ in range(self.k): | ||
x_dash = x.copy() | ||
for i in range(layer_index): | ||
_, x_dash = self.sample_h( | ||
x_dash, self.layer_params[i]["W"], self.layer_params[i]["hb"] | ||
) | ||
samples.append(x_dash) | ||
return np.mean(np.stack(samples, axis=0), axis=0) | ||
|
||
def train_dbn(self, x: np.ndarray) -> None: | ||
|
||
""" | ||
Layer-wise train the DBN using RBMs. | ||
|
||
Args: | ||
x (np.ndarray): Training dataset. | ||
""" | ||
for idx, layer_size in enumerate(self.layers): | ||
n_visible = self.input_size if idx == 0 else self.layers[idx - 1] | ||
n_hidden = layer_size | ||
|
||
rbm = RBM(n_visible, n_hidden, k=5, epochs=300) | ||
x_input = self.generate_input_for_layer(idx, x) | ||
rbm.train(x_input) | ||
self.layer_params[idx]["W"] = rbm.weights | ||
self.layer_params[idx]["hb"] = rbm.hidden_bias | ||
self.layer_params[idx]["vb"] = rbm.visible_bias | ||
print(f"Finished training layer {idx + 1}/{len(self.layers)}") | ||
|
||
def reconstruct(self, x: np.ndarray) -> tuple[np.ndarray, np.ndarray, float]: | ||
|
||
""" | ||
Reconstruct input through forward and backward Gibbs sampling. | ||
|
||
Args: | ||
x (np.ndarray): Input data to reconstruct. | ||
|
||
Returns: | ||
tuple: (encoded representation, reconstructed input, MSE error) | ||
""" | ||
h = x.copy() | ||
for i in range(len(self.layer_params)): | ||
_, h = self.sample_h( | ||
h, self.layer_params[i]["W"], self.layer_params[i]["hb"] | ||
) | ||
encoded = h.copy() | ||
|
||
for i in reversed(range(len(self.layer_params))): | ||
_, h = self.sample_v( | ||
h, self.layer_params[i]["W"], self.layer_params[i]["vb"] | ||
) | ||
reconstructed = h | ||
|
||
error = np.mean((x - reconstructed) ** 2) | ||
print(f"Reconstruction error: {error:.6f}") | ||
|
||
return encoded, reconstructed, error | ||
|
||
|
||
# Usage example
if __name__ == "__main__":
    # Synthetic binary dataset: 100 samples of 16 binary features each.
    rng = np.random.default_rng()  # for random number generation
    data = rng.integers(0, 2, size=(100, 16)).astype(float)

    # DBN with three stacked RBM layers: 16 -> 16 -> 8 -> 4 units.
    dbn = DeepBeliefNetwork(input_size=16, layers=[16, 8, 4])

    # Greedy layer-wise pretraining on the synthetic data.
    dbn.train_dbn(data)

    # Encode/decode the first 5 samples to inspect reconstruction quality.
    encoded, reconstructed, error = dbn.reconstruct(data[:5])
    print("Encoded shape:", encoded.shape)
    print("Reconstructed shape:", reconstructed.shape)

    # Plot originals (top row) vs. reconstructions (bottom row) as 1-row
    # grayscale strips, one column per sample.
    features_to_show = 16
    plt.figure(figsize=(12, 5))
    for i in range(5):
        plt.subplot(2, 5, i + 1)
        plt.title(f"Original {i + 1}")
        plt.imshow(
            data[i][:features_to_show].reshape(1, -1),
            cmap="gray",
            aspect="auto",
            interpolation="nearest",
        )
        plt.axis("off")

        plt.subplot(2, 5, i + 6)
        plt.title(f"Reconstructed {i + 1}")
        plt.imshow(
            reconstructed[i][:features_to_show].reshape(1, -1),
            cmap="gray",
            aspect="auto",
            interpolation="nearest",
        )
        plt.axis("off")
    plt.suptitle(
        f"DBN Reconstruction (First {features_to_show} Features, MSE: {error:.6f})"
    )
    plt.tight_layout()
    plt.savefig("reconstruction_subset.png")
    print("Subset reconstruction plot saved as 'reconstruction_subset.png'")
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Please provide descriptive name for the parameter:
k