maf_cifar10.py
import numpy as np
import torch
import torch.utils.data as data
import torchvision.utils as utils
import torchvision.datasets as datasets
import torchvision.transforms as transforms
import deeprob.flows.models as flows
from deeprob.torch.datasets import WrappedDataset
from deeprob.torch.transforms import TransformList, Flatten, RandomHorizontalFlip
from deeprob.torch.routines import train_model, test_model


if __name__ == '__main__':
    # Load the CIFAR10 dataset and split off a validation set
    in_shape = (3, 32, 32)
    in_features = np.prod(in_shape).item()
    data_train = datasets.CIFAR10('datasets', train=True, transform=transforms.ToTensor(), download=True)
    data_test = datasets.CIFAR10('datasets', train=False, transform=transforms.ToTensor(), download=True)
    n_val = int(0.1 * len(data_train))
    n_train = len(data_train) - n_val
    data_train, data_val = data.random_split(data_train, [n_train, n_val])

    # Set the preprocessing transformation, i.e. random horizontal flip + flatten
    transform = TransformList([
        RandomHorizontalFlip(),
        Flatten(in_shape)  # Specify the input shape to compute the inverse of the transformation
    ])

    # Wrap the CIFAR10 datasets for the unsupervised setting
    data_train = WrappedDataset(data_train, unsupervised=True, transform=transform)
    data_val = WrappedDataset(data_val, unsupervised=True, transform=Flatten())
    data_test = WrappedDataset(data_test, unsupervised=True, transform=Flatten())
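    # Note: unsupervised=True is expected to make the wrapped datasets yield inputs only
    # (without class labels), which matches the generative training routine used below.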
    # Instantiate a Masked Autoregressive Flow (MAF)
    maf = flows.MAF(
        in_features,
        dequantize=True,   # Apply dequantization
        logit=0.05,        # Apply the logit transformation with a factor of 0.05
        n_flows=3,         # The number of transformations
        depth=1,           # The depth of each transformation's conditioner network
        units=1024,        # The number of units in each conditioner hidden layer
        sequential=False   # Assign hidden units' identifiers randomly (instead of sequentially)
    )
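    # Note: dequantization adds uniform noise to the discrete pixel intensities, and the logit
    # transform maps values from the unit interval to the real line; both are standard
    # preprocessing steps when fitting normalizing flows to image data.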
    # Train the model in the generative setting, i.e. by maximizing the log-likelihood
    train_model(
        maf, data_train, data_val, setting='generative',
        lr=1e-4, batch_size=64, epochs=20, patience=5,
        checkpoint='checkpoint-maf-cifar10.pt',
        optimizer_kwargs={'weight_decay': 5e-5}  # Introduce a small weight decay
    )
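    # Note: patience=5 enables early stopping on the validation metric; the checkpoint path
    # above is expected to hold the best parameters found during training.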
    # Test the model in the generative setting; also, compute bits per dimension
    mu_ll, sigma_ll = test_model(maf, data_test, setting='generative', batch_size=64)
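    # Convert the mean test log-likelihood (in nats per image) to bits per dimension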
    bpd = (-mu_ll / np.log(2)) / in_features
    print('Mean LL: {:.4f} - Two Stddev LL: {:.4f} - Bits per Dimension: {:.2f}'.format(mu_ll, sigma_ll, bpd))
    # Sample some data points and plot them
    maf.eval()  # Make sure to switch to evaluation mode
    n_samples = 10
    samples = maf.sample(n_samples ** 2).cpu()
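    # Each sample is a flattened vector; invert the preprocessing to recover (3, 32, 32) images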
    images = torch.stack([transform.backward(x) for x in samples])
    samples_filename = 'maf-cifar10-samples.png'
    print("Plotting generated samples to {} ...".format(samples_filename))
    utils.save_image(images, samples_filename, nrow=n_samples, padding=0)
    # Save the model's parameters to file
    model_filename = 'maf-cifar10.pt'
    print("Saving model's parameters to {}".format(model_filename))
    torch.save(maf.state_dict(), model_filename)
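    # A minimal sketch of reloading the saved weights, assuming the MAF is re-instantiated
    # with the same hyperparameters used above (standard PyTorch state_dict workflow; this
    # reload step is illustrative and not part of the original example):
    maf_reloaded = flows.MAF(
        in_features, dequantize=True, logit=0.05,
        n_flows=3, depth=1, units=1024, sequential=False
    )
    maf_reloaded.load_state_dict(torch.load(model_filename, map_location='cpu'))
    maf_reloaded.eval()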