
Commit 33dfc8e

update week 15
1 parent 29b5e44 commit 33dfc8e

File tree

8 files changed: +2092 −45 lines

doc/pub/week15/html/week15-bs.html: 392 additions & 1 deletion
doc/pub/week15/html/week15-reveal.html: 360 additions & 1 deletion
doc/pub/week15/html/week15-solarized.html: 382 additions & 1 deletion
doc/pub/week15/html/week15.html: 382 additions & 1 deletion
Binary file (0 bytes) not shown
doc/pub/week15/ipynb/week15.ipynb: 379 additions & 40 deletions
doc/pub/week15/pdf/week15.pdf: binary file (100 KB) not shown
doc/src/week15/week15.do.txt: 197 additions & 1 deletion
@@ -345,12 +345,208 @@ estimated using only one random variable per timestep. As it is
computed by summing up $T-1$ consistency terms, the final estimated
value may have high variance for large $T$ values.

!split
===== PyTorch implementation of a Denoising Diffusion Probabilistic Model (DDPM) trained on the MNIST dataset =====

The code covers:
o Model definition (a simple U-Net-style convolutional network)
o Forward diffusion (adding noise over $T$ timesteps)
o Reverse denoising process
o Training loop
o Sampling from the trained model

This example is adapted from several open-source tutorials and
implementations, demonstrating how to build a diffusion model from
scratch in under 200 lines of PyTorch. I have borrowed extensively from
o Jackson-Kang’s PyTorch diffusion tutorial, see URL:"https://github.com/Jackson-Kang/Pytorch-Diffusion-Model-Tutorial" and
o awjuliani’s PyTorch DDPM implementation, see URL:"https://github.com/awjuliani/pytorch-diffusion"

!split
===== How diffusion models work =====

Diffusion models gradually corrupt data by adding Gaussian noise over
a sequence of timesteps and then learn to reverse this noising process
with a neural network.

The corruption schedule is typically linear or cosine in variance; a
sketch of a cosine schedule is given at the end of this section.

During training, the network is optimized to predict the noise that
was added at each timestep, using a mean-squared error loss.

At inference, one starts from random noise and iteratively applies the
learned denoising steps to generate new samples.
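
The implementation below uses a linear schedule. As a minimal sketch
of the cosine alternative just mentioned (following the
parameterization of Nichol and Dhariwal, 2021; this function is my
addition and not part of the borrowed implementations), the betas can
be derived from a squared-cosine decay of the cumulative product
$\bar\alpha_t$:

!bc pycod
import math
import torch

def cosine_beta_schedule(T, s=0.008):
    """Cosine variance schedule: bar-alpha follows a squared cosine."""
    steps = torch.arange(T + 1, dtype=torch.float64)
    f = torch.cos(((steps / T) + s) / (1 + s) * math.pi / 2) ** 2
    alphas_cumprod = f / f[0]
    betas = 1 - alphas_cumprod[1:] / alphas_cumprod[:-1]
    # clip to avoid a degenerate step at the very end of the schedule
    return betas.clamp(max=0.999).float()
!ec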

!split
===== Imports and Utilities =====

!bc pycod
import torch
import torch.nn as nn
import torch.nn.functional as F
import torchvision   # needed for torchvision.utils.make_grid when sampling
from torchvision import datasets, transforms
from torch.utils.data import DataLoader
import matplotlib.pyplot as plt
import math
!ec

!split
===== Hyperparameters and schedules =====

!bc pycod
device = 'cuda' if torch.cuda.is_available() else 'cpu'

# Training settings
batch_size = 128
epochs = 5
lr = 2e-4
img_size = 28
channels = 1

# Diffusion hyperparameters
T = 300  # number of diffusion steps
beta_start, beta_end = 1e-4, 0.02
betas = torch.linspace(beta_start, beta_end, T, device=device)  # linear schedule
alphas = 1. - betas
alphas_cumprod = torch.cumprod(alphas, dim=0)
!ec
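
As a quick sanity check (my addition, not part of the original code),
one can verify that the fraction of the original signal variance
surviving at the final step is small, so that $x_T$ is dominated by
noise; for this linear schedule with $T=300$ it is roughly $0.05$:

!bc pycod
# cumulative signal coefficient at the last timestep
print(alphas_cumprod[-1].item())  # ~0.05
!ec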

!split
===== Data Loading =====

The normalization maps the MNIST pixel values to $[-1,1]$, which
matches the clamping applied to the generated samples below.

!bc pycod
transform = transforms.Compose([
    transforms.ToTensor(),
    transforms.Normalize((0.5,), (0.5,)),
])

train_ds = datasets.MNIST('.', train=True, download=True, transform=transform)
train_loader = DataLoader(train_ds, batch_size=batch_size, shuffle=True)
!ec

!split
===== Model definition =====

We present a lightweight U-Net inspired model for noise prediction.
Note that the time embedding must produce 128 channels to match the
output of the second encoder convolution before it is added to the
feature map:
!bc pycod
class SimpleUNet(nn.Module):
    def __init__(self, c):
        super().__init__()
        self.enc1 = nn.Conv2d(c, 64, 3, padding=1)
        self.enc2 = nn.Conv2d(64, 128, 3, padding=1)
        self.dec1 = nn.ConvTranspose2d(128, 64, 3, padding=1)
        self.dec2 = nn.ConvTranspose2d(64, c, 3, padding=1)
        self.act = nn.ReLU()
        # timestep embedding to condition on t
        self.time_mlp = nn.Sequential(
            nn.Linear(1, 64),
            nn.ReLU(),
            nn.Linear(64, 128),
        )

    def forward(self, x, t):
        # x: [B, C, H, W], t: [B] with normalized values in [0, 1]
        h = self.act(self.enc1(x))
        h = self.act(self.enc2(h))
        # add time embedding, broadcast over the spatial dimensions
        t = t.unsqueeze(-1)
        temb = self.time_mlp(t)
        temb = temb.view(-1, 128, 1, 1)
        h = h + temb
        h = self.act(self.dec1(h))
        return self.dec2(h)
!ec
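
A quick shape check (my addition) confirms that the network maps a
batch of images to a noise prediction of the same shape:

!bc pycod
net = SimpleUNet(1)
x = torch.randn(8, 1, 28, 28)  # a batch of 8 MNIST-sized images
t = torch.rand(8)              # normalized timesteps in [0, 1]
print(net(x, t).shape)         # torch.Size([8, 1, 28, 28])
!ec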

!split
===== Forward Diffusion $q(x_t\vert x_0)$ =====

The function below implements the closed-form reparameterization
$x_t = \sqrt{\bar\alpha_t}\,x_0 + \sqrt{1-\bar\alpha_t}\,\epsilon$
with $\epsilon\sim\mathcal{N}(0,I)$, so a noisy sample at any
timestep $t$ can be drawn in a single step:

!bc pycod
def q_sample(x0, t, noise=None):
    """Add noise to x0 at timestep t."""
    if noise is None:
        noise = torch.randn_like(x0)
    sqrt_acp = alphas_cumprod[t]**0.5
    sqrt_1macp = (1 - alphas_cumprod[t])**0.5
    return sqrt_acp.view(-1,1,1,1)*x0 + sqrt_1macp.view(-1,1,1,1)*noise
!ec
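
To see the forward process in action, one can noise a single training
image at a few increasing timesteps (a small illustration of my own,
using the data loader defined above):

!bc pycod
x0, _ = train_ds[0]
x0 = x0.unsqueeze(0).to(device)  # shape [1, 1, 28, 28]
fig, axes = plt.subplots(1, 4, figsize=(8, 2))
for ax, step in zip(axes, [0, 100, 200, 299]):
    t = torch.tensor([step], device=device)
    xt = q_sample(x0, t)
    ax.imshow(xt.squeeze().cpu(), cmap='gray')
    ax.set_title(f"t={step}")
    ax.axis('off')
plt.show()
!ec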

!split
===== Cost/Loss function =====

!bc pycod
def diffusion_loss(model, x0):
    """Compute MSE between predicted noise and true noise."""
    B = x0.size(0)
    # draw an independent random timestep for each image in the batch
    t = torch.randint(0, T, (B,), device=device).long()
    noise = torch.randn_like(x0)
    x_noisy = q_sample(x0, t, noise)
    # the network receives the timestep normalized to [0, 1]
    pred_noise = model(x_noisy, t.float()/T)
    return F.mse_loss(pred_noise, noise)
!ec

!split
===== Training loop =====

!bc pycod
model = SimpleUNet(channels).to(device)
opt = torch.optim.Adam(model.parameters(), lr=lr)

for epoch in range(epochs):
    total_loss = 0
    for x, _ in train_loader:
        x = x.to(device)
        loss = diffusion_loss(model, x)
        opt.zero_grad()
        loss.backward()
        opt.step()
        total_loss += loss.item()
    print(f"Epoch {epoch+1}/{epochs}, Loss: {total_loss/len(train_loader):.4f}")
!ec
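
To avoid retraining before every sampling run, the weights can be
saved and reloaded with the standard PyTorch pattern (my addition;
the file name is hypothetical):

!bc pycod
torch.save(model.state_dict(), "ddpm_mnist.pt")  # hypothetical path

# later, to reload before sampling:
model = SimpleUNet(channels).to(device)
model.load_state_dict(torch.load("ddpm_mnist.pt", map_location=device))
!ec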

!split
===== Sampling (Reverse Diffusion) =====

Each reverse step computes the DDPM posterior mean
$x_{t-1} = \frac{1}{\sqrt{\alpha_t}}\left(x_t - \frac{\beta_t}{\sqrt{1-\bar\alpha_t}}\,\epsilon_\theta(x_t,t)\right) + \sigma_t z$
with $\sigma_t = \sqrt{\beta_t}$ and $z\sim\mathcal{N}(0,I)$; no noise
is added at the final step:

!bc pycod
@torch.no_grad()
def p_sample_loop(model, shape):
    x = torch.randn(shape, device=device)
    for i in reversed(range(T)):
        t = torch.full((shape[0],), i, device=device).float()/T
        eps_pred = model(x, t)
        beta_t = betas[i]
        alpha_t = alphas[i]
        acp_t = alphas_cumprod[i]
        coef1 = 1 / alpha_t.sqrt()
        coef2 = beta_t / ( (1 - acp_t).sqrt() )
        x = coef1*(x - coef2*eps_pred)
        if i > 0:
            z = torch.randn_like(x)
            sigma = beta_t.sqrt()
            x = x + sigma*z
    return x

# Generate and display a 4x4 grid of samples
samples = p_sample_loop(model, (16, channels, img_size, img_size))
samples = samples.clamp(-1,1).cpu()
grid = torchvision.utils.make_grid(samples, nrow=4, normalize=True)
plt.figure(figsize=(5,5))
plt.imshow(grid.permute(1,2,0))
plt.axis('off')
plt.show()
!ec

!split
===== More details =====

For more details and implementations, see Calvin Luo at URL:"https://arxiv.org/abs/2208.11970"