Spaces:

ahsanMah
/

localizing-anomalies

Running

App Files Community

ahsanMah committed on Jun 25, 2024

Commit

a186356

1 Parent(s): 1b96548

using groups for command line options

Browse files

Files changed (1) hide show

msma.py +142 -112

msma.py CHANGED Viewed

@@ -3,6 +3,7 @@ import os
 import pickle
 from functools import partial
 from pickle import dump, load
 import click
 import numpy as np
@@ -20,6 +21,7 @@ import dnnlib
 from dataset import ImageFolderDataset
 from flowutils import PatchFlow
 model_root = "https://nvlabs-fi-cdn.nvidia.com/edm2/posthoc-reconstructions"
 config_presets = {
@@ -100,6 +102,7 @@ class ScoreFlow(torch.nn.Module):
         self,
         preset,
         device="cpu",
     ):
         super().__init__()
@@ -107,7 +110,7 @@ class ScoreFlow(torch.nn.Module):
         h = w = scorenet.net.img_resolution
         c = scorenet.net.img_channels
         num_sigmas = len(scorenet.sigma_steps)
-        self.flow = PatchFlow((num_sigmas, c, h, w))
         self.flow = self.flow.to(device)
         self.scorenet = scorenet.to(device).requires_grad_(False)
@@ -187,7 +190,78 @@ def compute_gmm_likelihood(x_score, gmmdir):
     return nll, percentile
-def cache_score_norms(preset, dataset_path, outdir, device="cpu"):
     dsobj = ImageFolderDataset(path=dataset_path, resolution=64)
     refimg, reflabel = dsobj[0]
     print(f"Loading dataset from {dataset_path}")
@@ -215,7 +289,40 @@ def cache_score_norms(preset, dataset_path, outdir, device="cpu"):
     print(f"Computed score norms for {score_norms.shape[0]} samples")
-def train_flow(dataset_path, preset, outdir, epochs=10, device="cuda"):
     dsobj = ImageFolderDataset(path=dataset_path, resolution=64)
     refimg, reflabel = dsobj[0]
     print(f"Loaded {len(dsobj)} samples from {dataset_path}")
@@ -238,7 +345,7 @@ def train_flow(dataset_path, preset, outdir, epochs=10, device="cuda"):
         val_ds, batch_size=128, num_workers=4, prefetch_factor=2
     )
-    model = ScoreFlow(preset, device=device)
     opt = torch.optim.AdamW(model.flow.parameters(), lr=3e-4, weight_decay=1e-5)
     train_step = partial(
         PatchFlow.stochastic_step,
@@ -274,6 +381,10 @@ def train_flow(dataset_path, preset, outdir, epochs=10, device="cuda"):
                 with torch.inference_mode():
                     val_loss = eval_step(scores, x)
             train_loss = train_step(scores, x)
             if (step + 1) % 10 == 0:
@@ -297,117 +408,36 @@ def train_flow(dataset_path, preset, outdir, epochs=10, device="cuda"):
             )
             step += 1
-    # torch.save(model.flow.state_dict(), f"{experiment_dir}/flow.pt")
-    writer.close()
-@torch.inference_mode
-def test_runner(device="cpu"):
-    # f = "doge.jpg"
-    f = "goldfish.JPEG"
-    image = (PIL.Image.open(f)).resize((64, 64), PIL.Image.Resampling.LANCZOS)
-    image = np.array(image)
-    image = image.reshape(*image.shape[:2], -1).transpose(2, 0, 1)
-    x = torch.from_numpy(image).unsqueeze(0).to(device)
-    model = build_model(device=device)
-    scores = model(x)
-    return scores
-def test_flow_runner(preset, device="cpu", load_weights=None):
-    # f = "doge.jpg"
-    f = "goldfish.JPEG"
-    image = (PIL.Image.open(f)).resize((64, 64), PIL.Image.Resampling.LANCZOS)
-    image = np.array(image)
-    image = image.reshape(*image.shape[:2], -1).transpose(2, 0, 1)
-    x = torch.from_numpy(image).unsqueeze(0).to(device)
-    score_flow = ScoreFlow(preset, device=device)
-    if load_weights is not None:
-        score_flow.flow.load_state_dict(torch.load(load_weights))
-    heatmap = score_flow(x)
-    print(heatmap.shape)
-    heatmap = score_flow(x).detach().cpu().numpy()
-    heatmap = (heatmap - heatmap.min()) / (heatmap.max() - heatmap.min()) * 255
-    im = PIL.Image.fromarray(heatmap[0, 0])
-    im.convert("RGB").save(
-        "heatmap.png",
-    )
-    return
-@click.command()
-# Main options.
-@click.option(
-    "--run",
-    help="Which function to run",
-    type=click.Choice(
-        ["cache-scores", "train-flow", "train-gmm"], case_sensitive=False
-    ),
-)
-@click.option(
-    "--outdir",
-    help="Where to load/save the results",
-    metavar="DIR",
-    type=str,
-    required=True,
-)
-@click.option(
-    "--preset",
-    help="Configuration preset",
-    metavar="STR",
-    type=str,
-    default="edm2-img64-s-fid",
-    show_default=True,
-)
-@click.option(
-    "--data", help="Path to the dataset", metavar="ZIP|DIR", type=str, default=None
-)
-def cmdline(run, outdir, **opts):
-    device = "cuda" if torch.cuda.is_available() else "cpu"
-    preset = opts["preset"]
-    dataset_path = opts["data"]
-    if run in ["cache-scores", "train-flow"]:
-        assert opts["data"] is not None, "Provide path to dataset"
-    if run == "cache-scores":
-        cache_score_norms(
-            preset=preset, dataset_path=dataset_path, outdir=outdir, device=device
-        )
-    if run == "train-gmm":
-        train_gmm(
-            score_path=f"{outdir}/{preset}/imagenette_score_norms.pt",
-            outdir=f"{outdir}/{preset}",
-            grid_search=True,
-        )
-    if run == "train-flow":
-        train_flow(dataset_path, outdir=outdir, preset=preset, device=device)
-        test_flow_runner(preset, device=device, load_weights=f"{outdir}/{preset}/flow.pt")
-    # train_flow(imagenette_path, preset, device)
-    # cache_score_norms(
-    #     preset=preset,
-    #     dataset_path="/GROND_STOR/amahmood/datasets/img64/",
-    #     device="cuda",
-    # )
-    # train_gmm(
-    #     f"out/msma/{preset}_imagenette_score_norms.pt", outdir=f"out/msma/{preset}"
-    # )
-    # s = test_runner(device=device)
-    # s = s.square().sum(dim=(2, 3, 4)) ** 0.5
-    # s = s.to("cpu").numpy()
-    # nll, pct = compute_gmm_likelihood(s, gmmdir=f"out/msma/{preset}/")
-    # print(f"Anomaly score for image: {nll[0]:.3f} @ {pct*100:.2f} percentile")
 if __name__ == "__main__":

 import pickle
 from functools import partial
 from pickle import dump, load
+from typing import Literal
 import click
 import numpy as np
 from dataset import ImageFolderDataset
 from flowutils import PatchFlow
+DEVICE: Literal["cuda", "cpu"] = 'cpu'
 model_root = "https://nvlabs-fi-cdn.nvidia.com/edm2/posthoc-reconstructions"
 config_presets = {
         self,
         preset,
         device="cpu",
+        **flow_kwargs
     ):
         super().__init__()
         h = w = scorenet.net.img_resolution
         c = scorenet.net.img_channels
         num_sigmas = len(scorenet.sigma_steps)
+        self.flow = PatchFlow((num_sigmas, c, h, w), **flow_kwargs)
         self.flow = self.flow.to(device)
         self.scorenet = scorenet.to(device).requires_grad_(False)
     return nll, percentile
+@torch.inference_mode
+def test_runner(device="cpu"):
+    # f = "doge.jpg"
+    f = "goldfish.JPEG"
+    image = (PIL.Image.open(f)).resize((64, 64), PIL.Image.Resampling.LANCZOS)
+    image = np.array(image)
+    image = image.reshape(*image.shape[:2], -1).transpose(2, 0, 1)
+    x = torch.from_numpy(image).unsqueeze(0).to(device)
+    model = build_model(device=device)
+    scores = model(x)
+    return scores
+def test_flow_runner(preset, device="cpu", load_weights=None):
+    # f = "doge.jpg"
+    f = "goldfish.JPEG"
+    image = (PIL.Image.open(f)).resize((64, 64), PIL.Image.Resampling.LANCZOS)
+    image = np.array(image)
+    image = image.reshape(*image.shape[:2], -1).transpose(2, 0, 1)
+    x = torch.from_numpy(image).unsqueeze(0).to(device)
+    score_flow = ScoreFlow(preset, device=device)
+    if load_weights is not None:
+        score_flow.flow.load_state_dict(torch.load(load_weights))
+    heatmap = score_flow(x)
+    print(heatmap.shape)
+    heatmap = score_flow(x).detach().cpu().numpy()
+    heatmap = (heatmap - heatmap.min()) / (heatmap.max() - heatmap.min()) * 255
+    im = PIL.Image.fromarray(heatmap[0, 0])
+    im.convert("RGB").save(
+        "heatmap.png",
+    )
+    return
+@click.group()
+def cmdline():
+    global DEVICE
+    DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
+@cmdline.command(name="cache-scores")
+@click.option(
+    "--preset",
+    help="Configuration preset",
+    metavar="STR",
+    type=str,
+    default="edm2-img64-s-fid",
+    show_default=True,
+)
+@click.option(
+    "--dataset_path",
+    help="Path to the dataset",
+    metavar="ZIP|DIR",
+    type=str,
+    default=None,
+)
+@click.option(
+    "--outdir",
+    help="Where to load/save the results",
+    metavar="DIR",
+    type=str,
+    required=True,
+)
+def cache_score_norms(preset, dataset_path, outdir):
+    device = DEVICE
     dsobj = ImageFolderDataset(path=dataset_path, resolution=64)
     refimg, reflabel = dsobj[0]
     print(f"Loading dataset from {dataset_path}")
     print(f"Computed score norms for {score_norms.shape[0]} samples")
+@cmdline.command(name="train-flow")
+@click.option(
+    "--dataset_path",
+    help="Path to the dataset",
+    metavar="ZIP|DIR",
+    type=str,
+    default=None,
+)
+@click.option(
+    "--outdir",
+    help="Where to load/save the results",
+    metavar="DIR",
+    type=str,
+    required=True,
+)
+@click.option(
+    "--preset",
+    help="Configuration preset",
+    metavar="STR",
+    type=str,
+    default="edm2-img64-s-fid",
+    show_default=True,
+)
+@click.option(
+    "--num_flows",
+    help="Number of normalizing flow functions in the PatchFlow model",
+    metavar="INT",
+    type=int,
+    default=4,
+    show_default=True,
+)
+def train_flow(dataset_path, preset, outdir, epochs=10, **flow_kwargs):
+    print("using device:", DEVICE)
+    device = DEVICE
     dsobj = ImageFolderDataset(path=dataset_path, resolution=64)
     refimg, reflabel = dsobj[0]
     print(f"Loaded {len(dsobj)} samples from {dataset_path}")
         val_ds, batch_size=128, num_workers=4, prefetch_factor=2
     )
+    model = ScoreFlow(preset, device=device, **flow_kwargs)
     opt = torch.optim.AdamW(model.flow.parameters(), lr=3e-4, weight_decay=1e-5)
     train_step = partial(
         PatchFlow.stochastic_step,
                 with torch.inference_mode():
                     val_loss = eval_step(scores, x)
+                # Record the graph of model.flow.flows with writer.add_graph, using zero-filled dummy inputs
+                writer.add_graph(model.flow.flows, (torch.zeros(1, scores.shape[1], device=device),
+                                                    torch.zeros(1, model.flow.position_encoding.cached_penc.shape[-1], device=device)))
             train_loss = train_step(scores, x)
             if (step + 1) % 10 == 0:
             )
             step += 1
+    # Final tuning pass: reload the saved flow.pt checkpoint and run train_step on every batch from testiter
+    best_ckpt = torch.load(f"{experiment_dir}/flow.pt")
+    model.flow.load_state_dict(best_ckpt)
+    for i, (x, _) in enumerate(testiter):
+        x = x.to(device)
+        scores = model.scorenet(x)
+        train_loss = train_step(scores, x)
+        writer.add_scalar("loss/train", train_loss, step)
+        pbar.set_description(
+            f"(Tuning) Step: {step:d} - Train: {train_loss:.3f} - Val: {val_loss:.3f}"
+        )
+        step += 1
+    torch.save(model.flow.state_dict(), f"{experiment_dir}/flow.pt")
+    writer.close()
+# cache_score_norms(
+#     preset=preset,
+#     dataset_path="/GROND_STOR/amahmood/datasets/img64/",
+#     device="cuda",
+# )
+# train_gmm(
+#     f"out/msma/{preset}_imagenette_score_norms.pt", outdir=f"out/msma/{preset}"
+# )
+# s = test_runner(device=device)
+# s = s.square().sum(dim=(2, 3, 4)) ** 0.5
+# s = s.to("cpu").numpy()
+# nll, pct = compute_gmm_likelihood(s, gmmdir=f"out/msma/{preset}/")
+# print(f"Anomaly score for image: {nll[0]:.3f} @ {pct*100:.2f} percentile")
 if __name__ == "__main__":