saving configs and making models easier to load
Files changed:
- flowutils.py (+63 -44)
- msma.py (+32 -15)
flowutils.py
CHANGED
@@ -8,6 +8,66 @@ from einops import rearrange, repeat
 from normflows.distributions import BaseDistribution
 
 
+def sanitize_locals(args_dict, ignore_keys=None):
+
+    if ignore_keys is None:
+        ignore_keys = []
+
+    if not isinstance(ignore_keys, list):
+        ignore_keys = [ignore_keys]
+
+    _dict = args_dict.copy()
+    _dict.pop("self")
+    class_name = _dict.pop("__class__").__name__
+    class_params = {k: v for k, v in _dict.items() if k not in ignore_keys}
+
+    return {class_name: class_params}
+
+
+def build_flows(
+    latent_size, num_flows=4, num_blocks_per_flow=2, hidden_units=128, context_size=64
+):
+    # Define flows
+
+    flows = []
+
+    flows.append(
+        nf.flows.MaskedAffineAutoregressive(
+            latent_size,
+            hidden_features=hidden_units,
+            num_blocks=num_blocks_per_flow,
+            context_features=context_size,
+        )
+    )
+
+    for i in range(num_flows):
+        flows += [
+            nf.flows.CoupledRationalQuadraticSpline(
+                latent_size,
+                num_blocks=num_blocks_per_flow,
+                num_hidden_channels=hidden_units,
+                num_context_channels=context_size,
+            )
+        ]
+        flows += [nf.flows.LULinearPermute(latent_size)]
+
+    # Set base distribution
+
+    context_encoder = nn.Sequential(
+        nn.Linear(context_size, context_size),
+        nn.SiLU(),
+        # output mean and scales for K=latent_size dimensions
+        nn.Linear(context_size, latent_size * 2),
+    )
+
+    q0 = ConditionalDiagGaussian(latent_size, context_encoder)
+
+    # Construct flow model
+    model = nf.ConditionalNormalizingFlow(q0, flows)
+
+    return model
+
+
 class ConditionalDiagGaussian(BaseDistribution):
     """
     Conditional multivariate Gaussian distribution with diagonal
@@ -61,50 +121,6 @@ class ConditionalDiagGaussian(BaseDistribution):
         return log_p
 
 
-def build_flows(
-    latent_size, num_flows=4, num_blocks_per_flow=2, hidden_units=128, context_size=64
-):
-    # Define flows
-
-    flows = []
-
-    flows.append(
-        nf.flows.MaskedAffineAutoregressive(
-            latent_size,
-            hidden_features=hidden_units,
-            num_blocks=num_blocks_per_flow,
-            context_features=context_size,
-        )
-    )
-
-    for i in range(num_flows):
-        flows += [
-            nf.flows.CoupledRationalQuadraticSpline(
-                latent_size,
-                num_blocks=num_blocks_per_flow,
-                num_hidden_channels=hidden_units,
-                num_context_channels=context_size,
-            )
-        ]
-        flows += [nf.flows.LULinearPermute(latent_size)]
-
-    # Set base distribution
-
-    context_encoder = nn.Sequential(
-        nn.Linear(context_size, context_size),
-        nn.SiLU(),
-        # output mean and scales for K=latent_size dimensions
-        nn.Linear(context_size, latent_size * 2),
-    )
-
-    q0 = ConditionalDiagGaussian(latent_size, context_encoder)
-
-    # Construct flow model
-    model = nf.ConditionalNormalizingFlow(q0, flows)
-
-    return model
-
-
 def get_emb(sin_inp):
     """
     Gets a base embedding for one dimension with sin and cos intertwined
@@ -204,6 +220,9 @@ class PatchFlow(torch.nn.Module):
         hidden_units=128,
     ):
         super().__init__()
+
+        self.config = sanitize_locals(locals(), ignore_keys=input_size)
+
        num_sigmas, c, h, w = input_size
        self.local_pooler = SpatialNormer(
            in_channels=num_sigmas, kernel_size=patch_size
msma.py
CHANGED
@@ -19,7 +19,7 @@ from tqdm import tqdm
 
 import dnnlib
 from dataset import ImageFolderDataset
-from flowutils import PatchFlow
+from flowutils import PatchFlow, sanitize_locals
 
 DEVICE: Literal["cuda", "cpu"] = 'cpu'
 model_root = "https://nvlabs-fi-cdn.nvidia.com/edm2/posthoc-reconstructions"
@@ -53,9 +53,12 @@ class EDMScorer(torch.nn.Module):
         sigma_max=80,  # Maximum supported noise level.
         sigma_data=0.5,  # Expected standard deviation of the training data.
         rho=7,  # Time step discretization.
-        device=torch.device("cpu"),  # Device to use.
     ):
         super().__init__()
+
+        self.config = sanitize_locals(locals(), ignore_keys='net')
+        self.config['EDMNet'] = dict(net.init_kwargs)
+
         self.use_fp16 = use_fp16
         self.sigma_min = sigma_min
         self.sigma_max = sigma_max
@@ -67,14 +70,13 @@ class EDMScorer(torch.nn.Module):
         self.sigma_min = 1e-1
         self.sigma_max = sigma_max * stop_ratio
 
-        step_indices = torch.arange(num_steps, dtype=torch.float64, device=device)
+        step_indices = torch.arange(num_steps, dtype=torch.float64)
         t_steps = (
             self.sigma_max ** (1 / rho)
             + step_indices
             / (num_steps - 1)
             * (self.sigma_min ** (1 / rho) - self.sigma_max ** (1 / rho))
         ) ** rho
-        # print("Using steps:", t_steps)
 
         self.register_buffer("sigma_steps", t_steps.to(torch.float64))
 
@@ -100,28 +102,32 @@ class EDMScorer(torch.nn.Module):
 class ScoreFlow(torch.nn.Module):
     def __init__(
         self,
-        preset,
+        scorenet,
         device="cpu",
         **flow_kwargs
     ):
         super().__init__()
 
-        scorenet = build_model(preset)
         h = w = scorenet.net.img_resolution
         c = scorenet.net.img_channels
         num_sigmas = len(scorenet.sigma_steps)
         self.flow = PatchFlow((num_sigmas, c, h, w), **flow_kwargs)
+
 
         self.flow = self.flow.to(device)
         self.scorenet = scorenet.to(device).requires_grad_(False)
         self.flow.init_weights()
 
+        self.config = dict()
+        self.config.update(**self.scorenet.config)
+        self.config.update(self.flow.config)
+
     def forward(self, x, **score_kwargs):
         x_scores = self.scorenet(x, **score_kwargs)
         return self.flow(x_scores)
 
 
-def build_model(preset="edm2-img64-s-fid", device="cpu"):
+def build_model_from_pickle(preset="edm2-img64-s-fid", device="cpu"):
     netpath = config_presets[preset]
     with dnnlib.util.open_url(netpath, verbose=1) as f:
         data = pickle.load(f)
@@ -198,7 +204,7 @@ def test_runner(device="cpu"):
     image = np.array(image)
     image = image.reshape(*image.shape[:2], -1).transpose(2, 0, 1)
     x = torch.from_numpy(image).unsqueeze(0).to(device)
-    model = build_model(device=device)
+    model = build_model_from_pickle(device=device)
     scores = model(x)
 
     return scores
@@ -211,8 +217,8 @@ def test_flow_runner(preset, device="cpu", load_weights=None):
     image = np.array(image)
     image = image.reshape(*image.shape[:2], -1).transpose(2, 0, 1)
     x = torch.from_numpy(image).unsqueeze(0).to(device)
-
-    score_flow = ScoreFlow(preset, device=device)
+    scorenet = build_model_from_pickle(preset)
+    score_flow = ScoreFlow(scorenet, device=device)
 
     if load_weights is not None:
         score_flow.flow.load_state_dict(torch.load(load_weights))
@@ -272,7 +278,7 @@ def cache_score_norms(preset, dataset_path, outdir):
         dsobj, batch_size=64, num_workers=4, prefetch_factor=2
     )
 
-    model = build_model(preset=preset, device=device)
+    model = build_model_from_pickle(preset=preset, device=device)
     score_norms = []
 
     for x, _ in tqdm(dsloader):
@@ -312,6 +318,14 @@ def cache_score_norms(preset, dataset_path, outdir):
     default="edm2-img64-s-fid",
     show_default=True,
 )
+@click.option(
+    "--epochs",
+    help="Number of epochs",
+    metavar="INT",
+    type=int,
+    default=10,
+    show_default=True,
+)
 @click.option(
     "--num_flows",
     help="Number of normalizing flow functions in the PatchFlow model",
@@ -320,7 +334,7 @@ def cache_score_norms(preset, dataset_path, outdir):
     default=4,
     show_default=True,
 )
-def train_flow(dataset_path, preset, outdir, epochs=10, **flow_kwargs):
+def train_flow(dataset_path, preset, outdir, epochs, **flow_kwargs):
     print("using device:", DEVICE)
     device = DEVICE
     dsobj = ImageFolderDataset(path=dataset_path, resolution=64)
@@ -345,7 +359,8 @@ def train_flow(dataset_path, preset, outdir, epochs=10, **flow_kwargs):
         val_ds, batch_size=128, num_workers=4, prefetch_factor=2
     )
 
-    model = ScoreFlow(preset, device=device, **flow_kwargs)
+    scorenet = build_model_from_pickle(preset)
+    model = ScoreFlow(scorenet, device=device, **flow_kwargs)
     opt = torch.optim.AdamW(model.flow.parameters(), lr=3e-4, weight_decay=1e-5)
     train_step = partial(
         PatchFlow.stochastic_step,
@@ -373,6 +388,7 @@ def train_flow(dataset_path, preset, outdir, epochs=10, **flow_kwargs):
     step = 0
 
     for e in pbar:
+
         for x, _ in trainiter:
             x = x.to(device)
             scores = model.scorenet(x)
@@ -411,13 +427,14 @@ def train_flow(dataset_path, preset, outdir, epochs=10, **flow_kwargs):
     # Squeeze the juice
     best_ckpt = torch.load(f"{experiment_dir}/flow.pt")
    model.flow.load_state_dict(best_ckpt)
-    for x, _ in testiter:
+    pbar = tqdm(testiter, desc="(Tuning) Step:? - Loss: ?")
+    for x, _ in pbar:
         x = x.to(device)
         scores = model.scorenet(x)
         train_loss = train_step(scores, x)
         writer.add_scalar("loss/train", train_loss, step)
         pbar.set_description(
-            f"(Tuning) Step: {step:d} -
+            f"(Tuning) Step: {step:d} - Loss: {train_loss:.3f}"
         )
         step += 1
 
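With these changes, a ScoreFlow instance carries a single config dict, keyed by class name, that merges the EDMScorer arguments, the underlying EDMNet init_kwargs, and the PatchFlow arguments. A hedged sketch of how that could be used when checkpointing; the config.json filename and the JSON round-trip are assumptions for illustration, not part of this commit:

import json

import torch

from msma import ScoreFlow, build_model_from_pickle

scorenet = build_model_from_pickle("edm2-img64-s-fid", device="cpu")
model = ScoreFlow(scorenet, device="cpu")

# model.config looks roughly like {'EDMScorer': {...}, 'EDMNet': {...}, 'PatchFlow': {...}}
torch.save(model.flow.state_dict(), "flow.pt")
with open("config.json", "w") as f:
    # default=str guards against values that are not JSON-serializable
    json.dump(model.config, f, indent=2, default=str)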